2 * Copyright (C) 2013-2019 Free Software Foundation, Inc.
4 * This file is part of GNU lightning.
6 * GNU lightning is free software; you can redistribute it and/or modify it
7 * under the terms of the GNU Lesser General Public License as published
8 * by the Free Software Foundation; either version 3, or (at your option)
11 * GNU lightning is distributed in the hope that it will be useful, but
12 * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
13 * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public
14 * License for more details.
17 * Paulo Cesar Pereira de Andrade
20 #include <lightning.h>
21 #include <lightning/jit_private.h>
/* True when argument slot index `i` is one of the first four slots (0..3),
 * i.e. the slots the push/get/put helpers in this file map onto registers.
 * NOTE(review): `i` is not parenthesized in the expansion, so only simple
 * expressions should be passed. */
23 #define jit_arg_reg_p(i) (i >= 0 && i < 4)
26 # include "jit_hppa-cpu.c"
27 # include "jit_hppa-fpu.c"
28 # include "jit_fallback.c"
/* A va_list handle is represented as a plain jit pointer. */
34 typedef jit_pointer_t jit_va_list;
/* patch(): shorthand for _patch() that supplies the implicit `_jit` state. */
39 #define patch(instr, node) _patch(_jit, instr, node)
40 static void _patch(jit_state_t*,jit_word_t,jit_node_t*);
/* Cache-flush entry point declared here and called from jit_flush(). */
43 extern void __clear_cache(void *, void *);
/* Register description table for the HPPA backend.
 * Each entry pairs a class mask with the hardware register number and its
 * printable name: rc(gpr)/rc(fpr) select the register file, rc(sav) marks a
 * callee-saved register and rc(arg) an argument register.  Entries without
 * a gpr/fpr class (r0, r1, rp, r19, dp, r31) are described but, per the note
 * below, are kept out of allocation.  The trailing _NOREG entry is a
 * sentinel; _jit_init() excludes it from the register count. */
48 jit_register_t _rvs[] = {
49 { 0, "r0" }, /* Zero */
50 /* Not register starved, so, avoid allocating r1 and rp
51 * due to being implicit target of ADDIL and B,L */
52 { 1, "r1" }, /* Scratch */
53 { 2, "rp" }, /* Return Pointer and scratch */
54 { rc(sav) | 3, "r3" },
55 { 19, "r19" }, /* Linkage Table */
56 { rc(gpr) | 20, "r20" },
57 { rc(gpr) | 21, "r21" },
58 { rc(gpr) | 22, "r22" },
59 { rc(gpr) | 29, "ret1" },
60 { rc(gpr) | 28, "ret0" },
61 /* JIT_Rx in callee save registers due to need to call
62 * functions to implement some instructions */
64 { rc(gpr) | rc(sav) | 4, "r4" },
65 { rc(gpr) | rc(sav) | 5, "r5" },
66 { rc(gpr) | rc(sav) | 6, "r6" },
68 { rc(gpr) | rc(sav) | 7, "r7" },
/* r8 is a callee-saved general register like its neighbours, so it needs
 * the gpr class as well as sav (rc(sav) given twice omitted rc(gpr)). */
69 { rc(gpr) | rc(sav) | 8, "r8" },
70 { rc(gpr) | rc(sav) | 9, "r9" },
72 { rc(gpr) | rc(sav) | 10, "r10" },
74 { rc(gpr) | rc(sav) | 11, "r11" },
75 { rc(gpr) | rc(sav) | 12, "r12" },
76 { rc(gpr) | rc(sav) | 13, "r13" },
77 { rc(gpr) | rc(sav) | 14, "r14" },
78 { rc(gpr) | rc(sav) | 15, "r15" },
79 { rc(gpr) | rc(sav) | 16, "r16" },
80 { rc(gpr) | rc(sav) | 17, "r17" },
81 { rc(gpr) | rc(sav) | 18, "r18" },
83 { rc(gpr) | rc(arg) | 23, "r23" },
84 { rc(gpr) | rc(arg) | 24, "r24" },
85 { rc(gpr) | rc(arg) | 25, "r25" },
86 { rc(gpr) | rc(arg) | 26, "r26" },
87 { 27, "dp" }, /* Data Pointer */
89 { 31, "r31" }, /* Link Register */
90 { rc(fpr) | 31, "fr31" },
91 { rc(fpr) | 30, "fr30" },
92 { rc(fpr) | 29, "fr29" },
93 { rc(fpr) | 28, "fr28" },
94 { rc(fpr) | 27, "fr27" },
95 { rc(fpr) | 26, "fr26" },
96 { rc(fpr) | 25, "fr25" },
97 { rc(fpr) | 24, "fr24" },
98 { rc(fpr) | 23, "fr23" },
99 { rc(fpr) | 22, "fr22" },
100 { rc(fpr) | 11, "fr11" },
101 { rc(fpr) | 10, "fr10" },
102 { rc(fpr) | 9, "fr9" },
103 { rc(fpr) | 8, "fr8" },
105 { rc(fpr) | rc(arg) | 7, "fr7" },
106 { rc(fpr) | rc(arg) | 6, "fr6" },
107 { rc(fpr) | rc(arg) | 5, "fr5" },
108 { rc(fpr) | rc(arg) | 4, "fr4" },
110 { rc(fpr) | rc(sav) | 21, "fr21" },
111 { rc(fpr) | rc(sav) | 20, "fr20" },
112 { rc(fpr) | rc(sav) | 19, "fr19" },
113 { rc(fpr) | rc(sav) | 18, "fr18" },
114 { rc(fpr) | rc(sav) | 17, "fr17" },
115 { rc(fpr) | rc(sav) | 16, "fr16" },
116 { rc(fpr) | rc(sav) | 15, "fr15" },
117 { rc(fpr) | rc(sav) | 14, "fr14" },
118 { rc(fpr) | rc(sav) | 13, "fr13" },
119 { rc(fpr) | rc(sav) | 12, "fr12" },
124 { _NOREG, "<none>" },
133 /* FIXME: assumes PA-RISC 2.0; on PA-RISC 1.0, fr16-fr31 must not be used */
/* Backend initialisation: records the register count as the size of _rvs
 * minus one, which leaves out the trailing _NOREG sentinel entry. */
137 _jit_init(jit_state_t *_jit)
139 _jitc->reglen = jit_size(_rvs) - 1;
/* Start a new function: claim the next slot in the functions vector, reset
 * its argument/frame bookkeeping, and create the prolog and epilog nodes,
 * both of which record the function's index in w.w. */
143 _jit_prolog(jit_state_t *_jit)
/* No argument registers may be pending from a previous function. */
149 assert(jit_regset_cmp_ui(&_jitc->regarg, 0) == 0);
150 jit_regset_set_ui(&_jitc->regsav, 0);
151 offset = _jitc->functions.offset;
/* Grow the functions vector in steps of 16 entries when it is full. */
152 if (offset >= _jitc->functions.length) {
153 jit_realloc((jit_pointer_t *)&_jitc->functions.ptr,
154 _jitc->functions.length * sizeof(jit_function_t),
155 (_jitc->functions.length + 16) * sizeof(jit_function_t));
156 _jitc->functions.length += 16;
158 _jitc->function = _jitc->functions.ptr + _jitc->functions.offset++;
/* Incoming-argument offsets start at params_offset; frame allocations
 * start at alloca_offset; no register argument slots are used yet. */
159 _jitc->function->self.size = params_offset;
160 _jitc->function->self.argi = _jitc->function->self.alen = 0;
161 /* float conversion */
162 _jitc->function->self.aoff = alloca_offset;
163 _jitc->function->self.call = jit_call_default;
/* One jit_int32_t regoff entry per register in the table. */
164 jit_alloc((jit_pointer_t *)&_jitc->function->regoff,
165 _jitc->reglen * sizeof(jit_int32_t));
167 /* _no_link here does not mean the jit_link() call can be removed
169 * _jitc->function->prolog = jit_new_node(jit_code_prolog);
171 _jitc->function->prolog = jit_new_node_no_link(jit_code_prolog);
172 jit_link(_jitc->function->prolog);
173 _jitc->function->prolog->w.w = offset;
174 _jitc->function->epilog = jit_new_node_no_link(jit_code_epilog);
176 * v: offset in blocks vector
177 * w: offset in functions vector
179 _jitc->function->epilog->w.w = offset;
181 jit_regset_new(&_jitc->function->regset);
/* Reserve `length` bytes in the current function's frame.
 * The running frame offset (self.aoff) is first rounded up to a 2-, 4- or
 * 8-byte boundary (the conditions selecting each rounding are not visible
 * in this excerpt); the block's offset is the aligned aoff, and aoff is then
 * advanced by `length`. */
185 _jit_allocai(jit_state_t *_jit, jit_int32_t length)
188 assert(_jitc->function);
193 _jitc->function->self.aoff = (_jitc->function->self.aoff + 1) & -2;
196 _jitc->function->self.aoff = (_jitc->function->self.aoff + 3) & -4;
199 _jitc->function->self.aoff = (_jitc->function->self.aoff + 7) & -8;
/* Only record the synthesized allocai node while not in the realize pass. */
202 if (!_jitc->realize) {
203 jit_inc_synth_ww(allocai, _jitc->function->self.aoff, length);
206 offset = _jitc->function->self.aoff;
207 _jitc->function->self.aoff += length;
/* Run-time stack allocation: `v` is the register holding the requested
 * size and `u` the register that receives the value loaded from the
 * function's aoffoff frame slot. */
212 _jit_allocar(jit_state_t *_jit, jit_int32_t u, jit_int32_t v)
215 assert(_jitc->function);
216 jit_inc_synth_ww(allocar, u, v);
/* First use in this function: reserve an int-sized frame slot (aoffoff). */
217 if (!_jitc->function->allocar) {
218 _jitc->function->aoffoff = jit_allocai(sizeof(jit_int32_t));
219 _jitc->function->allocar = 1;
221 reg = jit_get_reg(jit_class_gpr);
/* Round the requested size up to a multiple of 64 bytes. */
222 jit_addi(reg, v, 63);
223 jit_andi(reg, reg, -64);
224 jit_ldxi_i(u, JIT_FP, _jitc->function->aoffoff);
/* The stack pointer is moved upward by the rounded size. */
225 jit_addr(JIT_SP, JIT_SP, reg);
226 jit_stxi_i(_jitc->function->aoffoff, JIT_FP, u);
/* Plain return: `instr` is patched to target the current function's epilog
 * node (the creation of `instr` is not visible in this excerpt). */
232 _jit_ret(jit_state_t *_jit)
235 assert(_jitc->function);
239 jit_patch_at(instr, _jitc->function->epilog);
/* Return the integer held in register `u`: opens a `retr` synth node and
 * copies `u` into JIT_RET. */
244 _jit_retr(jit_state_t *_jit, jit_int32_t u)
246 jit_inc_synth_w(retr, u);
247 jit_movr(JIT_RET, u);
/* Return the integer immediate `u`: opens a `reti` synth node and loads
 * `u` into JIT_RET. */
253 _jit_reti(jit_state_t *_jit, jit_word_t u)
255 jit_inc_synth_w(reti, u);
256 jit_movi(JIT_RET, u);
/* Return the single-precision value in register `u`: opens a `retr_f`
 * synth node and copies `u` into JIT_FRET. */
262 _jit_retr_f(jit_state_t *_jit, jit_int32_t u)
264 jit_inc_synth_w(retr_f, u);
265 jit_movr_f(JIT_FRET, u);
/* Return the single-precision immediate `u`: opens a `reti_f` synth node
 * and loads `u` into JIT_FRET. */
271 _jit_reti_f(jit_state_t *_jit, jit_float32_t u)
273 jit_inc_synth_f(reti_f, u);
274 jit_movi_f(JIT_FRET, u);
/* Return the double-precision value in register `u`: opens a `retr_d`
 * synth node and copies `u` into JIT_FRET. */
280 _jit_retr_d(jit_state_t *_jit, jit_int32_t u)
282 jit_inc_synth_w(retr_d, u);
283 jit_movr_d(JIT_FRET, u);
/* Return the double-precision immediate `u`: opens a `reti_d` synth node
 * and loads `u` into JIT_FRET. */
289 _jit_reti_d(jit_state_t *_jit, jit_float64_t u)
291 jit_inc_synth_d(reti_d, u);
292 jit_movi_d(JIT_FRET, u);
/* Close the current function: link its (so far unlinked) epilog node into
 * the node list and clear the current-function pointer. */
298 _jit_epilog(jit_state_t *_jit)
300 assert(_jitc->function);
/* The epilog node must not have been linked yet. */
301 assert(_jitc->function->epilog->next == NULL);
302 jit_link(_jitc->function->epilog);
303 _jitc->function = NULL;
/* Tell whether argument node `u` (arg, arg_f or arg_d) lives in a register:
 * true when its recorded offset u->u.w is a register slot index (0..3). */
307 _jit_arg_register_p(jit_state_t *_jit, jit_node_t *u)
309 assert(u->code == jit_code_arg ||
310 u->code == jit_code_arg_f || u->code == jit_code_arg_d);
311 return (jit_arg_reg_p(u->u.w));
/* Mark the start of variadic arguments.  While preparing a call
 * (_jitc->prepare) the varargs flag is set on the pending call; the
 * self.call lines set it on the function being defined, where the
 * register-slot index of the first variadic argument is also saved in vagp.
 * Either flag must not already be set. */
315 _jit_ellipsis(jit_state_t *_jit)
317 jit_inc_synth(ellipsis);
318 if (_jitc->prepare) {
320 assert(!(_jitc->function->call.call & jit_call_varargs));
321 _jitc->function->call.call |= jit_call_varargs;
325 assert(!(_jitc->function->self.call & jit_call_varargs));
326 _jitc->function->self.call |= jit_call_varargs;
328 _jitc->function->vagp = _jitc->function->self.argi;
/* Pass the va_list held in register `u` to a callee; opens a `va_push`
 * synth node (the remainder of the body is not visible in this excerpt). */
334 _jit_va_push(jit_state_t *_jit, jit_int32_t u)
336 jit_inc_synth_w(va_push, u);
/* Declare the next integer argument of the current function.
 * self.size is lowered by one word for every argument.  The node's first
 * operand is the register slot index while slots remain (argi < 4), or the
 * frame offset self.size for a memory argument; the second operand is the
 * 1-based argument ordinal. */
342 _jit_arg(jit_state_t *_jit)
346 assert(_jitc->function);
347 _jitc->function->self.size -= sizeof(jit_word_t);
348 if (jit_arg_reg_p(_jitc->function->self.argi))
349 offset = _jitc->function->self.argi++;
351 offset = _jitc->function->self.size;
352 node = jit_new_node_ww(jit_code_arg, offset,
353 ++_jitc->function->self.argn);
/* Declare the next single-precision argument of the current function.
 * Uses the same bookkeeping as an integer argument: one word of self.size,
 * one register slot index (argi) while slots remain, otherwise the frame
 * offset. */
359 _jit_arg_f(jit_state_t *_jit)
363 assert(_jitc->function);
364 _jitc->function->self.size -= sizeof(jit_word_t);
365 if (jit_arg_reg_p(_jitc->function->self.argi))
366 offset = _jitc->function->self.argi++;
368 offset = _jitc->function->self.size;
369 node = jit_new_node_ww(jit_code_arg_f, offset,
370 ++_jitc->function->self.argn);
/* Declare the next double-precision argument of the current function.
 * A double occupies an even/odd pair of slots: an odd argi is first bumped
 * to the next even index (skipping one word of self.size).  In registers
 * the node records argi + 1 and two slots are consumed; in memory the
 * offset is adjusted by one more word when it is not 8-byte aligned. */
376 _jit_arg_d(jit_state_t *_jit)
380 assert(_jitc->function);
381 if (_jitc->function->self.argi & 1) {
382 ++_jitc->function->self.argi;
383 _jitc->function->self.size -= sizeof(jit_word_t);
385 _jitc->function->self.size -= sizeof(jit_float64_t);
386 if (jit_arg_reg_p(_jitc->function->self.argi)) {
387 offset = _jitc->function->self.argi + 1;
388 _jitc->function->self.argi += 2;
391 /* "Standard" initial value (-52) is unaligned */
392 if (_jitc->function->self.size & 7)
393 _jitc->function->self.size -= sizeof(jit_word_t);
394 offset = _jitc->function->self.size;
396 node = jit_new_node_ww(jit_code_arg_d, offset,
397 ++_jitc->function->self.argn);
/* Load integer argument `v` into register `u` as a signed char.
 * Register arguments are sign-extended from _R26 - slot; memory arguments
 * are loaded from JIT_FP at the argument offset + 3 (presumably the low
 * byte of the big-endian word slot - confirm). */
403 _jit_getarg_c(jit_state_t *_jit, jit_int32_t u, jit_node_t *v)
405 assert(v->code == jit_code_arg);
406 jit_inc_synth_wp(getarg_c, u, v);
408 jit_extr_c(u, _R26 - v->u.w);
410 jit_ldxi_c(u, JIT_FP, v->u.w + 3);
/* Load integer argument `v` into register `u` as an unsigned char.
 * Register arguments are zero-extended from _R26 - slot; memory arguments
 * are loaded from JIT_FP at the argument offset + 3 (presumably the low
 * byte of the big-endian word slot - confirm). */
415 _jit_getarg_uc(jit_state_t *_jit, jit_int32_t u, jit_node_t *v)
417 assert(v->code == jit_code_arg);
418 jit_inc_synth_wp(getarg_uc, u, v);
420 jit_extr_uc(u, _R26 - v->u.w);
422 jit_ldxi_uc(u, JIT_FP, v->u.w + 3);
/* Load integer argument `v` into register `u` as a signed short.
 * Register arguments are sign-extended from _R26 - slot; memory arguments
 * are loaded from JIT_FP at the argument offset + 2 (presumably the low
 * half of the big-endian word slot - confirm). */
427 _jit_getarg_s(jit_state_t *_jit, jit_int32_t u, jit_node_t *v)
429 assert(v->code == jit_code_arg);
430 jit_inc_synth_wp(getarg_s, u, v);
432 jit_extr_s(u, _R26 - v->u.w);
434 jit_ldxi_s(u, JIT_FP, v->u.w + 2);
/* Load integer argument `v` into register `u` as an unsigned short.
 * Register arguments are zero-extended from _R26 - slot; memory arguments
 * are loaded from JIT_FP at the argument offset + 2 (presumably the low
 * half of the big-endian word slot - confirm). */
439 _jit_getarg_us(jit_state_t *_jit, jit_int32_t u, jit_node_t *v)
441 assert(v->code == jit_code_arg);
442 jit_inc_synth_wp(getarg_us, u, v);
444 jit_extr_us(u, _R26 - v->u.w);
446 jit_ldxi_us(u, JIT_FP, v->u.w + 2);
/* Load integer argument `v` into register `u` as a full word: copied from
 * _R26 - slot for register arguments, or loaded from JIT_FP at the
 * argument's frame offset for memory arguments. */
451 _jit_getarg_i(jit_state_t *_jit, jit_int32_t u, jit_node_t *v)
453 assert(v->code == jit_code_arg);
454 jit_inc_synth_wp(getarg_i, u, v);
456 jit_movr(u, _R26 - v->u.w);
458 jit_ldxi_i(u, JIT_FP, v->u.w);
/* Overwrite integer argument `v` with the value of register `u`: written
 * to _R26 - slot for register arguments, or stored at the argument's frame
 * offset from JIT_FP for memory arguments. */
463 _jit_putargr(jit_state_t *_jit, jit_int32_t u, jit_node_t *v)
465 assert(v->code == jit_code_arg);
466 jit_inc_synth_wp(putargr, u, v);
468 jit_movr(_R26 - v->u.w, u);
470 jit_stxi(v->u.w, JIT_FP, u);
/* Overwrite integer argument `v` with the immediate `u`.  Register
 * arguments are loaded directly into _R26 - slot; memory arguments go
 * through a temporary GPR that is stored at the argument's frame offset and
 * then released. */
475 _jit_putargi(jit_state_t *_jit, jit_word_t u, jit_node_t *v)
478 assert(v->code == jit_code_arg);
479 jit_inc_synth_wp(putargi, u, v);
481 jit_movi(_R26 - v->u.w, u);
483 regno = jit_get_reg(jit_class_gpr);
485 jit_stxi(v->u.w, JIT_FP, regno);
486 jit_unget_reg(regno);
/* Load single-precision argument `v` into FPR `u`: copied from _F4 - slot
 * for register arguments, or loaded from JIT_FP at the argument's frame
 * offset for memory arguments. */
492 _jit_getarg_f(jit_state_t *_jit, jit_int32_t u, jit_node_t *v)
494 assert(v->code == jit_code_arg_f);
495 jit_inc_synth_wp(getarg_f, u, v);
497 jit_movr_f(u, _F4 - v->u.w);
499 jit_ldxi_f(u, JIT_FP, v->u.w);
/* Overwrite single-precision argument `v` with FPR `u`: written to
 * _F4 - slot for register arguments, or stored at the argument's frame
 * offset from JIT_FP for memory arguments. */
504 _jit_putargr_f(jit_state_t *_jit, jit_int32_t u, jit_node_t *v)
506 assert(v->code == jit_code_arg_f);
507 jit_inc_synth_wp(putargr_f, u, v);
509 jit_movr_f(_F4 - v->u.w, u);
511 jit_stxi_f(v->u.w, JIT_FP, u);
/* Overwrite single-precision argument `v` with the immediate `u`.
 * Register arguments live in the float argument registers, so the constant
 * is loaded into _F4 - slot, the same register _jit_getarg_f() and
 * _jit_putargr_f() use (a GPR index such as _R26 - slot is not a valid
 * target for jit_movi_f).  Memory arguments go through a temporary FPR that
 * is stored at the argument's frame offset and then released. */
516 _jit_putargi_f(jit_state_t *_jit, jit_float32_t u, jit_node_t *v)
519 assert(v->code == jit_code_arg_f);
520 jit_inc_synth_fp(putargi_f, u, v);
522 jit_movi_f(_F4 - v->u.w, u);
524 regno = jit_get_reg(jit_class_fpr);
525 jit_movi_f(regno, u);
526 jit_stxi_f(v->u.w, JIT_FP, regno);
527 jit_unget_reg(regno);
/* Load double-precision argument `v` into FPR `u`: copied from _F4 - slot
 * for register arguments, or loaded from JIT_FP at the argument's frame
 * offset for memory arguments. */
533 _jit_getarg_d(jit_state_t *_jit, jit_int32_t u, jit_node_t *v)
535 assert(v->code == jit_code_arg_d);
536 jit_inc_synth_wp(getarg_d, u, v);
538 jit_movr_d(u, _F4 - v->u.w);
540 jit_ldxi_d(u, JIT_FP, v->u.w);
/* Overwrite double-precision argument `v` with FPR `u`: written to
 * _F4 - slot for register arguments, or stored at the argument's frame
 * offset from JIT_FP for memory arguments. */
545 _jit_putargr_d(jit_state_t *_jit, jit_int32_t u, jit_node_t *v)
547 assert(v->code == jit_code_arg_d);
548 jit_inc_synth_wp(putargr_d, u, v);
550 jit_movr_d(_F4 - v->u.w, u);
552 jit_stxi_d(v->u.w, JIT_FP, u);
/* Overwrite double-precision argument `v` with the immediate `u`.
 * Register arguments live in the float argument registers, so the constant
 * is loaded into _F4 - slot, the same register _jit_getarg_d() and
 * _jit_putargr_d() use (a GPR index such as _R26 - slot is not a valid
 * target for jit_movi_d).  Memory arguments go through a temporary FPR that
 * is stored at the argument's frame offset and then released. */
557 _jit_putargi_d(jit_state_t *_jit, jit_float64_t u, jit_node_t *v)
560 assert(v->code == jit_code_arg_d);
561 jit_inc_synth_dp(putargi_d, u, v);
563 jit_movi_d(_F4 - v->u.w, u);
565 regno = jit_get_reg(jit_class_fpr);
566 jit_movi_d(regno, u);
567 jit_stxi_d(v->u.w, JIT_FP, regno);
568 jit_unget_reg(regno);
/* Push the integer in register `u` as the next outgoing call argument.
 * call.size is lowered by one word for every argument.  The first four go
 * to _R26 - argi; later ones are stored relative to JIT_SP at
 * call.size + params_offset. */
574 _jit_pushargr(jit_state_t *_jit, jit_int32_t u)
576 assert(_jitc->function);
577 jit_inc_synth_w(pushargr, u);
579 _jitc->function->call.size -= sizeof(jit_word_t);
580 if (jit_arg_reg_p(_jitc->function->call.argi)) {
581 jit_movr(_R26 - _jitc->function->call.argi, u);
582 ++_jitc->function->call.argi;
585 jit_stxi(_jitc->function->call.size + params_offset, JIT_SP, u);
/* Push the integer immediate `u` as the next outgoing call argument.
 * Register slots are loaded directly into _R26 - argi; stack arguments go
 * through a temporary GPR that is stored relative to JIT_SP at
 * call.size + params_offset and then released. */
590 _jit_pushargi(jit_state_t *_jit, jit_word_t u)
593 assert(_jitc->function);
594 jit_inc_synth_w(pushargi, u);
596 _jitc->function->call.size -= sizeof(jit_word_t);
597 if (jit_arg_reg_p(_jitc->function->call.argi)) {
598 jit_movi(_R26 - _jitc->function->call.argi, u);
599 ++_jitc->function->call.argi;
602 regno = jit_get_reg(jit_class_gpr);
604 jit_stxi(_jitc->function->call.size + params_offset, JIT_SP, regno);
605 jit_unget_reg(regno);
/* Push the single-precision value in FPR `u` as the next outgoing argument.
 * Register slots receive the value in _F4 - argi.  In the varargs path the
 * value is additionally bounced through the scratch slot at
 * alloca_offset - 8 (relative to JIT_FP) into the matching GPR
 * _R26 - argi.  Stack arguments are stored relative to JIT_SP. */
611 _jit_pushargr_f(jit_state_t *_jit, jit_int32_t u)
613 assert(_jitc->function);
614 jit_inc_synth_w(pushargr_f, u);
616 _jitc->function->call.size -= sizeof(jit_word_t);
617 if (jit_arg_reg_p(_jitc->function->call.argi)) {
618 jit_movr_f(_F4 - _jitc->function->call.argi, u);
620 /* HP-UX appears to always pass float arguments in gpr registers */
621 if (_jitc->function->call.call & jit_call_varargs)
624 jit_stxi_f(alloca_offset - 8, JIT_FP, u);
625 jit_ldxi(_R26 - _jitc->function->call.argi, JIT_FP,
628 ++_jitc->function->call.argi;
631 jit_stxi_f(_jitc->function->call.size + params_offset, JIT_SP, u);
/* Push the single-precision immediate `u` as the next outgoing argument.
 * Register slots get the constant in _F4 - argi.  In the varargs path that
 * register is additionally bounced through the scratch slot at
 * alloca_offset - 8 (relative to JIT_FP) into the matching GPR
 * _R26 - argi.  Stack arguments go through a temporary FPR stored relative
 * to JIT_SP. */
636 _jit_pushargi_f(jit_state_t *_jit, jit_float32_t u)
639 assert(_jitc->function);
640 jit_inc_synth_f(pushargi_f, u);
642 _jitc->function->call.size -= sizeof(jit_word_t);
643 if (jit_arg_reg_p(_jitc->function->call.argi)) {
644 jit_movi_f(_F4 - _jitc->function->call.argi, u);
646 /* HP-UX appears to always pass float arguments in gpr registers */
647 if (_jitc->function->call.call & jit_call_varargs)
650 jit_stxi_f(alloca_offset - 8, JIT_FP,
651 _F4 - _jitc->function->call.argi);
652 jit_ldxi(_R26 - _jitc->function->call.argi,
653 JIT_FP, alloca_offset - 8);
655 ++_jitc->function->call.argi;
658 regno = jit_get_reg(jit_class_fpr);
659 jit_movi_f(regno, u);
660 jit_stxi_f(_jitc->function->call.size + params_offset, JIT_SP, regno);
661 jit_unget_reg(regno);
/* Push the double-precision value in FPR `u` as the next outgoing argument.
 * A double takes an even/odd slot pair: an odd argi is bumped to the next
 * even index first.  Register slots receive the value in _F4 - (argi + 1).
 * In the varargs path the two words are additionally reloaded from the
 * scratch slot at alloca_offset - 8 into the GPR pair _R26 - argi and
 * _R25 - argi.  Stack arguments are stored relative to JIT_SP at an 8-byte
 * aligned offset. */
667 _jit_pushargr_d(jit_state_t *_jit, jit_int32_t u)
669 assert(_jitc->function);
670 jit_inc_synth_w(pushargr_d, u);
672 _jitc->function->call.size -= sizeof(jit_float64_t);
673 if (_jitc->function->call.argi & 1) {
674 ++_jitc->function->call.argi;
675 _jitc->function->call.size -= sizeof(jit_word_t);
677 if (jit_arg_reg_p(_jitc->function->call.argi)) {
678 jit_movr_d(_F4 - (_jitc->function->call.argi + 1), u);
680 /* HP-UX appears to always pass float arguments in gpr registers */
681 if (_jitc->function->call.call & jit_call_varargs)
684 jit_stxi_d(alloca_offset - 8, JIT_FP, u);
685 jit_ldxi(_R26 - _jitc->function->call.argi,
686 JIT_FP, alloca_offset - 4);
687 jit_ldxi(_R25 - _jitc->function->call.argi,
688 JIT_FP, alloca_offset - 8);
690 _jitc->function->call.argi += 2;
693 /* "Standard" initial value (-52) is unaligned */
694 if ((_jitc->function->call.size + params_offset) & 7)
695 _jitc->function->call.size -= sizeof(jit_word_t);
696 jit_stxi_d(_jitc->function->call.size + params_offset, JIT_SP, u);
/* Push the double-precision immediate `u` as the next outgoing argument.
 * Slot pairing and alignment match the register variant: an odd argi is
 * bumped to the next even index, register slots get the constant in
 * _F4 - (argi + 1), and in the varargs path the two words are reloaded
 * from the scratch slot at alloca_offset - 8 into _R26 - argi and
 * _R25 - argi.  Stack arguments go through a temporary FPR stored relative
 * to JIT_SP at an 8-byte aligned offset. */
702 _jit_pushargi_d(jit_state_t *_jit, jit_float64_t u)
705 assert(_jitc->function);
706 jit_inc_synth_d(pushargi_d, u);
708 _jitc->function->call.size -= sizeof(jit_float64_t);
709 if (_jitc->function->call.argi & 1) {
710 ++_jitc->function->call.argi;
711 _jitc->function->call.size -= sizeof(jit_word_t);
713 if (jit_arg_reg_p(_jitc->function->call.argi)) {
714 jit_movi_d(_F4 - (_jitc->function->call.argi + 1), u);
716 /* HP-UX appears to always pass float arguments in gpr registers */
717 if (_jitc->function->call.call & jit_call_varargs)
720 jit_stxi_d(alloca_offset - 8, JIT_FP,
721 _F4 - (_jitc->function->call.argi + 1));
722 jit_ldxi(_R26 - _jitc->function->call.argi,
723 JIT_FP, alloca_offset - 4);
724 jit_ldxi(_R25 - _jitc->function->call.argi,
725 JIT_FP, alloca_offset - 8);
727 _jitc->function->call.argi += 2;
730 regno = jit_get_reg(jit_class_fpr);
731 jit_movi_d(regno, u);
732 if ((_jitc->function->call.size + params_offset) & 7)
733 _jitc->function->call.size -= sizeof(jit_word_t);
734 jit_stxi_d(_jitc->function->call.size + params_offset, JIT_SP, regno);
735 jit_unget_reg(regno);
/* Tell whether register `regno` carries an argument of call node `node`.
 * Only registers of class `arg` qualify.  For a GPR the index is compared
 * against node->v.w, for an FPR against node->w.w; both are set to the
 * number of used argument slots by _jit_finishr()/_jit_finishi().
 * NOTE(review): the statements that convert `regno` into a slot index
 * before each comparison are not visible in this excerpt. */
741 _jit_regarg_p(jit_state_t *_jit, jit_node_t *node, jit_int32_t regno)
744 spec = jit_class(_rvs[regno].spec);
745 if (spec & jit_class_arg) {
746 if (spec & jit_class_gpr) {
748 if (regno >= 0 && regno < node->v.w)
751 else if (spec & jit_class_fpr) {
753 if (regno >= 0 && regno < node->w.w)
/* Finish a prepared call through register `r0`.
 * self.alen tracks the smallest call.size seen, the call node records the
 * number of argument slots used in both v.w and w.w, and the per-call
 * counters are then reset. */
761 _jit_finishr(jit_state_t *_jit, jit_int32_t r0)
764 assert(_jitc->function);
765 jit_inc_synth_w(finishr, r0);
766 if (_jitc->function->self.alen > _jitc->function->call.size)
767 _jitc->function->self.alen = _jitc->function->call.size;
768 call = jit_callr(r0);
769 call->v.w = call->w.w = _jitc->function->call.argi;
770 _jitc->function->call.argi = _jitc->function->call.size = 0;
/* Finish a prepared call to the absolute address `i0`.
 * self.alen tracks the smallest call.size seen, the call node records the
 * number of argument slots used in both v.w and w.w, and the per-call
 * counters are then reset. */
776 _jit_finishi(jit_state_t *_jit, jit_pointer_t i0)
779 assert(_jitc->function);
780 jit_inc_synth_w(finishi, (jit_word_t)i0);
781 if (_jitc->function->self.alen > _jitc->function->call.size)
782 _jitc->function->self.alen = _jitc->function->call.size;
783 node = jit_calli(i0);
784 node->v.w = node->w.w = _jitc->function->call.argi;
785 _jitc->function->call.argi = _jitc->function->call.size = 0;
/* Fetch a call's result into `r0`, sign-extended from char (from JIT_RET). */
792 _jit_retval_c(jit_state_t *_jit, jit_int32_t r0)
794 jit_inc_synth_w(retval_c, r0);
795 jit_extr_c(r0, JIT_RET);
/* Fetch a call's result into `r0`, zero-extended from unsigned char. */
800 _jit_retval_uc(jit_state_t *_jit, jit_int32_t r0)
802 jit_inc_synth_w(retval_uc, r0);
803 jit_extr_uc(r0, JIT_RET);
/* Fetch a call's result into `r0`, sign-extended from short. */
808 _jit_retval_s(jit_state_t *_jit, jit_int32_t r0)
810 jit_inc_synth_w(retval_s, r0);
811 jit_extr_s(r0, JIT_RET);
/* Fetch a call's result into `r0`, zero-extended from unsigned short. */
816 _jit_retval_us(jit_state_t *_jit, jit_int32_t r0)
818 jit_inc_synth_w(retval_us, r0);
819 jit_extr_us(r0, JIT_RET);
/* Fetch a call's full-word integer result from JIT_RET into `r0`. */
824 _jit_retval_i(jit_state_t *_jit, jit_int32_t r0)
826 jit_inc_synth_w(retval_i, r0);
827 jit_movr(r0, JIT_RET);
/* Fetch a call's single-precision result from JIT_FRET into `r0`. */
832 _jit_retval_f(jit_state_t *_jit, jit_int32_t r0)
834 jit_inc_synth_w(retval_f, r0);
835 jit_movr_f(r0, JIT_FRET);
/* Fetch a call's double-precision result from JIT_FRET into `r0`. */
840 _jit_retval_d(jit_state_t *_jit, jit_int32_t r0)
842 jit_inc_synth_w(retval_d, r0);
843 jit_movr_d(r0, JIT_FRET);
/* Translate the node list into machine code.
 * Walks every node from _jitc->head, dispatches on node->code to the
 * matching emitter, records label addresses, collects forward references
 * through patch(), resolves them once all nodes are emitted, flushes the
 * caches over the generated range and returns the start of the code
 * buffer.  The `undo` state captured at each prolog lets the epilog case
 * rewind and jump to restart_function (the condition triggering the
 * restart is not visible in this excerpt). */
848 _emit_code(jit_state_t *_jit)
858 #if DEVEL_DISASSEMBLER
861 jit_int32_t patch_offset;
863 #if DEVEL_DISASSEMBLER
867 _jitc->function = NULL;
873 undo.patch_offset = 0;
/* Dispatch helper macros: each expands to a `case` label that forwards the
 * node operands to the emitter of the same name.  In the macro names,
 * r = register operand (mapped through rn()), w = immediate word,
 * f = pointer to a float constant held by a data node, b = branch whose
 * target is a label/epilog node. */
875 #define case_rr(name, type) \
876 case jit_code_##name##r##type: \
877 name##r##type(rn(node->u.w), rn(node->v.w)); \
879 #define case_rw(name, type) \
880 case jit_code_##name##i##type: \
881 name##i##type(rn(node->u.w), node->v.w); \
883 #define case_wr(name, type) \
884 case jit_code_##name##i##type: \
885 name##i##type(node->u.w, rn(node->v.w)); \
887 #define case_rrr(name, type) \
888 case jit_code_##name##r##type: \
889 name##r##type(rn(node->u.w), \
890 rn(node->v.w), rn(node->w.w)); \
892 #define case_rrrr(name, type) \
893 case jit_code_##name##r##type: \
894 name##r##type(rn(node->u.q.l), rn(node->u.q.h), \
895 rn(node->v.w), rn(node->w.w)); \
897 #define case_rrw(name, type) \
898 case jit_code_##name##i##type: \
899 name##i##type(rn(node->u.w),rn(node->v.w), node->w.w); \
901 #define case_rrrw(name, type) \
902 case jit_code_##name##i##type: \
903 name##i##type(rn(node->u.q.l), rn(node->u.q.h), \
904 rn(node->v.w), node->w.w); \
906 #define case_rrf(name, type, size) \
907 case jit_code_##name##i##type: \
908 assert(node->flag & jit_flag_data); \
909 name##i##type(rn(node->u.w), rn(node->v.w), \
910 (jit_float##size##_t *)node->w.n->u.w); \
912 #define case_wrr(name, type) \
913 case jit_code_##name##i##type: \
914 name##i##type(node->u.w,rn(node->v.w), rn(node->w.w)); \
916 #define case_brr(name, type) \
917 case jit_code_##name##r##type: \
919 assert(temp->code == jit_code_label || \
920 temp->code == jit_code_epilog); \
921 if (temp->flag & jit_flag_patch) \
922 name##r##type(temp->u.w, rn(node->v.w), \
925 word = name##r##type(_jit->pc.w, \
926 rn(node->v.w), rn(node->w.w)); \
930 #define case_brw(name, type) \
931 case jit_code_##name##i##type: \
933 assert(temp->code == jit_code_label || \
934 temp->code == jit_code_epilog); \
935 if (temp->flag & jit_flag_patch) \
936 name##i##type(temp->u.w, \
937 rn(node->v.w), node->w.w); \
939 word = name##i##type(_jit->pc.w, \
940 rn(node->v.w), node->w.w); \
944 #define case_brf(name, type, size) \
945 case jit_code_##name##i##type: \
947 assert(temp->code == jit_code_label || \
948 temp->code == jit_code_epilog); \
949 if (temp->flag & jit_flag_patch) \
950 name##i##type(temp->u.w, rn(node->v.w), \
951 (jit_float##size##_t *)node->w.n->u.w); \
953 word = name##i##type(_jit->pc.w, rn(node->v.w), \
954 (jit_float##size##_t *)node->w.n->u.w); \
958 #if DEVEL_DISASSEMBLER
/* Main emission loop: one iteration per node, checking first whether the
 * write position has reached the end of the code buffer. */
961 for (node = _jitc->head; node; node = node->next) {
962 if (_jit->pc.uc >= _jitc->code.end)
965 #if DEVEL_DISASSEMBLER
966 node->offset = (jit_uword_t)_jit->pc.w - (jit_uword_t)prevw;
969 value = jit_classify(node->code);
970 jit_regarg_set(node, value);
971 switch (node->code) {
973 assert(!(node->u.w & (node->u.w - 1)) &&
974 node->u.w <= sizeof(jit_word_t));
975 if (node->u.w == sizeof(jit_word_t) &&
976 (word = _jit->pc.w & (sizeof(jit_word_t) - 1)))
977 nop(sizeof(jit_word_t) - word);
979 case jit_code_note: case jit_code_name:
980 node->u.w = _jit->pc.w;
983 /* remember label is defined */
984 node->flag |= jit_flag_patch;
985 node->u.w = _jit->pc.w;
1004 case_rrrr(qmul, _u);
1005 case_rrrw(qmul, _u);
1016 case_rrrr(qdiv, _u);
1017 case_rrrw(qdiv, _u);
1033 casr(rn(node->u.w), rn(node->v.w),
1034 rn(node->w.q.l), rn(node->w.q.h));
1037 casi(rn(node->u.w), node->v.w,
1038 rn(node->w.q.l), rn(node->w.q.h));
1042 if (node->flag & jit_flag_node) {
1044 if (temp->code == jit_code_data ||
1045 (temp->code == jit_code_label &&
1046 (temp->flag & jit_flag_patch)))
1047 movi(rn(node->u.w), temp->u.w);
1049 assert(temp->code == jit_code_label ||
1050 temp->code == jit_code_epilog);
1051 word = movi_p(rn(node->u.w), node->v.w);
1056 movi(rn(node->u.w), node->v.w);
1066 case_rr(bswap, _us);
1067 case_rr(bswap, _ui);
1146 case_brr(boadd, _u);
1147 case_brw(boadd, _u);
1150 case_brr(bxadd, _u);
1151 case_brw(bxadd, _u);
1154 case_brr(bosub, _u);
1155 case_brw(bosub, _u);
1158 case_brr(bxsub, _u);
1159 case_brw(bxsub, _u);
1161 case jit_code_movi_f:
1162 assert(node->flag & jit_flag_data);
1163 movi_f(rn(node->u.w), (jit_float32_t *)node->v.n->u.w);
1166 case jit_code_movi_d:
1167 assert(node->flag & jit_flag_data);
1168 movi_d(rn(node->u.w), (jit_float64_t *)node->v.n->u.w);
1170 case_rr(trunc, _f_i);
1171 case_rr(trunc, _d_i);
1183 case_rrf(add, _f, 32);
1185 case_rrf(add, _d, 64);
1187 case_rrf(sub, _f, 32);
1188 case_rrf(rsb, _f, 32);
1190 case_rrf(sub, _d, 64);
1191 case_rrf(rsb, _d, 64);
1193 case_rrf(mul, _f, 32);
1195 case_rrf(mul, _d, 64);
1197 case_rrf(div, _f, 32);
1199 case_rrf(div, _d, 64);
1201 case_rrf(lt, _f, 32);
1203 case_rrf(lt, _d, 64);
1205 case_rrf(le, _f, 32);
1207 case_rrf(le, _d, 64);
1209 case_rrf(eq, _f, 32);
1211 case_rrf(eq, _d, 64);
1213 case_rrf(ge, _f, 32);
1215 case_rrf(ge, _d, 64);
1217 case_rrf(gt, _f, 32);
1219 case_rrf(gt, _d, 64);
1221 case_rrf(ne, _f, 32);
1223 case_rrf(ne, _d, 64);
1225 case_rrf(unlt, _f, 32);
1227 case_rrf(unlt, _d, 64);
1229 case_rrf(unle, _f, 32);
1231 case_rrf(unle, _d, 64);
1233 case_rrf(uneq, _f, 32);
1235 case_rrf(uneq, _d, 64);
1237 case_rrf(unge, _f, 32);
1239 case_rrf(unge, _d, 64);
1241 case_rrf(ungt, _f, 32);
1243 case_rrf(ungt, _d, 64);
1245 case_rrf(ltgt, _f, 32);
1247 case_rrf(ltgt, _d, 64);
1249 case_rrf(ord, _f, 32);
1251 case_rrf(ord, _d, 64);
1252 case_rrr(unord, _f);
1253 case_rrf(unord, _f, 32);
1254 case_rrr(unord, _d);
1255 case_rrf(unord, _d, 64);
1273 case_brf(blt, _f, 32);
1275 case_brf(blt, _d, 64);
1277 case_brf(ble, _f, 32);
1279 case_brf(ble, _d, 64);
1281 case_brf(beq, _f, 32);
1283 case_brf(beq, _d, 64);
1285 case_brf(bge, _f, 32);
1287 case_brf(bge, _d, 64);
1289 case_brf(bgt, _f, 32);
1291 case_brf(bgt, _d, 64);
1293 case_brf(bne, _f, 32);
1295 case_brf(bne, _d, 64);
1296 case_brr(bunlt, _f);
1297 case_brf(bunlt, _f, 32);
1298 case_brr(bunlt, _d);
1299 case_brf(bunlt, _d, 64);
1300 case_brr(bunle, _f);
1301 case_brf(bunle, _f, 32);
1302 case_brr(bunle, _d);
1303 case_brf(bunle, _d, 64);
1304 case_brr(buneq, _f);
1305 case_brf(buneq, _f, 32);
1306 case_brr(buneq, _d);
1307 case_brf(buneq, _d, 64);
1308 case_brr(bunge, _f);
1309 case_brf(bunge, _f, 32);
1310 case_brr(bunge, _d);
1311 case_brf(bunge, _d, 64);
1312 case_brr(bungt, _f);
1313 case_brf(bungt, _f, 32);
1314 case_brr(bungt, _d);
1315 case_brf(bungt, _d, 64);
1316 case_brr(bltgt, _f);
1317 case_brf(bltgt, _f, 32);
1318 case_brr(bltgt, _d);
1319 case_brf(bltgt, _d, 64);
1321 case_brf(bord, _f, 32);
1323 case_brf(bord, _d, 64);
1324 case_brr(bunord, _f);
1325 case_brf(bunord, _f, 32);
1326 case_brr(bunord, _d);
1327 case_brf(bunord, _d, 64);
1329 jmpr(rn(node->u.w));
1332 if (node->flag & jit_flag_node) {
1334 assert(temp->code == jit_code_label ||
1335 temp->code == jit_code_epilog);
1336 if (temp->flag & jit_flag_patch)
1339 word = jmpi_p(_jit->pc.w);
1346 case jit_code_callr:
1347 callr(rn(node->u.w));
1349 case jit_code_calli:
1350 if (node->flag & jit_flag_node) {
1352 assert(temp->code == jit_code_label ||
1353 temp->code == jit_code_epilog);
1354 if (!(temp->flag & jit_flag_patch)) {
1355 word = calli_p(temp->u.w);
1364 case jit_code_prolog:
1365 _jitc->function = _jitc->functions.ptr + node->w.w;
/* Snapshot the emission state so the function can be re-emitted. */
1367 undo.word = _jit->pc.w;
1368 #if DEVEL_DISASSEMBLER
1371 undo.patch_offset = _jitc->patches.offset;
1376 case jit_code_epilog:
1377 assert(_jitc->function == _jitc->functions.ptr + node->w.w);
/* Restart path: clear the "defined" flag on every label emitted since the
 * prolog, rewind the write position and patch list, and emit again. */
1379 for (temp = undo.node->next;
1380 temp != node; temp = temp->next) {
1381 if (temp->code == jit_code_label ||
1382 temp->code == jit_code_epilog)
1383 temp->flag &= ~jit_flag_patch;
1385 temp->flag &= ~jit_flag_patch;
1387 _jit->pc.w = undo.word;
1388 #if DEVEL_DISASSEMBLER
1391 _jitc->patches.offset = undo.patch_offset;
1392 goto restart_function;
1394 /* remember label is defined */
1395 node->flag |= jit_flag_patch;
1396 node->u.w = _jit->pc.w;
1398 _jitc->function = NULL;
1400 case jit_code_va_start:
1401 vastart(rn(node->u.w));
1403 case jit_code_va_arg:
1404 vaarg(rn(node->u.w), rn(node->v.w));
1406 case jit_code_va_arg_d:
1407 vaarg_d(rn(node->u.w), rn(node->v.w));
1410 case jit_code_arg: case jit_code_ellipsis:
1411 case jit_code_va_push:
1412 case jit_code_allocai: case jit_code_allocar:
1413 case jit_code_arg_f: case jit_code_arg_d:
1414 case jit_code_va_end:
1416 case jit_code_retr: case jit_code_reti:
1417 case jit_code_retr_f: case jit_code_reti_f:
1418 case jit_code_retr_d: case jit_code_reti_d:
1419 case jit_code_getarg_c: case jit_code_getarg_uc:
1420 case jit_code_getarg_s: case jit_code_getarg_us:
1421 case jit_code_getarg_i:
1422 case jit_code_getarg_f: case jit_code_getarg_d:
1423 case jit_code_putargr: case jit_code_putargi:
1424 case jit_code_putargr_f: case jit_code_putargi_f:
1425 case jit_code_putargr_d: case jit_code_putargi_d:
1426 case jit_code_pushargr: case jit_code_pushargi:
1427 case jit_code_pushargr_f: case jit_code_pushargi_f:
1428 case jit_code_pushargr_d: case jit_code_pushargi_d:
1429 case jit_code_retval_c: case jit_code_retval_uc:
1430 case jit_code_retval_s: case jit_code_retval_us:
1431 case jit_code_retval_i:
1432 case jit_code_retval_f: case jit_code_retval_d:
1433 case jit_code_prepare:
1434 case jit_code_finishr: case jit_code_finishi:
1439 jit_regarg_clr(node, value);
1440 assert(_jitc->regarg == 0 && _jitc->synth == 0);
1441 /* update register live state */
/* Resolve the references recorded by patch(): the target address is read
 * from the label node, which is operand v for movi and operand u for every
 * other node kind. */
1457 for (offset = 0; offset < _jitc->patches.offset; offset++) {
1458 node = _jitc->patches.ptr[offset].node;
1459 word = node->code == jit_code_movi ? node->v.n->u.w : node->u.n->u.w;
1460 patch_at(_jitc->patches.ptr[offset].inst, word);
/* Flush caches over the generated range before handing the code out. */
1463 jit_flush(_jit->code.ptr, _jit->pc.uc);
1465 return (_jit->code.ptr);
1469 # include "jit_hppa-cpu.c"
1470 # include "jit_hppa-fpu.c"
1471 # include "jit_fallback.c"
/* Flush the data and instruction caches for the range [fptr, tptr).
 * The range is widened to whole pages: `f` is rounded down and `t` rounded
 * up to the page size reported by sysconf(_SC_PAGE_SIZE).  The visible
 * code contains both a hand-written fdc/fic loop that advances 64 bytes per
 * iteration and a call to __clear_cache(); the conditional that selects
 * between them is not visible in this excerpt. */
1475 jit_flush(void *fptr, void *tptr)
1478 s = sysconf(_SC_PAGE_SIZE);
1479 f = (jit_word_t)fptr & -s;
1480 t = (((jit_word_t)tptr) + s - 1) & -s;
1482 /* --- parisc2.0.pdf ---
1485 The minimum spacing that is guaranteed to work for "self-modifying code" is
1486 shown in the code segment below. Since instruction prefetching is permitted,
1487 any data cache flushes must be separated from any instruction cache flushes
1488 by a SYNC. This will ensure that the "new" instruction will be written to
1489 memory prior to any attempts at prefetching it as an instruction.
1491 LDIL l%newinstr,rnew
1492 LDW r%newinstr(0,rnew),temp
1494 STW temp,r%instr(0,rinstr)
1495 FDC r%instr(0,rinstr)
1500 (at least seven instructions)
1502 This sequence assumes a uniprocessor system. In a multiprocessor system,
1503 software must ensure no processor is executing code which is in the process
1508 Adapted from ffcall/trampoline/cache-hppa.c:__TR_clear_cache to
1509 loop over addresses as it is unlikely from and to addresses would fit in
1510 at most two cachelines.
1511 FIXME A cache line can be 16, 32, or 64 bytes.
1514 * Copyright 1995-1997 Bruno Haible, <bruno@clisp.org>
1516 * This is free software distributed under the GNU General Public Licence
1517 * described in the file COPYING. Contact the author if you don't have this
1518 * or can't live with it. There is ABSOLUTELY NO WARRANTY, explicit or implied,
1522 jit_word_t n = f + 32;
1524 for (; f <= t; n = f + 32, f += 64) {
1525 asm volatile ("fdc 0(0,%0)"
1526 "\n\t" "fdc 0(0,%1)"
1531 asm volatile ("mfsp %%sr0,%1"
1532 "\n\t" "ldsid (0,%4),%0"
1533 "\n\t" "mtsp %0,%%sr0"
1534 "\n\t" "fic 0(%%sr0,%2)"
1535 "\n\t" "fic 0(%%sr0,%3)"
1537 "\n\t" "mtsp %1,%%sr0"
1544 : "=r" (u), "=r" (v)
1545 : "r" (f), "r" (n), "r" (f)
1550 /* This is supposed to work but appears to fail on multiprocessor systems */
1551 __clear_cache((void *)f, (void *)t);
/* Emit a word load of r0 from address r1 + i0; maps both register ids
 * through rn() and forwards to ldxi(). */
1556 _emit_ldxi(jit_state_t *_jit, jit_gpr_t r0, jit_gpr_t r1, jit_word_t i0)
1558 ldxi(rn(r0), rn(r1), i0);
/* Emit a word store of r1 to address r0 + i0; maps both register ids
 * through rn() and forwards to stxi(). */
1562 _emit_stxi(jit_state_t *_jit, jit_word_t i0, jit_gpr_t r0, jit_gpr_t r1)
1564 stxi(i0, rn(r0), rn(r1));
/* Emit a double load of FPR r0 from address r1 + i0; maps both register
 * ids through rn() and forwards to ldxi_d(). */
1568 _emit_ldxi_d(jit_state_t *_jit, jit_fpr_t r0, jit_gpr_t r1, jit_word_t i0)
1570 ldxi_d(rn(r0), rn(r1), i0);
/* Emit a double store of FPR r1 to address r0 + i0; maps both register ids
 * through rn() and forwards to stxi_d(). */
1574 _emit_stxi_d(jit_state_t *_jit, jit_word_t i0, jit_gpr_t r0, jit_fpr_t r1)
1576 stxi_d(i0, rn(r0), rn(r1));
/* Record a forward reference to be fixed up once all code is emitted.
 * `instr` is the address of the instruction to patch and `node` the node
 * whose target label is not defined yet (operand v for movi, operand u for
 * every other node kind).  The (instr, node) pair is appended to the
 * patches vector. */
1580 _patch(jit_state_t *_jit, jit_word_t instr, jit_node_t *node)
1584 assert(node->flag & jit_flag_node);
1585 if (node->code == jit_code_movi)
1586 flag = node->v.n->flag;
1588 flag = node->u.n->flag;
/* A target that is already defined must not be queued for patching. */
1589 assert(!(flag & jit_flag_patch));
/* Grow the patches vector in steps of 1024 entries when it is full. */
1590 if (_jitc->patches.offset >= _jitc->patches.length) {
1591 jit_realloc((jit_pointer_t *)&_jitc->patches.ptr,
1592 _jitc->patches.length * sizeof(jit_patch_t),
1593 (_jitc->patches.length + 1024) * sizeof(jit_patch_t));
1594 _jitc->patches.length += 1024;
1596 _jitc->patches.ptr[_jitc->patches.offset].inst = instr;
1597 _jitc->patches.ptr[_jitc->patches.offset].node = node;
1598 ++_jitc->patches.offset;