2 * Copyright (C) 2013-2023 Free Software Foundation, Inc.
4 * This file is part of GNU lightning.
6 * GNU lightning is free software; you can redistribute it and/or modify it
7 * under the terms of the GNU Lesser General Public License as published
8 * by the Free Software Foundation; either version 3, or (at your option)
11 * GNU lightning is distributed in the hope that it will be useful, but
12 * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
13 * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public
14 * License for more details.
17 * Paulo Cesar Pereira de Andrade
26 #include <lightning.h>
27 #include <lightning/jit_private.h>
30 # define NUM_FLOAT_REG_ARGS 2
32 # define NUM_FLOAT_REG_ARGS 4
/* Argument-slot predicates.  `i` is the zero-based index of an argument
 * within its class: integer indices 0..4 and float indices
 * 0..NUM_FLOAT_REG_ARGS-1 satisfy the test; the argument code in this
 * file treats those as register passed and anything else as a stack
 * offset. */
34 #define jit_arg_reg_p(i) ((i) >= 0 && (i) < 5)
35 #define jit_arg_f_reg_p(i) ((i) >= 0 && (i) < NUM_FLOAT_REG_ARGS)
40 typedef struct jit_va_list {
41 /* The offsets are "1" based, as addresses are fixed in the
42 * standard stack frame format. */
46 /* Easier when there is an explicitly defined type...
48 type = struct __va_list_tag {
51 void *__overflow_arg_area;
52 void *__reg_save_area;
54 Note that gpoff (__gpr) and fpoff (__fpr) are jit_word_t equivalent
55 and, again, "1" (unit) based, so must be adjusted at va_arg time.
60 /* For variadic functions, always allocate space to save callee
62 * Note that s390 has a standard stack frame format that lightning
63 * does not fully comply with, but for variadic functions it must,
64 * for those (variadic) do not use the "empty" spaces for any
65 * callee save fpr register, but save them after the va_list
66 * space; and use the standard stack frame format, as required
67 * by variadic functions (and have a compatible va_list pointer). */
81 #define jit_get_reg_pair() _jit_get_reg_pair(_jit)
82 static jit_int32_t _jit_get_reg_pair(jit_state_t*);
83 #define jit_unget_reg_pair(regno) _jit_unget_reg_pair(_jit,regno)
84 static void _jit_unget_reg_pair(jit_state_t*,jit_int32_t);
85 #define jit_get_reg_but_zero(flags) _jit_get_reg_but_zero(_jit,flags)
86 static jit_int32_t _jit_get_reg_but_zero(jit_state_t*,jit_int32_t);
87 #define jit_unget_reg_but_zero(reg) jit_unget_reg(reg)
88 #define patch(instr, node) _patch(_jit, instr, node)
89 static void _patch(jit_state_t*,jit_word_t,jit_node_t*);
92 extern void __clear_cache(void *, void *);
95 # include "jit_s390-cpu.c"
96 # include "jit_s390-fpu.c"
98 # include "jit_fallback.c"
/* Register descriptor table.  Each entry pairs a spec word -- class
 * bits (rc(gpr) / rc(fpr), optionally rc(arg) and rc(sav)) or'ed with
 * the hardware register number -- with the printable register name.
 * The last entry (_NOREG) is a terminator; _jit_init() leaves it out
 * of the register count. */
106 jit_register_t _rvs[] = {
107 { rc(gpr) | 0x0, "%r0" },
108 { rc(gpr) | 0x1, "%r1" },
109 { rc(gpr) | rc(sav) | 0xc, "%r12" },
110 { rc(gpr) | rc(sav) | 0xb, "%r11" },
111 { rc(gpr) | rc(sav) | 0xa, "%r10" },
112 { rc(gpr) | rc(sav) | 0x9, "%r9" },
113 { rc(gpr) | rc(sav) | 0x8, "%r8" },
114 { rc(gpr) | rc(sav) | 0x7, "%r7" },
115 { rc(gpr) | rc(arg) | rc(sav) | 0x6,"%r6" },
116 { rc(gpr) | rc(arg) | 0x5, "%r5" },
117 { rc(gpr) | rc(arg) | 0x4, "%r4" },
118 { rc(gpr) | rc(arg) | 0x3, "%r3" },
119 { rc(gpr) | rc(arg) | 0x2, "%r2" },
120 { rc(sav) | 0xd, "%r13" }, /* used as JIT_FP */
122 { rc(sav) | 0xf, "%r15" },
123 { rc(fpr) | 0x1, "%f1" },
124 { rc(fpr) | 0x3, "%f3" },
125 { rc(fpr) | 0x5, "%f5" },
126 { rc(fpr) | 0x7, "%f7" },
127 { rc(fpr) | rc(sav) | 0xe, "%f14" },
128 /* Do not use as temporary to simplify stack layout */
130 { rc(fpr) | rc(sav) | 0x8, "%f8" },
131 { rc(fpr) | rc(sav) | 0x9, "%f9" },
132 { rc(fpr) | rc(sav) | 0xa, "%f10" },
133 { rc(fpr) | rc(sav) | 0xb, "%f11" },
134 { rc(fpr) | rc(sav) | 0xc, "%f12" },
135 { rc(fpr) | rc(sav) | 0xd, "%f13" },
136 { rc(fpr) | rc(arg) | 0x6, "%f6" },
137 { rc(fpr) | rc(arg) | 0x4, "%f4" },
138 { rc(fpr) | rc(arg) | 0x2, "%f2" },
139 { rc(fpr) | rc(arg) | 0x0, "%f0" },
140 { _NOREG, "<none>" },
143 static sigjmp_buf jit_env;
/* SIGILL handler: jumps back to the sigsetjmp() context saved in
 * jit_env, making that sigsetjmp() return 1.  `signum` is not used in
 * the visible body. */
151 sigill_handler(int signum)
154 siglongjmp(jit_env, 1);
163 struct sigaction new_action, old_action;
164 new_action.sa_handler = sigill_handler;
165 sigemptyset(&new_action.sa_mask);
166 new_action.sa_flags = 0;
167 sigaction(SIGILL, NULL, &old_action);
168 if (old_action.sa_handler != SIG_IGN) {
169 sigaction(SIGILL, &new_action, NULL);
170 if (!sigsetjmp(jit_env, 1)) {
172 /* flogr %r12, %r12 */
173 __asm__ volatile("lgr %%r12, %0; lgr %%r13, %1;"
174 "flogr %%r12, %%r12;"
175 "lgr %1, %%r13; lgr %0, %%r12;"
176 : "=r" (r12), "=r" (r13));
177 sigaction(SIGILL, &old_action, NULL);
181 /* By default, assume it is available */
/* Backend initialization: sets _jitc->reglen to jit_size(_rvs) - 1,
 * so the _NOREG terminator that ends _rvs is not counted
 * (jit_size() is presumably the element count of the array). */
187 _jit_init(jit_state_t *_jit)
189 _jitc->reglen = jit_size(_rvs) - 1;
/* Starts a new function.
 *
 * - Requires that no argument registers are currently marked
 *   (regarg == 0) and clears regsav.
 * - Grows the functions vector by 16 entries when it is full, then
 *   takes the next jit_function_t slot as the current function.
 * - Initializes the slot: self.size = stack_framesize, argi, argf,
 *   aoff and alen = 0, default call flags, a regoff array of reglen
 *   entries, and a fresh regset.
 * - Creates the prolog and epilog nodes; both store in w.w the index
 *   this function has in the functions vector.  Only the prolog node
 *   is linked here.
 *
 * NOTE(review): the condition guarding "self.aoff = -8" is on a line
 * that is not visible in this extract. */
193 _jit_prolog(jit_state_t *_jit)
199 assert(jit_regset_cmp_ui(&_jitc->regarg, 0) == 0);
200 jit_regset_set_ui(&_jitc->regsav, 0);
201 offset = _jitc->functions.offset;
202 if (offset >= _jitc->functions.length) {
203 jit_realloc((jit_pointer_t *)&_jitc->functions.ptr,
204 _jitc->functions.length * sizeof(jit_function_t),
205 (_jitc->functions.length + 16) * sizeof(jit_function_t));
206 _jitc->functions.length += 16;
208 _jitc->function = _jitc->functions.ptr + _jitc->functions.offset++;
209 _jitc->function->self.size = stack_framesize;
210 _jitc->function->self.argi = _jitc->function->self.argf =
211 _jitc->function->self.aoff = _jitc->function->self.alen = 0;
212 /* preallocate 8 bytes if not using a constant data buffer */
214 _jitc->function->self.aoff = -8;
215 _jitc->function->self.call = jit_call_default;
216 jit_alloc((jit_pointer_t *)&_jitc->function->regoff,
217 _jitc->reglen * sizeof(jit_int32_t));
219 /* _no_link here does not mean the jit_link() call can be removed
221 * _jitc->function->prolog = jit_new_node(jit_code_prolog);
223 _jitc->function->prolog = jit_new_node_no_link(jit_code_prolog);
224 jit_link(_jitc->function->prolog);
225 _jitc->function->prolog->w.w = offset;
226 _jitc->function->epilog = jit_new_node_no_link(jit_code_epilog);
228 * v: offset in blocks vector
229 * w: offset in functions vector
231 _jitc->function->epilog->w.w = offset;
233 jit_regset_new(&_jitc->function->regset);
/* Reserves `length` bytes in the current function's frame and returns
 * the new value of self.aoff (aoff is decremented by `length`).
 *
 * Before the decrement, aoff is rounded down to a multiple of 2, 4 or
 * 8 depending on the selected case label (cases 0 and 1 leave it
 * unaligned).  NOTE(review): the switch operand is on a line not
 * visible here; presumably it is `length`.
 *
 * While the code is not yet being realized, the allocation is also
 * recorded as a synthesized allocai node. */
237 _jit_allocai(jit_state_t *_jit, jit_int32_t length)
239 assert(_jitc->function);
241 case 0: case 1: break;
242 case 2: _jitc->function->self.aoff &= -2; break;
243 case 3: case 4: _jitc->function->self.aoff &= -4; break;
244 default: _jitc->function->self.aoff &= -8; break;
246 _jitc->function->self.aoff -= length;
247 if (!_jitc->realize) {
248 jit_inc_synth_ww(allocai, _jitc->function->self.aoff, length);
251 return (_jitc->function->self.aoff);
/* Emits code for a runtime-sized stack allocation, with u and v as
 * register operands.
 *
 * The first allocar in a function reserves an int32 frame slot
 * (aoffoff) through jit_allocai() and sets the function's allocar
 * flag.  The visible sequence then masks a scratch register with -8,
 * loads the slot at aoffoff into u, adds the scratch register to
 * JIT_SP and stores u back into the slot.
 *
 * NOTE(review): the lines that initialize the scratch register and
 * update u, and the release of the scratch register, are not visible
 * in this extract. */
255 _jit_allocar(jit_state_t *_jit, jit_int32_t u, jit_int32_t v)
258 assert(_jitc->function);
259 jit_inc_synth_ww(allocar, u, v);
260 if (!_jitc->function->allocar) {
261 _jitc->function->aoffoff = jit_allocai(sizeof(jit_int32_t));
262 _jitc->function->allocar = 1;
264 reg = jit_get_reg(jit_class_gpr);
266 jit_andi(reg, reg, -8);
267 jit_ldxi_i(u, JIT_FP, _jitc->function->aoffoff);
269 jit_addr(JIT_SP, JIT_SP, reg);
270 jit_stxi_i(_jitc->function->aoffoff, JIT_FP, u);
/* Return from the current function: `instr` is patched to target the
 * function's epilog node.  NOTE(review): the statement that creates
 * `instr` is not visible in this extract. */
276 _jit_ret(jit_state_t *_jit)
279 assert(_jitc->function);
283 jit_patch_at(instr, _jitc->function->epilog);
/* Return the value held in register u: records a synthesized node of
 * kind `code` and moves u into JIT_RET.  The rest of the body is not
 * visible in this extract. */
288 _jit_retr(jit_state_t *_jit, jit_int32_t u, jit_code_t code)
290 jit_code_inc_synth_w(code, u);
291 jit_movr(JIT_RET, u);
/* Return the immediate word u: records a synthesized node of kind
 * `code` and loads u into JIT_RET.  The rest of the body is not
 * visible in this extract. */
297 _jit_reti(jit_state_t *_jit, jit_word_t u, jit_code_t code)
299 jit_code_inc_synth_w(code, u);
300 jit_movi(JIT_RET, u);
/* Return the single-precision value in register u: records a retr_f
 * synthesized node and moves u into JIT_FRET. */
306 _jit_retr_f(jit_state_t *_jit, jit_int32_t u)
308 jit_inc_synth_w(retr_f, u);
309 jit_movr_f(JIT_FRET, u);
/* Return the single-precision constant u: records a reti_f synthesized
 * node and loads u into JIT_FRET. */
315 _jit_reti_f(jit_state_t *_jit, jit_float32_t u)
317 jit_inc_synth_f(reti_f, u);
318 jit_movi_f(JIT_FRET, u);
/* Return the double-precision value in register u: records a retr_d
 * synthesized node and moves u into JIT_FRET. */
324 _jit_retr_d(jit_state_t *_jit, jit_int32_t u)
326 jit_inc_synth_w(retr_d, u);
327 jit_movr_d(JIT_FRET, u);
/* Return the double-precision constant u: records a reti_d synthesized
 * node and loads u into JIT_FRET. */
333 _jit_reti_d(jit_state_t *_jit, jit_float64_t u)
335 jit_inc_synth_d(reti_d, u);
336 jit_movi_d(JIT_FRET, u);
/* Ends the current function: checks that its epilog node has not been
 * linked yet (next == NULL), links it into the node list and clears
 * _jitc->function so no function is current. */
342 _jit_epilog(jit_state_t *_jit)
344 assert(_jitc->function);
345 assert(_jitc->function->epilog->next == NULL);
346 jit_link(_jitc->function->epilog);
347 _jitc->function = NULL;
/* Tells whether argument node u is register passed.  Nodes whose code
 * lies in jit_code_arg_c..jit_code_arg are tested with
 * jit_arg_reg_p(); any other node must be jit_code_arg_f or
 * jit_code_arg_d and is tested with jit_arg_f_reg_p().  The tested
 * value is u->u.w. */
351 _jit_arg_register_p(jit_state_t *_jit, jit_node_t *u)
353 if (u->code >= jit_code_arg_c && u->code <= jit_code_arg)
354 return (jit_arg_reg_p(u->u.w));
355 assert(u->code == jit_code_arg_f || u->code == jit_code_arg_d);
356 return (jit_arg_f_reg_p(u->u.w));
/* Marks the start of the variadic part of an argument list.
 *
 * While a call is being prepared (_jitc->prepare) the jit_call_varargs
 * flag is set on the pending call; the remaining statements set it on
 * the function being defined, reserve a jit_va_list_t in the frame
 * (vaoff), and record in vagp / vafp the number of integer / float
 * argument registers already consumed (self.argi / self.argf), or the
 * limits 5 / NUM_FLOAT_REG_ARGS.  Either flag must not be set already.
 *
 * NOTE(review): the `else` lines separating these alternatives are not
 * visible in this extract. */
360 _jit_ellipsis(jit_state_t *_jit)
362 jit_inc_synth(ellipsis);
363 if (_jitc->prepare) {
365 assert(!(_jitc->function->call.call & jit_call_varargs));
366 _jitc->function->call.call |= jit_call_varargs;
370 assert(!(_jitc->function->self.call & jit_call_varargs));
371 _jitc->function->self.call |= jit_call_varargs;
373 /* Allocate va_list like object in the stack. */
374 _jitc->function->vaoff = jit_allocai(sizeof(jit_va_list_t));
376 /* Initialize gp offset in save area. */
377 if (jit_arg_reg_p(_jitc->function->self.argi))
378 _jitc->function->vagp = _jitc->function->self.argi;
380 _jitc->function->vagp = 5;
382 /* Initialize fp offset in save area. */
383 if (jit_arg_f_reg_p(_jitc->function->self.argf))
384 _jitc->function->vafp = _jitc->function->self.argf;
386 _jitc->function->vafp = NUM_FLOAT_REG_ARGS;
/* Records a synthesized va_push node for register u.  The rest of the
 * body is not visible in this extract. */
392 _jit_va_push(jit_state_t *_jit, jit_int32_t u)
394 jit_inc_synth_w(va_push, u);
/* Declares the next integer argument of the function being defined.
 * Must be called before the function is marked variadic.
 *
 * While an integer register slot is free the argument gets index
 * self.argi (then incremented); the other assignment uses the current
 * self.size as a frame offset and grows self.size by
 * sizeof(jit_word_t).  The node is created with that value and the
 * incremented argument count self.argn.
 * NOTE(review): the `else` line between the two alternatives is not
 * visible in this extract. */
400 _jit_arg(jit_state_t *_jit, jit_code_t code)
404 assert(_jitc->function);
405 assert(!(_jitc->function->self.call & jit_call_varargs));
406 #if STRONG_TYPE_CHECKING
407 assert(code >= jit_code_arg_c && code <= jit_code_arg);
409 if (jit_arg_reg_p(_jitc->function->self.argi))
410 offset = _jitc->function->self.argi++;
412 offset = _jitc->function->self.size;
413 _jitc->function->self.size += sizeof(jit_word_t);
415 node = jit_new_node_ww(code, offset,
416 ++_jitc->function->self.argn);
/* Declares the next single-precision argument.  A free float register
 * slot yields index self.argf (then incremented); the other assignment
 * uses self.size as a frame offset and grows it by
 * sizeof(jit_word_t).  Creates a jit_code_arg_f node with that value
 * and the incremented self.argn. */
422 _jit_arg_f(jit_state_t *_jit)
426 assert(_jitc->function);
427 if (jit_arg_f_reg_p(_jitc->function->self.argf))
428 offset = _jitc->function->self.argf++;
430 offset = _jitc->function->self.size;
431 _jitc->function->self.size += sizeof(jit_word_t);
433 node = jit_new_node_ww(jit_code_arg_f, offset,
434 ++_jitc->function->self.argn);
/* Declares the next double-precision argument.  A free float register
 * slot yields index self.argf (then incremented); the other assignment
 * uses self.size as a frame offset and grows it by
 * sizeof(jit_float64_t).  Creates a jit_code_arg_d node with that
 * value and the incremented self.argn. */
440 _jit_arg_d(jit_state_t *_jit)
444 assert(_jitc->function);
445 if (jit_arg_f_reg_p(_jitc->function->self.argf))
446 offset = _jitc->function->self.argf++;
448 offset = _jitc->function->self.size;
449 _jitc->function->self.size += sizeof(jit_float64_t);
451 node = jit_new_node_ww(jit_code_arg_d, offset,
452 ++_jitc->function->self.argn);
/* Fetches argument v into register u as a signed char.  A register
 * argument is read from register _R2 - v->u.w through jit_extr_c();
 * the other statement loads it relative to JIT_FP from the last
 * sizeof(jit_int8_t) bytes of the word-sized slot at offset v->u.w. */
458 _jit_getarg_c(jit_state_t *_jit, jit_int32_t u, jit_node_t *v)
460 assert_arg_type(v->code, jit_code_arg_c);
461 jit_inc_synth_wp(getarg_c, u, v);
462 if (jit_arg_reg_p(v->u.w))
463 jit_extr_c(u, _R2 - v->u.w);
465 jit_ldxi_c(u, JIT_FP,
466 v->u.w + (__WORDSIZE >> 3) - sizeof(jit_int8_t));
/* Fetches argument v into register u as an unsigned char.  A register
 * argument is read from register _R2 - v->u.w through jit_extr_uc();
 * the other statement loads it relative to JIT_FP from the last
 * sizeof(jit_uint8_t) bytes of the word-sized slot at offset v->u.w. */
471 _jit_getarg_uc(jit_state_t *_jit, jit_int32_t u, jit_node_t *v)
473 assert_arg_type(v->code, jit_code_arg_c);
474 jit_inc_synth_wp(getarg_uc, u, v);
475 if (jit_arg_reg_p(v->u.w))
476 jit_extr_uc(u, _R2 - v->u.w);
478 jit_ldxi_uc(u, JIT_FP,
479 v->u.w + (__WORDSIZE >> 3) - sizeof(jit_uint8_t));
/* Fetches argument v into register u as a signed short.  A register
 * argument is read from register _R2 - v->u.w through jit_extr_s();
 * the other statement loads it relative to JIT_FP from the last
 * sizeof(jit_int16_t) bytes of the word-sized slot at offset v->u.w. */
484 _jit_getarg_s(jit_state_t *_jit, jit_int32_t u, jit_node_t *v)
486 assert_arg_type(v->code, jit_code_arg_s);
487 jit_inc_synth_wp(getarg_s, u, v);
488 if (jit_arg_reg_p(v->u.w))
489 jit_extr_s(u, _R2 - v->u.w);
491 jit_ldxi_s(u, JIT_FP,
492 v->u.w + (__WORDSIZE >> 3) - sizeof(jit_int16_t));
/* Fetches argument v into register u as an unsigned short.  A register
 * argument is read from register _R2 - v->u.w through jit_extr_us();
 * the other statement loads it relative to JIT_FP from the last
 * sizeof(jit_uint16_t) bytes of the word-sized slot at offset v->u.w. */
497 _jit_getarg_us(jit_state_t *_jit, jit_int32_t u, jit_node_t *v)
499 assert_arg_type(v->code, jit_code_arg_s);
500 jit_inc_synth_wp(getarg_us, u, v);
501 if (jit_arg_reg_p(v->u.w))
502 jit_extr_us(u, _R2 - v->u.w);
504 jit_ldxi_us(u, JIT_FP,
505 v->u.w + (__WORDSIZE >> 3) - sizeof(jit_uint16_t));
/* Fetches argument v into register u as a signed int.  A register
 * argument is taken from register _R2 - v->u.w with either jit_movr()
 * or jit_extr_i(); a stack argument is loaded relative to JIT_FP from
 * the last sizeof(jit_int32_t) bytes of the word-sized slot at offset
 * v->u.w.
 * NOTE(review): the lines choosing between jit_movr() and
 * jit_extr_i() are not visible; presumably a __WORDSIZE check. */
510 _jit_getarg_i(jit_state_t *_jit, jit_int32_t u, jit_node_t *v)
512 assert_arg_type(v->code, jit_code_arg_i);
513 jit_inc_synth_wp(getarg_i, u, v);
514 if (jit_arg_reg_p(v->u.w)) {
516 jit_movr(u, _R2 - v->u.w);
518 jit_extr_i(u, _R2 - v->u.w);
522 jit_ldxi_i(u, JIT_FP,
523 v->u.w + (__WORDSIZE >> 3) - sizeof(jit_int32_t));
/* Fetches argument v into register u as an unsigned int.  A register
 * argument is read from register _R2 - v->u.w through jit_extr_ui();
 * the other statement loads it relative to JIT_FP from the last
 * sizeof(jit_uint32_t) bytes of the word-sized slot at offset v->u.w. */
529 _jit_getarg_ui(jit_state_t *_jit, jit_int32_t u, jit_node_t *v)
531 assert_arg_type(v->code, jit_code_arg_i);
532 jit_inc_synth_wp(getarg_ui, u, v);
533 if (jit_arg_reg_p(v->u.w))
534 jit_extr_ui(u, _R2 - v->u.w);
536 jit_ldxi_ui(u, JIT_FP,
537 v->u.w + (__WORDSIZE >> 3) - sizeof(jit_uint32_t));
/* Fetches argument v into register u as a long.  A register argument
 * is copied from register _R2 - v->u.w; the other statement loads the
 * slot at offset v->u.w relative to JIT_FP. */
542 _jit_getarg_l(jit_state_t *_jit, jit_int32_t u, jit_node_t *v)
544 assert_arg_type(v->code, jit_code_arg_l);
545 jit_inc_synth_wp(getarg_l, u, v);
546 if (jit_arg_reg_p(v->u.w))
547 jit_movr(u, _R2 - v->u.w);
549 jit_ldxi_l(u, JIT_FP, v->u.w);
/* Overwrites integer argument v with the value of register u.  A
 * register argument receives it in register _R2 - v->u.w; the other
 * statement stores u at offset v->u.w relative to JIT_FP.  `code` is
 * checked against the argument's declared type. */
555 _jit_putargr(jit_state_t *_jit, jit_int32_t u, jit_node_t *v, jit_code_t code)
557 assert_putarg_type(code, v->code);
558 jit_code_inc_synth_wp(code, u, v);
559 if (jit_arg_reg_p(v->u.w))
560 jit_movr(_R2 - v->u.w, u);
562 jit_stxi(v->u.w, JIT_FP, u);
/* Overwrites integer argument v with the immediate u.  A register
 * argument is loaded directly into register _R2 - v->u.w; for a stack
 * argument a temporary gpr is acquired, stored at offset v->u.w
 * relative to JIT_FP and released.
 * NOTE(review): the line loading u into the temporary is not visible
 * in this extract. */
567 _jit_putargi(jit_state_t *_jit, jit_word_t u, jit_node_t *v, jit_code_t code)
570 assert_putarg_type(code, v->code);
571 jit_code_inc_synth_wp(code, u, v);
572 if (jit_arg_reg_p(v->u.w))
573 jit_movi(_R2 - v->u.w, u);
575 regno = jit_get_reg(jit_class_gpr);
577 jit_stxi(v->u.w, JIT_FP, regno);
578 jit_unget_reg(regno);
/* Fetches single-precision argument v into register u.  A register
 * argument is copied from register _F0 - v->u.w; the other statement
 * loads it relative to JIT_FP.
 * NOTE(review): most of the load's offset expression is on lines not
 * visible here; only a "+ (__WORDSIZE >> 3) - sizeof(jit_float32_t)"
 * term is shown. */
584 _jit_getarg_f(jit_state_t *_jit, jit_int32_t u, jit_node_t *v)
586 assert(v->code == jit_code_arg_f);
587 jit_inc_synth_wp(getarg_f, u, v);
588 if (jit_arg_f_reg_p(v->u.w))
589 jit_movr_f(u, _F0 - v->u.w);
591 jit_ldxi_f(u, JIT_FP,
594 + (__WORDSIZE >> 3) - sizeof(jit_float32_t)
/* Overwrites single-precision argument v with register u.  A register
 * argument receives it in register _F0 - v->u.w.
 * NOTE(review): the stack-argument store is not visible here apart
 * from a "+ (__WORDSIZE >> 3) - sizeof(jit_float32_t)" offset term. */
601 _jit_putargr_f(jit_state_t *_jit, jit_int32_t u, jit_node_t *v)
603 assert(v->code == jit_code_arg_f);
604 jit_inc_synth_wp(putargr_f, u, v);
605 if (jit_arg_f_reg_p(v->u.w))
606 jit_movr_f(_F0 - v->u.w, u);
610 + (__WORDSIZE >> 3) - sizeof(jit_float32_t)
/* Overwrites single-precision argument v with the constant u.  A
 * register argument is loaded directly into register _F0 - v->u.w;
 * for a stack argument the constant is first loaded into a temporary
 * fpr, which is released afterwards.
 * NOTE(review): the store of the temporary is not visible here apart
 * from a "+ (__WORDSIZE >> 3) - sizeof(jit_float32_t)" offset term. */
617 _jit_putargi_f(jit_state_t *_jit, jit_float32_t u, jit_node_t *v)
620 assert(v->code == jit_code_arg_f);
621 jit_inc_synth_fp(putargi_f, u, v);
622 if (jit_arg_f_reg_p(v->u.w))
623 jit_movi_f(_F0 - v->u.w, u);
625 regno = jit_get_reg(jit_class_fpr);
626 jit_movi_f(regno, u);
629 + (__WORDSIZE >> 3) - sizeof(jit_float32_t)
632 jit_unget_reg(regno);
/* Fetches double-precision argument v into register u.  A register
 * argument is copied from register _F0 - v->u.w; the other statement
 * loads the slot at offset v->u.w relative to JIT_FP. */
638 _jit_getarg_d(jit_state_t *_jit, jit_int32_t u, jit_node_t *v)
640 assert(v->code == jit_code_arg_d);
641 jit_inc_synth_wp(getarg_d, u, v);
642 if (jit_arg_f_reg_p(v->u.w))
643 jit_movr_d(u, _F0 - v->u.w);
645 jit_ldxi_d(u, JIT_FP, v->u.w);
/* Overwrites double-precision argument v with register u.  A register
 * argument receives it in register _F0 - v->u.w; the other statement
 * stores u at offset v->u.w relative to JIT_FP. */
650 _jit_putargr_d(jit_state_t *_jit, jit_int32_t u, jit_node_t *v)
652 assert(v->code == jit_code_arg_d);
653 jit_inc_synth_wp(putargr_d, u, v);
654 if (jit_arg_f_reg_p(v->u.w))
655 jit_movr_d(_F0 - v->u.w, u);
657 jit_stxi_d(v->u.w, JIT_FP, u);
/* Overwrites double-precision argument v with the constant u.  A
 * register argument is loaded directly into register _F0 - v->u.w;
 * for a stack argument the constant goes through a temporary fpr that
 * is stored at offset v->u.w relative to JIT_FP and then released. */
662 _jit_putargi_d(jit_state_t *_jit, jit_float64_t u, jit_node_t *v)
665 assert(v->code == jit_code_arg_d);
666 jit_inc_synth_dp(putargi_d, u, v);
667 if (jit_arg_f_reg_p(v->u.w))
668 jit_movi_d(_F0 - v->u.w, u);
670 regno = jit_get_reg(jit_class_fpr);
671 jit_movi_d(regno, u);
672 jit_stxi_d(v->u.w, JIT_FP, regno);
673 jit_unget_reg(regno);
/* Passes register u as the next integer argument of the call being
 * prepared.  While an integer argument register is free the value is
 * moved to register _R2 - call.argi and call.argi is incremented;
 * the other statements store it at call.size + stack_framesize
 * relative to JIT_SP and grow call.size by sizeof(jit_word_t). */
679 _jit_pushargr(jit_state_t *_jit, jit_int32_t u, jit_code_t code)
681 assert(_jitc->function);
682 jit_code_inc_synth_w(code, u);
684 if (jit_arg_reg_p(_jitc->function->call.argi)) {
685 jit_movr(_R2 - _jitc->function->call.argi, u);
686 ++_jitc->function->call.argi;
689 jit_stxi(_jitc->function->call.size + stack_framesize, JIT_SP, u);
690 _jitc->function->call.size += sizeof(jit_word_t);
/* Passes the immediate u as the next integer argument of the call
 * being prepared.  While an integer argument register is free the
 * value is loaded into register _R2 - call.argi and call.argi is
 * incremented; the other statements store a temporary gpr at
 * call.size + stack_framesize relative to JIT_SP, release it and
 * grow call.size by sizeof(jit_word_t).
 * NOTE(review): the line loading u into the temporary is not visible
 * in this extract. */
696 _jit_pushargi(jit_state_t *_jit, jit_word_t u, jit_code_t code)
699 assert(_jitc->function);
700 jit_code_inc_synth_w(code, u);
702 if (jit_arg_reg_p(_jitc->function->call.argi)) {
703 jit_movi(_R2 - _jitc->function->call.argi, u);
704 ++_jitc->function->call.argi;
707 regno = jit_get_reg(jit_class_gpr);
709 jit_stxi(_jitc->function->call.size + stack_framesize, JIT_SP, regno);
710 jit_unget_reg(regno);
711 _jitc->function->call.size += sizeof(jit_word_t);
/* Passes single-precision register u as the next float argument of the
 * call being prepared.  While a float argument register is free the
 * value is moved to register _F0 - call.argf and call.argf is
 * incremented; the other statements store it in the outgoing area
 * starting at call.size + stack_framesize and grow call.size by
 * sizeof(jit_word_t).
 * NOTE(review): part of the store's operand list is not visible in
 * this extract. */
717 _jit_pushargr_f(jit_state_t *_jit, jit_int32_t u)
719 assert(_jitc->function);
720 jit_inc_synth_w(pushargr_f, u);
722 if (jit_arg_f_reg_p(_jitc->function->call.argf)) {
723 jit_movr_f(_F0 - _jitc->function->call.argf, u);
724 ++_jitc->function->call.argf;
727 jit_stxi_f(_jitc->function->call.size + stack_framesize
729 + (__WORDSIZE >> 3) - sizeof(jit_float32_t)
732 _jitc->function->call.size += sizeof(jit_word_t);
/* Passes the single-precision constant u as the next float argument of
 * the call being prepared.  While a float argument register is free
 * the constant is loaded into register _F0 - call.argf and call.argf
 * is incremented; the other statements load it into a temporary fpr,
 * store that in the outgoing area starting at
 * call.size + stack_framesize, release it and grow call.size by
 * sizeof(jit_word_t).
 * NOTE(review): part of the store's operand list is not visible in
 * this extract. */
738 _jit_pushargi_f(jit_state_t *_jit, jit_float32_t u)
741 assert(_jitc->function);
742 jit_inc_synth_f(pushargi_f, u);
744 if (jit_arg_f_reg_p(_jitc->function->call.argf)) {
745 jit_movi_f(_F0 - _jitc->function->call.argf, u);
746 ++_jitc->function->call.argf;
749 regno = jit_get_reg(jit_class_fpr);
750 jit_movi_f(regno, u);
751 jit_stxi_f(_jitc->function->call.size + stack_framesize
753 + (__WORDSIZE >> 3) - sizeof(jit_float32_t)
756 jit_unget_reg(regno);
757 _jitc->function->call.size += sizeof(jit_word_t);
/* Passes double-precision register u as the next float argument of the
 * call being prepared.  While a float argument register is free the
 * value is moved to register _F0 - call.argf and call.argf is
 * incremented; the other statements store it at
 * call.size + stack_framesize relative to JIT_SP and grow call.size
 * by sizeof(jit_float64_t). */
763 _jit_pushargr_d(jit_state_t *_jit, jit_int32_t u)
765 assert(_jitc->function);
766 jit_inc_synth_w(pushargr_d, u);
768 if (jit_arg_f_reg_p(_jitc->function->call.argf)) {
769 jit_movr_d(_F0 - _jitc->function->call.argf, u);
770 ++_jitc->function->call.argf;
773 jit_stxi_d(_jitc->function->call.size + stack_framesize, JIT_SP, u);
774 _jitc->function->call.size += sizeof(jit_float64_t);
/* Passes the double-precision constant u as the next float argument of
 * the call being prepared.  While a float argument register is free
 * the constant is loaded into register _F0 - call.argf and call.argf
 * is incremented; the other statements load it into a temporary fpr,
 * store that at call.size + stack_framesize relative to JIT_SP,
 * release it and grow call.size by sizeof(jit_float64_t). */
780 _jit_pushargi_d(jit_state_t *_jit, jit_float64_t u)
783 assert(_jitc->function);
784 jit_inc_synth_d(pushargi_d, u);
786 if (jit_arg_f_reg_p(_jitc->function->call.argf)) {
787 jit_movi_d(_F0 - _jitc->function->call.argf, u);
788 ++_jitc->function->call.argf;
791 regno = jit_get_reg(jit_class_fpr);
792 jit_movi_d(regno, u);
793 jit_stxi_d(_jitc->function->call.size + stack_framesize, JIT_SP, regno);
794 jit_unget_reg(regno);
795 _jitc->function->call.size += sizeof(jit_float64_t);
/* Tests whether register regno carries an argument of call `node`.
 * Only registers whose _rvs spec has jit_class_arg are considered.
 * The register's argument index is compared against node->v.w, and
 * for jit_class_fpr registers against node->w.w; _jit_finishr() and
 * _jit_finishi() store the call's integer and float register counts
 * in those two fields.
 * NOTE(review): the lines converting regno into an argument index and
 * the return statements are not visible in this extract. */
801 _jit_regarg_p(jit_state_t *_jit, jit_node_t *node, jit_int32_t regno)
804 spec = jit_class(_rvs[regno].spec);
805 if (spec & jit_class_arg) {
807 if (regno >= 0 && regno < node->v.w)
809 if (spec & jit_class_fpr) {
811 if (regno >= 0 && regno < node->w.w)
/* Completes a prepared call through register r0.  Raises self.alen to
 * the call's stack argument size if that is larger, emits the callr
 * node, stores the number of integer (v.w) and float (w.w) argument
 * registers used on that node, then resets call.argi, call.argf and
 * call.size to 0 for the next call. */
819 _jit_finishr(jit_state_t *_jit, jit_int32_t r0)
822 assert(_jitc->function);
823 jit_inc_synth_w(finishr, r0);
824 if (_jitc->function->self.alen < _jitc->function->call.size)
825 _jitc->function->self.alen = _jitc->function->call.size;
826 call = jit_callr(r0);
827 call->v.w = _jitc->function->call.argi;
828 call->w.w = _jitc->function->call.argf;
829 _jitc->function->call.argi = _jitc->function->call.argf =
830 _jitc->function->call.size = 0;
/* Completes a prepared call to the address i0.  Raises self.alen to
 * the call's stack argument size if that is larger, emits the calli
 * node, stores the number of integer (v.w) and float (w.w) argument
 * registers used on that node, then resets call.argi, call.argf and
 * call.size to 0 for the next call. */
836 _jit_finishi(jit_state_t *_jit, jit_pointer_t i0)
839 assert(_jitc->function);
840 jit_inc_synth_w(finishi, (jit_word_t)i0);
841 if (_jitc->function->self.alen < _jitc->function->call.size)
842 _jitc->function->self.alen = _jitc->function->call.size;
843 node = jit_calli(i0);
844 node->v.w = _jitc->function->call.argi;
845 node->w.w = _jitc->function->call.argf;
846 _jitc->function->call.argi = _jitc->function->call.argf =
847 _jitc->function->call.size = 0;
/* Fetches a call's signed char result: applies jit_extr_c() to
 * JIT_RET and places the result in r0. */
854 _jit_retval_c(jit_state_t *_jit, jit_int32_t r0)
856 jit_inc_synth_w(retval_c, r0);
857 jit_extr_c(r0, JIT_RET);
/* Fetches a call's unsigned char result: applies jit_extr_uc() to
 * JIT_RET and places the result in r0. */
862 _jit_retval_uc(jit_state_t *_jit, jit_int32_t r0)
864 jit_inc_synth_w(retval_uc, r0);
865 jit_extr_uc(r0, JIT_RET);
/* Fetches a call's signed short result: applies jit_extr_s() to
 * JIT_RET and places the result in r0. */
870 _jit_retval_s(jit_state_t *_jit, jit_int32_t r0)
872 jit_inc_synth_w(retval_s, r0);
873 jit_extr_s(r0, JIT_RET);
/* Fetches a call's unsigned short result: applies jit_extr_us() to
 * JIT_RET and places the result in r0. */
878 _jit_retval_us(jit_state_t *_jit, jit_int32_t r0)
880 jit_inc_synth_w(retval_us, r0);
881 jit_extr_us(r0, JIT_RET);
/* Fetches a call's int result from JIT_RET into r0, using either
 * jit_extr_i() or a plain jit_movr().
 * NOTE(review): the lines choosing between the two are not visible;
 * presumably a __WORDSIZE check. */
886 _jit_retval_i(jit_state_t *_jit, jit_int32_t r0)
888 jit_inc_synth_w(retval_i, r0);
890 jit_extr_i(r0, JIT_RET);
892 jit_movr(r0, JIT_RET);
/* Fetches a call's unsigned int result: applies jit_extr_ui() to
 * JIT_RET and places the result in r0. */
899 _jit_retval_ui(jit_state_t *_jit, jit_int32_t r0)
901 jit_inc_synth_w(retval_ui, r0);
902 jit_extr_ui(r0, JIT_RET);
/* Fetches a call's long result: copies JIT_RET into r0 unchanged. */
907 _jit_retval_l(jit_state_t *_jit, jit_int32_t r0)
909 jit_inc_synth_w(retval_l, r0);
910 jit_movr(r0, JIT_RET);
/* Fetches a call's single-precision result: copies JIT_FRET into r0. */
916 _jit_retval_f(jit_state_t *_jit, jit_int32_t r0)
918 jit_inc_synth_w(retval_f, r0);
919 jit_movr_f(r0, JIT_FRET);
/* Fetches a call's double-precision result: copies JIT_FRET into r0. */
924 _jit_retval_d(jit_state_t *_jit, jit_int32_t r0)
926 jit_inc_synth_w(retval_d, r0);
927 jit_movr_d(r0, JIT_FRET);
932 _emit_code(jit_state_t *_jit)
943 #if DEVEL_DISASSEMBLER
946 jit_int32_t patch_offset;
948 #if DEVEL_DISASSEMBLER
952 _jitc->function = NULL;
958 undo.patch_offset = 0;
960 #define assert_data(node) /**/
961 #define case_rr(name, type) \
962 case jit_code_##name##r##type: \
963 name##r##type(rn(node->u.w), rn(node->v.w)); \
965 #define case_rw(name, type) \
966 case jit_code_##name##i##type: \
967 name##i##type(rn(node->u.w), node->v.w); \
969 #define case_wr(name, type) \
970 case jit_code_##name##i##type: \
971 name##i##type(node->u.w, rn(node->v.w)); \
973 #define case_rrr(name, type) \
974 case jit_code_##name##r##type: \
975 name##r##type(rn(node->u.w), \
976 rn(node->v.w), rn(node->w.w)); \
978 #define case_rrrr(name, type) \
979 case jit_code_##name##r##type: \
980 name##r##type(rn(node->u.q.l), rn(node->u.q.h), \
981 rn(node->v.w), rn(node->w.w)); \
983 #define case_rrw(name, type) \
984 case jit_code_##name##i##type: \
985 name##i##type(rn(node->u.w), rn(node->v.w), node->w.w); \
987 #define case_rrrw(name, type) \
988 case jit_code_##name##i##type: \
989 name##i##type(rn(node->u.q.l), rn(node->u.q.h), \
990 rn(node->v.w), node->w.w); \
992 #define case_rrf(name) \
993 case jit_code_##name##i_f: \
995 name##i_f(rn(node->u.w), rn(node->v.w), \
996 (jit_float32_t *)node->w.n->u.w); \
998 #define case_rrd(name) \
999 case jit_code_##name##i_d: \
1000 assert_data(node); \
1001 name##i_d(rn(node->u.w), rn(node->v.w), \
1002 (jit_float64_t *)node->w.n->u.w); \
1004 #define case_wrr(name, type) \
1005 case jit_code_##name##i##type: \
1006 name##i##type(node->u.w, rn(node->v.w), rn(node->w.w)); \
1008 #define case_brr(name, type) \
1009 case jit_code_##name##r##type: \
1011 assert(temp->code == jit_code_label || \
1012 temp->code == jit_code_epilog); \
1013 if (temp->flag & jit_flag_patch) \
1014 name##r##type(temp->u.w, rn(node->v.w), \
1017 word = name##r##type##_p(_jit->pc.w, \
1020 patch(word, node); \
1023 #define case_brw(name, type) \
1024 case jit_code_##name##i##type: \
1026 assert(temp->code == jit_code_label || \
1027 temp->code == jit_code_epilog); \
1028 if (temp->flag & jit_flag_patch) \
1029 name##i##type(temp->u.w, \
1030 rn(node->v.w), node->w.w); \
1032 word = name##i##type##_p(_jit->pc.w, \
1033 rn(node->v.w), node->w.w); \
1034 patch(word, node); \
1037 #define case_brf(name) \
1038 case jit_code_##name##i_f: \
1040 assert(temp->code == jit_code_label || \
1041 temp->code == jit_code_epilog); \
1042 if (temp->flag & jit_flag_patch) \
1043 name##i_f(temp->u.w, rn(node->v.w), \
1044 (jit_float32_t *)node->w.n->u.w); \
1046 word = name##i_f_p(_jit->pc.w, rn(node->v.w), \
1047 (jit_float32_t *)node->w.n->u.w);\
1048 patch(word, node); \
1051 #define case_brd(name) \
1052 case jit_code_##name##i_d: \
1054 assert(temp->code == jit_code_label || \
1055 temp->code == jit_code_epilog); \
1056 if (temp->flag & jit_flag_patch) \
1057 name##i_d(temp->u.w, rn(node->v.w), \
1058 (jit_float64_t *)node->w.n->u.w); \
1060 word = name##i_d_p(_jit->pc.w, rn(node->v.w), \
1061 (jit_float64_t *)node->w.n->u.w);\
1062 patch(word, node); \
1065 #if DEVEL_DISASSEMBLER
1068 for (node = _jitc->head; node; node = node->next) {
1069 if (_jit->pc.uc >= _jitc->code.end)
1072 #if DEVEL_DISASSEMBLER
1073 node->offset = (jit_uword_t)_jit->pc.w - (jit_uword_t)prevw;
1076 value = jit_classify(node->code);
1077 jit_regarg_set(node, value);
1078 switch (node->code) {
1079 case jit_code_align:
1080 /* Must align to a power of two */
1081 assert(!(node->u.w & (node->u.w - 1)));
1082 if ((word = _jit->pc.w & (node->u.w - 1)))
1083 nop(node->u.w - word);
1086 nop((node->u.w + 1) & ~1);
1088 case jit_code_note: case jit_code_name:
1089 node->u.w = _jit->pc.w;
1091 case jit_code_label:
1092 if ((node->link || (node->flag & jit_flag_use)) &&
1093 (word = _jit->pc.w & 3))
1095 /* remember label is defined */
1096 node->flag |= jit_flag_patch;
1097 node->u.w = _jit->pc.w;
1116 case_rrrr(qmul, _u);
1117 case_rrrw(qmul, _u);
1128 case_rrrr(qdiv, _u);
1129 case_rrrw(qdiv, _u);
1148 case_rr(trunc, _f_i);
1149 case_rr(trunc, _d_i);
1150 #if __WORDSIZE == 64
1151 case_rr(trunc, _f_l);
1152 case_rr(trunc, _d_l);
1164 #if __WORDSIZE == 64
1180 #if __WORDSIZE == 64
1192 #if __WORDSIZE == 64
1202 #if __WORDSIZE == 64
1208 #if __WORDSIZE == 64
1211 case_rr(bswap, _us);
1212 case_rr(bswap, _ui);
1213 #if __WORDSIZE == 64
1214 case_rr(bswap, _ul);
1220 #if __WORDSIZE == 64
1225 casr(rn(node->u.w), rn(node->v.w),
1226 rn(node->w.q.l), rn(node->w.q.h));
1229 casi(rn(node->u.w), node->v.w,
1230 rn(node->w.q.l), rn(node->w.q.h));
1236 if (node->flag & jit_flag_node) {
1238 if (temp->code == jit_code_data ||
1239 (temp->code == jit_code_label &&
1240 (temp->flag & jit_flag_patch)))
1241 movi(rn(node->u.w), temp->u.w);
1243 assert(temp->code == jit_code_label ||
1244 temp->code == jit_code_epilog);
1245 word = movi_p(rn(node->u.w), temp->u.w);
1250 movi(rn(node->u.w), node->v.w);
1294 case_brr(boadd, _u);
1295 case_brw(boadd, _u);
1298 case_brr(bxadd, _u);
1299 case_brw(bxadd, _u);
1302 case_brr(bosub, _u);
1303 case_brw(bosub, _u);
1306 case_brr(bxsub, _u);
1307 case_brw(bxsub, _u);
1334 case jit_code_movi_f:
1336 movi_f(rn(node->u.w), (jit_float32_t *)node->v.n->u.w);
1365 case_rrr(unord, _f);
1379 case_brr(bunlt, _f);
1381 case_brr(bunle, _f);
1383 case_brr(buneq, _f);
1385 case_brr(bunge, _f);
1387 case_brr(bungt, _f);
1389 case_brr(bltgt, _f);
1393 case_brr(bunord, _f);
1417 case jit_code_movi_d:
1419 movi_d(rn(node->u.w), (jit_float64_t *)node->v.n->u.w);
1448 case_rrr(unord, _d);
1462 case_brr(bunlt, _d);
1464 case_brr(bunle, _d);
1466 case_brr(buneq, _d);
1468 case_brr(bunge, _d);
1470 case_brr(bungt, _d);
1472 case_brr(bltgt, _d);
1476 case_brr(bunord, _d);
1479 jmpr(rn(node->u.w));
1482 if (node->flag & jit_flag_node) {
1484 assert(temp->code == jit_code_label ||
1485 temp->code == jit_code_epilog);
1486 if (temp->flag & jit_flag_patch)
1489 word = _jit->code.length -
1490 (_jit->pc.uc - _jit->code.ptr);
1492 offset = s16_p(word);
1493 word = jmpi(_jit->pc.w, offset);
1496 word = jmpi_p(_jit->pc.w);
1503 case jit_code_callr:
1504 callr(rn(node->u.w));
1506 case jit_code_calli:
1507 if (node->flag & jit_flag_node) {
1509 assert(temp->code == jit_code_label ||
1510 temp->code == jit_code_epilog);
1511 if (temp->flag & jit_flag_patch)
1512 calli(temp->u.w, 1);
1514 word = _jit->code.length -
1515 (_jit->pc.uc - _jit->code.ptr);
1517 offset =s16_p(word);
1518 word = calli(_jit->pc.w, offset);
1521 word = calli_p(_jit->pc.w);
1526 calli(node->u.w, 1);
1528 case jit_code_prolog:
1529 _jitc->function = _jitc->functions.ptr + node->w.w;
1531 undo.word = _jit->pc.w;
1532 memcpy(&undo.func, _jitc->function, sizeof(undo.func));
1533 #if DEVEL_DISASSEMBLER
1536 undo.patch_offset = _jitc->patches.offset;
1541 case jit_code_epilog:
1542 assert(_jitc->function == _jitc->functions.ptr + node->w.w);
1544 for (temp = undo.node->next;
1545 temp != node; temp = temp->next) {
1546 if (temp->code == jit_code_label ||
1547 temp->code == jit_code_epilog)
1548 temp->flag &= ~jit_flag_patch;
1550 temp->flag &= ~jit_flag_patch;
1552 _jit->pc.w = undo.word;
1553 /* undo.func.self.aoff and undo.func.regset should not
1554 * be undone, as they will be further updated, and are
1555 * the reason of the undo. */
1556 undo.func.self.aoff = _jitc->function->frame +
1557 _jitc->function->self.aoff;
1558 jit_regset_set(&undo.func.regset, &_jitc->function->regset);
1559 /* allocar information also does not need to be undone */
1560 undo.func.aoffoff = _jitc->function->aoffoff;
1561 undo.func.allocar = _jitc->function->allocar;
1562 memcpy(_jitc->function, &undo.func, sizeof(undo.func));
1563 #if DEVEL_DISASSEMBLER
1566 _jitc->patches.offset = undo.patch_offset;
1567 goto restart_function;
1569 if (node->link && (word = _jit->pc.w & 3))
1571 /* remember label is defined */
1572 node->flag |= jit_flag_patch;
1573 node->u.w = _jit->pc.w;
1575 _jitc->function = NULL;
1577 case jit_code_va_start:
1578 vastart(rn(node->u.w));
1580 case jit_code_va_arg:
1581 vaarg(rn(node->u.w), rn(node->v.w));
1583 case jit_code_va_arg_d:
1584 vaarg_d(rn(node->u.w), rn(node->v.w));
1586 case jit_code_live: case jit_code_ellipsis:
1587 case jit_code_va_push:
1588 case jit_code_allocai: case jit_code_allocar:
1589 case jit_code_arg_c: case jit_code_arg_s:
1590 case jit_code_arg_i:
1591 # if __WORDSIZE == 64
1592 case jit_code_arg_l:
1594 case jit_code_arg_f: case jit_code_arg_d:
1595 case jit_code_va_end:
1597 case jit_code_retr_c: case jit_code_reti_c:
1598 case jit_code_retr_uc: case jit_code_reti_uc:
1599 case jit_code_retr_s: case jit_code_reti_s:
1600 case jit_code_retr_us: case jit_code_reti_us:
1601 case jit_code_retr_i: case jit_code_reti_i:
1602 #if __WORDSIZE == 64
1603 case jit_code_retr_ui: case jit_code_reti_ui:
1604 case jit_code_retr_l: case jit_code_reti_l:
1606 case jit_code_retr_f: case jit_code_reti_f:
1607 case jit_code_retr_d: case jit_code_reti_d:
1608 case jit_code_getarg_c: case jit_code_getarg_uc:
1609 case jit_code_getarg_s: case jit_code_getarg_us:
1610 case jit_code_getarg_i:
1611 #if __WORDSIZE == 64
1612 case jit_code_getarg_ui: case jit_code_getarg_l:
1614 case jit_code_getarg_f: case jit_code_getarg_d:
1615 case jit_code_putargr_c: case jit_code_putargi_c:
1616 case jit_code_putargr_uc: case jit_code_putargi_uc:
1617 case jit_code_putargr_s: case jit_code_putargi_s:
1618 case jit_code_putargr_us: case jit_code_putargi_us:
1619 case jit_code_putargr_i: case jit_code_putargi_i:
1620 #if __WORDSIZE == 64
1621 case jit_code_putargr_ui: case jit_code_putargi_ui:
1622 case jit_code_putargr_l: case jit_code_putargi_l:
1624 case jit_code_putargr_f: case jit_code_putargi_f:
1625 case jit_code_putargr_d: case jit_code_putargi_d:
1626 case jit_code_pushargr_c: case jit_code_pushargi_c:
1627 case jit_code_pushargr_uc: case jit_code_pushargi_uc:
1628 case jit_code_pushargr_s: case jit_code_pushargi_s:
1629 case jit_code_pushargr_us: case jit_code_pushargi_us:
1630 case jit_code_pushargr_i: case jit_code_pushargi_i:
1631 #if __WORDSIZE == 64
1632 case jit_code_pushargr_ui: case jit_code_pushargi_ui:
1633 case jit_code_pushargr_l: case jit_code_pushargi_l:
1635 case jit_code_pushargr_f: case jit_code_pushargi_f:
1636 case jit_code_pushargr_d: case jit_code_pushargi_d:
1637 case jit_code_retval_c: case jit_code_retval_uc:
1638 case jit_code_retval_s: case jit_code_retval_us:
1639 case jit_code_retval_i:
1640 #if __WORDSIZE == 64
1641 case jit_code_retval_ui: case jit_code_retval_l:
1643 case jit_code_retval_f: case jit_code_retval_d:
1644 case jit_code_prepare:
1645 case jit_code_finishr: case jit_code_finishi:
1650 jit_regarg_clr(node, value);
1651 assert(_jitc->regarg == 0 && _jitc->synth == 0);
1652 /* update register live state */
1664 for (offset = 0; offset < _jitc->patches.offset; offset++) {
1665 node = _jitc->patches.ptr[offset].node;
1666 word = node->code == jit_code_movi ? node->v.n->u.w : node->u.n->u.w;
1667 patch_at(_jitc->patches.ptr[offset].inst, word);
1670 jit_flush(_jit->code.ptr, _jit->pc.uc);
1672 return (_jit->code.ptr);
1676 # include "jit_s390-cpu.c"
1677 # include "jit_s390-fpu.c"
1679 # include "jit_fallback.c"
/* Flushes the instruction cache for the code in [fptr, tptr).  When
 * built with a GNU C compatible compiler, fptr is rounded down and
 * tptr rounded up to the page size reported by
 * sysconf(_SC_PAGE_SIZE), and the resulting range is handed to
 * __clear_cache(). */
1684 jit_flush(void *fptr, void *tptr)
1686 #if defined(__GNUC__)
1689 s = sysconf(_SC_PAGE_SIZE);
1690 f = (jit_word_t)fptr & -s;
1691 t = (((jit_word_t)tptr) + s - 1) & -s;
1692 __clear_cache((void *)f, (void *)t);
/* Emits a word load into gpr r0 from base r1 plus displacement i0;
 * register ids are translated with rn() and passed to ldxi(). */
1697 _emit_ldxi(jit_state_t *_jit, jit_gpr_t r0, jit_gpr_t r1, jit_word_t i0)
1699 ldxi(rn(r0), rn(r1), i0);
/* Emits a word store of gpr r1 at base r0 plus displacement i0;
 * register ids are translated with rn() and passed to stxi(). */
1703 _emit_stxi(jit_state_t *_jit, jit_word_t i0, jit_gpr_t r0, jit_gpr_t r1)
1705 stxi(i0, rn(r0), rn(r1));
/* Emits a double load into fpr r0 from base gpr r1 plus displacement
 * i0; register ids are translated with rn() and passed to ldxi_d(). */
1709 _emit_ldxi_d(jit_state_t *_jit, jit_fpr_t r0, jit_gpr_t r1, jit_word_t i0)
1711 ldxi_d(rn(r0), rn(r1), i0);
/* Emits a double store of fpr r1 at base gpr r0 plus displacement i0;
 * register ids are translated with rn() and passed to stxi_d(). */
1715 _emit_stxi_d(jit_state_t *_jit, jit_word_t i0, jit_gpr_t r0, jit_fpr_t r1)
1717 stxi_d(i0, rn(r0), rn(r1));
/* Acquires two adjacent general purpose registers as a pair.
 *
 * Candidate pairs are tried in this order: _R0/_R1, _R2/_R3, _R4/_R5,
 * then _R10/_R11, _R8/_R9, _R6/_R7.  A first pass accepts a pair only
 * when both registers are free; a second pass, in the same order,
 * accepts a pair whose registers would be free after a spill.  The
 * chosen registers r1 and r2 are then claimed by name through
 * jit_get_reg().
 *
 * NOTE(review): most of the r1/r2 assignments, the final fallback and
 * the return statement are on lines not visible in this extract. */
1721 _jit_get_reg_pair(jit_state_t *_jit)
1724 /* Try to find a register pair for use with operations that
1725 * require an odd based register pair. Search for the best
1726 * match to avoid spills or at least a valid operation.
1729 /* Try non callee save first */
1730 if (jit_reg_free_p(_R0) && jit_reg_free_p(_R1))
1732 else if (jit_reg_free_p(_R2) && jit_reg_free_p(_R3))
1734 else if (jit_reg_free_p(_R4) && jit_reg_free_p(_R5))
1736 /* Try callee save registers */
1737 else if (jit_reg_free_p(_R10) && jit_reg_free_p(_R11))
1738 r1 = _R10, r2 = _R11;
1739 else if (jit_reg_free_p(_R8) && jit_reg_free_p(_R9))
1741 else if (jit_reg_free_p(_R6) && jit_reg_free_p(_R7))
1744 /* We *must* find a register pair */
1745 else if (jit_reg_free_if_spill_p(_R0) && jit_reg_free_if_spill_p(_R1))
1747 else if (jit_reg_free_if_spill_p(_R2) && jit_reg_free_if_spill_p(_R3))
1749 else if (jit_reg_free_if_spill_p(_R4) && jit_reg_free_if_spill_p(_R5))
1751 else if (jit_reg_free_if_spill_p(_R10) && jit_reg_free_if_spill_p(_R11))
1752 r1 = _R10, r2 = _R11;
1753 else if (jit_reg_free_if_spill_p(_R8) && jit_reg_free_if_spill_p(_R9))
1755 else if (jit_reg_free_if_spill_p(_R6) && jit_reg_free_if_spill_p(_R7))
1758 /* Do not jit_get_reg() all registers to avoid it */
1761 (void)jit_get_reg(jit_class_gpr|jit_class_named|r1);
1762 (void)jit_get_reg(jit_class_gpr|jit_class_named|r2);
/* Releases a register pair identified by its first register `reg`.
 * The visible case labels map that register to its partner r2:
 * _R0->_R1, _R2->_R3, _R4->_R5, _R6->_R7, _R8->_R9, _R10->_R11.
 * NOTE(review): the switch header and the statements that release the
 * registers are not visible in this extract. */
1768 _jit_unget_reg_pair(jit_state_t *_jit, jit_int32_t reg)
1773 case _R0: r2 = _R1; break;
1774 case _R2: r2 = _R3; break;
1775 case _R4: r2 = _R5; break;
1776 case _R6: r2 = _R7; break;
1777 case _R8: r2 = _R9; break;
1778 case _R10: r2 = _R11; break;
/* Acquires a general purpose register.  The visible lines request a
 * gpr and then request one again with the caller's `flags` added.
 * NOTE(review): the condition between the two requests is not visible
 * in this extract; going by the function name, the second request is
 * presumably made only when the first one returned %r0 -- confirm
 * against the full source. */
1786 _jit_get_reg_but_zero(jit_state_t *_jit, jit_int32_t flags)
1789 reg = jit_get_reg(jit_class_gpr);
1791 reg = jit_get_reg(jit_class_gpr|flags);
/* Queues a patch for later resolution: remembers that the instruction
 * at address `instr` refers to the target node of `node`.
 *
 * `node` must carry a node reference (jit_flag_node).  The target is
 * node->v.n for jit_code_movi and node->u.n for the other assignment
 * shown, and it must not be marked jit_flag_patch yet.  The patches
 * array grows by 1024 entries whenever it is full. */
1798 _patch(jit_state_t *_jit, jit_word_t instr, jit_node_t *node)
1802 assert(node->flag & jit_flag_node);
1803 if (node->code == jit_code_movi)
1804 flag = node->v.n->flag;
1806 flag = node->u.n->flag;
1807 assert(!(flag & jit_flag_patch));
1808 if (_jitc->patches.offset >= _jitc->patches.length) {
1809 jit_realloc((jit_pointer_t *)&_jitc->patches.ptr,
1810 _jitc->patches.length * sizeof(jit_patch_t),
1811 (_jitc->patches.length + 1024) * sizeof(jit_patch_t));
1812 _jitc->patches.length += 1024;
1814 _jitc->patches.ptr[_jitc->patches.offset].inst = instr;
1815 _jitc->patches.ptr[_jitc->patches.offset].node = node;
1816 ++_jitc->patches.offset;