# define I_DISP (__WORDSIZE >> 3) - sizeof(jit_int32_t)
# define F_DISP (__WORDSIZE >> 3) - sizeof(jit_float32_t)
#endif
+#define CVT_OFFSET _jitc->function->cvt_offset
+#define CHECK_CVT_OFFSET() \
+ do { \
+ if (!_jitc->function->cvt_offset) { \
+ _jitc->again = 1; \
+ _jitc->function->cvt_offset = \
+ jit_allocai(sizeof(jit_float64_t)); \
+ } \
+ } while (0)
/*
* Types
#define PROTO 1
# include "jit_ppc-cpu.c"
# include "jit_ppc-fpu.c"
+# include "jit_fallback.c"
#undef PROTO
/*
{ _NOREG, "<none>" },
};
+static jit_int32_t iregs[] = {
+ _R14, _R15, _R16, _R17, _R18, _R19, _R20, _R21, _R22,
+ _R23, _R24, _R25, _R26, _R27, _R28, _R29, _R30
+};
+
+static jit_int32_t fregs[] = {
+ _F14, _F15, _F16, _F17, _F18, _F19, _F20, _F21,
+};
+
/*
* Implementation
*/
_jitc->function->self.argi = _jitc->function->self.argf =
_jitc->function->self.alen = 0;
/* float conversion */
+ _jitc->function->cvt_offset = 0;
_jitc->function->self.aoff = alloca_offset - 8;
_jitc->function->self.call = jit_call_default;
jit_alloc((jit_pointer_t *)&_jitc->function->regoff,
_jit_allocai(jit_state_t *_jit, jit_int32_t length)
{
assert(_jitc->function);
+ jit_check_frame();
switch (length) {
case 0: case 1: break;
case 2: _jitc->function->self.aoff &= -2; break;
jit_inc_synth_wp(getarg_c, u, v);
if (jit_arg_reg_p(v->u.w))
jit_extr_c(u, JIT_RA0 - v->u.w);
- else
+ else {
+ jit_check_frame();
jit_ldxi_c(u, JIT_FP, v->u.w + C_DISP);
+ }
jit_dec_synth();
}
jit_inc_synth_wp(getarg_uc, u, v);
if (jit_arg_reg_p(v->u.w))
jit_extr_uc(u, JIT_RA0 - v->u.w);
- else
+ else {
+ jit_check_frame();
jit_ldxi_uc(u, JIT_FP, v->u.w + C_DISP);
+ }
jit_dec_synth();
}
jit_inc_synth_wp(getarg_s, u, v);
if (jit_arg_reg_p(v->u.w))
jit_extr_s(u, JIT_RA0 - v->u.w);
- else
+ else {
+ jit_check_frame();
jit_ldxi_s(u, JIT_FP, v->u.w + S_DISP);
+ }
jit_dec_synth();
}
jit_inc_synth_wp(getarg_us, u, v);
if (jit_arg_reg_p(v->u.w))
jit_extr_us(u, JIT_RA0 - v->u.w);
- else
+ else {
+ jit_check_frame();
jit_ldxi_us(u, JIT_FP, v->u.w + S_DISP);
+ }
jit_dec_synth();
}
jit_extr_i(u, JIT_RA0 - v->u.w);
#endif
}
- else
+ else {
+ jit_check_frame();
jit_ldxi_i(u, JIT_FP, v->u.w + I_DISP);
+ }
jit_dec_synth();
}
jit_inc_synth_wp(getarg_ui, u, v);
if (jit_arg_reg_p(v->u.w))
jit_extr_ui(u, JIT_RA0 - v->u.w);
- else
+ else {
+ jit_check_frame();
jit_ldxi_ui(u, JIT_FP, v->u.w + I_DISP);
+ }
jit_dec_synth();
}
jit_inc_synth_wp(getarg_l, u, v);
if (jit_arg_reg_p(v->u.w))
jit_movr(u, JIT_RA0 - v->u.w);
- else
+ else {
+ jit_check_frame();
jit_ldxi_l(u, JIT_FP, v->u.w);
+ }
jit_dec_synth();
}
#endif
jit_code_inc_synth_wp(code, u, v);
if (jit_arg_reg_p(v->u.w))
jit_movr(JIT_RA0 - v->u.w, u);
- else
+ else {
+ jit_check_frame();
jit_stxi(v->u.w, JIT_FP, u);
+ }
jit_dec_synth();
}
if (jit_arg_reg_p(v->u.w))
jit_movi(JIT_RA0 - v->u.w, u);
else {
+ jit_check_frame();
regno = jit_get_reg(jit_class_gpr);
jit_movi(regno, u);
jit_stxi(v->u.w, JIT_FP, regno);
jit_inc_synth_wp(getarg_f, u, v);
if (jit_arg_f_reg_p(v->u.w))
jit_movr_d(u, JIT_FA0 - v->u.w);
- else
+ else {
+ jit_check_frame();
jit_ldxi_f(u, JIT_FP, v->u.w);
+ }
jit_dec_synth();
}
jit_inc_synth_wp(putargr_f, u, v);
if (jit_arg_f_reg_p(v->u.w))
jit_movr_d(JIT_FA0 - v->u.w, u);
- else
+ else {
+ jit_check_frame();
jit_stxi_f(v->u.w, JIT_FP, u);
+ }
jit_dec_synth();
}
if (jit_arg_f_reg_p(v->u.w))
jit_movi_d(JIT_FA0 - v->u.w, u);
else {
+ jit_check_frame();
regno = jit_get_reg(jit_class_fpr);
jit_movi_d(regno, u);
jit_stxi_f(v->u.w, JIT_FP, regno);
jit_inc_synth_wp(getarg_d, u, v);
if (jit_arg_f_reg_p(v->u.w))
jit_movr_d(u, JIT_FA0 - v->u.w);
- else
+ else {
+ jit_check_frame();
jit_ldxi_d(u, JIT_FP, v->u.w);
+ }
jit_dec_synth();
}
jit_inc_synth_wp(putargr_d, u, v);
if (jit_arg_f_reg_p(v->u.w))
jit_movr_d(JIT_FA0 - v->u.w, u);
- else
+ else {
+ jit_check_frame();
jit_stxi_d(v->u.w, JIT_FP, u);
+ }
jit_dec_synth();
}
if (jit_arg_f_reg_p(v->u.w))
jit_movi_d(JIT_FA0 - v->u.w, u);
else {
+ jit_check_frame();
regno = jit_get_reg(jit_class_fpr);
jit_movi_d(regno, u);
jit_stxi_d(v->u.w, JIT_FP, regno);
+ 1
# endif
)) {
- /* use reserved 8 bytes area */
- jit_stxi_d(alloca_offset - 8, JIT_FP, u);
- jit_ldxi(JIT_RA0 - _jitc->function->call.argi, JIT_FP,
- alloca_offset - 8);
+ CHECK_CVT_OFFSET();
+ jit_check_frame();
+ jit_stxi_d(CVT_OFFSET, JIT_FP, u);
+ jit_ldxi(JIT_RA0 - _jitc->function->call.argi, JIT_FP, CVT_OFFSET);
_jitc->function->call.argi++;
# if __WORDSIZE == 32
jit_ldxi(JIT_RA0 - _jitc->function->call.argi, JIT_FP,
- alloca_offset - 4);
+ CVT_OFFSET + 4);
_jitc->function->call.argi++;
# endif
}
+ 1
# endif
)) {
- /* use reserved 8 bytes area */
- jit_stxi_d(alloca_offset - 8, JIT_FP, regno);
+ CHECK_CVT_OFFSET();
+ jit_check_frame();
+ jit_stxi_d(CVT_OFFSET, JIT_FP, regno);
jit_ldxi(JIT_RA0 - _jitc->function->call.argi, JIT_FP,
- alloca_offset - 8);
+ CVT_OFFSET);
_jitc->function->call.argi++;
# if __WORDSIZE == 32
jit_ldxi(JIT_RA0 - _jitc->function->call.argi, JIT_FP,
- alloca_offset - 4);
+ CVT_OFFSET + 4);
_jitc->function->call.argi++;
# endif
}
+ 1
# endif
)) {
- /* use reserved 8 bytes area */
- jit_stxi_d(alloca_offset - 8, JIT_FP, u);
- jit_ldxi(JIT_RA0 - _jitc->function->call.argi, JIT_FP,
- alloca_offset - 8);
+ CHECK_CVT_OFFSET();
+ jit_check_frame();
+ jit_stxi_d(CVT_OFFSET, JIT_FP, u);
+ jit_ldxi(JIT_RA0 - _jitc->function->call.argi, JIT_FP, CVT_OFFSET);
_jitc->function->call.argi++;
# if __WORDSIZE == 32
- jit_ldxi(JIT_RA0 - _jitc->function->call.argi, JIT_FP,
- alloca_offset - 4);
+ jit_ldxi(JIT_RA0 - _jitc->function->call.argi, JIT_FP, CVT_OFFSET + 4);
_jitc->function->call.argi++;
# endif
}
+ 1
# endif
)) {
- /* use reserved 8 bytes area */
- jit_stxi_d(alloca_offset - 8, JIT_FP, regno);
+ CHECK_CVT_OFFSET();
+ jit_check_frame();
+ jit_stxi_d(CVT_OFFSET, JIT_FP, regno);
jit_ldxi(JIT_RA0 - _jitc->function->call.argi, JIT_FP,
- alloca_offset - 8);
+ CVT_OFFSET);
_jitc->function->call.argi++;
# if __WORDSIZE == 32
jit_ldxi(JIT_RA0 - _jitc->function->call.argi, JIT_FP,
- alloca_offset - 4);
+ CVT_OFFSET + 4);
_jitc->function->call.argi++;
# endif
}
name##r##type(rn(node->u.q.l), rn(node->u.q.h), \
rn(node->v.w), rn(node->w.w)); \
break
+#define case_rqr(name, type) \
+ case jit_code_##name##r##type: \
+ name##r##type(rn(node->u.w), rn(node->v.q.l), \
+ rn(node->v.q.h), rn(node->w.w)); \
+ case jit_code_##name##i##type: \
+ break;
#define case_rrw(name, type) \
case jit_code_##name##i##type: \
name##i##type(rn(node->u.w), rn(node->v.w), node->w.w); \
case_rrw(rsb,);
case_rrr(mul,);
case_rrw(mul,);
+ case_rrr(hmul,);
+ case_rrw(hmul,);
+ case_rrr(hmul, _u);
+ case_rrw(hmul, _u);
case_rrrr(qmul,);
case_rrrw(qmul,);
case_rrrr(qmul, _u);
case_rrw(xor,);
case_rrr(lsh,);
case_rrw(lsh,);
+ case_rrrr(qlsh,);
+ case_rrrw(qlsh,);
+ case_rrrr(qlsh, _u);
+ case_rrrw(qlsh, _u);
case_rrr(rsh,);
case_rrw(rsh,);
case_rrr(rsh, _u);
case_rrw(rsh, _u);
+ case_rrrr(qrsh,);
+ case_rrrw(qrsh,);
+ case_rrrr(qrsh, _u);
+ case_rrrw(qrsh, _u);
+ case_rrr(lrot,);
+ case_rrw(lrot,);
+ case_rrr(rrot,);
+ case_rrw(rrot,);
+ case jit_code_extr:
+ extr(rn(node->u.w), rn(node->v.w), node->w.q.l, node->w.q.h);
+ break;
+ case jit_code_extr_u:
+ extr_u(rn(node->u.w), rn(node->v.w), node->w.q.l, node->w.q.h);
+ break;
+ case jit_code_depr:
+ depr(rn(node->u.w), rn(node->v.w), node->w.q.l, node->w.q.h);
+ break;
+ case jit_code_depi:
+ depi(rn(node->u.w), node->v.w, node->w.q.l, node->w.q.h);
+ break;
case_rr(ext, _c);
case_rr(ext, _uc);
case_rr(ext, _s);
case_rr(clz,);
case_rr(cto,);
case_rr(ctz,);
+#define rbitr(r0, r1) fallback_rbit(r0, r1)
+ case_rr(rbit,);
+ case_rr(popcnt,);
case jit_code_casr:
casr(rn(node->u.w), rn(node->v.w),
rn(node->w.q.l), rn(node->w.q.h));
case_rrr(ldx, _l);
case_rrw(ldx, _l);
#endif
+#define unldr(r0, r1, i0) fallback_unldr(r0, r1, i0)
+ case jit_code_unldr:
+ unldr(rn(node->u.w), rn(node->v.w), node->w.w);
+ break;
+#define unldi(r0, i0, i1) fallback_unldi(r0, i0, i1)
+ case jit_code_unldi:
+ unldi(rn(node->u.w), node->v.w, node->w.w);
+ break;
+#define unldr_u(r0, r1, i0) fallback_unldr_u(r0, r1, i0)
+ case jit_code_unldr_u:
+ unldr_u(rn(node->u.w), rn(node->v.w), node->w.w);
+ break;
+#define unldi_u(r0, i0, i1) fallback_unldi_u(r0, i0, i1)
+ case jit_code_unldi_u:
+ unldi_u(rn(node->u.w), node->v.w, node->w.w);
+ break;
case_rr(st, _c);
case_wr(st, _c);
case_rrr(stx, _c);
case_rrr(stx, _l);
case_wrr(stx, _l);
#endif
+#define unstr(r0, r1, i0) fallback_unstr(r0, r1, i0)
+ case jit_code_unstr:
+ unstr(rn(node->u.w), rn(node->v.w), node->w.w);
+ break;
+#define unsti(i0, r0, i1) fallback_unsti(i0, r0, i1)
+ case jit_code_unsti:
+ unsti(node->u.w, rn(node->v.w), node->w.w);
+ break;
case_rr(mov, _f);
case jit_code_movi_f:
assert(node->flag & jit_flag_data);
case_rr(abs, _f);
case_rr(neg, _f);
case_rr(sqrt, _f);
+ case_rqr(fma, _f);
+ case_rqr(fms, _f);
+ case_rqr(fnma, _f);
+ case_rqr(fnms, _f);
case_rrr(add, _f);
case_rrf(add, _f, 32);
case_rrr(sub, _f);
case_rw(ld, _f);
case_rrr(ldx, _f);
case_rrw(ldx, _f);
+#define unldr_x(r0, r1, i0) fallback_unldr_x(r0, r1, i0)
+ case jit_code_unldr_x:
+ unldr_x(rn(node->u.w), rn(node->v.w), node->w.w);
+ break;
+#define unldi_x(r0, i0, i1) fallback_unldi_x(r0, i0, i1)
+ case jit_code_unldi_x:
+ unldi_x(rn(node->u.w), node->v.w, node->w.w);
+ break;
case_rr(st, _f);
case_wr(st, _f);
case_rrr(stx, _f);
case_wrr(stx, _f);
+#define unstr_x(r0, r1, i0) fallback_unstr_x(r0, r1, i0)
+ case jit_code_unstr_x:
+ unstr_x(rn(node->u.w), rn(node->v.w), node->w.w);
+ break;
+#define unsti_x(i0, r0, i1) fallback_unsti_x(i0, r0, i1)
+ case jit_code_unsti_x:
+ unsti_x(node->u.w, rn(node->v.w), node->w.w);
+ break;
case_rr(mov, _d);
case jit_code_movi_d:
assert(node->flag & jit_flag_data);
case_rr(abs, _d);
case_rr(neg, _d);
case_rr(sqrt, _d);
+ case_rqr(fma, _d);
+ case_rqr(fms, _d);
+ case_rqr(fnma, _d);
+ case_rqr(fnms, _d);
case_rrr(add, _d);
case_rrf(add, _d, 64);
case_rrr(sub, _d);
case_rrr(stx, _d);
case_wrr(stx, _d);
case jit_code_jmpr:
+ jit_check_frame();
jmpr(rn(node->u.w));
break;
case jit_code_jmpi:
patch(word, node);
}
}
- else
+ else {
+ jit_check_frame();
jmpi(node->u.w);
+ }
break;
case jit_code_callr:
#if _CALL_SYSV
# define xcalli_p(u, v) calli_p(u)
# define xcalli(u, v) calli(u)
#endif
+ jit_check_frame();
xcallr(rn(node->u.w), !!(node->flag & jit_flag_varargs));
break;
case jit_code_calli:
value = !!(node->flag & jit_flag_varargs);
if (node->flag & jit_flag_node) {
+ _jitc->function->need_return = 1;
temp = node->u.n;
assert(temp->code == jit_code_label ||
temp->code == jit_code_epilog);
patch(word, node);
}
}
- else
+ else {
+ jit_check_frame();
xcalli(node->u.w, value);
+ }
break;
case jit_code_prolog:
_jitc->function = _jitc->functions.ptr + node->w.w;
* the reason of the undo. */
undo.func.self.aoff = _jitc->function->frame +
_jitc->function->self.aoff;
+ undo.func.need_frame = _jitc->function->need_frame;
+ undo.func.need_stack = _jitc->function->need_stack;
+ undo.func.need_return = _jitc->function->need_return;
jit_regset_set(&undo.func.regset, &_jitc->function->regset);
/* allocar information also does not need to be undone */
undo.func.aoffoff = _jitc->function->aoffoff;
undo.func.allocar = _jitc->function->allocar;
+ /* cvt_offset must also not be undone */
+ undo.func.cvt_offset = _jitc->function->cvt_offset;
memcpy(_jitc->function, &undo.func, sizeof(undo.func));
#if DEVEL_DISASSEMBLER
prevw = undo.prevw;
epilog(node);
_jitc->function = NULL;
break;
+ case jit_code_movr_w_f:
+ movr_w_f(rn(node->u.w), rn(node->v.w));
+ break;
+ case jit_code_movr_f_w:
+ movr_f_w(rn(node->u.w), rn(node->v.w));
+ break;
+ case jit_code_movi_f_w:
+ assert(node->flag & jit_flag_data);
+ movi_f_w(rn(node->u.w), *(jit_float32_t *)node->v.n->u.w);
+ break;
+ case jit_code_movi_w_f:
+ movi_w_f(rn(node->u.w), node->v.w);
+ break;
+#if __WORDSIZE == 64
+ case jit_code_movr_d_w:
+ movr_d_w(rn(node->u.w), rn(node->v.w));
+ break;
+ case jit_code_movi_d_w:
+ assert(node->flag & jit_flag_data);
+ movi_d_w(rn(node->u.w), *(jit_float64_t *)node->v.n->u.w);
+ break;
+ case jit_code_movr_w_d:
+ movr_w_d(rn(node->u.w), rn(node->v.w));
+ break;
+ case jit_code_movi_w_d:
+ movi_w_d(rn(node->u.w), node->v.w);
+ break;
+#else
+ case jit_code_movr_ww_d:
+ movr_ww_d(rn(node->u.w), rn(node->v.w), rn(node->w.w));
+ break;
+ case jit_code_movr_d_ww:
+ movr_d_ww(rn(node->u.w), rn(node->v.w), rn(node->w.w));
+ break;
+ case jit_code_movi_d_ww:
+ assert(node->flag & jit_flag_data);
+ movi_d_ww(rn(node->u.w), rn(node->v.w),
+ *(jit_float64_t *)node->w.n->u.w);
+ break;
+ case jit_code_movi_ww_d:
+ movi_ww_d(rn(node->u.w), node->v.w, node->w.w);
+ break;
+#endif
case jit_code_va_start:
vastart(rn(node->u.w));
break;
case jit_code_retval_f: case jit_code_retval_d:
case jit_code_prepare:
case jit_code_finishr: case jit_code_finishi:
+ case jit_code_negi_f: case jit_code_absi_f:
+ case jit_code_sqrti_f: case jit_code_negi_d:
+ case jit_code_absi_d: case jit_code_sqrti_d:
+ break;
+ case jit_code_negi:
+ negi(rn(node->u.w), node->v.w);
+ break;
+ case jit_code_comi:
+ comi(rn(node->u.w), node->v.w);
+ break;
+ case jit_code_exti_c:
+ exti_c(rn(node->u.w), node->v.w);
+ break;
+ case jit_code_exti_uc:
+ exti_uc(rn(node->u.w), node->v.w);
+ break;
+ case jit_code_exti_s:
+ exti_s(rn(node->u.w), node->v.w);
+ break;
+ case jit_code_exti_us:
+ exti_us(rn(node->u.w), node->v.w);
+ break;
+ case jit_code_bswapi_us:
+ bswapi_us(rn(node->u.w), node->v.w);
+ break;
+ case jit_code_bswapi_ui:
+ bswapi_ui(rn(node->u.w), node->v.w);
+ break;
+ case jit_code_htoni_us:
+ htoni_us(rn(node->u.w), node->v.w);
+ break;
+ case jit_code_htoni_ui:
+ htoni_ui(rn(node->u.w), node->v.w);
+ break;
+#if __WORDSIZE == 64
+ case jit_code_exti_i:
+ exti_i(rn(node->u.w), node->v.w);
+ break;
+ case jit_code_exti_ui:
+ exti_ui(rn(node->u.w), node->v.w);
+ break;
+ case jit_code_bswapi_ul:
+ bswapi_ul(rn(node->u.w), node->v.w);
+ break;
+ case jit_code_htoni_ul:
+ htoni_ul(rn(node->u.w), node->v.w);
+ break;
+#endif
+ case jit_code_cloi:
+ cloi(rn(node->u.w), node->v.w);
+ break;
+ case jit_code_clzi:
+ clzi(rn(node->u.w), node->v.w);
+ break;
+ case jit_code_ctoi:
+ ctoi(rn(node->u.w), node->v.w);
+ break;
+ case jit_code_ctzi:
+ ctzi(rn(node->u.w), node->v.w);
+ break;
+ case jit_code_rbiti:
+ rbiti(rn(node->u.w), node->v.w);
+ break;
+ case jit_code_popcnti:
+ popcnti(rn(node->u.w), node->v.w);
+ break;
+ case jit_code_exti:
+ exti(rn(node->u.w), node->v.w, node->w.q.l, node->w.q.h);
+ break;
+ case jit_code_exti_u:
+ exti_u(rn(node->u.w), node->v.w, node->w.q.l, node->w.q.h);
break;
default:
abort();
#define CODE 1
# include "jit_ppc-cpu.c"
# include "jit_ppc-fpu.c"
+# include "jit_fallback.c"
#undef CODE
void