2 * Copyright (C) 2012-2019 Free Software Foundation, Inc.
4 * This file is part of GNU lightning.
6 * GNU lightning is free software; you can redistribute it and/or modify it
7 * under the terms of the GNU Lesser General Public License as published
8 * by the Free Software Foundation; either version 3, or (at your option)
11 * GNU lightning is distributed in the hope that it will be useful, but
12 * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
13 * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public
14 * License for more details.
17 * Paulo Cesar Pereira de Andrade
20 /* avoid using it due to partial stalls */
/*
 * Word-size dependent aliases.  Under __X32 || __X64_32 the generic
 * ldi/ldr/ldxr/ldxi/sti/stxi names map to the "_i" variants and the
 * immediate-range predicates are unconditionally 1.
 * NOTE(review): the numbers embedded at the start of each line have gaps;
 * the directives that separate the two groups below and that close the
 * conditional are presumably on lines not shown here -- confirm.
 */
24 # if __X32 || __X64_32
26 # define ldi(u, v) ldi_i(u, v)
27 # define ldr(u, v) ldr_i(u, v)
28 # define ldxr(u, v, w) ldxr_i(u, v, w)
29 # define ldxi(u, v, w) ldxi_i(u, v, w)
30 # define sti(u, v) sti_i(u, v)
31 # define stxi(u, v, w) stxi_i(u, v, w)
32 # define can_sign_extend_int_p(im) 1
33 # define can_zero_extend_int_p(im) 1
34 # define fits_uint32_p(im) 1
/* Second group: the same generic names map to the "_l" variants. */
37 # define ldi(u, v) ldi_l(u, v)
38 # define ldr(u, v) ldr_l(u, v)
39 # define ldxr(u, v, w) ldxr_l(u, v, w)
40 # define ldxi(u, v, w) ldxi_l(u, v, w)
41 # define sti(u, v) sti_l(u, v)
42 # define stxi(u, v, w) stxi_l(u, v, w)
/*
 * True when im lies in [0, 0x7fffffff] or in (-0x80000000, 0).  The lower
 * bound is exclusive, so -0x80000000 itself is rejected.
 */
43 # define can_sign_extend_int_p(im) \
44 (((im) >= 0 && (long long)(im) <= 0x7fffffffLL) || \
45 ((im) < 0 && (long long)(im) > -0x80000000LL))
/* True when 0 <= im < 0x80000000. */
46 # define can_zero_extend_int_p(im) \
47 ((im) >= 0 && (im) < 0x80000000LL)
/* True when none of the upper 32 bits of im is set. */
48 # define fits_uint32_p(im) (((im) & 0xffffffff00000000LL) == 0)
/*
 * NOTE(review): the macro header that the parenthesized range test below
 * continues is not visible in this listing.  The expression itself accepts
 * register numbers from _RAX_REGNO through _RBX_REGNO inclusive.
 */
50 # if __X32 || __CYGWIN__ || __X64_32 || _WIN32
52 ((rn) >= _RAX_REGNO && (rn) <= _RBX_REGNO)
/* Register numbers 10 through 15. */
66 # define _R10_REGNO 10
67 # define _R11_REGNO 11
68 # define _R12_REGNO 12
69 # define _R13_REGNO 13
70 # define _R14_REGNO 14
71 # define _R15_REGNO 15
/* r7() keeps the low three bits of a register number, r8() the low four. */
72 # define r7(reg) ((reg) & 7)
73 # define r8(reg) ((reg) & 15)
/*
 * Opcode selectors passed as the `code` argument of alur()/alui() (see the
 * iorr, iaddxr, isubxr, iandr, isubr, ixorr and icmpr shorthands).  Each
 * value is a small index shifted left by three bits.
 *
 * Every expansion is parenthesized so that the constant stays a single
 * operand inside a larger expression: without the parentheses
 * `X86_OR + 1` would parse as `1 << (3 + 1)`.
 */
# define X86_OR (1 << 3)
# define X86_ADC (2 << 3)
# define X86_SBB (3 << 3)
# define X86_AND (4 << 3)
# define X86_SUB (5 << 3)
# define X86_XOR (6 << 3)
# define X86_CMP (7 << 3)
/*
 * Condition-code numbers, used as the `code` argument of the jcc()/jccs()
 * wrappers and of the ci() comparison shorthands.  Several mnemonics are
 * synonyms and deliberately share one value (e.g. NAE, B and C are all 0x2).
 * NOTE(review): X86_CC_O is referenced by jo()/jos() but its definition is
 * not visible in this listing.
 */
100 # define X86_CC_NO 0x1
101 # define X86_CC_NAE 0x2
102 # define X86_CC_B 0x2
103 # define X86_CC_C 0x2
104 # define X86_CC_AE 0x3
105 # define X86_CC_NB 0x3
106 # define X86_CC_NC 0x3
107 # define X86_CC_E 0x4
108 # define X86_CC_Z 0x4
109 # define X86_CC_NE 0x5
110 # define X86_CC_NZ 0x5
111 # define X86_CC_BE 0x6
112 # define X86_CC_NA 0x6
113 # define X86_CC_A 0x7
114 # define X86_CC_NBE 0x7
115 # define X86_CC_S 0x8
116 # define X86_CC_NS 0x9
117 # define X86_CC_P 0xa
118 # define X86_CC_PE 0xa
119 # define X86_CC_NP 0xb
120 # define X86_CC_PO 0xb
121 # define X86_CC_L 0xc
122 # define X86_CC_NGE 0xc
123 # define X86_CC_GE 0xd
124 # define X86_CC_NL 0xd
125 # define X86_CC_LE 0xe
126 # define X86_CC_NG 0xe
127 # define X86_CC_G 0xf
128 # define X86_CC_NLE 0xf
/*
 * Code emission helpers.  Each one stores a value through one of the
 * cursors of the `_jit` state that must be in scope at the call site
 * (pc.uc, pc.us or pc.ui) and post-increments that cursor.
 *
 *   mrm(md, r, m)  stores (md << 6) | (r << 3) | m through pc.uc
 *   sib(sc, i, b)  stores (sc << 6) | (i << 3) | b through pc.uc
 *   ic(c)          stores c through pc.uc
 *   is(s)          stores s through pc.us
 *   ii(i)          stores i through pc.ui
 *
 * Arguments and the whole expansion are parenthesized so that an argument
 * such as `a | b` is shifted as a unit instead of being regrouped by
 * operator precedence.
 */
# define mrm(md, r, m) (*_jit->pc.uc++ = (((md) << 6) | ((r) << 3) | (m)))
# define sib(sc, i, b) (*_jit->pc.uc++ = (((sc) << 6) | ((i) << 3) | (b)))
# define ic(c) (*_jit->pc.uc++ = (c))
# define is(s) (*_jit->pc.us++ = (s))
# define ii(i) (*_jit->pc.ui++ = (i))
/*
 * Only when __X64 && !__X64_32: il() stores l through the pc.ul cursor of
 * the in-scope _jit state and post-increments that cursor.
 * NOTE(review): the alternative definition and the closing directive of
 * this conditional are not visible in this listing.
 */
134 # if __X64 && !__X64_32
135 # define il(l) *_jit->pc.ul++ = l
/*
 * Patch helpers.  `instr` is an integer address just past the field to be
 * rewritten:
 *
 *   patch_abs(instr, label)       stores label into the jit_word_t that
 *                                 ends at instr
 *   patch_rel(instr, label)       stores label - instr into the jit_int32_t
 *                                 that ends at instr
 *   patch_rel_char(instr, label)  stores label - instr into the jit_int8_t
 *                                 that ends at instr
 *
 * Arguments are parenthesized so that an expression argument (for example
 * `base + 4`) is subtracted as a whole; unparenthesized, `label - instr`
 * would expand to `label - base + 4`.  Note that `instr` is evaluated
 * twice by the two relative forms, so it must not have side effects.
 */
# define patch_abs(instr, label) \
	(*(jit_word_t *)((instr) - sizeof(jit_word_t)) = (label))
# define patch_rel(instr, label) \
	(*(jit_int32_t *)((instr) - 4) = (label) - (instr))
# define patch_rel_char(instr, label) \
	(*(jit_int8_t *)((instr) - 1) = (label) - (instr))
/*
 * Low-level wrappers.  Each name(...) macro forwards to _name(_jit, ...),
 * so a `_jit` identifier must be in scope wherever the macro is used.
 * NOTE(review): the _rex, _rx and _lea prototypes below appear without a
 * return-type line in this listing; that line is presumably among the
 * lines missing from the embedded numbering -- confirm.
 */
145 # define rex(l, w, r, x, b) _rex(_jit, l, w, r, x, b)
147 _rex(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t,jit_int32_t,jit_int32_t);
148 # define rx(rd, md, rb, ri, ms) _rx(_jit, rd, md, rb, ri, ms)
150 _rx(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t,jit_int32_t,jit_int32_t);
151 # define nop(n) _nop(_jit, n)
152 static void _nop(jit_state_t*, jit_int32_t);
/* emms() emits the constant 0x770f through is(). */
153 # define emms() is(0x770f)
154 # define lea(md, rb, ri, ms, rd) _lea(_jit, md, rb, ri, ms, rd)
156 _lea(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t,jit_int32_t,jit_int32_t);
/* _pushr and _popr are declared maybe_unused. */
157 # define pushr(r0) _pushr(_jit, r0)
158 static void _pushr(jit_state_t*, jit_int32_t) maybe_unused;
159 # define popr(r0) _popr(_jit, r0)
160 static void _popr(jit_state_t*, jit_int32_t) maybe_unused;
161 # define xchgr(r0, r1) _xchgr(_jit, r0, r1)
162 static void _xchgr(jit_state_t*, jit_int32_t, jit_int32_t);
163 # define testr(r0, r1) _testr(_jit, r0, r1)
164 static void _testr(jit_state_t*, jit_int32_t, jit_int32_t);
165 # define testi(r0, i0) _testi(_jit, r0, i0)
166 static void _testi(jit_state_t*, jit_int32_t, jit_word_t);
167 # define cc(code, r0) _cc(_jit, code, r0)
168 static void _cc(jit_state_t*, jit_int32_t, jit_int32_t);
/*
 * Compare / add / subtract family.
 * The i-prefixed two-operand shorthands (icmpr, icmpi, iaddr, iaddi,
 * iaddxr, iaddxi, isubr, isubi, isubxr, isubxi) expand directly to
 * alur()/alui() with a fixed X86_* opcode selector.  The remaining macros
 * forward to a static helper of the same name with a leading underscore,
 * prepending the in-scope _jit state.
 * NOTE(review): X86_ADD is referenced here but its definition is not
 * visible in this listing.
 */
169 # define icmpr(r0, r1) alur(X86_CMP, r0, r1)
170 # define alur(code, r0, r1) _alur(_jit, code, r0, r1)
171 static void _alur(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t);
172 # define icmpi(r0, i0) alui(X86_CMP, r0, i0)
173 # define alui(code, r0, i0) _alui(_jit, code, r0, i0)
174 static void _alui(jit_state_t*, jit_int32_t, jit_int32_t, jit_word_t);
175 # define iaddr(r0, r1) alur(X86_ADD, r0, r1)
176 # define save(r0) _save(_jit, r0)
177 static void _save(jit_state_t*, jit_int32_t);
178 # define load(r0) _load(_jit, r0)
179 static void _load(jit_state_t*, jit_int32_t);
180 # define addr(r0, r1, r2) _addr(_jit, r0, r1, r2)
181 static void _addr(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t);
182 # define iaddi(r0, i0) alui(X86_ADD, r0, i0)
183 # define addi(r0, r1, i0) _addi(_jit, r0, r1, i0)
184 static void _addi(jit_state_t*, jit_int32_t, jit_int32_t, jit_word_t);
185 #define addcr(r0, r1, r2) _addcr(_jit, r0, r1, r2)
186 static void _addcr(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t);
187 #define addci(r0, r1, i0) _addci(_jit, r0, r1, i0)
188 static void _addci(jit_state_t*, jit_int32_t, jit_int32_t, jit_word_t);
189 # define iaddxr(r0, r1) alur(X86_ADC, r0, r1)
190 # define addxr(r0, r1, r2) _addxr(_jit, r0, r1, r2)
191 static void _addxr(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t);
192 # define iaddxi(r0, i0) alui(X86_ADC, r0, i0)
193 # define addxi(r0, r1, i0) _addxi(_jit, r0, r1, i0)
194 static void _addxi(jit_state_t*, jit_int32_t, jit_int32_t, jit_word_t);
195 # define isubr(r0, r1) alur(X86_SUB, r0, r1)
196 # define subr(r0, r1, r2) _subr(_jit, r0, r1, r2)
197 static void _subr(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t);
198 # define isubi(r0, i0) alui(X86_SUB, r0, i0)
199 # define subi(r0, r1, i0) _subi(_jit, r0, r1, i0)
200 static void _subi(jit_state_t*, jit_int32_t, jit_int32_t, jit_word_t);
201 # define subcr(r0, r1, r2) _subcr(_jit, r0, r1, r2)
202 static void _subcr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
203 # define subci(r0, r1, i0) _subci(_jit, r0, r1, i0)
204 static void _subci(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
205 # define isubxr(r0, r1) alur(X86_SBB, r0, r1)
206 # define subxr(r0, r1, r2) _subxr(_jit, r0, r1, r2)
207 static void _subxr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
208 # define isubxi(r0, i0) alui(X86_SBB, r0, i0)
209 # define subxi(r0, r1, i0) _subxi(_jit, r0, r1, i0)
210 static void _subxi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
211 # define rsbi(r0, r1, i0) _rsbi(_jit, r0, r1, i0)
212 static void _rsbi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
/*
 * Multiply / divide / remainder family.
 *  - umulr, umulr_u, idivr and idivr_u expand to unr() with the X86_IMUL,
 *    X86_MUL, X86_IDIV and X86_DIV selectors (those selectors are not
 *    defined in the visible part of this listing).
 *  - qmulr/qmulr_u, qmuli/qmuli_u, qdivr/qdivr_u and qdivi/qdivi_u share
 *    the _iqmulr/_iqmuli/_iqdivr/_iqdivi helpers and pass 1 (plain form) or
 *    0 (_u form) as the trailing `sign` argument.
 *  - divr/divi/remr/remi and their _u forms all go through
 *    divremr()/divremi(): the first flag is 1 for the plain forms and 0 for
 *    the _u forms, the second flag is 1 for div* and 0 for rem*.
 * NOTE(review): the _divremr and _divremi prototypes appear without a
 * return-type line in this listing -- presumably on a missing line.
 */
213 # define imulr(r0, r1) _imulr(_jit, r0, r1)
214 static void _imulr(jit_state_t*, jit_int32_t, jit_int32_t);
215 # define imuli(r0, r1, i0) _imuli(_jit, r0, r1, i0)
216 static void _imuli(jit_state_t*, jit_int32_t, jit_int32_t, jit_word_t);
217 # define mulr(r0, r1, r2) _mulr(_jit, r0, r1, r2)
218 static void _mulr(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t);
219 # define muli(r0, r1, i0) _muli(_jit, r0, r1, i0)
220 static void _muli(jit_state_t*, jit_int32_t, jit_int32_t, jit_word_t);
221 # define umulr(r0) unr(X86_IMUL, r0)
222 # define umulr_u(r0) unr(X86_MUL, r0)
223 # define qmulr(r0, r1, r2, r3) _iqmulr(_jit, r0, r1, r2, r3, 1)
224 # define qmulr_u(r0, r1, r2, r3) _iqmulr(_jit, r0, r1, r2, r3, 0)
225 # define iqmulr(r0, r1, r2, r3, sign) _iqmulr(_jit, r0, r1, r2, r3, sign)
226 static void _iqmulr(jit_state_t*, jit_int32_t, jit_int32_t,
227 jit_int32_t,jit_int32_t, jit_bool_t);
228 # define qmuli(r0, r1, r2, i0) _iqmuli(_jit, r0, r1, r2, i0, 1)
229 # define qmuli_u(r0, r1, r2, i0) _iqmuli(_jit, r0, r1, r2, i0, 0)
230 # define iqmuli(r0, r1, r2, i0, sign) _iqmuli(_jit, r0, r1, r2, i0, sign)
231 static void _iqmuli(jit_state_t*, jit_int32_t, jit_int32_t,
232 jit_int32_t,jit_word_t, jit_bool_t);
233 # define sign_extend_rdx_rax() _sign_extend_rdx_rax(_jit)
234 static void _sign_extend_rdx_rax(jit_state_t*);
235 # define idivr(r0) unr(X86_IDIV, r0)
236 # define idivr_u(r0) unr(X86_DIV, r0)
237 # define divremr(r0, r1, r2, i0, i1) _divremr(_jit, r0, r1, r2, i0, i1)
239 _divremr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t,
240 jit_bool_t,jit_bool_t);
241 # define divremi(r0, r1, i0, i1, i2) _divremi(_jit, r0, r1, i0, i1, i2)
243 _divremi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t,jit_bool_t,jit_bool_t);
244 # define divr(r0, r1, r2) divremr(r0, r1, r2, 1, 1)
245 # define divi(r0, r1, i0) divremi(r0, r1, i0, 1, 1)
246 # define divr_u(r0, r1, r2) divremr(r0, r1, r2, 0, 1)
247 # define divi_u(r0, r1, i0) divremi(r0, r1, i0, 0, 1)
248 # define qdivr(r0, r1, r2, r3) _iqdivr(_jit, r0, r1, r2, r3, 1)
249 # define qdivr_u(r0, r1, r2, r3) _iqdivr(_jit, r0, r1, r2, r3, 0)
250 # define iqdivr(r0, r1, r2, r3, sign) _iqdivr(_jit, r0, r1, r2, r3, sign)
251 static void _iqdivr(jit_state_t*, jit_int32_t, jit_int32_t,
252 jit_int32_t,jit_int32_t, jit_bool_t);
253 # define qdivi(r0, r1, r2, i0) _iqdivi(_jit, r0, r1, r2, i0, 1)
254 # define qdivi_u(r0, r1, r2, i0) _iqdivi(_jit, r0, r1, r2, i0, 0)
255 # define iqdivi(r0, r1, r2, i0, sign) _iqdivi(_jit, r0, r1, r2, i0, sign)
256 static void _iqdivi(jit_state_t*, jit_int32_t, jit_int32_t,
257 jit_int32_t,jit_word_t, jit_bool_t);
258 # define remr(r0, r1, r2) divremr(r0, r1, r2, 1, 0)
259 # define remi(r0, r1, i0) divremi(r0, r1, i0, 1, 0)
260 # define remr_u(r0, r1, r2) divremr(r0, r1, r2, 0, 0)
261 # define remi_u(r0, r1, i0) divremi(r0, r1, i0, 0, 0)
/*
 * Bitwise and / or / xor family.  The i-prefixed two-operand shorthands
 * expand to alur()/alui() with X86_AND, X86_OR or X86_XOR; the
 * three-operand names forward to static helpers with _jit prepended.
 */
262 # define iandr(r0, r1) alur(X86_AND, r0, r1)
263 # define andr(r0, r1, r2) _andr(_jit, r0, r1, r2)
264 static void _andr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
265 # define iandi(r0, i0) alui(X86_AND, r0, i0)
266 # define andi(r0, r1, i0) _andi(_jit, r0, r1, i0)
267 static void _andi(jit_state_t*, jit_int32_t,jit_int32_t,jit_word_t);
268 # define iorr(r0, r1) alur(X86_OR, r0, r1)
269 # define orr(r0, r1, r2) _orr(_jit, r0, r1, r2)
270 static void _orr(jit_state_t*, jit_int32_t,jit_int32_t,jit_int32_t);
271 # define iori(r0, i0) alui(X86_OR, r0, i0)
272 # define ori(r0, r1, i0) _ori(_jit, r0, r1, i0)
273 static void _ori(jit_state_t*, jit_int32_t,jit_int32_t,jit_word_t);
274 # define ixorr(r0, r1) alur(X86_XOR, r0, r1)
275 # define xorr(r0, r1, r2) _xorr(_jit, r0, r1, r2)
276 static void _xorr(jit_state_t*, jit_int32_t,jit_int32_t,jit_int32_t);
277 # define ixori(r0, i0) alui(X86_XOR, r0, i0)
278 # define xori(r0, r1, i0) _xori(_jit, r0, r1, i0)
279 static void _xori(jit_state_t*, jit_int32_t,jit_int32_t,jit_word_t);
/*
 * Shift / rotate and unary family.
 *  - lshr, rshr and rshr_u expand to rotshr() with X86_SHL, X86_SAR and
 *    X86_SHR; rshi and rshi_u expand to rotshi() with X86_SAR and X86_SHR;
 *    lshi has its own helper, _lshi.
 *  - inegr and icomr expand to unr() with X86_NEG and X86_NOT.
 * NOTE(review): the X86_SHL/SAR/SHR/NEG/NOT selectors are not defined in
 * the visible part of this listing, and the _rotshr and _rotshi prototypes
 * appear without a return-type line -- presumably on missing lines.
 */
280 # define irotshr(code, r0) _irotshr(_jit, code, r0)
281 static void _irotshr(jit_state_t*, jit_int32_t, jit_int32_t);
282 # define rotshr(code, r0, r1, r2) _rotshr(_jit, code, r0, r1, r2)
284 _rotshr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t,jit_int32_t);
285 # define irotshi(code, r0, i0) _irotshi(_jit, code, r0, i0)
286 static void _irotshi(jit_state_t*, jit_int32_t, jit_int32_t, jit_word_t);
287 # define rotshi(code, r0, r1, i0) _rotshi(_jit, code, r0, r1, i0)
289 _rotshi(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t,jit_word_t);
290 # define lshr(r0, r1, r2) rotshr(X86_SHL, r0, r1, r2)
291 # define lshi(r0, r1, i0) _lshi(_jit, r0, r1, i0)
292 static void _lshi(jit_state_t*, jit_int32_t, jit_int32_t, jit_word_t);
293 # define rshr(r0, r1, r2) rotshr(X86_SAR, r0, r1, r2)
294 # define rshi(r0, r1, i0) rotshi(X86_SAR, r0, r1, i0)
295 # define rshr_u(r0, r1, r2) rotshr(X86_SHR, r0, r1, r2)
296 # define rshi_u(r0, r1, i0) rotshi(X86_SHR, r0, r1, i0)
297 # define unr(code, r0) _unr(_jit, code, r0)
298 static void _unr(jit_state_t*, jit_int32_t, jit_int32_t);
299 # define inegr(r0) unr(X86_NEG, r0)
300 # define negr(r0, r1) _negr(_jit, r0, r1)
301 static void _negr(jit_state_t*, jit_int32_t, jit_int32_t);
302 # define icomr(r0) unr(X86_NOT, r0)
303 # define comr(r0, r1) _comr(_jit, r0, r1)
304 static void _comr(jit_state_t*, jit_int32_t, jit_int32_t);
306 # define incr(r0, r1) _incr(_jit, r0, r1)
307 static void _incr(jit_state_t*, jit_int32_t, jit_int32_t);
308 # define decr(r0, r1) _decr(_jit, r0, r1)
309 static void _decr(jit_state_t*, jit_int32_t, jit_int32_t);
/*
 * Comparison family.  cr(), ci() and ci0() are the generic entry points
 * taking a condition code; most named comparisons forward to their own
 * static helper.  lti_u, lei and gti have no helper and instead expand to
 * the generic immediate form with a fixed X86_CC_* code (gti spells out
 * _ci(_jit, ...) directly, which is exactly what ci() expands to).
 * NOTE(review): the _cr and _ci prototypes appear without a return-type
 * line in this listing -- presumably on missing lines.
 */
311 # define cr(code, r0, r1, r2) _cr(_jit, code, r0, r1, r2)
313 _cr(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t, jit_int32_t);
314 # define ci(code, r0, r1, i0) _ci(_jit, code, r0, r1, i0)
316 _ci(jit_state_t *_jit, jit_int32_t, jit_int32_t, jit_int32_t, jit_word_t);
317 # define ci0(code, r0, r1) _ci0(_jit, code, r0, r1)
318 static void _ci0(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t);
319 # define ltr(r0, r1, r2) _ltr(_jit, r0, r1, r2)
320 static void _ltr(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t);
321 # define lti(r0, r1, i0) _lti(_jit, r0, r1, i0)
322 static void _lti(jit_state_t*, jit_int32_t, jit_int32_t, jit_word_t);
323 # define ltr_u(r0, r1, r2) _ltr_u(_jit, r0, r1, r2)
324 static void _ltr_u(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t);
325 # define lti_u(r0, r1, i0) ci(X86_CC_B, r0, r1, i0)
326 # define ler(r0, r1, r2) _ler(_jit, r0, r1, r2)
327 static void _ler(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t);
328 # define lei(r0, r1, i0) ci(X86_CC_LE, r0, r1, i0)
329 # define ler_u(r0, r1, r2) _ler_u(_jit, r0, r1, r2)
330 static void _ler_u(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t);
331 # define lei_u(r0, r1, i0) _lei_u(_jit, r0, r1, i0)
332 static void _lei_u(jit_state_t*, jit_int32_t, jit_int32_t, jit_word_t);
333 # define eqr(r0, r1, r2) _eqr(_jit, r0, r1, r2)
334 static void _eqr(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t);
335 # define eqi(r0, r1, i0) _eqi(_jit, r0, r1, i0)
336 static void _eqi(jit_state_t*, jit_int32_t, jit_int32_t, jit_word_t);
337 # define ger(r0, r1, r2) _ger(_jit, r0, r1, r2)
338 static void _ger(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t);
339 # define gei(r0, r1, i0) _gei(_jit, r0, r1, i0)
340 static void _gei(jit_state_t*, jit_int32_t, jit_int32_t, jit_word_t);
341 # define ger_u(r0, r1, r2) _ger_u(_jit, r0, r1, r2)
342 static void _ger_u(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t);
343 # define gei_u(r0, r1, i0) _gei_u(_jit, r0, r1, i0)
344 static void _gei_u(jit_state_t*, jit_int32_t, jit_int32_t, jit_word_t);
345 # define gtr(r0, r1, r2) _gtr(_jit, r0, r1, r2)
346 static void _gtr(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t);
347 # define gti(r0, r1, i0) _ci(_jit, X86_CC_G, r0, r1, i0)
348 # define gtr_u(r0, r1, r2) _gtr_u(_jit, r0, r1, r2)
349 static void _gtr_u(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t);
350 # define gti_u(r0, r1, i0) _gti_u(_jit, r0, r1, i0)
351 static void _gti_u(jit_state_t*, jit_int32_t, jit_int32_t, jit_word_t);
352 # define ner(r0, r1, r2) _ner(_jit, r0, r1, r2)
353 static void _ner(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t);
354 # define nei(r0, r1, i0) _nei(_jit, r0, r1, i0)
355 static void _nei(jit_state_t*, jit_int32_t, jit_int32_t, jit_word_t);
/*
 * Move, compare-and-swap, byte-swap and extension family.
 *  - _movi_p is the only helper in this group that returns a value
 *    (a jit_word_t); the others return void.
 *  - casr and casi are both built on casx(): casr passes 0 as the
 *    immediate, casi passes _NOREG as the second register.
 *  - extr_s/extr_us are aliases for movsr/movsr_u, and extr_i/extr_ui are
 *    aliases for movir/movir_u.
 *  - movir/movir_u, bswapr_ul and extr_i/extr_ui each follow a
 *    `__X64 && !__X64_32` test.
 * NOTE(review): the directives closing those conditionals are not visible
 * in this listing -- presumably on missing lines.
 */
356 # define movr(r0, r1) _movr(_jit, r0, r1)
357 static void _movr(jit_state_t*, jit_int32_t, jit_int32_t);
358 # define imovi(r0, i0) _imovi(_jit, r0, i0)
359 static void _imovi(jit_state_t*, jit_int32_t, jit_word_t);
360 # define movi(r0, i0) _movi(_jit, r0, i0)
361 static void _movi(jit_state_t*, jit_int32_t, jit_word_t);
362 # define movi_p(r0, i0) _movi_p(_jit, r0, i0)
363 static jit_word_t _movi_p(jit_state_t*, jit_int32_t, jit_word_t);
364 # define movcr(r0, r1) _movcr(_jit, r0, r1)
365 static void _movcr(jit_state_t*,jit_int32_t,jit_int32_t);
366 # define movcr_u(r0, r1) _movcr_u(_jit, r0, r1)
367 static void _movcr_u(jit_state_t*,jit_int32_t,jit_int32_t);
368 # define movsr(r0, r1) _movsr(_jit, r0, r1)
369 static void _movsr(jit_state_t*,jit_int32_t,jit_int32_t);
370 # define movsr_u(r0, r1) _movsr_u(_jit, r0, r1)
371 static void _movsr_u(jit_state_t*,jit_int32_t,jit_int32_t);
372 # define casx(r0, r1, r2, r3, i0) _casx(_jit, r0, r1, r2, r3, i0)
373 static void _casx(jit_state_t *_jit,jit_int32_t,jit_int32_t,
374 jit_int32_t,jit_int32_t,jit_word_t);
375 #define casr(r0, r1, r2, r3) casx(r0, r1, r2, r3, 0)
376 #define casi(r0, i0, r1, r2) casx(r0, _NOREG, r1, r2, i0)
377 #define movnr(r0, r1, r2) _movnr(_jit, r0, r1, r2)
378 static void _movnr(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t);
379 #define movzr(r0, r1, r2) _movzr(_jit, r0, r1, r2)
380 static void _movzr(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t);
381 # if __X64 && !__X64_32
382 # define movir(r0, r1) _movir(_jit, r0, r1)
383 static void _movir(jit_state_t*,jit_int32_t,jit_int32_t);
384 # define movir_u(r0, r1) _movir_u(_jit, r0, r1)
385 static void _movir_u(jit_state_t*,jit_int32_t,jit_int32_t);
387 # define bswapr_us(r0, r1) _bswapr_us(_jit, r0, r1)
388 static void _bswapr_us(jit_state_t*,jit_int32_t,jit_int32_t);
389 # define bswapr_ui(r0, r1) _bswapr_ui(_jit, r0, r1)
390 static void _bswapr_ui(jit_state_t*,jit_int32_t,jit_int32_t);
391 # if __X64 && !__X64_32
392 #define bswapr_ul(r0, r1) _bswapr_ul(_jit, r0, r1)
393 static void _bswapr_ul(jit_state_t*,jit_int32_t,jit_int32_t);
395 # define extr_c(r0, r1) _extr_c(_jit, r0, r1)
396 static void _extr_c(jit_state_t*,jit_int32_t,jit_int32_t);
397 # define extr_uc(r0, r1) _extr_uc(_jit, r0, r1)
398 static void _extr_uc(jit_state_t*,jit_int32_t,jit_int32_t);
399 # define extr_s(r0, r1) movsr(r0, r1)
400 # define extr_us(r0, r1) movsr_u(r0, r1)
401 # if __X64 && !__X64_32
402 # define extr_i(r0, r1) movir(r0, r1)
403 # define extr_ui(r0, r1) movir_u(r0, r1)
/*
 * Load family.  ldr_* take (r0, r1), ldi_* take (r0, i0), ldxr_* take
 * (r0, r1, r2) and ldxi_* take (r0, r1, i0); each forwards to the static
 * helper of the same name with _jit prepended.
 * ldr_i/ldi_i and ldxr_i/ldxi_i are each defined twice below: once
 * forwarding to the _i helper (after the `__X32 || !__X64_32` test) and
 * once forwarding to the _ui helper.
 * NOTE(review): the directives that choose between those alternatives, and
 * any guard around the _ui and _l declarations, are not visible in this
 * listing -- presumably on missing lines.
 */
405 # define ldr_c(r0, r1) _ldr_c(_jit, r0, r1)
406 static void _ldr_c(jit_state_t*, jit_int32_t, jit_int32_t);
407 # define ldi_c(r0, i0) _ldi_c(_jit, r0, i0)
408 static void _ldi_c(jit_state_t*, jit_int32_t, jit_word_t);
409 # define ldr_uc(r0, r1) _ldr_uc(_jit, r0, r1)
410 static void _ldr_uc(jit_state_t*, jit_int32_t, jit_int32_t);
411 # define ldi_uc(r0, i0) _ldi_uc(_jit, r0, i0)
412 static void _ldi_uc(jit_state_t*, jit_int32_t, jit_word_t);
413 # define ldr_s(r0, r1) _ldr_s(_jit, r0, r1)
414 static void _ldr_s(jit_state_t*, jit_int32_t, jit_int32_t);
415 # define ldi_s(r0, i0) _ldi_s(_jit, r0, i0)
416 static void _ldi_s(jit_state_t*, jit_int32_t, jit_word_t);
417 # define ldr_us(r0, r1) _ldr_us(_jit, r0, r1)
418 static void _ldr_us(jit_state_t*, jit_int32_t, jit_int32_t);
419 # define ldi_us(r0, i0) _ldi_us(_jit, r0, i0)
420 static void _ldi_us(jit_state_t*, jit_int32_t, jit_word_t);
421 # if __X32 || !__X64_32
422 # define ldr_i(r0, r1) _ldr_i(_jit, r0, r1)
423 static void _ldr_i(jit_state_t*, jit_int32_t, jit_int32_t);
424 # define ldi_i(r0, i0) _ldi_i(_jit, r0, i0)
425 static void _ldi_i(jit_state_t*, jit_int32_t, jit_word_t);
429 # define ldr_i(r0, r1) _ldr_ui(_jit, r0, r1)
430 # define ldi_i(r0, i0) _ldi_ui(_jit, r0, i0)
432 # define ldr_ui(r0, r1) _ldr_ui(_jit, r0, r1)
433 # define ldi_ui(r0, i0) _ldi_ui(_jit, r0, i0)
435 static void _ldr_ui(jit_state_t*, jit_int32_t, jit_int32_t);
436 static void _ldi_ui(jit_state_t*, jit_int32_t, jit_word_t);
438 # define ldr_l(r0, r1) _ldr_l(_jit, r0, r1)
439 static void _ldr_l(jit_state_t*, jit_int32_t, jit_int32_t);
440 # define ldi_l(r0, i0) _ldi_l(_jit, r0, i0)
441 static void _ldi_l(jit_state_t*, jit_int32_t, jit_word_t);
444 # define ldxr_c(r0, r1, r2) _ldxr_c(_jit, r0, r1, r2)
445 static void _ldxr_c(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t);
446 # define ldxi_c(r0, r1, i0) _ldxi_c(_jit, r0, r1, i0)
447 static void _ldxi_c(jit_state_t*, jit_int32_t, jit_int32_t, jit_word_t);
448 # define ldxr_uc(r0, r1, r2) _ldxr_uc(_jit, r0, r1, r2)
449 static void _ldxr_uc(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t);
450 # define ldxi_uc(r0, r1, i0) _ldxi_uc(_jit, r0, r1, i0)
451 static void _ldxi_uc(jit_state_t*, jit_int32_t, jit_int32_t, jit_word_t);
452 # define ldxr_s(r0, r1, r2) _ldxr_s(_jit, r0, r1, r2)
453 static void _ldxr_s(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t);
454 # define ldxi_s(r0, r1, i0) _ldxi_s(_jit, r0, r1, i0)
455 static void _ldxi_s(jit_state_t*, jit_int32_t, jit_int32_t, jit_word_t);
456 # define ldxr_us(r0, r1, r2) _ldxr_us(_jit, r0, r1, r2)
457 static void _ldxr_us(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t);
458 # define ldxi_us(r0, r1, i0) _ldxi_us(_jit, r0, r1, i0)
459 static void _ldxi_us(jit_state_t*, jit_int32_t, jit_int32_t, jit_word_t);
460 # if __X32 || !__X64_32
461 # define ldxr_i(r0, r1, r2) _ldxr_i(_jit, r0, r1, r2)
462 static void _ldxr_i(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t);
463 # define ldxi_i(r0, r1, i0) _ldxi_i(_jit, r0, r1, i0)
464 static void _ldxi_i(jit_state_t*, jit_int32_t, jit_int32_t, jit_word_t);
468 # define ldxr_i(r0, r1, r2) _ldxr_ui(_jit, r0, r1, r2)
469 # define ldxi_i(r0, r1, i0) _ldxi_ui(_jit, r0, r1, i0)
471 # define ldxr_ui(r0, r1, r2) _ldxr_ui(_jit, r0, r1, r2)
472 # define ldxi_ui(r0, r1, i0) _ldxi_ui(_jit, r0, r1, i0)
474 static void _ldxr_ui(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t);
475 static void _ldxi_ui(jit_state_t*, jit_int32_t, jit_int32_t, jit_word_t);
477 # define ldxr_l(r0, r1, r2) _ldxr_l(_jit, r0, r1, r2)
478 static void _ldxr_l(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t);
479 # define ldxi_l(r0, r1, i0) _ldxi_l(_jit, r0, r1, i0)
480 static void _ldxi_l(jit_state_t*, jit_int32_t, jit_int32_t, jit_word_t);
/*
 * Store family.  Note the argument order: the immediate forms take the
 * jit_word_t first -- sti_*(i0, r0) and stxi_*(i0, r0, r1) -- whereas the
 * register forms are str_*(r0, r1) and stxr_*(r0, r1, r2).
 * The _l variants each follow a `__X64 && !__X64_32` test.
 * NOTE(review): the directives closing those conditionals are not visible
 * in this listing -- presumably on missing lines.
 */
483 # define str_c(r0, r1) _str_c(_jit, r0, r1)
484 static void _str_c(jit_state_t*, jit_int32_t, jit_int32_t);
485 # define sti_c(i0, r0) _sti_c(_jit, i0, r0)
486 static void _sti_c(jit_state_t*, jit_word_t, jit_int32_t);
487 # define str_s(r0, r1) _str_s(_jit, r0, r1)
488 static void _str_s(jit_state_t*, jit_int32_t, jit_int32_t);
489 # define sti_s(i0, r0) _sti_s(_jit, i0, r0)
490 static void _sti_s(jit_state_t*, jit_word_t, jit_int32_t);
491 # define str_i(r0, r1) _str_i(_jit, r0, r1)
492 static void _str_i(jit_state_t*, jit_int32_t, jit_int32_t);
493 # define sti_i(i0, r0) _sti_i(_jit, i0, r0)
494 static void _sti_i(jit_state_t*, jit_word_t, jit_int32_t);
495 # if __X64 && !__X64_32
496 # define str_l(r0, r1) _str_l(_jit, r0, r1)
497 static void _str_l(jit_state_t*, jit_int32_t, jit_int32_t);
498 # define sti_l(i0, r0) _sti_l(_jit, i0, r0)
499 static void _sti_l(jit_state_t*, jit_word_t, jit_int32_t);
501 # define stxr_c(r0, r1, r2) _stxr_c(_jit, r0, r1, r2)
502 static void _stxr_c(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t);
503 # define stxi_c(i0, r0, r1) _stxi_c(_jit, i0, r0, r1)
504 static void _stxi_c(jit_state_t*, jit_word_t, jit_int32_t, jit_int32_t);
505 # define stxr_s(r0, r1, r2) _stxr_s(_jit, r0, r1, r2)
506 static void _stxr_s(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t);
507 # define stxi_s(i0, r0, r1) _stxi_s(_jit, i0, r0, r1)
508 static void _stxi_s(jit_state_t*, jit_word_t, jit_int32_t, jit_int32_t);
509 # define stxr_i(r0, r1, r2) _stxr_i(_jit, r0, r1, r2)
510 static void _stxr_i(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t);
511 # define stxi_i(i0, r0, r1) _stxi_i(_jit, i0, r0, r1)
512 static void _stxi_i(jit_state_t*, jit_word_t, jit_int32_t, jit_int32_t);
513 # if __X64 && !__X64_32
514 # define stxr_l(r0, r1, r2) _stxr_l(_jit, r0, r1, r2)
515 static void _stxr_l(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t);
516 # define stxi_l(i0, r0, r1) _stxi_l(_jit, i0, r0, r1)
517 static void _stxi_l(jit_state_t*, jit_word_t, jit_int32_t, jit_int32_t);
/*
 * jcc(code, i0) forwards to _jcc(_jit, code, i0).  Every j<cond>(i0) macro
 * below is jcc() with the matching X86_CC_<COND> condition code; synonyms
 * such as jnae/jb/jc therefore expand to the same call.
 */
519 # define jcc(code, i0) _jcc(_jit, code, i0)
520 # define jo(i0) jcc(X86_CC_O, i0)
521 # define jno(i0) jcc(X86_CC_NO, i0)
522 # define jnae(i0) jcc(X86_CC_NAE, i0)
523 # define jb(i0) jcc(X86_CC_B, i0)
524 # define jc(i0) jcc(X86_CC_C, i0)
525 # define jae(i0) jcc(X86_CC_AE, i0)
526 # define jnb(i0) jcc(X86_CC_NB, i0)
527 # define jnc(i0) jcc(X86_CC_NC, i0)
528 # define je(i0) jcc(X86_CC_E, i0)
529 # define jz(i0) jcc(X86_CC_Z, i0)
530 # define jne(i0) jcc(X86_CC_NE, i0)
531 # define jnz(i0) jcc(X86_CC_NZ, i0)
532 # define jbe(i0) jcc(X86_CC_BE, i0)
533 # define jna(i0) jcc(X86_CC_NA, i0)
534 # define ja(i0) jcc(X86_CC_A, i0)
535 # define jnbe(i0) jcc(X86_CC_NBE, i0)
536 # define js(i0) jcc(X86_CC_S, i0)
537 # define jns(i0) jcc(X86_CC_NS, i0)
538 # define jp(i0) jcc(X86_CC_P, i0)
539 # define jpe(i0) jcc(X86_CC_PE, i0)
540 # define jnp(i0) jcc(X86_CC_NP, i0)
541 # define jpo(i0) jcc(X86_CC_PO, i0)
542 # define jl(i0) jcc(X86_CC_L, i0)
543 # define jnge(i0) jcc(X86_CC_NGE, i0)
544 # define jge(i0) jcc(X86_CC_GE, i0)
545 # define jnl(i0) jcc(X86_CC_NL, i0)
546 # define jle(i0) jcc(X86_CC_LE, i0)
547 # define jng(i0) jcc(X86_CC_NG, i0)
548 # define jg(i0) jcc(X86_CC_G, i0)
549 # define jnle(i0) jcc(X86_CC_NLE, i0)
550 static void _jcc(jit_state_t*, jit_int32_t, jit_word_t);
/*
 * jccs(code, i0) forwards to _jccs(_jit, code, i0).  The j<cond>s(i0)
 * macros mirror the j<cond>() set one-for-one, using the same X86_CC_*
 * codes but going through _jccs instead of _jcc.
 * NOTE(review): presumably the trailing "s" denotes the short-displacement
 * encoding -- confirm against the _jccs definition.
 */
551 # define jccs(code, i0) _jccs(_jit, code, i0)
552 # define jos(i0) jccs(X86_CC_O, i0)
553 # define jnos(i0) jccs(X86_CC_NO, i0)
554 # define jnaes(i0) jccs(X86_CC_NAE, i0)
555 # define jbs(i0) jccs(X86_CC_B, i0)
556 # define jcs(i0) jccs(X86_CC_C, i0)
557 # define jaes(i0) jccs(X86_CC_AE, i0)
558 # define jnbs(i0) jccs(X86_CC_NB, i0)
559 # define jncs(i0) jccs(X86_CC_NC, i0)
560 # define jes(i0) jccs(X86_CC_E, i0)
561 # define jzs(i0) jccs(X86_CC_Z, i0)
562 # define jnes(i0) jccs(X86_CC_NE, i0)
563 # define jnzs(i0) jccs(X86_CC_NZ, i0)
564 # define jbes(i0) jccs(X86_CC_BE, i0)
565 # define jnas(i0) jccs(X86_CC_NA, i0)
566 # define jas(i0) jccs(X86_CC_A, i0)
567 # define jnbes(i0) jccs(X86_CC_NBE, i0)
568 # define jss(i0) jccs(X86_CC_S, i0)
569 # define jnss(i0) jccs(X86_CC_NS, i0)
570 # define jps(i0) jccs(X86_CC_P, i0)
571 # define jpes(i0) jccs(X86_CC_PE, i0)
572 # define jnps(i0) jccs(X86_CC_NP, i0)
573 # define jpos(i0) jccs(X86_CC_PO, i0)
574 # define jls(i0) jccs(X86_CC_L, i0)
575 # define jnges(i0) jccs(X86_CC_NGE, i0)
576 # define jges(i0) jccs(X86_CC_GE, i0)
577 # define jnls(i0) jccs(X86_CC_NL, i0)
578 # define jles(i0) jccs(X86_CC_LE, i0)
579 # define jngs(i0) jccs(X86_CC_NG, i0)
580 # define jgs(i0) jccs(X86_CC_G, i0)
581 # define jnles(i0) jccs(X86_CC_NLE, i0)
582 static void _jccs(jit_state_t*, jit_int32_t, jit_word_t);
/*
 * Compare-and-branch family.  jcr(), jci() and jci0() are generic helpers
 * that take a condition code and return void.  Every named b* helper takes
 * the jit_word_t i0 first, followed by a register and either a second
 * register (…r forms) or a jit_word_t immediate (…i forms), and returns a
 * jit_word_t.
 * NOTE(review): presumably i0 is the branch target and the returned word
 * is an address usable for later patching -- confirm against the
 * definitions.
 */
583 # define jcr(code, i0, r0, r1) _jcr(_jit, code, i0, r0, r1)
584 static void _jcr(jit_state_t*,jit_int32_t,jit_word_t,jit_int32_t,jit_int32_t);
585 # define jci(code, i0, r0, i1) _jci(_jit, code, i0, r0, i1)
586 static void _jci(jit_state_t*,jit_int32_t,jit_word_t,jit_int32_t,jit_word_t);
587 # define jci0(code, i0, r0) _jci0(_jit, code, i0, r0)
588 static void _jci0(jit_state_t*, jit_int32_t, jit_word_t, jit_int32_t);
589 # define bltr(i0, r0, r1) _bltr(_jit, i0, r0, r1)
590 static jit_word_t _bltr(jit_state_t*, jit_word_t, jit_int32_t, jit_int32_t);
591 # define blti(i0, r0, i1) _blti(_jit, i0, r0, i1)
592 static jit_word_t _blti(jit_state_t*, jit_word_t, jit_int32_t, jit_word_t);
593 # define bltr_u(i0, r0, r1) _bltr_u(_jit, i0, r0, r1)
594 static jit_word_t _bltr_u(jit_state_t*, jit_word_t, jit_int32_t, jit_int32_t);
595 # define blti_u(i0, r0, i1) _blti_u(_jit, i0, r0, i1)
596 static jit_word_t _blti_u(jit_state_t*, jit_word_t, jit_int32_t, jit_word_t);
597 # define bler(i0, r0, r1) _bler(_jit, i0, r0, r1)
598 static jit_word_t _bler(jit_state_t*, jit_word_t, jit_int32_t, jit_int32_t);
599 # define blei(i0, r0, i1) _blei(_jit, i0, r0, i1)
600 static jit_word_t _blei(jit_state_t*, jit_word_t, jit_int32_t, jit_word_t);
601 # define bler_u(i0, r0, r1) _bler_u(_jit, i0, r0, r1)
602 static jit_word_t _bler_u(jit_state_t*, jit_word_t, jit_int32_t, jit_int32_t);
603 # define blei_u(i0, r0, i1) _blei_u(_jit, i0, r0, i1)
604 static jit_word_t _blei_u(jit_state_t*, jit_word_t, jit_int32_t, jit_word_t);
605 # define beqr(i0, r0, r1) _beqr(_jit, i0, r0, r1)
606 static jit_word_t _beqr(jit_state_t*, jit_word_t, jit_int32_t, jit_int32_t);
607 # define beqi(i0, r0, i1) _beqi(_jit, i0, r0, i1)
608 static jit_word_t _beqi(jit_state_t*, jit_word_t, jit_int32_t, jit_word_t);
609 # define bger(i0, r0, r1) _bger(_jit, i0, r0, r1)
610 static jit_word_t _bger(jit_state_t*, jit_word_t, jit_int32_t, jit_int32_t);
611 # define bgei(i0, r0, i1) _bgei(_jit, i0, r0, i1)
612 static jit_word_t _bgei(jit_state_t*, jit_word_t, jit_int32_t, jit_word_t);
613 # define bger_u(i0, r0, r1) _bger_u(_jit, i0, r0, r1)
614 static jit_word_t _bger_u(jit_state_t*, jit_word_t, jit_int32_t, jit_int32_t);
615 # define bgei_u(i0, r0, i1) _bgei_u(_jit, i0, r0, i1)
616 static jit_word_t _bgei_u(jit_state_t*, jit_word_t, jit_int32_t, jit_word_t);
617 # define bgtr(i0, r0, r1) _bgtr(_jit, i0, r0, r1)
618 static jit_word_t _bgtr(jit_state_t*, jit_word_t, jit_int32_t, jit_int32_t);
619 # define bgti(i0, r0, i1) _bgti(_jit, i0, r0, i1)
620 static jit_word_t _bgti(jit_state_t*, jit_word_t, jit_int32_t, jit_word_t);
621 # define bgtr_u(i0, r0, r1) _bgtr_u(_jit, i0, r0, r1)
622 static jit_word_t _bgtr_u(jit_state_t*, jit_word_t, jit_int32_t, jit_int32_t);
623 # define bgti_u(i0, r0, i1) _bgti_u(_jit, i0, r0, i1)
624 static jit_word_t _bgti_u(jit_state_t*, jit_word_t, jit_int32_t, jit_word_t);
625 # define bner(i0, r0, r1) _bner(_jit, i0, r0, r1)
626 static jit_word_t _bner(jit_state_t*, jit_word_t, jit_int32_t, jit_int32_t);
627 # define bnei(i0, r0, i1) _bnei(_jit, i0, r0, i1)
628 static jit_word_t _bnei(jit_state_t*, jit_word_t, jit_int32_t, jit_word_t);
629 # define bmsr(i0, r0, r1) _bmsr(_jit, i0, r0, r1)
630 static jit_word_t _bmsr(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
631 # define bmsi(i0, r0, i1) _bmsi(_jit, i0, r0, i1)
632 static jit_word_t _bmsi(jit_state_t*,jit_word_t,jit_int32_t,jit_word_t);
633 # define bmcr(i0, r0, r1) _bmcr(_jit, i0, r0, r1)
634 static jit_word_t _bmcr(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
635 # define bmci(i0, r0, i1) _bmci(_jit, i0, r0, i1)
636 static jit_word_t _bmci(jit_state_t*,jit_word_t,jit_int32_t,jit_word_t);
637 # define boaddr(i0, r0, r1) _boaddr(_jit, i0, r0, r1)
638 static jit_word_t _boaddr(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
639 # define boaddi(i0, r0, i1) _boaddi(_jit, i0, r0, i1)
640 static jit_word_t _boaddi(jit_state_t*,jit_word_t,jit_int32_t,jit_word_t);
641 # define boaddr_u(i0, r0, r1) _boaddr_u(_jit, i0, r0, r1)
642 static jit_word_t _boaddr_u(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
643 # define boaddi_u(i0, r0, i1) _boaddi_u(_jit, i0, r0, i1)
644 static jit_word_t _boaddi_u(jit_state_t*,jit_word_t,jit_int32_t,jit_word_t);
645 # define bxaddr(i0, r0, r1) _bxaddr(_jit, i0, r0, r1)
646 static jit_word_t _bxaddr(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
647 # define bxaddi(i0, r0, i1) _bxaddi(_jit, i0, r0, i1)
648 static jit_word_t _bxaddi(jit_state_t*,jit_word_t,jit_int32_t,jit_word_t);
649 # define bxaddr_u(i0, r0, r1) _bxaddr_u(_jit, i0, r0, r1)
650 static jit_word_t _bxaddr_u(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
651 # define bxaddi_u(i0, r0, i1) _bxaddi_u(_jit, i0, r0, i1)
652 static jit_word_t _bxaddi_u(jit_state_t*,jit_word_t,jit_int32_t,jit_word_t);
653 # define bosubr(i0, r0, r1) _bosubr(_jit, i0, r0, r1)
654 static jit_word_t _bosubr(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
655 # define bosubi(i0, r0, i1) _bosubi(_jit, i0, r0, i1)
656 static jit_word_t _bosubi(jit_state_t*,jit_word_t,jit_int32_t,jit_word_t);
657 # define bosubr_u(i0, r0, r1) _bosubr_u(_jit, i0, r0, r1)
658 static jit_word_t _bosubr_u(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
659 # define bosubi_u(i0, r0, i1) _bosubi_u(_jit, i0, r0, i1)
660 static jit_word_t _bosubi_u(jit_state_t*,jit_word_t,jit_int32_t,jit_word_t);
661 # define bxsubr(i0, r0, r1) _bxsubr(_jit, i0, r0, r1)
662 static jit_word_t _bxsubr(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
663 # define bxsubi(i0, r0, i1) _bxsubi(_jit, i0, r0, i1)
664 static jit_word_t _bxsubi(jit_state_t*,jit_word_t,jit_int32_t,jit_word_t);
665 # define bxsubr_u(i0, r0, r1) _bxsubr_u(_jit, i0, r0, r1)
666 static jit_word_t _bxsubr_u(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
667 # define bxsubi_u(i0, r0, i1) _bxsubi_u(_jit, i0, r0, i1)
668 static jit_word_t _bxsubi_u(jit_state_t*,jit_word_t,jit_int32_t,jit_word_t);
/*
 * Call and jump helper declarations.
 *
 * As with the other helpers in this file, each short macro forwards to the
 * underscore-prefixed static function and supplies `_jit` implicitly.
 *
 * callr / jmpr take a jit_int32_t and return nothing; calli / jmpi take a
 * jit_word_t and return a jit_word_t.
 */
669 # define callr(r0) _callr(_jit, r0)
670 static void _callr(jit_state_t*, jit_int32_t);
671 # define calli(i0) _calli(_jit, i0)
672 static jit_word_t _calli(jit_state_t*, jit_word_t);
/*
 * calli_p has two alternative definitions: a dedicated _calli_p function,
 * or a plain alias for calli.  The preprocessor conditional that selects
 * between them is not visible here -- check it before changing either form.
 */
674 # define calli_p(i0) _calli_p(_jit, i0)
675 static jit_word_t _calli_p(jit_state_t*, jit_word_t);
677 # define calli_p(i0) calli(i0)
679 # define jmpr(r0) _jmpr(_jit, r0)
680 static void _jmpr(jit_state_t*, jit_int32_t);
681 # define jmpi(i0) _jmpi(_jit, i0)
682 static jit_word_t _jmpi(jit_state_t*, jit_word_t);
/*
 * jmpi_p mirrors calli_p: either a dedicated _jmpi_p function or an alias
 * for jmpi, chosen by a conditional that is not visible here.
 */
684 # define jmpi_p(i0) _jmpi_p(_jit, i0)
685 static jit_word_t _jmpi_p(jit_state_t*, jit_word_t);
687 # define jmpi_p(i0) jmpi(i0)
/* jmpsi takes a single jit_uint8_t argument and returns nothing. */
689 # define jmpsi(i0) _jmpsi(_jit, i0)
690 static void _jmpsi(jit_state_t*, jit_uint8_t);
/*
 * Function-frame, varargs and patching helper declarations.
 *
 * Each macro forwards to the underscore-prefixed static function, passing
 * `_jit` as the first argument.  All of these return nothing.
 *
 * prolog / epilog take the jit_node_t* they operate on.
 */
691 # define prolog(node) _prolog(_jit, node)
692 static void _prolog(jit_state_t*, jit_node_t*);
693 # define epilog(node) _epilog(_jit, node)
694 static void _epilog(jit_state_t*, jit_node_t*);
/*
 * Varargs helpers: vastart takes one jit_int32_t, vaarg takes two, and
 * vaarg_d takes two plus a jit_bool_t flag.
 * NOTE(review): the meaning of the vaarg_d flag is not shown by this
 * declaration -- confirm against the definition.
 */
695 # define vastart(r0) _vastart(_jit, r0)
696 static void _vastart(jit_state_t*, jit_int32_t);
697 # define vaarg(r0, r1) _vaarg(_jit, r0, r1)
698 static void _vaarg(jit_state_t*, jit_int32_t, jit_int32_t);
699 # define vaarg_d(r0, r1, i0) _vaarg_d(_jit, r0, r1, i0)
700 static void _vaarg_d(jit_state_t*, jit_int32_t, jit_int32_t, jit_bool_t);
/* patch_at takes a node plus two jit_word_t values (named instr and label). */
701 # define patch_at(node, instr, label) _patch_at(_jit, node, instr, label)
702 static void _patch_at(jit_state_t*, jit_node_t*, jit_word_t, jit_word_t);
703 # if !defined(HAVE_FFSL)
705 # define ffsl(i) __builtin_ffs(i)
707 # define ffsl(l) __builtin_ffsl(l)
710 # define jit_cmov_p() jit_cpu.cmov
715 _rex(jit_state_t *_jit, jit_int32_t l, jit_int32_t w,
716 jit_int32_t r, jit_int32_t x, jit_int32_t b)
719 jit_int32_t v = 0x40 | (w << 3);
733 _rx(jit_state_t *_jit, jit_int32_t rd, jit_int32_t md,
734 jit_int32_t rb, jit_int32_t ri, jit_int32_t ms)
739 mrm(0x00, r7(rd), 0x05);
741 mrm(0x00, r7(rd), 0x04);
742 sib(_SCL1, 0x04, 0x05);
746 else if (r7(rb) == _RSP_REGNO) {
748 mrm(0x00, r7(rd), 0x04);
751 else if ((jit_int8_t)md == md) {
752 mrm(0x01, r7(rd), 0x04);
757 mrm(0x02, r7(rd), 0x04);
763 if (md == 0 && r7(rb) != _RBP_REGNO)
764 mrm(0x00, r7(rd), r7(rb));
765 else if ((jit_int8_t)md == md) {
766 mrm(0x01, r7(rd), r7(rb));
770 mrm(0x02, r7(rd), r7(rb));
775 else if (rb == _NOREG) {
776 mrm(0x00, r7(rd), 0x04);
777 sib(ms, r7(ri), 0x05);
780 else if (r8(ri) != _RSP_REGNO) {
781 if (md == 0 && r7(rb) != _RBP_REGNO) {
782 mrm(0x00, r7(rd), 0x04);
783 sib(ms, r7(ri), r7(rb));
785 else if ((jit_int8_t)md == md) {
786 mrm(0x01, r7(rd), 0x04);
787 sib(ms, r7(ri), r7(rb));
791 mrm(0x02, r7(rd), 0x04);
792 sib(ms, r7(ri), r7(rb));
797 fprintf(stderr, "illegal index register");
803 _nop(jit_state_t *_jit, jit_int32_t count)
813 case 3: /* NOP DWORD ptr [EAX] */
814 ic(0x0f); ic(0x1f); ic(0x00);
816 case 4: /* NOP DWORD ptr [EAX + 00H] */
817 ic(0x0f); ic(0x1f); ic(0x40); ic(0x00);
819 case 5: /* NOP DWORD ptr [EAX + EAX*1 + 00H] */
820 ic(0x0f); ic(0x1f); ic(0x44); ic(0x00);
823 case 6: /* 66 NOP DWORD ptr [EAX + EAX*1 + 00H] */
824 ic(0x66); ic(0x0f); ic(0x1f); ic(0x44);
827 case 7: /* NOP DWORD ptr [EAX + 00000000H] */
828 ic(0x0f); ic(0x1f); ic(0x80); ii(0x0000);
830 case 8: /* NOP DWORD ptr [EAX + EAX*1 + 00000000H] */
831 ic(0x0f); ic(0x1f); ic(0x84); ic(0x00);
834 case 9: /* 66 NOP DWORD ptr [EAX + EAX*1 + 00000000H] */
835 ic(0x66); ic(0x0f); ic(0x1f); ic(0x84);
836 ic(0x00); ii(0x0000);
844 _lea(jit_state_t *_jit, jit_int32_t md, jit_int32_t rb,
845 jit_int32_t ri, jit_int32_t ms, jit_int32_t rd)
847 rex(0, WIDE, rd, ri, rb);
849 rx(rd, md, rb, ri, ms);
853 _pushr(jit_state_t *_jit, jit_int32_t r0)
855 rex(0, WIDE, 0, 0, r0);
860 _popr(jit_state_t *_jit, jit_int32_t r0)
862 rex(0, WIDE, 0, 0, r0);
867 _xchgr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
869 rex(0, WIDE, r1, _NOREG, r0);
871 mrm(0x03, r7(r1), r7(r0));
875 _testr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
877 rex(0, WIDE, r1, _NOREG, r0);
879 mrm(0x03, r7(r1), r7(r0));
883 _testi(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
885 rex(0, WIDE, _NOREG, _NOREG, r0);
886 if (r0 == _RAX_REGNO)
890 mrm(0x03, 0x00, r7(r0));
896 _cc(jit_state_t *_jit, jit_int32_t code, jit_int32_t r0)
898 rex(0, 0, _NOREG, _NOREG, r0);
901 mrm(0x03, 0x00, r7(r0));
905 _alur(jit_state_t *_jit, jit_int32_t code, jit_int32_t r0, jit_int32_t r1)
907 rex(0, WIDE, r1, _NOREG, r0);
909 mrm(0x03, r7(r1), r7(r0));
913 _alui(jit_state_t *_jit, jit_int32_t code, jit_int32_t r0, jit_word_t i0)
916 if (can_sign_extend_int_p(i0)) {
917 rex(0, WIDE, _NOREG, _NOREG, r0);
918 if ((jit_int8_t)i0 == i0) {
920 ic(0xc0 | code | r7(r0));
924 if (r0 == _RAX_REGNO)
928 ic(0xc0 | code | r7(r0));
934 reg = jit_get_reg(jit_class_gpr);
936 alur(code, r0, rn(reg));
942 _save(jit_state_t *_jit, jit_int32_t r0)
944 if (!_jitc->function->regoff[r0]) {
945 _jitc->function->regoff[r0] = jit_allocai(sizeof(jit_word_t));
948 assert(!jit_regset_tstbit(&_jitc->regsav, r0));
949 jit_regset_setbit(&_jitc->regsav, r0);
950 stxi(_jitc->function->regoff[r0], _RBP_REGNO, r0);
954 _load(jit_state_t *_jit, jit_int32_t r0)
956 assert(_jitc->function->regoff[r0]);
957 assert(jit_regset_tstbit(&_jitc->regsav, r0));
958 jit_regset_clrbit(&_jitc->regsav, r0);
959 ldxi(r0, _RBP_REGNO, _jitc->function->regoff[r0]);
963 _addr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
970 lea(0, r1, r2, _SCL1, r0);
974 _addi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
985 else if (can_sign_extend_int_p(i0)) {
989 lea(i0, r1, _NOREG, _SCL1, r0);
996 reg = jit_get_reg(jit_class_gpr);
1004 _addcr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1015 _addci(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1018 if (can_sign_extend_int_p(i0)) {
1022 else if (r0 == r1) {
1023 reg = jit_get_reg(jit_class_gpr);
1035 _addxr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1046 _addxi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1049 if (can_sign_extend_int_p(i0)) {
1053 else if (r0 == r1) {
1054 reg = jit_get_reg(jit_class_gpr);
1056 iaddxr(r0, rn(reg));
1066 _subr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1070 else if (r0 == r2) {
1081 _subi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1092 else if (can_sign_extend_int_p(i0)) {
1096 lea(-i0, r1, _NOREG, _SCL1, r0);
1098 else if (r0 != r1) {
1103 reg = jit_get_reg(jit_class_gpr);
1111 _subcr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1114 if (r0 == r2 && r0 != r1) {
1115 reg = jit_get_reg(jit_class_gpr);
1128 _subci(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1132 if (can_sign_extend_int_p(i0))
1135 reg = jit_get_reg(jit_class_gpr);
1143 _subxr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1146 if (r0 == r2 && r0 != r1) {
1147 reg = jit_get_reg(jit_class_gpr);
1150 isubxr(r0, rn(reg));
1160 _subxi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1164 if (can_sign_extend_int_p(i0))
1167 reg = jit_get_reg(jit_class_gpr);
1169 isubxr(r0, rn(reg));
1175 _rsbi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1182 _imulr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
1184 rex(0, WIDE, r0, _NOREG, r1);
1187 mrm(0x03, r7(r0), r7(r1));
1191 _imuli(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1194 if (can_sign_extend_int_p(i0)) {
1195 rex(0, WIDE, r0, _NOREG, r1);
1196 if ((jit_int8_t)i0 == i0) {
1198 mrm(0x03, r7(r0), r7(r1));
1203 mrm(0x03, r7(r0), r7(r1));
1208 reg = jit_get_reg(jit_class_gpr);
1216 _mulr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1229 _muli(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1242 lea(0, _NOREG, r1, _SCL2, r0);
1245 lea(0, _NOREG, r1, _SCL4, r0);
1248 lea(0, _NOREG, r1, _SCL8, r0);
1251 if (i0 > 0 && !(i0 & (i0 - 1)))
1252 lshi(r0, r1, ffsl(i0) - 1);
1253 else if (can_sign_extend_int_p(i0))
1255 else if (r0 != r1) {
1265 #define savset(rn) \
1268 if (r1 != rn && r2 != rn) \
1271 #define isavset(rn) \
1277 #define qsavset(rn) \
1278 if (r0 != rn && r1 != rn) { \
1280 if (r2 != rn && r3 != rn) \
1283 #define allocr(rn, rv) \
1284 if (set & (1 << rn)) \
1285 (void)jit_get_reg(rv|jit_class_gpr|jit_class_named); \
1286 if (sav & (1 << rn)) { \
1287 if ( jit_regset_tstbit(&_jitc->regsav, rv) || \
1288 !jit_regset_tstbit(&_jitc->reglive, rv)) \
1289 sav &= ~(1 << rn); \
1293 #define clear(rn, rv) \
1294 if (set & (1 << rn)) \
1295 jit_unget_reg(rv); \
1296 if (sav & (1 << rn)) \
1299 _iqmulr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1,
1300 jit_int32_t r2, jit_int32_t r3, jit_bool_t sign)
1307 qsavset(_RDX_REGNO);
1308 qsavset(_RAX_REGNO);
1309 allocr(_RDX_REGNO, _RDX);
1310 allocr(_RAX_REGNO, _RAX);
1312 if (r3 == _RAX_REGNO)
1316 movr(_RAX_REGNO, r2);
1323 if (r0 == _RDX_REGNO && r1 == _RAX_REGNO)
1324 xchgr(_RAX_REGNO, _RDX_REGNO);
1326 if (r0 != _RDX_REGNO)
1327 movr(r0, _RAX_REGNO);
1328 movr(r1, _RDX_REGNO);
1329 if (r0 == _RDX_REGNO)
1330 movr(r0, _RAX_REGNO);
1333 clear(_RDX_REGNO, _RDX);
1334 clear(_RAX_REGNO, _RAX);
1338 _iqmuli(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1,
1339 jit_int32_t r2, jit_word_t i0, jit_bool_t sign)
1348 reg = jit_get_reg(jit_class_gpr);
1351 qmulr(r0, r1, r2, rn(reg));
1353 qmulr_u(r0, r1, r2, rn(reg));
1359 _sign_extend_rdx_rax(jit_state_t *_jit)
1361 rex(0, WIDE, 0, 0, 0);
1366 _divremr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2,
1367 jit_bool_t sign, jit_bool_t divide)
1375 sav = set = use = 0;
1378 allocr(_RDX_REGNO, _RDX);
1379 allocr(_RAX_REGNO, _RAX);
1381 if (r2 == _RAX_REGNO) {
1382 if (r0 == _RAX_REGNO || r0 == _RDX_REGNO) {
1383 if ((reg = jit_get_reg(jit_class_gpr|jit_class_chk)) == JIT_NOREG)
1384 reg = jit_get_reg((r1 == _RCX_REGNO ? _RBX : _RCX) |
1385 jit_class_gpr|jit_class_named);
1388 movr(div, _RAX_REGNO);
1389 if (r1 != _RAX_REGNO)
1390 movr(_RAX_REGNO, r1);
1394 xchgr(r0, _RAX_REGNO);
1396 if (r0 != _RAX_REGNO)
1397 movr(r0, _RAX_REGNO);
1398 if (r1 != _RAX_REGNO)
1399 movr(_RAX_REGNO, r1);
1404 else if (r2 == _RDX_REGNO) {
1405 if (r0 == _RAX_REGNO || r0 == _RDX_REGNO) {
1406 if ((reg = jit_get_reg(jit_class_gpr|jit_class_chk)) == JIT_NOREG)
1407 reg = jit_get_reg((r1 == _RCX_REGNO ? _RBX : _RCX) |
1408 jit_class_gpr|jit_class_named);
1411 movr(div, _RDX_REGNO);
1412 if (r1 != _RAX_REGNO)
1413 movr(_RAX_REGNO, r1);
1416 if (r1 != _RAX_REGNO)
1417 movr(_RAX_REGNO, r1);
1418 movr(r0, _RDX_REGNO);
1423 if (r1 != _RAX_REGNO)
1424 movr(_RAX_REGNO, r1);
1429 sign_extend_rdx_rax();
1433 ixorr(_RDX_REGNO, _RDX_REGNO);
1441 movr(r0, _RAX_REGNO);
1443 movr(r0, _RDX_REGNO);
1445 clear(_RDX_REGNO, _RDX);
1446 clear(_RAX_REGNO, _RAX);
1450 _divremi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0,
1451 jit_bool_t sign, jit_bool_t divide)
1471 if (i0 > 0 && !(i0 & (i0 - 1))) {
1474 rshi(r0, r0, ffsl(i0) - 1);
1476 rshi_u(r0, r0, ffsl(i0) - 1);
1482 else if (i0 == 1 || (sign && i0 == -1)) {
1486 else if (!sign && i0 > 0 && !(i0 & (i0 - 1))) {
1487 if (can_sign_extend_int_p(i0)) {
1491 else if (r0 != r1) {
1496 reg = jit_get_reg(jit_class_gpr);
1497 movi(rn(reg), i0 - 1);
1504 sav = set = use = 0;
1505 isavset(_RDX_REGNO);
1506 isavset(_RAX_REGNO);
1507 allocr(_RDX_REGNO, _RDX);
1508 allocr(_RAX_REGNO, _RAX);
1510 if (r0 == _RAX_REGNO || r0 == _RDX_REGNO || r0 == r1) {
1511 if ((reg = jit_get_reg(jit_class_gpr|jit_class_chk)) == JIT_NOREG)
1512 reg = jit_get_reg((r1 == _RCX_REGNO ? _RBX : _RCX) |
1513 jit_class_gpr|jit_class_named);
1521 movr(_RAX_REGNO, r1);
1524 sign_extend_rdx_rax();
1528 ixorr(_RDX_REGNO, _RDX_REGNO);
1536 movr(r0, _RAX_REGNO);
1538 movr(r0, _RDX_REGNO);
1540 clear(_RDX_REGNO, _RDX);
1541 clear(_RAX_REGNO, _RAX);
1545 _iqdivr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1,
1546 jit_int32_t r2, jit_int32_t r3, jit_bool_t sign)
1554 sav = set = use = 0;
1555 qsavset(_RDX_REGNO);
1556 qsavset(_RAX_REGNO);
1557 allocr(_RDX_REGNO, _RDX);
1558 allocr(_RAX_REGNO, _RAX);
1559 if (r3 == _RAX_REGNO) {
1560 if (r0 == _RAX_REGNO || r0 == _RDX_REGNO) {
1561 if ((reg = jit_get_reg(jit_class_gpr|jit_class_chk)) == JIT_NOREG)
1562 reg = jit_get_reg((r1 == _RCX_REGNO ? _RBX : _RCX) |
1563 jit_class_gpr|jit_class_named);
1566 movr(div, _RAX_REGNO);
1567 if (r2 != _RAX_REGNO)
1568 movr(_RAX_REGNO, r2);
1572 xchgr(r0, _RAX_REGNO);
1574 if (r0 != _RAX_REGNO)
1575 movr(r0, _RAX_REGNO);
1576 if (r2 != _RAX_REGNO)
1577 movr(_RAX_REGNO, r2);
1582 else if (r3 == _RDX_REGNO) {
1583 if (r0 == _RAX_REGNO || r0 == _RDX_REGNO) {
1584 if ((reg = jit_get_reg(jit_class_gpr|jit_class_chk)) == JIT_NOREG)
1585 reg = jit_get_reg((r1 == _RCX_REGNO ? _RBX : _RCX) |
1586 jit_class_gpr|jit_class_named);
1589 movr(div, _RDX_REGNO);
1590 if (r2 != _RAX_REGNO)
1591 movr(_RAX_REGNO, r2);
1594 if (r2 != _RAX_REGNO)
1595 movr(_RAX_REGNO, r2);
1596 movr(r0, _RDX_REGNO);
1601 if (r2 != _RAX_REGNO)
1602 movr(_RAX_REGNO, r2);
1606 sign_extend_rdx_rax();
1610 ixorr(_RDX_REGNO, _RDX_REGNO);
1616 if (r0 == _RDX_REGNO && r1 == _RAX_REGNO)
1617 xchgr(_RAX_REGNO, _RDX_REGNO);
1619 if (r0 != _RDX_REGNO)
1620 movr(r0, _RAX_REGNO);
1621 movr(r1, _RDX_REGNO);
1622 if (r0 == _RDX_REGNO)
1623 movr(r0, _RAX_REGNO);
1626 clear(_RDX_REGNO, _RDX);
1627 clear(_RAX_REGNO, _RAX);
1631 _iqdivi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1,
1632 jit_int32_t r2, jit_word_t i0, jit_bool_t sign)
1636 reg = jit_get_reg(jit_class_gpr);
1639 qdivr(r0, r1, r2, rn(reg));
1641 qdivr_u(r0, r1, r2, rn(reg));
1649 _andr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1664 _andi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1672 else if (r0 == r1) {
1673 if (can_sign_extend_int_p(i0))
1676 reg = jit_get_reg(jit_class_gpr);
1689 _orr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1704 _ori(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1711 else if (can_sign_extend_int_p(i0)) {
1715 else if (r0 != r1) {
1720 reg = jit_get_reg(jit_class_gpr);
1728 _xorr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1743 _xori(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1750 else if (can_sign_extend_int_p(i0)) {
1754 else if (r0 != r1) {
1759 reg = jit_get_reg(jit_class_gpr);
1767 _irotshr(jit_state_t *_jit, jit_int32_t code, jit_int32_t r0)
1769 rex(0, WIDE, _RCX_REGNO, _NOREG, r0);
1771 mrm(0x03, code, r7(r0));
1775 _rotshr(jit_state_t *_jit, jit_int32_t code,
1776 jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1781 if (r0 == _RCX_REGNO) {
1782 reg = jit_get_reg(jit_class_gpr);
1784 if (r2 != _RCX_REGNO)
1785 movr(_RCX_REGNO, r2);
1786 irotshr(code, rn(reg));
1787 movr(_RCX_REGNO, rn(reg));
1790 else if (r2 != _RCX_REGNO) {
1791 use = !jit_reg_free_p(_RCX);
1793 reg = jit_get_reg(jit_class_gpr);
1794 movr(rn(reg), _RCX_REGNO);
1798 if (r1 == _RCX_REGNO) {
1800 xchgr(r0, _RCX_REGNO);
1803 movr(_RCX_REGNO, r2);
1807 movr(_RCX_REGNO, r2);
1812 movr(_RCX_REGNO, rn(reg));
1823 _irotshi(jit_state_t *_jit, jit_int32_t code, jit_int32_t r0, jit_word_t i0)
1825 rex(0, WIDE, _NOREG, _NOREG, r0);
1828 mrm(0x03, code, r7(r0));
1832 mrm(0x03, code, r7(r0));
1838 _rotshi(jit_state_t *_jit, jit_int32_t code,
1839 jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1843 irotshi(code, r0, i0);
1847 _lshi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1852 lea(0, _NOREG, r1, i0 == 1 ? _SCL2 : i0 == 2 ? _SCL4 : _SCL8, r0);
1854 rotshi(X86_SHL, r0, r1, i0);
1858 _unr(jit_state_t *_jit, jit_int32_t code, jit_int32_t r0)
1860 rex(0, WIDE, _NOREG, _NOREG, r0);
1862 mrm(0x03, code, r7(r0));
1866 _negr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
1877 _comr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
1885 _incr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
1889 rex(0, WIDE, _NOREG, _NOREG, r0);
1898 _decr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
1902 rex(0, WIDE, _NOREG, _NOREG, r0);
1912 _cr(jit_state_t *_jit,
1913 jit_int32_t code, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1918 same = r0 == r1 || r0 == r2;
1927 reg = jit_get_reg(jit_class_gpr|jit_class_rg8);
1928 ixorr(rn(reg), rn(reg));
1937 _ci(jit_state_t *_jit,
1938 jit_int32_t code, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1952 reg = jit_get_reg(jit_class_gpr|jit_class_rg8);
1953 ixorr(rn(reg), rn(reg));
1962 _ci0(jit_state_t *_jit, jit_int32_t code, jit_int32_t r0, jit_int32_t r1)
1976 reg = jit_get_reg(jit_class_gpr|jit_class_rg8);
1977 ixorr(rn(reg), rn(reg));
1986 _ltr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1991 cr(X86_CC_L, r0, r1, r2);
1995 _lti(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1998 ci(X86_CC_L, r0, r1, i0);
2000 ci0(X86_CC_S, r0, r1);
2004 _ltr_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2009 cr(X86_CC_B, r0, r1, r2);
2013 _ler(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2018 cr(X86_CC_LE, r0, r1, r2);
2022 _ler_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2027 cr(X86_CC_BE, r0, r1, r2);
2031 _lei_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2034 ci(X86_CC_BE, r0, r1, i0);
2036 ci0(X86_CC_E, r0, r1);
2040 _eqr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2045 cr(X86_CC_E, r0, r1, r2);
2049 _eqi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2052 ci(X86_CC_E, r0, r1, i0);
2054 ci0(X86_CC_E, r0, r1);
2058 _ger(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2063 cr(X86_CC_GE, r0, r1, r2);
2067 _gei(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2070 ci(X86_CC_GE, r0, r1, i0);
2072 ci0(X86_CC_NS, r0, r1);
2076 _ger_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2081 cr(X86_CC_AE, r0, r1, r2);
2085 _gei_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2088 ci(X86_CC_AE, r0, r1, i0);
2090 ci0(X86_CC_NB, r0, r1);
2094 _gtr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2099 cr(X86_CC_G, r0, r1, r2);
2103 _gtr_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2108 cr(X86_CC_A, r0, r1, r2);
2112 _gti_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2115 ci(X86_CC_A, r0, r1, i0);
2117 ci0(X86_CC_NE, r0, r1);
2121 _ner(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2126 cr(X86_CC_NE, r0, r1, r2);
2130 _nei(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2133 ci(X86_CC_NE, r0, r1, i0);
2135 ci0(X86_CC_NE, r0, r1);
2139 _movr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
2142 rex(0, 1, r1, _NOREG, r0);
2144 ic(0xc0 | (r1 << 3) | r7(r0));
2149 _imovi(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
2153 if (fits_uint32_p(i0)) {
2155 rex(0, 0, _NOREG, _NOREG, r0);
2161 rex(0, 1, _NOREG, _NOREG, r0);
2173 _movi(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
2182 _movi_p(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
2184 rex(0, WIDE, _NOREG, _NOREG, r0);
2187 return (_jit->pc.w);
2191 _movcr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
2193 rex(0, WIDE, r0, _NOREG, r1);
2196 mrm(0x03, r7(r0), r7(r1));
2200 _movcr_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
2202 rex(0, WIDE, r0, _NOREG, r1);
2205 mrm(0x03, r7(r0), r7(r1));
2209 _movsr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
2211 rex(0, WIDE, r0, _NOREG, r1);
2214 mrm(0x03, r7(r0), r7(r1));
2218 _movsr_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
2220 rex(0, WIDE, r0, _NOREG, r1);
2223 mrm(0x03, r7(r0), r7(r1));
2227 _casx(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1,
2228 jit_int32_t r2, jit_int32_t r3, jit_word_t i0)
2230 jit_int32_t save_rax, restore_rax;
2231 jit_int32_t ascasr_reg, ascasr_use;
2232 if (r0 != _RAX_REGNO) { /* result not in %rax */
2233 if (r2 != _RAX_REGNO) { /* old value not in %rax */
2234 save_rax = jit_get_reg(jit_class_gpr);
2235 movr(rn(save_rax), _RAX_REGNO);
2243 if (r2 != _RAX_REGNO)
2244 movr(_RAX_REGNO, r2);
2245 if (r1 == _NOREG) { /* using immediate address */
2246 if (!can_sign_extend_int_p(i0)) {
2247 ascasr_reg = jit_get_reg(jit_class_gpr);
2248 if (ascasr_reg == _RAX) {
2249 ascasr_reg = jit_get_reg(jit_class_gpr);
2250 jit_unget_reg(_RAX);
2253 movi(rn(ascasr_reg), i0);
2260 ic(0xf0); /* lock */
2262 rex(0, WIDE, r3, _NOREG, rn(ascasr_reg));
2264 rex(0, WIDE, r3, _NOREG, r1);
2267 if (r1 != _NOREG) /* casr */
2268 rx(r3, 0, r1, _NOREG, _SCL1);
2271 rx(r3, 0, rn(ascasr_reg), _NOREG, _SCL1); /* address in reg */
2273 rx(r3, i0, _NOREG, _NOREG, _SCL1); /* address in offset */
2276 if (r0 != _RAX_REGNO)
2277 movr(r0, _RAX_REGNO);
2279 movr(_RAX_REGNO, rn(save_rax));
2280 jit_unget_reg(save_rax);
2283 jit_unget_reg(ascasr_reg);
2287 _movnr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2289 assert(jit_cmov_p());
2293 rex(0, WIDE, r0, _NOREG, r1);
2296 mrm(0x03, r7(r0), r7(r1));
2300 _movzr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2302 assert(jit_cmov_p());
2306 rex(0, WIDE, r0, _NOREG, r1);
2309 mrm(0x03, r7(r0), r7(r1));
2314 _movir(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
2316 rex(0, 1, r0, _NOREG, r1);
2318 mrm(0x03, r7(r0), r7(r1));
2322 _movir_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
2324 rex(0, 0, r1, _NOREG, r0);
2326 ic(0xc0 | (r1 << 3) | r7(r0));
2331 _bswapr_us(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
2335 rex(0, 0, _NOREG, _NOREG, r0);
2337 mrm(0x03, X86_ROR, r7(r0));
2342 _bswapr_ui(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
2345 rex(0, 0, _NOREG, _NOREG, r0);
2350 #if __X64 && !__X64_32
2352 _bswapr_ul(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
2355 rex(0, 1, _NOREG, _NOREG, r0);
2362 _extr_c(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
2368 reg = jit_get_reg(jit_class_gpr|jit_class_rg8);
2376 _extr_uc(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
2382 reg = jit_get_reg(jit_class_gpr|jit_class_rg8);
2384 movcr_u(r0, rn(reg));
2390 _ldr_c(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
2392 rex(0, WIDE, r0, _NOREG, r1);
2395 rx(r0, 0, r1, _NOREG, _SCL1);
2399 _ldi_c(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
2402 if (can_sign_extend_int_p(i0)) {
2403 rex(0, WIDE, r0, _NOREG, _NOREG);
2406 rx(r0, i0, _NOREG, _NOREG, _SCL1);
2409 reg = jit_get_reg(jit_class_gpr);
2417 _ldr_uc(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
2419 rex(0, WIDE, r0, _NOREG, r1);
2422 rx(r0, 0, r1, _NOREG, _SCL1);
2426 _ldi_uc(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
2429 if (can_sign_extend_int_p(i0)) {
2430 rex(0, WIDE, r0, _NOREG, _NOREG);
2433 rx(r0, i0, _NOREG, _NOREG, _SCL1);
2436 reg = jit_get_reg(jit_class_gpr);
2438 ldr_uc(r0, rn(reg));
2444 _ldr_s(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
2446 rex(0, WIDE, r0, _NOREG, r1);
2449 rx(r0, 0, r1, _NOREG, _SCL1);
2453 _ldi_s(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
2456 if (can_sign_extend_int_p(i0)) {
2457 rex(0, WIDE, r0, _NOREG, _NOREG);
2460 rx(r0, i0, _NOREG, _NOREG, _SCL1);
2463 reg = jit_get_reg(jit_class_gpr);
2471 _ldr_us(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
2473 rex(0, WIDE, r0, _NOREG, r1);
2476 rx(r0, 0, r1, _NOREG, _SCL1);
2480 _ldi_us(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
2483 if (can_sign_extend_int_p(i0)) {
2484 rex(0, WIDE, r0, _NOREG, _NOREG);
2487 rx(r0, i0, _NOREG, _NOREG, _SCL1);
2490 reg = jit_get_reg(jit_class_gpr);
2492 ldr_us(r0, rn(reg));
2497 #if __X32 || !__X64_32
2499 _ldr_i(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
2502 rex(0, WIDE, r0, _NOREG, r1);
2507 rx(r0, 0, r1, _NOREG, _SCL1);
2511 _ldi_i(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
2514 if (can_sign_extend_int_p(i0)) {
2516 rex(0, WIDE, r0, _NOREG, _NOREG);
2521 rx(r0, i0, _NOREG, _NOREG, _SCL1);
2524 reg = jit_get_reg(jit_class_gpr);
2534 _ldr_ui(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
2536 rex(0, 0, r0, _NOREG, r1);
2538 rx(r0, 0, r1, _NOREG, _SCL1);
2542 _ldi_ui(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
2545 if (can_sign_extend_int_p(i0)) {
2546 rex(0, 0, r0, _NOREG, _NOREG);
2548 rx(r0, i0, _NOREG, _NOREG, _SCL1);
2551 reg = jit_get_reg(jit_class_gpr);
2553 ldr_ui(r0, rn(reg));
2560 _ldr_l(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
2562 rex(0, 1, r0, _NOREG, r1);
2564 rx(r0, 0, r1, _NOREG, _SCL1);
2568 _ldi_l(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
2571 if (can_sign_extend_int_p(i0)) {
2572 rex(0, 1, r0, _NOREG, _NOREG);
2574 rx(r0, i0, _NOREG, _NOREG, _SCL1);
2577 reg = jit_get_reg(jit_class_gpr);
2587 _ldxr_c(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2593 rex(0, WIDE, r0, r1, r2);
2596 rx(r0, 0, r2, r1, _SCL1);
2601 _ldxi_c(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2604 if (can_sign_extend_int_p(i0)) {
2605 rex(0, WIDE, r0, _NOREG, r1);
2608 rx(r0, i0, r1, _NOREG, _SCL1);
2611 reg = jit_get_reg(jit_class_gpr);
2613 ldxr_c(r0, r1, rn(reg));
2619 _ldxr_uc(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2625 rex(0, WIDE, r0, r1, r2);
2628 rx(r0, 0, r2, r1, _SCL1);
2633 _ldxi_uc(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2636 if (can_sign_extend_int_p(i0)) {
2637 rex(0, WIDE, r0, _NOREG, r1);
2640 rx(r0, i0, r1, _NOREG, _SCL1);
2643 reg = jit_get_reg(jit_class_gpr);
2645 ldxr_uc(r0, r1, rn(reg));
2651 _ldxr_s(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2657 rex(0, WIDE, r0, r1, r2);
2660 rx(r0, 0, r2, r1, _SCL1);
2665 _ldxi_s(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2668 if (can_sign_extend_int_p(i0)) {
2669 rex(0, WIDE, r0, _NOREG, r1);
2672 rx(r0, i0, r1, _NOREG, _SCL1);
2675 reg = jit_get_reg(jit_class_gpr);
2677 ldxr_s(r0, r1, rn(reg));
2683 _ldxr_us(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2689 rex(0, WIDE, r0, r1, r2);
2692 rx(r0, 0, r2, r1, _SCL1);
2697 _ldxi_us(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2700 if (can_sign_extend_int_p(i0)) {
2701 rex(0, WIDE, r0, _NOREG, r1);
2704 rx(r0, i0, r1, _NOREG, _SCL1);
2707 reg = jit_get_reg(jit_class_gpr);
2709 ldxr_us(r0, r1, rn(reg));
2714 #if __X64 || !__X64_32
2716 _ldxr_i(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2719 rex(0, WIDE, r0, r1, r2);
2724 rx(r0, 0, r2, r1, _SCL1);
2728 _ldxi_i(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2731 if (can_sign_extend_int_p(i0)) {
2733 rex(0, WIDE, r0, _NOREG, r1);
2738 rx(r0, i0, r1, _NOREG, _SCL1);
2741 reg = jit_get_reg(jit_class_gpr);
2743 ldxr_i(r0, r1, rn(reg));
2751 _ldxr_ui(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2755 /* to avoid confusion with macro renames */
2756 _ldr_ui(_jit, r0, r0);
2758 rex(0, 0, r0, r1, r2);
2760 rx(r0, 0, r2, r1, _SCL1);
2765 _ldxi_ui(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2768 if (can_sign_extend_int_p(i0)) {
2769 rex(0, 0, r0, _NOREG, r1);
2771 rx(r0, i0, r1, _NOREG, _SCL1);
2774 reg = jit_get_reg(jit_class_gpr);
2776 ldxr_ui(r0, r1, rn(reg));
2783 _ldxr_l(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2785 rex(0, 1, r0, r1, r2);
2787 rx(r0, 0, r2, r1, _SCL1);
2791 _ldxi_l(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2794 if (can_sign_extend_int_p(i0)) {
2795 rex(0, 1, r0, _NOREG, r1);
2797 rx(r0, i0, r1, _NOREG, _SCL1);
2800 reg = jit_get_reg(jit_class_gpr);
2802 ldxr_l(r0, r1, rn(reg));
2810 _str_c(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
2814 rex(0, 0, r1, _NOREG, r0);
2816 rx(r1, 0, r0, _NOREG, _SCL1);
2819 reg = jit_get_reg(jit_class_gpr|jit_class_rg8);
2821 rex(0, 0, rn(reg), _NOREG, r0);
2823 rx(rn(reg), 0, r0, _NOREG, _SCL1);
2829 _sti_c(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0)
2832 if (can_sign_extend_int_p(i0)) {
2834 rex(0, 0, r0, _NOREG, _NOREG);
2836 rx(r0, i0, _NOREG, _NOREG, _SCL1);
2839 reg = jit_get_reg(jit_class_gpr|jit_class_rg8);
2841 rex(0, 0, rn(reg), _NOREG, _NOREG);
2843 rx(rn(reg), i0, _NOREG, _NOREG, _SCL1);
2848 reg = jit_get_reg(jit_class_gpr);
2856 _str_s(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
2859 rex(0, 0, r1, _NOREG, r0);
2861 rx(r1, 0, r0, _NOREG, _SCL1);
2865 _sti_s(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0)
2868 if (can_sign_extend_int_p(i0)) {
2870 rex(0, 0, r0, _NOREG, _NOREG);
2872 rx(r0, i0, _NOREG, _NOREG, _SCL1);
2875 reg = jit_get_reg(jit_class_gpr);
2883 _str_i(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
2885 rex(0, 0, r1, _NOREG, r0);
2887 rx(r1, 0, r0, _NOREG, _SCL1);
2891 _sti_i(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0)
2894 if (can_sign_extend_int_p(i0)) {
2895 rex(0, 0, r0, _NOREG, _NOREG);
2897 rx(r0, i0, _NOREG, _NOREG, _SCL1);
2900 reg = jit_get_reg(jit_class_gpr);
2907 #if __X64 && !__X64_32
2909 _str_l(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
2911 rex(0, 1, r1, _NOREG, r0);
2913 rx(r1, 0, r0, _NOREG, _SCL1);
2917 _sti_l(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0)
2920 if (can_sign_extend_int_p(i0)) {
2921 rex(0, 1, r0, _NOREG, _NOREG);
2923 rx(r0, i0, _NOREG, _NOREG, _SCL1);
2926 reg = jit_get_reg(jit_class_gpr);
2935 _stxr_c(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2939 reg = jit_get_reg(jit_class_gpr);
2940 addr(rn(reg), r0, r1);
2945 rex(0, 0, r2, r1, r0);
2947 rx(r2, 0, r0, r1, _SCL1);
2950 reg = jit_get_reg(jit_class_gpr|jit_class_rg8);
2952 rex(0, 0, rn(reg), r1, r0);
2954 rx(rn(reg), 0, r0, r1, _SCL1);
2961 _stxi_c(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
2964 if (can_sign_extend_int_p(i0)) {
2966 rex(0, 0, r1, _NOREG, r0);
2968 rx(r1, i0, r0, _NOREG, _SCL1);
2971 reg = jit_get_reg(jit_class_gpr|jit_class_rg8);
2973 rex(0, 0, rn(reg), _NOREG, r0);
2975 rx(rn(reg), i0, r0, _NOREG, _SCL1);
2980 reg = jit_get_reg(jit_class_gpr);
2982 stxr_c(rn(reg), r0, r1);
2988 _stxr_s(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2992 reg = jit_get_reg(jit_class_gpr);
2993 addr(rn(reg), r0, r1);
2998 rex(0, 0, r2, r1, r0);
3000 rx(r2, 0, r0, r1, _SCL1);
3005 _stxi_s(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
3008 if (can_sign_extend_int_p(i0)) {
3010 rex(0, 0, r1, _NOREG, r0);
3012 rx(r1, i0, r0, _NOREG, _SCL1);
3015 reg = jit_get_reg(jit_class_gpr);
3017 stxr_s(rn(reg), r0, r1);
3023 _stxr_i(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
3027 reg = jit_get_reg(jit_class_gpr);
3028 addr(rn(reg), r0, r1);
3032 rex(0, 0, r2, r1, r0);
3034 rx(r2, 0, r0, r1, _SCL1);
3039 _stxi_i(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
3042 if (can_sign_extend_int_p(i0)) {
3043 rex(0, 0, r1, _NOREG, r0);
3045 rx(r1, i0, r0, _NOREG, _SCL1);
3048 reg = jit_get_reg(jit_class_gpr);
3050 stxr_i(rn(reg), r0, r1);
3055 #if __X64 && !__X64_32
3057 _stxr_l(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
3059 rex(0, 1, r2, r1, r0);
3061 rx(r2, 0, r0, r1, _SCL1);
3065 _stxi_l(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
3068 if (can_sign_extend_int_p(i0)) {
3069 rex(0, 1, r1, _NOREG, r0);
3071 rx(r1, i0, r0, _NOREG, _SCL1);
3074 reg = jit_get_reg(jit_class_gpr);
3076 stxr_l(rn(reg), r0, r1);
3083 _jccs(jit_state_t *_jit, jit_int32_t code, jit_word_t i0)
3087 w = i0 - (_jit->pc.w + 1);
3092 _jcc(jit_state_t *_jit, jit_int32_t code, jit_word_t i0)
3097 w = i0 - (_jit->pc.w + 4);
3102 _jcr(jit_state_t *_jit,
3103 jit_int32_t code, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
3105 alur(X86_CMP, r0, r1);
/* _jci: compare register r0 with immediate i1, then branch on `code` to i0.
 * Only the compare is visible in this excerpt (NOTE(review): the jump
 * that follows is presumably emitted through jcc()). */
3110 _jci(jit_state_t *_jit,
3111 jit_int32_t code, jit_word_t i0, jit_int32_t r0, jit_word_t i1)
3113 alui(X86_CMP, r0, i1);
/* _jci0: helper used by the immediate branch emitters when the immediate
 * is zero; takes the condition `code`, the target i0 and the register r0.
 * NOTE(review): the body is not visible in this excerpt; presumably it
 * sets the flags from r0 alone and then jumps on `code` -- confirm. */
3118 _jci0(jit_state_t *_jit, jit_int32_t code, jit_word_t i0, jit_int32_t r0)
/* _bltr: branch to i0 if r0 < r1, signed (condition X86_CC_L).
 * Returns _jit->pc.w as it stands after the branch has been emitted. */
3125 _bltr(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
3127 jcr(X86_CC_L, i0, r0, r1);
3128 return (_jit->pc.w);
/* _blti: branch to i0 if r0 < i1, signed.
 * Returns _jit->pc.w as it stands after the branch has been emitted. */
3132 _blti(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_word_t i1)
3134 if (i1) jci (X86_CC_L, i0, r0, i1);
/* i1 == 0: "r0 < 0" is just the sign condition, so use X86_CC_S. */
3135 else jci0(X86_CC_S, i0, r0);
3136 return (_jit->pc.w);
/* _bltr_u: branch to i0 if r0 < r1, unsigned (condition X86_CC_B).
 * Returns _jit->pc.w as it stands after the branch has been emitted. */
3140 _bltr_u(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
3142 jcr(X86_CC_B, i0, r0, r1);
3143 return (_jit->pc.w);
/* _blti_u: branch to i0 if r0 < i1, unsigned (condition X86_CC_B).
 * Returns _jit->pc.w as it stands after the branch has been emitted. */
3147 _blti_u(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_word_t i1)
3149 if (i1) jci (X86_CC_B, i0, r0, i1);
/* i1 == 0: an unsigned value is never below zero. A jump is still
 * emitted through jci0 (NOTE(review): expected never to be taken,
 * assuming jci0 leaves the carry flag clear -- confirm). */
3150 else jci0(X86_CC_B, i0, r0);
3151 return (_jit->pc.w);
/* _bler: branch to i0 if r0 <= r1, signed (condition X86_CC_LE).
 * Returns _jit->pc.w as it stands after the branch has been emitted. */
3155 _bler(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
/* Same register on both sides: the condition always holds, so emit an
 * unconditional jump instead of a compare. */
3157 if (r0 == r1) jmpi(i0);
3158 else jcr (X86_CC_LE, i0, r0, r1);
3159 return (_jit->pc.w);
/* _blei: branch to i0 if r0 <= i1, signed (condition X86_CC_LE).
 * A zero immediate goes through jci0 with the same condition.
 * Returns _jit->pc.w as it stands after the branch has been emitted. */
3163 _blei(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_word_t i1)
3165 if (i1) jci (X86_CC_LE, i0, r0, i1);
3166 else jci0(X86_CC_LE, i0, r0);
3167 return (_jit->pc.w);
/* _bler_u: branch to i0 if r0 <= r1, unsigned (condition X86_CC_BE).
 * Returns _jit->pc.w as it stands after the branch has been emitted. */
3171 _bler_u(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
/* Same register on both sides: always true, emit an unconditional jump. */
3173 if (r0 == r1) jmpi(i0);
3174 else jcr (X86_CC_BE, i0, r0, r1);
3175 return (_jit->pc.w);
/* _blei_u: branch to i0 if r0 <= i1, unsigned (condition X86_CC_BE).
 * A zero immediate goes through jci0 with the same condition.
 * Returns _jit->pc.w as it stands after the branch has been emitted. */
3179 _blei_u(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_word_t i1)
3181 if (i1) jci (X86_CC_BE, i0, r0, i1);
3182 else jci0(X86_CC_BE, i0, r0);
3183 return (_jit->pc.w);
/* _beqr: branch to i0 if r0 == r1 (condition X86_CC_E).
 * Returns _jit->pc.w as it stands after the branch has been emitted. */
3187 _beqr(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
/* Same register on both sides: always equal, emit an unconditional jump. */
3189 if (r0 == r1) jmpi(i0);
3190 else jcr (X86_CC_E, i0, r0, r1);
3191 return (_jit->pc.w);
/* _beqi: branch to i0 if r0 == i1 (condition X86_CC_E).
 * A zero immediate goes through jci0 with the same condition.
 * Returns _jit->pc.w as it stands after the branch has been emitted. */
3195 _beqi(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_word_t i1)
3197 if (i1) jci (X86_CC_E, i0, r0, i1);
3198 else jci0(X86_CC_E, i0, r0);
3199 return (_jit->pc.w);
/* _bger: branch to i0 if r0 >= r1, signed (condition X86_CC_GE).
 * Returns _jit->pc.w as it stands after the branch has been emitted. */
3203 _bger(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
/* Same register on both sides: always true, emit an unconditional jump. */
3205 if (r0 == r1) jmpi(i0);
3206 else jcr (X86_CC_GE, i0, r0, r1);
3207 return (_jit->pc.w);
/* _bgei: branch to i0 if r0 >= i1, signed.
 * Returns _jit->pc.w as it stands after the branch has been emitted. */
3211 _bgei(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_word_t i1)
3213 if (i1) jci (X86_CC_GE, i0, r0, i1);
/* i1 == 0: "r0 >= 0" is the sign-clear condition, so use X86_CC_NS. */
3214 else jci0(X86_CC_NS, i0, r0);
3215 return (_jit->pc.w);
/* _bger_u: branch to i0 if r0 >= r1, unsigned (condition X86_CC_AE).
 * Returns _jit->pc.w as it stands after the branch has been emitted. */
3219 _bger_u(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
/* Same register on both sides: always true, emit an unconditional jump. */
3221 if (r0 == r1) jmpi(i0);
3222 else jcr (X86_CC_AE, i0, r0, r1);
3223 return (_jit->pc.w);
/* _bgei_u: branch to i0 if r0 >= i1, unsigned (condition X86_CC_AE).
 * NOTE(review): the handling of i1 == 0 is not visible in this excerpt
 * (an unsigned value is always >= 0, so an unconditional jump would be
 * expected there -- confirm against the full file).
 * Returns _jit->pc.w as it stands after the branch has been emitted. */
3227 _bgei_u(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_word_t i1)
3229 if (i1) jci (X86_CC_AE, i0, r0, i1);
3231 return (_jit->pc.w);
/* _bgtr: branch to i0 if r0 > r1, signed (condition X86_CC_G).
 * Returns _jit->pc.w as it stands after the branch has been emitted. */
3235 _bgtr(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
3237 jcr(X86_CC_G, i0, r0, r1);
3238 return (_jit->pc.w);
/* _bgti: branch to i0 if r0 > i1, signed (condition X86_CC_G).
 * Unlike its siblings, a zero immediate gets no special treatment here.
 * Returns _jit->pc.w as it stands after the branch has been emitted. */
3242 _bgti(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_word_t i1)
3244 jci(X86_CC_G, i0, r0, i1);
3245 return (_jit->pc.w);
/* _bgtr_u: branch to i0 if r0 > r1, unsigned (condition X86_CC_A).
 * Returns _jit->pc.w as it stands after the branch has been emitted. */
3249 _bgtr_u(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
3251 jcr(X86_CC_A, i0, r0, r1);
3252 return (_jit->pc.w);
/* _bgti_u: branch to i0 if r0 > i1, unsigned.
 * Returns _jit->pc.w as it stands after the branch has been emitted. */
3256 _bgti_u(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_word_t i1)
3258 if (i1) jci (X86_CC_A, i0, r0, i1);
/* i1 == 0: unsigned "r0 > 0" is the same as "r0 != 0", so use X86_CC_NE. */
3259 else jci0(X86_CC_NE, i0, r0);
3260 return (_jit->pc.w);
/* _bner: branch to i0 if r0 != r1 (condition X86_CC_NE).
 * Returns _jit->pc.w as it stands after the branch has been emitted. */
3264 _bner(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
3266 jcr(X86_CC_NE, i0, r0, r1);
3267 return (_jit->pc.w);
/* _bnei: branch to i0 if r0 != i1 (condition X86_CC_NE).
 * A zero immediate goes through jci0 with the same condition.
 * Returns _jit->pc.w as it stands after the branch has been emitted. */
3271 _bnei(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_word_t i1)
3273 if (i1) jci (X86_CC_NE, i0, r0, i1);
3274 else jci0(X86_CC_NE, i0, r0);
3275 return (_jit->pc.w);
/* _bmsr: register/register "mask set" branch towards i0.
 * NOTE(review): by its name this should branch when (r0 & r1) is
 * non-zero; the emitting lines are not visible in this excerpt.
 * Returns _jit->pc.w as it stands after emission. */
3279 _bmsr(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
3283 return (_jit->pc.w);
/* _bmsi: register/immediate "mask set" branch towards i0.
 * NOTE(review): by its name this should branch when (r0 & i1) is
 * non-zero; the emitting lines are not visible in this excerpt.
 * Returns _jit->pc.w as it stands after emission. */
3287 _bmsi(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_word_t i1)
/* Immediates accepted by can_zero_extend_int_p() take a direct path
 * (not shown); anything else goes through a scratch GPR. */
3290 if (can_zero_extend_int_p(i1))
3293 reg = jit_get_reg(jit_class_gpr);
3299 return (_jit->pc.w);
/* _bmcr: register/register "mask clear" branch towards i0.
 * NOTE(review): by its name this should branch when (r0 & r1) is zero;
 * the emitting lines are not visible in this excerpt.
 * Returns _jit->pc.w as it stands after emission. */
3303 _bmcr(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
3307 return (_jit->pc.w);
/* _bmci: register/immediate "mask clear" branch towards i0.
 * NOTE(review): by its name this should branch when (r0 & i1) is zero;
 * the emitting lines are not visible in this excerpt.
 * Returns _jit->pc.w as it stands after emission. */
3311 _bmci(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_word_t i1)
/* Immediates accepted by can_zero_extend_int_p() take a direct path
 * (not shown); anything else goes through a scratch GPR. */
3314 if (can_zero_extend_int_p(i1))
3317 reg = jit_get_reg(jit_class_gpr);
3323 return (_jit->pc.w);
/* _boaddr: register form of the "add, branch on overflow" emitter.
 * NOTE(review): by its name, r0 += r1 then branch to i0 on signed
 * overflow; the emitting lines are not visible in this excerpt.
 * Returns _jit->pc.w as it stands after emission. */
3327 _boaddr(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
3331 return (_jit->pc.w);
/* _boaddi: immediate form of boaddr.
 * NOTE(review): by its name, r0 += i1 then branch to i0 on signed
 * overflow; the emitting lines are not visible in this excerpt. */
3335 _boaddi(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_word_t i1)
/* Immediate accepted by can_sign_extend_int_p(): direct sequence (not
 * shown), returning _jit->pc.w after emission. */
3338 if (can_sign_extend_int_p(i1)) {
3341 return (_jit->pc.w);
/* Otherwise use a scratch GPR (requested with jit_class_nospill) and
 * return whatever the register form returns. */
3343 reg = jit_get_reg(jit_class_gpr|jit_class_nospill);
3346 return (boaddr(i0, r0, rn(reg)));
/* _boaddr_u: register form of the unsigned "add, branch on overflow"
 * emitter.
 * NOTE(review): by its name, r0 += r1 then branch to i0 on carry; the
 * emitting lines are not visible in this excerpt.
 * Returns _jit->pc.w as it stands after emission. */
3350 _boaddr_u(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
3354 return (_jit->pc.w);
/* _boaddi_u: immediate form of boaddr_u.
 * NOTE(review): by its name, r0 += i1 then branch to i0 on carry; the
 * emitting lines are not visible in this excerpt. */
3358 _boaddi_u(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_word_t i1)
/* Immediate accepted by can_sign_extend_int_p(): direct sequence (not
 * shown), returning _jit->pc.w after emission. */
3361 if (can_sign_extend_int_p(i1)) {
3364 return (_jit->pc.w);
/* Otherwise use a scratch GPR (requested with jit_class_nospill) and
 * return whatever the register form returns. */
3366 reg = jit_get_reg(jit_class_gpr|jit_class_nospill);
3369 return (boaddr_u(i0, r0, rn(reg)));
/* _bxaddr: register form of the "add, branch if no overflow" emitter.
 * NOTE(review): by its name, r0 += r1 then branch to i0 when no signed
 * overflow occurred; the emitting lines are not visible in this excerpt.
 * Returns _jit->pc.w as it stands after emission. */
3373 _bxaddr(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
3377 return (_jit->pc.w);
/* _bxaddi: immediate form of bxaddr.
 * NOTE(review): by its name, r0 += i1 then branch to i0 when no signed
 * overflow occurred; the emitting lines are not visible in this excerpt. */
3381 _bxaddi(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_word_t i1)
/* Immediate accepted by can_sign_extend_int_p(): direct sequence (not
 * shown), returning _jit->pc.w after emission. */
3384 if (can_sign_extend_int_p(i1)) {
3387 return (_jit->pc.w);
/* Otherwise use a scratch GPR (requested with jit_class_nospill) and
 * return whatever the register form returns. */
3389 reg = jit_get_reg(jit_class_gpr|jit_class_nospill);
3392 return (bxaddr(i0, r0, rn(reg)));
/* _bxaddr_u: register form of the unsigned "add, branch if no overflow"
 * emitter.
 * NOTE(review): by its name, r0 += r1 then branch to i0 when no carry
 * occurred; the emitting lines are not visible in this excerpt.
 * Returns _jit->pc.w as it stands after emission. */
3396 _bxaddr_u(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
3400 return (_jit->pc.w);
/* _bxaddi_u: immediate form of bxaddr_u.
 * NOTE(review): by its name, r0 += i1 then branch to i0 when no carry
 * occurred; the emitting lines are not visible in this excerpt. */
3404 _bxaddi_u(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_word_t i1)
/* Immediate accepted by can_sign_extend_int_p(): direct sequence (not
 * shown), returning _jit->pc.w after emission. */
3407 if (can_sign_extend_int_p(i1)) {
3410 return (_jit->pc.w);
/* Otherwise use a scratch GPR (requested with jit_class_nospill) and
 * return whatever the register form returns. */
3412 reg = jit_get_reg(jit_class_gpr|jit_class_nospill);
3415 return (bxaddr_u(i0, r0, rn(reg)));
/* _bosubr: register form of the "subtract, branch on overflow" emitter.
 * NOTE(review): by its name, r0 -= r1 then branch to i0 on signed
 * overflow; the emitting lines are not visible in this excerpt.
 * Returns _jit->pc.w as it stands after emission. */
3419 _bosubr(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
3423 return (_jit->pc.w);
/* _bosubi: immediate form of bosubr.
 * NOTE(review): by its name, r0 -= i1 then branch to i0 on signed
 * overflow; the emitting lines are not visible in this excerpt. */
3427 _bosubi(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_word_t i1)
/* Immediate accepted by can_sign_extend_int_p(): direct sequence (not
 * shown), returning _jit->pc.w after emission. */
3430 if (can_sign_extend_int_p(i1)) {
3433 return (_jit->pc.w);
/* Otherwise use a scratch GPR (requested with jit_class_nospill) and
 * return whatever the register form returns. */
3435 reg = jit_get_reg(jit_class_gpr|jit_class_nospill);
3438 return (bosubr(i0, r0, rn(reg)));
/* _bosubr_u: register form of the unsigned "subtract, branch on
 * overflow" emitter.
 * NOTE(review): by its name, r0 -= r1 then branch to i0 on borrow; the
 * emitting lines are not visible in this excerpt.
 * Returns _jit->pc.w as it stands after emission. */
3442 _bosubr_u(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
3446 return (_jit->pc.w);
/* _bosubi_u: immediate form of bosubr_u.
 * NOTE(review): by its name, r0 -= i1 then branch to i0 on borrow; the
 * emitting lines are not visible in this excerpt. */
3450 _bosubi_u(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_word_t i1)
/* Immediate accepted by can_sign_extend_int_p(): direct sequence (not
 * shown), returning _jit->pc.w after emission. */
3453 if (can_sign_extend_int_p(i1)) {
3456 return (_jit->pc.w);
/* Otherwise use a scratch GPR (requested with jit_class_nospill) and
 * return whatever the register form returns. */
3458 reg = jit_get_reg(jit_class_gpr|jit_class_nospill);
3461 return (bosubr_u(i0, r0, rn(reg)));
/* _bxsubr: register form of the "subtract, branch if no overflow"
 * emitter.
 * NOTE(review): by its name, r0 -= r1 then branch to i0 when no signed
 * overflow occurred; the emitting lines are not visible in this excerpt.
 * Returns _jit->pc.w as it stands after emission. */
3465 _bxsubr(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
3469 return (_jit->pc.w);
/* _bxsubi: immediate form of bxsubr.
 * NOTE(review): by its name, r0 -= i1 then branch to i0 when no signed
 * overflow occurred; the emitting lines are not visible in this excerpt. */
3473 _bxsubi(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_word_t i1)
/* Immediate accepted by can_sign_extend_int_p(): direct sequence (not
 * shown), returning _jit->pc.w after emission. */
3476 if (can_sign_extend_int_p(i1)) {
3479 return (_jit->pc.w);
/* Otherwise use a scratch GPR (requested with jit_class_nospill) and
 * return whatever the register form returns. */
3481 reg = jit_get_reg(jit_class_gpr|jit_class_nospill);
3484 return (bxsubr(i0, r0, rn(reg)));
/* _bxsubr_u: register form of the unsigned "subtract, branch if no
 * overflow" emitter.
 * NOTE(review): by its name, r0 -= r1 then branch to i0 when no borrow
 * occurred; the emitting lines are not visible in this excerpt.
 * Returns _jit->pc.w as it stands after emission. */
3488 _bxsubr_u(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
3492 return (_jit->pc.w);
/* _bxsubi_u: immediate form of bxsubr_u.
 * NOTE(review): by its name, r0 -= i1 then branch to i0 when no borrow
 * occurred; the emitting lines are not visible in this excerpt. */
3496 _bxsubi_u(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_word_t i1)
/* Immediate accepted by can_sign_extend_int_p(): direct sequence (not
 * shown), returning _jit->pc.w after emission. */
3499 if (can_sign_extend_int_p(i1)) {
3502 return (_jit->pc.w);
/* Otherwise use a scratch GPR (requested with jit_class_nospill) and
 * return whatever the register form returns. */
3504 reg = jit_get_reg(jit_class_gpr|jit_class_nospill);
3507 return (bxsubr_u(i0, r0, rn(reg)));
/* _callr: emit an indirect call through register r0.
 * The operand is encoded with mrm(0x03, 0x02, r7(r0)), i.e. only the low
 * three bits of r0 go into the last field; rex() is handed r0 as well
 * (NOTE(review): presumably to cover registers above 7; the opcode byte
 * line is not visible in this excerpt). */
3511 _callr(jit_state_t *_jit, jit_int32_t r0)
3513 rex(0, 0, _NOREG, _NOREG, r0);
3515 mrm(0x03, 0x02, r7(r0));
/* _calli: emit a call to the absolute address i0.
 * NOTE(review): the opcode/emit lines, the fallback for out-of-range
 * targets and the return statement are not visible in this excerpt. */
3519 _calli(jit_state_t *_jit, jit_word_t i0)
/* Distance from the end of a 5-byte instruction at the current pc; the
 * relative form is only usable when it fits in 32 bits. */
3524 w = i0 - (_jit->pc.w + 5);
3525 if ((jit_int32_t)w == w) {
/* Recomputed relative to pc + 4 (NOTE(review): presumably because one
 * opcode byte has been emitted in between -- that line is not shown). */
3528 w = i0 - (_jit->pc.w + 4);
/* _calli_p: call to address i0 routed through a scratch register.
 * The address is loaded with movi_p() and that call's return value is
 * kept in `word` (NOTE(review): presumably the patch location returned
 * to the caller; the call emission and return are not visible here). */
3541 _calli_p(jit_state_t *_jit, jit_word_t i0)
3545 reg = jit_get_reg(jit_class_gpr);
3546 word = movi_p(rn(reg), i0);
/* _jmpr: emit an indirect jump through register r0.
 * The operand is encoded with mrm(0x03, 0x04, r7(r0)), i.e. only the low
 * three bits of r0 go into the last field; rex() is handed r0 as well
 * (NOTE(review): presumably to cover registers above 7; the opcode byte
 * line is not visible in this excerpt). */
3554 _jmpr(jit_state_t *_jit, jit_int32_t r0)
3556 rex(0, 0, _NOREG, _NOREG, r0);
3558 mrm(0x03, 0x04, r7(r0));
/* _jmpi: emit an unconditional jump to the absolute address i0.
 * NOTE(review): the opcode/emit lines, the fallback for out-of-range
 * targets and the return statement are not visible in this excerpt. */
3562 _jmpi(jit_state_t *_jit, jit_word_t i0)
/* Distance from the end of a 5-byte instruction at the current pc; the
 * relative form is only usable when it fits in 32 bits. */
3567 w = i0 - (_jit->pc.w + 5);
3568 if ((jit_int32_t)w == w) {
/* Recomputed relative to pc + 4 (NOTE(review): presumably because one
 * opcode byte has been emitted in between -- that line is not shown). */
3571 w = i0 - (_jit->pc.w + 4);
/* _jmpi_p: jump to address i0 routed through a scratch register.
 * The scratch is requested with jit_class_nospill, the address is loaded
 * with movi_p() and that call's return value is kept in `word`
 * (NOTE(review): presumably the patch location returned to the caller;
 * the jump emission and return are not visible here). */
3584 _jmpi_p(jit_state_t *_jit, jit_word_t i0)
3588 reg = jit_get_reg(jit_class_gpr|jit_class_nospill);
3589 word = movi_p(rn(reg), i0);
/* _jmpsi: jump emitter taking an 8-bit unsigned operand i0.
 * NOTE(review): the body is not visible in this excerpt; presumably a
 * short jump with i0 as its one-byte displacement -- confirm. */
3597 _jmpsi(jit_state_t *_jit, jit_uint8_t i0)
/* _prolog: emit the entry sequence of the function being compiled
 * (_jitc->function).
 * Steps visible in this excerpt, in order:
 *  - reconcile self.aoff with a declared frame (define_frame or
 *    assume_frame) and, when allocar is set, apply "&= -16" to it;
 *  - compute function->stack from self.alen and self.aoff, rounded up
 *    to a multiple of 16 (plus a term on a line not shown here);
 *  - lower RSP by stack_framesize - REAL_WORDSIZE and store the
 *    callee-save registers flagged in function->regset at fixed offsets;
 *  - store RBP at 0(RSP), copy RSP into RBP, lower RSP by function->stack;
 *  - when allocar is set, store self.aoff at aoffoff(RBP);
 *  - for varargs functions on non-Windows x64, store argument registers
 *    into the save area.
 * NOTE(review): several original lines (the assume_frame early exit, the
 * #if/#else/#endif markers between the register-save variants, the jump
 * skipping the float saves) are not visible in this excerpt. */
3604 _prolog(jit_state_t *_jit, jit_node_t *node)
3607 if (_jitc->function->define_frame || _jitc->function->assume_frame) {
3608 jit_int32_t frame = -_jitc->function->frame;
/* The locals already allocated must fit inside the declared frame. */
3609 assert(_jitc->function->self.aoff >= frame);
3610 if (_jitc->function->assume_frame)
3612 _jitc->function->self.aoff = frame;
3614 if (_jitc->function->allocar)
3615 _jitc->function->self.aoff &= -16;
3616 #if __X64 && (__CYGWIN__ || _WIN32)
3617 _jitc->function->stack = (((/* first 32 bytes must be allocated */
3618 (_jitc->function->self.alen > 32 ?
3619 _jitc->function->self.alen : 32) -
3620 /* align stack at 16 bytes */
3621 _jitc->function->self.aoff) + 15) & -16) +
3624 _jitc->function->stack = (((_jitc->function->self.alen -
3625 _jitc->function->self.aoff) + 15) & -16) +
/* Make room for the register save slots used below. */
3628 subi(_RSP_REGNO, _RSP_REGNO, stack_framesize - REAL_WORDSIZE);
3629 /* callee save registers */
/* Variant with 4-byte slots (NOTE(review): presumably the 32-bit build). */
3631 if (jit_regset_tstbit(&_jitc->function->regset, _RDI))
3632 stxi(12, _RSP_REGNO, _RDI_REGNO);
3633 if (jit_regset_tstbit(&_jitc->function->regset, _RSI))
3634 stxi( 8, _RSP_REGNO, _RSI_REGNO);
3635 if (jit_regset_tstbit(&_jitc->function->regset, _RBX))
3636 stxi( 4, _RSP_REGNO, _RBX_REGNO);
/* Cygwin/Windows variant: XMM6-XMM15 are stored with sse_stxi_d, then
 * R12-R15, RSI, RDI and RBX in 8-byte slots. */
3638 # if __CYGWIN__ || _WIN32
3639 if (jit_regset_tstbit(&_jitc->function->regset, _XMM15))
3640 sse_stxi_d(136, _RSP_REGNO, _XMM15_REGNO);
3641 if (jit_regset_tstbit(&_jitc->function->regset, _XMM14))
3642 sse_stxi_d(128, _RSP_REGNO, _XMM14_REGNO);
3643 if (jit_regset_tstbit(&_jitc->function->regset, _XMM13))
3644 sse_stxi_d(120, _RSP_REGNO, _XMM13_REGNO);
3645 if (jit_regset_tstbit(&_jitc->function->regset, _XMM12))
3646 sse_stxi_d(112, _RSP_REGNO, _XMM12_REGNO);
3647 if (jit_regset_tstbit(&_jitc->function->regset, _XMM11))
3648 sse_stxi_d(104, _RSP_REGNO, _XMM11_REGNO);
3649 if (jit_regset_tstbit(&_jitc->function->regset, _XMM10))
3650 sse_stxi_d(96, _RSP_REGNO, _XMM10_REGNO);
3651 if (jit_regset_tstbit(&_jitc->function->regset, _XMM9))
3652 sse_stxi_d(88, _RSP_REGNO, _XMM9_REGNO);
3653 if (jit_regset_tstbit(&_jitc->function->regset, _XMM8))
3654 sse_stxi_d(80, _RSP_REGNO, _XMM8_REGNO);
3655 if (jit_regset_tstbit(&_jitc->function->regset, _XMM7))
3656 sse_stxi_d(72, _RSP_REGNO, _XMM7_REGNO);
3657 if (jit_regset_tstbit(&_jitc->function->regset, _XMM6))
3658 sse_stxi_d(64, _RSP_REGNO, _XMM6_REGNO);
3659 if (jit_regset_tstbit(&_jitc->function->regset, _R15))
3660 stxi(56, _RSP_REGNO, _R15_REGNO);
3661 if (jit_regset_tstbit(&_jitc->function->regset, _R14))
3662 stxi(48, _RSP_REGNO, _R14_REGNO);
3663 if (jit_regset_tstbit(&_jitc->function->regset, _R13))
3664 stxi(40, _RSP_REGNO, _R13_REGNO);
3665 if (jit_regset_tstbit(&_jitc->function->regset, _R12))
3666 stxi(32, _RSP_REGNO, _R12_REGNO);
3667 if (jit_regset_tstbit(&_jitc->function->regset, _RSI))
3668 stxi(24, _RSP_REGNO, _RSI_REGNO);
3669 if (jit_regset_tstbit(&_jitc->function->regset, _RDI))
3670 stxi(16, _RSP_REGNO, _RDI_REGNO);
3671 if (jit_regset_tstbit(&_jitc->function->regset, _RBX))
3672 stxi( 8, _RSP_REGNO, _RBX_REGNO);
/* Remaining variant: RBX and R12-R15 in 8-byte slots. */
3674 if (jit_regset_tstbit(&_jitc->function->regset, _RBX))
3675 stxi(40, _RSP_REGNO, _RBX_REGNO);
3676 if (jit_regset_tstbit(&_jitc->function->regset, _R12))
3677 stxi(32, _RSP_REGNO, _R12_REGNO);
3678 if (jit_regset_tstbit(&_jitc->function->regset, _R13))
3679 stxi(24, _RSP_REGNO, _R13_REGNO);
3680 if (jit_regset_tstbit(&_jitc->function->regset, _R14))
3681 stxi(16, _RSP_REGNO, _R14_REGNO);
3682 if (jit_regset_tstbit(&_jitc->function->regset, _R15))
3683 stxi( 8, _RSP_REGNO, _R15_REGNO);
/* Save the caller's RBP in slot 0 and establish the new frame pointer. */
3686 stxi(0, _RSP_REGNO, _RBP_REGNO);
3687 movr(_RBP_REGNO, _RSP_REGNO);
/* Allocate the local/outgoing-argument area computed above. */
3690 subi(_RSP_REGNO, _RSP_REGNO, _jitc->function->stack);
/* With allocar set, record the current self.aoff in the frame slot at
 * aoffoff(RBP), using a scratch GPR for the constant. */
3691 if (_jitc->function->allocar) {
3692 reg = jit_get_reg(jit_class_gpr);
3693 movi(rn(reg), _jitc->function->self.aoff);
3694 stxi_i(_jitc->function->aoffoff, _RBP_REGNO, rn(reg));
3698 #if __X64 && !(__CYGWIN__ || _WIN32)
3699 if (_jitc->function->self.call & jit_call_varargs) {
3700 jit_word_t nofp_code;
3702 /* Save gp registers in the save area, if any is a vararg */
3703 for (reg = first_gp_from_offset(_jitc->function->vagp);
3704 jit_arg_reg_p(reg); ++reg)
3705 stxi(_jitc->function->vaoff + first_gp_offset +
3706 reg * 8, _RBP_REGNO, rn(JIT_RA0 - reg));
3708 reg = first_fp_from_offset(_jitc->function->vafp);
3709 if (jit_arg_f_reg_p(reg)) {
3710 /* Skip over if no float registers were passed as argument */
/* Remember where the skipping jump sits so it can be patched once the
 * float-save loop has been emitted. */
3715 nofp_code = _jit->pc.w;
3717 /* Save fp registers in the save area, if any is a vararg */
3718 /* Note that the full 16 byte xmm is not saved, because
3719 * lightning only handles float and double, and, while
3720 * attempting to provide a va_list compatible pointer as
3721 * jit_va_start return, does not guarantee it (on all ports). */
3722 for (; jit_arg_f_reg_p(reg); ++reg)
3723 sse_stxi_d(_jitc->function->vaoff + first_fp_offset +
3724 reg * va_fp_increment, _RBP_REGNO, rn(_XMM0 - reg));
3726 patch_rel_char(nofp_code, _jit->pc.w);
/* _epilog: emit the exit sequence matching _prolog.
 * Steps visible in this excerpt: copy RBP back into RSP, reload every
 * callee-save register flagged in function->regset from the same offsets
 * the prolog stored them at, reload RBP from 0(RSP), and raise RSP by
 * stack_framesize - REAL_WORDSIZE.
 * NOTE(review): the assume_frame early exit, the #if/#else/#endif markers
 * between the register-restore variants and the final return instruction
 * are not visible in this excerpt. */
3733 _epilog(jit_state_t *_jit, jit_node_t *node)
3735 if (_jitc->function->assume_frame)
3737 /* callee save registers */
/* Drop the local area: RSP goes back to the register save slots. */
3738 movr(_RSP_REGNO, _RBP_REGNO);
/* Variant with 4-byte slots (NOTE(review): presumably the 32-bit build). */
3740 if (jit_regset_tstbit(&_jitc->function->regset, _RDI))
3741 ldxi(_RDI_REGNO, _RSP_REGNO, 12);
3742 if (jit_regset_tstbit(&_jitc->function->regset, _RSI))
3743 ldxi(_RSI_REGNO, _RSP_REGNO, 8);
3744 if (jit_regset_tstbit(&_jitc->function->regset, _RBX))
3745 ldxi(_RBX_REGNO, _RSP_REGNO, 4);
/* Cygwin/Windows variant: XMM6-XMM15 are reloaded with sse_ldxi_d, then
 * R12-R15, RSI, RDI and RBX from 8-byte slots. */
3747 # if __CYGWIN__ || _WIN32
3748 if (jit_regset_tstbit(&_jitc->function->regset, _XMM15))
3749 sse_ldxi_d(_XMM15_REGNO, _RSP_REGNO, 136);
3750 if (jit_regset_tstbit(&_jitc->function->regset, _XMM14))
3751 sse_ldxi_d(_XMM14_REGNO, _RSP_REGNO, 128);
3752 if (jit_regset_tstbit(&_jitc->function->regset, _XMM13))
3753 sse_ldxi_d(_XMM13_REGNO, _RSP_REGNO, 120);
3754 if (jit_regset_tstbit(&_jitc->function->regset, _XMM12))
3755 sse_ldxi_d(_XMM12_REGNO, _RSP_REGNO, 112);
3756 if (jit_regset_tstbit(&_jitc->function->regset, _XMM11))
3757 sse_ldxi_d(_XMM11_REGNO, _RSP_REGNO, 104);
3758 if (jit_regset_tstbit(&_jitc->function->regset, _XMM10))
3759 sse_ldxi_d(_XMM10_REGNO, _RSP_REGNO, 96);
3760 if (jit_regset_tstbit(&_jitc->function->regset, _XMM9))
3761 sse_ldxi_d(_XMM9_REGNO, _RSP_REGNO, 88);
3762 if (jit_regset_tstbit(&_jitc->function->regset, _XMM8))
3763 sse_ldxi_d(_XMM8_REGNO, _RSP_REGNO, 80);
3764 if (jit_regset_tstbit(&_jitc->function->regset, _XMM7))
3765 sse_ldxi_d(_XMM7_REGNO, _RSP_REGNO, 72);
3766 if (jit_regset_tstbit(&_jitc->function->regset, _XMM6))
3767 sse_ldxi_d(_XMM6_REGNO, _RSP_REGNO, 64);
3768 if (jit_regset_tstbit(&_jitc->function->regset, _R15))
3769 ldxi(_R15_REGNO, _RSP_REGNO, 56);
3770 if (jit_regset_tstbit(&_jitc->function->regset, _R14))
3771 ldxi(_R14_REGNO, _RSP_REGNO, 48);
3772 if (jit_regset_tstbit(&_jitc->function->regset, _R13))
3773 ldxi(_R13_REGNO, _RSP_REGNO, 40);
3774 if (jit_regset_tstbit(&_jitc->function->regset, _R12))
3775 ldxi(_R12_REGNO, _RSP_REGNO, 32);
3776 if (jit_regset_tstbit(&_jitc->function->regset, _RSI))
3777 ldxi(_RSI_REGNO, _RSP_REGNO, 24);
3778 if (jit_regset_tstbit(&_jitc->function->regset, _RDI))
3779 ldxi(_RDI_REGNO, _RSP_REGNO, 16);
3780 if (jit_regset_tstbit(&_jitc->function->regset, _RBX))
3781 ldxi(_RBX_REGNO, _RSP_REGNO, 8);
/* Remaining variant: RBX and R12-R15 from 8-byte slots. */
3783 if (jit_regset_tstbit(&_jitc->function->regset, _RBX))
3784 ldxi(_RBX_REGNO, _RSP_REGNO, 40);
3785 if (jit_regset_tstbit(&_jitc->function->regset, _R12))
3786 ldxi(_R12_REGNO, _RSP_REGNO, 32);
3787 if (jit_regset_tstbit(&_jitc->function->regset, _R13))
3788 ldxi(_R13_REGNO, _RSP_REGNO, 24);
3789 if (jit_regset_tstbit(&_jitc->function->regset, _R14))
3790 ldxi(_R14_REGNO, _RSP_REGNO, 16);
3791 if (jit_regset_tstbit(&_jitc->function->regset, _R15))
3792 ldxi(_R15_REGNO, _RSP_REGNO, 8);
/* Restore the caller's RBP and release the register save slots. */
3795 ldxi(_RBP_REGNO, _RSP_REGNO, 0);
3796 addi(_RSP_REGNO, _RSP_REGNO, stack_framesize - REAL_WORDSIZE);
/* _vastart: emit code that initializes variadic argument access and
 * leaves the result in r0. Both variants assert that the current
 * function was declared with jit_call_varargs.
 *  - __X32 / Cygwin / Windows: r0 = RBP + self.size.
 *  - Otherwise: r0 = RBP + vaoff, pointing at a jit_va_list_t whose
 *    gpoff, fpoff, over and save fields are filled in below through one
 *    scratch GPR.
 * NOTE(review): the #else/#endif markers and the release of the scratch
 * register are not visible in this excerpt. */
3802 _vastart(jit_state_t *_jit, jit_int32_t r0)
3804 #if __X32 || __CYGWIN__ || _WIN32
3805 assert(_jitc->function->self.call & jit_call_varargs);
3806 addi(r0, _RBP_REGNO, _jitc->function->self.size);
3810 assert(_jitc->function->self.call & jit_call_varargs);
3812 /* Return jit_va_list_t in the register argument */
3813 addi(r0, _RBP_REGNO, _jitc->function->vaoff);
3814 reg = jit_get_reg(jit_class_gpr);
3816 /* Initialize gp offset in the save area. */
3817 movi(rn(reg), _jitc->function->vagp);
3818 stxi_i(offsetof(jit_va_list_t, gpoff), r0, rn(reg));
3820 /* Initialize fp offset in the save area. */
3821 movi(rn(reg), _jitc->function->vafp);
3822 stxi_i(offsetof(jit_va_list_t, fpoff), r0, rn(reg));
3824 /* Initialize overflow pointer to the first stack argument. */
3825 addi(rn(reg), _RBP_REGNO, _jitc->function->self.size);
3826 stxi(offsetof(jit_va_list_t, over), r0, rn(reg));
3828 /* Initialize register save area pointer. */
3829 addi(rn(reg), r0, first_gp_offset);
3830 stxi(offsetof(jit_va_list_t, save), r0, rn(reg));
/* _vaarg: emit code that fetches the next word-sized variadic argument
 * into r0, with r1 holding the value produced by _vastart. Both variants
 * assert that the current function was declared with jit_call_varargs.
 *  - __X32 / Cygwin / Windows: r1 is advanced by va_gp_increment
 *    (NOTE(review): the load into r0 is not visible in this excerpt).
 *  - Otherwise: gpoff is compared with va_gp_max_offset; while register
 *    slots remain the value is read from save + gpoff and gpoff grows by
 *    8, else it is read through the `over` pointer, which is then
 *    advanced by va_gp_increment. The two forward jumps are fixed up
 *    with patch_rel_char().
 * NOTE(review): the jump emissions, the overflow load and the release of
 * the scratch registers are not visible in this excerpt. */
3837 _vaarg(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3839 #if __X32 || __CYGWIN__ || _WIN32
3840 assert(_jitc->function->self.call & jit_call_varargs);
3842 addi(r1, r1, va_gp_increment);
3849 assert(_jitc->function->self.call & jit_call_varargs);
3851 rg0 = jit_get_reg(jit_class_gpr);
3852 rg1 = jit_get_reg(jit_class_gpr);
3854 /* Load the gp offset in save area in the first temporary. */
3855 ldxi_i(rn(rg0), r1, offsetof(jit_va_list_t, gpoff));
3857 /* Jump over if there are no remaining arguments in the save area. */
3858 icmpi(rn(rg0), va_gp_max_offset);
3860 ge_code = _jit->pc.w;
3862 /* Load the save area pointer in the second temporary. */
3863 ldxi(rn(rg1), r1, offsetof(jit_va_list_t, save));
3865 /* Load the vararg argument in the first argument. */
3866 ldxr(r0, rn(rg1), rn(rg0));
3868 /* Update the gp offset. */
3869 addi(rn(rg0), rn(rg0), 8);
3870 stxi_i(offsetof(jit_va_list_t, gpoff), r1, rn(rg0));
3872 /* Will only need one temporary register below. */
3875 /* Jump over overflow code. */
3877 lt_code = _jit->pc.w;
3879 /* Where to land if argument is in overflow area. */
3880 patch_rel_char(ge_code, _jit->pc.w);
3882 /* Load overflow pointer. */
3883 ldxi(rn(rg0), r1, offsetof(jit_va_list_t, over));
3885 /* Load argument. */
3888 /* Update overflow pointer. */
3889 addi(rn(rg0), rn(rg0), va_gp_increment);
3890 stxi(offsetof(jit_va_list_t, over), r1, rn(rg0));
3892 /* Where to land if argument is in save area. */
3893 patch_rel_char(lt_code, _jit->pc.w);
3899 /* The x87 boolean argument selects where the result is placed: in an
3900 * x87 register when it is non-false, in an sse register otherwise. */
/* _vaarg_d: emit code that fetches the next double variadic argument
 * into r0, with r1 holding the value produced by _vastart. Both variants
 * assert that the current function was declared with jit_call_varargs.
 * In the full va_list variant, fpoff is compared with va_fp_max_offset;
 * while register slots remain the value is read from save + fpoff and
 * fpoff grows by va_fp_increment, else it is read through the `over`
 * pointer, which is then advanced by 8. The two forward jumps are fixed
 * up with patch_rel_char().
 * NOTE(review): the body of the __X32 / Cygwin / Windows variant, the
 * if/else lines testing x87, the jump emissions and the release of the
 * scratch registers are not visible in this excerpt. */
3902 _vaarg_d(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_bool_t x87)
3904 #if __X32 || __CYGWIN__ || _WIN32
3905 assert(_jitc->function->self.call & jit_call_varargs);
3917 assert(_jitc->function->self.call & jit_call_varargs);
3919 rg0 = jit_get_reg(jit_class_gpr);
3920 rg1 = jit_get_reg(jit_class_gpr);
3922 /* Load the fp offset in save area in the first temporary. */
3923 ldxi_i(rn(rg0), r1, offsetof(jit_va_list_t, fpoff));
3925 /* Jump over if there are no remaining arguments in the save area. */
3926 icmpi(rn(rg0), va_fp_max_offset);
3928 ge_code = _jit->pc.w;
3930 /* Load the save area pointer in the second temporary. */
3931 ldxi(rn(rg1), r1, offsetof(jit_va_list_t, save));
3933 /* Load the vararg argument in the first argument. */
3935 x87_ldxr_d(r0, rn(rg1), rn(rg0));
3937 sse_ldxr_d(r0, rn(rg1), rn(rg0));
3939 /* Update the fp offset. */
3940 addi(rn(rg0), rn(rg0), va_fp_increment);
3941 stxi_i(offsetof(jit_va_list_t, fpoff), r1, rn(rg0));
3943 /* Will only need one temporary register below. */
3946 /* Jump over overflow code. */
3948 lt_code = _jit->pc.w;
3950 /* Where to land if argument is in overflow area. */
3951 patch_rel_char(ge_code, _jit->pc.w);
3953 /* Load overflow pointer. */
3954 ldxi(rn(rg0), r1, offsetof(jit_va_list_t, over));
3956 /* Load argument. */
3958 x87_ldr_d(r0, rn(rg0));
3960 sse_ldr_d(r0, rn(rg0));
3962 /* Update overflow pointer. */
3963 addi(rn(rg0), rn(rg0), 8);
3964 stxi(offsetof(jit_va_list_t, over), r1, rn(rg0));
3966 /* Where to land if argument is in save area. */
3967 patch_rel_char(lt_code, _jit->pc.w);
/* _patch_at: fix up the instruction at `instr` so that it refers to
 * `label`, choosing the patch style from node->code.
 * jit_code_calli is among the codes handled with patch_abs(); codes not
 * listed fall to patch_rel().
 * NOTE(review): the other case labels, any preprocessor guards around
 * them, and the default/break lines are not visible in this excerpt. */
3974 _patch_at(jit_state_t *_jit, jit_node_t *node,
3975 jit_word_t instr, jit_word_t label)
3977 switch (node->code) {
3979 case jit_code_calli:
3983 patch_abs(instr, label);
3986 patch_rel(instr, label);