2 * Copyright (C) 2019 Free Software Foundation, Inc.
4 * This file is part of GNU lightning.
6 * GNU lightning is free software; you can redistribute it and/or modify it
7 * under the terms of the GNU Lesser General Public License as published
8 * by the Free Software Foundation; either version 3, or (at your option)
11 * GNU lightning is distributed in the hope that it will be useful, but
12 * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
13 * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public
14 * License for more details.
17 * Paulo Cesar Pereira de Andrade
/* ui: short alias for jit_uint32_t. */
26 # define ui jit_uint32_t
/* ii(i): store `i` through the code pointer _jit->pc.ui and post-increment
 * that pointer. The expansion is a bare, unparenthesized assignment, so it
 * is only suitable for use as a statement. */
95 # define ii(i) *_jit->pc.ui++ = i
96 /* FIXME: jit_rewind_prolog() could be used so that the extra 64 bytes are
97 * only reserved for a variadic jit function that has variadic arguments in
/* Stack frame size used by this backend: 200 plus an extra 64. */
99 # define stack_framesize (200 + 64)
/* The unsuffixed load names are aliases for the `_l` variants
 * (ldr_l, ldi_l, ldxr_l, ldxi_l). */
100 # define ldr(r0, r1) ldr_l(r0, r1)
101 # define ldi(r0, im) ldi_l(r0, im)
102 # define ldxr(r0, r1, r2) ldxr_l(r0, r1, r2)
103 # define ldxi(r0, r1, im) ldxi_l(r0, r1, im)
/* Likewise, the unsuffixed store names are aliases for the `_l` variants
 * (str_l, sti_l, stxr_l, stxi_l). */
104 # define str(r0, r1) str_l(r0, r1)
105 # define sti(im, r0) sti_l(im, r0)
106 # define stxr(r0, r1, r2) stxr_l(r0, r1, r2)
107 # define stxi(im, r0, r1) stxi_l(im, r0, r1)
/*
 * Signed-immediate range predicates.  Each one is non-zero when `im` lies
 * inside the inclusive range [-2^(N-1), 2^(N-1) - 1] for N = 6, 12, 20 or 32.
 * The argument is evaluated more than once, so it must not have side effects.
 */
# define simm6_p(im)			(-32 <= (im) && (im) <= 31)
# define simm12_p(im)			(-2048 <= (im) && (im) <= 2047)
# define simm20_p(im)			(-524288 <= (im) && (im) <= 524287)
# define simm32_p(im)			(-2147483648LL <= (im) && (im) <= 2147483647LL)
114 * RV32I Base Instruction Set
/* Upper-immediate and jump encodings. The first argument of every encoder
 * call is its `op` value (55, 23, 111, 103); JALR is I-type with fct 0. */
116 # define LUI(rd, imm) Utype(55, rd, imm)
117 # define AUIPC(rd, imm) Utype(23, rd, imm)
118 # define JAL(rd, imm) Jtype(111, rd, imm)
119 # define JALR(rd, rs1, imm) Itype(103, rd, 0, rs1, imm)
/* Conditional branches: all B-type with op 99; the second argument (fct)
 * distinguishes the comparison. */
120 # define BEQ(rs1, rs2, imm) Btype(99, 0, rs1, rs2, imm)
121 # define BNE(rs1, rs2, imm) Btype(99, 1, rs1, rs2, imm)
122 # define BLT(rs1, rs2, imm) Btype(99, 4, rs1, rs2, imm)
123 # define BGE(rs1, rs2, imm) Btype(99, 5, rs1, rs2, imm)
124 # define BLTU(rs1, rs2, imm) Btype(99, 6, rs1, rs2, imm)
125 # define BGEU(rs1, rs2, imm) Btype(99, 7, rs1, rs2, imm)
/* Loads: I-type with op 3; fct selects the variant. */
126 # define LB(rd, rs1, imm) Itype(3, rd, 0, rs1, imm)
127 # define LH(rd, rs1, imm) Itype(3, rd, 1, rs1, imm)
128 # define LW(rd, rs1, imm) Itype(3, rd, 2, rs1, imm)
129 # define LBU(rd, rs1, imm) Itype(3, rd, 4, rs1, imm)
130 # define LHU(rd, rs1, imm) Itype(3, rd, 5, rs1, imm)
/* Stores: S-type with op 35; fct selects the variant. */
131 # define SB(rs1, rs2, imm) Stype(35, 0, rs1, rs2, imm)
132 # define SH(rs1, rs2, imm) Stype(35, 1, rs1, rs2, imm)
133 # define SW(rs1, rs2, imm) Stype(35, 2, rs1, rs2, imm)
/* Register-immediate ALU operations: I-type with op 19. */
134 # define ADDI(rd, rs1, imm) Itype(19, rd, 0, rs1, imm)
135 # define SLTI(rd, rs1, imm) Itype(19, rd, 2, rs1, imm)
136 # define SLTIU(rd, rs1, imm) Itype(19, rd, 3, rs1, imm)
137 # define XORI(rd, rs1, imm) Itype(19, rd, 4, rs1, imm)
138 # define ORI(rd, rs1, imm) Itype(19, rd, 6, rs1, imm)
139 # define ANDI(rd, rs1, imm) Itype(19, rd, 7, rs1, imm)
/* Shift-by-immediate forms for a 32-bit word size: emitted through the R-type
 * encoder (op 19) with the shift amount in the rs2 position. SRAI differs
 * from SRLI only in the final field (32 instead of 0). */
140 # if __WORDSIZE == 32
141 # define SLLI(rd, rs1, imm) Rtype(19, rd, 1, rs1, imm, 0)
142 # define SRLI(rd, rs1, imm) Rtype(19, rd, 5, rs1, imm, 0)
143 # define SRAI(rd, rs1, imm) Rtype(19, rd, 5, rs1, imm, 32)
/* Register-register ALU operations: R-type with op 51. SUB and SRA share
 * their fct value with ADD and SRL respectively and pass 32 as the final
 * field; every other entry passes 0. */
145 # define ADD(rd, rs1, rs2) Rtype(51, rd, 0, rs1, rs2, 0)
146 # define SUB(rd, rs1, rs2) Rtype(51, rd, 0, rs1, rs2, 32)
147 # define SLL(rd, rs1, rs2) Rtype(51, rd, 1, rs1, rs2, 0)
148 # define SLT(rd, rs1, rs2) Rtype(51, rd, 2, rs1, rs2, 0)
149 # define SLTU(rd, rs1, rs2) Rtype(51, rd, 3, rs1, rs2, 0)
150 # define XOR(rd, rs1, rs2) Rtype(51, rd, 4, rs1, rs2, 0)
151 # define SRL(rd, rs1, rs2) Rtype(51, rd, 5, rs1, rs2, 0)
152 # define SRA(rd, rs1, rs2) Rtype(51, rd, 5, rs1, rs2, 32)
153 # define OR(rd, rs1, rs2) Rtype(51, rd, 6, rs1, rs2, 0)
154 # define AND(rd, rs1, rs2) Rtype(51, rd, 7, rs1, rs2, 0)
/*
 * FENCE and FENCE_I: I-type encodings on op 15 with rd and rs1 both 0;
 * fct 0 selects FENCE and fct 1 selects FENCE_I.  The macro argument is
 * forwarded as the I-type immediate.
 *
 * The expansion must name the `imm` parameter: it previously used `im`,
 * which is not a parameter of these macros, so any use either failed to
 * compile or silently captured an unrelated `im` from the caller's scope.
 */
# define FENCE(imm)			Itype(15, 0, 0, 0, imm)
# define FENCE_I(imm)			Itype(15, 0, 1, 0, imm)
/* System instructions: I-type with op 115. ECALL and EBREAK have all
 * register/fct fields 0 and differ only in the immediate (0 vs 1). */
157 # define ECALL() Itype(115, 0, 0, 0, 0)
158 # define EBREAK() Itype(115, 0, 0, 0, 1)
/* CSR access: fct 1-3 take a register operand in rs1, fct 5-7 place `zimm`
 * in the rs1 position; `csr` is passed as the I-type immediate.
 * NOTE(review): _Itype asserts simm12_p() on its immediate, so as written a
 * csr value above 2047 would trip that assert -- confirm whether that is
 * intended. */
159 # define CSRRW(rd, rs1, csr) Itype(115, rd, 1, rs1, csr)
160 # define CSRRS(rd, rs1, csr) Itype(115, rd, 2, rs1, csr)
161 # define CSRRC(rd, rs1, csr) Itype(115, rd, 3, rs1, csr)
162 # define CSRRWI(rd, zimm, csr) Itype(115, rd, 5, zimm, csr)
163 # define CSRRSI(rd, zimm, csr) Itype(115, rd, 6, zimm, csr)
164 # define CSRRCI(rd, zimm, csr) Itype(115, rd, 7, zimm, csr)
166 * RV64I Base Instruction Set (in addition to RV32I)
/* Additional loads/stores: same op values as the other loads (3) and
 * stores (35), with further fct values (6 and 3 for loads, 3 for the
 * store). */
168 # define LWU(rd, rs1, imm) Itype(3, rd, 6, rs1, imm)
169 # define LD(rd, rs1, imm) Itype(3, rd, 3, rs1, imm)
170 # define SD(rs1, rs2, imm) Stype(35, 3, rs1, rs2, imm)
/* Shift-by-immediate forms for a 64-bit word size go through the IStype
 * encoder, passing the shift amount as `sh`; SRAI passes 16 as the final
 * argument where SLLI and SRLI pass 0. */
171 # if __WORDSIZE == 64
172 # define SLLI(rd, rs1, sh) IStype(19, rd, 1, rs1, sh, 0)
173 # define SRLI(rd, rs1, sh) IStype(19, rd, 5, rs1, sh, 0)
174 # define SRAI(rd, rs1, sh) IStype(19, rd, 5, rs1, sh, 16)
/*
 * RV64I "W" operations.
 *
 * Immediate forms use op 27: ADDIW is I-type; the shift-immediate forms go
 * through the R-type encoder with the shift amount in the rs2 position.
 * Register forms use op 59.
 *
 * SRLIW/SRAIW use fct 5, matching SRLI/SRAI and SRLW/SRAW and the RISC-V
 * encoding (funct3 = 101); they previously passed 3, which is not the
 * right-shift funct3.  As with the other arithmetic right shifts, SRAIW
 * differs from SRLIW only in the final field (32 instead of 0).
 *
 * The third parameter of the register forms is a register number, so it
 * is named rs2 rather than imm.
 */
# define ADDIW(rd, rs1, imm)		Itype(27, rd, 0, rs1, imm)
# define SLLIW(rd, rs1, imm)		Rtype(27, rd, 1, rs1, imm, 0)
# define SRLIW(rd, rs1, imm)		Rtype(27, rd, 5, rs1, imm, 0)
# define SRAIW(rd, rs1, imm)		Rtype(27, rd, 5, rs1, imm, 32)
# define ADDW(rd, rs1, rs2)		Rtype(59, rd, 0, rs1, rs2, 0)
# define SUBW(rd, rs1, rs2)		Rtype(59, rd, 0, rs1, rs2, 32)
# define SLLW(rd, rs1, rs2)		Rtype(59, rd, 1, rs1, rs2, 0)
# define SRLW(rd, rs1, rs2)		Rtype(59, rd, 5, rs1, rs2, 0)
# define SRAW(rd, rs1, rs2)		Rtype(59, rd, 5, rs1, rs2, 32)
186 * RV32M Standard Extension
/* Multiply/divide/remainder: R-type with a final field of 1. The first
 * group uses op 51 with fct 0-7; the W group further down uses op 59 with
 * the same fct values as its op-51 counterparts (0, 4, 5, 6, 7). */
188 # define MUL(rd, rs1, rs2) Rtype(51, rd, 0, rs1, rs2, 1)
189 # define MULH(rd, rs1, rs2) Rtype(51, rd, 1, rs1, rs2, 1)
190 # define MULHSU(rd, rs1, rs2) Rtype(51, rd, 2, rs1, rs2, 1)
191 # define MULHU(rd, rs1, rs2) Rtype(51, rd, 3, rs1, rs2, 1)
192 # define DIV(rd, rs1, rs2) Rtype(51, rd, 4, rs1, rs2, 1)
193 # define DIVU(rd, rs1, rs2) Rtype(51, rd, 5, rs1, rs2, 1)
194 # define REM(rd, rs1, rs2) Rtype(51, rd, 6, rs1, rs2, 1)
195 # define REMU(rd, rs1, rs2) Rtype(51, rd, 7, rs1, rs2, 1)
197 * RV64M Standard Extension (in addition to RV32M)
199 # define MULW(rd, rs1, rs2) Rtype(59, rd, 0, rs1, rs2, 1)
200 # define DIVW(rd, rs1, rs2) Rtype(59, rd, 4, rs1, rs2, 1)
201 # define DIVUW(rd, rs1, rs2) Rtype(59, rd, 5, rs1, rs2, 1)
202 # define REMW(rd, rs1, rs2) Rtype(59, rd, 6, rs1, rs2, 1)
203 # define REMUW(rd, rs1, rs2) Rtype(59, rd, 7, rs1, rs2, 1)
205 * RV32A Standard Extension
/* Atomic instructions: all go through the R4type encoder with op 47.
 * fct is 2 for the _W forms and 3 for the _D forms; the `fct2` argument is
 * always 0 here, and the last argument (the encoder's `rs3` slot) selects
 * the operation -- the same value is used for the _W and _D form of each
 * operation. LR_* pass 0 in the rs2 position. */
207 # define LR_W(rd, rs1) R4type(47, rd, 2, rs1, 0, 0, 2)
208 # define SC_W(rd, rs1, rs2) R4type(47, rd, 2, rs1, rs2, 0, 3)
209 # define AMOSWAP_W(rd, rs1, rs2) R4type(47, rd, 2, rs1, rs2, 0, 1)
210 # define AMOADD_W(rd, rs1, rs2) R4type(47, rd, 2, rs1, rs2, 0, 0)
211 # define AMOXOR_W(rd, rs1, rs2) R4type(47, rd, 2, rs1, rs2, 0, 4)
212 # define AMOAND_W(rd, rs1, rs2) R4type(47, rd, 2, rs1, rs2, 0, 12)
213 # define AMOOR_W(rd, rs1, rs2) R4type(47, rd, 2, rs1, rs2, 0, 8)
214 # define AMOMIN_W(rd, rs1, rs2) R4type(47, rd, 2, rs1, rs2, 0, 16)
215 # define AMOMAX_W(rd, rs1, rs2) R4type(47, rd, 2, rs1, rs2, 0, 20)
216 # define AMOMINU_W(rd, rs1, rs2) R4type(47, rd, 2, rs1, rs2, 0, 24)
217 # define AMOMAXU_W(rd, rs1, rs2) R4type(47, rd, 2, rs1, rs2, 0, 28)
219 * RV64A Standard Extension (in addition to RV32A)
221 # define LR_D(rd, rs1) R4type(47, rd, 3, rs1, 0, 0, 2)
222 # define SC_D(rd, rs1, rs2) R4type(47, rd, 3, rs1, rs2, 0, 3)
223 # define AMOSWAP_D(rd, rs1, rs2) R4type(47, rd, 3, rs1, rs2, 0, 1)
224 # define AMOADD_D(rd, rs1, rs2) R4type(47, rd, 3, rs1, rs2, 0, 0)
225 # define AMOXOR_D(rd, rs1, rs2) R4type(47, rd, 3, rs1, rs2, 0, 4)
226 # define AMOAND_D(rd, rs1, rs2) R4type(47, rd, 3, rs1, rs2, 0, 12)
227 # define AMOOR_D(rd, rs1, rs2) R4type(47, rd, 3, rs1, rs2, 0, 8)
228 # define AMOMIN_D(rd, rs1, rs2) R4type(47, rd, 3, rs1, rs2, 0, 16)
229 # define AMOMAX_D(rd, rs1, rs2) R4type(47, rd, 3, rs1, rs2, 0, 20)
230 # define AMOMINU_D(rd, rs1, rs2) R4type(47, rd, 3, rs1, rs2, 0, 24)
231 # define AMOMAXU_D(rd, rs1, rs2) R4type(47, rd, 3, rs1, rs2, 0, 28)
233 * Pseudo Instructions
/* NOP: ADDI of 0 with _ZERO_REGNO as both destination and source. */
235 # define NOP() ADDI(_ZERO_REGNO, _ZERO_REGNO, 0)
/* MV: ADDI with immediate 0, i.e. r0 = r1 + 0. */
236 # define MV(r0, r1) ADDI(r0, r1, 0)
/* NOT: XORI with immediate -1. */
237 # define NOT(r0, r1) XORI(r0, r1, -1)
/* NEG / NEGW: SUB / SUBW of r1 from _ZERO_REGNO. */
238 # define NEG(r0, r1) SUB(r0, _ZERO_REGNO, r1)
239 # define NEGW(r0, r1) SUBW(r0, _ZERO_REGNO, r1)
/* SEXT_W: ADDIW with immediate 0. */
240 # define SEXT_W(r0, r1) ADDIW(r0, r1, 0)
/* RET: JALR with literal register numbers rd = 0 and rs1 = 1 and offset 0
 * (other macros in this file spell these as _ZERO_REGNO / _RA_REGNO). */
241 # define RET() JALR(0, 1, 0)
244 * Encoding functions
/* Each encoder macro forwards to the matching static function, supplying the
 * `_jit` identifier from the caller's scope as the first argument.
 * Rtype: op, rd, fct, rs1, rs2, fct2. */
246 # define Rtype(op, rd, fct, rs1, rs2, fct2) \
247 _Rtype(_jit, op, rd, fct, rs1, rs2, fct2)
248 static void _Rtype(jit_state_t*, jit_int32_t, jit_int32_t,
249 jit_int32_t, jit_int32_t, jit_int32_t, jit_int32_t);
/* R4type: like Rtype with an additional trailing rs3 argument. */
250 # define R4type(op, rd, fct, rs1,rs2,fct2,rs3) \
251 _R4type(_jit, op, rd, fct, rs1, rs2, fct2, rs3)
252 static void _R4type(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t,
253 jit_int32_t, jit_int32_t, jit_int32_t, jit_int32_t);
/* Itype: op, rd, fct, rs1 and an immediate. */
254 # define Itype(op, rd, fct, rs1, imm) \
255 _Itype(_jit, op, rd, fct, rs1, imm)
256 static void _Itype(jit_state_t*, jit_int32_t, jit_int32_t,
257 jit_int32_t, jit_int32_t, jit_int32_t);
/* IStype: only declared when __WORDSIZE == 64; takes a shift amount `sh`
 * in addition to an immediate. */
258 # if __WORDSIZE == 64
259 # define IStype(op, rd, fct, rs1, sh, imm) \
260 _IStype(_jit, op, rd, fct, rs1, sh, imm)
261 static void _IStype(jit_state_t*, jit_int32_t, jit_int32_t,
262 jit_int32_t, jit_int32_t, jit_int32_t,jit_int32_t);
/* Stype and Btype: op, fct, two source registers and an immediate
 * (no rd argument). */
264 # define Stype(op, fct, rs1, rs2, imm) \
265 _Stype(_jit, op, fct, rs1, rs2, imm)
266 static void _Stype(jit_state_t*, jit_int32_t, jit_int32_t,
267 jit_int32_t, jit_int32_t, jit_int32_t);
268 # define Btype(op, fct, rs1, rs2, imm) \
269 _Btype(_jit, op, fct, rs1, rs2, imm)
270 static void _Btype(jit_state_t*, jit_int32_t, jit_int32_t,
271 jit_int32_t, jit_int32_t, jit_int32_t);
/* Utype and Jtype: op, rd and an immediate. */
272 # define Utype(op, rd, imm) _Utype(_jit, op, rd, imm)
273 static void _Utype(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t);
274 # define Jtype(op, rd, imm) _Jtype(_jit, op, rd, imm)
275 static void _Jtype(jit_state_t*, jit_int32_t, jit_int32_t, jit_int32_t);
277 * Lightning instructions
/* Naming convention visible in this list: names ending in `r` take register
 * numbers (jit_int32_t) throughout, names ending in `i` take a jit_word_t
 * immediate as their last operand. Where a single instruction suffices the
 * macro expands directly to it; otherwise it calls a static helper with the
 * caller's `_jit`. */
279 # define nop(im) _nop(_jit, im)
280 static void _nop(jit_state_t*, jit_int32_t);
/* Addition. addr maps directly to ADD; the addc* and addx* helpers work with
 * the jit_carry register (see their definitions). */
281 # define addr(r0, r1, r2) ADD(r0, r1, r2)
282 # define addi(r0, r1, im) _addi(_jit, r0, r1, im)
283 static void _addi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
284 # define addcr(r0, r1, r2) _addcr(_jit, r0, r1, r2)
285 static void _addcr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
286 # define addci(r0, r1, im) _addci(_jit, r0, r1, im)
287 static void _addci(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
288 # define addxr(r0, r1, r2) _addxr(_jit, r0, r1, r2)
289 static void _addxr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
290 # define addxi(r0, r1, im) _addxi(_jit, r0, r1, im)
291 static void _addxi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
/* Subtraction, mirroring the addition group; subr maps directly to SUB. */
292 # define subr(r0, r1, r2) SUB(r0, r1, r2)
293 # define subi(r0, r1, im) _subi(_jit, r0, r1, im)
294 static void _subi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
295 # define subcr(r0, r1, r2) _subcr(_jit, r0, r1, r2)
296 static void _subcr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
297 # define subci(r0, r1, im) _subci(_jit, r0, r1, im)
298 static void _subci(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
299 # define subxr(r0, r1, r2) _subxr(_jit, r0, r1, r2)
300 static void _subxr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
301 # define subxi(r0, r1, im) _subxi(_jit, r0, r1, im)
302 static void _subxi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
303 # define rsbi(r0, r1, im) _rsbi(_jit, r0, r1, im)
304 static void _rsbi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
/* Multiply, divide and remainder: register forms map directly to MUL, DIV,
 * DIVU, REM and REMU; immediate forms use helpers. */
305 # define mulr(r0, r1, r2) MUL(r0, r1, r2)
306 # define muli(r0, r1, im) _muli(_jit, r0, r1, im)
307 static void _muli(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
308 # define divr(r0, r1, r2) DIV(r0, r1, r2)
309 # define divi(r0, r1, im) _divi(_jit, r0, r1, im)
310 static void _divi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
311 # define divr_u(r0, r1, r2) DIVU(r0, r1, r2)
312 # define divi_u(r0, r1, im) _divi_u(_jit, r0, r1, im)
313 static void _divi_u(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
314 # define remr(r0, r1, r2) REM(r0, r1, r2)
315 # define remi(r0, r1, im) _remi(_jit, r0, r1, im)
316 static void _remi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
317 # define remr_u(r0, r1, r2) REMU(r0, r1, r2)
318 # define remi_u(r0, r1, im) _remi_u(_jit, r0, r1, im)
319 static void _remi_u(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
/* qmul*: four-operand multiply helpers (three registers plus a register or
 * a jit_word_t immediate). */
320 # define qmulr(r0, r1, r2, r3) _qmulr(_jit,r0,r1,r2,r3)
321 static void _qmulr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t,jit_int32_t);
322 # define qmuli(r0, r1, r2, i0) _qmuli(_jit,r0,r1,r2,i0)
323 static void _qmuli(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t,jit_word_t);
324 # define qmulr_u(r0, r1, r2, r3) _qmulr_u(_jit,r0,r1,r2,r3)
325 static void _qmulr_u(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t,jit_int32_t);
326 # define qmuli_u(r0, r1, r2, i0) _qmuli_u(_jit,r0,r1,r2,i0)
327 static void _qmuli_u(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t,jit_word_t);
328 static void _iqdivr(jit_state_t*,jit_bool_t,
329 jit_int32_t,jit_int32_t,jit_int32_t,jit_int32_t);
330 # define qdivr(r0,r1,r2,r3) _iqdivr(_jit,1,r0,r1,r2,r3)
331 # define qdivr_u(r0,r1,r2,r3) _iqdivr(_jit,0,r0,r1,r2,r3)
332 static void _iqdivr(jit_state_t*,jit_bool_t,
333 jit_int32_t,jit_int32_t,jit_int32_t,jit_int32_t);
334 # define qdivi(r0,r1,r2,i0) _qdivi(_jit,r0,r1,r2,i0)
335 static void _qdivi(jit_state_t*,jit_int32_t,
336 jit_int32_t,jit_int32_t,jit_word_t);
337 # define qdivi_u(r0,r1,r2,i0) _qdivi_u(_jit,r0,r1,r2,i0)
338 static void _qdivi_u(jit_state_t*,jit_int32_t,
339 jit_int32_t,jit_int32_t,jit_word_t);
/* Shifts: register forms map directly to SLL (lshr), SRA (rshr) and
 * SRL (rshr_u); immediate forms use helpers. */
340 # define lshr(r0, r1, r2) SLL(r0, r1, r2)
341 # define lshi(r0, r1, im) _lshi(_jit, r0, r1, im)
342 static void _lshi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
343 # define rshr(r0, r1, r2) SRA(r0, r1, r2)
344 # define rshi(r0, r1, im) _rshi(_jit, r0, r1, im)
345 static void _rshi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
346 # define rshr_u(r0, r1, r2) SRL(r0, r1, r2)
347 # define rshi_u(r0, r1, im) _rshi_u(_jit, r0, r1, im)
348 static void _rshi_u(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
/* Negate and complement use the NEG and NOT pseudo-instructions. */
349 # define negr(r0, r1) NEG(r0, r1)
350 # define comr(r0, r1) NOT(r0, r1)
/* Bitwise and/or/xor: register forms map directly to AND, OR and XOR;
 * immediate forms use helpers. */
351 # define andr(r0, r1, r2) AND(r0, r1, r2)
352 # define andi(r0, r1, im) _andi(_jit, r0, r1, im)
353 static void _andi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
354 # define orr(r0, r1, r2) OR(r0, r1, r2)
355 # define ori(r0, r1, im) _ori(_jit, r0, r1, im)
356 static void _ori(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
357 # define xorr(r0, r1, r2) XOR(r0, r1, r2)
358 # define xori(r0, r1, im) _xori(_jit, r0, r1, im)
359 static void _xori(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
/* Loads from a register address (ldr_*) expand directly to the matching
 * load instruction with offset 0: LB, LBU, LH, LHU, LW, LWU, LD. Loads from
 * an immediate address (ldi_*) use helpers taking a jit_word_t. */
360 # define ldr_c(r0, r1) LB(r0, r1, 0)
361 # define ldi_c(r0, im) _ldi_c(_jit, r0, im)
362 static void _ldi_c(jit_state_t*,jit_int32_t,jit_word_t);
363 # define ldr_uc(r0, r1) LBU(r0, r1, 0)
364 # define ldi_uc(r0, im) _ldi_uc(_jit, r0, im)
365 static void _ldi_uc(jit_state_t*,jit_int32_t,jit_word_t);
366 # define ldr_s(r0, r1) LH(r0, r1, 0)
367 # define ldi_s(r0, im) _ldi_s(_jit, r0, im)
368 static void _ldi_s(jit_state_t*,jit_int32_t,jit_word_t);
369 # define ldr_us(r0, r1) LHU(r0, r1, 0)
370 # define ldi_us(r0, im) _ldi_us(_jit, r0, im)
371 static void _ldi_us(jit_state_t*,jit_int32_t,jit_word_t);
372 # define ldr_i(r0, r1) LW(r0, r1, 0)
373 # define ldi_i(r0, im) _ldi_i(_jit, r0, im)
374 static void _ldi_i(jit_state_t*,jit_int32_t,jit_word_t);
375 # define ldr_ui(r0, r1) LWU(r0, r1, 0)
376 # define ldi_ui(r0, im) _ldi_ui(_jit, r0, im)
377 static void _ldi_ui(jit_state_t*,jit_int32_t,jit_word_t);
378 # define ldr_l(r0, r1) LD(r0, r1, 0)
379 # define ldi_l(r0, im) _ldi_l(_jit, r0, im)
380 static void _ldi_l(jit_state_t*,jit_int32_t,jit_word_t);
/* Indexed loads: ldxr_* take three registers, ldxi_* take two registers and
 * a jit_word_t; all are implemented by helpers. */
381 # define ldxr_c(r0, r1, r2) _ldxr_c(_jit, r0, r1, r2)
382 static void _ldxr_c(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
383 # define ldxi_c(r0, r1, im) _ldxi_c(_jit, r0, r1, im)
384 static void _ldxi_c(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
385 # define ldxr_uc(r0, r1, r2) _ldxr_uc(_jit, r0, r1, r2)
386 static void _ldxr_uc(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
387 # define ldxi_uc(r0, r1, im) _ldxi_uc(_jit, r0, r1, im)
388 static void _ldxi_uc(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
389 # define ldxr_s(r0, r1, r2) _ldxr_s(_jit, r0, r1, r2)
390 static void _ldxr_s(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
391 # define ldxi_s(r0, r1, im) _ldxi_s(_jit, r0, r1, im)
392 static void _ldxi_s(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
393 # define ldxr_us(r0, r1, r2) _ldxr_us(_jit, r0, r1, r2)
394 static void _ldxr_us(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
395 # define ldxi_us(r0, r1, im) _ldxi_us(_jit, r0, r1, im)
396 static void _ldxi_us(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
397 # define ldxr_i(r0, r1, r2) _ldxr_i(_jit, r0, r1, r2)
398 static void _ldxr_i(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
399 # define ldxi_i(r0, r1, im) _ldxi_i(_jit, r0, r1, im)
400 static void _ldxi_i(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
401 # define ldxr_ui(r0, r1, r2) _ldxr_ui(_jit, r0, r1, r2)
402 static void _ldxr_ui(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
403 # define ldxi_ui(r0, r1, im) _ldxi_ui(_jit, r0, r1, im)
404 static void _ldxi_ui(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
405 # define ldxr_l(r0, r1, r2) _ldxr_l(_jit, r0, r1, r2)
406 static void _ldxr_l(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
407 # define ldxi_l(r0, r1, im) _ldxi_l(_jit, r0, r1, im)
408 static void _ldxi_l(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
/* Stores through a register address (str_*) expand directly to SB, SH, SW
 * and SD with offset 0. Stores to an immediate address (sti_*) use helpers
 * whose first operand is the jit_word_t address. */
409 # define str_c(r0, r1) SB(r0, r1, 0)
410 # define sti_c(im, r0) _sti_c(_jit, im, r0)
411 static void _sti_c(jit_state_t*,jit_word_t,jit_int32_t);
412 # define str_s(r0, r1) SH(r0, r1, 0)
413 # define sti_s(im, r0) _sti_s(_jit, im, r0)
414 static void _sti_s(jit_state_t*,jit_word_t,jit_int32_t);
415 # define str_i(r0, r1) SW(r0, r1, 0)
416 # define sti_i(im, r0) _sti_i(_jit, im, r0)
417 static void _sti_i(jit_state_t*,jit_word_t,jit_int32_t);
418 # define str_l(r0, r1) SD(r0, r1, 0)
419 # define sti_l(im, r0) _sti_l(_jit, im, r0)
420 static void _sti_l(jit_state_t*,jit_word_t,jit_int32_t);
/* Indexed stores: stxr_* take three registers; stxi_* take the jit_word_t
 * operand first, followed by two registers. */
421 # define stxr_c(r0, r1, r2) _stxr_c(_jit, r0, r1, r2)
422 static void _stxr_c(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
423 # define stxi_c(i0, r0, r1) _stxi_c(_jit, i0, r0, r1)
424 static void _stxi_c(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
425 # define stxr_s(r0, r1, r2) _stxr_s(_jit, r0, r1, r2)
426 static void _stxr_s(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
427 # define stxi_s(i0, r0, r1) _stxi_s(_jit, i0, r0, r1)
428 static void _stxi_s(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
429 # define stxr_i(r0, r1, r2) _stxr_i(_jit, r0, r1, r2)
430 static void _stxr_i(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
431 # define stxi_i(i0, r0, r1) _stxi_i(_jit, i0, r0, r1)
432 static void _stxi_i(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
433 # define stxr_l(r0, r1, r2) _stxr_l(_jit, r0, r1, r2)
434 static void _stxr_l(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
435 # define stxi_l(i0, r0, r1) _stxi_l(_jit, i0, r0, r1)
436 static void _stxi_l(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
/* htonr_*: two-register helpers for the us/ui/ul operand sizes. */
437 # define htonr_us(r0, r1) _htonr_us(_jit, r0, r1)
438 static void _htonr_us(jit_state_t*,jit_int32_t,jit_int32_t);
439 # define htonr_ui(r0, r1) _htonr_ui(_jit, r0, r1)
440 static void _htonr_ui(jit_state_t*,jit_int32_t,jit_int32_t);
441 # define htonr_ul(r0, r1) _htonr_ul(_jit, r0, r1)
442 static void _htonr_ul(jit_state_t*,jit_int32_t,jit_int32_t);
/* extr_*: two-register extension operations. extr_uc is an andi with 0xff
 * and extr_i is SEXT_W; the remaining widths use helpers. */
443 # define extr_c(r0, r1) _extr_c(_jit, r0, r1)
444 static void _extr_c(jit_state_t*,jit_int32_t,jit_int32_t);
445 # define extr_uc(r0, r1) andi(r0, r1, 0xff)
446 # define extr_s(r0, r1) _extr_s(_jit, r0, r1)
447 static void _extr_s(jit_state_t*,jit_int32_t,jit_int32_t);
448 # define extr_us(r0, r1) _extr_us(_jit, r0, r1)
449 static void _extr_us(jit_state_t*,jit_int32_t,jit_int32_t);
450 # define extr_i(r0, r1) SEXT_W(r0, r1)
451 # define extr_ui(r0, r1) _extr_ui(_jit, r0, r1)
452 static void _extr_ui(jit_state_t*,jit_int32_t,jit_int32_t);
/* Moves: movr is the MV pseudo-instruction; movi uses a helper. movi_p,
 * unlike movi, returns a jit_word_t (presumably a location usable for later
 * patching -- confirm against its definition). */
453 # define movr(r0, r1) MV(r0, r1)
454 # define movi(r0, im) _movi(_jit, r0, im)
455 static void _movi(jit_state_t*,jit_int32_t,jit_word_t);
456 # define movi_p(r0, im) _movi_p(_jit, r0, im)
457 static jit_word_t _movi_p(jit_state_t*,jit_int32_t,jit_word_t);
/* Comparisons writing their result into r0. ltr and ltr_u map directly to
 * SLT and SLTU; the immediate forms and the le/eq comparisons use
 * helpers. */
458 # define ltr(r0, r1, r2) SLT(r0, r1, r2)
459 # define lti(r0, r1, im) _lti(_jit, r0, r1, im)
460 static void _lti(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
461 # define ltr_u(r0, r1, r2) SLTU(r0, r1, r2)
462 # define lti_u(r0, r1, im) _lti_u(_jit, r0, r1, im)
463 static void _lti_u(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
464 # define ler(r0, r1, r2) _ler(_jit, r0, r1, r2)
465 static void _ler(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
466 # define lei(r0, r1, im) _lei(_jit, r0, r1, im)
467 static void _lei(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
468 # define ler_u(r0, r1, r2) _ler_u(_jit, r0, r1, r2)
469 static void _ler_u(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
470 # define lei_u(r0, r1, im) _lei_u(_jit, r0, r1, im)
471 static void _lei_u(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
472 # define eqr(r0, r1, r2) _eqr(_jit, r0, r1, r2)
473 static void _eqr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
474 # define eqi(r0, r1, im) _eqi(_jit, r0, r1, im)
475 static void _eqi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
476 # define ger(r0, r1, r2) _ger(_jit, r0, r1, r2)
477 static void _ger(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
478 # define gei(r0, r1, r2) _gei(_jit, r0, r1, r2)
479 static void _gei(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
480 # define ger_u(r0, r1, r2) _ger_u(_jit, r0, r1, r2)
481 static void _ger_u(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
482 # define gei_u(r0, r1, im) _gei_u(_jit, r0, r1, im)
483 static void _gei_u(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
/* Greater-than: gtr and gtr_u reuse SLT and SLTU with the two source
 * operands swapped (r2 before r1). Immediate forms use helpers. */
484 # define gtr(r0, r1, r2) SLT(r0, r2, r1)
485 # define gti(r0, r1, im) _gti(_jit, r0, r1, im)
486 static void _gti(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
487 # define gtr_u(r0, r1, r2) SLTU(r0, r2, r1)
488 # define gti_u(r0, r1, im) _gti_u(_jit, r0, r1, im)
489 static void _gti_u(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
/* Not-equal: both forms use helpers. */
490 # define ner(r0, r1, r2) _ner(_jit, r0, r1, r2)
491 static void _ner(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
492 # define nei(r0, r1, im) _nei(_jit, r0, r1, im)
493 static void _nei(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
/* Compare-and-branch helpers. Each takes `br` (a jit_word_t) first, then a
 * register and either a second register (`r` forms) or a jit_word_t
 * immediate (`i` forms), and returns a jit_word_t.
 * NOTE(review): `br` is presumably the branch target and the return value
 * the location of the emitted branch for later patching -- confirm against
 * the definitions. */
494 # define bltr(br, r0, r1) _bltr(_jit, br, r0, r1)
495 static jit_word_t _bltr(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
496 # define blti(br, r0, im) _blti(_jit, br, r0, im)
497 static jit_word_t _blti(jit_state_t*,jit_word_t,jit_int32_t,jit_word_t);
498 # define bltr_u(br, r0, r1) _bltr_u(_jit, br, r0, r1)
499 static jit_word_t _bltr_u(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
500 # define blti_u(br, r0, im) _blti_u(_jit, br, r0, im)
501 static jit_word_t _blti_u(jit_state_t*,jit_word_t,jit_int32_t,jit_word_t);
502 # define bler(br, r0, r1) _bler(_jit, br, r0, r1)
503 static jit_word_t _bler(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
504 # define blei(br, r0, im) _blei(_jit, br, r0, im)
505 static jit_word_t _blei(jit_state_t*,jit_word_t,jit_int32_t,jit_word_t);
506 # define bler_u(br, r0, r1) _bler_u(_jit, br, r0, r1)
507 static jit_word_t _bler_u(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
508 # define blei_u(br, r0, im) _blei_u(_jit, br, r0, im)
509 static jit_word_t _blei_u(jit_state_t*,jit_word_t,jit_int32_t,jit_word_t);
510 # define beqr(br, r0, r1) _beqr(_jit, br, r0, r1)
511 static jit_word_t _beqr(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
512 # define beqi(br, r0, im) _beqi(_jit, br, r0, im)
513 static jit_word_t _beqi(jit_state_t*,jit_word_t,jit_int32_t,jit_word_t);
514 # define bger(br, r0, r1) _bger(_jit, br, r0, r1)
515 static jit_word_t _bger(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
516 # define bgei(br, r0, im) _bgei(_jit, br, r0, im)
517 static jit_word_t _bgei(jit_state_t*,jit_word_t,jit_int32_t,jit_word_t);
518 # define bger_u(br, r0, r1) _bger_u(_jit, br, r0, r1)
519 static jit_word_t _bger_u(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
520 # define bgei_u(br, r0, im) _bgei_u(_jit, br, r0, im)
521 static jit_word_t _bgei_u(jit_state_t*,jit_word_t,jit_int32_t,jit_word_t);
522 # define bgtr(br, r0, r1) _bgtr(_jit, br, r0, r1)
523 static jit_word_t _bgtr(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
524 # define bgti(br, r0, im) _bgti(_jit, br, r0, im)
525 static jit_word_t _bgti(jit_state_t*,jit_word_t,jit_int32_t,jit_word_t);
526 # define bgtr_u(br, r0, r1) _bgtr_u(_jit, br, r0, r1)
527 static jit_word_t _bgtr_u(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
528 # define bgti_u(br, r0, im) _bgti_u(_jit, br, r0, im)
529 static jit_word_t _bgti_u(jit_state_t*,jit_word_t,jit_int32_t,jit_word_t);
530 # define bner(br, r0, r1) _bner(_jit, br, r0, r1)
531 static jit_word_t _bner(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
532 # define bnei(br, r0, im) _bnei(_jit, br, r0, im)
533 static jit_word_t _bnei(jit_state_t*,jit_word_t,jit_int32_t,jit_word_t);
/* Arithmetic and bit-test branch helpers (boadd/bxadd/bosub/bxsub and their
 * _u variants, plus bms/bmc). They share the shape of the compare-and-branch
 * helpers: `br` first, then a register and a register or jit_word_t
 * immediate, returning a jit_word_t. Here each pair of macros is followed
 * by its pair of prototypes.
 * NOTE(review): the names suggest branch-on-overflow / no-overflow and
 * branch-on-mask-set / mask-clear; confirm against the definitions. */
534 # define boaddr(br, r0, r1) _boaddr(_jit, br, r0, r1)
535 # define boaddi(br, r0, im) _boaddi(_jit, br, r0, im)
536 static jit_word_t _boaddr(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
537 static jit_word_t _boaddi(jit_state_t*,jit_word_t,jit_int32_t,jit_word_t);
538 # define boaddr_u(br, r0, r1) _boaddr_u(_jit, br, r0, r1)
539 # define boaddi_u(br, r0, im) _boaddi_u(_jit, br, r0, im)
540 static jit_word_t _boaddr_u(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
541 static jit_word_t _boaddi_u(jit_state_t*,jit_word_t,jit_int32_t,jit_word_t);
542 # define bxaddr(br, r0, r1) _bxaddr(_jit, br, r0, r1)
543 # define bxaddi(br, r0, im) _bxaddi(_jit, br, r0, im)
544 static jit_word_t _bxaddr(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
545 static jit_word_t _bxaddi(jit_state_t*,jit_word_t,jit_int32_t,jit_word_t);
546 # define bxaddr_u(br, r0, r1) _bxaddr_u(_jit, br, r0, r1)
547 # define bxaddi_u(br, r0, im) _bxaddi_u(_jit, br, r0, im)
548 static jit_word_t _bxaddr_u(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
549 static jit_word_t _bxaddi_u(jit_state_t*,jit_word_t,jit_int32_t,jit_word_t);
550 # define bosubr(br, r0, r1) _bosubr(_jit, br, r0, r1)
551 # define bosubi(br, r0, im) _bosubi(_jit, br, r0, im)
552 static jit_word_t _bosubr(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
553 static jit_word_t _bosubi(jit_state_t*,jit_word_t,jit_int32_t,jit_word_t);
554 # define bosubr_u(br, r0, r1) _bosubr_u(_jit, br, r0, r1)
555 # define bosubi_u(br, r0, im) _bosubi_u(_jit, br, r0, im)
556 static jit_word_t _bosubr_u(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
557 static jit_word_t _bosubi_u(jit_state_t*,jit_word_t,jit_int32_t,jit_word_t);
558 # define bxsubr(br, r0, r1) _bxsubr(_jit, br, r0, r1)
559 # define bxsubi(br, r0, im) _bxsubi(_jit, br, r0, im)
560 static jit_word_t _bxsubr(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
561 static jit_word_t _bxsubi(jit_state_t*,jit_word_t,jit_int32_t,jit_word_t);
562 # define bxsubr_u(br, r0, r1) _bxsubr_u(_jit, br, r0, r1)
563 # define bxsubi_u(br, r0, im) _bxsubi_u(_jit, br, r0, im)
564 static jit_word_t _bxsubr_u(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
565 static jit_word_t _bxsubi_u(jit_state_t*,jit_word_t,jit_int32_t,jit_word_t);
566 # define bmsr(br, r0, r1) _bmsr(_jit, br, r0, r1)
567 # define bmsi(br, r0, im) _bmsi(_jit, br, r0, im)
568 static jit_word_t _bmsr(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
569 static jit_word_t _bmsi(jit_state_t*,jit_word_t,jit_int32_t,jit_word_t);
570 # define bmcr(br, r0, r1) _bmcr(_jit, br, r0, r1)
571 # define bmci(br, r0, im) _bmci(_jit, br, r0, im)
572 static jit_word_t _bmcr(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
573 static jit_word_t _bmci(jit_state_t*,jit_word_t,jit_int32_t,jit_word_t);
/* Jumps: jmpr is a JALR through r0 with _ZERO_REGNO as destination and
 * offset 0. jmpi returns nothing; jmpi_p returns a jit_word_t. */
574 # define jmpr(r0) JALR(_ZERO_REGNO, r0, 0)
575 # define jmpi(im) _jmpi(_jit, im)
576 static void _jmpi(jit_state_t*,jit_word_t);
577 # define jmpi_p(im) _jmpi_p(_jit, im)
578 static jit_word_t _jmpi_p(jit_state_t*,jit_word_t);
/* Calls: callr is the same JALR with _RA_REGNO as destination. calli
 * returns nothing; calli_p returns a jit_word_t. */
579 # define callr(r0) JALR(_RA_REGNO, r0, 0)
580 # define calli(im) _calli(_jit, im)
581 static void _calli(jit_state_t*,jit_word_t);
582 # define calli_p(im) _calli_p(_jit, im)
583 static jit_word_t _calli_p(jit_state_t*,jit_word_t);
/* Function prolog/epilog emitters, each taking a jit_node_t pointer. */
584 # define prolog(i0) _prolog(_jit,i0)
585 static void _prolog(jit_state_t*,jit_node_t*);
586 # define epilog(i0) _epilog(_jit,i0)
587 static void _epilog(jit_state_t*,jit_node_t*);
/* Variadic-argument support: vastart takes one register, vaarg two. */
588 # define vastart(r0) _vastart(_jit, r0)
589 static void _vastart(jit_state_t*, jit_int32_t);
590 # define vaarg(r0, r1) _vaarg(_jit, r0, r1)
591 static void _vaarg(jit_state_t*, jit_int32_t, jit_int32_t);
/* patch_abs and patch_at are two names for the same helper, _patch_at. */
592 #define patch_abs(instr,label) _patch_at(_jit,instr,label)
593 #define patch_at(instr,label) _patch_at(_jit,instr,label)
594 static void _patch_at(jit_state_t*,jit_word_t,jit_word_t);
599 _Rtype(jit_state_t *_jit, jit_int32_t op, jit_int32_t rd,
600 jit_int32_t fct, jit_int32_t rs1, jit_int32_t rs2, jit_int32_t fct2)
603 assert(!(op & ~0x7f));
604 assert(!(rd & ~0x1f));
605 assert(!(fct & ~0x07));
606 assert(!(rs1 & ~0x1f));
607 assert(!(rs2 & ~0x1f));
608 assert(!(fct2 & ~0x7f));
619 _R4type(jit_state_t *_jit, jit_int32_t op, jit_int32_t rd, jit_int32_t fct,
620 jit_int32_t rs1, jit_int32_t rs2, jit_int32_t fct2, jit_int32_t rs3)
623 assert(!(op & ~0x7f));
624 assert(!(rd & ~0x1f));
625 assert(!(fct & ~0x07));
626 assert(!(rs1 & ~0x1f));
627 assert(!(rs2 & ~0x1f));
628 assert(!(fct2 & ~0x03));
629 assert(!(rs3 & ~0x1f));
641 _Itype(jit_state_t *_jit, jit_int32_t op, jit_int32_t rd,
642 jit_int32_t fct, jit_int32_t rs1, jit_int32_t imm)
645 assert(!(op & ~0x7f));
646 assert(!(rd & ~0x1f));
647 assert(!(fct & ~0x07));
648 assert(!(rs1 & ~0x1f));
649 assert(simm12_p(imm));
658 # if __WORDSIZE == 64
660 _IStype(jit_state_t *_jit, jit_int32_t op, jit_int32_t rd,
661 jit_int32_t fct, jit_int32_t rs1, jit_int32_t sh, jit_int32_t imm)
664 assert(!(op & ~0x7f));
665 assert(!(rd & ~0x1f));
666 assert(!(fct & ~0x07));
667 assert(!(rs1 & ~0x1f));
668 assert(!(sh & ~0x3f));
669 assert(simm6_p(imm));
681 _Stype(jit_state_t *_jit, jit_int32_t op, jit_int32_t fct,
682 jit_int32_t rs1, jit_int32_t rs2, jit_int32_t imm)
685 assert(!(op & ~0x7f));
686 assert(!(fct & ~0x07));
687 assert(!(rs1 & ~0x1f));
688 assert(!(rs2 & ~0x1f));
689 assert(simm12_p(imm));
691 i.S.imm4_0 = imm & 0x1f;
695 i.S.imm11_5 = (imm >> 5) & 0x7f;
700 _Btype(jit_state_t *_jit, jit_int32_t op, jit_int32_t fct,
701 jit_int32_t rs1, jit_int32_t rs2, jit_int32_t imm)
704 assert(!(op & ~0x7f));
705 assert(!(fct & ~0x07));
706 assert(!(rs1 & ~0x1f));
707 assert(!(rs2 & ~0x1f));
708 assert(!(imm & 1) && simm12_p(imm));
710 i.B.imm11 = (imm >> 11) & 0x1;
711 i.B.imm4_1 = (imm >> 1) & 0xf;
715 i.B.imm10_5 = (imm >> 5) & 0x3f;
716 i.B.imm12 = (imm >> 12) & 0x1;
721 _Utype(jit_state_t *_jit, jit_int32_t op, jit_int32_t rd, jit_int32_t imm)
724 assert(!(op & ~0x7f));
725 assert(!(rd & ~0x1f));
726 assert(simm20_p(imm));
734 _Jtype(jit_state_t *_jit, jit_int32_t op, jit_int32_t rd, jit_int32_t imm)
737 assert(!(op & ~0x7f));
738 assert(!(rd & ~0x1f));
739 assert(!(imm & 1) && imm <= 1048575 && imm >= -1048576);
742 i.J.imm19_12= (imm >> 12) & 0xff;
743 i.J.imm11 = (imm >> 11) & 0x1;
744 i.J.imm10_1 = (imm >> 1) & 0x3ff;
745 i.J.imm20 = (imm >> 20) & 0x1;
750 _nop(jit_state_t *_jit, jit_int32_t im)
752 for (; im > 0; im -= 4)
758 _addi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
764 t0 = jit_get_reg(jit_class_gpr);
766 addr(r0, r1, rn(t0));
772 _addcr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
775 if (jit_carry == _NOREG)
776 jit_carry = jit_get_reg(jit_class_gpr);
778 t0 = jit_get_reg(jit_class_gpr);
779 addr(rn(t0), r1, r2);
780 SLTU(rn(jit_carry), rn(t0), r1);
786 SLTU(rn(jit_carry), r0, r1);
/* Immediate form of add-with-carry-out: same carry rule as the register
 * form, (sum <u r1), written to jit_carry (allocated on first use).  The
 * scratch variant presumably handles r0 aliasing r1 -- TODO confirm. */
791 _addci(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
794 if (jit_carry == _NOREG)
795 jit_carry = jit_get_reg(jit_class_gpr);
797 t0 = jit_get_reg(jit_class_gpr);
798 addi(rn(t0), r1, i0);
799 SLTU(rn(jit_carry), rn(t0), r1);
805 SLTU(rn(jit_carry), r0, r1);
/* Add with carry-in.  A carry register must already exist (asserted).  The
 * incoming carry is copied to scratch t0 and folded in with a final addcr();
 * presumably the copy is needed because an intervening add rewrites
 * jit_carry -- TODO confirm. */
810 _addxr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
813 assert(jit_carry != _NOREG);
814 t0 = jit_get_reg(jit_class_gpr);
815 movr(rn(t0), rn(jit_carry));
817 addcr(r0, r0, rn(t0));
/* Immediate form of add with carry-in: asserts a carry register exists,
 * snapshots it into scratch t0, and folds it in with a final addcr(). */
822 _addxi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
825 assert(jit_carry != _NOREG);
826 t0 = jit_get_reg(jit_class_gpr);
827 movr(rn(t0), rn(jit_carry));
829 addcr(r0, r0, rn(t0));
/* r0 = r1 - i0.  Register fallback: scratch GPR t0 feeds subr().
 * NOTE(review): t0 is presumably loaded with i0 first, and a short-immediate
 * path presumably precedes this one -- confirm. */
834 _subi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
840 t0 = jit_get_reg(jit_class_gpr);
842 subr(r0, r1, rn(t0));
/* Subtract registers and record the borrow in jit_carry (allocated on first
 * use).  The borrow is computed as (r1 <u difference).  The scratch variant
 * presumably handles r0 aliasing r1 -- TODO confirm. */
848 _subcr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
851 if (jit_carry == _NOREG)
852 jit_carry = jit_get_reg(jit_class_gpr);
854 t0 = jit_get_reg(jit_class_gpr);
855 subr(rn(t0), r1, r2);
856 SLTU(rn(jit_carry), r1, rn(t0));
862 SLTU(rn(jit_carry), r1, r0);
/* Immediate form of subtract-with-borrow-out: borrow is (r1 <u difference),
 * written to jit_carry (allocated on first use).  The scratch variant
 * presumably handles r0 aliasing r1 -- TODO confirm. */
867 _subci(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
870 if (jit_carry == _NOREG)
871 jit_carry = jit_get_reg(jit_class_gpr);
873 t0 = jit_get_reg(jit_class_gpr);
874 subi(rn(t0), r1, i0);
875 SLTU(rn(jit_carry), r1, rn(t0));
881 SLTU(rn(jit_carry), r1, r0);
/* Subtract with borrow-in.  A carry register must already exist (asserted);
 * its value is copied to scratch t0 and subtracted last through subcr(). */
886 _subxr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
889 assert(jit_carry != _NOREG);
890 t0 = jit_get_reg(jit_class_gpr);
891 movr(rn(t0), rn(jit_carry));
893 subcr(r0, r0, rn(t0));
/* Immediate form of subtract with borrow-in: asserts a carry register
 * exists, snapshots it into scratch t0, and subtracts it last via subcr(). */
898 _subxi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
901 assert(jit_carry != _NOREG);
902 t0 = jit_get_reg(jit_class_gpr);
903 movr(rn(t0), rn(jit_carry));
905 subcr(r0, r0, rn(t0));
/* Reverse subtract with immediate (presumably r0 = i0 - r1, going by the
 * "rsb" naming -- TODO confirm). */
910 _rsbi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
/* Multiply by immediate: done as mulr() against scratch GPR t0 (presumably
 * loaded with i0 first -- confirm). */
917 _muli(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
920 t0 = jit_get_reg(jit_class_gpr);
922 mulr(r0, r1, rn(t0));
/* Signed divide by immediate: done as divr() against scratch GPR t0
 * (presumably loaded with i0 first -- confirm). */
927 _divi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
930 t0 = jit_get_reg(jit_class_gpr);
932 divr(r0, r1, rn(t0));
/* Unsigned divide by immediate: done as divr_u() against scratch GPR t0
 * (presumably loaded with i0 first -- confirm). */
937 _divi_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
940 t0 = jit_get_reg(jit_class_gpr);
942 divr_u(r0, r1, rn(t0));
/* Signed remainder by immediate: done as remr() against scratch GPR t0
 * (presumably loaded with i0 first -- confirm). */
947 _remi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
950 t0 = jit_get_reg(jit_class_gpr);
952 remr(r0, r1, rn(t0));
/* Unsigned remainder by immediate: done as remr_u() against scratch GPR t0
 * (presumably loaded with i0 first -- confirm). */
957 _remi_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
960 t0 = jit_get_reg(jit_class_gpr);
962 remr_u(r0, r1, rn(t0));
/* Two-result multiply of r2 by r3 into the pair (r0, r1) (presumably low and
 * high words, signed -- TODO confirm).  When r0 aliases an input, the mulr()
 * product is parked in scratch t0 so the operands stay intact; the second
 * alias test presumably copies t0 into r0 and releases it. */
967 _qmulr(jit_state_t *_jit, jit_int32_t r0,
968 jit_int32_t r1, jit_int32_t r2, jit_int32_t r3)
971 if (r0 == r2 || r0 == r3) {
972 t0 = jit_get_reg(jit_class_gpr);
973 mulr(rn(t0), r2, r3);
978 if (r0 == r2 || r0 == r3) {
/* Immediate form of qmulr(): scratch GPR t0 (presumably loaded with i0 --
 * confirm) stands in for the second operand. */
985 _qmuli(jit_state_t *_jit, jit_int32_t r0,
986 jit_int32_t r1, jit_int32_t r2, jit_word_t i0)
989 t0 = jit_get_reg(jit_class_gpr);
991 qmulr(r0, r1, r2, rn(t0));
/* Unsigned counterpart of qmulr(), with the same aliasing strategy: when r0
 * is also an input, the mulr() product is parked in scratch t0; the second
 * alias test presumably copies t0 into r0 -- TODO confirm. */
996 _qmulr_u(jit_state_t *_jit, jit_int32_t r0,
997 jit_int32_t r1, jit_int32_t r2, jit_int32_t r3)
1000 if (r0 == r2 || r0 == r3) {
1001 t0 = jit_get_reg(jit_class_gpr);
1002 mulr(rn(t0), r2, r3);
1007 if (r0 == r2 || r0 == r3) {
/* Immediate form of qmulr_u(): scratch GPR t0 (presumably loaded with i0 --
 * confirm) stands in for the second operand. */
1014 _qmuli_u(jit_state_t *_jit, jit_int32_t r0,
1015 jit_int32_t r1, jit_int32_t r2, jit_word_t i0)
1018 t0 = jit_get_reg(jit_class_gpr);
1020 qmulr_u(r0, r1, r2, rn(t0));
/* Shared helper for the two-result divide of r2 by r3 into (r0, r1); sign
 * presumably selects the signed or unsigned instructions (divr_u below is
 * the unsigned quotient).  rg0/rg1 are the registers actually written:
 * scratch sv0/sv1 are allocated when r0 or r1 aliases an input. */
1025 _iqdivr(jit_state_t *_jit, jit_bool_t sign,
1026 jit_int32_t r0, jit_int32_t r1, jit_int32_t r2, jit_int32_t r3)
1028 jit_int32_t sv0, rg0;
1029 jit_int32_t sv1, rg1;
1030 if (r0 == r2 || r0 == r3) {
1031 sv0 = jit_get_reg(jit_class_gpr);
1036 if (r1 == r2 || r1 == r3) {
1037 sv1 = jit_get_reg(jit_class_gpr);
1045 divr_u(rg0, r2, r3);
/* Immediate form of qdivr(): scratch GPR t0 (presumably loaded with i0 --
 * confirm) stands in for the divisor. */
1059 _qdivi(jit_state_t *_jit, jit_int32_t r0,
1060 jit_int32_t r1, jit_int32_t r2, jit_word_t i0)
1063 t0 = jit_get_reg(jit_class_gpr);
1065 qdivr(r0, r1, r2, rn(t0));
/* Immediate form of qdivr_u(): scratch GPR t0 (presumably loaded with i0 --
 * confirm) stands in for the divisor. */
1070 _qdivi_u(jit_state_t *_jit, jit_int32_t r0,
1071 jit_int32_t r1, jit_int32_t r2, jit_word_t i0)
1074 t0 = jit_get_reg(jit_class_gpr);
1076 qdivr_u(r0, r1, r2, rn(t0));
/* Shift left by a constant.  The assert restricts the shift amount to 1..63
 * (a zero shift is presumably handled before reaching it -- confirm). */
1081 _lshi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1086 assert(i0 > 0 && i0 < 64);
/* Shift right by a constant (presumably arithmetic, given the separate _u
 * variant).  The assert restricts the shift amount to 1..63. */
1092 _rshi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1097 assert(i0 > 0 && i0 < 64);
/* Unsigned (presumably logical) shift right by a constant.  The assert
 * restricts the shift amount to 1..63. */
1103 _rshi_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1108 assert(i0 > 0 && i0 < 64);
/* Bitwise AND with immediate.  Register fallback: scratch GPR t0 (presumably
 * loaded with i0 when it does not fit an immediate -- confirm) feeds andr(). */
1114 _andi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1120 t0 = jit_get_reg(jit_class_gpr);
1122 andr(r0, r1, rn(t0));
/* Bitwise OR with immediate.  Register fallback: scratch GPR t0 (presumably
 * loaded with i0 when it does not fit an immediate -- confirm) feeds orr(). */
1128 _ori(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1134 t0 = jit_get_reg(jit_class_gpr);
1136 orr(r0, r1, rn(t0));
/* Bitwise XOR with immediate.  Register fallback: scratch GPR t0 (presumably
 * loaded with i0 when it does not fit an immediate -- confirm) feeds xorr(). */
1142 _xori(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1148 t0 = jit_get_reg(jit_class_gpr);
1150 xorr(r0, r1, rn(t0));
/* DEFLD(T, O) generates the three addressed-load helpers for type suffix T,
 * using load instruction L<O>:
 *   ldi_T  - absolute address: a direct L<O> off the zero register, else the
 *            address goes through scratch t0 and ldr_T (the direct form is
 *            presumably guarded by an immediate-range test -- confirm);
 *   ldxr_T - base + index: t0 = r1 + r2, then ldr_T;
 *   ldxi_T - base + offset fallback: t0 = r1 + i0, then ldr_T.
 * Each scratch register is released with jit_unget_reg() after the load. */
1155 # define DEFLD(T,O) \
1157 _ldi_##T(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0) \
1160 L##O(r0, _ZERO_REGNO, i0); \
1163 t0 = jit_get_reg(jit_class_gpr); \
1165 ldr_##T(r0, rn(t0)); \
1166 jit_unget_reg(t0); \
1171 _ldxr_##T(jit_state_t *_jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)\
1174 t0 = jit_get_reg(jit_class_gpr); \
1175 addr(rn(t0), r1, r2); \
1176 ldr_##T(r0, rn(t0)); \
1177 jit_unget_reg(t0); \
1181 _ldxi_##T(jit_state_t *_jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)\
1187 t0 = jit_get_reg(jit_class_gpr); \
1188 addi(rn(t0), r1, i0); \
1189 ldr_##T(r0, rn(t0)); \
1190 jit_unget_reg(t0); \
/* DEFST(T, O) generates the three addressed-store helpers for type suffix T,
 * using store instruction S<O>:
 *   sti_T  - absolute address: a direct S<O> off the zero register, else the
 *            address goes through scratch t0 and str_T (the direct form is
 *            presumably guarded by an immediate-range test -- confirm);
 *   stxr_T - base + index: t0 = r0 + r1, then str_T of r2;
 *   stxi_T - base + offset fallback: t0 = r0 + i0, then str_T of r1.
 * Each scratch register is released with jit_unget_reg() after the store. */
1202 # define DEFST(T, O) \
1204 _sti_##T(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0) \
1207 S##O(_ZERO_REGNO, r0, i0); \
1210 t0 = jit_get_reg(jit_class_gpr); \
1212 str_##T(rn(t0), r0); \
1213 jit_unget_reg(t0); \
1218 _stxr_##T(jit_state_t *_jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)\
1221 t0 = jit_get_reg(jit_class_gpr); \
1222 addr(rn(t0), r0, r1); \
1223 str_##T(rn(t0), r2); \
1224 jit_unget_reg(t0); \
1228 _stxi_##T(jit_state_t *_jit,jit_word_t i0,jit_int32_t r0,jit_int32_t r1)\
1234 t0 = jit_get_reg(jit_class_gpr); \
1235 addi(rn(t0), r0, i0); \
1236 str_##T(rn(t0), r1); \
1237 jit_unget_reg(t0); \
/* 16-bit host-to-network conversion: byte 1 of r1 is isolated in scratch t0
 * (shift right 8, mask 0xff) and OR-ed into r0, which presumably already
 * holds the low byte moved up by 8 -- TODO confirm. */
1247 _htonr_us(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
1250 t0 = jit_get_reg(jit_class_gpr);
1251 rshi(rn(t0), r1, 8);
1253 andi(rn(t0), rn(t0), 0xff);
1255 orr(r0, r0, rn(t0));
/* 32-bit host-to-network conversion using three scratch registers. */
1260 _htonr_ui(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
1265 t0 = jit_get_reg(jit_class_gpr);
1266 t1 = jit_get_reg(jit_class_gpr);
1267 t2 = jit_get_reg(jit_class_gpr);
/* Isolate source bytes 3, 2 and 1 in t0, t1 and t2 respectively. */
1268 rshi(rn(t0), r1, 24);
1269 rshi(rn(t1), r1, 16);
1270 rshi(rn(t2), r1, 8);
1271 andi(rn(t0), rn(t0), 0xff);
1272 andi(rn(t1), rn(t1), 0xff);
1273 andi(rn(t2), rn(t2), 0xff);
/* Reposition them (t0 stays at bit 0, t1 moves to bit 8, t2 to bit 16) and
 * merge into r0, which presumably already holds byte 0 in its new slot. */
1276 lshi(rn(t1), rn(t1), 8);
1277 orr(r0, r0, rn(t0));
1278 lshi(rn(t2), rn(t2), 16);
1279 orr(r0, r0, rn(t1));
1280 orr(r0, r0, rn(t2));
/* 64-bit host-to-network conversion built from two 32-bit swaps: the upper
 * half of r1 is moved down into scratch t0, byte-swapped with htonr_ui() and
 * OR-ed into r0 (presumably the swapped lower half moved up by 32 -- TODO
 * confirm). */
1287 _htonr_ul(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
1290 t0 = jit_get_reg(jit_class_gpr);
1291 rshi_u(rn(t0), r1, 32);
1293 htonr_ui(rn(t0), rn(t0));
1295 orr(r0, r0, rn(t0));
/* Presumably sign-extends the low 8 bits of r1 into r0 -- TODO confirm. */
1300 _extr_c(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
/* Presumably sign-extends the low 16 bits of r1 into r0 -- TODO confirm. */
1307 _extr_s(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
/* Presumably zero-extends the low 16 bits of r1 into r0 -- TODO confirm. */
1314 _extr_us(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
/* Presumably zero-extends the low 32 bits of r1 into r0 -- TODO confirm. */
1321 _extr_ui(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
/* Load the constant i0 into r0, choosing the sequence by the size of i0. */
1328 _movi(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
/* 32-bit case: lo is the sign-extended low 12 bits, hi the remainder (a
 * multiple of 4096).
 * NOTE(review): "<< 20" on a negative signed value is undefined behaviour in
 * ISO C; this relies on the compiler's arithmetic-shift behaviour. */
1331 jit_int32_t lo = (jit_int32_t)i0 << 20 >> 20;
1332 jit_int32_t hi = i0 - lo;
1339 ADDIW(r0, _ZERO_REGNO, lo);
/* 64-bit case: lo is the sign-extended low 32 bits; the remaining upper
 * word is built in scratch t0 by a recursive movi(), moved up by 32 and
 * added to r0 (presumably r0 has been loaded with lo by then -- confirm). */
1342 jit_int32_t lo = i0 << 32 >> 32;
1343 jit_word_t hi = i0 - lo;
1344 jit_int32_t t0 = jit_get_reg(jit_class_gpr);
1345 movi(rn(t0), (jit_int32_t)(hi >> 32));
1347 lshi(rn(t0), rn(t0), 32);
1348 addr(r0, r0, rn(t0));
/* Load an address-sized constant into r0 with explicit LUI/ADDIW/SLLI/ADD
 * instructions (presumably a fixed-length sequence so the value can be
 * patched later -- TODO confirm). */
1354 _movi_p(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
/* ww = low 32 bits of i0, split into a sign-extended 12-bit lo and the rest.
 * NOTE(review): these left shifts operate on signed values. */
1358 jit_int32_t ww = i0 << 32 >> 32;
1359 jit_int32_t lo = ww << 20 >> 20;
1360 jit_int32_t hi = ww - lo;
1362 t0 = jit_get_reg(jit_class_gpr);
/* Second 32-bit word: built in t0 the same way, moved up by 32 and added. */
1366 lo = ww << 20 >> 20;
1368 LUI(rn(t0), hi >> 12);
1369 ADDIW(rn(t0), rn(t0), lo);
1370 SLLI(rn(t0), rn(t0), 32);
1371 ADD(r0, r0, rn(t0));
/* r0 = (r1 < i0), signed.  Register fallback: scratch t0 (presumably loaded
 * with i0 when it does not fit an immediate -- confirm) feeds ltr(). */
1377 _lti(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1383 t0 = jit_get_reg(jit_class_gpr);
1385 ltr(r0, r1, rn(t0));
/* r0 = (r1 < i0), unsigned.  Register fallback: scratch t0 (presumably
 * loaded with i0 when it does not fit an immediate -- confirm) feeds
 * ltr_u(). */
1391 _lti_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1397 t0 = jit_get_reg(jit_class_gpr);
1399 ltr_u(r0, r1, rn(t0));
/* Presumably r0 = (r1 <= r2), signed -- TODO confirm. */
1405 _ler(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
/* r0 = (r1 <= i0), signed.  The SLT against the zero register computes
 * (0 < r1) (presumably the i0 == 0 special case, inverted afterwards --
 * TODO confirm); otherwise scratch t0 feeds ler(). */
1412 _lei(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1416 SLT(r0, _ZERO_REGNO, r1);
1420 t0 = jit_get_reg(jit_class_gpr);
1422 ler(r0, r1, rn(t0));
/* Presumably r0 = (r1 <= r2), unsigned -- TODO confirm. */
1428 _ler_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
/* r0 = (r1 <= i0), unsigned.  The SLTU against the zero register computes
 * (r1 != 0) (presumably the i0 == 0 special case, inverted afterwards --
 * TODO confirm); otherwise scratch t0 feeds ler_u(). */
1435 _lei_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1439 SLTU(r0, _ZERO_REGNO, r1);
1443 t0 = jit_get_reg(jit_class_gpr);
1445 ler_u(r0, r1, rn(t0));
/* Register equality test.  SLTU against the zero register collapses r0 to
 * (r0 != 0); r0 presumably holds the difference of the operands before, and
 * the flag is presumably inverted after -- TODO confirm. */
1451 _eqr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1454 SLTU(r0, _ZERO_REGNO, r0);
/* Equality test against an immediate.  Both shapes reduce a value to a
 * "non-zero" flag with SLTU against the zero register: one on r0 (presumably
 * r1 - i0), one directly on r1 (presumably when i0 == 0); the final
 * inversion is presumably applied after -- TODO confirm. */
1459 _eqi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1463 SLTU(r0, _ZERO_REGNO, r0);
1466 SLTU(r0, _ZERO_REGNO, r1);
/* Presumably r0 = (r1 >= r2), signed -- TODO confirm. */
1471 _ger(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
/* r0 = (r1 >= i0), signed: scratch t0 (presumably loaded with i0 -- confirm)
 * feeds ger(). */
1478 _gei(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1481 t0 = jit_get_reg(jit_class_gpr);
1483 ger(r0, r1, rn(t0));
/* Presumably r0 = (r1 >= r2), unsigned -- TODO confirm. */
1488 _ger_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
/* r0 = (r1 >= i0), unsigned: scratch t0 (presumably loaded with i0 --
 * confirm) feeds ger_u(). */
1495 _gei_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1498 t0 = jit_get_reg(jit_class_gpr);
1500 ger_u(r0, r1, rn(t0));
/* r0 = (r1 > i0), signed, expressed as "t0 < r1" with the operands of ltr()
 * swapped; t0 is presumably loaded with i0 -- confirm. */
1505 _gti(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1508 t0 = jit_get_reg(jit_class_gpr);
1510 ltr(r0, rn(t0), r1);
/* r0 = (r1 > i0), unsigned, expressed as "t0 < r1" with the operands of
 * ltr_u() swapped; t0 is presumably loaded with i0 -- confirm. */
1515 _gti_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1518 t0 = jit_get_reg(jit_class_gpr);
1520 ltr_u(r0, rn(t0), r1);
/* Register inequality test.  SLTU against the zero register collapses r0 to
 * (r0 != 0); r0 presumably holds the difference of the operands at that
 * point -- TODO confirm. */
1525 _ner(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1528 SLTU(r0, _ZERO_REGNO, r0);
/* Inequality test against an immediate.  Both shapes end in SLTU against the
 * zero register: one on r0 (presumably r1 - i0), one directly on r1
 * (presumably when i0 == 0) -- TODO confirm. */
1532 _nei(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1536 SLTU(r0, _ZERO_REGNO, r0);
1539 SLTU(r0, _ZERO_REGNO, r1);
/* Branch to br if r0 < r1 (signed).  The displacement is br - w, where w is
 * presumably the address of the branch instruction itself -- confirm. */
1543 _bltr(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_int32_t r1)
1547 BLT(r0, r1, br - w);
/* Immediate form of bltr(): compares against a non-spillable scratch GPR
 * (presumably loaded with i0 -- confirm) and keeps bltr()'s return in w. */
1552 _blti(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_word_t i0)
1556 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
1558 w = bltr(br, r0, rn(t0));
/* Branch to br if r0 < r1 (unsigned).  The displacement is br - w, where w is
 * presumably the address of the branch instruction itself -- confirm. */
1564 _bltr_u(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_int32_t r1)
1568 BLTU(r0, r1, br - w);
/* Immediate form of bltr_u(): compares against a non-spillable scratch GPR
 * (presumably loaded with i0 -- confirm) and keeps bltr_u()'s return in w. */
1573 _blti_u(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_word_t i0)
1577 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
1579 w = bltr_u(br, r0, rn(t0));
/* Branch to br if r0 <= r1 (signed), encoded as BGE with the operands
 * swapped (r1 >= r0). */
1585 _bler(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_int32_t r1)
1589 BGE(r1, r0, br - w);
/* Immediate form of bler(): compares against a non-spillable scratch GPR
 * (presumably loaded with i0 -- confirm) and keeps bler()'s return in w. */
1594 _blei(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_word_t i0)
1598 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
1600 w = bler(br, r0, rn(t0));
/* Branch to br if r0 <= r1 (unsigned), encoded as BGEU with the operands
 * swapped (r1 >= r0). */
1606 _bler_u(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_int32_t r1)
1610 BGEU(r1, r0, br - w);
/* Immediate form of bler_u(): compares against a non-spillable scratch GPR
 * (presumably loaded with i0 -- confirm) and keeps bler_u()'s return in w. */
1615 _blei_u(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_word_t i0)
1619 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
1621 w = bler_u(br, r0, rn(t0));
/* Branch to br if r0 == r1, using a single BEQ with displacement br - w. */
1627 _beqr(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_int32_t r1)
1631 BEQ(r1, r0, br - w);
/* Immediate form of beqr(): compares against a non-spillable scratch GPR
 * (presumably loaded with i0 -- confirm) and keeps beqr()'s return in w. */
1636 _beqi(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_word_t i0)
1640 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
1642 w = beqr(br, r0, rn(t0));
/* Branch to br if r0 >= r1 (signed), using a single BGE with displacement
 * br - w. */
1648 _bger(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_int32_t r1)
1652 BGE(r0, r1, br - w);
/* Immediate form of bger(): compares against a non-spillable scratch GPR
 * (presumably loaded with i0 -- confirm) and keeps bger()'s return in w. */
1657 _bgei(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_word_t i0)
1661 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
1663 w = bger(br, r0, rn(t0));
/* Branch to br if r0 >= r1 (unsigned), using a single BGEU with displacement
 * br - w. */
1669 _bger_u(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_int32_t r1)
1673 BGEU(r0, r1, br - w);
/* Immediate form of bger_u(): compares against a non-spillable scratch GPR
 * (presumably loaded with i0 -- confirm) and keeps bger_u()'s return in w. */
1678 _bgei_u(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_word_t i0)
1682 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
1684 w = bger_u(br, r0, rn(t0));
/* Branch to br if r0 > r1 (signed), encoded as BLT with the operands swapped
 * (r1 < r0). */
1690 _bgtr(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_int32_t r1)
1694 BLT(r1, r0, br - w);
/* Immediate form of bgtr(): compares against a non-spillable scratch GPR
 * (presumably loaded with i0 -- confirm) and keeps bgtr()'s return in w. */
1699 _bgti(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_word_t i0)
1703 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
1705 w = bgtr(br, r0, rn(t0));
/* Branch to br if r0 > r1 (unsigned), encoded as BLTU with the operands
 * swapped (r1 < r0). */
1711 _bgtr_u(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_int32_t r1)
1715 BLTU(r1, r0, br - w);
/* Immediate form of bgtr_u(): compares against a non-spillable scratch GPR
 * (presumably loaded with i0 -- confirm) and keeps bgtr_u()'s return in w. */
1720 _bgti_u(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_word_t i0)
1724 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
1726 w = bgtr_u(br, r0, rn(t0));
/* Branch to br if r0 != r1, using a single BNE with displacement br - w. */
1732 _bner(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_int32_t r1)
1736 BNE(r1, r0, br - w);
/* Immediate form of bner(): compares against a non-spillable scratch GPR
 * (presumably loaded with i0 -- confirm) and keeps bner()'s return in w. */
1741 _bnei(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_word_t i0)
1745 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
1747 w = bner(br, r0, rn(t0));
/* Signed add, branching to br when the addition overflows.  t0 records the
 * sign of r1 and t1 the pre-add value of r0 (per the inline comment); a
 * small internal diamond picks the comparison matching that sign and leaves
 * the overflow flag in t1. */
1753 _boaddr(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_int32_t r1)
1757 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
1758 t1 = jit_get_reg(jit_class_gpr|jit_class_nospill);
/* t0 = (r1 < 0) */
1760 SLT(rn(t0), r1, _ZERO_REGNO);
1765 /* overflow = r1 < 0 ? t1 < r0 : r0 < t1 */
/* Forward branch with a placeholder target, patched below. */
1767 BNE(rn(t0), _ZERO_REGNO, 0);
/* r1 >= 0 side: overflow if the new value is below the old one. */
1769 SLT(rn(t1), r0, rn(t1));
/* Skip over the other side; placeholder target, patched below. */
1771 JAL(_ZERO_REGNO, 0);
1773 patch_at(w, _jit->pc.w);
/* r1 < 0 side: overflow if the old value is below the new one. */
1774 SLT(rn(t1), rn(t1), r0);
1776 patch_at(jal, _jit->pc.w);
/* Take the user branch when the overflow flag is set. */
1778 BNE(rn(t1), _ZERO_REGNO, br - w);
/* Immediate form of boaddr(): the addend goes through a non-spillable
 * scratch GPR (presumably loaded with i0 -- confirm). */
1785 _boaddi(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_word_t i0)
1789 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
1791 w = boaddr(br, r0, rn(t0));
/* Unsigned add, branching to br on carry.  The sum is formed in scratch t0,
 * the carry is (sum <u r0) in t1, and the branch is taken when t1 != 0.
 * r0 is presumably updated from t0 before the branch -- confirm. */
1797 _boaddr_u(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_int32_t r1)
1801 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
1802 t1 = jit_get_reg(jit_class_gpr|jit_class_nospill);
1803 addr(rn(t0), r0, r1);
1804 SLTU(rn(t1), rn(t0), r0);
1807 BNE(_ZERO_REGNO, rn(t1), br - w);
/* Immediate form of boaddr_u(): the addend goes through a non-spillable
 * scratch GPR (presumably loaded with i0 -- confirm). */
1814 _boaddi_u(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_word_t i0)
1818 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
1820 w = boaddr_u(br, r0, rn(t0));
/* Signed add, branching to br when the addition does NOT overflow.  Same
 * overflow computation as the branch-on-overflow variant; only the final
 * branch condition is inverted (BEQ instead of BNE). */
1826 _bxaddr(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_int32_t r1)
1830 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
1831 t1 = jit_get_reg(jit_class_gpr|jit_class_nospill);
/* t0 = (r1 < 0) */
1833 SLT(rn(t0), r1, _ZERO_REGNO);
1838 /* overflow = r1 < 0 ? t1 < r0 : r0 < t1 */
/* Forward branch with a placeholder target, patched below. */
1840 BNE(rn(t0), _ZERO_REGNO, 0);
/* r1 >= 0 side. */
1842 SLT(rn(t1), r0, rn(t1));
/* Skip over the other side; placeholder target, patched below. */
1844 JAL(_ZERO_REGNO, 0);
1846 patch_at(w, _jit->pc.w);
/* r1 < 0 side. */
1847 SLT(rn(t1), rn(t1), r0);
1849 patch_at(jal, _jit->pc.w);
/* Take the user branch when the overflow flag is clear. */
1851 BEQ(rn(t1), _ZERO_REGNO, br - w);
/* Immediate form of bxaddr(): the addend goes through a non-spillable
 * scratch GPR (presumably loaded with i0 -- confirm). */
1858 _bxaddi(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_word_t i0)
1862 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
1864 w = bxaddr(br, r0, rn(t0));
/* Unsigned add, branching to br when there is NO carry.  The sum is formed
 * in scratch t0, the carry is (sum <u r0) in t1, and the branch is taken
 * when t1 == 0. */
1870 _bxaddr_u(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_int32_t r1)
1874 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
1875 t1 = jit_get_reg(jit_class_gpr|jit_class_nospill);
1876 addr(rn(t0), r0, r1);
1877 SLTU(rn(t1), rn(t0), r0);
1880 BEQ(_ZERO_REGNO, rn(t1), br - w);
/* Immediate form of bxaddr_u(): the addend goes through a non-spillable
 * scratch GPR (presumably loaded with i0 -- confirm). */
1887 _bxaddi_u(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_word_t i0)
1891 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
1893 w = bxaddr_u(br, r0, rn(t0));
/* Signed subtract, branching to br when the subtraction overflows.  t0
 * records whether r1 is positive and t1 presumably holds the pre-subtract
 * value of r0; an internal diamond picks the comparison matching that sign
 * and leaves the overflow flag in t1. */
1899 _bosubr(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_int32_t r1)
1903 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
1904 t1 = jit_get_reg(jit_class_gpr|jit_class_nospill);
/* t0 = (0 < r1) */
1906 SLT(rn(t0), _ZERO_REGNO, r1);
1911 /* overflow = 0 < r1 ? t1 < r0 : r0 < t1 */
/* Forward branch with a placeholder target, patched below. */
1913 BNE(rn(t0), _ZERO_REGNO, 0);
/* r1 <= 0 side: overflow if the new value is below the old one. */
1915 SLT(rn(t1), r0, rn(t1));
/* Skip over the other side; placeholder target, patched below. */
1917 JAL(_ZERO_REGNO, 0);
1919 patch_at(w, _jit->pc.w);
/* r1 > 0 side: overflow if the old value is below the new one. */
1920 SLT(rn(t1), rn(t1), r0);
1922 patch_at(jal, _jit->pc.w);
/* Take the user branch when the overflow flag is set. */
1924 BNE(rn(t1), _ZERO_REGNO, br - w);
/* Immediate form of bosubr(): the subtrahend goes through a non-spillable
 * scratch GPR (presumably loaded with i0 -- confirm). */
1931 _bosubi(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_word_t i0)
1935 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
1937 w = bosubr(br, r0, rn(t0));
/* Unsigned subtract, branching to br on borrow.  The difference is formed in
 * scratch t0, the borrow is (r0 <u difference) in t1, and the branch is
 * taken when t1 != 0.  r0 is presumably updated from t0 before the branch --
 * confirm. */
1943 _bosubr_u(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_int32_t r1)
1947 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
1948 t1 = jit_get_reg(jit_class_gpr|jit_class_nospill);
1949 subr(rn(t0), r0, r1);
1950 SLTU(rn(t1), r0, rn(t0));
1953 BNE(_ZERO_REGNO, rn(t1), br - w);
/* Immediate form of bosubr_u(): the subtrahend goes through a non-spillable
 * scratch GPR (presumably loaded with i0 -- confirm). */
1960 _bosubi_u(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_word_t i0)
1964 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
1966 w = bosubr_u(br, r0, rn(t0));
/* Signed subtract, branching to br when the subtraction does NOT overflow.
 * Same overflow computation as the branch-on-overflow variant; only the
 * final branch condition is inverted (BEQ instead of BNE). */
1972 _bxsubr(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_int32_t r1)
1976 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
1977 t1 = jit_get_reg(jit_class_gpr|jit_class_nospill);
/* t0 = (0 < r1) */
1979 SLT(rn(t0), _ZERO_REGNO, r1);
1984 /* overflow = 0 < r1 ? t1 < r0 : r0 < t1 */
/* Forward branch with a placeholder target, patched below. */
1986 BNE(rn(t0), _ZERO_REGNO, 0);
/* r1 <= 0 side. */
1988 SLT(rn(t1), r0, rn(t1));
/* Skip over the other side; placeholder target, patched below. */
1990 JAL(_ZERO_REGNO, 0);
1992 patch_at(w, _jit->pc.w);
/* r1 > 0 side. */
1993 SLT(rn(t1), rn(t1), r0);
1995 patch_at(jal, _jit->pc.w);
/* Take the user branch when the overflow flag is clear. */
1997 BEQ(rn(t1), _ZERO_REGNO, br - w);
/* Immediate form of bxsubr(): the subtrahend goes through a non-spillable
 * scratch GPR (presumably loaded with i0 -- confirm). */
2004 _bxsubi(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_word_t i0)
2008 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
2010 w = bxsubr(br, r0, rn(t0));
/* Unsigned subtract, branching to br when there is NO borrow.  The
 * difference is formed in scratch t0, the borrow is (r0 <u difference) in
 * t1, and the branch is taken when t1 == 0. */
2016 _bxsubr_u(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_int32_t r1)
2020 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
2021 t1 = jit_get_reg(jit_class_gpr|jit_class_nospill);
2022 subr(rn(t0), r0, r1);
2023 SLTU(rn(t1), r0, rn(t0));
2026 BEQ(_ZERO_REGNO, rn(t1), br - w);
/* Immediate form of bxsubr_u(): the subtrahend goes through a non-spillable
 * scratch GPR (presumably loaded with i0 -- confirm). */
2033 _bxsubi_u(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_word_t i0)
2037 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
2039 w = bxsubr_u(br, r0, rn(t0));
/* Branch if mask set: t0 = r0 & r1, and the branch to br is taken when the
 * result is non-zero (at least one common bit). */
2045 _bmsr(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_int32_t r1)
2049 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
2050 AND(rn(t0), r0, r1);
2052 BNE(_ZERO_REGNO, rn(t0), br - w);
/* Immediate form of bmsr(): the mask goes through a non-spillable scratch
 * GPR (presumably loaded with i0 -- confirm). */
2058 _bmsi(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_word_t i0)
2062 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
2064 w = bmsr(br, r0, rn(t0));
/* Branch if mask clear: t0 = r0 & r1, and the branch to br is taken when the
 * result is zero (no common bit). */
2070 _bmcr(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_int32_t r1)
2074 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
2075 AND(rn(t0), r0, r1);
2077 BEQ(_ZERO_REGNO, rn(t0), br - w);
/* Immediate form of bmcr(): the mask goes through a non-spillable scratch
 * GPR (presumably loaded with i0 -- confirm). */
2083 _bmci(jit_state_t *_jit, jit_word_t br, jit_int32_t r0, jit_word_t i0)
2087 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
2089 w = bmcr(br, r0, rn(t0));
/* Unconditional jump to absolute address i0.  The pc-relative displacement
 * is tried first with a JAL that discards the link (rd = zero register); the
 * scratch-register path is presumably the fallback for targets out of JAL
 * range -- TODO confirm. */
2095 _jmpi(jit_state_t *_jit, jit_word_t i0)
2099 dsp = i0 - _jit->pc.w;
2101 JAL(_ZERO_REGNO, dsp);
2103 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
/* Jump whose target is loaded with movi_p() into a non-spillable scratch
 * GPR; w keeps movi_p()'s return value (presumably the address of the load
 * sequence, for later patching -- confirm). */
2111 _jmpi_p(jit_state_t *_jit, jit_word_t i0)
2115 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
2116 w = movi_p(rn(t0), i0);
/* Call absolute address i0.  The pc-relative displacement is tried first
 * with a JAL linking into RA; the scratch-register path is presumably the
 * fallback for targets out of JAL range -- TODO confirm. */
2123 _calli(jit_state_t *_jit, jit_word_t i0)
2127 dsp = i0 - _jit->pc.w;
2129 JAL(_RA_REGNO, dsp);
2131 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
/* Call whose target is loaded with movi_p() into a non-spillable scratch
 * GPR; w keeps movi_p()'s return value (presumably the address of the load
 * sequence, for later patching -- confirm). */
2139 _calli_p(jit_state_t *_jit, jit_word_t i0)
2143 t0 = jit_get_reg(jit_class_gpr|jit_class_nospill);
2144 w = movi_p(rn(t0), i0);
/* Function prologue.  Finalises the frame bookkeeping for the current
 * function, then emits code that reserves stack_framesize bytes, saves RA,
 * FP and every callee-saved register flagged in the function's regset, sets
 * FP, and reserves the function's own stack area. */
2151 _prolog(jit_state_t *_jit, jit_node_t *node)
/* Explicit frame request: aoff must not already extend below -frame. */
2154 if (_jitc->function->define_frame || _jitc->function->assume_frame) {
2155 jit_int32_t frame = -_jitc->function->frame;
2156 assert(_jitc->function->self.aoff >= frame);
2157 if (_jitc->function->assume_frame)
2159 _jitc->function->self.aoff = frame;
/* With alloca in use, round aoff down to a 16-byte multiple. */
2161 if (_jitc->function->allocar)
2162 _jitc->function->self.aoff &= -16;
2163 _jitc->function->stack = ((_jitc->function->self.alen -
2164 /* align stack at 16 bytes */
2165 _jitc->function->self.aoff) + 15) & -16;
/* Save area layout from the new SP: RA at 0, FP at 8, integer callee-saved
 * registers at 16..96, floating-point callee-saved registers at 104..192. */
2166 subi(_SP_REGNO, _SP_REGNO, stack_framesize);
2167 stxi(0, _SP_REGNO, _RA_REGNO);
2168 stxi(8, _SP_REGNO, _FP_REGNO);
2169 if (jit_regset_tstbit(&_jitc->function->regset, _S1))
2170 stxi(16, _SP_REGNO, 9);
2171 if (jit_regset_tstbit(&_jitc->function->regset, _S2))
2172 stxi(24, _SP_REGNO, 18);
2173 if (jit_regset_tstbit(&_jitc->function->regset, _S3))
2174 stxi(32, _SP_REGNO, 19);
2175 if (jit_regset_tstbit(&_jitc->function->regset, _S4))
2176 stxi(40, _SP_REGNO, 20);
2177 if (jit_regset_tstbit(&_jitc->function->regset, _S5))
2178 stxi(48, _SP_REGNO, 21);
2179 if (jit_regset_tstbit(&_jitc->function->regset, _S6))
2180 stxi(56, _SP_REGNO, 22);
2181 if (jit_regset_tstbit(&_jitc->function->regset, _S7))
2182 stxi(64, _SP_REGNO, 23);
2183 if (jit_regset_tstbit(&_jitc->function->regset, _S8))
2184 stxi(72, _SP_REGNO, 24);
2185 if (jit_regset_tstbit(&_jitc->function->regset, _S9))
2186 stxi(80, _SP_REGNO, 25);
2187 if (jit_regset_tstbit(&_jitc->function->regset, _S10))
2188 stxi(88, _SP_REGNO, 26);
2189 if (jit_regset_tstbit(&_jitc->function->regset, _S11))
2190 stxi(96, _SP_REGNO, 27);
/* Floating-point saves use the same hardware numbers (8, 9, 18..27) in the
 * FP register file and are stored as doubles. */
2191 if (jit_regset_tstbit(&_jitc->function->regset, _FS0))
2192 stxi_d(104, _SP_REGNO, 8);
2193 if (jit_regset_tstbit(&_jitc->function->regset, _FS1))
2194 stxi_d(112, _SP_REGNO, 9);
2195 if (jit_regset_tstbit(&_jitc->function->regset, _FS2))
2196 stxi_d(120, _SP_REGNO, 18);
2197 if (jit_regset_tstbit(&_jitc->function->regset, _FS3))
2198 stxi_d(128, _SP_REGNO, 19);
2199 if (jit_regset_tstbit(&_jitc->function->regset, _FS4))
2200 stxi_d(136, _SP_REGNO, 20);
2201 if (jit_regset_tstbit(&_jitc->function->regset, _FS5))
2202 stxi_d(144, _SP_REGNO, 21);
2203 if (jit_regset_tstbit(&_jitc->function->regset, _FS6))
2204 stxi_d(152, _SP_REGNO, 22);
2205 if (jit_regset_tstbit(&_jitc->function->regset, _FS7))
2206 stxi_d(160, _SP_REGNO, 23);
2207 if (jit_regset_tstbit(&_jitc->function->regset, _FS8))
2208 stxi_d(168, _SP_REGNO, 24);
2209 if (jit_regset_tstbit(&_jitc->function->regset, _FS9))
2210 stxi_d(176, _SP_REGNO, 25);
2211 if (jit_regset_tstbit(&_jitc->function->regset, _FS10))
2212 stxi_d(184, _SP_REGNO, 26);
2213 if (jit_regset_tstbit(&_jitc->function->regset, _FS11))
2214 stxi_d(192, _SP_REGNO, 27);
/* FP points at the base of the save area; the function's own stack area
 * (already rounded to 16 bytes above) is carved out below it. */
2215 movr(_FP_REGNO, _SP_REGNO);
2216 if (_jitc->function->stack)
2217 subi(_SP_REGNO, _SP_REGNO, _jitc->function->stack);
/* Functions using alloca store the current aoff, as an int, in the frame
 * slot at aoffoff. */
2218 if (_jitc->function->allocar) {
2219 reg = jit_get_reg(jit_class_gpr);
2220 movi(rn(reg), _jitc->function->self.aoff);
2221 stxi_i(_jitc->function->aoffoff, _FP_REGNO, rn(reg));
/* Variadic functions spill the argument registers from vagp onwards into
 * the top of the frame, 8 bytes each, ending at FP + stack_framesize. */
2224 if (_jitc->function->self.call & jit_call_varargs) {
2225 for (reg = _jitc->function->vagp; jit_arg_reg_p(reg); ++reg)
2226 stxi(stack_framesize - ((8 - reg) * 8),
2227 _FP_REGNO, rn(JIT_RA0 - reg));
/* Function epilogue: mirrors the prologue's save area.  SP is reset from FP,
 * RA/FP and each callee-saved register flagged in the regset are reloaded
 * from the same offsets, and the stack_framesize bytes are released. */
2232 _epilog(jit_state_t *_jit, jit_node_t *node)
/* NOTE(review): assume_frame functions presumably return here without
 * emitting anything -- confirm. */
2234 if (_jitc->function->assume_frame)
2236 movr(_SP_REGNO, _FP_REGNO);
2237 ldxi(_RA_REGNO, _SP_REGNO, 0);
2238 ldxi(_FP_REGNO, _SP_REGNO, 8);
/* Integer callee-saved registers, offsets 16..96. */
2239 if (jit_regset_tstbit(&_jitc->function->regset, _S1))
2240 ldxi(9, _SP_REGNO, 16);
2241 if (jit_regset_tstbit(&_jitc->function->regset, _S2))
2242 ldxi(18, _SP_REGNO, 24);
2243 if (jit_regset_tstbit(&_jitc->function->regset, _S3))
2244 ldxi(19, _SP_REGNO, 32);
2245 if (jit_regset_tstbit(&_jitc->function->regset, _S4))
2246 ldxi(20, _SP_REGNO, 40);
2247 if (jit_regset_tstbit(&_jitc->function->regset, _S5))
2248 ldxi(21, _SP_REGNO, 48);
2249 if (jit_regset_tstbit(&_jitc->function->regset, _S6))
2250 ldxi(22, _SP_REGNO, 56);
2251 if (jit_regset_tstbit(&_jitc->function->regset, _S7))
2252 ldxi(23, _SP_REGNO, 64);
2253 if (jit_regset_tstbit(&_jitc->function->regset, _S8))
2254 ldxi(24, _SP_REGNO, 72);
2255 if (jit_regset_tstbit(&_jitc->function->regset, _S9))
2256 ldxi(25, _SP_REGNO, 80);
2257 if (jit_regset_tstbit(&_jitc->function->regset, _S10))
2258 ldxi(26, _SP_REGNO, 88);
2259 if (jit_regset_tstbit(&_jitc->function->regset, _S11))
2260 ldxi(27, _SP_REGNO, 96);
/* Floating-point callee-saved registers, offsets 104..192, as doubles. */
2261 if (jit_regset_tstbit(&_jitc->function->regset, _FS0))
2262 ldxi_d(8, _SP_REGNO, 104);
2263 if (jit_regset_tstbit(&_jitc->function->regset, _FS1))
2264 ldxi_d(9, _SP_REGNO, 112);
2265 if (jit_regset_tstbit(&_jitc->function->regset, _FS2))
2266 ldxi_d(18, _SP_REGNO, 120);
2267 if (jit_regset_tstbit(&_jitc->function->regset, _FS3))
2268 ldxi_d(19, _SP_REGNO, 128);
2269 if (jit_regset_tstbit(&_jitc->function->regset, _FS4))
2270 ldxi_d(20, _SP_REGNO, 136);
2271 if (jit_regset_tstbit(&_jitc->function->regset, _FS5))
2272 ldxi_d(21, _SP_REGNO, 144);
2273 if (jit_regset_tstbit(&_jitc->function->regset, _FS6))
2274 ldxi_d(22, _SP_REGNO, 152);
2275 if (jit_regset_tstbit(&_jitc->function->regset, _FS7))
2276 ldxi_d(23, _SP_REGNO, 160);
2277 if (jit_regset_tstbit(&_jitc->function->regset, _FS8))
2278 ldxi_d(24, _SP_REGNO, 168);
2279 if (jit_regset_tstbit(&_jitc->function->regset, _FS9))
2280 ldxi_d(25, _SP_REGNO, 176);
2281 if (jit_regset_tstbit(&_jitc->function->regset, _FS10))
2282 ldxi_d(26, _SP_REGNO, 184);
2283 if (jit_regset_tstbit(&_jitc->function->regset, _FS11))
2284 ldxi_d(27, _SP_REGNO, 192);
/* Release the save area reserved by the prologue. */
2285 addi(_SP_REGNO, _SP_REGNO, stack_framesize);
/* Initialise the va_list in r0; only valid in a varargs function (asserted).
 * If vagp still names an argument register, r0 points into the register
 * spill area at the top of the frame (same offset formula the prologue uses
 * for its varargs spill); the other addi presumably is the else branch and
 * points r0 at FP + self.size -- confirm. */
2290 _vastart(jit_state_t *_jit, jit_int32_t r0)
2292 assert(_jitc->function->self.call & jit_call_varargs);
2293 /* Initialize va_list to the first stack argument. */
2294 if (jit_arg_reg_p(_jitc->function->vagp))
2295 addi(r0, _FP_REGNO, stack_framesize - ((8 - _jitc->function->vagp) * 8));
2297 addi(r0, _FP_REGNO, _jitc->function->self.size);
/* Fetch the next variadic argument; only valid in a varargs function
 * (asserted).  r1 is the va_list cursor and is advanced by one machine word
 * after the load; r0 presumably receives the word at the old cursor --
 * confirm. */
2301 _vaarg(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
2303 assert(_jitc->function->self.call & jit_call_varargs);
2304 /* Load argument. */
2306 /* Update va_list. */
2307 addi(r1, r1, sizeof(jit_word_t));
2311 _patch_at(jit_state_t *_jit, jit_word_t instr, jit_word_t label)
2321 if (i.U.opcode == 55) { /* LUI */
2322 jit_int32_t ww = label << 32 >> 32;
2323 jit_int32_t lo = ww << 20 >> 20;
2324 jit_int32_t hi = ww - lo;
2325 i.U.imm12_31 = hi >> 12;
2328 if (i.I.opcode == 27 && i.I.funct3 == 0) { /* ADDIW */
2329 i.I.imm11_0 = lo & 0xfff;
2332 if (i.U.opcode == 55) { /* LUI */
2334 lo = ww << 20 >> 20;
2336 i.U.imm12_31 = hi >> 12;
2339 if (i.I.opcode == 27 && i.I.funct3 == 0) { /* ADDIW */
2340 i.I.imm11_0 = lo & 0xfff;
2343 assert(i.IS.opcode == 19); /* SLLI */
2344 assert(i.IS.shamt == 32);
2346 assert(i.R.opcode == 51); /* ADD */
2357 /* b{lt,le,eq,ge,gt,ne}{,_u}? */
2358 else if (i.B.opcode == 99) { /* B{EQ,NE,LT,GE,LTU,GEU} */
2359 jit_word_t jmp = label - instr;
2360 assert(simm12_p(jmp));
2361 i.B.imm11 = (jmp >> 11) & 0x1;
2362 i.B.imm4_1 = (jmp >> 1) & 0xf;
2363 i.B.imm10_5 = (jmp >> 5) & 0x3f;
2364 i.B.imm12 = (jmp >> 12) & 0x1;
2367 else if (i.J.opcode == 111) { /* JAL */
2368 jit_word_t jmp = label - instr;
2369 i.J.imm19_12 = (jmp >> 12) & 0xff;
2370 i.J.imm11 = (jmp >> 11) & 0x1;
2371 i.J.imm10_1 = (jmp >> 1) & 0x3ff;
2372 i.J.imm20 = (jmp >> 20) & 0x1;