Merge pull request #652 from pcercuei/update-lightrec-20220427
[pcsx_rearmed.git] / deps / lightning / lib / jit_arm-cpu.c
1 /*
2  * Copyright (C) 2012-2019  Free Software Foundation, Inc.
3  *
4  * This file is part of GNU lightning.
5  *
6  * GNU lightning is free software; you can redistribute it and/or modify it
7  * under the terms of the GNU Lesser General Public License as published
8  * by the Free Software Foundation; either version 3, or (at your option)
9  * any later version.
10  *
11  * GNU lightning is distributed in the hope that it will be useful, but
12  * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
13  * or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
14  * License for more details.
15  *
16  * Authors:
17  *      Paulo Cesar Pereira de Andrade
18  */
19
20 #if PROTO
/* Generic word load/store names map onto the `_i` (int) variants. */
#  define stxi(i0,r0,r1)                stxi_i(i0,r0,r1)
#  define ldxi(r0,r1,i0)                ldxi_i(r0,r1,i0)
#  define ldr(r0,r1)                    ldr_i(r0,r1)
/* Range predicates: non-zero when d fits in a signed 20-bit / 24-bit field.
 * Both uses of the argument are parenthesized so that an expression
 * argument (e.g. `a | b`) is compared as a whole. */
#  define _s20P(d)                      ((d) >= -(int)0x80000 && (d) <= 0x7ffff)
#  define _s24P(d)                      ((d) >= -(int)0x800000 && (d) <= 0x7fffff)
/* Bit-field masks: keep the low N bits of v. */
#  define _u3(v)                        ((v) & 0x7)
#  define _u4(v)                        ((v) & 0xf)
#  define _u5(v)                        ((v) & 0x1f)
#  define _u8(v)                        ((v) & 0xff)
#  define _u12(v)                       ((v) & 0xfff)
#  define _u13(v)                       ((v) & 0x1fff)
#  define _u16(v)                       ((v) & 0xffff)
#  define _u24(v)                       ((v) & 0xffffff)
/* Target/feature queries, read from jit_cpu and the compiler state. */
#  define jit_thumb_p()                 jit_cpu.thumb
#  define jit_no_set_flags()            _jitc->no_set_flags
#  define jit_armv5_p()                 (jit_cpu.version >= 5)
#  define jit_armv5e_p()                (jit_cpu.version > 5 || (jit_cpu.version == 5 && jit_cpu.extend))
#  define jit_armv6_p()                 (jit_cpu.version >= 6)
/* Hard-wired to 0 in this file. */
#  define jit_armv7r_p()                0
#  define stack_framesize               48
/* EABI run-time division helpers, declared here for use by this back end. */
extern int      __aeabi_idivmod(int, int);
extern unsigned __aeabi_uidivmod(unsigned, unsigned);
/* Hardware register numbers as encoded in instruction register fields. */
#  define _R0_REGNO                     0x00
#  define _R1_REGNO                     0x01
#  define _R2_REGNO                     0x02
#  define _R3_REGNO                     0x03
#  define _R4_REGNO                     0x04
#  define _R5_REGNO                     0x05
#  define _R6_REGNO                     0x06
#  define _R7_REGNO                     0x07
#  define _R8_REGNO                     0x08
#  define _R9_REGNO                     0x09
#  define _R10_REGNO                    0x0a
#  define _R11_REGNO                    0x0b
#  define _R12_REGNO                    0x0c
#  define _R13_REGNO                    0x0d
#  define _R14_REGNO                    0x0e
#  define _R15_REGNO                    0x0f
/* Role aliases: frame pointer, stack pointer, link register, program counter. */
#  define _FP_REGNO                     _R11_REGNO
#  define _SP_REGNO                     _R13_REGNO
#  define _LR_REGNO                     _R14_REGNO
#  define _PC_REGNO                     _R15_REGNO
/* ARM condition codes, already positioned in bits 31..28 of an instruction
 * word.  The trailing comment gives the flag state each one tests. */
#  define ARM_CC_EQ                     0x00000000      /* Z=1 */
#  define ARM_CC_NE                     0x10000000      /* Z=0 */
#  define ARM_CC_HS                     0x20000000      /* C=1 */
#    define ARM_CC_CS                   ARM_CC_HS
#  define ARM_CC_LO                     0x30000000      /* C=0 */
#    define ARM_CC_CC                   ARM_CC_LO
#  define ARM_CC_MI                     0x40000000      /* N=1 */
#  define ARM_CC_PL                     0x50000000      /* N=0 */
#  define ARM_CC_VS                     0x60000000      /* V=1 */
#  define ARM_CC_VC                     0x70000000      /* V=0 */
#  define ARM_CC_HI                     0x80000000      /* C=1 && Z=0 */
#  define ARM_CC_LS                     0x90000000      /* C=0 || Z=1 */
#  define ARM_CC_GE                     0xa0000000      /* N=V */
#  define ARM_CC_LT                     0xb0000000      /* N!=V */
#  define ARM_CC_GT                     0xc0000000      /* Z=0 && N=V */
#  define ARM_CC_LE                     0xd0000000      /* Z=1 || N!=V */
#  define ARM_CC_AL                     0xe0000000      /* always */
#  define ARM_CC_NV                     0xf0000000      /* reserved */
/* Selectors for the Thumb-2 IT block shape; passed as the second argument
 * of tcit() by the IT*() macros.  T = then, E = else. */
#  define THUMB2_IT                     0
#  define THUMB2_ITT                    1
#  define THUMB2_ITE                    2
#  define THUMB2_ITTT                   3
#  define THUMB2_ITET                   4
#  define THUMB2_ITTE                   5
#  define THUMB2_ITEE                   6
#  define THUMB2_ITTTT                  7
#  define THUMB2_ITETT                  8
#  define THUMB2_ITTET                  9
#  define THUMB2_ITEET                  10
#  define THUMB2_ITTTE                  11
#  define THUMB2_ITETE                  12
#  define THUMB2_ITTEE                  13
#  define THUMB2_ITEEE                  14
/* Data-processing opcode templates.  ARM_* are 32-bit ARM words, THUMB_*
 * are 16-bit Thumb halfwords and THUMB2_* are 32-bit Thumb-2 words; the
 * operand fields are OR-ed in by the emitter helpers. */
#  define ARM_MOV                       0x01a00000
#  define THUMB_MOV                         0x4600
#  define ARM_MOVWI                     0x03000000      /* v6t2, v7 */
#  define THUMB_MOVI                        0x2000
#  define THUMB2_MOVI                   0xf0400000
#  define THUMB2_MOVWI                  0xf2400000
#  define ARM_MOVTI                     0x03400000
#  define THUMB2_MOVTI                  0xf2c00000
#  define ARM_MVN                       0x01e00000
#  define THUMB_MVN                         0x43c0
#  define THUMB2_MVN                    0xea600000
#  define THUMB2_MVNI                   0xf0600000
/* Modifier bits OR-ed into an opcode template. */
#  define ARM_I                         0x02000000 /* immediate */
#  define ARM_S                         0x00100000 /* set flags */
#  define ARM_ADD                       0x00800000
#  define THUMB_ADD                         0x1800
#  define THUMB_ADDX                        0x4400
#  define THUMB2_ADD                    0xeb000000
#  define THUMB_ADDI3                       0x1c00
#  define THUMB_ADDI8                       0x3000
#  define THUMB2_ADDI                   0xf1000000
#  define THUMB2_ADDWI                  0xf2000000
#  define ARM_ADC                       0x00a00000
#  define THUMB_ADC                         0x4140
#  define THUMB2_ADC                    0xeb400000
#  define THUMB2_ADCI                   0xf1400000
#  define ARM_SUB                       0x00400000
#  define THUMB_SUB                         0x1a00
#  define THUMB2_SUB                    0xeba00000
#  define THUMB_SUBI3                       0x1e00
#  define THUMB_SUBI8                       0x3800
#  define THUMB2_SUBI                   0xf1a00000
#  define THUMB2_SUBWI                  0xf2a00000
#  define ARM_SBC                       0x00c00000
#  define THUMB_SBC                         0x4180
#  define THUMB2_SBC                    0xeb600000
#  define THUMB2_SBCI                   0xf1600000
#  define ARM_RSB                       0x00600000
#  define THUMB_RSBI                        0x4240
#  define THUMB2_RSBI                   0xf1c00000
#  define ARM_MUL                       0x00000090
#  define THUMB_MUL                         0x4340
#  define THUMB2_MUL                    0xfb00f000
#  define ARM_UMULL                     0x00800090
#  define THUMB2_UMULL                  0xfba00000
#  define ARM_SMULL                     0x00c00090
#  define THUMB2_SMULL                  0xfb800000
#  define THUMB2_SDIV                   0xfb90f0f0
#  define THUMB2_UDIV                   0xfbb0f0f0
#  define ARM_AND                       0x00000000
#  define THUMB_AND                         0x4000
#  define THUMB2_AND                    0xea000000
#  define THUMB2_ANDI                   0xf0000000
#  define ARM_BIC                       0x01c00000
#  define THUMB2_BIC                    0xea200000
#  define THUMB2_BICI                   0xf0200000
#  define ARM_ORR                       0x01800000
#  define THUMB_ORR                         0x4300
#  define THUMB2_ORR                    0xea400000
#  define THUMB2_ORRI                   0xf0400000
#  define ARM_EOR                       0x00200000
#  define THUMB_EOR                         0x4040
#  define THUMB2_EOR                    0xea800000
#  define THUMB2_EORI                   0xf0800000
/* >> ARMv6* */
/* Byte-reverse and sign/zero-extend opcode templates. */
#  define ARM_REV                       0x06bf0f30
#  define THUMB_REV                         0xba00
#  define THUMB2_REV                    0xfa90f080
#  define ARM_REV16                     0x06bf0fb0
#  define THUMB_REV16                       0xba40
#  define THUMB2_REV16                  0xfa90f090
#  define ARM_SXTB                      0x06af0070
#  define THUMB_SXTB                        0xb240
#  define THUMB2_SXTB                   0xfa40f080
#  define ARM_UXTB                      0x06ef0070
#  define THUMB_UXTB                        0xb2c0
#  define THUMB2_UXTB                   0xfa50f080
#  define ARM_SXTH                      0x06bf0070
#  define THUMB_SXTH                        0xb200
#  define THUMB2_SXTH                   0xfa00f080
#  define ARM_UXTH                      0x06ff0070
#  define THUMB_UXTH                        0xb280
#  define THUMB2_UXTH                   0xfa10f080
#  define ARM_XTR8                      0x00000400 /* ?xt? rotate 8 bits */
#  define ARM_XTR16                     0x00000800 /* ?xt? rotate 16 bits */
#  define ARM_XTR24                     0x00000c00 /* ?xt? rotate 24 bits */
/* << ARMv6* */
/* Shift opcode templates.  ARM_SHIFT has the same value as ARM_MOV; the
 * ARM_LSL/LSR/ASR/ROR values select the shift type and ARM_R selects a
 * register-specified shift amount. */
#  define ARM_SHIFT                     0x01a00000
#  define ARM_R                         0x00000010 /* register shift */
#  define ARM_LSL                       0x00000000
#  define THUMB_LSL                         0x4080
#  define THUMB2_LSL                    0xfa00f000
#  define THUMB_LSLI                        0x0000
#  define THUMB2_LSLI                   0xea4f0000
#  define ARM_LSR                       0x00000020
#  define THUMB_LSR                         0x40c0
#  define THUMB2_LSR                    0xfa20f000
#  define THUMB_LSRI                        0x0800
#  define THUMB2_LSRI                   0xea4f0010
#  define ARM_ASR                       0x00000040
#  define THUMB_ASR                         0x4100
#  define THUMB2_ASR                    0xfa40f000
#  define THUMB_ASRI                        0x1000
#  define THUMB2_ASRI                   0xea4f0020
#  define ARM_ROR                       0x00000060
/* Compare/test opcode templates. */
#  define ARM_CMP                       0x01500000
#  define THUMB_CMP                         0x4280
#  define THUMB_CMPX                        0x4500
#  define THUMB2_CMP                    0xebb00000
#  define THUMB_CMPI                        0x2800
#  define THUMB2_CMPI                   0xf1b00000
#  define ARM_CMN                       0x01700000
#  define THUMB_CMN                         0x42c0
#  define THUMB2_CMN                    0xeb100000
#  define THUMB2_CMNI                   0xf1100000
#  define ARM_TST                       0x01100000
#  define THUMB_TST                         0x4200
#  define THUMB2_TST                    0xea100000
#  define THUMB2_TSTI                   0xf0100000
#  define ARM_TEQ                       0x01300000
/* branch */
/* Branch opcode templates; the *_CC_B forms are the conditional variants
 * and the BL/BLX forms are the linking ones. */
#  define ARM_BX                        0x012fff10
#  define ARM_BLX                       0x012fff30
#  define THUMB_BLX                         0x4780
#  define ARM_BLXI                      0xfa000000
#  define THUMB2_BLXI                   0xf000c000
#  define ARM_B                         0x0a000000
#  define THUMB_CC_B                        0xd000
#  define THUMB_B                           0xe000
#  define THUMB2_CC_B                   0xf0008000
#  define THUMB2_B                      0xf0009000
#  define ARM_BLI                       0x0b000000
#  define THUMB2_BLI                    0xf000d000
/* ldr/str */
/* Load/store opcode templates.  Names without a trailing I take a register
 * offset, names ending in I take an immediate offset, and the THUMB2_*WI
 * names are separate immediate-offset templates. */
#  define ARM_P                         0x00800000 /* positive offset */
#  define THUMB2_P                      0x00000400
#  define THUMB2_U                      0x00000200
#  define THUMB2_W                      0x00000100
#  define ARM_LDRSB                     0x011000d0
#  define THUMB_LDRSB                       0x5600
#  define THUMB2_LDRSB                  0xf9100000
#  define ARM_LDRSBI                    0x015000d0
#  define THUMB2_LDRSBI                 0xf9100c00
#  define THUMB2_LDRSBWI                0xf9900000
#  define ARM_LDRB                      0x07500000
#  define THUMB_LDRB                        0x5c00
#  define THUMB2_LDRB                   0xf8100000
#  define ARM_LDRBI                     0x05500000
#  define THUMB_LDRBI                       0x7800
#  define THUMB2_LDRBI                  0xf8100c00
#  define THUMB2_LDRBWI                 0xf8900000
#  define ARM_LDRSH                     0x011000f0
#  define THUMB_LDRSH                       0x5e00
#  define THUMB2_LDRSH                  0xf9300000
#  define ARM_LDRSHI                    0x015000f0
#  define THUMB2_LDRSHI                 0xf9300c00
#  define THUMB2_LDRSHWI                0xf9b00000
#  define ARM_LDRH                      0x011000b0
#  define THUMB_LDRH                        0x5a00
#  define THUMB2_LDRH                   0xf8300000
#  define ARM_LDRHI                     0x015000b0
#  define THUMB_LDRHI                       0x8800
#  define THUMB2_LDRHI                  0xf8300c00
#  define THUMB2_LDRHWI                 0xf8b00000
#  define ARM_LDR                       0x07100000
#  define THUMB_LDR                         0x5800
#  define THUMB2_LDR                    0xf8500000
#  define ARM_LDRI                      0x05100000
#  define THUMB_LDRI                        0x6800
#  define THUMB_LDRISP                      0x9800
#  define THUMB2_LDRI                   0xf8500c00
#  define THUMB2_LDRWI                  0xf8d00000
#  define ARM_LDRD                      0x010000d0
#  define ARM_LDRDI                     0x014000d0
#  define THUMB2_LDRDI                  0xe8500000
#  define ARM_STRB                      0x07400000
#  define THUMB_STRB                        0x5400
#  define THUMB2_STRB                   0xf8000000
#  define ARM_STRBI                     0x05400000
#  define THUMB_STRBI                       0x7000
#  define THUMB2_STRBI                  0xf8000c00
#  define THUMB2_STRBWI                 0xf8800000
#  define ARM_STRH                      0x010000b0
#  define THUMB_STRH                        0x5200
#  define THUMB2_STRH                   0xf8200000
#  define ARM_STRHI                     0x014000b0
#  define THUMB_STRHI                       0x8000
#  define THUMB2_STRHI                  0xf8200c00
#  define THUMB2_STRHWI                 0xf8a00000
#  define ARM_STR                       0x07000000
#  define THUMB_STR                         0x5000
#  define THUMB2_STR                    0xf8400000
#  define ARM_STRI                      0x05000000
#  define THUMB_STRI                        0x6000
#  define THUMB2_STRWI                  0xf8c00000
#  define THUMB_STRISP                      0x9000
#  define THUMB2_STRI                   0xf8400c00
#  define ARM_STRD                      0x010000f0
#  define ARM_STRDI                     0x014000f0
#  define THUMB2_STRDI                  0xe8400000
/* ldm/stm */
/* Load/store-multiple templates and their addressing-mode bits. */
#  define ARM_M                         0x08000000
#  define ARM_M_L                       0x00100000 /* load; store if not set */
#  define ARM_M_I                       0x00800000 /* inc; dec if not set */
#  define ARM_M_B                       0x01000000 /* before; after if not set */
#  define ARM_M_U                       0x00200000 /* update Rn */
#  define THUMB2_LDM_W                  0x00200000
#  define THUMB2_LDM_P                  0x00008000
#  define THUMB2_LDM_M                  0x00004000
#  define THUMB_LDMIA                       0xc800
#  define THUMB2_LDMIA                  0xe8900000
#  define THUMB2_LDMB                   0xe9100000
#  define THUMB_PUSH                        0xb400
#  define THUMB2_PUSH                   0xe92d0000
#  define THUMB_POP                         0xbc00
#  define THUMB2_POP                    0xe8bd0000
/* Emit one 32-bit word (ii) or one 16-bit halfword (is) at the current
 * code pointer of `_jit` and advance that pointer. */
#  define ii(i)                         *_jit->pc.ui++ = (i)
#  define is(i)                         *_jit->pc.us++ = (i)
/* iss() emits a pair of halfwords; code2thumb()/thumb2code() convert
 * between the (t0,t1) halfword pair and the (c0,c1) pair in stream order.
 * The order is swapped on little-endian hosts.  Note that if neither
 * __BYTE_ORDER nor __LITTLE_ENDIAN is defined, the preprocessor evaluates
 * both as 0 and the little-endian branch is selected. */
#  if __BYTE_ORDER == __LITTLE_ENDIAN
#    define iss(i, j)                   do { is(j); is(i); } while (0)
#    define code2thumb(t0, t1, c0, c1)  do { t1 = c0; t0 = c1; } while (0)
#    define thumb2code(t0, t1, c0, c1)  do { c0 = t1; c1 = t0; } while (0)
#  else
#    define iss(i, j)                   do { is(i); is(j); } while (0)
#    define code2thumb(t0, t1, c0, c1)  do { t0 = c0; t1 = c1; } while (0)
#    define thumb2code(t0, t1, c0, c1)  do { c0 = t0; c1 = t1; } while (0)
#  endif
323 static int encode_arm_immediate(unsigned int v);
324 static int encode_thumb_immediate(unsigned int v);
325 static int encode_thumb_word_immediate(unsigned int v);
326 static int encode_thumb_jump(int v);
327 static int encode_thumb_cc_jump(int v);
328 static int encode_thumb_shift(int v, int type) maybe_unused;
329 #  define corrr(cc,o,rn,rd,rm)          _corrr(_jit,cc,o,rn,rd,rm)
330 static void _corrr(jit_state_t*,int,int,int,int,int);
331 #  define corri(cc,o,rn,rd,im)          _corri(_jit,cc,o,rn,rd,im)
332 static void _corri(jit_state_t*,int,int,int,int,int);
333 #define corri8(cc,o,rn,rt,im)   _corri8(_jit,cc,o,rn,rt,im)
334 static void _corri8(jit_state_t*,int,int,int,int,int);
335 #  define torrr(o,rn,rd,rm)             _torrr(_jit,o,rn,rd,rm)
336 static void _torrr(jit_state_t*,int,int,int,int);
337 #  define torrrs(o,rn,rd,rm,im)         _torrrs(_jit,o,rn,rd,rm,im)
338 static void _torrrs(jit_state_t*,int,int,int,int,int) maybe_unused;
339 #  define torxr(o,rn,rt,rm)             _torxr(_jit,o,rn,rt,rm)
340 static void _torxr(jit_state_t*,int,int,int,int);
341 #  define torrrr(o,rn,rl,rh,rm)         _torrrr(_jit,o,rn,rl,rh,rm)
342 static void _torrrr(jit_state_t*,int,int,int,int,int) maybe_unused;
343 #  define torrri8(o,rn,rt,rt2,im)       _torrri8(_jit,o,rn,rt,rt2,im)
344 static void _torrri8(jit_state_t*,int,int,int,int,int) maybe_unused;
345 #  define coriw(cc,o,rd,im)             _coriw(_jit,cc,o,rd,im)
346 static void _coriw(jit_state_t*,int,int,int,int);
347 #  define torri(o,rd,rn,im)             _torri(_jit,o,rd,rn,im)
348 static void _torri(jit_state_t*,int,int,int,int);
349 #  define torri8(o,rn,rt,im)            _torri8(_jit,o,rn,rt,im)
350 static void _torri8(jit_state_t*,int,int,int,int);
351 #  define torri12(o,rn,rt,im)           _torri12(_jit,o,rn,rt,im)
352 static void _torri12(jit_state_t*,int,int,int,int);
353 #  define tshift(o,rd,rm,im)            _tshift(_jit,o,rd,rm,im)
354 static void _tshift(jit_state_t*,int,int,int,int);
355 #  define toriw(o,rd,im)                _toriw(_jit,o,rd,im)
356 static void _toriw(jit_state_t*,int,int,int);
357 #  define tc8(cc,im)                    _tc8(_jit,cc,im)
358 static void _tc8(jit_state_t*,int,int) maybe_unused;
359 #  define t11(im)                       _t11(_jit,im)
360 static void _t11(jit_state_t*,int);
361 #  define tcb(cc,im)                    _tcb(_jit,cc,im)
362 static void _tcb(jit_state_t*,int,int);
363 #  define blxi(im)                      _blxi(_jit,im)
364 static void _blxi(jit_state_t*,int) maybe_unused;
365 #  define tb(o,im)                      _tb(_jit,o,im)
366 static void _tb(jit_state_t*,int,int);
367 #  define corrrr(cc,o,rh,rl,rm,rn)      _corrrr(_jit,cc,o,rh,rl,rm,rn)
368 static void _corrrr(jit_state_t*,int,int,int,int,int,int);
369 #  define corrrs(cc,o,rn,rd,rm,im)      _corrrs(_jit,cc,o,rn,rd,rm,im)
370 static void _corrrs(jit_state_t*,int,int,int,int,int,int);
371 #  define cshift(cc,o,rd,rm,rn,im)      _cshift(_jit,cc,o,rd,rm,rn,im)
372 static void _cshift(jit_state_t*,int,int,int,int,int,int);
373 #  define cb(cc,o,im)                   _cb(_jit,cc,o,im)
374 static void _cb(jit_state_t*,int,int,int);
375 #  define cbx(cc,o,rm)                  _cbx(_jit,cc,o,rm)
376 static void _cbx(jit_state_t*,int,int,int);
377 #  define corl(cc,o,r0,i0)              _corl(_jit,cc,o,r0,i0)
378 static void _corl(jit_state_t*,int,int,int,int);
379 #  define c6orr(cc,o,r0,r1)             _c6orr(_jit,cc,o,r0,r1)
380 static void _c6orr(jit_state_t*,int,int,int,int);
381 #  define tcit(cc,it)                   _tcit(_jit,cc,it)
382 static void _tcit(jit_state_t*,unsigned int,int);
383 #  define IT(cc)                        tcit(cc,THUMB2_IT)
384 #  define ITT(cc)                       tcit(cc,THUMB2_ITT)
385 #  define ITE(cc)                       tcit(cc,THUMB2_ITE)
386 #  define ITTT(cc)                      tcit(cc,THUMB2_ITTT)
387 #  define ITTE(cc)                      tcit(cc,THUMB2_ITTE)
388 #  define ITET(cc)                      tcit(cc,THUMB2_ITET)
389 #  define ITEE(cc)                      tcit(cc,THUMB2_ITEE)
390 #  define ITTTT(cc)                     tcit(cc,THUMB2_ITTTT)
391 #  define ITETT(cc)                     tcit(cc,THUMB2_ITETT)
392 #  define ITTET(cc)                     tcit(cc,THUMB2_ITTET)
393 #  define ITEET(cc)                     tcit(cc,THUMB2_ITEET)
394 #  define ITTTE(cc)                     tcit(cc,THUMB2_ITTTE)
395 #  define ITETE(cc)                     tcit(cc,THUMB2_ITETE)
396 #  define ITTEE(cc)                     tcit(cc,THUMB2_ITTEE)
397 #  define ITEEE(cc)                     tcit(cc,THUMB2_ITEEE)
398 #  define tpp(o,im)                     _tpp(_jit,o,im)
399 static void _tpp(jit_state_t*,int,int);
400 #  define torl(o,rn,im)                 _torl(_jit,o,rn,im)
401 static void _torl(jit_state_t*,int,int,int) maybe_unused;
/* Move / move-not instruction builders.
 *   CC_x(cc,...)  ARM encoding with an explicit condition code
 *   x(...)        ARM encoding, condition ARM_CC_AL
 *   T1_x(...)     16-bit Thumb encoding, emitted directly with is()
 *   T2_x(...)     32-bit Thumb-2 encoding
 * The T2 move forms pass _R15_REGNO in the rn position. */
#  define CC_MOV(cc,rd,rm)              corrr(cc,ARM_MOV,0,rd,rm)
#  define MOV(rd,rm)                    CC_MOV(ARM_CC_AL,rd,rm)
/* rd is 4 bits wide here: bit 3 goes to bit 7 of the halfword and the low
 * three bits to bits 2..0.  rd is parenthesized so an expression argument
 * is masked as a whole. */
#  define T1_MOV(rd,rm)                 is(THUMB_MOV|((_u4(rd)&8)<<4)|(_u4(rm)<<3)|((rd)&7))
#  define T2_MOV(rd,rm)                 T2_ORR(rd,_R15_REGNO,rm)
#  define CC_MOVI(cc,rd,im)             corri(cc,ARM_MOV|ARM_I,0,rd,im)
#  define MOVI(rd,im)                   CC_MOVI(ARM_CC_AL,rd,im)
#  define CC_MOVWI(cc,rd,im)            coriw(cc,ARM_MOVWI,rd,im)
#  define MOVWI(rd,im)                  CC_MOVWI(ARM_CC_AL,rd,im)
#  define T1_MOVI(rd,im)                is(THUMB_MOVI|(_u3(rd)<<8)|_u8(im))
#  define T2_MOVI(rd,im)                torri(THUMB2_MOVI,_R15_REGNO,rd,im)
#  define T2_MOVWI(rd,im)               toriw(THUMB2_MOVWI,rd,im)
#  define CC_MOVTI(cc,rd,im)            coriw(cc,ARM_MOVTI,rd,im)
#  define MOVTI(rd,im)                  CC_MOVTI(ARM_CC_AL,rd,im)
#  define T2_MOVTI(rd,im)               toriw(THUMB2_MOVTI,rd,im)
#  define CC_MVN(cc,rd,rm)              corrr(cc,ARM_MVN,0,rd,rm)
#  define MVN(rd,rm)                    CC_MVN(ARM_CC_AL,rd,rm)
#  define T1_MVN(rd,rm)                 is(THUMB_MVN|(_u3(rm)<<3)|_u3(rd))
#  define T2_MVN(rd,rm)                 torrr(THUMB2_MVN,_R15_REGNO,rd,rm)
#  define CC_MVNI(cc,rd,im)             corri(cc,ARM_MVN|ARM_I,0,rd,im)
#  define MVNI(rd,im)                   CC_MVNI(ARM_CC_AL,rd,im)
#  define T2_MVNI(rd,im)                torri(THUMB2_MVNI,_R15_REGNO,rd,im)
/* NOT is an alias for MVN. */
#  define CC_NOT(cc,rd,rm)              CC_MVN(cc,rd,rm)
#  define NOT(rd,rm)                    CC_NOT(ARM_CC_AL,rd,rm)
#  define T1_NOT(rd,rm)                 T1_MVN(rd,rm)
#  define T2_NOT(rd,rm)                 T2_MVN(rd,rm)
/* ARM NOP is emitted as `mov r0, r0`; the Thumb NOP is halfword 0xbf00. */
#  define NOP()                         MOV(_R0_REGNO, _R0_REGNO)
#  define T1_NOP()                      is(0xbf00)
/* Add / add-with-carry instruction builders.  The CC_ / plain / T1_ / T2_
 * prefixes select ARM with explicit condition, ARM with ARM_CC_AL, 16-bit
 * Thumb and 32-bit Thumb-2 respectively; a trailing S ORs in ARM_S (set
 * flags) and a trailing I takes an immediate. */
#  define CC_ADD(cc,rd,rn,rm)           corrr(cc,ARM_ADD,rn,rd,rm)
#  define ADD(rd,rn,rm)                 CC_ADD(ARM_CC_AL,rd,rn,rm)
#  define T1_ADD(rd,rn,rm)              is(THUMB_ADD|(_u3(rm)<<6)|(_u3(rn)<<3)|_u3(rd))
/* rdn is 4 bits wide: bit 3 goes to bit 7, the low three bits to bits
 * 2..0.  rdn is parenthesized so an expression argument is masked whole. */
#  define T1_ADDX(rdn,rm)               is(THUMB_ADDX|((_u4(rdn)&8)<<4)|(_u4(rm)<<3)|((rdn)&7))
#  define T2_ADD(rd,rn,rm)              torrr(THUMB2_ADD,rn,rd,rm)
#  define CC_ADDI(cc,rd,rn,im)          corri(cc,ARM_ADD|ARM_I,rn,rd,im)
#  define ADDI(rd,rn,im)                CC_ADDI(ARM_CC_AL,rd,rn,im)
#  define T1_ADDI3(rd,rn,im)            is(THUMB_ADDI3|(_u3(im)<<6)|(_u3(rn)<<3)|_u3(rd))
#  define T1_ADDI8(rdn,im)              is(THUMB_ADDI8|(_u3(rdn)<<8)|_u8(im))
#  define T2_ADDI(rd,rn,im)             torri(THUMB2_ADDI,rn,rd,im)
#  define T2_ADDWI(rd,rn,im)            torri(THUMB2_ADDWI,rn,rd,im)
#  define CC_ADDS(cc,rd,rn,rm)          corrr(cc,ARM_ADD|ARM_S,rn,rd,rm)
#  define ADDS(rd,rn,rm)                CC_ADDS(ARM_CC_AL,rd,rn,rm)
#  define T2_ADDS(rd,rn,rm)             torrr(THUMB2_ADD|ARM_S,rn,rd,rm)
#  define ADDSI(rd,rn,im)               corri(ARM_CC_AL,ARM_ADD|ARM_S|ARM_I,rn,rd,im)
#  define T2_ADDSI(rd,rn,im)            torri(THUMB2_ADDI|ARM_S,rn,rd,im)
#  define CC_ADC(cc,rd,rn,rm)           corrr(cc,ARM_ADC,rn,rd,rm)
#  define ADC(rd,rn,rm)                 CC_ADC(ARM_CC_AL,rd,rn,rm)
#  define T1_ADC(rdn,rm)                is(THUMB_ADC|(_u3(rm)<<3)|_u3(rdn))
#  define T2_ADC(rd,rn,rm)              torrr(THUMB2_ADC,rn,rd,rm)
#  define CC_ADCI(cc,rd,rn,im)          corri(cc,ARM_ADC|ARM_I,rn,rd,im)
#  define ADCI(rd,rn,im)                CC_ADCI(ARM_CC_AL,rd,rn,im)
#  define T2_ADCI(rd,rn,im)             torri(THUMB2_ADCI,rn,rd,im)
#  define CC_ADCS(cc,rd,rn,rm)          corrr(cc,ARM_ADC|ARM_S,rn,rd,rm)
#  define ADCS(rd,rn,rm)                CC_ADCS(ARM_CC_AL,rd,rn,rm)
#  define T2_ADCS(rd,rn,rm)             torrr(THUMB2_ADC|ARM_S,rn,rd,rm)
#  define CC_ADCSI(cc,rd,rn,im)         corri(cc,ARM_ADC|ARM_S|ARM_I,rn,rd,im)
#  define ADCSI(rd,rn,im)               CC_ADCSI(ARM_CC_AL,rd,rn,im)
#  define T2_ADCSI(rd,rn,im)            torri(THUMB2_ADCI|ARM_S,rn,rd,im)
/* Subtract / subtract-with-carry instruction builders.  The CC_ / plain /
 * T1_ / T2_ prefixes select ARM with explicit condition, ARM with
 * ARM_CC_AL, 16-bit Thumb and 32-bit Thumb-2 respectively; a trailing S
 * ORs in ARM_S (set flags) and a trailing I takes an immediate. */
#  define CC_SUB(cc,rd,rn,rm)           corrr(cc,ARM_SUB,rn,rd,rm)
#  define SUB(rd,rn,rm)                 CC_SUB(ARM_CC_AL,rd,rn,rm)
#  define T1_SUB(rd,rn,rm)              is(THUMB_SUB|(_u3(rm)<<6)|(_u3(rn)<<3)|_u3(rd))
#  define T2_SUB(rd,rn,rm)              torrr(THUMB2_SUB,rn,rd,rm)
#  define CC_SUBI(cc,rd,rn,im)          corri(cc,ARM_SUB|ARM_I,rn,rd,im)
#  define SUBI(rd,rn,im)                CC_SUBI(ARM_CC_AL,rd,rn,im)
#  define T1_SUBI3(rd,rn,im)            is(THUMB_SUBI3|(_u3(im)<<6)|(_u3(rn)<<3)|_u3(rd))
#  define T1_SUBI8(rdn,im)              is(THUMB_SUBI8|(_u3(rdn)<<8)|_u8(im))
#  define T2_SUBI(rd,rn,im)             torri(THUMB2_SUBI,rn,rd,im)
#  define T2_SUBWI(rd,rn,im)            torri(THUMB2_SUBWI,rn,rd,im)
#  define CC_SUBS(cc,rd,rn,rm)          corrr(cc,ARM_SUB|ARM_S,rn,rd,rm)
#  define SUBS(rd,rn,rm)                CC_SUBS(ARM_CC_AL,rd,rn,rm)
#  define T2_SUBS(rd,rn,rm)             torrr(THUMB2_SUB|ARM_S,rn,rd,rm)
#  define CC_SUBSI(cc,rd,rn,im)         corri(cc,ARM_SUB|ARM_S|ARM_I,rn,rd,im)
#  define SUBSI(rd,rn,im)               CC_SUBSI(ARM_CC_AL,rd,rn,im)
#  define T2_SUBSI(rd,rn,im)            torri(THUMB2_SUBI|ARM_S,rn,rd,im)
#  define CC_SBC(cc,rd,rn,rm)           corrr(cc,ARM_SBC,rn,rd,rm)
#  define SBC(rd,rn,rm)                 CC_SBC(ARM_CC_AL,rd,rn,rm)
#  define T1_SBC(rdn,rm)                is(THUMB_SBC|(_u3(rm)<<3)|_u3(rdn))
#  define T2_SBC(rd,rn,rm)              torrr(THUMB2_SBC,rn,rd,rm)
#  define CC_SBCI(cc,rd,rn,im)          corri(cc,ARM_SBC|ARM_I,rn,rd,im)
#  define SBCI(rd,rn,im)                CC_SBCI(ARM_CC_AL,rd,rn,im)
#  define T2_SBCI(rd,rn,im)             torri(THUMB2_SBCI,rn,rd,im)
#  define CC_SBCS(cc,rd,rn,rm)          corrr(cc,ARM_SBC|ARM_S,rn,rd,rm)
#  define SBCS(rd,rn,rm)                CC_SBCS(ARM_CC_AL,rd,rn,rm)
#  define T2_SBCS(rd,rn,rm)             torrr(THUMB2_SBC|ARM_S,rn,rd,rm)
#  define CC_SBCSI(cc,rd,rn,im)         corri(cc,ARM_SBC|ARM_S|ARM_I,rn,rd,im)
#  define SBCSI(rd,rn,im)               CC_SBCSI(ARM_CC_AL,rd,rn,im)
#  define T2_SBCSI(rd,rn,im)            torri(THUMB2_SBCI|ARM_S,rn,rd,im)
/* Reverse-subtract instruction builders. */
#  define CC_RSB(cc,rd,rn,rm)           corrr(cc,ARM_RSB,rn,rd,rm)
#  define RSB(rd,rn,rm)                 CC_RSB(ARM_CC_AL,rd,rn,rm)
/* T2_RSB expands to THUMB2_RSB, which the opcode table does not define
 * (only THUMB2_RSBI is), so any use of T2_RSB failed to compile.  Supply
 * the Thumb-2 RSB (register) template; it follows the same layout as
 * THUMB2_SUB (0xeba00000) with the RSB opcode field. */
#  ifndef THUMB2_RSB
#    define THUMB2_RSB                  0xebc00000
#  endif
#  define T2_RSB(rd,rn,rm)              torrr(THUMB2_RSB,rn,rd,rm)
#  define CC_RSBI(cc,rd,rn,im)          corri(cc,ARM_RSB|ARM_I,rn,rd,im)
#  define RSBI(rd,rn,im)                CC_RSBI(ARM_CC_AL,rd,rn,im)
/* The 16-bit form takes no immediate operand. */
#  define T1_RSBI(rd,rn)                is(THUMB_RSBI|(_u3(rn)<<3)|_u3(rd))
#  define T2_RSBI(rd,rn,im)             torri(THUMB2_RSBI,rn,rd,im)
/* Multiply / divide instruction builders.  The long multiplies take a
 * low (rl) and high (rh) destination register.  Only Thumb-2 forms of
 * SDIV/UDIV are provided here. */
#  define CC_MUL(cc,rl,rn,rm)           corrrr(cc,ARM_MUL,rl,0,rm,rn)
#  define MUL(rl,rn,rm)                 CC_MUL(ARM_CC_AL,rl,rn,rm)
#  define T1_MUL(rdm,rn)                is(THUMB_MUL|(_u3(rn)<<3)|_u3(rdm))
#  define T2_MUL(rd,rn,rm)              torrr(THUMB2_MUL,rn,rd,rm)
#  define CC_SMULL(cc,rl,rh,rn,rm)      corrrr(cc,ARM_SMULL,rh,rl,rm,rn)
#  define SMULL(rl,rh,rn,rm)            CC_SMULL(ARM_CC_AL,rl,rh,rn,rm)
#  define T2_SMULL(rl,rh,rn,rm)         torrrr(THUMB2_SMULL,rn,rl,rh,rm)
#  define CC_UMULL(cc,rl,rh,rn,rm)      corrrr(cc,ARM_UMULL,rh,rl,rm,rn)
#  define UMULL(rl,rh,rn,rm)            CC_UMULL(ARM_CC_AL,rl,rh,rn,rm)
#  define T2_UMULL(rl,rh,rn,rm)         torrrr(THUMB2_UMULL,rn,rl,rh,rm)
#  define T2_SDIV(rd,rn,rm)             torrr(THUMB2_SDIV,rn,rd,rm)
#  define T2_UDIV(rd,rn,rm)             torrr(THUMB2_UDIV,rn,rd,rm)
506 #  define CC_AND(cc,rd,rn,rm)           corrr(cc,ARM_AND,rn,rd,rm)
507 #  define AND(rd,rn,rm)                 CC_AND(ARM_CC_AL,rd,rn,rm)
508 #  define T1_AND(rdn,rm)                is(THUMB_AND|(_u3(rm)<<3)|_u3(rdn))
509 #  define T2_AND(rd,rn,rm)              torrr(THUMB2_AND,rn,rd,rm)
510 #  define CC_ANDI(cc,rd,rn,im)          corri(cc,ARM_AND|ARM_I,rn,rd,im)
511 #  define ANDI(rd,rn,im)                CC_ANDI(ARM_CC_AL,rd,rn,im)
512 #  define T2_ANDI(rd,rn,im)             torri(THUMB2_ANDI,rn,rd,im)
513 #  define CC_ANDS(cc,rd,rn,rm)          corrr(cc,ARM_AND|ARM_S,rn,rd,rm)
514 #  define ANDS(rd,rn,rm)                CC_ANDS(ARM_CC_AL,rd,rn,rm)
515 #  define T2_ANDS(rd,rn,rm)             torrr(THUMB2_AND|ARM_S,rn,rd,rm)
516 #  define CC_ANDSI(cc,rd,rn,im)         corri(cc,ARM_AND|ARM_S|ARM_I,rn,rd,im)
517 #  define ANDSI(rd,rn,im)               CC_ANDSI(ARM_CC_AL,rd,rn,im)
518 #  define T2_ANDSI(rd,rn,im)            torri(ARM_CC_AL,THUMB2_ANDI|ARM_S,rn,rd,im)
519 #  define CC_BIC(cc,rd,rn,rm)           corrr(cc,ARM_BIC,rn,rd,rm)
520 #  define BIC(rd,rn,rm)                 CC_BIC(ARM_CC_AL,rd,rn,rm)
521 #  define T2_BIC(rd,rn,rm)              torrr(THUMB2_BIC,rn,rd,rm)
522 #  define CC_BICI(cc,rd,rn,im)          corri(cc,ARM_BIC|ARM_I,rn,rd,im)
523 #  define BICI(rd,rn,im)                CC_BICI(ARM_CC_AL,rd,rn,im)
524 #  define T2_BICI(rd,rn,im)             torri(THUMB2_BICI,rn,rd,im)
525 #  define CC_BICS(cc,rd,rn,rm)          corrr(cc,ARM_BIC|ARM_S,rn,rd,rm)
526 #  define BICS(rd,rn,rm)                CC_BICS(ARM_CC_AL,rd,rn,rm)
527 #  define T2_BICS(rd,rn,rm)             torrr(THUMB2_BIC|ARM_S,rn,rd,rm)
528 #  define CC_BICSI(cc,rd,rn,im)         corri(cc,ARM_BIC|ARM_S|ARM_I,rn,rd,im)
529 #  define BICSI(rd,rn,im)               CC_BICSI(ARM_CC_AL,rd,rn,im)
530 #  define T2_BICSI(rd,rn,im)            torri(THUMB2_BICI|ARM_S,rn,rd,im) /* BIC-immediate opcode with ARM_S or'ed in; torri() takes (op,rn,rd,im), no cc */
531 #  define CC_ORR(cc,rd,rn,rm)           corrr(cc,ARM_ORR,rn,rd,rm)
532 #  define ORR(rd,rn,rm)                 CC_ORR(ARM_CC_AL,rd,rn,rm)
533 #  define T1_ORR(rdn,rm)                is(THUMB_ORR|(_u3(rm)<<3)|_u3(rdn))
534 #  define T2_ORR(rd,rn,rm)              torrr(THUMB2_ORR,rn,rd,rm)
535 #  define CC_ORR_SI(cc,rd,rn,rm,sh,im)  corrrs(cc,ARM_ORR|sh,rn,rd,rm,im) /* sh is or'ed into the opcode; rm and im are forwarded to corrrs(), same shape as CC_EOR_SI */
536 #  define ORR_SI(r0,r1,r2,sh,im)        CC_ORR_SI(ARM_CC_AL,r0,r1,r2,sh,im)
537 #  define CC_ORRI(cc,rd,rn,im)          corri(cc,ARM_ORR|ARM_I,rn,rd,im)
538 #  define ORRI(rd,rn,im)                CC_ORRI(ARM_CC_AL,rd,rn,im)
539 #  define T2_ORRI(rd,rn,im)             torri(THUMB2_ORRI,rn,rd,im)
540 #  define CC_EOR(cc,rd,rn,rm)           corrr(cc,ARM_EOR,rn,rd,rm)
541 #  define EOR(rd,rn,rm)                 CC_EOR(ARM_CC_AL,rd,rn,rm)
542 #  define T1_EOR(rdn,rm)                is(THUMB_EOR|(_u3(rm)<<3)|_u3(rdn))
543 #  define T2_EOR(rd,rn,rm)              torrr(THUMB2_EOR,rn,rd,rm)
544 #  define CC_EOR_SI(cc,rd,rn,rm,sh,im)  corrrs(cc,ARM_EOR|sh,rn,rd,rm,im)
545 #  define EOR_SI(r0,r1,r2,sh,im)        CC_EOR_SI(ARM_CC_AL,r0,r1,r2,sh,im)
546 #  define CC_EORI(cc,rd,rn,im)          corri(cc,ARM_EOR|ARM_I,rn,rd,im)
547 #  define EORI(rd,rn,im)                CC_EORI(ARM_CC_AL,rd,rn,im)
548 #  define T2_EORI(rd,rn,im)             torri(THUMB2_EORI,rn,rd,im)
549 #  define CC_REV(cc,rd,rm)              c6orr(cc,ARM_REV,rd,rm)
550 #  define REV(rd,rm)                    CC_REV(ARM_CC_AL,rd,rm)
551 #  define T1_REV(rd,rm)                 is(THUMB_REV|(_u3(rm)<<3)|_u3(rd))
552 #  define T2_REV(rd,rm)                 torrr(THUMB2_REV,rm,rd,rm)
553 #  define CC_REV16(cc,rd,rm)            c6orr(cc,ARM_REV16,rd,rm)
554 #  define REV16(rd,rm)                  CC_REV16(ARM_CC_AL,rd,rm)
555 #  define T1_REV16(rd,rm)               is(THUMB_REV16|(_u3(rm)<<3)|_u3(rd))
556 #  define T2_REV16(rd,rm)               torrr(THUMB2_REV16,rm,rd,rm)
557 #  define CC_SXTB(cc,rd,rm)             c6orr(cc,ARM_SXTB,rd,rm)
558 #  define SXTB(rd,rm)                   CC_SXTB(ARM_CC_AL,rd,rm)
559 #  define T1_SXTB(rd,rm)                is(THUMB_SXTB|(_u3(rm)<<3)|_u3(rd))
560 #  define T2_SXTB(rd,rm)                torrr(THUMB2_SXTB,_R15_REGNO,rd,rm)
561 #  define CC_UXTB(cc,rd,rm)             c6orr(cc,ARM_UXTB,rd,rm)
562 #  define UXTB(rd,rm)                   CC_UXTB(ARM_CC_AL,rd,rm)
563 #  define T1_UXTB(rd,rm)                is(THUMB_UXTB|(_u3(rm)<<3)|_u3(rd))
564 #  define T2_UXTB(rd,rm)                torrr(THUMB2_UXTB,_R15_REGNO,rd,rm)
565 #  define CC_SXTH(cc,rd,rm)             c6orr(cc,ARM_SXTH,rd,rm)
566 #  define SXTH(rd,rm)                   CC_SXTH(ARM_CC_AL,rd,rm)
567 #  define T1_SXTH(rd,rm)                is(THUMB_SXTH|(_u3(rm)<<3)|_u3(rd))
568 #  define T2_SXTH(rd,rm)                torrr(THUMB2_SXTH,_R15_REGNO,rd,rm)
569 #  define CC_UXTH(cc,rd,rm)             c6orr(cc,ARM_UXTH,rd,rm)
570 #  define UXTH(rd,rm)                   CC_UXTH(ARM_CC_AL,rd,rm)
571 #  define T1_UXTH(rd,rm)                is(THUMB_UXTH|(_u3(rm)<<3)|_u3(rd))
572 #  define T2_UXTH(rd,rm)                torrr(THUMB2_UXTH,_R15_REGNO,rd,rm)
573 #  define CC_SHIFT(cc,o,rd,rm,rn,im)    cshift(cc,o,rd,rm,rn,im)
574 #  define CC_LSL(cc,rd,rn,rm)           CC_SHIFT(cc,ARM_LSL|ARM_R,rd,rm,rn,0)
575 #  define LSL(rd,rn,rm)                 CC_LSL(ARM_CC_AL,rd,rn,rm)
576 #  define T1_LSL(rdn,rm)                is(THUMB_LSL|(_u3(rm)<<3)|_u3(rdn))
577 #  define T2_LSL(rd,rn,rm)              torrr(THUMB2_LSL,rn,rd,rm)
578 #  define CC_LSLI(cc,rd,rn,im)          CC_SHIFT(cc,ARM_LSL,rd,0,rn,im)
579 #  define LSLI(rd,rn,im)                CC_LSLI(ARM_CC_AL,rd,rn,im)
580 #  define T1_LSLI(rd,rm,im)             is(THUMB_LSLI|(_u5(im)<<6)|(_u3(rm)<<3)|_u3(rd))
581 #  define T2_LSLI(rd,rm,im)             tshift(THUMB2_LSLI,rd,rm,im)
582 #  define CC_LSR(cc,rd,rn,rm)           CC_SHIFT(cc,ARM_LSR|ARM_R,rd,rm,rn,0)
583 #  define LSR(rd,rn,rm)                 CC_LSR(ARM_CC_AL,rd,rn,rm)
584 #  define T1_LSR(rdn,rm)                is(THUMB_LSR|(_u3(rm)<<3)|_u3(rdn))
585 #  define T2_LSR(rd,rn,rm)              torrr(THUMB2_LSR,rn,rd,rm)
586 #  define CC_LSRI(cc,rd,rn,im)          CC_SHIFT(cc,ARM_LSR,rd,0,rn,im)
587 #  define LSRI(rd,rn,im)                CC_LSRI(ARM_CC_AL,rd,rn,im)
588 #  define T1_LSRI(rd,rm,im)             is(THUMB_LSRI|(_u5(im)<<6)|(_u3(rm)<<3)|_u3(rd))
589 #  define T2_LSRI(rd,rm,im)             tshift(THUMB2_LSRI,rd,rm,im)
590 #  define CC_ASR(cc,rd,rn,rm)           CC_SHIFT(cc,ARM_ASR|ARM_R,rd,rm,rn,0)
591 #  define ASR(rd,rn,rm)                 CC_ASR(ARM_CC_AL,rd,rn,rm)
592 #  define T1_ASR(rdn,rm)                is(THUMB_ASR|(_u3(rm)<<3)|_u3(rdn))
593 #  define T2_ASR(rd,rn,rm)              torrr(THUMB2_ASR,rn,rd,rm)
594 #  define CC_ASRI(cc,rd,rn,im)          CC_SHIFT(cc,ARM_ASR,rd,0,rn,im)
595 #  define ASRI(rd,rn,im)                CC_ASRI(ARM_CC_AL,rd,rn,im)
596 #  define T1_ASRI(rd,rm,im)             is(THUMB_ASRI|(_u5(im)<<6)|(_u3(rm)<<3)|_u3(rd))
597 #  define T2_ASRI(rd,rm,im)             tshift(THUMB2_ASRI,rd,rm,im)
598 #  define CC_CMP(cc,rn,rm)              corrr(cc,ARM_CMP,rn,0,rm)
599 #  define CMP(rn,rm)                    CC_CMP(ARM_CC_AL,rn,rm)
600 #  define T1_CMP(rn,rm)                 is(THUMB_CMP|(_u3(rm)<<3)|_u3(rn))
601 #  define T1_CMPX(rn,rm)                is(THUMB_CMPX|((_u4(rn)&8)<<4)|(_u4(rm)<<3)|_u3(rn)) /* rn bit 3 lands in bit 7, rm in bits 6:3, low three bits of rn in bits 2:0 */
602 #  define T2_CMP(rn,rm)                 torrr(THUMB2_CMP,rn,_R15_REGNO,rm)
603 #  define CC_CMPI(cc,rn,im)             corri(cc,ARM_CMP|ARM_I,rn,0,im)
604 #  define CMPI(rn,im)                   CC_CMPI(ARM_CC_AL,rn,im)
605 #  define T1_CMPI(rn,im)                is(THUMB_CMPI|(_u3(rn)<<8)|_u8(im))
606 #  define T2_CMPI(rn,im)                torri(THUMB2_CMPI,rn,_R15_REGNO,im)
607 #  define CC_CMN(cc,rn,rm)              corrr(cc,ARM_CMN,rn,0,rm)
608 #  define CMN(rn,rm)                    CC_CMN(ARM_CC_AL,rn,rm)
609 #  define T1_CMN(rn,rm)                 is(THUMB_CMN|(_u3(rm)<<3)|_u3(rn)) /* rm in bits 5:3, rn in bits 2:0, same layout as T1_CMP and T1_TST */
610 #  define T2_CMN(rn,rm)                 torrr(THUMB2_CMN,rn,_R15_REGNO,rm)
611 #  define CC_CMNI(cc,rn,im)             corri(cc,ARM_CMN|ARM_I,rn,0,im)
612 #  define CMNI(rn,im)                   CC_CMNI(ARM_CC_AL,rn,im)
613 #  define T2_CMNI(rn,im)                torri(THUMB2_CMNI,rn,_R15_REGNO,im)
614 #  define CC_TST(cc,rn,rm)              corrr(cc,ARM_TST,rn,0,rm) /* rd slot is a literal 0, as in CC_CMP, CC_CMN and CC_TEQ; it must not pick up a caller's r0 */
615 #  define TST(rn,rm)                    CC_TST(ARM_CC_AL,rn,rm)
616 #  define T1_TST(rn,rm)                 is(THUMB_TST|(_u3(rm)<<3)|_u3(rn))
617 #  define T2_TST(rn,rm)                 torrr(THUMB2_TST,rn,_R15_REGNO,rm)
618 #  define CC_TSTI(cc,rn,im)             corri(cc,ARM_TST|ARM_I,rn,0,im)
619 #  define TSTI(rn,im)                   CC_TSTI(ARM_CC_AL,rn,im)
620 #  define T2_TSTI(rn,im)                torri(THUMB2_TSTI,rn,_R15_REGNO,im)
621 #  define CC_TEQ(cc,rn,rm)              corrr(cc,ARM_TEQ,rn,0,rm)
622 #  define TEQ(rn,rm)                    CC_TEQ(ARM_CC_AL,rn,rm)
623 #  define CC_TEQI(cc,rn,im)             corri(cc,ARM_TEQ|ARM_I,rn,0,im) /* immediate form of CC_TEQ: rn is the tested register, rd slot is 0 */
624 #  define TEQI(rn,im)                   CC_TEQI(ARM_CC_AL,rn,im)
625 #  define CC_BX(cc,rm)                  cbx(cc,ARM_BX,rm)
626 #  define BX(rm)                        CC_BX(ARM_CC_AL,rm)
627 #  define T1_BX(rm)                     is(0x4700|(_u4(rm)<<3))
628 #  define CC_BLX(cc,rm)                 cbx(cc,ARM_BLX,rm)
629 #  define BLX(rm)                       CC_BLX(ARM_CC_AL,rm)
630 #  define T1_BLX(rm)                    is(THUMB_BLX|(_u4(rm)<<3))
631 #  define BLXI(im)                      blxi(im)
632 #  define T2_BLXI(im)                   tb(THUMB2_BLXI,im)
633 #  define CC_B(cc,im)                   cb(cc,ARM_B,im)
634 #  define B(im)                         CC_B(ARM_CC_AL,im)
635 #  define T1_CC_B(cc,im)                tc8(cc,im)
636 #  define T1_B(im)                      t11(im)
637 #  define T2_CC_B(cc,im)                tcb(cc,im)
638 #  define T2_B(im)                      tb(THUMB2_B,im)
639 #  define CC_BLI(cc,im)                 cb(cc,ARM_BLI,im)
640 #  define BLI(im)                       CC_BLI(ARM_CC_AL,im)
641 #  define T2_BLI(im)                    tb(THUMB2_BLI,im)
642 #  define CC_LDRSB(cc,rt,rn,rm)         corrr(cc,ARM_LDRSB|ARM_P,rn,rt,rm)
643 #  define LDRSB(rt,rn,rm)               CC_LDRSB(ARM_CC_AL,rt,rn,rm)
644 #  define T1_LDRSB(rt,rn,rm)            is(THUMB_LDRSB|(_u3(rm)<<6)|(_u3(rn)<<3)|_u3(rt))
645 #  define T2_LDRSB(rt,rn,rm)            torxr(THUMB2_LDRSB,rn,rt,rm)
646 #  define CC_LDRSBN(cc,rt,rn,rm)        corrr(cc,ARM_LDRSB,rn,rt,rm)
647 #  define LDRSBN(rt,rn,rm)              CC_LDRSBN(ARM_CC_AL,rt,rn,rm)
648 #  define CC_LDRSBI(cc,rt,rn,im)        corri8(cc,ARM_LDRSBI|ARM_P,rn,rt,im)
649 #  define LDRSBI(rt,rn,im)              CC_LDRSBI(ARM_CC_AL,rt,rn,im)
650 #  define T2_LDRSBI(rt,rn,im)           torri8(THUMB2_LDRSBI|THUMB2_U,rn,rt,im)
651 #  define T2_LDRSBWI(rt,rn,im)          torri12(THUMB2_LDRSBWI,rn,rt,im)
652 #  define CC_LDRSBIN(cc,rt,rn,im)       corri8(cc,ARM_LDRSBI,rn,rt,im)
653 #  define LDRSBIN(rt,rn,im)             CC_LDRSBIN(ARM_CC_AL,rt,rn,im)
654 #  define T2_LDRSBIN(rt,rn,im)          torri8(THUMB2_LDRSBI,rn,rt,im)
655 #  define CC_LDRB(cc,rt,rn,rm)          corrr(cc,ARM_LDRB|ARM_P,rn,rt,rm)
656 #  define LDRB(rt,rn,rm)                CC_LDRB(ARM_CC_AL,rt,rn,rm)
657 #  define T1_LDRB(rt,rn,rm)             is(THUMB_LDRB|(_u3(rm)<<6)|(_u3(rn)<<3)|_u3(rt))
658 #  define T2_LDRB(rt,rn,rm)             torxr(THUMB2_LDRB,rn,rt,rm)
659 #  define CC_LDRBN(cc,rt,rn,rm)         corrr(cc,ARM_LDRB,rn,rt,rm)
660 #  define LDRBN(rt,rn,rm)               CC_LDRBN(ARM_CC_AL,rt,rn,rm)
661 #  define CC_LDRBI(cc,rt,rn,im)         corri(cc,ARM_LDRBI|ARM_P,rn,rt,im)
662 #  define LDRBI(rt,rn,im)               CC_LDRBI(ARM_CC_AL,rt,rn,im)
663 #  define T1_LDRBI(rt,rn,im)            is(THUMB_LDRBI|(_u5(im)<<6)|(_u3(rn)<<3)|_u3(rt))
664 #  define T2_LDRBI(rt,rn,im)            torri8(THUMB2_LDRBI|THUMB2_U,rn,rt,im)
665 #  define T2_LDRBWI(rt,rn,im)           torri12(THUMB2_LDRBWI,rn,rt,im)
666 #  define CC_LDRBIN(cc,rt,rn,im)        corri(cc,ARM_LDRBI,rn,rt,im)
667 #  define LDRBIN(rt,rn,im)              CC_LDRBIN(ARM_CC_AL,rt,rn,im)
668 #  define T2_LDRBIN(rt,rn,im)           torri8(THUMB2_LDRBI,rn,rt,im)
669 #  define CC_LDRSH(cc,rt,rn,rm)         corrr(cc,ARM_LDRSH|ARM_P,rn,rt,rm)
670 #  define LDRSH(rt,rn,rm)               CC_LDRSH(ARM_CC_AL,rt,rn,rm)
671 #  define T1_LDRSH(rt,rn,rm)            is(THUMB_LDRSH|(_u3(rm)<<6)|(_u3(rn)<<3)|_u3(rt))
672 #  define T2_LDRSH(rt,rn,rm)            torxr(THUMB2_LDRSH,rn,rt,rm)
673 #  define CC_LDRSHN(cc,rt,rn,rm)        corrr(cc,ARM_LDRSH,rn,rt,rm)
674 #  define LDRSHN(rt,rn,rm)              CC_LDRSHN(ARM_CC_AL,rt,rn,rm)
675 #  define CC_LDRSHI(cc,rt,rn,im)        corri8(cc,ARM_LDRSHI|ARM_P,rn,rt,im)
676 #  define LDRSHI(rt,rn,im)              CC_LDRSHI(ARM_CC_AL,rt,rn,im)
677 #  define T2_LDRSHI(rt,rn,im)           torri8(THUMB2_LDRSHI|THUMB2_U,rn,rt,im)
678 #  define T2_LDRSHWI(rt,rn,im)          torri12(THUMB2_LDRSHWI,rn,rt,im)
679 #  define CC_LDRSHIN(cc,rt,rn,im)       corri8(cc,ARM_LDRSHI,rn,rt,im)
680 #  define LDRSHIN(rt,rn,im)             CC_LDRSHIN(ARM_CC_AL,rt,rn,im)
681 #  define T2_LDRSHIN(rt,rn,im)          torri8(THUMB2_LDRSHI,rn,rt,im)
682 #  define CC_LDRH(cc,rt,rn,rm)          corrr(cc,ARM_LDRH|ARM_P,rn,rt,rm)
683 #  define LDRH(rt,rn,rm)                CC_LDRH(ARM_CC_AL,rt,rn,rm)
684 #  define T1_LDRH(rt,rn,rm)             is(THUMB_LDRH|(_u3(rm)<<6)|(_u3(rn)<<3)|_u3(rt))
685 #  define T2_LDRH(rt,rn,rm)             torxr(THUMB2_LDRH,rn,rt,rm)
686 #  define CC_LDRHN(cc,rt,rn,rm)         corrr(cc,ARM_LDRH,rn,rt,rm)
687 #  define LDRHN(rt,rn,rm)               CC_LDRHN(ARM_CC_AL,rt,rn,rm)
688 #  define CC_LDRHI(cc,rt,rn,im)         corri8(cc,ARM_LDRHI|ARM_P,rn,rt,im)
689 #  define LDRHI(rt,rn,im)               CC_LDRHI(ARM_CC_AL,rt,rn,im)
690 #  define T1_LDRHI(rt,rn,im)            is(THUMB_LDRHI|(_u5(im)<<6)|(_u3(rn)<<3)|_u3(rt))
691 #  define T2_LDRHI(rt,rn,im)            torri8(THUMB2_LDRHI|THUMB2_U,rn,rt,im)
692 #  define T2_LDRHWI(rt,rn,im)           torri12(THUMB2_LDRHWI,rn,rt,im)
693 #  define CC_LDRHIN(cc,rt,rn,im)        corri8(cc,ARM_LDRHI,rn,rt,im)
694 #  define LDRHIN(rt,rn,im)              CC_LDRHIN(ARM_CC_AL,rt,rn,im)
695 #  define T2_LDRHIN(rt,rn,im)           torri8(THUMB2_LDRHI,rn,rt,im)
696 #  define CC_LDR(cc,rt,rn,rm)           corrr(cc,ARM_LDR|ARM_P,rn,rt,rm)
697 #  define LDR(rt,rn,rm)                 CC_LDR(ARM_CC_AL,rt,rn,rm)
698 #  define T1_LDR(rt,rn,rm)              is(THUMB_LDR|(_u3(rm)<<6)|(_u3(rn)<<3)|_u3(rt))
699 #  define T2_LDR(rt,rn,rm)              torxr(THUMB2_LDR,rn,rt,rm)
700 #  define CC_LDRN(cc,rt,rn,rm)          corrr(cc,ARM_LDR,rn,rt,rm)
701 #  define LDRN(rt,rn,rm)                CC_LDRN(ARM_CC_AL,rt,rn,rm)
702 #  define CC_LDRI(cc,rt,rn,im)          corri(cc,ARM_LDRI|ARM_P,rn,rt,im)
703 #  define LDRI(rt,rn,im)                CC_LDRI(ARM_CC_AL,rt,rn,im)
704 #  define T1_LDRI(rt,rn,im)             is(THUMB_LDRI|(_u5(im)<<6)|(_u3(rn)<<3)|_u3(rt))
705 #  define T1_LDRISP(rt,im)              is(THUMB_LDRISP|(_u3(rt)<<8)|_u8(im))
706 #  define T2_LDRI(rt,rn,im)             torri8(THUMB2_LDRI|THUMB2_U,rn,rt,im)
707 #  define T2_LDRWI(rt,rn,im)            torri12(THUMB2_LDRWI,rn,rt,im)
708 #  define CC_LDRIN(cc,rt,rn,im)         corri(cc,ARM_LDRI,rn,rt,im)
709 #  define LDRIN(rt,rn,im)               CC_LDRIN(ARM_CC_AL,rt,rn,im)
710 #  define T2_LDRIN(rt,rn,im)            torri8(THUMB2_LDRI,rn,rt,im)
711 #  define CC_LDRD(cc,rt,rn,rm)          corrr(cc,ARM_LDRD|ARM_P,rn,rt,rm)
712 #  define LDRD(rt,rn,rm)                CC_LDRD(ARM_CC_AL,rt,rn,rm)
713 #  define T2_LDRDI(rt,rt2,rn,im)        torrri8(THUMB2_LDRDI|ARM_P,rn,rt,rt2,im)
714 #  define CC_LDRDN(cc,rt,rn,rm)         corrr(cc,ARM_LDRD,rn,rt,rm)
715 #  define LDRDN(rt,rn,rm)               CC_LDRDN(ARM_CC_AL,rt,rn,rm) /* unconditional CC_LDRDN (ARM_LDRD without ARM_P); first argument is the rt forwarded to it */
716 #  define CC_LDRDI(cc,rt,rn,im)         corri8(cc,ARM_LDRDI|ARM_P,rn,rt,im)
717 #  define LDRDI(rt,rn,im)               CC_LDRDI(ARM_CC_AL,rt,rn,im)
718 #  define CC_LDRDIN(cc,rt,rn,im)        corri8(cc,ARM_LDRDI,rn,rt,im)
719 #  define LDRDIN(rt,rn,im)              CC_LDRDIN(ARM_CC_AL,rt,rn,im)
720 #  define T2_LDRDIN(rt,rt2,rn,im)       torrri8(THUMB2_LDRDI,rn,rt,rt2,im)
721 #  define CC_STRB(cc,rt,rn,rm)          corrr(cc,ARM_STRB|ARM_P,rn,rt,rm)
722 #  define STRB(rt,rn,rm)                CC_STRB(ARM_CC_AL,rt,rn,rm)
723 #  define T1_STRB(rt,rn,rm)             is(THUMB_STRB|(_u3(rm)<<6)|(_u3(rn)<<3)|_u3(rt))
724 #  define T2_STRB(rt,rn,rm)             torxr(THUMB2_STRB,rn,rt,rm)
725 #  define CC_STRBN(cc,rt,rn,rm)         corrr(cc,ARM_STRB,rn,rt,rm)
726 #  define STRBN(rt,rn,rm)               CC_STRBN(ARM_CC_AL,rt,rn,rm)
727 #  define CC_STRBI(cc,rt,rn,im)         corri(cc,ARM_STRBI|ARM_P,rn,rt,im)
728 #  define STRBI(rt,rn,im)               CC_STRBI(ARM_CC_AL,rt,rn,im)
729 #  define T1_STRBI(rt,rn,im)            is(THUMB_STRBI|(_u5(im)<<6)|(_u3(rn)<<3)|_u3(rt))
730 #  define T2_STRBI(rt,rn,im)            torri8(THUMB2_STRBI|THUMB2_U,rn,rt,im)
731 #  define T2_STRBWI(rt,rn,im)           torri12(THUMB2_STRBWI,rn,rt,im)
732 #  define CC_STRBIN(cc,rt,rn,im)        corri(cc,ARM_STRBI,rn,rt,im)
733 #  define STRBIN(rt,rn,im)              CC_STRBIN(ARM_CC_AL,rt,rn,im)
734 #  define T2_STRBIN(rt,rn,im)           torri8(THUMB2_STRBI,rn,rt,im)
735 #  define CC_STRH(cc,rt,rn,rm)          corrr(cc,ARM_STRH|ARM_P,rn,rt,rm)
736 #  define STRH(rt,rn,rm)                CC_STRH(ARM_CC_AL,rt,rn,rm)
737 #  define T1_STRH(rt,rn,rm)             is(THUMB_STRH|(_u3(rm)<<6)|(_u3(rn)<<3)|_u3(rt))
738 #  define T2_STRH(rt,rn,rm)             torxr(THUMB2_STRH,rn,rt,rm)
739 #  define CC_STRHN(cc,rt,rn,rm)         corrr(cc,ARM_STRH,rn,rt,rm)
740 #  define STRHN(rt,rn,rm)               CC_STRHN(ARM_CC_AL,rt,rn,rm)
741 #  define CC_STRHI(cc,rt,rn,im)         corri8(cc,ARM_STRHI|ARM_P,rn,rt,im)
742 #  define STRHI(rt,rn,im)               CC_STRHI(ARM_CC_AL,rt,rn,im)
743 #  define T1_STRHI(rt,rn,im)            is(THUMB_STRHI|(_u5(im)<<6)|(_u3(rn)<<3)|_u3(rt))
744 #  define T2_STRHI(rt,rn,im)            torri8(THUMB2_STRHI|THUMB2_U,rn,rt,im)
745 #  define T2_STRHWI(rt,rn,im)           torri12(THUMB2_STRHWI,rn,rt,im)
746 #  define CC_STRHIN(cc,rt,rn,im)        corri8(cc,ARM_STRHI,rn,rt,im)
747 #  define STRHIN(rt,rn,im)              CC_STRHIN(ARM_CC_AL,rt,rn,im)
748 #  define T2_STRHIN(rt,rn,im)           torri8(THUMB2_STRHI,rn,rt,im)
749 #  define CC_STR(cc,rt,rn,rm)           corrr(cc,ARM_STR|ARM_P,rn,rt,rm)
750 #  define STR(rt,rn,rm)                 CC_STR(ARM_CC_AL,rt,rn,rm)
751 #  define T1_STR(rt,rn,rm)              is(THUMB_STR|(_u3(rm)<<6)|(_u3(rn)<<3)|_u3(rt))
752 #  define T2_STR(rt,rn,rm)              torxr(THUMB2_STR,rn,rt,rm)
753 #  define CC_STRN(cc,rt,rn,rm)          corrr(cc,ARM_STR,rn,rt,rm)
754 #  define STRN(rt,rn,rm)                CC_STRN(ARM_CC_AL,rt,rn,rm)
755 #  define CC_STRI(cc,rt,rn,im)          corri(cc,ARM_STRI|ARM_P,rn,rt,im)
756 #  define STRI(rt,rn,im)                CC_STRI(ARM_CC_AL,rt,rn,im)
757 #  define T1_STRI(rt,rn,im)             is(THUMB_STRI|(_u5(im)<<6)|(_u3(rn)<<3)|_u3(rt))
758 #  define T1_STRISP(rt,im)              is(THUMB_STRISP|(_u3(rt)<<8)|(_u8(im)))
759 #  define T2_STRI(rt,rn,im)             torri8(THUMB2_STRI|THUMB2_U,rn,rt,im)
760 #  define T2_STRWI(rt,rn,im)            torri12(THUMB2_STRWI,rn,rt,im)
761 #  define CC_STRIN(cc,rt,rn,im)         corri(cc,ARM_STRI,rn,rt,im)
762 #  define STRIN(rt,rn,im)               CC_STRIN(ARM_CC_AL,rt,rn,im)
763 #  define T2_STRIN(rt,rn,im)            torri8(THUMB2_STRI,rn,rt,im)
764 #  define CC_STRD(cc,rt,rn,rm)          corrr(cc,ARM_STRD|ARM_P,rn,rt,rm)
765 #  define STRD(rt,rn,rm)                CC_STRD(ARM_CC_AL,rt,rn,rm)
766 #  define CC_STRDN(cc,rt,rn,rm)         corrr(cc,ARM_STRD,rn,rt,rm)
767 #  define STRDN(rt,rn,rm)               CC_STRDN(ARM_CC_AL,rt,rn,rm)
768 #  define CC_STRDI(cc,rt,rn,im)         corri8(cc,ARM_STRDI|ARM_P,rn,rt,im)
769 #  define STRDI(rt,rn,im)               CC_STRDI(ARM_CC_AL,rt,rn,im)
770 #  define T2_STRDI(rt,rt2,rn,im)        torrri8(THUMB2_STRDI|ARM_P,rn,rt,rt2,im)
771 #  define CC_STRDIN(cc,rt,rn,im)        corri8(cc,ARM_STRDI,rn,rt,im)
772 #  define STRDIN(rt,rn,im)              CC_STRDIN(ARM_CC_AL,rt,rn,im)
773 #  define T2_STRDIN(rt,rt2,rn,im)       torrri8(THUMB2_STRDI,rn,rt,rt2,im)
774 #  define CC_LDMIA(cc,rn,im)            corl(cc,ARM_M|ARM_M_L|ARM_M_I,rn,im)
775 #  define LDMIA(rn,im)                  CC_LDMIA(ARM_CC_AL,rn,im)
776 #  define CC_LDM(cc,rn,im)              CC_LDMIA(cc,rn,im)
777 #  define LDM(rn,im)                    LDMIA(rn,im)
778 #  define T1_LDMIA(rn,im)               is(THUMB_LDMIA|(_u3(rn)<<8)|(im)) /* rn in bits 10:8; im is or'ed in unmasked, so callers must pass a value that fits the low byte */
779 #  define T2_LDMIA(rn,im)               torl(THUMB2_LDMIA,rn,im)
780 #  define CC_LDMIA_U(cc,rn,im)          corl(cc,ARM_M|ARM_M_L|ARM_M_I|ARM_M_U,rn,im)
781 #  define LDMIA_U(rn,im)                CC_LDMIA_U(ARM_CC_AL,rn,im)
782 #  define LDM_U(r0,i0)                  LDMIA_U(r0,i0)
783 #  define CC_LDMIB(cc,rn,im)            corl(cc,ARM_M|ARM_M_L|ARM_M_I|ARM_M_B,rn,im)
784 #  define LDMIB(rn,im)                  CC_LDMIB(ARM_CC_AL,rn,im)
785 #  define CC_LDMIB_U(cc,rn,im)          corl(cc,ARM_M|ARM_M_L|ARM_M_I|ARM_M_B|ARM_M_U,rn,im)
786 #  define LDMIB_U(rn,im)                CC_LDMIB_U(ARM_CC_AL,rn,im)
787 #  define CC_LDMDA(cc,rn,im)            corl(cc,ARM_M|ARM_M_L,rn,im)
788 #  define LDMDA(rn,im)                  CC_LDMDA(ARM_CC_AL,rn,im)
789 #  define CC_LDMDA_U(cc,rn,im)          corl(cc,ARM_M|ARM_M_L|ARM_M_U,rn,im)
790 #  define LDMDA_U(rn,im)                CC_LDMDA_U(ARM_CC_AL,rn,im)
791 #  define CC_LDMDB(cc,rn,im)            corl(cc,ARM_M|ARM_M_L|ARM_M_B,rn,im)
792 #  define LDMDB(rn,im)                  CC_LDMDB(ARM_CC_AL,rn,im)
793 #  define T2_LDMDB(rn,im)               torl(THUMB2_LDMDB,rn,im)
794 #  define CC_LDMDB_U(cc,rn,im)          corl(cc,ARM_M|ARM_M_L|ARM_M_B|ARM_M_U,rn,im)
795 #  define LDMDB_U(rn,im)                CC_LDMDB_U(ARM_CC_AL,rn,im)
796 #  define CC_STMIA(cc,rn,im)            corl(cc,ARM_M|ARM_M_I,rn,im)
797 #  define STMIA(rn,im)                  CC_STMIA(ARM_CC_AL,rn,im)
798 #  define CC_STM(cc,rn,im)              CC_STMIA(cc,rn,im)
799 #  define STM(rn,im)                    STMIA(rn,im)
800 #  define CC_STMIA_U(cc,rn,im)          corl(cc,ARM_M|ARM_M_I|ARM_M_U,rn,im)
801 #  define STMIA_U(rn,im)                CC_STMIA_U(ARM_CC_AL,rn,im)
802 #  define CC_STM_U(cc,rn,im)            CC_STMIA_U(cc,rn,im)
803 #  define STM_U(rn,im)                  STMIA_U(rn,im)
804 #  define CC_STMIB(cc,rn,im)            corl(cc,ARM_M|ARM_M_I|ARM_M_B,rn,im)
805 #  define STMIB(rn,im)                  CC_STMIB(ARM_CC_AL,rn,im)
806 #  define CC_STMIB_U(cc,rn,im)          corl(cc,ARM_M|ARM_M_I|ARM_M_B|ARM_M_U,rn,im)
807 #  define STMIB_U(rn,im)                CC_STMIB_U(ARM_CC_AL,rn,im)
808 #  define CC_STMDA(cc,rn,im)            corl(cc,ARM_M,rn,im)
809 #  define STMDA(rn,im)                  CC_STMDA(ARM_CC_AL,rn,im)
810 #  define CC_STMDA_U(cc,rn,im)          corl(cc,ARM_M|ARM_M_U,rn,im)
811 #  define STMDA_U(rn,im)                CC_STMDA_U(ARM_CC_AL,rn,im)
812 #  define CC_STMDB(cc,rn,im)            corl(cc,ARM_M|ARM_M_B,rn,im)
813 #  define STMDB(rn,im)                  CC_STMDB(ARM_CC_AL,rn,im)
814 #  define CC_STMDB_U(cc,rn,im)          corl(cc,ARM_M|ARM_M_B|ARM_M_U,rn,im)
815 #  define STMDB_U(rn,im)                CC_STMDB_U(ARM_CC_AL,rn,im)
816 #  define CC_PUSH(cc,im)                CC_STMDB_U(cc,_SP_REGNO,im) /* conditional push: CC_STMDB_U on _SP_REGNO */
817 #  define PUSH(im)                      STMDB_U(_SP_REGNO,im)
818 #  define T1_PUSH(im)                   is(THUMB_PUSH|(((im)&0x4000)>>6)|((im)&0xff)) /* bit 14 of im moves to bit 8; low 8 bits kept as-is */
819 #  define T2_PUSH(im)                   tpp(THUMB2_PUSH,im)
820 #  define CC_POP(cc,im)                 CC_LDMIA_U(cc,_SP_REGNO,im) /* conditional pop: needs the cc-taking CC_LDMIA_U, LDMIA_U only takes (rn,im) */
821 #  define POP(im)                       LDMIA_U(_SP_REGNO,im)
822 #  define T1_POP(im)                    is(THUMB_POP|(((im)&0x8000)>>7)|((im)&0xff)) /* bit 15 of im moves to bit 8; low 8 bits kept as-is */
823 #  define T2_POP(im)                    tpp(THUMB2_POP,im)
/*
 * Calls jit_get_reg() on _R0, _R1, _R2 and _R3 in that order, each with
 * jit_class_named|jit_class_gpr, and discards the returned values.
 * NOTE(review): presumably this reserves the four argument registers so
 * they are not handed out as temporaries -- confirm against jit_get_reg().
 * Paired with jit_unget_reg_args().
 */
824 #  define jit_get_reg_args()                                            \
825     do {                                                                \
826         (void)jit_get_reg(_R0|jit_class_named|jit_class_gpr);           \
827         (void)jit_get_reg(_R1|jit_class_named|jit_class_gpr);           \
828         (void)jit_get_reg(_R2|jit_class_named|jit_class_gpr);           \
829         (void)jit_get_reg(_R3|jit_class_named|jit_class_gpr);           \
830     } while (0)
/*
 * Calls jit_unget_reg() on _R3, _R2, _R1 and _R0, i.e. the same four
 * registers jit_get_reg_args() names, in the opposite order.
 */
831 #  define jit_unget_reg_args()                                          \
832     do {                                                                \
833         jit_unget_reg(_R3);                                             \
834         jit_unget_reg(_R2);                                             \
835         jit_unget_reg(_R1);                                             \
836         jit_unget_reg(_R0);                                             \
837     } while (0)
838 #  define nop(i0)                       _nop(_jit,i0)
839 static void _nop(jit_state_t*,jit_int32_t);
840 #  define movr(r0,r1)                   _movr(_jit,r0,r1)
841 static void _movr(jit_state_t*,jit_int32_t,jit_int32_t);
842 #  define movi(r0,i0)                   _movi(_jit,r0,i0)
843 static void _movi(jit_state_t*,jit_int32_t,jit_word_t);
844 #  define movi_p(r0,i0)                 _movi_p(_jit,r0,i0)
845 static jit_word_t _movi_p(jit_state_t*,jit_int32_t,jit_word_t);
846 #  define movnr(r0,r1,r2)               _movnr(_jit,r0,r1,r2)
847 static void _movnr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
848 #  define movzr(r0,r1,r2)               _movzr(_jit,r0,r1,r2)
849 static void _movzr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
850 #  define comr(r0,r1)                   _comr(_jit,r0,r1)
851 static void _comr(jit_state_t*,jit_int32_t,jit_int32_t);
852 #  define negr(r0,r1)                   _negr(_jit,r0,r1)
853 static void _negr(jit_state_t*,jit_int32_t,jit_int32_t);
854 #  define addr(r0,r1,r2)                _addr(_jit,r0,r1,r2)
855 static void _addr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
856 #  define addi(r0,r1,i0)                _addi(_jit,r0,r1,i0)
857 static void _addi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
858 #  define addcr(r0,r1,r2)               _addcr(_jit,r0,r1,r2)
859 static void _addcr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
860 #  define addci(r0,r1,i0)               _addci(_jit,r0,r1,i0)
861 static void _addci(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
862 #  define addxr(r0,r1,r2)               _addxr(_jit,r0,r1,r2)
863 static void _addxr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
864 #  define addxi(r0,r1,i0)               _addxi(_jit,r0,r1,i0)
865 static void _addxi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
866 #  define subr(r0,r1,r2)                _subr(_jit,r0,r1,r2)
867 static void _subr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
868 #  define subi(r0,r1,i0)                _subi(_jit,r0,r1,i0)
869 static void _subi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
870 #  define subcr(r0,r1,r2)               _subcr(_jit,r0,r1,r2)
871 static void _subcr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
872 #  define subci(r0,r1,i0)               _subci(_jit,r0,r1,i0)
873 static void _subci(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
874 #  define subxr(r0,r1,r2)               _subxr(_jit,r0,r1,r2)
875 static void _subxr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
876 #  define subxi(r0,r1,i0)               _subxi(_jit,r0,r1,i0)
877 static void _subxi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
878 #  define rsbi(r0, r1, i0)              _rsbi(_jit, r0, r1, i0)
879 static void _rsbi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
880 #  define mulr(r0,r1,r2)                _mulr(_jit,r0,r1,r2)
881 static void _mulr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
882 #  define muli(r0,r1,i0)                _muli(_jit,r0,r1,i0)
883 static void _muli(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
884 #  define qmulr(r0,r1,r2,r3)            iqmulr(r0,r1,r2,r3,1)
885 #  define qmulr_u(r0,r1,r2,r3)          iqmulr(r0,r1,r2,r3,0)
886 #  define iqmulr(r0,r1,r2,r3,cc)        _iqmulr(_jit,r0,r1,r2,r3,cc)
887 static void _iqmulr(jit_state_t*,jit_int32_t,jit_int32_t,
888                     jit_int32_t,jit_int32_t,jit_bool_t);
889 #  define qmuli(r0,r1,r2,i0)            iqmuli(r0,r1,r2,i0,1)
890 #  define qmuli_u(r0,r1,r2,i0)          iqmuli(r0,r1,r2,i0,0)
891 #  define iqmuli(r0,r1,r2,i0,cc)        _iqmuli(_jit,r0,r1,r2,i0,cc)
892 static void _iqmuli(jit_state_t*,jit_int32_t,jit_int32_t,
893                     jit_int32_t,jit_word_t,jit_bool_t);
894 #  define divrem(d,s,r0,r1,r2)          _divrem(_jit,d,s,r0,r1,r2)
895 static void _divrem(jit_state_t*,int,int,jit_int32_t,jit_int32_t,jit_int32_t);
896 #  define divr(r0,r1,r2)                _divr(_jit,r0,r1,r2)
897 static void _divr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
898 #  define divi(r0,r1,i0)                _divi(_jit,r0,r1,i0)
899 static void _divi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
900 #  define divr_u(r0,r1,r2)              _divr_u(_jit,r0,r1,r2)
901 static void _divr_u(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
902 #  define divi_u(r0,r1,i0)              _divi_u(_jit,r0,r1,i0)
903 static void _divi_u(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
904 #  define qdivr(r0,r1,r2,r3)            iqdivr(r0,r1,r2,r3,1)
905 #  define qdivr_u(r0,r1,r2,r3)          iqdivr(r0,r1,r2,r3,0)
906 #  define iqdivr(r0,r1,r2,r3,cc)        _iqdivr(_jit,r0,r1,r2,r3,cc)
907 static void _iqdivr(jit_state_t*,jit_int32_t,jit_int32_t,
908                     jit_int32_t,jit_int32_t,jit_bool_t);
909 #  define qdivi(r0,r1,r2,i0)            iqdivi(r0,r1,r2,i0,1)
910 #  define qdivi_u(r0,r1,r2,i0)          iqdivi(r0,r1,r2,i0,0)
911 #  define iqdivi(r0,r1,r2,i0,cc)        _iqdivi(_jit,r0,r1,r2,i0,cc)
912 static void _iqdivi(jit_state_t*,jit_int32_t,jit_int32_t,
913                     jit_int32_t,jit_word_t,jit_bool_t);
914 #  define remr(r0,r1,r2)                _remr(_jit,r0,r1,r2)
915 static void _remr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
916 #  define remi(r0,r1,i0)                _remi(_jit,r0,r1,i0)
917 static void _remi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
918 #  define remr_u(r0,r1,r2)              _remr_u(_jit,r0,r1,r2)
919 static void _remr_u(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
920 #  define remi_u(r0,r1,i0)              _remi_u(_jit,r0,r1,i0)
921 static void _remi_u(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
922 #  define andr(r0,r1,r2)                _andr(_jit,r0,r1,r2)
923 static void _andr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
924 #  define andi(r0,r1,i0)                _andi(_jit,r0,r1,i0)
925 static void _andi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
926 #  define orr(r0,r1,r2)                 _orr(_jit,r0,r1,r2)
927 static void _orr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
928 #  define ori(r0,r1,i0)                 _ori(_jit,r0,r1,i0)
929 static void _ori(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
930 #  define xorr(r0,r1,r2)                _xorr(_jit,r0,r1,r2)
931 static void _xorr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
932 #  define xori(r0,r1,i0)                _xori(_jit,r0,r1,i0)
933 static void _xori(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
934 #  define lshr(r0,r1,r2)                _lshr(_jit,r0,r1,r2)
935 static void _lshr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
936 #  define lshi(r0,r1,i0)                _lshi(_jit,r0,r1,i0)
937 static void _lshi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
938 #  define rshr(r0,r1,r2)                _rshr(_jit,r0,r1,r2)
939 static void _rshr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
940 #  define rshi(r0,r1,i0)                _rshi(_jit,r0,r1,i0)
941 static void _rshi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
942 #  define rshr_u(r0,r1,r2)              _rshr_u(_jit,r0,r1,r2)
943 static void _rshr_u(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
944 #  define rshi_u(r0,r1,i0)              _rshi_u(_jit,r0,r1,i0)
945 static void _rshi_u(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
/*
 * Comparison wrappers.  ccr() forwards to _ccr() with three registers,
 * cci() forwards to _cci() with two registers and a jit_word_t immediate.
 * Both take two ARM condition codes, ct and cf; every wrapper below passes
 * a condition together with its inverse (LT/GE, LO/HS, LE/GT, LS/HI, EQ/NE).
 * The _u variants use the unsigned conditions LO/LS/HS/HI.
 * NOTE(review): presumably ct selects the "true" result and cf the "false"
 * result written to r0 -- confirm in _ccr()/_cci().
 */
946 #  define ccr(ct,cf,r0,r1,r2)           _ccr(_jit,ct,cf,r0,r1,r2)
947 static void _ccr(jit_state_t*,int,int,jit_int32_t,jit_int32_t,jit_int32_t);
948 #  define cci(ct,cf,r0,r1,i0)           _cci(_jit,ct,cf,r0,r1,i0)
949 static void _cci(jit_state_t*,int,int,jit_int32_t,jit_int32_t,jit_word_t);
950 #  define ltr(r0, r1, r2)               ccr(ARM_CC_LT,ARM_CC_GE,r0,r1,r2)
951 #  define lti(r0, r1, i0)               cci(ARM_CC_LT,ARM_CC_GE,r0,r1,i0)
952 #  define ltr_u(r0, r1, r2)             ccr(ARM_CC_LO,ARM_CC_HS,r0,r1,r2)
953 #  define lti_u(r0, r1, i0)             cci(ARM_CC_LO,ARM_CC_HS,r0,r1,i0)
954 #  define ler(r0, r1, r2)               ccr(ARM_CC_LE,ARM_CC_GT,r0,r1,r2)
955 #  define lei(r0, r1, i0)               cci(ARM_CC_LE,ARM_CC_GT,r0,r1,i0)
956 #  define ler_u(r0, r1, r2)             ccr(ARM_CC_LS,ARM_CC_HI,r0,r1,r2)
957 #  define lei_u(r0, r1, i0)             cci(ARM_CC_LS,ARM_CC_HI,r0,r1,i0)
958 #  define eqr(r0, r1, r2)               ccr(ARM_CC_EQ,ARM_CC_NE,r0,r1,r2)
959 #  define eqi(r0, r1, i0)               cci(ARM_CC_EQ,ARM_CC_NE,r0,r1,i0)
960 #  define ger(r0, r1, r2)               ccr(ARM_CC_GE,ARM_CC_LT,r0,r1,r2)
961 #  define gei(r0, r1, i0)               cci(ARM_CC_GE,ARM_CC_LT,r0,r1,i0)
962 #  define ger_u(r0, r1, r2)             ccr(ARM_CC_HS,ARM_CC_LO,r0,r1,r2)
963 #  define gei_u(r0, r1, i0)             cci(ARM_CC_HS,ARM_CC_LO,r0,r1,i0)
964 #  define gtr(r0, r1, r2)               ccr(ARM_CC_GT,ARM_CC_LE,r0,r1,r2)
965 #  define gti(r0, r1, i0)               cci(ARM_CC_GT,ARM_CC_LE,r0,r1,i0)
966 #  define gtr_u(r0, r1, r2)             ccr(ARM_CC_HI,ARM_CC_LS,r0,r1,r2)
967 #  define gti_u(r0, r1, i0)             cci(ARM_CC_HI,ARM_CC_LS,r0,r1,i0)
968 #  define ner(r0,r1,r2)                 _ner(_jit,r0,r1,r2)
969 static void _ner(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
970 #  define nei(r0,r1,i0)                 _nei(_jit,r0,r1,i0)
971 static void _nei(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
/* Unconditional jumps: through a register (jmpr) or to an immediate word
 * (jmpi).  jmpi_p takes an extra jit_bool_t and returns a jit_word_t --
 * presumably the location of the emitted jump so that it can be patched
 * later; confirm against the definition. */
972 #  define jmpr(r0)                      _jmpr(_jit,r0)
973 static void _jmpr(jit_state_t*,jit_int32_t);
974 #  define jmpi(i0)                      _jmpi(_jit,i0)
975 static void _jmpi(jit_state_t*,jit_word_t);
976 #  define jmpi_p(i0, i1)                _jmpi_p(_jit,i0, i1)
977 static jit_word_t _jmpi_p(jit_state_t*,jit_word_t,jit_bool_t);
/* Compare-and-branch.  bccr compares two registers, bcci a register and an
 * immediate; `cc' is the ARM condition on which the branch is taken and i0
 * is the branch target word.  Both return a jit_word_t. */
978 #  define bccr(cc,i0,r0,r1)             _bccr(_jit,cc,i0,r0,r1)
979 static jit_word_t _bccr(jit_state_t*,int,jit_word_t,jit_int32_t,jit_int32_t);
980 #  define bcci(cc,i0,r0,i1)             _bcci(_jit,cc,i0,r0,i1)
981 static jit_word_t _bcci(jit_state_t*,int,jit_word_t,jit_int32_t,jit_word_t);
982 #  define bltr(i0, r0, r1)              bccr(ARM_CC_LT,i0,r0,r1)
983 #  define blti(i0, r0, i1)              bcci(ARM_CC_LT,i0,r0,i1)
984 #  define bltr_u(i0, r0, r1)            bccr(ARM_CC_LO,i0,r0,r1)
985 #  define blti_u(i0, r0, i1)            bcci(ARM_CC_LO,i0,r0,i1)
986 #  define bler(i0, r0, r1)              bccr(ARM_CC_LE,i0,r0,r1)
987 #  define blei(i0, r0, i1)              bcci(ARM_CC_LE,i0,r0,i1)
988 #  define bler_u(i0, r0, r1)            bccr(ARM_CC_LS,i0,r0,r1)
989 #  define blei_u(i0, r0, i1)            bcci(ARM_CC_LS,i0,r0,i1)
990 #  define beqr(i0, r0, r1)              bccr(ARM_CC_EQ,i0,r0,r1)
991 #  define beqi(i0, r0, i1)              bcci(ARM_CC_EQ,i0,r0,i1)
992 #  define bger(i0, r0, r1)              bccr(ARM_CC_GE,i0,r0,r1)
993 #  define bgei(i0, r0, i1)              bcci(ARM_CC_GE,i0,r0,i1)
994 #  define bger_u(i0, r0, r1)            bccr(ARM_CC_HS,i0,r0,r1)
995 #  define bgei_u(i0, r0, i1)            bcci(ARM_CC_HS,i0,r0,i1)
996 #  define bgtr(i0, r0, r1)              bccr(ARM_CC_GT,i0,r0,r1)
997 #  define bgti(i0, r0, i1)              bcci(ARM_CC_GT,i0,r0,i1)
998 #  define bgtr_u(i0, r0, r1)            bccr(ARM_CC_HI,i0,r0,r1)
999 #  define bgti_u(i0, r0, i1)            bcci(ARM_CC_HI,i0,r0,i1)
1000 #  define bner(i0, r0, r1)              bccr(ARM_CC_NE,i0,r0,r1)
1001 #  define bnei(i0, r0, i1)              bcci(ARM_CC_NE,i0,r0,i1)
/* Add-and-branch.  The `o' wrappers branch on VS (signed) or HS (unsigned),
 * the `x' wrappers on the opposite conditions VC / LO; judging by the names
 * these are "branch on overflow" and "branch on no overflow". */
1002 #  define baddr(cc,i0,r0,r1)            _baddr(_jit,cc,i0,r0,r1)
1003 static jit_word_t _baddr(jit_state_t*,int,jit_word_t,jit_int32_t,jit_int32_t);
1004 #  define baddi(cc,i0,r0,r1)            _baddi(_jit,cc,i0,r0,r1)
1005 static jit_word_t _baddi(jit_state_t*,int,jit_word_t,jit_int32_t,jit_word_t);
1006 #  define boaddr(i0,r0,r1)              baddr(ARM_CC_VS,i0,r0,r1)
1007 #  define boaddi(i0,r0,i1)              baddi(ARM_CC_VS,i0,r0,i1)
1008 #  define boaddr_u(i0,r0,r1)            baddr(ARM_CC_HS,i0,r0,r1)
1009 #  define boaddi_u(i0,r0,i1)            baddi(ARM_CC_HS,i0,r0,i1)
1010 #  define bxaddr(i0,r0,r1)              baddr(ARM_CC_VC,i0,r0,r1)
1011 #  define bxaddi(i0,r0,i1)              baddi(ARM_CC_VC,i0,r0,i1)
1012 #  define bxaddr_u(i0,r0,r1)            baddr(ARM_CC_LO,i0,r0,r1)
1013 #  define bxaddi_u(i0,r0,i1)            baddi(ARM_CC_LO,i0,r0,i1)
/* Subtract-and-branch.  Note the unsigned conditions are swapped relative
 * to the add forms: bosub*_u uses LO and bxsub*_u uses HS. */
1014 #  define bsubr(cc,i0,r0,r1)            _bsubr(_jit,cc,i0,r0,r1)
1015 static jit_word_t _bsubr(jit_state_t*,int,jit_word_t,jit_int32_t,jit_int32_t);
1016 #  define bsubi(cc,i0,r0,r1)            _bsubi(_jit,cc,i0,r0,r1)
1017 static jit_word_t _bsubi(jit_state_t*,int,jit_word_t,jit_int32_t,jit_word_t);
1018 #  define bosubr(i0,r0,r1)              bsubr(ARM_CC_VS,i0,r0,r1)
1019 #  define bosubi(i0,r0,i1)              bsubi(ARM_CC_VS,i0,r0,i1)
1020 #  define bosubr_u(i0,r0,r1)            bsubr(ARM_CC_LO,i0,r0,r1)
1021 #  define bosubi_u(i0,r0,i1)            bsubi(ARM_CC_LO,i0,r0,i1)
1022 #  define bxsubr(i0,r0,r1)              bsubr(ARM_CC_VC,i0,r0,r1)
1023 #  define bxsubi(i0,r0,i1)              bsubi(ARM_CC_VC,i0,r0,i1)
1024 #  define bxsubr_u(i0,r0,r1)            bsubr(ARM_CC_HS,i0,r0,r1)
1025 #  define bxsubi_u(i0,r0,i1)            bsubi(ARM_CC_HS,i0,r0,i1)
/* Mask-and-branch: the `s' wrappers branch on NE, the `c' wrappers on EQ
 * (presumably "mask set" / "mask clear"). */
1026 #  define bmxr(cc,i0,r0,r1)             _bmxr(_jit,cc,i0,r0,r1)
1027 static jit_word_t _bmxr(jit_state_t*,int,jit_word_t,jit_int32_t,jit_int32_t);
1028 #  define bmxi(cc,i0,r0,r1)             _bmxi(_jit,cc,i0,r0,r1)
1029 static jit_word_t _bmxi(jit_state_t*,int,jit_word_t,jit_int32_t,jit_word_t);
1030 #  define bmsr(i0,r0,r1)                bmxr(ARM_CC_NE,i0,r0,r1)
1031 #  define bmsi(i0,r0,i1)                bmxi(ARM_CC_NE,i0,r0,i1)
1032 #  define bmcr(i0,r0,r1)                bmxr(ARM_CC_EQ,i0,r0,r1)
1033 #  define bmci(i0,r0,i1)                bmxi(ARM_CC_EQ,i0,r0,i1)
/* Loads.  For every access width there are four addressing forms:
 *   ldr_*  (r0, r1)      address in register r1
 *   ldi_*  (r0, i0)      address is the immediate word i0
 *   ldxr_* (r0, r1, r2)  two registers (presumably base + index)
 *   ldxi_* (r0, r1, i0)  register plus immediate word
 * The suffixes presumably mean c = signed char, uc = unsigned char,
 * s = signed short, us = unsigned short, i = int -- confirm against the
 * definitions, which are outside this section. */
1034 #  define ldr_c(r0,r1)                  _ldr_c(_jit,r0,r1)
1035 static void _ldr_c(jit_state_t*,jit_int32_t,jit_int32_t);
1036 #  define ldi_c(r0,i0)                  _ldi_c(_jit,r0,i0)
1037 static void _ldi_c(jit_state_t*,jit_int32_t,jit_word_t);
1038 #  define ldxr_c(r0,r1,r2)              _ldxr_c(_jit,r0,r1,r2)
1039 static void _ldxr_c(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
1040 #  define ldxi_c(r0,r1,i0)              _ldxi_c(_jit,r0,r1,i0)
1041 static void _ldxi_c(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
1042 #  define ldr_uc(r0,r1)                 _ldr_uc(_jit,r0,r1)
1043 static void _ldr_uc(jit_state_t*,jit_int32_t,jit_int32_t);
1044 #  define ldi_uc(r0,i0)                 _ldi_uc(_jit,r0,i0)
1045 static void _ldi_uc(jit_state_t*,jit_int32_t,jit_word_t);
1046 #  define ldxr_uc(r0,r1,r2)             _ldxr_uc(_jit,r0,r1,r2)
1047 static void _ldxr_uc(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
1048 #  define ldxi_uc(r0,r1,i0)             _ldxi_uc(_jit,r0,r1,i0)
1049 static void _ldxi_uc(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
1050 #  define ldr_s(r0,r1)                  _ldr_s(_jit,r0,r1)
1051 static void _ldr_s(jit_state_t*,jit_int32_t,jit_int32_t);
1052 #  define ldi_s(r0,i0)                  _ldi_s(_jit,r0,i0)
1053 static void _ldi_s(jit_state_t*,jit_int32_t,jit_word_t);
1054 #  define ldxr_s(r0,r1,r2)              _ldxr_s(_jit,r0,r1,r2)
1055 static void _ldxr_s(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
1056 #  define ldxi_s(r0,r1,i0)              _ldxi_s(_jit,r0,r1,i0)
1057 static void _ldxi_s(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
1058 #  define ldr_us(r0,r1)                 _ldr_us(_jit,r0,r1)
1059 static void _ldr_us(jit_state_t*,jit_int32_t,jit_int32_t);
1060 #  define ldi_us(r0,i0)                 _ldi_us(_jit,r0,i0)
1061 static void _ldi_us(jit_state_t*,jit_int32_t,jit_word_t);
1062 #  define ldxr_us(r0,r1,r2)             _ldxr_us(_jit,r0,r1,r2)
1063 static void _ldxr_us(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
1064 #  define ldxi_us(r0,r1,i0)             _ldxi_us(_jit,r0,r1,i0)
1065 static void _ldxi_us(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
/* The word-sized forms back the generic ldr/ldxi aliases defined at the top
 * of the file. */
1066 #  define ldr_i(r0,r1)                  _ldr_i(_jit,r0,r1)
1067 static void _ldr_i(jit_state_t*,jit_int32_t,jit_int32_t);
1068 #  define ldi_i(r0,i0)                  _ldi_i(_jit,r0,i0)
1069 static void _ldi_i(jit_state_t*,jit_int32_t,jit_word_t);
1070 #  define ldxr_i(r0,r1,r2)              _ldxr_i(_jit,r0,r1,r2)
1071 static void _ldxr_i(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
1072 #  define ldxi_i(r0,r1,i0)              _ldxi_i(_jit,r0,r1,i0)
1073 static void _ldxi_i(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
1074 #  define str_c(r0,r1)                  _str_c(_jit,r0,r1)
1075 static void _str_c(jit_state_t*,jit_int32_t,jit_int32_t);
1076 #  define sti_c(i0,r0)                  _sti_c(_jit,i0,r0)
1077 static void _sti_c(jit_state_t*,jit_word_t,jit_int32_t);
1078 #  define stxr_c(r0,r1,r2)              _stxr_c(_jit,r0,r1,r2)
1079 static void _stxr_c(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
1080 #  define stxi_c(r0,r1,i0)              _stxi_c(_jit,r0,r1,i0)
1081 static void _stxi_c(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
1082 #  define str_s(r0,r1)                  _str_s(_jit,r0,r1)
1083 static void _str_s(jit_state_t*,jit_int32_t,jit_int32_t);
1084 #  define sti_s(i0,r0)                  _sti_s(_jit,i0,r0)
1085 static void _sti_s(jit_state_t*,jit_word_t,jit_int32_t);
1086 #  define stxr_s(r0,r1,r2)              _stxr_s(_jit,r0,r1,r2)
1087 static void _stxr_s(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
1088 #  define stxi_s(r0,r1,i0)              _stxi_s(_jit,r0,r1,i0)
1089 static void _stxi_s(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
1090 #  define str_i(r0,r1)                  _str_i(_jit,r0,r1)
1091 static void _str_i(jit_state_t*,jit_int32_t,jit_int32_t);
1092 #  define sti_i(i0,r0)                  _sti_i(_jit,i0,r0)
1093 static void _sti_i(jit_state_t*,jit_word_t,jit_int32_t);
1094 #  define stxr_i(r0,r1,r2)              _stxr_i(_jit,r0,r1,r2)
1095 static void _stxr_i(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
1096 #  define stxi_i(r0,r1,i0)              _stxi_i(_jit,r0,r1,i0)
1097 static void _stxi_i(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
1098 #  if __BYTE_ORDER == __LITTLE_ENDIAN
1099 #  define htonr_us(r0,r1)               _htonr_us(_jit,r0,r1)
1100 static void _htonr_us(jit_state_t*,jit_int32_t,jit_int32_t);
1101 #  define htonr_ui(r0,r1)               _htonr_ui(_jit,r0,r1)
1102 static void _htonr_ui(jit_state_t*,jit_int32_t,jit_int32_t);
1103 #  else
1104 #    define htonr_us(r0,r1)             extr_us(r0,r1)
1105 #    define htonr(r0,r1)                movr(r0,r1)
1106 #  endif
/* Register-to-register extensions; the suffixes presumably follow the load
 * naming (c/uc = signed/unsigned char, s/us = signed/unsigned short). */
1107 #  define extr_c(r0,r1)                 _extr_c(_jit,r0,r1)
1108 static void _extr_c(jit_state_t*,jit_int32_t,jit_int32_t);
1109 #  define extr_uc(r0,r1)                _extr_uc(_jit,r0,r1)
1110 static void _extr_uc(jit_state_t*,jit_int32_t,jit_int32_t);
1111 #  define extr_s(r0,r1)                 _extr_s(_jit,r0,r1)
1112 static void _extr_s(jit_state_t*,jit_int32_t,jit_int32_t);
1113 #  define extr_us(r0,r1)                _extr_us(_jit,r0,r1)
1114 static void _extr_us(jit_state_t*,jit_int32_t,jit_int32_t);
/* Function prolog and epilog; both receive a jit_node_t pointer. */
1115 #  define prolog(i0)                    _prolog(_jit,i0)
1116 static void _prolog(jit_state_t*,jit_node_t*);
1117 #  define epilog(i0)                    _epilog(_jit,i0)
1118 static void _epilog(jit_state_t*,jit_node_t*);
/* Calls through a register (callr) or to an immediate word (calli).
 * calli_p returns a jit_word_t -- presumably the location to patch once the
 * target is known; confirm against the definition. */
1119 #  define callr(r0)                     _callr(_jit,r0)
1120 static void _callr(jit_state_t*,jit_int32_t);
1121 #  define calli(i0)                     _calli(_jit,i0)
1122 static void _calli(jit_state_t*,jit_word_t);
1123 #  define calli_p(i0)                   _calli_p(_jit,i0)
1124 static jit_word_t _calli_p(jit_state_t*,jit_word_t);
/* Variable-argument support. */
1125 #  define vastart(r0)                   _vastart(_jit, r0)
1126 static void _vastart(jit_state_t*, jit_int32_t);
1127 #  define vaarg(r0, r1)                 _vaarg(_jit, r0, r1)
1128 static void _vaarg(jit_state_t*, jit_int32_t, jit_int32_t);
/* Patch the instruction at `jump' so that it refers to `label'; `kind'
 * selects how (its values are defined outside this section). */
1129 #  define patch_at(kind,jump,label)     _patch_at(_jit,kind,jump,label)
1130 static void _patch_at(jit_state_t*,jit_int32_t,jit_word_t,jit_word_t);
1131 #endif
1132
1133 #if CODE
/* from binutils */
/* Rotate the 32-bit value v left by n bits, 0 <= n < 32.  The right-shift
 * count is reduced modulo 32 so that n == 0 does not shift by the full width
 * of the type, which is undefined behaviour in C.  Arguments are evaluated
 * more than once. */
#  define rotate_left(v, n)     ((v) << (n) | (v) >> ((32 - (n)) & 31))
/*
 * Encode v as an ARM "modified immediate": an 8-bit constant rotated right
 * by an even amount.
 *
 * Every even left rotation i of v is tried in increasing order; the first
 * one that brings v into 0..0xff wins.  The result holds the 8-bit constant
 * in bits 7:0 and i/2 in the bits above it (i << 7).
 *
 * Returns the encoding, or -1 when v cannot be represented.
 */
static int
encode_arm_immediate(unsigned int v)
{
    unsigned int        a, i;

    for (i = 0; i < 32; i += 2)
        if ((a = rotate_left(v, i)) <= 0xff)
            return (a | (i << 7));

    return (-1);
}
1147
/*
 * Encode v as a Thumb-2 "modified immediate".
 *
 * The returned value has the 8-bit payload in bits 7:0, a 3-bit field at
 * bits 14:12 and a 1-bit field at bit 26.  Recognised forms, tried in order:
 *   - a plain byte                               (field = 0)
 *   - 00000000 abcdefgh 00000000 abcdefgh        (field = 1)
 *   - abcdefgh 00000000 abcdefgh 00000000        (field = 2)
 *   - abcdefgh repeated in all four bytes        (field = 3)
 *   - an 8-bit value with its top bit set, rotated right by 8..31
 *
 * Returns the encoding, or -1 when v cannot be represented.
 */
static int
encode_thumb_immediate(unsigned int v)
{
    int                 i;
    unsigned int        m;
    unsigned int        n;
    /* 00000000 00000000 00000000 abcdefgh */
    if ((v & 0xff) == v)
        return (v);
    /* 00000000 abcdefgh 00000000 abcdefgh */
    if ((v & 0xff00ff) == v && ((v & 0xff0000) >> 16) == (v & 0xff))
        return ((v & 0xff) | (1 << 12));
    /* abcdefgh 00000000 abcdefgh 00000000 */
    if (((v & 0xffff0000) >> 16) == (v & 0xffff) && (v & 0xff) == 0)
        /* the payload lives in bits 15:8 here; the low byte is zero */
        return (((v & 0x0000ff00) >> 8) | (2 << 12));
    /* abcdefgh abcdefgh abcdefgh abcdefgh */
    if ( (v &    0xff)        == ((v &     0xff00) >>  8) &&
        ((v &   0xff00) >> 8) == ((v &   0xff0000) >> 16) &&
        ((v & 0xff0000) << 8) ==  (v & 0xff000000))
        return ((v & 0xff) | (3 << 12));
    /* 1bcdefgh << 24 ... 1bcdefgh << 1
     * i is the right-rotation amount; m is the 8-bit window for that
     * rotation and n its top bit, which must be set. */
    for (i = 8, m = 0xff000000, n = 0x80000000;
         i < 32; i++, m >>= 1,  n >>= 1) {
        if ((v & m) == v && (v & n)) {
            v >>= 32 - i;
            /* bit 7 of the payload doubles as the low bit of the rotation */
            if (!(i & 1))
                v &= 0x7f;
            i >>= 1;
            return (((i & 7) << 12) | ((i & 8) << 23) | v);
        }
    }
    return (-1);
}
1181
/*
 * Scatter a plain 12-bit immediate into its instruction fields: bit 11 goes
 * to bit 26, bits 10:8 to bits 14:12 and the low byte stays in place.
 * Returns -1 when v has any of bits 31:12 set.
 */
static int
encode_thumb_word_immediate(unsigned int v)
{
    unsigned int        top, mid, low;

    if (v & 0xfffff000)
        return (-1);
    top = (v & 0x800) << 15;
    mid = (v & 0x700) << 4;
    low = v & 0xff;
    return (top | mid | low);
}
1189
/*
 * Encode a signed 24-bit branch displacement v into instruction fields.
 *
 * Bit 23 of v becomes the sign bit at bit 26.  Bits 22 and 21 are stored at
 * bits 13 and 11, unchanged when the sign bit is set and inverted otherwise.
 * Bits 20:11 are moved up to bits 25:16 and bits 10:0 stay in place.
 *
 * Returns -1 when v is outside -0x800000..0x7fffff.
 */
static int
encode_thumb_jump(int v)
{
    int         sign, hi1, hi2, j1, j2;

    if (v < (int)-0x800000 || v > 0x7fffff)
        return (-1);

    sign = (v & 0x800000) != 0;
    hi1  = (v & 0x400000) != 0;
    hi2  = (v & 0x200000) != 0;
    if (sign) {
        j1 = hi1;
        j2 = hi2;
    }
    else {
        j1 = !hi1;
        j2 = !hi2;
    }
    return ((sign << 26) | ((v & 0x1ff800) << 5) |
            (j1 << 13) | (j2 << 11) | (v & 0x7ff));
}
1204
/*
 * Encode a signed 20-bit conditional-branch displacement v.
 *
 * Bit 19 of v becomes the sign bit at bit 26, bit 17 goes to bit 13, bit 18
 * to bit 11, bits 16:11 move up to bits 21:16 and bits 10:0 stay in place.
 *
 * Returns -1 when v is outside -0x80000..0x7ffff.
 */
static int
encode_thumb_cc_jump(int v)
{
    int         sign, b17, b18;

    if (v < (int)-0x80000 || v > 0x7ffff)
        return (-1);

    sign = (v & 0x80000) != 0;
    b17  = (v & 0x20000) != 0;
    b18  = (v & 0x40000) != 0;
    return ((sign << 26) | ((v & 0x1f800) << 5) |
            (b17 << 13) | (b18 << 11) | (v & 0x7ff));
}
1217
1218 static int
1219 encode_thumb_shift(int v, int type)
1220 {
1221     switch (type) {
1222         case ARM_ASR:
1223         case ARM_LSL:
1224         case ARM_LSR:           type >>= 1;     break;
1225         default:                assert(!"handled shift");
1226     }
1227     assert(v >= 0 && v <= 31);
1228     return (((v & 0x1c) << 10) | ((v & 3) << 6) | type);
1229 }
1230
1231 static void
1232 _tcit(jit_state_t *_jit, unsigned int tc, int it)
1233 {
1234     int         c;
1235     int         m;
1236     c = (tc >> 28) & 1;
1237     assert(!(tc & 0xfffffff) && tc != ARM_CC_NV);
1238     switch (it) {
1239         case THUMB2_IT:         m =   1<<3;                     break;
1240         case THUMB2_ITT:        m =  (c<<3)| (1<<2);            break;
1241         case THUMB2_ITE:        m = (!c<<3)| (1<<2);            break;
1242         case THUMB2_ITTT:       m =  (c<<3)| (c<<2)| (1<<1);    break;
1243         case THUMB2_ITET:       m = (!c<<3)| (c<<2)| (1<<1);    break;
1244         case THUMB2_ITTE:       m =  (c<<3)|(!c<<2)| (1<<1);    break;
1245         case THUMB2_ITEE:       m = (!c<<3)|(!c<<2)| (1<<1);    break;
1246         case THUMB2_ITTTT:      m =  (c<<3)| (c<<2)| (c<<1)|1;  break;
1247         case THUMB2_ITETT:      m = (!c<<3)| (c<<2)| (c<<1)|1;  break;
1248         case THUMB2_ITTET:      m =  (c<<3)|(!c<<2)| (c<<1)|1;  break;
1249         case THUMB2_ITEET:      m = (!c<<3)|(!c<<2)| (c<<1)|1;  break;
1250         case THUMB2_ITTTE:      m =  (c<<3)| (c<<2)|(!c<<1)|1;  break;
1251         case THUMB2_ITETE:      m = (!c<<3)| (c<<2)|(!c<<1)|1;  break;
1252         case THUMB2_ITTEE:      m =  (c<<3)|(!c<<2)|(!c<<1)|1;  break;
1253         case THUMB2_ITEEE:      m = (!c<<3)|(!c<<2)|(!c<<1)|1;  break;
1254         default:                abort();
1255     }
1256     assert(m && (tc != ARM_CC_AL || !(m & (m - 1))));
1257     is(0xbf00 | (tc >> 24) | m);
1258 }
1259
1260 static void
1261 _corrr(jit_state_t *_jit, int cc, int o, int rn, int rd, int rm)
1262 {
1263     assert(!(cc & 0x0fffffff));
1264     assert(!(o  & 0xf00fff0f));
1265     ii(cc|o|(_u4(rn)<<16)|(_u4(rd)<<12)|_u4(rm));
1266 }
1267
1268 static void
1269 _corri(jit_state_t *_jit, int cc, int o, int rn, int rd, int im)
1270 {
1271     assert(!(cc & 0x0fffffff));
1272     assert(!(o  & 0xf00fffff));
1273     assert(!(im & 0xfffff000));
1274     ii(cc|o|(_u4(rn)<<16)|(_u4(rd)<<12)|_u12(im));
1275 }
1276
1277 static void
1278 _corri8(jit_state_t *_jit, int cc, int o, int rn, int rt, int im)
1279 {
1280     assert(!(cc & 0x0fffffff));
1281     assert(!(o  & 0xf00fff0f));
1282     assert(!(im & 0xffffff00));
1283     ii(cc|o|(_u4(rn)<<16)|(_u4(rt)<<12)|((im&0xf0)<<4)|(im&0x0f));
1284 }
1285
1286 static void
1287 _coriw(jit_state_t *_jit, int cc, int o, int rd, int im)
1288 {
1289     assert(!(cc & 0x0fffffff));
1290     assert(!(o  & 0xf00fffff));
1291     assert(!(im & 0xffff0000));
1292     ii(cc|o|((im&0xf000)<<4)|(_u4(rd)<<12)|(im&0xfff));
1293 }
1294
1295 static void
1296 _torrr(jit_state_t *_jit, int o, int rn, int rd, int rm)
1297 {
1298     jit_thumb_t thumb;
1299     assert(!(o & 0xf0f0f));
1300     thumb.i = o|(_u4(rn)<<16)|(_u4(rd)<<8)|_u4(rm);
1301     iss(thumb.s[0], thumb.s[1]);
1302 }
1303
1304 static void
1305 _torrrs(jit_state_t *_jit, int o, int rn, int rd, int rm, int im)
1306 {
1307     jit_thumb_t thumb;
1308     assert(!(o  & 0x000f0f0f));
1309     assert(!(im & 0xffff8f0f));
1310     thumb.i = o|(_u4(rn)<<16)|(_u4(rd)<<8)|im|_u4(rm);
1311     iss(thumb.s[0], thumb.s[1]);
1312 }
1313
1314 static void
1315 _torxr(jit_state_t *_jit, int o, int rn, int rt, int rm)
1316 {
1317     jit_thumb_t thumb;
1318     assert(!(o & 0xf0f0f));
1319     thumb.i = o|(_u4(rn)<<16)|(_u4(rt)<<12)|_u4(rm);
1320     iss(thumb.s[0], thumb.s[1]);
1321 }
1322
1323 static void
1324 _torrrr(jit_state_t *_jit, int o, int rn, int rl, int rh, int rm)
1325 {
1326     jit_thumb_t thumb;
1327     assert(!(o & 0x000fff0f));
1328     thumb.i = o|(_u4(rn)<<16)|(_u4(rl)<<12)|(_u4(rh)<<8)|_u4(rm);
1329     iss(thumb.s[0], thumb.s[1]);
1330 }
1331
1332 static void
1333 _torrri8(jit_state_t *_jit, int o, int rn, int rt, int rt2, int im)
1334 {
1335     jit_thumb_t thumb;
1336     assert(!(o  & 0x000fffff));
1337     assert(!(im & 0xffffff00));
1338     thumb.i = o|(_u4(rn)<<16)|(_u4(rt)<<12)|(_u4(rt2)<<8)|im;
1339     iss(thumb.s[0], thumb.s[1]);
1340 }
1341
1342 static void
1343 _torri(jit_state_t *_jit, int o, int rn, int rd, int im)
1344 {
1345     jit_thumb_t thumb;
1346     assert(!(o  & 0x0c0f7fff));
1347     assert(!(im & 0xfbff8f00));
1348     thumb.i = o|(_u4(rn)<<16)|(_u4(rd)<<8)|im;
1349     iss(thumb.s[0], thumb.s[1]);
1350 }
1351
1352 static void
1353 _torri8(jit_state_t *_jit, int o, int rn, int rt, int im)
1354 {
1355     jit_thumb_t thumb;
1356     assert(!(o  & 0x000ff0ff));
1357     assert(!(im & 0xffffff00));
1358     thumb.i = o|(_u4(rn)<<16)|(_u4(rt)<<12)|im;
1359     iss(thumb.s[0], thumb.s[1]);
1360 }
1361
1362 static void
1363 _torri12(jit_state_t *_jit, int o, int rn, int rt, int im)
1364 {
1365     jit_thumb_t thumb;
1366     assert(!(o  & 0x000fffff));
1367     assert(!(im & 0xfffff000));
1368     thumb.i = o|(_u4(rn)<<16)|(_u4(rt)<<12)|im;
1369     iss(thumb.s[0], thumb.s[1]);
1370 }
1371
1372 static void
1373 _tshift(jit_state_t *_jit, int o, int rd, int rm, int im)
1374 {
1375     jit_thumb_t thumb;
1376     assert(!(o & 0x7fcf));
1377     assert(im >= 0 && im < 32);
1378     thumb.i = o|((im&0x1c)<<10)|(_u4(rd)<<8)|((im&3)<<6)|_u4(rm);
1379     iss(thumb.s[0], thumb.s[1]);
1380 }
1381
1382 static void
1383 _toriw(jit_state_t *_jit, int o, int rd, int im)
1384 {
1385     jit_thumb_t thumb;
1386     assert(!(im & 0xffff0000));
1387     thumb.i = o|((im&0xf000)<<4)|((im&0x800)<<15)|((im&0x700)<<4)|(_u4(rd)<<8)|(im&0xff);
1388     iss(thumb.s[0], thumb.s[1]);
1389 }
1390
1391 static void
1392 _tc8(jit_state_t *_jit, int cc, int im)
1393 {
1394     assert(!(cc & 0x0fffffff));
1395     assert(cc != ARM_CC_AL && cc != ARM_CC_NV);
1396     assert(im >= -128 && im <= 127);
1397     is(THUMB_CC_B|(cc>>20)|(im&0xff));
1398 }
1399
1400 static void
1401 _t11(jit_state_t *_jit, int im)
1402 {
1403     assert(!(im & 0xfffff800));
1404     is(THUMB_B|im);
1405 }
1406
1407 static void
1408 _tcb(jit_state_t *_jit, int cc, int im)
1409 {
1410     jit_thumb_t thumb;
1411     assert(!(cc & 0xfffffff));
1412     assert(cc != ARM_CC_AL && cc != ARM_CC_NV);
1413     cc = ((jit_uint32_t)cc) >> 6;
1414     assert(!(im & (THUMB2_CC_B|cc)));
1415     thumb.i = THUMB2_CC_B|cc|im;
1416     iss(thumb.s[0], thumb.s[1]);
1417 }
1418
1419 static void
1420 _blxi(jit_state_t *_jit, int im)
1421 {
1422     assert(!(im & 0xfe000000));
1423     ii(ARM_BLXI|im);
1424 }
1425
1426 static void
1427 _tb(jit_state_t *_jit, int o, int im)
1428 {
1429     jit_thumb_t thumb;
1430     assert(!(o & 0x07ff2fff));
1431     assert(!(o & im));
1432     thumb.i = o|im;
1433     iss(thumb.s[0], thumb.s[1]);
1434 }
1435
1436 static void
1437 _corrrr(jit_state_t *_jit, int cc, int o, int rh, int rl, int rm, int rn)
1438 {
1439     assert(!(cc & 0x0fffffff));
1440     assert(!(o & 0xf00fff0f));
1441     ii(cc|o|(_u4(rh)<<16)|(_u4(rl)<<12)|(_u4(rm)<<8)|_u4(rn));
1442 }
1443
1444 static void
1445 _corrrs(jit_state_t *_jit, int cc, int o, int rn, int rd, int rm, int im)
1446 {
1447     assert(!(cc & 0x0fffffff));
1448     assert(!(o  & 0xf000ff8f));
1449     ii(cc|o|(_u4(rd)<<12)|(_u4(rn)<<16)|(im<<7)|_u4(rm));
1450 }
1451
1452 static void
1453 _cshift(jit_state_t *_jit, int cc, int o, int rd, int rm, int rn, int im)
1454 {
1455     assert(!(cc & 0x0fffffff));
1456     assert(!(o  & 0xffe0ff8f));
1457     assert(((_u4(rm)<<8)&(im<<7)) == 0);
1458     ii(cc|ARM_SHIFT|o|(_u4(rd)<<12)|(_u4(rm)<<8)|(im<<7)|_u4(rn));
1459 }
1460
1461 static void
1462 _cb(jit_state_t *_jit, int cc, int o, int im)
1463 {
1464     assert(!(cc & 0x0fffffff));
1465     assert(!(o  & 0xf0ffffff));
1466     ii(cc|o|_u24(im));
1467 }
1468
1469 static void
1470 _cbx(jit_state_t *_jit, int cc, int o, int rm)
1471 {
1472     assert(!(cc & 0x0fffffff));
1473     assert(!(o  & 0xf000000f));
1474     ii(cc|o|_u4(rm));
1475 }
1476
1477 static void
1478 _corl(jit_state_t *_jit, int cc, int o, int r0, int i0)
1479 {
1480     assert(!(cc & 0x0fffffff));
1481     assert(!(o  & 0xf00fffff));
1482     ii(cc|o|(_u4(r0)<<16)|_u16(i0));
1483 }
1484
1485 static void
1486 _c6orr(jit_state_t *_jit, int cc, int o, int rd, int rm)
1487 {
1488     assert(!(cc & 0x0fffffff));
1489     assert(!(o  & 0xf000f00f));
1490     ii(cc|o|(_u4(rd)<<12)|_u4(rm));
1491 }
1492
1493 static void
1494 _tpp(jit_state_t *_jit, int o, int im)
1495 {
1496     jit_thumb_t thumb;
1497     assert(!(o & 0x0000ffff));
1498     if (o == THUMB2_PUSH)
1499         assert(!(im & 0x8000));
1500     assert(__builtin_popcount(im & 0x1fff) > 1);
1501     thumb.i = o|im;
1502     iss(thumb.s[0], thumb.s[1]);
1503 }
1504
1505 static void
1506 _torl(jit_state_t *_jit, int o, int rn, int im)
1507 {
1508     jit_thumb_t thumb;
1509     assert(!(o & 0xf1fff));
1510     assert(rn != _R15 || !im || ((o & 0xc000) == 0xc000));
1511     assert(!(o & THUMB2_LDM_W) || !(im & (1 << rn)));
1512     thumb.i = o | (_u4(rn)<<16)|_u13(im);
1513     iss(thumb.s[0], thumb.s[1]);
1514 }
1515
1516 static void
1517 _nop(jit_state_t *_jit, jit_int32_t i0)
1518 {
1519     if (jit_thumb_p()) {
1520         for (; i0 > 0; i0 -= 2)
1521             T1_NOP();
1522     }
1523     else {
1524         for (; i0 > 0; i0 -= 4)
1525             NOP();
1526     }
1527     assert(i0 == 0);
1528 }
1529
1530 static void
1531 _movr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
1532 {
1533     if (r0 != r1) {
1534         if (jit_thumb_p())
1535             T1_MOV(r0, r1);
1536         else
1537             MOV(r0, r1);
1538     }
1539 }
1540
1541 static void
1542 _movi(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
1543 {
1544     int                 i;
1545     if (jit_thumb_p()) {
1546         if (!jit_no_set_flags() && r0 < 8 && !(i0 & 0xffffff80))
1547             T1_MOVI(r0, i0);
1548         else if ((i = encode_thumb_immediate(i0)) != -1)
1549             T2_MOVI(r0, i);
1550         else if ((i = encode_thumb_immediate(~i0)) != -1)
1551             T2_MVNI(r0, i);
1552         else {
1553             T2_MOVWI(r0, (jit_uint16_t)i0);
1554             if (i0 & 0xffff0000)
1555                 T2_MOVTI(r0, (jit_uint16_t)((unsigned)i0 >> 16));
1556         }
1557     }
1558     else {
1559         if (jit_armv6_p() && !(i0 & 0xffff0000))
1560             MOVWI(r0, i0);
1561         else if ((i = encode_arm_immediate(i0)) != -1)
1562             MOVI(r0, i);
1563         else if ((i = encode_arm_immediate(~i0)) != -1)
1564             MVNI(r0, i);
1565         else if (jit_armv6_p()) {
1566             MOVWI(r0, (jit_uint16_t)(i0));
1567             if ((i0 & 0xffff0000))
1568                 MOVTI(r0, (jit_uint16_t)((unsigned)i0 >> 16));
1569         }
1570         else
1571             load_const(0, r0, i0);
1572     }
1573 }
1574
1575 static jit_word_t
1576 _movi_p(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
1577 {
1578     jit_word_t          w;
1579     w = _jit->pc.w;
1580     if (jit_thumb_p()) {
1581         T2_MOVWI(r0, (jit_uint16_t)(i0));
1582         T2_MOVTI(r0, (jit_uint16_t)((unsigned)i0 >> 16));
1583     }
1584     else
1585         load_const(1, r0, 0);
1586     return (w);
1587 }
1588
1589 static void
1590 _movznr(jit_state_t *_jit, int ct, jit_int32_t r0,
1591         jit_int32_t r1, jit_int32_t r2)
1592 {
1593     if (jit_thumb_p()) {
1594         if (r2 < 7)
1595             T1_CMPI(r2, 0);
1596         else
1597             T2_CMPI(r2, 0);
1598         IT(ct);
1599         T1_MOV(r0, r1);
1600     } else {
1601         CMPI(r2, 0);
1602         CC_MOV(ct, r0, r1);
1603     }
1604 }
1605
1606 static void
1607 _movnr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1608 {
1609     _movznr(_jit, ARM_CC_NE, r0, r1, r2);
1610 }
1611
1612 static void
1613 _movzr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1614 {
1615     _movznr(_jit, ARM_CC_EQ, r0, r1, r2);
1616 }
1617
1618 static void
1619 _comr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
1620 {
1621     if (jit_thumb_p()) {
1622         if (!jit_no_set_flags() && (r0|r1) < 8)
1623             T1_NOT(r0, r1);
1624         else
1625             T2_NOT(r0, r1);
1626     }
1627     else
1628         NOT(r0, r1);
1629 }
1630
1631 static void
1632 _negr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
1633 {
1634     if (jit_thumb_p()) {
1635         if (!jit_no_set_flags() && (r0|r1) < 8)
1636             T1_RSBI(r0, r1);
1637         else
1638             T2_RSBI(r0, r1, 0);
1639     }
1640     else
1641         RSBI(r0, r1, 0);
1642 }
1643
1644 static void
1645 _addr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1646 {
1647     if (jit_thumb_p()) {
1648         if (!jit_no_set_flags() && (r0|r1|r2) < 8)
1649             T1_ADD(r0, r1, r2);
1650         else if (r0 == r1 || r0 == r2)
1651             T1_ADDX(r0, r0 == r1 ? r2 : r1);
1652         else
1653             T2_ADD(r0, r1, r2);
1654     }
1655     else
1656         ADD(r0, r1, r2);
1657 }
1658
1659 static void
1660 _addi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1661 {
1662     int                 i;
1663     jit_int32_t         reg;
1664     if (jit_thumb_p()) {
1665         if (!jit_no_set_flags() && (r0|r1) < 8 && !(i0 & ~7))
1666             T1_ADDI3(r0, r1, i0);
1667         else if (!jit_no_set_flags() && (r0|r1) < 8 && !(-i0 & ~7))
1668             T1_SUBI3(r0, r1, -i0);
1669         else if (!jit_no_set_flags() && r0 < 8 && r0 == r1 && !(i0 & ~0xff))
1670             T1_ADDI8(r0, i0);
1671         else if (!jit_no_set_flags() && r0 < 8 && r0 == r1 && !(-i0 & ~0xff))
1672             T1_SUBI8(r0, -i0);
1673         else if ((i = encode_thumb_immediate(i0)) != -1)
1674             T2_ADDI(r0, r1, i);
1675         else if ((i = encode_thumb_immediate(-i0)) != -1)
1676             T2_SUBI(r0, r1, i);
1677         else if ((i = encode_thumb_word_immediate(i0)) != -1)
1678             T2_ADDWI(r0, r1, i);
1679         else if ((i = encode_thumb_word_immediate(-i0)) != -1)
1680             T2_SUBWI(r0, r1, i);
1681         else {
1682             reg = jit_get_reg(jit_class_gpr);
1683             movi(rn(reg), i0);
1684             T2_ADD(r0, r1, rn(reg));
1685             jit_unget_reg(reg);
1686         }
1687     }
1688     else {
1689         if ((i = encode_arm_immediate(i0)) != -1)
1690             ADDI(r0, r1, i);
1691         else if ((i = encode_arm_immediate(-i0)) != -1)
1692             SUBI(r0, r1, i);
1693         else if (r0 != r1) {
1694             movi(r0, i0);
1695             ADD(r0, r1, r0);
1696         }
1697         else {
1698             reg = jit_get_reg(jit_class_gpr);
1699             movi(rn(reg), i0);
1700             ADD(r0, r1, rn(reg));
1701             jit_unget_reg(reg);
1702         }
1703     }
1704 }
1705
1706 static void
1707 _addcr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1708 {
1709     if (jit_thumb_p()) {
1710         /* thumb auto set carry if not inside IT block */
1711         if ((r0|r1|r2) < 8)
1712             T1_ADD(r0, r1, r2);
1713         else
1714             T2_ADDS(r0, r1, r2);
1715     }
1716     else
1717         ADDS(r0, r1, r2);
1718 }
1719
1720 static void
1721 _addci(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1722 {
1723     int                 i;
1724     jit_int32_t         reg;
1725     if (jit_thumb_p()) {
1726         if ((r0|r1) < 8 && !(i0 & ~7))
1727             T1_ADDI3(r0, r1, i0);
1728         else if ((r0|r1) < 8 && !(-i0 & ~7))
1729             T1_SUBI3(r0, r1, -i0);
1730         else if (r0 < 8 && r0 == r1 && !(i0 & ~0xff))
1731             T1_ADDI8(r0, i0);
1732         else if (r0 < 8 && r0 == r1 && !(-i0 & ~0xff))
1733             T1_SUBI8(r0, -i0);
1734         else if ((i = encode_thumb_immediate(i0)) != -1)
1735             T2_ADDSI(r0, r1, i);
1736         else if ((i = encode_thumb_immediate(-i0)) != -1)
1737             T2_SUBSI(r0, r1, i);
1738         else {
1739             reg = jit_get_reg(jit_class_gpr);
1740             movi(rn(reg), i0);
1741             T2_ADDS(r0, r1, rn(reg));
1742             jit_unget_reg(reg);
1743         }
1744     }
1745     else {
1746         if ((i = encode_arm_immediate(i0)) != -1)
1747             ADDSI(r0, r1, i);
1748         else if ((i = encode_arm_immediate(-i0)) != -1)
1749             SUBSI(r0, r1, i);
1750         else if (r0 != r1) {
1751             movi(r0, i0);
1752             ADDS(r0, r1, r0);
1753         }
1754         else {
1755             reg = jit_get_reg(jit_class_gpr);
1756             movi(rn(reg), i0);
1757             ADDS(r0, r1, rn(reg));
1758             jit_unget_reg(reg);
1759         }
1760     }
1761 }
1762
1763 static void
1764 _addxr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1765 {
1766     /* keep setting carry because don't know last ADC */
1767     if (jit_thumb_p()) {
1768         /* thumb auto set carry if not inside IT block */
1769         if ((r0|r1|r2) < 8 && (r0 == r1 || r0 == r2))
1770             T1_ADC(r0, r0 == r1 ? r2 : r1);
1771         else
1772             T2_ADCS(r0, r1, r2);
1773     }
1774     else
1775         ADCS(r0, r1, r2);
1776 }
1777
1778 static void
1779 _addxi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1780 {
1781     int                 i;
1782     jit_int32_t         reg;
1783     int                 no_set_flags;
1784     if (jit_thumb_p()) {
1785         no_set_flags = jit_no_set_flags();
1786         jit_no_set_flags() = 1;
1787         if ((i = encode_thumb_immediate(i0)) != -1)
1788             T2_ADCSI(r0, r1, i);
1789         else if ((i = encode_thumb_immediate(-i0)) != -1)
1790             T2_SBCSI(r0, r1, i);
1791         else if (r0 != r1) {
1792             movi(r0, i0);
1793             T2_ADCS(r0, r1, r0);
1794         }
1795         else {
1796             reg = jit_get_reg(jit_class_gpr);
1797             movi(rn(reg), i0);
1798             T2_ADCS(r0, r1, rn(reg));
1799             jit_unget_reg(reg);
1800         }
1801         jit_no_set_flags() = no_set_flags;
1802     }
1803     else {
1804         if ((i = encode_arm_immediate(i0)) != -1)
1805             ADCSI(r0, r1, i);
1806         else if ((i = encode_arm_immediate(-i0)) != -1)
1807             SBCSI(r0, r1, i);
1808         else if (r0 != r1) {
1809             movi(r0, i0);
1810             ADCS(r0, r1, r0);
1811         }
1812         else {
1813             reg = jit_get_reg(jit_class_gpr);
1814             movi(rn(reg), i0);
1815             ADCS(r0, r1, rn(reg));
1816             jit_unget_reg(reg);
1817         }
1818     }
1819 }
1820
1821 static void
1822 _subr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1823 {
1824     if (jit_thumb_p()) {
1825         if (!jit_no_set_flags() && (r0|r1|r2) < 8)
1826             T1_SUB(r0, r1, r2);
1827         else
1828             T2_SUB(r0, r1, r2);
1829     }
1830     else
1831         SUB(r0, r1, r2);
1832 }
1833
1834 static void
1835 _subi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1836 {
1837     int                 i;
1838     jit_int32_t         reg;
1839     if (jit_thumb_p()) {
1840         if (!jit_no_set_flags() && (r0|r1) < 8 && !(i0 & ~7))
1841             T1_SUBI3(r0, r1, i0);
1842         else if (!jit_no_set_flags() && (r0|r1) < 8 && !(-i0 & ~7))
1843             T1_ADDI3(r0, r1, -i0);
1844         else if (!jit_no_set_flags() && r0 < 8 && r0 == r1 && !(i0 & ~0xff))
1845             T1_SUBI8(r0, i0);
1846         else if (!jit_no_set_flags() && r0 < 8 && r0 == r1 && !(-i0 & ~0xff))
1847             T1_ADDI8(r0, -i0);
1848         else if ((i = encode_thumb_immediate(i0)) != -1)
1849             T2_SUBI(r0, r1, i);
1850         else if ((i = encode_thumb_immediate(-i0)) != -1)
1851             T2_ADDI(r0, r1, i);
1852         else if ((i = encode_thumb_word_immediate(i0)) != -1)
1853             T2_SUBWI(r0, r1, i);
1854         else if ((i = encode_thumb_word_immediate(-i0)) != -1)
1855             T2_ADDWI(r0, r1, i);
1856         else {
1857             reg = jit_get_reg(jit_class_gpr);
1858             movi(rn(reg), i0);
1859             T2_SUB(r0, r1, rn(reg));
1860             jit_unget_reg(reg);
1861         }
1862     }
1863     else {
1864         if ((i = encode_arm_immediate(i0)) != -1)
1865             SUBI(r0, r1, i);
1866         else if ((i = encode_arm_immediate(-i0)) != -1)
1867             ADDI(r0, r1, i);
1868         else if (r0 != r1) {
1869             movi(r0, i0);
1870             SUB(r0, r1, r0);
1871         }
1872         else {
1873             reg = jit_get_reg(jit_class_gpr);
1874             movi(rn(reg), i0);
1875             SUB(r0, r1, rn(reg));
1876             jit_unget_reg(reg);
1877         }
1878     }
1879 }
1880
1881 static void
1882 _subcr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1883 {
1884     if (jit_thumb_p()) {
1885         /* thumb auto set carry if not inside IT block */
1886         if ((r0|r1|r2) < 8)
1887             T1_SUB(r0, r1, r2);
1888         else
1889             T2_SUBS(r0, r1, r2);
1890     }
1891     else
1892         SUBS(r0, r1, r2);
1893 }
1894
1895 static void
1896 _subci(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1897 {
1898     int                 i;
1899     jit_int32_t         reg;
1900     if (jit_thumb_p()) {
1901         if ((r0|r1) < 8 && !(i0 & ~7))
1902             T1_SUBI3(r0, r1, i0);
1903         else if ((r0|r1) < 8 && !(-i0 & ~7))
1904             T1_ADDI3(r0, r1, -i0);
1905         else if (r0 < 8 && r0 == r1 && !(i0 & ~0xff))
1906             T1_SUBI8(r0, i0);
1907         else if (r0 < 8 && r0 == r1 && !(-i0 & ~0xff))
1908             T1_ADDI8(r0, -i0);
1909         else if ((i = encode_thumb_immediate(i0)) != -1)
1910             T2_SUBSI(r0, r1, i);
1911         else if ((i = encode_thumb_immediate(-i0)) != -1)
1912             T2_ADDSI(r0, r1, i);
1913         else {
1914             reg = jit_get_reg(jit_class_gpr);
1915             movi(rn(reg), i0);
1916             T2_SUBS(r0, r1, rn(reg));
1917             jit_unget_reg(reg);
1918         }
1919     }
1920     else {
1921         if ((i = encode_arm_immediate(i0)) != -1)
1922             SUBSI(r0, r1, i);
1923         else if ((i = encode_arm_immediate(-i0)) != -1)
1924             ADDSI(r0, r1, i);
1925         else if (r0 != r1) {
1926             movi(r0, i0);
1927             SUBS(r0, r1, r0);
1928         }
1929         else {
1930             reg = jit_get_reg(jit_class_gpr);
1931             movi(rn(reg), i0);
1932             SUBS(r0, r1, rn(reg));
1933             jit_unget_reg(reg);
1934         }
1935     }
1936 }
1937
1938 static void
1939 _subxr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1940 {
1941     /* keep setting carry because don't know last SBC */
1942     if (jit_thumb_p()) {
1943         /* thumb auto set carry if not inside IT block */
1944         if ((r0|r1|r2) < 8 && r0 == r1)
1945             T1_SBC(r0, r2);
1946         else
1947             T2_SBCS(r0, r1, r2);
1948     }
1949     else
1950         SBCS(r0, r1, r2);
1951 }
1952
1953 static void
1954 _subxi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1955 {
1956     int                 i;
1957     jit_int32_t         reg;
1958     int                 no_set_flags;
1959     if (jit_thumb_p()) {
1960         no_set_flags = jit_no_set_flags();
1961         jit_no_set_flags() = 1;
1962         if ((i = encode_arm_immediate(i0)) != -1)
1963             T2_SBCSI(r0, r1, i);
1964         else if ((i = encode_arm_immediate(-i0)) != -1)
1965             T2_ADCSI(r0, r1, i);
1966         else if (r0 != r1) {
1967             movi(r0, i0);
1968             T2_SBCS(r0, r1, r0);
1969         }
1970         else {
1971             reg = jit_get_reg(jit_class_gpr);
1972             movi(rn(reg), i0);
1973             SBCS(r0, r1, rn(reg));
1974             jit_unget_reg(reg);
1975         }
1976         jit_no_set_flags() = no_set_flags;
1977     }
1978     else {
1979         if ((i = encode_arm_immediate(i0)) != -1)
1980             SBCSI(r0, r1, i);
1981         else if ((i = encode_arm_immediate(-i0)) != -1)
1982             ADCSI(r0, r1, i);
1983         else if (r0 != r1) {
1984             movi(r0, i0);
1985             SBCS(r0, r1, r0);
1986         }
1987         else {
1988             reg = jit_get_reg(jit_class_gpr);
1989             movi(rn(reg), i0);
1990             SBCS(r0, r1, rn(reg));
1991             jit_unget_reg(reg);
1992         }
1993     }
1994 }
1995
1996 static void
1997 _rsbi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1998 {
1999     subi(r0, r1, i0);
2000     negr(r0, r0);
2001 }
2002
2003 static void
2004 _mulr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2005 {
2006     jit_int32_t         reg;
2007     if (jit_thumb_p()) {
2008         if (!jit_no_set_flags() && r0 == r2 && (r0|r1) < 8)
2009             T1_MUL(r0, r1);
2010         else if (!jit_no_set_flags() && r0 == r1 && (r0|r2) < 8)
2011             T1_MUL(r0, r2);
2012         else
2013             T2_MUL(r0, r1, r2);
2014     }
2015     else {
2016         if (r0 == r1 && !jit_armv6_p()) {
2017             if (r0 != r2)
2018                 MUL(r0, r2, r1);
2019             else {
2020                 reg = jit_get_reg(jit_class_gpr);
2021                 MOV(rn(reg), r1);
2022                 MUL(r0, rn(reg), r2);
2023                 jit_unget_reg(reg);
2024             }
2025         }
2026         else
2027             MUL(r0, r1, r2);
2028     }
2029 }
2030
2031 static void
2032 _muli(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2033 {
2034     jit_int32_t         reg;
2035     reg = jit_get_reg(jit_class_gpr);
2036     movi(rn(reg), i0);
2037     mulr(r0, r1, rn(reg));
2038     jit_unget_reg(reg);
2039 }
2040
2041 static void
2042 _iqmulr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1,
2043         jit_int32_t r2, jit_int32_t r3, jit_bool_t sign)
2044 {
2045     jit_int32_t         reg;
2046     if (jit_thumb_p()) {
2047         if (r2 == r3) {
2048             reg = jit_get_reg(jit_class_gpr);
2049             movr(rn(reg), r2);
2050             if (sign)
2051                 T2_SMULL(r0, r1, rn(reg), r2);
2052             else
2053                 T2_UMULL(r0, r1, rn(reg), r2);
2054             jit_unget_reg(reg);
2055         }
2056         else if (r0 != r2 && r1 != r2) {
2057             if (sign)
2058                 T2_SMULL(r0, r1, r2, r3);
2059             else
2060                 T2_UMULL(r0, r1, r2, r3);
2061         }
2062         else {
2063             if (sign)
2064                 T2_SMULL(r0, r1, r3, r2);
2065             else
2066                 T2_UMULL(r0, r1, r3, r2);
2067         }
2068     }
2069     else {
2070         if (r2 == r3) {
2071             reg = jit_get_reg(jit_class_gpr);
2072             movr(rn(reg), r2);
2073             if (sign)
2074                 SMULL(r0, r1, rn(reg), r2);
2075             else
2076                 UMULL(r0, r1, rn(reg), r2);
2077             jit_unget_reg(reg);
2078         }
2079         else if (r0 != r2 && r1 != r2) {
2080             if (sign)
2081                 SMULL(r0, r1, r2, r3);
2082             else
2083                 UMULL(r0, r1, r2, r3);
2084         }
2085         else {
2086             if (sign)
2087                 SMULL(r0, r1, r3, r2);
2088             else
2089                 UMULL(r0, r1, r3, r2);
2090         }
2091     }
2092 }
2093
2094 static void
2095 _iqmuli(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1,
2096         jit_int32_t r2, jit_word_t i0, jit_bool_t sign)
2097 {
2098     jit_int32_t         reg;
2099     reg = jit_get_reg(jit_class_gpr);
2100     movi(rn(reg), i0);
2101     iqmulr(r0, r1, r2, rn(reg), sign);
2102     jit_unget_reg(reg);
2103 }
2104
2105 static void
2106 _divrem(jit_state_t *_jit, int div, int sign,
2107         jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2108 {
2109     jit_word_t          d;
2110     jit_word_t          w;
2111     jit_get_reg_args();
2112     movr(_R0_REGNO, r1);
2113     movr(_R1_REGNO, r2);
2114     if (sign)                   w = (jit_word_t)__aeabi_idivmod;
2115     else                        w = (jit_word_t)__aeabi_uidivmod;
2116     if (!jit_exchange_p()) {
2117         if (jit_thumb_p())      d = ((w - _jit->pc.w) >> 1) - 2;
2118         else                    d = ((w - _jit->pc.w) >> 2) - 2;
2119         if (_s24P(d)) {
2120             if (jit_thumb_p())  T2_BLI(encode_thumb_jump(d));
2121             else                BLI(d & 0x00ffffff);
2122         }
2123         else                    goto fallback;
2124     }
2125     else {
2126     fallback:
2127         movi(_R2_REGNO, w);
2128         if (jit_thumb_p())      T1_BLX(_R2_REGNO);
2129         else                    BLX(_R2_REGNO);
2130     }
2131     if (div)                    movr(r0, _R0_REGNO);
2132     else                        movr(r0, _R1_REGNO);
2133     jit_unget_reg_args();
2134 }
2135
2136 static void
2137 _divr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2138 {
2139     if (jit_armv7r_p() && jit_thumb_p())
2140         T2_SDIV(r0, r1, r2);
2141     else
2142         divrem(1, 1, r0, r1, r2);
2143 }
2144
2145 static void
2146 _divi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2147 {
2148     jit_int32_t         reg;
2149     reg = jit_get_reg(jit_class_gpr);
2150     movi(rn(reg), i0);
2151     divr(r0, r1, rn(reg));
2152     jit_unget_reg(reg);
2153 }
2154
2155 static void
2156 _divr_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2157 {
2158     if (jit_armv7r_p() && jit_thumb_p())
2159         T2_UDIV(r0, r1, r2);
2160     else
2161         divrem(1, 0, r0, r1, r2);
2162 }
2163
2164 static void
2165 _divi_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2166 {
2167     jit_int32_t         reg;
2168     reg = jit_get_reg(jit_class_gpr);
2169     movi(rn(reg), i0);
2170     divr_u(r0, r1, rn(reg));
2171     jit_unget_reg(reg);
2172 }
2173
2174 static void
2175 _iqdivr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1,
2176         jit_int32_t r2, jit_int32_t r3, jit_bool_t sign)
2177 {
2178     jit_word_t          d;
2179     jit_word_t          w;
2180     jit_get_reg_args();
2181     movr(_R0_REGNO, r2);
2182     movr(_R1_REGNO, r3);
2183     if (sign)                   w = (jit_word_t)__aeabi_idivmod;
2184     else                        w = (jit_word_t)__aeabi_uidivmod;
2185     if (!jit_exchange_p()) {
2186         if (jit_thumb_p())      d = ((w - _jit->pc.w) >> 1) - 2;
2187         else                    d = ((w - _jit->pc.w) >> 2) - 2;
2188         if (_s24P(d)) {
2189             if (jit_thumb_p())  T2_BLI(encode_thumb_jump(d));
2190             else                BLI(d & 0x00ffffff);
2191         }
2192         else                    goto fallback;
2193     }
2194     else {
2195     fallback:
2196         movi(_R2_REGNO, w);
2197         if (jit_thumb_p())      T1_BLX(_R2_REGNO);
2198         else                    BLX(_R2_REGNO);
2199     }
2200     movr(r0, _R0_REGNO);
2201     movr(r1, _R1_REGNO);
2202     jit_unget_reg_args();
2203 }
2204
2205 static void
2206 _iqdivi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1,
2207         jit_int32_t r2, jit_word_t i0, jit_bool_t sign)
2208 {
2209     jit_int32_t         reg;
2210     reg = jit_get_reg(jit_class_gpr);
2211     movi(rn(reg), i0);
2212     iqdivr(r0, r1, r2, rn(reg), sign);
2213     jit_unget_reg(reg);
2214 }
2215
2216 static void
2217 _remr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2218 {
2219     divrem(0, 1, r0, r1, r2);
2220 }
2221
2222 static void
2223 _remi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2224 {
2225     jit_int32_t         reg;
2226     reg = jit_get_reg(jit_class_gpr);
2227     movi(rn(reg), i0);
2228     remr(r0, r1, rn(reg));
2229     jit_unget_reg(reg);
2230 }
2231
2232 static void
2233 _remr_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2234 {
2235     divrem(0, 0, r0, r1, r2);
2236 }
2237
2238 static void
2239 _remi_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2240 {
2241     jit_int32_t         reg;
2242     reg = jit_get_reg(jit_class_gpr);
2243     movi(rn(reg), i0);
2244     remr_u(r0, r1,rn(reg));
2245     jit_unget_reg(reg);
2246 }
2247
2248 static void
2249 _andr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2250 {
2251     if (jit_thumb_p()) {
2252         if (!jit_no_set_flags() && (r0|r1|r2) < 8 && (r0 == r1 || r0 == r2))
2253             T1_AND(r0, r0 == r1 ? r2 : r1);
2254         else
2255             T2_AND(r0, r1, r2);
2256     }
2257     else
2258         AND(r0, r1, r2);
2259 }
2260
2261 static void
2262 _andi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2263 {
2264     int                 i;
2265     jit_int32_t         reg;
2266     if (jit_thumb_p()) {
2267         if ((i = encode_thumb_immediate(i0)) != -1)
2268             T2_ANDI(r0, r1, i);
2269         else if ((i = encode_thumb_immediate(~i0)) != -1)
2270             T2_BICI(r0, r1, i);
2271         else if (r0 != r1) {
2272             movi(r0, i0);
2273             T2_AND(r0, r1, r0);
2274         }
2275         else {
2276             reg = jit_get_reg(jit_class_gpr);
2277             movi(rn(reg), i0);
2278             T2_AND(r0, r1, rn(reg));
2279             jit_unget_reg(reg);
2280         }
2281     }
2282     else {
2283         if ((i = encode_arm_immediate(i0)) != -1)
2284             ANDI(r0, r1, i);
2285         else if ((i = encode_arm_immediate(~i0)) != -1)
2286             BICI(r0, r1, i);
2287         else if (r0 != r1) {
2288             movi(r0, i0);
2289             AND(r0, r1, r0);
2290         }
2291         else {
2292             reg = jit_get_reg(jit_class_gpr);
2293             movi(rn(reg), i0);
2294             AND(r0, r1, rn(reg));
2295             jit_unget_reg(reg);
2296         }
2297     }
2298 }
2299
2300 static void
2301 _orr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2302 {
2303     if (jit_thumb_p()) {
2304         if (!jit_no_set_flags() && (r0|r1|r2) < 8 && (r0 == r1 || r0 == r2))
2305             T1_ORR(r0, r0 == r1 ? r2 : r1);
2306         else
2307             T2_ORR(r0, r1, r2);
2308     }
2309     else
2310         ORR(r0, r1, r2);
2311 }
2312
2313 static void
2314 _ori(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2315 {
2316     int                 i;
2317     jit_int32_t         reg;
2318     if (jit_thumb_p()) {
2319         if ((i = encode_thumb_immediate(i0)) != -1)
2320             T2_ORRI(r0, r1, i);
2321         else if (r0 != r1) {
2322             movi(r0, i0);
2323             T2_ORR(r0, r1, r0);
2324         }
2325         else {
2326             reg = jit_get_reg(jit_class_gpr);
2327             movi(rn(reg), i0);
2328             T2_ORR(r0, r1, rn(reg));
2329             jit_unget_reg(reg);
2330         }
2331     }
2332     else {
2333         if ((i = encode_arm_immediate(i0)) != -1)
2334             ORRI(r0, r1, i);
2335         else if (r0 != r1) {
2336             movi(r0, i0);
2337             ORR(r0, r1, r0);
2338         }
2339         else {
2340             reg = jit_get_reg(jit_class_gpr);
2341             movi(rn(reg), i0);
2342             ORR(r0, r1, rn(reg));
2343             jit_unget_reg(reg);
2344         }
2345     }
2346 }
2347
2348 static void
2349 _xorr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2350 {
2351     if (jit_thumb_p()) {
2352         if (!jit_no_set_flags() && (r0|r1|r2) < 8 && (r0 == r1 || r0 == r2))
2353             T1_EOR(r0, r0 == r1 ? r2 : r1);
2354         else
2355             T2_EOR(r0, r1, r2);
2356     }
2357     else
2358         EOR(r0, r1, r2);
2359 }
2360
2361 static void
2362 _xori(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2363 {
2364     int                 i;
2365     jit_int32_t         reg;
2366     if (jit_thumb_p()) {
2367         if ((i = encode_thumb_immediate(i0)) != -1)
2368             T2_EORI(r0, r1, i);
2369         else if (r0 != r1) {
2370             movi(r0, i0);
2371             T2_EOR(r0, r1, r0);
2372         }
2373         else {
2374             reg = jit_get_reg(jit_class_gpr);
2375             movi(rn(reg), i0);
2376             T2_EOR(r0, r1, rn(reg));
2377             jit_unget_reg(reg);
2378         }
2379     }
2380     else {
2381         if ((i = encode_arm_immediate(i0)) != -1)
2382             EORI(r0, r1, i);
2383         else if (r0 != r1) {
2384             movi(r0, i0);
2385             EOR(r0, r1, r0);
2386         }
2387         else {
2388             reg = jit_get_reg(jit_class_gpr);
2389             movi(rn(reg), i0);
2390             EOR(r0, r1, rn(reg));
2391             jit_unget_reg(reg);
2392         }
2393     }
2394 }
2395
2396 static void
2397 _lshr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2398 {
2399     if (jit_thumb_p()) {
2400         if (!jit_no_set_flags() && (r0|r1|r2) < 8 && r0 == r1)
2401             T1_LSL(r0, r2);
2402         else
2403             T2_LSL(r0, r1, r2);
2404     }
2405     else
2406         LSL(r0, r1, r2);
2407 }
2408
2409 static void
2410 _lshi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2411 {
2412     assert(i0 >= 0 && i0 <= 31);
2413     if (i0 == 0)
2414         movr(r0, r1);
2415     else if (jit_thumb_p()) {
2416         if (!jit_no_set_flags() && (r0|r1) < 8)
2417             T1_LSLI(r0, r1, i0);
2418         else
2419             T2_LSLI(r0, r1, i0);
2420     }
2421     else
2422         LSLI(r0, r1, i0);
2423 }
2424
2425 static void
2426 _rshr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2427 {
2428     if (jit_thumb_p()) {
2429         if (!jit_no_set_flags() && (r0|r1|r2) < 8 && r0 == r1)
2430             T1_ASR(r0, r2);
2431         else
2432             T2_ASR(r0, r1, r2);
2433     }
2434     else
2435         ASR(r0, r1, r2);
2436 }
2437
2438 static void
2439 _rshi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2440 {
2441     assert(i0 >= 0 && i0 <= 31);
2442     if (i0 == 0)
2443         movr(r0, r1);
2444     else if (jit_thumb_p()) {
2445         if (!jit_no_set_flags() && (r0|r1) < 8)
2446             T1_ASRI(r0, r1, i0);
2447         else
2448             T2_ASRI(r0, r1, i0);
2449     }
2450     else
2451         ASRI(r0, r1, i0);
2452 }
2453
2454 static void
2455 _rshr_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2456 {
2457     if (jit_thumb_p()) {
2458         if (!jit_no_set_flags() && (r0|r1|r2) < 8 && r0 == r1)
2459             T1_LSR(r0, r2);
2460         else
2461             T2_LSR(r0, r1, r2);
2462     }
2463     else
2464         LSR(r0, r1, r2);
2465 }
2466
2467 static void
2468 _rshi_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2469 {
2470     assert(i0 >= 0 && i0 <= 31);
2471     if (i0 == 0)
2472         movr(r0, r1);
2473     else if (jit_thumb_p()) {
2474         if (!jit_no_set_flags() && (r0|r1) < 8)
2475             T1_LSRI(r0, r1, i0);
2476         else
2477             T2_LSRI(r0, r1, i0);
2478     }
2479     else
2480         LSRI(r0, r1, i0);
2481 }
2482
2483 static void
2484 _ccr(jit_state_t *_jit, int ct, int cf,
2485      jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2486 {
2487     if (jit_thumb_p()) {
2488         assert((ct ^ cf) >> 28 == 1);
2489         if ((r1|r2) < 8)
2490             T1_CMP(r1, r2);
2491         else if ((r1&r2) & 8)
2492             T1_CMPX(r1, r2);
2493         else
2494             T2_CMP(r1, r2);
2495         ITE(ct);
2496         if (r0 < 8) {
2497             T1_MOVI(r0, 1);
2498             T1_MOVI(r0, 0);
2499         }
2500         else {
2501             T2_MOVI(r0, 1);
2502             T2_MOVI(r0, 0);
2503         }
2504     }
2505     else {
2506         CMP(r1, r2);
2507         CC_MOVI(ct, r0, 1);
2508         CC_MOVI(cf, r0, 0);
2509     }
2510 }
2511
2512 static void
2513 _cci(jit_state_t *_jit, int ct, int cf,
2514      jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2515 {
2516     int                 i;
2517     jit_int32_t         reg;
2518     if (jit_thumb_p()) {
2519         if (r1 < 7 && !(i0 & 0xffffff00))
2520             T1_CMPI(r1, i0);
2521         else if ((i = encode_thumb_immediate(i0)) != -1)
2522             T2_CMPI(r1, i);
2523         else if ((i = encode_thumb_immediate(-i0)) != -1)
2524             T2_CMNI(r1, i);
2525         else {
2526             reg = jit_get_reg(jit_class_gpr);
2527             movi(rn(reg), i0);
2528             ccr(ct, cf, r0, r1, rn(reg));
2529             jit_unget_reg(reg);
2530             return;
2531         }
2532         ITE(ct);
2533         if (r0 < 8) {
2534             T1_MOVI(r0, 1);
2535             T1_MOVI(r0, 0);
2536         }
2537         else {
2538             T2_MOVI(r0, 1);
2539             T2_MOVI(r0, 0);
2540         }
2541     }
2542     else {
2543         if ((i = encode_arm_immediate(i0)) != -1)
2544             CMPI(r1, i);
2545         else if ((i = encode_arm_immediate(-i0)) != -1)
2546             CMNI(r1, i);
2547         else if (r0 != r1) {
2548             movi(r0, i0);
2549             CMP(r1, r0);
2550         }
2551         else {
2552             reg = jit_get_reg(jit_class_gpr);
2553             movi(rn(reg), i0);
2554             CMP(r1, rn(reg));
2555             jit_unget_reg(reg);
2556         }
2557         CC_MOVI(ct, r0, 1);
2558         CC_MOVI(cf, r0, 0);
2559     }
2560 }
2561
2562 static void
2563 _ner(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2564 {
2565     if (jit_thumb_p())
2566         ccr(ARM_CC_NE, ARM_CC_EQ, r0, r1, r2);
2567     else {
2568         SUBS(r0, r1, r2);
2569         CC_MOVI(ARM_CC_NE, r0, 1);
2570     }
2571 }
2572
2573 static void
2574 _nei(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2575 {
2576     int                 i;
2577     jit_int32_t         reg;
2578     if (jit_thumb_p())
2579         cci(ARM_CC_NE, ARM_CC_EQ, r0, r1, i0);
2580     else {
2581         if ((i = encode_arm_immediate(i0)) != -1)
2582             SUBSI(r0, r1, i);
2583         else if ((i = encode_arm_immediate(-i0)) != -1)
2584             ADDSI(r0, r1, i);
2585         else if (r0 != r1) {
2586             movi(r0, i0);
2587             SUBS(r0, r1, r0);
2588         }
2589         else {
2590             reg = jit_get_reg(jit_class_gpr);
2591             movi(rn(reg), i0);
2592             SUBS(r0, r1, rn(reg));
2593             jit_unget_reg(reg);
2594         }
2595         CC_MOVI(ARM_CC_NE, r0, 1);
2596     }
2597 }
2598
2599 static void
2600 _jmpr(jit_state_t *_jit, jit_int32_t r0)
2601 {
2602     if (jit_thumb_p())
2603         T1_MOV(_R15_REGNO, r0);
2604     else
2605         MOV(_R15_REGNO, r0);
2606 }
2607
2608 static void
2609 _jmpi(jit_state_t *_jit, jit_word_t i0)
2610 {
2611     jit_word_t          w;
2612     jit_word_t          d;
2613     jit_int32_t         reg;
2614     w = _jit->pc.w;
2615     /* if thumb and in thumb mode */
2616     if (jit_thumb_p() && _jitc->thumb) {
2617         d = ((i0 - w) >> 1) - 2;
2618         if (d >= -1024 && d <= 1023)
2619             T1_B(d & 0x7ff);
2620         else if (_s24P(d))
2621             T2_B(encode_thumb_jump(d));
2622         else {
2623             reg = jit_get_reg(jit_class_gpr|jit_class_nospill);
2624             movi(rn(reg), i0);
2625             jmpr(rn(reg));
2626             jit_unget_reg(reg);
2627         }
2628     }
2629     else {
2630         d = ((i0 - w) >> 2) - 2;
2631         if (_s24P(d))
2632             B(d & 0x00ffffff);
2633         else {
2634             reg = jit_get_reg(jit_class_gpr|jit_class_nospill);
2635             movi(rn(reg), i0);
2636             jmpr(rn(reg));
2637             jit_unget_reg(reg);
2638         }
2639     }
2640 }
2641
2642 static jit_word_t
2643 _jmpi_p(jit_state_t *_jit, jit_word_t i0, jit_bool_t i1)
2644 {
2645     jit_word_t          w;
2646     jit_word_t          d;
2647     jit_int32_t         reg;
2648     if (i1) {
2649         /* Assume jump is not longer than 23 bits if inside jit */
2650         w = _jit->pc.w;
2651         /* if thumb and in thumb mode */
2652         if (jit_thumb_p() && _jitc->thumb) {
2653             d = ((i0 - w) >> 1) - 2;
2654             assert(_s24P(d));
2655             T2_B(encode_thumb_jump(d));
2656         }
2657         else {
2658             d = ((i0 - w) >> 2) - 2;
2659             assert(_s24P(d));
2660             B(d & 0x00ffffff);
2661         }
2662     }
2663     else {
2664         reg = jit_get_reg(jit_class_gpr|jit_class_nospill);
2665         w = movi_p(rn(reg), i0);
2666         jmpr(rn(reg));
2667         jit_unget_reg(reg);
2668     }
2669     return (w);
2670 }
2671
2672 static jit_word_t
2673 _bccr(jit_state_t *_jit, int cc, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
2674 {
2675     jit_word_t          w;
2676     jit_word_t          d;
2677     if (jit_thumb_p()) {
2678         if ((r0|r1) < 8)
2679             T1_CMP(r0, r1);
2680         else if ((r0&r1) & 8)
2681             T1_CMPX(r0, r1);
2682         else
2683             T2_CMP(r0, r1);
2684         /* use only thumb2 conditional as does not know if will be patched */
2685         w = _jit->pc.w;
2686         d = ((i0 - w) >> 1) - 2;
2687         assert(_s20P(d));
2688         T2_CC_B(cc, encode_thumb_cc_jump(d));
2689     }
2690     else {
2691         CMP(r0, r1);
2692         w = _jit->pc.w;
2693         d = ((i0 - w) >> 2) - 2;
2694         assert(_s24P(d));
2695         CC_B(cc, d & 0x00ffffff);
2696     }
2697     return (w);
2698 }
2699
2700 static jit_word_t
2701 _bcci(jit_state_t *_jit, int cc, jit_word_t i0, jit_int32_t r0, jit_word_t i1)
2702 {
2703     jit_word_t          w;
2704     jit_word_t          d;
2705     int                 i;
2706     jit_int32_t         reg;
2707     if (jit_thumb_p()) {
2708         if (r0 < 7 && !(i1 & 0xffffff00))
2709             T1_CMPI(r0, i1);
2710         else if ((i = encode_thumb_immediate(i1)) != -1)
2711             T2_CMPI(r0, i);
2712         else if ((i = encode_thumb_immediate(-i1)) != -1)
2713             T2_CMNI(r0, i);
2714         else {
2715             reg = jit_get_reg(jit_class_gpr);
2716             movi(rn(reg), i1);
2717             T2_CMP(r0, rn(reg));
2718             jit_unget_reg(reg);
2719         }
2720         /* use only thumb2 conditional as does not know if will be patched */
2721         w = _jit->pc.w;
2722         d = ((i0 - w) >> 1) - 2;
2723         assert(_s20P(d));
2724         T2_CC_B(cc, encode_thumb_cc_jump(d));
2725     }
2726     else {
2727         if ((i = encode_arm_immediate(i1)) != -1)
2728             CMPI(r0, i);
2729         else if ((i = encode_arm_immediate(-i1)) != -1)
2730             CMNI(r0, i);
2731         else {
2732             reg = jit_get_reg(jit_class_gpr);
2733             movi(rn(reg), i1);
2734             CMP(r0, rn(reg));
2735             jit_unget_reg(reg);
2736         }
2737         w = _jit->pc.w;
2738         d = ((i0 - w) >> 2) - 2;
2739         assert(_s24P(d));
2740         CC_B(cc, d & 0x00ffffff);
2741     }
2742     return (w);
2743 }
2744
2745 static jit_word_t
2746 _baddr(jit_state_t *_jit, int cc, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
2747 {
2748     jit_word_t          w;
2749     jit_word_t          d;
2750     if (jit_thumb_p()) {
2751         if ((r0|r1) < 8)
2752             T1_ADD(r0, r0, r1);
2753         else
2754             T2_ADDS(r0, r0, r1);
2755         w = _jit->pc.w;
2756         d = ((i0 - w) >> 1) - 2;
2757         assert(_s20P(d));
2758         T2_CC_B(cc, encode_thumb_cc_jump(d));
2759     }
2760     else {
2761         ADDS(r0, r0, r1);
2762         w = _jit->pc.w;
2763         d = ((i0 - w) >> 2) - 2;
2764         assert(_s24P(d));
2765         CC_B(cc, d & 0x00ffffff);
2766     }
2767     return (w);
2768 }
2769
2770 static jit_word_t
2771 _baddi(jit_state_t *_jit, int cc, jit_word_t i0, jit_int32_t r0, int i1)
2772 {
2773     int                 i;
2774     jit_word_t          w;
2775     jit_word_t          d;
2776     jit_int32_t         reg;
2777     if (jit_thumb_p()) {
2778         if (r0 < 8 && !(i1 & ~7))
2779             T1_ADDI3(r0, r0, i1);
2780         else if (r0 < 8 && !(-i1 & ~7))
2781             T1_SUBI3(r0, r0, -i1);
2782         else if (r0 < 8 && !(i1 & ~0xff))
2783             T1_ADDI8(r0, i1);
2784         else if (r0 < 8 && !(-i1 & ~0xff))
2785             T1_SUBI8(r0, -i1);
2786         else if ((i = encode_thumb_immediate(i1)) != -1)
2787             T2_ADDSI(r0, r0, i);
2788         else if ((i = encode_thumb_immediate(-i1)) != -1)
2789             T2_SUBSI(r0, r0, i);
2790         else {
2791             reg = jit_get_reg(jit_class_gpr);
2792             movi(rn(reg), i1);
2793             T2_ADDS(r0, r0, rn(reg));
2794             jit_unget_reg(reg);
2795         }
2796         w = _jit->pc.w;
2797         d = ((i0 - w) >> 1) - 2;
2798         assert(_s20P(d));
2799         T2_CC_B(cc, encode_thumb_cc_jump(d));
2800     }
2801     else {
2802         if ((i = encode_arm_immediate(i1)) != -1)
2803             ADDSI(r0, r0, i);
2804         else if ((i = encode_arm_immediate(-i1)) != -1)
2805             SUBSI(r0, r0, i);
2806         else {
2807             reg = jit_get_reg(jit_class_gpr);
2808             movi(rn(reg), i1);
2809             ADDS(r0, r0, rn(reg));
2810             jit_unget_reg(reg);
2811         }
2812         w = _jit->pc.w;
2813         d = ((i0 - w) >> 2) - 2;
2814         assert(_s24P(d));
2815         CC_B(cc, d & 0x00ffffff);
2816     }
2817     return (w);
2818 }
2819
2820 static jit_word_t
2821 _bsubr(jit_state_t *_jit, int cc, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
2822 {
2823     jit_word_t          w;
2824     jit_word_t          d;
2825     if (jit_thumb_p()) {
2826         if ((r0|r1) < 8)
2827             T1_SUB(r0, r0, r1);
2828         else
2829             T2_SUBS(r0, r0, r1);
2830         w = _jit->pc.w;
2831         d = ((i0 - w) >> 1) - 2;
2832         assert(_s20P(d));
2833         T2_CC_B(cc, encode_thumb_cc_jump(d));
2834     }
2835     else {
2836         SUBS(r0, r0, r1);
2837         w = _jit->pc.w;
2838         d = ((i0 - w) >> 2) - 2;
2839         assert(_s24P(d));
2840         CC_B(cc, d & 0x00ffffff);
2841     }
2842     return (w);
2843 }
2844
2845 static jit_word_t
2846 _bsubi(jit_state_t *_jit, int cc, jit_word_t i0, jit_int32_t r0, int i1)
2847 {
2848     int                 i;
2849     jit_word_t          w;
2850     jit_word_t          d;
2851     jit_int32_t         reg;
2852     if (jit_thumb_p()) {
2853         if (r0 < 8 && !(i1 & ~7))
2854             T1_SUBI3(r0, r0, i1);
2855         else if (r0 < 8 && !(-i1 & ~7))
2856             T1_ADDI3(r0, r0, -i1);
2857         else if (r0 < 8 && !(i1 & ~0xff))
2858             T1_SUBI8(r0, i1);
2859         else if (r0 < 8 && !(-i1 & ~0xff))
2860             T1_ADDI8(r0, -i1);
2861         else if ((i = encode_thumb_immediate(i1)) != -1)
2862             T2_SUBSI(r0, r0, i);
2863         else if ((i = encode_thumb_immediate(-i1)) != -1)
2864             T2_SUBSI(r0, r0, i);
2865         else {
2866             reg = jit_get_reg(jit_class_gpr);
2867             movi(rn(reg), i1);
2868             T2_SUBS(r0, r0, rn(reg));
2869             jit_unget_reg(reg);
2870         }
2871         w = _jit->pc.w;
2872         d = ((i0 - w) >> 1) - 2;
2873         assert(_s20P(d));
2874         T2_CC_B(cc, encode_thumb_cc_jump(d));
2875     }
2876     else {
2877         if ((i = encode_arm_immediate(i1)) != -1)
2878             SUBSI(r0, r0, i);
2879         else if ((i = encode_arm_immediate(-i1)) != -1)
2880             ADDSI(r0, r0, i);
2881         else {
2882             reg = jit_get_reg(jit_class_gpr);
2883             movi(rn(reg), i1);
2884             SUBS(r0, r0, rn(reg));
2885             jit_unget_reg(reg);
2886         }
2887         w = _jit->pc.w;
2888         d = ((i0 - w) >> 2) - 2;
2889         assert(_s24P(d));
2890         CC_B(cc, d & 0x00ffffff);
2891     }
2892     return (w);
2893 }
2894
2895 static jit_word_t
2896 _bmxr(jit_state_t *_jit, int cc, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
2897 {
2898     jit_word_t          w;
2899     jit_word_t          d;
2900     jit_int32_t         reg;
2901     if (jit_thumb_p()) {
2902         if ((r0|r1) < 8)
2903             T1_TST(r0, r1);
2904         else
2905             T2_TST(r0, r1);
2906         w = _jit->pc.w;
2907         d = ((i0 - w) >> 1) - 2;
2908         assert(_s20P(d));
2909         T2_CC_B(cc, encode_thumb_cc_jump(d));
2910     }
2911     else {
2912         if (jit_armv5_p())
2913             TST(r0, r1);
2914         else {
2915             reg = jit_get_reg(jit_class_gpr);
2916             ANDS(rn(reg), r0, r1);
2917             jit_unget_reg(reg);
2918         }
2919         w = _jit->pc.w;
2920         d = ((i0 - w) >> 2) - 2;
2921         assert(_s24P(d));
2922         CC_B(cc, d & 0x00ffffff);
2923     }
2924     return (w);
2925 }
2926
2927 static jit_word_t
2928 _bmxi(jit_state_t *_jit, int cc, jit_word_t i0, jit_int32_t r0, jit_word_t i1)
2929 {
2930     int                 i;
2931     jit_word_t          w;
2932     jit_word_t          d;
2933     jit_int32_t         reg;
2934     if (jit_thumb_p()) {
2935         if ((i = encode_thumb_immediate(i1)) != -1)
2936             T2_TSTI(r0, i);
2937         else {
2938             reg = jit_get_reg(jit_class_gpr);
2939             movi(rn(reg), i1);
2940             T2_TST(r0, rn(reg));
2941             jit_unget_reg(reg);
2942         }
2943         w = _jit->pc.w;
2944         d = ((i0 - w) >> 1) - 2;
2945         assert(_s20P(d));
2946         T2_CC_B(cc, encode_thumb_cc_jump(d));
2947     }
2948     else {
2949         if (jit_armv5_p()) {
2950             if ((i = encode_arm_immediate(i1)) != -1)
2951                 TSTI(r0, i);
2952             else {
2953                 reg = jit_get_reg(jit_class_gpr);
2954                 movi(rn(reg), i1);
2955                 TST(r0, rn(reg));
2956                 jit_unget_reg(reg);
2957             }
2958         }
2959         else {
2960             reg = jit_get_reg(jit_class_gpr);
2961             if ((i = encode_arm_immediate(i1)) != -1)
2962                 ANDSI(rn(reg), r0, i);
2963             else if ((i = encode_arm_immediate(~i1)) != -1)
2964                 BICSI(rn(reg), r0, i);
2965             else {
2966                 movi(rn(reg), i1);
2967                 ANDS(rn(reg), r0, rn(reg));
2968             }
2969             jit_unget_reg(reg);
2970         }
2971         w = _jit->pc.w;
2972         d = ((i0 - w) >> 2) - 2;
2973         assert(_s24P(d));
2974         CC_B(cc, d & 0x00ffffff);
2975     }
2976     return (w);
2977 }
2978
2979 static void
2980 _ldr_c(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
2981 {
2982     if (jit_thumb_p())
2983         T2_LDRSBI(r0, r1, 0);
2984     else
2985         LDRSBI(r0, r1, 0);
2986 }
2987
2988 static void
2989 _ldi_c(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
2990 {
2991     jit_int32_t         reg;
2992     reg = jit_get_reg(jit_class_gpr);
2993     movi(rn(reg), i0);
2994     if (jit_thumb_p())
2995         T2_LDRSBI(r0, rn(reg), 0);
2996     else
2997         LDRSBI(r0, rn(reg), 0);
2998     jit_unget_reg(reg);
2999 }
3000
3001 static void
3002 _ldxr_c(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
3003 {
3004     if (jit_thumb_p()) {
3005         if ((r0|r1|r2) < 8)
3006             T1_LDRSB(r0, r1, r2);
3007         else
3008             T2_LDRSB(r0, r1, r2);
3009     }
3010     else
3011         LDRSB(r0, r1, r2);
3012 }
3013
3014 static void
3015 _ldxi_c(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
3016 {
3017     jit_int32_t         reg;
3018     if (jit_thumb_p()) {
3019         if (jit_ldrt_strt_p() && i0 >= 0 && i0 <= 255)
3020             T2_LDRSBI(r0, r1, i0);
3021         else if (i0 < 0 && i0 >= -255)
3022             T2_LDRSBIN(r0, r1, -i0);
3023         else if (i0 >= 0 && i0 <= 4095)
3024             T2_LDRSBWI(r0, r1, i0);
3025         else if (r0 != r1) {
3026             movi(r0, i0);
3027             if ((r0|r1) < 8)
3028                 T1_LDRSB(r0, r1, r0);
3029             else
3030                 T2_LDRSB(r0, r1, r0);
3031         }
3032         else {
3033             reg = jit_get_reg(jit_class_gpr);
3034             movi(rn(reg), i0);
3035             if ((r0|r1|rn(reg)) < 8)
3036                 T1_LDRSB(r0, r1, rn(reg));
3037             else
3038                 T2_LDRSB(r0, r1, rn(reg));
3039             jit_unget_reg(reg);
3040         }
3041     }
3042     else {
3043         if (i0 >= 0 && i0 <= 255)
3044             LDRSBI(r0, r1, i0);
3045         else if (i0 < 0 && i0 >= -255)
3046             LDRSBIN(r0, r1, -i0);
3047         else if (r0 != r1) {
3048             movi(r0, i0);
3049             LDRSB(r0, r1, r0);
3050         }
3051         else {
3052             reg = jit_get_reg(jit_class_gpr);
3053             movi(rn(reg), i0);
3054             LDRSB(r0, r1, rn(reg));
3055             jit_unget_reg(reg);
3056         }
3057     }
3058 }
3059
3060 static void
3061 _ldr_uc(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3062 {
3063     if (jit_thumb_p())
3064         T2_LDRBI(r0, r1, 0);
3065     else
3066         LDRBI(r0, r1, 0);
3067 }
3068
3069 static void
3070 _ldi_uc(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
3071 {
3072     jit_int32_t         reg;
3073     reg = jit_get_reg(jit_class_gpr);
3074     movi(rn(reg), i0);
3075     if (jit_thumb_p())
3076         T2_LDRBI(r0, rn(reg), 0);
3077     else
3078         LDRBI(r0, rn(reg), 0);
3079     jit_unget_reg(reg);
3080 }
3081
3082 static void
3083 _ldxr_uc(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
3084 {
3085     if (jit_thumb_p()) {
3086         if ((r0|r1|r2) < 8)
3087             T1_LDRB(r0, r1, r2);
3088         else
3089             T2_LDRB(r0, r1, r2);
3090     }
3091     else
3092         LDRB(r0, r1, r2);
3093 }
3094
3095 static void
3096 _ldxi_uc(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
3097 {
3098     jit_int32_t         reg;
3099     if (jit_thumb_p()) {
3100         if ((r0|r1) < 8 && i0 >= 0 && i0 < 0x20)
3101             T1_LDRBI(r0, r1, i0);
3102         else if (jit_ldrt_strt_p() && i0 >= 0 && i0 <= 255)
3103             T2_LDRBI(r0, r1, i0);
3104         else if (i0 < 0 && i0 >= -255)
3105             T2_LDRBIN(r0, r1, -i0);
3106         else if (i0 >= 0 && i0 <= 4095)
3107             T2_LDRBWI(r0, r1, i0);
3108         else if (r0 != r1) {
3109             movi(r0, i0);
3110             if ((r0|r1) < 8)
3111                 T1_LDRB(r0, r1, r0);
3112             else
3113                 T2_LDRB(r0, r1, r0);
3114         }
3115         else {
3116             reg = jit_get_reg(jit_class_gpr);
3117             movi(rn(reg), i0);
3118             if ((r0|r1|rn(reg)) < 8)
3119                 T1_LDRB(r0, r1, rn(reg));
3120             else
3121                 T2_LDRB(r0, r1, rn(reg));
3122             jit_unget_reg(reg);
3123         }
3124     }
3125     else {
3126         if (i0 >= 0 && i0 <= 4095)
3127             LDRBI(r0, r1, i0);
3128         else if (i0 < 0 && i0 >= -4095)
3129             LDRBIN(r0, r1, -i0);
3130         else if (r0 != r1) {
3131             movi(r0, i0);
3132             LDRB(r0, r1, r0);
3133         }
3134         else {
3135             reg = jit_get_reg(jit_class_gpr);
3136             movi(rn(reg), i0);
3137             LDRB(r0, r1, rn(reg));
3138             jit_unget_reg(reg);
3139         }
3140     }
3141 }
3142
3143 static void
3144 _ldr_s(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3145 {
3146     if (jit_thumb_p())
3147         T2_LDRSHI(r0, r1, 0);
3148     else
3149         LDRSHI(r0, r1, 0);
3150 }
3151
3152 static void
3153 _ldi_s(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
3154 {
3155     jit_int32_t         reg;
3156     reg = jit_get_reg(jit_class_gpr);
3157     movi(rn(reg), i0);
3158     if (jit_thumb_p())
3159         T2_LDRSHI(r0, rn(reg), 0);
3160     else
3161         LDRSHI(r0, rn(reg), 0);
3162     jit_unget_reg(reg);
3163 }
3164
3165 static void
3166 _ldxr_s(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
3167 {
3168     if (jit_thumb_p()) {
3169         if ((r0|r1|r2) < 8)
3170             T1_LDRSH(r0, r1, r2);
3171         else
3172             T2_LDRSH(r0, r1, r2);
3173     }
3174     else
3175         LDRSH(r0, r1, r2);
3176 }
3177
3178 static void
3179 _ldxi_s(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
3180 {
3181     jit_int32_t         reg;
3182     if (jit_thumb_p()) {
3183         if (jit_ldrt_strt_p() && i0 >= 0 && i0 <= 255)
3184             T2_LDRSHI(r0, r1, i0);
3185         else if (i0 < 0 && i0 >= -255)
3186             T2_LDRSHIN(r0, r1, -i0);
3187         else if (i0 >= 0 && i0 <= 4095)
3188             T2_LDRSHWI(r0, r1, i0);
3189         else if (r0 != r1) {
3190             movi(r0, i0);
3191             if ((r0|r1) < 8)
3192                 T1_LDRSH(r0, r1, r0);
3193             else
3194                 T2_LDRSH(r0, r1, r0);
3195         }
3196         else {
3197             reg = jit_get_reg(jit_class_gpr);
3198             movi(rn(reg), i0);
3199             if ((r0|r1|rn(reg)) < 8)
3200                 T1_LDRSH(r0, r1, rn(reg));
3201             else
3202                 T2_LDRSH(r0, r1, rn(reg));
3203             jit_unget_reg(reg);
3204         }
3205     }
3206     else {
3207         if (i0 >= 0 && i0 <= 255)
3208             LDRSHI(r0, r1, i0);
3209         else if (i0 < 0 && i0 >= -255)
3210             LDRSHIN(r0, r1, -i0);
3211         else if (r0 != r1) {
3212             movi(r0, i0);
3213             LDRSH(r0, r1, r0);
3214         }
3215         else {
3216             reg = jit_get_reg(jit_class_gpr);
3217             movi(rn(reg), i0);
3218             LDRSH(r0, r1, rn(reg));
3219             jit_unget_reg(reg);
3220         }
3221     }
3222 }
3223
3224 static void
3225 _ldr_us(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3226 {
3227     if (jit_thumb_p())
3228         T2_LDRHI(r0, r1, 0);
3229     else
3230         LDRHI(r0, r1, 0);
3231 }
3232
3233 static void
3234 _ldi_us(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
3235 {
3236     jit_int32_t         reg;
3237     reg = jit_get_reg(jit_class_gpr);
3238     movi(rn(reg), i0);
3239     if (jit_thumb_p())
3240         T2_LDRHI(r0, rn(reg), 0);
3241     else
3242         LDRHI(r0, rn(reg), 0);
3243     jit_unget_reg(reg);
3244 }
3245
3246 static void
3247 _ldxr_us(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
3248 {
3249     if (jit_thumb_p()) {
3250         if ((r0|r1|r2) < 8)
3251             T1_LDRH(r0, r1, r2);
3252         else
3253             T2_LDRH(r0, r1, r2);
3254     }
3255     else
3256         LDRH(r0, r1, r2);
3257 }
3258
3259 static void
3260 _ldxi_us(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
3261 {
3262     jit_int32_t         reg;
3263     if (jit_thumb_p()) {
3264         if ((r0|r1) < 8 && i0 >= 0 && !(i0 & 1) && (i0 >> 1) < 0x20)
3265             T1_LDRHI(r0, r1, i0 >> 1);
3266         else if (jit_ldrt_strt_p() && i0 >= 0 && i0 <= 255)
3267             T2_LDRHI(r0, r1, i0);
3268         else if (i0 < 0 && i0 >= -255)
3269             T2_LDRHIN(r0, r1, -i0);
3270         else if (i0 >= 0 && i0 <= 4095)
3271             T2_LDRHWI(r0, r1, i0);
3272         else if (r0 != r1) {
3273             movi(r0, i0);
3274             if ((r0|r1) < 8)
3275                 T1_LDRH(r0, r1, r0);
3276             else
3277                 T2_LDRH(r0, r1, r0);
3278         }
3279         else {
3280             reg = jit_get_reg(jit_class_gpr);
3281             movi(rn(reg), i0);
3282             if ((r0|r1|rn(reg)) < 8)
3283                 T1_LDRH(r0, r1, rn(reg));
3284             else
3285                 T2_LDRH(r0, r1, rn(reg));
3286             jit_unget_reg(reg);
3287         }
3288     }
3289     else {
3290         if (i0 >= 0 && i0 <= 255)
3291             LDRHI(r0, r1, i0);
3292         else if (i0 < 0 && i0 >= -255)
3293             LDRHIN(r0, r1, -i0);
3294         else if (r0 != r1) {
3295             movi(r0, i0);
3296             LDRH(r0, r1, r0);
3297         }
3298         else {
3299             reg = jit_get_reg(jit_class_gpr);
3300             movi(rn(reg), i0);
3301             LDRH(r0, r1, rn(reg));
3302             jit_unget_reg(reg);
3303         }
3304     }
3305 }
3306
3307 static void
3308 _ldr_i(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3309 {
3310     if (jit_thumb_p())
3311         T2_LDRI(r0, r1, 0);
3312     else
3313         LDRI(r0, r1, 0);
3314 }
3315
3316 static void
3317 _ldi_i(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
3318 {
3319     jit_int32_t         reg;
3320     reg = jit_get_reg(jit_class_gpr);
3321     movi(rn(reg), i0);
3322     if (jit_thumb_p())
3323         T2_LDRI(r0, rn(reg), 0);
3324     else
3325         LDRI(r0, rn(reg), 0);
3326     jit_unget_reg(reg);
3327 }
3328
3329 static void
3330 _ldxr_i(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
3331 {
3332     if (jit_thumb_p()) {
3333         if ((r0|r1|r2) < 8)
3334             T1_LDR(r0, r1, r2);
3335         else
3336             T2_LDR(r0, r1, r2);
3337     }
3338     else
3339         LDR(r0, r1, r2);
3340 }
3341
3342 static void
3343 _ldxi_i(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
3344 {
3345     jit_int32_t         reg;
3346     if (jit_thumb_p()) {
3347         if ((r0|r1) < 8 && i0 >= 0 && !(i0 & 3) && (i0 >> 2) < 0x20)
3348             T1_LDRI(r0, r1, i0 >> 2);
3349         else if (r1 == _R13_REGNO && r0 < 8 &&
3350                  i0 >= 0 && !(i0 & 3) && (i0 >> 2) <= 255)
3351             T1_LDRISP(r0, i0 >> 2);
3352         else if (jit_ldrt_strt_p() && i0 >= 0 && i0 <= 255)
3353             T2_LDRI(r0, r1, i0);
3354         else if (i0 < 0 && i0 > -255)
3355             T2_LDRIN(r0, r1, -i0);
3356         else if (i0 >= 0 && i0 <= 4095)
3357             T2_LDRWI(r0, r1, i0);
3358         else if (r0 != r1) {
3359             movi(r0, i0);
3360             if ((r0|r1) < 8)
3361                 T1_LDR(r0, r1, r0);
3362             else
3363                 T2_LDR(r0, r1, r0);
3364         }
3365         else {
3366             reg = jit_get_reg(jit_class_gpr);
3367             movi(rn(reg), i0);
3368             if ((r0|r1|rn(reg)) < 8)
3369                 T1_LDR(r0, r1, rn(reg));
3370             else
3371                 T2_LDR(r0, r1, rn(reg));
3372             jit_unget_reg(reg);
3373         }
3374     }
3375     else {
3376         if (i0 >= 0 && i0 <= 4095)
3377             LDRI(r0, r1, i0);
3378         else if (i0 < 0 && i0 >= -4095)
3379             LDRIN(r0, r1, -i0);
3380         else if (r0 != r1) {
3381             movi(r0, i0);
3382             LDR(r0, r1, r0);
3383         }
3384         else {
3385             reg = jit_get_reg(jit_class_gpr);
3386             movi(rn(reg), i0);
3387             LDR(r0, r1, rn(reg));
3388             jit_unget_reg(reg);
3389         }
3390     }
3391 }
3392
3393 static void
3394 _str_c(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3395 {
3396     if (jit_thumb_p())
3397         T2_STRBI(r1, r0, 0);
3398     else
3399         STRBI(r1, r0, 0);
3400 }
3401
3402 static void
3403 _sti_c(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0)
3404 {
3405     jit_int32_t         reg;
3406     reg = jit_get_reg(jit_class_gpr);
3407     movi(rn(reg), i0);
3408     if (jit_thumb_p())
3409         T2_STRBI(r0, rn(reg), 0);
3410     else
3411         STRBI(r0, rn(reg), 0);
3412     jit_unget_reg(reg);
3413 }
3414
3415 static void
3416 _stxr_c(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
3417 {
3418     if (jit_thumb_p()) {
3419         if ((r0|r1|r2) < 8)
3420             T1_STRB(r2, r1, r0);
3421         else
3422             T2_STRB(r2, r1, r0);
3423     }
3424     else
3425         STRB(r2, r1, r0);
3426 }
3427
3428 static void
3429 _stxi_c(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
3430 {
3431     jit_int32_t         reg;
3432     if (jit_thumb_p()) {
3433         if ((r0|r1) < 8 && i0 >= 0 && i0 < 0x20)
3434             T1_STRBI(r1, r0, i0);
3435         else if (jit_ldrt_strt_p() && i0 >= 0 && i0 <= 255)
3436             T2_STRBI(r1, r0, i0);
3437         else if (i0 < 0 && i0 >= -255)
3438             T2_STRBIN(r1, r0, -i0);
3439         else if (i0 >= 0 && i0 <= 4095)
3440             T2_STRBWI(r1, r0, i0);
3441         else {
3442             reg = jit_get_reg(jit_class_gpr);
3443             movi(rn(reg), i0);
3444             if ((r0|r1|rn(reg)) < 8)
3445                 T1_STRB(r1, r0, rn(reg));
3446             else
3447                 T2_STRB(r1, r0, rn(reg));
3448             jit_unget_reg(reg);
3449         }
3450     }
3451     else {
3452         if (i0 >= 0 && i0 <= 4095)
3453             STRBI(r1, r0, i0);
3454         else if (i0 < 0 && i0 >= -4095)
3455             STRBIN(r1, r0, -i0);
3456         else {
3457             reg = jit_get_reg(jit_class_gpr);
3458             movi(rn(reg), i0);
3459             STRB(r1, r0, rn(reg));
3460             jit_unget_reg(reg);
3461         }
3462     }
3463 }
3464
3465 static void
3466 _str_s(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3467 {
3468     if (jit_thumb_p())
3469         T2_STRHI(r1, r0, 0);
3470     else
3471         STRHI(r1, r0, 0);
3472 }
3473
3474 static void
3475 _sti_s(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0)
3476 {
3477     jit_int32_t         reg;
3478     reg = jit_get_reg(jit_class_gpr);
3479     movi(rn(reg), i0);
3480     if (jit_thumb_p())
3481         T2_STRHI(r0, rn(reg), 0);
3482     else
3483         STRHI(r0, rn(reg), 0);
3484     jit_unget_reg(reg);
3485 }
3486
3487 static void
3488 _stxr_s(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
3489 {
3490     if (jit_thumb_p()) {
3491         if ((r0|r1|r2) < 8)
3492             T1_STRH(r2, r1, r0);
3493         else
3494             T2_STRH(r2, r1, r0);
3495     }
3496     else
3497         STRH(r2, r1, r0);
3498 }
3499
3500 static void
3501 _stxi_s(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
3502 {
3503     jit_int32_t         reg;
3504     if (jit_thumb_p()) {
3505         if ((r0|r1) < 8 && i0 >= 0 && !(i0 & 1) && (i0 >> 1) < 0x20)
3506             T1_STRHI(r1, r0, i0 >> 1);
3507         else if (jit_ldrt_strt_p() && i0 >= 0 && i0 <= 255)
3508             T2_STRHI(r1, r0, i0);
3509         else if (i0 < 0 && i0 >= -255)
3510             T2_STRHIN(r1, r0, -i0);
3511         else if (i0 >= 0 && i0 <= 4095)
3512             T2_STRHWI(r1, r0, i0);
3513         else {
3514             reg = jit_get_reg(jit_class_gpr);
3515             movi(rn(reg), i0);
3516             if ((r0|r1|rn(reg)) < 8)
3517                 T1_STRH(r1, r0, rn(reg));
3518             else
3519                 T2_STRH(r1, r0, rn(reg));
3520             jit_unget_reg(reg);
3521         }
3522     }
3523     else {
3524         if (i0 >= 0 && i0 <= 255)
3525             STRHI(r1, r0, i0);
3526         else if (i0 < 0 && i0 >= -255)
3527             STRHIN(r1, r0, -i0);
3528         else {
3529             reg = jit_get_reg(jit_class_gpr);
3530             movi(rn(reg), i0);
3531             STRH(r1, r0, rn(reg));
3532             jit_unget_reg(reg);
3533         }
3534     }
3535 }
3536
3537 static void
3538 _str_i(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3539 {
3540     if (jit_thumb_p())
3541         T2_STRI(r1, r0, 0);
3542     else
3543         STRI(r1, r0, 0);
3544 }
3545
3546 static void
3547 _sti_i(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0)
3548 {
3549     jit_int32_t         reg;
3550     reg = jit_get_reg(jit_class_gpr);
3551     movi(rn(reg), i0);
3552     if (jit_thumb_p())
3553         T2_STRI(r0, rn(reg), 0);
3554     else
3555         STRI(r0, rn(reg), 0);
3556     jit_unget_reg(reg);
3557 }
3558
3559 static void
3560 _stxr_i(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
3561 {
3562     if (jit_thumb_p()) {
3563         if ((r0|r1|r2) < 8)
3564             T1_STR(r2, r1, r0);
3565         else
3566             T2_STR(r2, r1, r0);
3567     }
3568     else
3569         STR(r2, r1, r0);
3570 }
3571
3572 static void
3573 _stxi_i(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
3574 {
3575     jit_int32_t         reg;
3576     if (jit_thumb_p()) {
3577         if ((r0|r1) < 8 && i0 >= 0 && !(i0 & 3) && (i0 >> 2) < 0x20)
3578             T1_STRI(r1, r0, i0 >> 2);
3579         else if (r0 == _R13_REGNO && r1 < 8 &&
3580                  i0 >= 0 && !(i0 & 3) && (i0 >> 2) <= 255)
3581             T1_STRISP(r1, i0 >> 2);
3582         else if (jit_ldrt_strt_p() && i0 >= 0 && i0 <= 255)
3583             T2_STRI(r1, r0, i0);
3584         else if (i0 < 0 && i0 >= -255)
3585             T2_STRIN(r1, r0, -i0);
3586         else if (i0 >= 0 && i0 <= 4095)
3587             T2_STRWI(r1, r0, i0);
3588         else {
3589             reg = jit_get_reg(jit_class_gpr);
3590             movi(rn(reg), i0);
3591             if ((r0|r1|rn(reg)) < 8)
3592                 T1_STR(r1, r0, rn(reg));
3593             else
3594                 T2_STR(r1, r0, rn(reg));
3595             jit_unget_reg(reg);
3596         }
3597     }
3598     else {
3599         if (i0 >= 0 && i0 <= 4095)
3600             STRI(r1, r0, i0);
3601         else if (i0 < 0 && i0 >= -4095)
3602             STRIN(r1, r0, -i0);
3603         else {
3604             reg = jit_get_reg(jit_class_gpr);
3605             movi(rn(reg), i0);
3606             STR(r1, r0, rn(reg));
3607             jit_unget_reg(reg);
3608         }
3609     }
3610 }
3611
3612 #  if __BYTE_ORDER == __LITTLE_ENDIAN
3613 static void
3614 _htonr_us(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3615 {
3616     jit_int32_t         t0;
3617     if (jit_thumb_p()) {
3618         if ((r0|r1) < 8)
3619             T1_REV(r0, r1);
3620         else
3621             T2_REV(r0, r1);
3622         rshi_u(r0, r0, 16);
3623     }
3624     else {
3625         if (jit_armv6_p()) {
3626             REV(r0, r1);
3627             rshi_u(r0, r0, 16);
3628         }
3629         else {
3630             t0 = jit_get_reg(jit_class_gpr);
3631             rshi(rn(t0), r1, 8);
3632             andi(r0, r1, 0xff);
3633             andi(rn(t0), rn(t0), 0xff);
3634             lshi(r0, r0, 8);
3635             orr(r0, r0, rn(t0));
3636             jit_unget_reg(t0);
3637         }
3638     }
3639 }
3640
3641 /* inline glibc htonl (without register clobber) */
3642 static void
3643 _htonr_ui(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3644 {
3645     jit_int32_t         reg;
3646     if (jit_thumb_p()) {
3647         if ((r0|r1) < 8)
3648             T1_REV(r0, r1);
3649         else
3650             T2_REV(r0, r1);
3651     }
3652     else {
3653         if (jit_armv6_p())
3654             REV(r0, r1);
3655         else {
3656             reg = jit_get_reg(jit_class_gpr);
3657             EOR_SI(rn(reg), r1, r1, ARM_ROR, 16);
3658             LSRI(rn(reg), rn(reg), 8);
3659             BICI(rn(reg), rn(reg), encode_arm_immediate(0xff00));
3660             EOR_SI(r0, rn(reg), r1, ARM_ROR, 8);
3661             jit_unget_reg(reg);
3662         }
3663     }
3664 }
3665 #endif
3666
3667 static void
3668 _extr_c(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3669 {
3670     if (jit_thumb_p()) {
3671         if ((r0|r1) < 8)
3672             T1_SXTB(r0, r1);
3673         else
3674             T2_SXTB(r0, r1);
3675     }
3676     else {
3677         if (jit_armv6_p())
3678             SXTB(r0, r1);
3679         else {
3680             LSLI(r0, r1, 24);
3681             ASRI(r0, r0, 24);
3682         }
3683     }
3684 }
3685
3686 static void
3687 _extr_uc(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3688 {
3689     if (jit_thumb_p()) {
3690         if ((r0|r1) < 8)
3691             T1_UXTB(r0, r1);
3692         else
3693             T2_UXTB(r0, r1);
3694     }
3695     else {
3696         if (jit_armv6_p())
3697             UXTB(r0, r1);
3698         else
3699             ANDI(r0, r1, 0xff);
3700     }
3701 }
3702
3703 static void
3704 _extr_s(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3705 {
3706     if (jit_thumb_p()) {
3707         if ((r0|r1) < 8)
3708             T1_SXTH(r0, r1);
3709         else
3710             T2_SXTH(r0, r1);
3711     }
3712     else {
3713         if (jit_armv6_p())
3714             SXTH(r0, r1);
3715         else {
3716             LSLI(r0, r1, 16);
3717             ASRI(r0, r0, 16);
3718         }
3719     }
3720 }
3721
3722 static void
3723 _extr_us(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3724 {
3725     if (jit_thumb_p()) {
3726         if ((r0|r1) < 8)
3727             T1_UXTH(r0, r1);
3728         else
3729             T2_UXTH(r0, r1);
3730     }
3731     else {
3732         if (jit_armv6_p())
3733             UXTH(r0, r1);
3734         else {
3735             LSLI(r0, r1, 16);
3736             LSRI(r0, r0, 16);
3737         }
3738     }
3739 }
3740
3741 static void
3742 _callr(jit_state_t *_jit, jit_int32_t r0)
3743 {
3744     if (jit_thumb_p())
3745         T1_BLX(r0);
3746     else
3747         BLX(r0);
3748 }
3749
3750 static void
3751 _calli(jit_state_t *_jit, jit_word_t i0)
3752 {
3753     jit_word_t          d;
3754     jit_int32_t         reg;
3755     d = ((i0 - _jit->pc.w) >> 2) - 2;
3756     if (!jit_exchange_p() && !jit_thumb_p() && _s24P(d))
3757         BLI(d & 0x00ffffff);
3758     else {
3759         reg = jit_get_reg(jit_class_gpr);
3760         movi(rn(reg), i0);
3761         if (jit_thumb_p())
3762             T1_BLX(rn(reg));
3763         else
3764             BLX(rn(reg));
3765         jit_unget_reg(reg);
3766     }
3767 }
3768
3769 static jit_word_t
3770 _calli_p(jit_state_t *_jit, jit_word_t i0)
3771 {
3772     jit_word_t          w;
3773     jit_int32_t         reg;
3774     reg = jit_get_reg(jit_class_gpr);
3775     w = _jit->pc.w;
3776     movi_p(rn(reg), i0);
3777     if (jit_thumb_p())
3778         T1_BLX(rn(reg));
3779     else
3780         BLX(rn(reg));
3781     jit_unget_reg(reg);
3782     return (w);
3783 }
3784
3785 static void
3786 _prolog(jit_state_t *_jit, jit_node_t *node)
3787 {
3788     jit_int32_t         reg;
3789     if (_jitc->function->define_frame || _jitc->function->assume_frame) {
3790         jit_int32_t     frame = -_jitc->function->frame;
3791         assert(_jitc->function->self.aoff >= frame);
3792         if (_jitc->function->assume_frame) {
3793             if (jit_thumb_p() && !_jitc->thumb)
3794                 _jitc->thumb = _jit->pc.w;
3795             return;
3796         }
3797         _jitc->function->self.aoff = frame;
3798     }
3799     if (_jitc->function->allocar)
3800         _jitc->function->self.aoff &= -8;
3801     _jitc->function->stack = ((_jitc->function->self.alen -
3802                               /* align stack at 8 bytes */
3803                               _jitc->function->self.aoff) + 7) & -8;
3804
3805     if (jit_thumb_p()) {
3806         /*  switch to thumb mode (better approach would be to
3807          * ORR 1 address being called, but no clear distinction
3808          * of what is a pointer to a jit function, or if patching
3809          * a pointer to a jit function) */
3810         ADDI(_R12_REGNO, _R15_REGNO, 1);
3811         BX(_R12_REGNO);
3812         if (!_jitc->thumb)
3813             _jitc->thumb = _jit->pc.w;
3814         if (jit_cpu.abi) {
3815             T2_PUSH(0xf);
3816             T2_PUSH(0x3f0|(1<<_FP_REGNO)|(1<<_LR_REGNO));
3817             VPUSH_F64(_D8_REGNO, 8);
3818         }
3819         else {
3820             T2_PUSH(0xf);
3821             T2_PUSH(0x3f0|(1<<_FP_REGNO)|(1<<_LR_REGNO));
3822         }
3823     }
3824     else {
3825         if (jit_cpu.abi) {
3826             PUSH(0xf);
3827             PUSH(0x3f0|(1<<_FP_REGNO)|(1<<_LR_REGNO));
3828             VPUSH_F64(_D8_REGNO, 8);
3829         }
3830         else {
3831             PUSH(0xf);
3832             PUSH(0x3f0|(1<<_FP_REGNO)|(1<<_LR_REGNO));
3833         }
3834     }
3835     movr(_FP_REGNO, _SP_REGNO);
3836     if (_jitc->function->stack)
3837         subi(_SP_REGNO, _SP_REGNO, _jitc->function->stack);
3838     if (_jitc->function->allocar) {
3839         reg = jit_get_reg(jit_class_gpr);
3840         movi(rn(reg), _jitc->function->self.aoff);
3841         stxi_i(_jitc->function->aoffoff, _FP_REGNO, rn(reg));
3842         jit_unget_reg(reg);
3843     }
3844 }
3845
3846 static void
3847 _epilog(jit_state_t *_jit, jit_node_t *node)
3848 {
3849     if (_jitc->function->assume_frame)
3850         return;
3851
3852     movr(_SP_REGNO, _FP_REGNO);
3853     if (jit_cpu.abi)
3854         VPOP_F64(_D8_REGNO, 8);
3855     if (jit_thumb_p())
3856         T2_POP(0x3f0|(1<<_FP_REGNO)|(1<<_LR_REGNO));
3857     else
3858         POP(0x3f0|(1<<_FP_REGNO)|(1<<_LR_REGNO));
3859     addi(_SP_REGNO, _SP_REGNO, 16);
3860     if (jit_thumb_p())
3861         T1_BX(_LR_REGNO);
3862     else
3863         BX(_LR_REGNO);
3864     if (jit_thumb_p() && (_jit->pc.w & 2))
3865         T1_NOP();
3866 }
3867
3868 static void
3869 _vastart(jit_state_t *_jit, jit_int32_t r0)
3870 {
3871     assert(_jitc->function->self.call & jit_call_varargs);
3872
3873     /* Initialize stack pointer to the first stack argument.
3874      * The -16 is to account for the 4 argument registers
3875      * always saved, and _jitc->function->vagp is to account
3876      * for declared arguments. */
3877     addi(r0, _FP_REGNO, _jitc->function->self.size -
3878          16 + _jitc->function->vagp);
3879 }
3880
3881 static void
3882 _vaarg(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3883 {
3884     assert(_jitc->function->self.call & jit_call_varargs);
3885
3886     /* Load argument. */
3887     ldr(r0, r1);
3888
3889     /* Update stack pointer. */
3890     addi(r1, r1, sizeof(jit_word_t));
3891 }
3892
3893 static void
3894 _patch_at(jit_state_t *_jit,
3895           jit_int32_t kind, jit_word_t instr, jit_word_t label)
3896 {
3897     jit_word_t           d;
3898     jit_thumb_t          thumb;
3899     union {
3900         jit_int16_t     *s;
3901         jit_int32_t     *i;
3902         jit_word_t       w;
3903     } u;
3904     u.w = instr;
3905     if (kind == arm_patch_jump) {
3906         if (jit_thumb_p() && (jit_uword_t)instr >= _jitc->thumb) {
3907             code2thumb(thumb.s[0], thumb.s[1], u.s[0], u.s[1]);
3908             if ((thumb.i & THUMB2_B) == THUMB2_B) {
3909                 d = ((label - instr) >> 1) - 2;
3910                 assert(_s24P(d));
3911                 thumb.i = THUMB2_B | encode_thumb_jump(d);
3912                 thumb2code(thumb.s[0], thumb.s[1], u.s[0], u.s[1]);
3913             }
3914             else if ((thumb.i & THUMB2_B) == THUMB2_CC_B) {
3915                 d = ((label - instr) >> 1) - 2;
3916                 assert(_s20P(d));
3917                 thumb.i = THUMB2_CC_B | (thumb.i & 0x3c00000) |
3918                           encode_thumb_cc_jump(d);
3919                 thumb2code(thumb.s[0], thumb.s[1], u.s[0], u.s[1]);
3920             }
3921             else {
3922                 /* for the sake of simplicity in case choose to
3923                  * movw+movt+[bx|blx], e.g. if changing to instead
3924                  * of asserting target is reachable, load constant
3925                  * and do indirect jump if not reachable */
3926                 if ((thumb.i & 0xfbf00000) == THUMB2_MOVWI)
3927                     goto indirect_jump;
3928                 assert(!"handled branch opcode");
3929             }
3930         }
3931         else {
3932             thumb.i = u.i[0];
3933             /* 0x0e000000 because 0x01000000 is (branch&) link modifier */
3934             assert((thumb.i & 0x0e000000) == ARM_B);
3935             d = ((label - instr) >> 2) - 2;
3936             assert(_s24P(d));
3937             u.i[0] = (thumb.i & 0xff000000) | (d & 0x00ffffff);
3938         }
3939     }
3940     else if (kind == arm_patch_load) {
3941         /* offset may be negative for a forward patch because it
3942          * is relative to pc + 8, for example:
3943          *          ldr r0, [pc, #-4]
3944          *          bx r0               ;; [pc, #-8]
3945          *          .data ...           ;; [pc, #-4]
3946          *          ...                 ;; [pc]
3947          */
3948         assert(!jit_thumb_p());
3949         thumb.i = u.i[0];
3950         assert((thumb.i & 0x0f700000) == ARM_LDRI);
3951         d = label - (instr + 8);
3952         if (d < 0) {
3953             thumb.i &= ~ARM_P;
3954             d = -d;
3955         }
3956         else
3957             thumb.i |= ARM_P;
3958         assert(!(d & 0xfffff000));
3959         u.i[0] = (thumb.i & 0xfffff000) | d;
3960     }
3961     else if (kind == arm_patch_word) {
3962         if (jit_thumb_p()) {
3963             code2thumb(thumb.s[0], thumb.s[1], u.s[0], u.s[1]);
3964             assert((thumb.i & 0xfbf00000) == THUMB2_MOVWI);
3965         indirect_jump:
3966             thumb.i = ((thumb.i & 0xfbf00f00) |
3967                        ( (label & 0x0000f000) <<  4) |
3968                        ( (label & 0x00000800) << 15) |
3969                        ( (label & 0x00000700) <<  4) |
3970                        (  label & 0x000000ff));
3971             thumb2code(thumb.s[0], thumb.s[1], u.s[0], u.s[1]);
3972             label >>= 16;
3973             code2thumb(thumb.s[0], thumb.s[1], u.s[2], u.s[3]);
3974             assert((thumb.i & 0xfbf00000) == THUMB2_MOVTI);
3975             thumb.i = ((thumb.i & 0xfbf00f00) |
3976                        ( (label & 0x0000f000) <<  4) |
3977                        ( (label & 0x00000800) << 15) |
3978                        ( (label & 0x00000700) <<  4) |
3979                        (  label & 0x000000ff));
3980             thumb2code(thumb.s[0], thumb.s[1], u.s[2], u.s[3]);
3981         }
3982         else
3983             u.i[0] = label;
3984     }
3985     else
3986         assert(!"handled patch");
3987 }
3988 #endif