1 /*
2  * Copyright (C) 2012-2019  Free Software Foundation, Inc.
3  *
4  * This file is part of GNU lightning.
5  *
6  * GNU lightning is free software; you can redistribute it and/or modify it
7  * under the terms of the GNU Lesser General Public License as published
8  * by the Free Software Foundation; either version 3, or (at your option)
9  * any later version.
10  *
11  * GNU lightning is distributed in the hope that it will be useful, but
12  * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
13  * or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
14  * License for more details.
15  *
16  * Authors:
17  *	Paulo Cesar Pereira de Andrade
18  */
19 
20 #if PROTO
21 #  define stxi(i0,r0,r1)		stxi_i(i0,r0,r1)
22 #  define ldxi(r0,r1,i0)		ldxi_i(r0,r1,i0)
23 #  define ldr(r0,r1)			ldr_i(r0,r1)
/*
 * Range predicates: non-zero when d lies in the signed 20-bit (_s20P) or
 * signed 24-bit (_s24P) range.  Every use of the argument is parenthesized
 * so that compound expressions (e.g. `c ? a : b') are tested as a whole.
 */
#  define _s20P(d)			((d) >= -(int)0x80000 && (d) <= 0x7ffff)
#  define _s24P(d)			((d) >= -(int)0x800000 && (d) <= 0x7fffff)
26 #  define _u3(v)			((v) & 0x7)
27 #  define _u4(v)			((v) & 0xf)
28 #  define _u5(v)			((v) & 0x1f)
29 #  define _u8(v)			((v) & 0xff)
30 #  define _u12(v)			((v) & 0xfff)
31 #  define _u13(v)			((v) & 0x1fff)
32 #  define _u16(v)			((v) & 0xffff)
33 #  define _u24(v)			((v) & 0xffffff)
34 #  define jit_thumb_p()			jit_cpu.thumb
35 #  define jit_no_set_flags()		_jitc->no_set_flags
36 #  define jit_armv5_p()			(jit_cpu.version >= 5)
37 #  define jit_armv5e_p()		(jit_cpu.version > 5 || (jit_cpu.version == 5 && jit_cpu.extend))
38 #  define jit_armv6_p()			(jit_cpu.version >= 6)
39 #  define jit_armv7r_p()		0
40 #  define stack_framesize		48
41 extern int	__aeabi_idivmod(int, int);
42 extern unsigned	__aeabi_uidivmod(unsigned, unsigned);
43 #  define _R0_REGNO			0x00
44 #  define _R1_REGNO			0x01
45 #  define _R2_REGNO			0x02
46 #  define _R3_REGNO			0x03
47 #  define _R4_REGNO			0x04
48 #  define _R5_REGNO			0x05
49 #  define _R6_REGNO			0x06
50 #  define _R7_REGNO			0x07
51 #  define _R8_REGNO			0x08
52 #  define _R9_REGNO			0x09
53 #  define _R10_REGNO			0x0a
54 #  define _R11_REGNO			0x0b
55 #  define _R12_REGNO			0x0c
56 #  define _R13_REGNO			0x0d
57 #  define _R14_REGNO			0x0e
58 #  define _R15_REGNO			0x0f
59 #  define _FP_REGNO			_R11_REGNO
60 #  define _SP_REGNO			_R13_REGNO
61 #  define _LR_REGNO			_R14_REGNO
62 #  define _PC_REGNO			_R15_REGNO
63 #  define ARM_CC_EQ			0x00000000	/* Z=1 */
64 #  define ARM_CC_NE			0x10000000	/* Z=0 */
65 #  define ARM_CC_HS			0x20000000	/* C=1 */
66 #    define ARM_CC_CS			ARM_CC_HS
67 #  define ARM_CC_LO			0x30000000	/* C=0 */
68 #    define ARM_CC_CC			ARM_CC_LO
69 #  define ARM_CC_MI			0x40000000	/* N=1 */
70 #  define ARM_CC_PL			0x50000000	/* N=0 */
71 #  define ARM_CC_VS			0x60000000	/* V=1 */
72 #  define ARM_CC_VC			0x70000000	/* V=0 */
73 #  define ARM_CC_HI			0x80000000	/* C=1 && Z=0 */
74 #  define ARM_CC_LS			0x90000000	/* C=0 || Z=1 */
75 #  define ARM_CC_GE			0xa0000000	/* N=V */
76 #  define ARM_CC_LT			0xb0000000	/* N!=V */
77 #  define ARM_CC_GT			0xc0000000	/* Z=0 && N=V */
78 #  define ARM_CC_LE			0xd0000000	/* Z=1 || N!=V */
79 #  define ARM_CC_AL			0xe0000000	/* always */
80 #  define ARM_CC_NV			0xf0000000	/* reserved */
81 #  define THUMB2_IT			0
82 #  define THUMB2_ITT			1
83 #  define THUMB2_ITE			2
84 #  define THUMB2_ITTT			3
85 #  define THUMB2_ITET			4
86 #  define THUMB2_ITTE			5
87 #  define THUMB2_ITEE			6
88 #  define THUMB2_ITTTT			7
89 #  define THUMB2_ITETT			8
90 #  define THUMB2_ITTET			9
91 #  define THUMB2_ITEET			10
92 #  define THUMB2_ITTTE			11
93 #  define THUMB2_ITETE			12
94 #  define THUMB2_ITTEE			13
95 #  define THUMB2_ITEEE			14
96 #  define ARM_MOV			0x01a00000
97 #  define THUMB_MOV			    0x4600
98 #  define ARM_MOVWI			0x03000000	/* v6t2, v7 */
99 #  define THUMB_MOVI			    0x2000
100 #  define THUMB2_MOVI			0xf0400000
101 #  define THUMB2_MOVWI			0xf2400000
102 #  define ARM_MOVTI			0x03400000
103 #  define THUMB2_MOVTI			0xf2c00000
104 #  define ARM_MVN			0x01e00000
105 #  define THUMB_MVN			    0x43c0
106 #  define THUMB2_MVN			0xea600000
107 #  define THUMB2_MVNI			0xf0600000
108 #  define ARM_I				0x02000000 /* immediate */
109 #  define ARM_S				0x00100000 /* set flags */
110 #  define ARM_ADD			0x00800000
111 #  define THUMB_ADD			    0x1800
112 #  define THUMB_ADDX			    0x4400
113 #  define THUMB2_ADD			0xeb000000
114 #  define THUMB_ADDI3			    0x1c00
115 #  define THUMB_ADDI8			    0x3000
116 #  define THUMB2_ADDI			0xf1000000
117 #  define THUMB2_ADDWI			0xf2000000
118 #  define ARM_ADC			0x00a00000
119 #  define THUMB_ADC			    0x4140
120 #  define THUMB2_ADC			0xeb400000
121 #  define THUMB2_ADCI			0xf1400000
122 #  define ARM_SUB			0x00400000
123 #  define THUMB_SUB			    0x1a00
124 #  define THUMB2_SUB			0xeba00000
125 #  define THUMB_SUBI3			    0x1e00
126 #  define THUMB_SUBI8			    0x3800
127 #  define THUMB2_SUBI			0xf1a00000
128 #  define THUMB2_SUBWI			0xf2a00000
129 #  define ARM_SBC			0x00c00000
130 #  define THUMB_SBC			    0x4180
131 #  define THUMB2_SBC			0xeb600000
132 #  define THUMB2_SBCI			0xf1600000
/*
 * Reverse-subtract opcodes.  THUMB2_RSB is the Thumb-2 register form that
 * T2_RSB() expands to; THUMB_RSBI and THUMB2_RSBI are the immediate forms.
 */
#  define ARM_RSB			0x00600000
#  define THUMB_RSBI			    0x4240
#  define THUMB2_RSB			0xebc00000
#  define THUMB2_RSBI			0xf1c00000
136 #  define ARM_MUL			0x00000090
137 #  define THUMB_MUL			    0x4340
138 #  define THUMB2_MUL			0xfb00f000
139 #  define ARM_UMULL			0x00800090
140 #  define THUMB2_UMULL			0xfba00000
141 #  define ARM_SMULL			0x00c00090
142 #  define THUMB2_SMULL			0xfb800000
143 #  define THUMB2_SDIV			0xfb90f0f0
144 #  define THUMB2_UDIV			0xfbb0f0f0
145 #  define ARM_AND			0x00000000
146 #  define THUMB_AND			    0x4000
147 #  define THUMB2_AND			0xea000000
148 #  define THUMB2_ANDI			0xf0000000
149 #  define ARM_BIC			0x01c00000
150 #  define THUMB2_BIC			0xea200000
151 #  define THUMB2_BICI			0xf0200000
152 #  define ARM_ORR			0x01800000
153 #  define THUMB_ORR			    0x4300
154 #  define THUMB2_ORR			0xea400000
155 #  define THUMB2_ORRI			0xf0400000
156 #  define ARM_EOR			0x00200000
157 #  define THUMB_EOR			    0x4040
158 #  define THUMB2_EOR			0xea800000
159 #  define THUMB2_EORI			0xf0800000
160 /* >> ARMv6* */
161 #  define ARM_REV			0x06bf0f30
162 #  define THUMB_REV			    0xba00
163 #  define THUMB2_REV			0xfa90f080
164 #  define ARM_REV16			0x06bf0fb0
165 #  define THUMB_REV16			    0xba40
166 #  define THUMB2_REV16			0xfa90f090
167 #  define ARM_SXTB			0x06af0070
168 #  define THUMB_SXTB			    0xb240
169 #  define THUMB2_SXTB			0xfa40f080
170 #  define ARM_UXTB			0x06ef0070
171 #  define THUMB_UXTB			    0xb2c0
172 #  define THUMB2_UXTB			0xfa50f080
173 #  define ARM_SXTH			0x06bf0070
174 #  define THUMB_SXTH			    0xb200
175 #  define THUMB2_SXTH			0xfa00f080
176 #  define ARM_UXTH			0x06ff0070
177 #  define THUMB_UXTH			    0xb280
178 #  define THUMB2_UXTH			0xfa10f080
179 #  define ARM_XTR8			0x00000400 /* ?xt? rotate 8 bits */
180 #  define ARM_XTR16			0x00000800 /* ?xt? rotate 16 bits */
181 #  define ARM_XTR24			0x00000c00 /* ?xt? rotate 24 bits */
182 /* << ARMv6* */
183 #  define ARM_SHIFT			0x01a00000
184 #  define ARM_R				0x00000010 /* register shift */
185 #  define ARM_LSL			0x00000000
186 #  define THUMB_LSL			    0x4080
187 #  define THUMB2_LSL			0xfa00f000
188 #  define THUMB_LSLI			    0x0000
189 #  define THUMB2_LSLI			0xea4f0000
190 #  define ARM_LSR			0x00000020
191 #  define THUMB_LSR			    0x40c0
192 #  define THUMB2_LSR			0xfa20f000
193 #  define THUMB_LSRI			    0x0800
194 #  define THUMB2_LSRI			0xea4f0010
195 #  define ARM_ASR			0x00000040
196 #  define THUMB_ASR			    0x4100
197 #  define THUMB2_ASR			0xfa40f000
198 #  define THUMB_ASRI			    0x1000
199 #  define THUMB2_ASRI			0xea4f0020
200 #  define ARM_ROR			0x00000060
201 #  define ARM_CMP			0x01500000
202 #  define THUMB_CMP			    0x4280
203 #  define THUMB_CMPX			    0x4500
204 #  define THUMB2_CMP			0xebb00000
205 #  define THUMB_CMPI			    0x2800
206 #  define THUMB2_CMPI			0xf1b00000
207 #  define ARM_CMN			0x01700000
208 #  define THUMB_CMN			    0x42c0
209 #  define THUMB2_CMN			0xeb100000
210 #  define THUMB2_CMNI			0xf1100000
211 #  define ARM_TST			0x01100000
212 #  define THUMB_TST			    0x4200
213 #  define THUMB2_TST			0xea100000
214 #  define THUMB2_TSTI			0xf0100000
215 #  define ARM_TEQ			0x01300000
216 /* branch */
217 #  define ARM_BX			0x012fff10
218 #  define ARM_BLX			0x012fff30
219 #  define THUMB_BLX			    0x4780
220 #  define ARM_BLXI			0xfa000000
221 #  define THUMB2_BLXI			0xf000c000
222 #  define ARM_B				0x0a000000
223 #  define THUMB_CC_B			    0xd000
224 #  define THUMB_B			    0xe000
225 #  define THUMB2_CC_B			0xf0008000
226 #  define THUMB2_B			0xf0009000
227 #  define ARM_BLI			0x0b000000
228 #  define THUMB2_BLI			0xf000d000
229 /* ldr/str */
230 #  define ARM_P				0x00800000 /* positive offset */
231 #  define THUMB2_P			0x00000400
232 #  define THUMB2_U			0x00000200
233 #  define THUMB2_W			0x00000100
234 #  define ARM_LDRSB			0x011000d0
235 #  define THUMB_LDRSB			    0x5600
236 #  define THUMB2_LDRSB			0xf9100000
237 #  define ARM_LDRSBI			0x015000d0
238 #  define THUMB2_LDRSBI			0xf9100c00
239 #  define THUMB2_LDRSBWI		0xf9900000
240 #  define ARM_LDRB			0x07500000
241 #  define THUMB_LDRB			    0x5c00
242 #  define THUMB2_LDRB			0xf8100000
243 #  define ARM_LDRBI			0x05500000
244 #  define THUMB_LDRBI			    0x7800
245 #  define THUMB2_LDRBI			0xf8100c00
246 #  define THUMB2_LDRBWI			0xf8900000
247 #  define ARM_LDRSH			0x011000f0
248 #  define THUMB_LDRSH			    0x5e00
249 #  define THUMB2_LDRSH			0xf9300000
250 #  define ARM_LDRSHI			0x015000f0
251 #  define THUMB2_LDRSHI			0xf9300c00
252 #  define THUMB2_LDRSHWI		0xf9b00000
253 #  define ARM_LDRH			0x011000b0
254 #  define THUMB_LDRH			    0x5a00
255 #  define THUMB2_LDRH			0xf8300000
256 #  define ARM_LDRHI			0x015000b0
257 #  define THUMB_LDRHI			    0x8800
258 #  define THUMB2_LDRHI			0xf8300c00
259 #  define THUMB2_LDRHWI			0xf8b00000
260 #  define ARM_LDR			0x07100000
261 #  define THUMB_LDR			    0x5800
262 #  define THUMB2_LDR			0xf8500000
263 #  define ARM_LDRI			0x05100000
264 #  define THUMB_LDRI			    0x6800
265 #  define THUMB_LDRISP			    0x9800
266 #  define THUMB2_LDRI			0xf8500c00
267 #  define THUMB2_LDRWI			0xf8d00000
268 #  define ARM_LDRD			0x010000d0
269 #  define ARM_LDRDI			0x014000d0
270 #  define THUMB2_LDRDI			0xe8500000
271 #  define ARM_STRB			0x07400000
272 #  define THUMB_STRB			    0x5400
273 #  define THUMB2_STRB			0xf8000000
274 #  define ARM_STRBI			0x05400000
275 #  define THUMB_STRBI			    0x7000
276 #  define THUMB2_STRBI			0xf8000c00
277 #  define THUMB2_STRBWI			0xf8800000
278 #  define ARM_STRH			0x010000b0
279 #  define THUMB_STRH			    0x5200
280 #  define THUMB2_STRH			0xf8200000
281 #  define ARM_STRHI			0x014000b0
282 #  define THUMB_STRHI			    0x8000
283 #  define THUMB2_STRHI			0xf8200c00
284 #  define THUMB2_STRHWI			0xf8a00000
/* str: opcode constants for the ARM, Thumb and Thumb-2 encodings */
#  define ARM_STR			0x07000000
#  define THUMB_STR			    0x5000
#  define THUMB2_STR			0xf8400000
/* stri: listed in the same order as the ldri constants */
#  define ARM_STRI			0x05000000
#  define THUMB_STRI			    0x6000
#  define THUMB_STRISP			    0x9000
#  define THUMB2_STRI			0xf8400c00
#  define THUMB2_STRWI			0xf8c00000
/* strd / strdi */
#  define ARM_STRD			0x010000f0
#  define ARM_STRDI			0x014000f0
#  define THUMB2_STRDI			0xe8400000
296 /* ldm/stm */
297 #  define ARM_M				0x08000000
298 #  define ARM_M_L			0x00100000 /* load; store if not set */
299 #  define ARM_M_I			0x00800000 /* inc; dec if not set */
300 #  define ARM_M_B			0x01000000 /* before; after if not set */
301 #  define ARM_M_U			0x00200000 /* update Rn */
302 #  define THUMB2_LDM_W			0x00200000
303 #  define THUMB2_LDM_P			0x00008000
304 #  define THUMB2_LDM_M			0x00004000
305 #  define THUMB_LDMIA			    0xc800
306 #  define THUMB2_LDMIA			0xe8900000
307 #  define THUMB2_LDMB			0xe9100000
308 #  define THUMB_PUSH			    0xb400
309 #  define THUMB2_PUSH			0xe92d0000
310 #  define THUMB_POP			    0xbc00
311 #  define THUMB2_POP			0xe8bd0000
/*
 * Raw emitters: store the value through _jit->pc.ui (ii) or _jit->pc.us
 * (is) and post-increment that pointer.
 */
#  define ii(word)			*_jit->pc.ui++ = word
#  define is(half)			*_jit->pc.us++ = half
/*
 * iss() emits two values with is(); code2thumb()/thumb2code() copy a pair
 * between the (c0,c1) and (t0,t1) lvalues.  When __BYTE_ORDER equals
 * __LITTLE_ENDIAN the two elements of the pair are exchanged, otherwise
 * they are kept in argument order.
 */
#  if __BYTE_ORDER != __LITTLE_ENDIAN
#    define iss(first, second)		do { is(first); is(second); } while (0)
#    define code2thumb(t0, t1, c0, c1)	do { t0 = c0; t1 = c1; } while (0)
#    define thumb2code(t0, t1, c0, c1)	do { c0 = t0; c1 = t1; } while (0)
#  else
#    define iss(first, second)		do { is(second); is(first); } while (0)
#    define code2thumb(t0, t1, c0, c1)	do { t1 = c0; t0 = c1; } while (0)
#    define thumb2code(t0, t1, c0, c1)	do { c0 = t1; c1 = t0; } while (0)
#  endif
323 static int encode_arm_immediate(unsigned int v);
324 static int encode_thumb_immediate(unsigned int v);
325 static int encode_thumb_word_immediate(unsigned int v);
326 static int encode_thumb_jump(int v);
327 static int encode_thumb_cc_jump(int v);
328 static int encode_thumb_shift(int v, int type) maybe_unused;
329 #  define corrr(cc,o,rn,rd,rm)		_corrr(_jit,cc,o,rn,rd,rm)
330 static void _corrr(jit_state_t*,int,int,int,int,int);
331 #  define corri(cc,o,rn,rd,im)		_corri(_jit,cc,o,rn,rd,im)
332 static void _corri(jit_state_t*,int,int,int,int,int);
333 #define corri8(cc,o,rn,rt,im)	_corri8(_jit,cc,o,rn,rt,im)
334 static void _corri8(jit_state_t*,int,int,int,int,int);
335 #  define torrr(o,rn,rd,rm)		_torrr(_jit,o,rn,rd,rm)
336 static void _torrr(jit_state_t*,int,int,int,int);
337 #  define torrrs(o,rn,rd,rm,im)		_torrrs(_jit,o,rn,rd,rm,im)
338 static void _torrrs(jit_state_t*,int,int,int,int,int) maybe_unused;
339 #  define torxr(o,rn,rt,rm)		_torxr(_jit,o,rn,rt,rm)
340 static void _torxr(jit_state_t*,int,int,int,int);
341 #  define torrrr(o,rn,rl,rh,rm)		_torrrr(_jit,o,rn,rl,rh,rm)
342 static void _torrrr(jit_state_t*,int,int,int,int,int) maybe_unused;
343 #  define torrri8(o,rn,rt,rt2,im)	_torrri8(_jit,o,rn,rt,rt2,im)
344 static void _torrri8(jit_state_t*,int,int,int,int,int) maybe_unused;
345 #  define coriw(cc,o,rd,im)		_coriw(_jit,cc,o,rd,im)
346 static void _coriw(jit_state_t*,int,int,int,int);
347 #  define torri(o,rd,rn,im)		_torri(_jit,o,rd,rn,im)
348 static void _torri(jit_state_t*,int,int,int,int);
349 #  define torri8(o,rn,rt,im)		_torri8(_jit,o,rn,rt,im)
350 static void _torri8(jit_state_t*,int,int,int,int);
351 #  define torri12(o,rn,rt,im)		_torri12(_jit,o,rn,rt,im)
352 static void _torri12(jit_state_t*,int,int,int,int);
353 #  define tshift(o,rd,rm,im)		_tshift(_jit,o,rd,rm,im)
354 static void _tshift(jit_state_t*,int,int,int,int);
355 #  define toriw(o,rd,im)		_toriw(_jit,o,rd,im)
356 static void _toriw(jit_state_t*,int,int,int);
357 #  define tc8(cc,im)			_tc8(_jit,cc,im)
358 static void _tc8(jit_state_t*,int,int) maybe_unused;
359 #  define t11(im)			_t11(_jit,im)
360 static void _t11(jit_state_t*,int);
361 #  define tcb(cc,im)			_tcb(_jit,cc,im)
362 static void _tcb(jit_state_t*,int,int);
363 #  define blxi(im)			_blxi(_jit,im)
364 static void _blxi(jit_state_t*,int) maybe_unused;
365 #  define tb(o,im)			_tb(_jit,o,im)
366 static void _tb(jit_state_t*,int,int);
367 #  define corrrr(cc,o,rh,rl,rm,rn)	_corrrr(_jit,cc,o,rh,rl,rm,rn)
368 static void _corrrr(jit_state_t*,int,int,int,int,int,int);
369 #  define corrrs(cc,o,rn,rd,rm,im)	_corrrs(_jit,cc,o,rn,rd,rm,im)
370 static void _corrrs(jit_state_t*,int,int,int,int,int,int);
371 #  define cshift(cc,o,rd,rm,rn,im)	_cshift(_jit,cc,o,rd,rm,rn,im)
372 static void _cshift(jit_state_t*,int,int,int,int,int,int);
373 #  define cb(cc,o,im)			_cb(_jit,cc,o,im)
374 static void _cb(jit_state_t*,int,int,int);
375 #  define cbx(cc,o,rm)			_cbx(_jit,cc,o,rm)
376 static void _cbx(jit_state_t*,int,int,int);
377 #  define corl(cc,o,r0,i0)		_corl(_jit,cc,o,r0,i0)
378 static void _corl(jit_state_t*,int,int,int,int);
379 #  define c6orr(cc,o,r0,r1)		_c6orr(_jit,cc,o,r0,r1)
380 static void _c6orr(jit_state_t*,int,int,int,int);
381 #  define tcit(cc,it)			_tcit(_jit,cc,it)
382 static void _tcit(jit_state_t*,unsigned int,int);
383 #  define IT(cc)			tcit(cc,THUMB2_IT)
384 #  define ITT(cc)			tcit(cc,THUMB2_ITT)
385 #  define ITE(cc)			tcit(cc,THUMB2_ITE)
386 #  define ITTT(cc)			tcit(cc,THUMB2_ITTT)
387 #  define ITTE(cc)			tcit(cc,THUMB2_ITTE)
388 #  define ITET(cc)			tcit(cc,THUMB2_ITET)
389 #  define ITEE(cc)			tcit(cc,THUMB2_ITEE)
390 #  define ITTTT(cc)			tcit(cc,THUMB2_ITTTT)
391 #  define ITETT(cc)			tcit(cc,THUMB2_ITETT)
392 #  define ITTET(cc)			tcit(cc,THUMB2_ITTET)
393 #  define ITEET(cc)			tcit(cc,THUMB2_ITEET)
394 #  define ITTTE(cc)			tcit(cc,THUMB2_ITTTE)
395 #  define ITETE(cc)			tcit(cc,THUMB2_ITETE)
396 #  define ITTEE(cc)			tcit(cc,THUMB2_ITTEE)
397 #  define ITEEE(cc)			tcit(cc,THUMB2_ITEEE)
398 #  define tpp(o,im)			_tpp(_jit,o,im)
399 static void _tpp(jit_state_t*,int,int);
400 #  define torl(o,rn,im)			_torl(_jit,o,rn,im)
401 static void _torl(jit_state_t*,int,int,int) maybe_unused;
402 #  define CC_MOV(cc,rd,rm)		corrr(cc,ARM_MOV,0,rd,rm)
403 #  define MOV(rd,rm)			CC_MOV(ARM_CC_AL,rd,rm)
/*
 * 16-bit Thumb MOV: bit 3 of rd goes to bit 7, rm (4 bits) to bits 6..3 and
 * the low three bits of rd to bits 2..0.  rd is masked through _u3() so a
 * compound argument expression is not split by operator precedence.
 */
#  define T1_MOV(rd,rm)			is(THUMB_MOV|((_u4(rd)&8)<<4)|(_u4(rm)<<3)|_u3(rd))
405 #  define T2_MOV(rd,rm)			T2_ORR(rd,_R15_REGNO,rm)
406 #  define CC_MOVI(cc,rd,im)		corri(cc,ARM_MOV|ARM_I,0,rd,im)
407 #  define MOVI(rd,im)			CC_MOVI(ARM_CC_AL,rd,im)
408 #  define CC_MOVWI(cc,rd,im)		coriw(cc,ARM_MOVWI,rd,im)
409 #  define MOVWI(rd,im)			CC_MOVWI(ARM_CC_AL,rd,im)
410 #  define T1_MOVI(rd,im)		is(THUMB_MOVI|(_u3(rd)<<8)|_u8(im))
411 #  define T2_MOVI(rd,im)		torri(THUMB2_MOVI,_R15_REGNO,rd,im)
412 #  define T2_MOVWI(rd,im)		toriw(THUMB2_MOVWI,rd,im)
413 #  define CC_MOVTI(cc,rd,im)		coriw(cc,ARM_MOVTI,rd,im)
414 #  define MOVTI(rd,im)			CC_MOVTI(ARM_CC_AL,rd,im)
415 #  define T2_MOVTI(rd,im)		toriw(THUMB2_MOVTI,rd,im)
416 #  define CC_MVN(cc,rd,rm)		corrr(cc,ARM_MVN,0,rd,rm)
417 #  define MVN(rd,rm)			CC_MVN(ARM_CC_AL,rd,rm)
418 #  define T1_MVN(rd,rm)			is(THUMB_MVN|(_u3(rm)<<3)|_u3(rd))
419 #  define T2_MVN(rd,rm)			torrr(THUMB2_MVN,_R15_REGNO,rd,rm)
420 #  define CC_MVNI(cc,rd,im)		corri(cc,ARM_MVN|ARM_I,0,rd,im)
421 #  define MVNI(rd,im)			CC_MVNI(ARM_CC_AL,rd,im)
422 #  define T2_MVNI(rd,im)		torri(THUMB2_MVNI,_R15_REGNO,rd,im)
423 #  define CC_NOT(cc,rd,rm)		CC_MVN(cc,rd,rm)
424 #  define NOT(rd,rm)			CC_NOT(ARM_CC_AL,rd,rm)
425 #  define T1_NOT(rd,rm)			T1_MVN(rd,rm)
426 #  define T2_NOT(rd,rm)			T2_MVN(rd,rm)
427 #  define NOP()				MOV(_R0_REGNO, _R0_REGNO)
428 #  define T1_NOP()			is(0xbf00)
429 #  define CC_ADD(cc,rd,rn,rm)		corrr(cc,ARM_ADD,rn,rd,rm)
430 #  define ADD(rd,rn,rm)			CC_ADD(ARM_CC_AL,rd,rn,rm)
431 #  define T1_ADD(rd,rn,rm)		is(THUMB_ADD|(_u3(rm)<<6)|(_u3(rn)<<3)|_u3(rd))
/*
 * 16-bit Thumb ADD with 4-bit register numbers: bit 3 of rdn goes to bit 7,
 * rm to bits 6..3 and the low three bits of rdn to bits 2..0.  rdn is
 * masked through _u3() so a compound argument expression stays intact.
 */
#  define T1_ADDX(rdn,rm)		is(THUMB_ADDX|((_u4(rdn)&8)<<4)|(_u4(rm)<<3)|_u3(rdn))
433 #  define T2_ADD(rd,rn,rm)		torrr(THUMB2_ADD,rn,rd,rm)
434 #  define CC_ADDI(cc,rd,rn,im)		corri(cc,ARM_ADD|ARM_I,rn,rd,im)
435 #  define ADDI(rd,rn,im)		CC_ADDI(ARM_CC_AL,rd,rn,im)
436 #  define T1_ADDI3(rd,rn,im)		is(THUMB_ADDI3|(_u3(im)<<6)|(_u3(rn)<<3)|_u3(rd))
437 #  define T1_ADDI8(rdn,im)		is(THUMB_ADDI8|(_u3(rdn)<<8)|_u8(im))
438 #  define T2_ADDI(rd,rn,im)		torri(THUMB2_ADDI,rn,rd,im)
439 #  define T2_ADDWI(rd,rn,im)		torri(THUMB2_ADDWI,rn,rd,im)
440 #  define CC_ADDS(cc,rd,rn,rm)		corrr(cc,ARM_ADD|ARM_S,rn,rd,rm)
441 #  define ADDS(rd,rn,rm)		CC_ADDS(ARM_CC_AL,rd,rn,rm)
442 #  define T2_ADDS(rd,rn,rm)		torrr(THUMB2_ADD|ARM_S,rn,rd,rm)
443 #  define ADDSI(rd,rn,im)		corri(ARM_CC_AL,ARM_ADD|ARM_S|ARM_I,rn,rd,im)
444 #  define T2_ADDSI(rd,rn,im)		torri(THUMB2_ADDI|ARM_S,rn,rd,im)
445 #  define CC_ADC(cc,rd,rn,rm)		corrr(cc,ARM_ADC,rn,rd,rm)
446 #  define ADC(rd,rn,rm)			CC_ADC(ARM_CC_AL,rd,rn,rm)
447 #  define T1_ADC(rdn,rm)		is(THUMB_ADC|(_u3(rm)<<3)|_u3(rdn))
448 #  define T2_ADC(rd,rn,rm)		torrr(THUMB2_ADC,rn,rd,rm)
449 #  define CC_ADCI(cc,rd,rn,im)		corri(cc,ARM_ADC|ARM_I,rn,rd,im)
450 #  define ADCI(rd,rn,im)		CC_ADCI(ARM_CC_AL,rd,rn,im)
451 #  define T2_ADCI(rd,rn,im)		torri(THUMB2_ADCI,rn,rd,im)
452 #  define CC_ADCS(cc,rd,rn,rm)		corrr(cc,ARM_ADC|ARM_S,rn,rd,rm)
453 #  define ADCS(rd,rn,rm)		CC_ADCS(ARM_CC_AL,rd,rn,rm)
454 #  define T2_ADCS(rd,rn,rm)		torrr(THUMB2_ADC|ARM_S,rn,rd,rm)
455 #  define CC_ADCSI(cc,rd,rn,im)		corri(cc,ARM_ADC|ARM_S|ARM_I,rn,rd,im)
456 #  define ADCSI(rd,rn,im)		CC_ADCSI(ARM_CC_AL,rd,rn,im)
457 #  define T2_ADCSI(rd,rn,im)		torri(THUMB2_ADCI|ARM_S,rn,rd,im)
458 #  define CC_SUB(cc,rd,rn,rm)		corrr(cc,ARM_SUB,rn,rd,rm)
459 #  define SUB(rd,rn,rm)			CC_SUB(ARM_CC_AL,rd,rn,rm)
460 #  define T1_SUB(rd,rn,rm)		is(THUMB_SUB|(_u3(rm)<<6)|(_u3(rn)<<3)|_u3(rd))
461 #  define T2_SUB(rd,rn,rm)		torrr(THUMB2_SUB,rn,rd,rm)
462 #  define CC_SUBI(cc,rd,rn,im)		corri(cc,ARM_SUB|ARM_I,rn,rd,im)
463 #  define SUBI(rd,rn,im)		CC_SUBI(ARM_CC_AL,rd,rn,im)
464 #  define T1_SUBI3(rd,rn,im)		is(THUMB_SUBI3|(_u3(im)<<6)|(_u3(rn)<<3)|_u3(rd))
465 #  define T1_SUBI8(rdn,im)		is(THUMB_SUBI8|(_u3(rdn)<<8)|_u8(im))
466 #  define T2_SUBI(rd,rn,im)		torri(THUMB2_SUBI,rn,rd,im)
467 #  define T2_SUBWI(rd,rn,im)		torri(THUMB2_SUBWI,rn,rd,im)
468 #  define CC_SUBS(cc,rd,rn,rm)		corrr(cc,ARM_SUB|ARM_S,rn,rd,rm)
469 #  define SUBS(rd,rn,rm)		CC_SUBS(ARM_CC_AL,rd,rn,rm)
470 #  define T2_SUBS(rd,rn,rm)		torrr(THUMB2_SUB|ARM_S,rn,rd,rm)
471 #  define CC_SUBSI(cc,rd,rn,im)		corri(cc,ARM_SUB|ARM_S|ARM_I,rn,rd,im)
472 #  define SUBSI(rd,rn,im)		CC_SUBSI(ARM_CC_AL,rd,rn,im)
473 #  define T2_SUBSI(rd,rn,im)		torri(THUMB2_SUBI|ARM_S,rn,rd,im)
474 #  define CC_SBC(cc,rd,rn,rm)		corrr(cc,ARM_SBC,rn,rd,rm)
475 #  define SBC(rd,rn,rm)			CC_SBC(ARM_CC_AL,rd,rn,rm)
476 #  define T1_SBC(rdn,rm)		is(THUMB_SBC|(_u3(rm)<<3)|_u3(rdn))
477 #  define T2_SBC(rd,rn,rm)		torrr(THUMB2_SBC,rn,rd,rm)
478 #  define CC_SBCI(cc,rd,rn,im)		corri(cc,ARM_SBC|ARM_I,rn,rd,im)
479 #  define SBCI(rd,rn,im)		CC_SBCI(ARM_CC_AL,rd,rn,im)
480 #  define T2_SBCI(rd,rn,im)		torri(THUMB2_SBCI,rn,rd,im)
481 #  define CC_SBCS(cc,rd,rn,rm)		corrr(cc,ARM_SBC|ARM_S,rn,rd,rm)
482 #  define SBCS(rd,rn,rm)		CC_SBCS(ARM_CC_AL,rd,rn,rm)
483 #  define T2_SBCS(rd,rn,rm)		torrr(THUMB2_SBC|ARM_S,rn,rd,rm)
484 #  define CC_SBCSI(cc,rd,rn,im)		corri(cc,ARM_SBC|ARM_S|ARM_I,rn,rd,im)
485 #  define SBCSI(rd,rn,im)		CC_SBCSI(ARM_CC_AL,rd,rn,im)
486 #  define T2_SBCSI(rd,rn,im)		torri(THUMB2_SBCI|ARM_S,rn,rd,im)
487 #  define CC_RSB(cc,rd,rn,rm)		corrr(cc,ARM_RSB,rn,rd,rm)
488 #  define RSB(rd,rn,rm)			CC_RSB(ARM_CC_AL,rd,rn,rm)
489 #  define T2_RSB(rd,rn,rm)		torrr(THUMB2_RSB,rn,rd,rm)
490 #  define CC_RSBI(cc,rd,rn,im)		corri(cc,ARM_RSB|ARM_I,rn,rd,im)
491 #  define RSBI(rd,rn,im)		CC_RSBI(ARM_CC_AL,rd,rn,im)
492 #  define T1_RSBI(rd,rn)		is(THUMB_RSBI|(_u3(rn)<<3)|_u3(rd))
493 #  define T2_RSBI(rd,rn,im)		torri(THUMB2_RSBI,rn,rd,im)
494 #  define CC_MUL(cc,rl,rn,rm)		corrrr(cc,ARM_MUL,rl,0,rm,rn)
495 #  define MUL(rl,rn,rm)			CC_MUL(ARM_CC_AL,rl,rn,rm)
496 #  define T1_MUL(rdm,rn)		is(THUMB_MUL|(_u3(rn)<<3)|_u3(rdm))
497 #  define T2_MUL(rd,rn,rm)		torrr(THUMB2_MUL,rn,rd,rm)
498 #  define CC_SMULL(cc,rl,rh,rn,rm)	corrrr(cc,ARM_SMULL,rh,rl,rm,rn)
499 #  define SMULL(rl,rh,rn,rm)		CC_SMULL(ARM_CC_AL,rl,rh,rn,rm)
500 #  define T2_SMULL(rl,rh,rn,rm)		torrrr(THUMB2_SMULL,rn,rl,rh,rm)
501 #  define CC_UMULL(cc,rl,rh,rn,rm)	corrrr(cc,ARM_UMULL,rh,rl,rm,rn)
502 #  define UMULL(rl,rh,rn,rm)		CC_UMULL(ARM_CC_AL,rl,rh,rn,rm)
503 #  define T2_UMULL(rl,rh,rn,rm)		torrrr(THUMB2_UMULL,rn,rl,rh,rm)
504 #  define T2_SDIV(rd,rn,rm)		torrr(THUMB2_SDIV,rn,rd,rm)
505 #  define T2_UDIV(rd,rn,rm)		torrr(THUMB2_UDIV,rn,rd,rm)
506 #  define CC_AND(cc,rd,rn,rm)		corrr(cc,ARM_AND,rn,rd,rm)
507 #  define AND(rd,rn,rm)			CC_AND(ARM_CC_AL,rd,rn,rm)
508 #  define T1_AND(rdn,rm)		is(THUMB_AND|(_u3(rm)<<3)|_u3(rdn))
509 #  define T2_AND(rd,rn,rm)		torrr(THUMB2_AND,rn,rd,rm)
510 #  define CC_ANDI(cc,rd,rn,im)		corri(cc,ARM_AND|ARM_I,rn,rd,im)
511 #  define ANDI(rd,rn,im)		CC_ANDI(ARM_CC_AL,rd,rn,im)
512 #  define T2_ANDI(rd,rn,im)		torri(THUMB2_ANDI,rn,rd,im)
513 #  define CC_ANDS(cc,rd,rn,rm)		corrr(cc,ARM_AND|ARM_S,rn,rd,rm)
514 #  define ANDS(rd,rn,rm)		CC_ANDS(ARM_CC_AL,rd,rn,rm)
515 #  define T2_ANDS(rd,rn,rm)		torrr(THUMB2_AND|ARM_S,rn,rd,rm)
516 #  define CC_ANDSI(cc,rd,rn,im)		corri(cc,ARM_AND|ARM_S|ARM_I,rn,rd,im)
517 #  define ANDSI(rd,rn,im)		CC_ANDSI(ARM_CC_AL,rd,rn,im)
/*
 * Thumb-2 AND (immediate) with the S bit set.  torri() takes four
 * arguments and has no condition-code parameter, so only the opcode,
 * the two registers and the immediate are passed.
 */
#  define T2_ANDSI(rd,rn,im)		torri(THUMB2_ANDI|ARM_S,rn,rd,im)
519 #  define CC_BIC(cc,rd,rn,rm)		corrr(cc,ARM_BIC,rn,rd,rm)
520 #  define BIC(rd,rn,rm)			CC_BIC(ARM_CC_AL,rd,rn,rm)
521 #  define T2_BIC(rd,rn,rm)		torrr(THUMB2_BIC,rn,rd,rm)
522 #  define CC_BICI(cc,rd,rn,im)		corri(cc,ARM_BIC|ARM_I,rn,rd,im)
523 #  define BICI(rd,rn,im)		CC_BICI(ARM_CC_AL,rd,rn,im)
524 #  define T2_BICI(rd,rn,im)		torri(THUMB2_BICI,rn,rd,im)
525 #  define CC_BICS(cc,rd,rn,rm)		corrr(cc,ARM_BIC|ARM_S,rn,rd,rm)
526 #  define BICS(rd,rn,rm)		CC_BICS(ARM_CC_AL,rd,rn,rm)
527 #  define T2_BICS(rd,rn,rm)		torrr(THUMB2_BIC|ARM_S,rn,rd,rm)
528 #  define CC_BICSI(cc,rd,rn,im)		corri(cc,ARM_BIC|ARM_S|ARM_I,rn,rd,im)
529 #  define BICSI(rd,rn,im)		CC_BICSI(ARM_CC_AL,rd,rn,im)
/*
 * Thumb-2 BIC (immediate) with the S bit set.  torri() takes four
 * arguments and has no condition-code parameter, so only the opcode,
 * the two registers and the immediate are passed.
 */
#  define T2_BICSI(rd,rn,im)		torri(THUMB2_BICI|ARM_S,rn,rd,im)
531 #  define CC_ORR(cc,rd,rn,rm)		corrr(cc,ARM_ORR,rn,rd,rm)
532 #  define ORR(rd,rn,rm)			CC_ORR(ARM_CC_AL,rd,rn,rm)
533 #  define T1_ORR(rdn,rm)		is(THUMB_ORR|(_u3(rm)<<3)|_u3(rdn))
534 #  define T2_ORR(rd,rn,rm)		torrr(THUMB2_ORR,rn,rd,rm)
/*
 * Conditional ORR with a shifted register operand: sh is or'ed into the
 * opcode and im is forwarded to corrrs() together with rn, rd and rm.
 * The fourth parameter is named rm so that it is the value actually
 * forwarded (same parameter list as CC_EOR_SI).
 */
#  define CC_ORR_SI(cc,rd,rn,rm,sh,im)	corrrs(cc,ARM_ORR|sh,rn,rd,rm,im)
536 #  define ORR_SI(r0,r1,r2,sh,im)	CC_ORR_SI(ARM_CC_AL,r0,r1,r2,sh,im)
537 #  define CC_ORRI(cc,rd,rn,im)		corri(cc,ARM_ORR|ARM_I,rn,rd,im)
538 #  define ORRI(rd,rn,im)		CC_ORRI(ARM_CC_AL,rd,rn,im)
539 #  define T2_ORRI(rd,rn,im)		torri(THUMB2_ORRI,rn,rd,im)
540 #  define CC_EOR(cc,rd,rn,rm)		corrr(cc,ARM_EOR,rn,rd,rm)
541 #  define EOR(rd,rn,rm)			CC_EOR(ARM_CC_AL,rd,rn,rm)
542 #  define T1_EOR(rdn,rm)		is(THUMB_EOR|(_u3(rm)<<3)|_u3(rdn))
543 #  define T2_EOR(rd,rn,rm)		torrr(THUMB2_EOR,rn,rd,rm)
544 #  define CC_EOR_SI(cc,rd,rn,rm,sh,im)	corrrs(cc,ARM_EOR|sh,rn,rd,rm,im)
545 #  define EOR_SI(r0,r1,r2,sh,im)	CC_EOR_SI(ARM_CC_AL,r0,r1,r2,sh,im)
546 #  define CC_EORI(cc,rd,rn,im)		corri(cc,ARM_EOR|ARM_I,rn,rd,im)
547 #  define EORI(rd,rn,im)		CC_EORI(ARM_CC_AL,rd,rn,im)
548 #  define T2_EORI(rd,rn,im)		torri(THUMB2_EORI,rn,rd,im)
549 #  define CC_REV(cc,rd,rm)		c6orr(cc,ARM_REV,rd,rm)
550 #  define REV(rd,rm)			CC_REV(ARM_CC_AL,rd,rm)
551 #  define T1_REV(rd,rm)			is(THUMB_REV|(_u3(rm)<<3)|_u3(rd))
552 #  define T2_REV(rd,rm)			torrr(THUMB2_REV,rm,rd,rm)
553 #  define CC_REV16(cc,rd,rm)		c6orr(cc,ARM_REV16,rd,rm)
554 #  define REV16(rd,rm)			CC_REV16(ARM_CC_AL,rd,rm)
555 #  define T1_REV16(rd,rm)		is(THUMB_REV16|(_u3(rm)<<3)|_u3(rd))
556 #  define T2_REV16(rd,rm)		torrr(THUMB2_REV16,rm,rd,rm)
557 #  define CC_SXTB(cc,rd,rm)		c6orr(cc,ARM_SXTB,rd,rm)
558 #  define SXTB(rd,rm)			CC_SXTB(ARM_CC_AL,rd,rm)
559 #  define T1_SXTB(rd,rm)		is(THUMB_SXTB|(_u3(rm)<<3)|_u3(rd))
560 #  define T2_SXTB(rd,rm)		torrr(THUMB2_SXTB,_R15_REGNO,rd,rm)
561 #  define CC_UXTB(cc,rd,rm)		c6orr(cc,ARM_UXTB,rd,rm)
562 #  define UXTB(rd,rm)			CC_UXTB(ARM_CC_AL,rd,rm)
563 #  define T1_UXTB(rd,rm)		is(THUMB_UXTB|(_u3(rm)<<3)|_u3(rd))
564 #  define T2_UXTB(rd,rm)		torrr(THUMB2_UXTB,_R15_REGNO,rd,rm)
565 #  define CC_SXTH(cc,rd,rm)		c6orr(cc,ARM_SXTH,rd,rm)
566 #  define SXTH(rd,rm)			CC_SXTH(ARM_CC_AL,rd,rm)
567 #  define T1_SXTH(rd,rm)		is(THUMB_SXTH|(_u3(rm)<<3)|_u3(rd))
568 #  define T2_SXTH(rd,rm)		torrr(THUMB2_SXTH,_R15_REGNO,rd,rm)
569 #  define CC_UXTH(cc,rd,rm)		c6orr(cc,ARM_UXTH,rd,rm)
570 #  define UXTH(rd,rm)			CC_UXTH(ARM_CC_AL,rd,rm)
571 #  define T1_UXTH(rd,rm)		is(THUMB_UXTH|(_u3(rm)<<3)|_u3(rd))
572 #  define T2_UXTH(rd,rm)		torrr(THUMB2_UXTH,_R15_REGNO,rd,rm)
573 #  define CC_SHIFT(cc,o,rd,rm,rn,im)	cshift(cc,o,rd,rm,rn,im)
574 #  define CC_LSL(cc,rd,rn,rm)		CC_SHIFT(cc,ARM_LSL|ARM_R,rd,rm,rn,0)
575 #  define LSL(rd,rn,rm)			CC_LSL(ARM_CC_AL,rd,rn,rm)
576 #  define T1_LSL(rdn,rm)		is(THUMB_LSL|(_u3(rm)<<3)|_u3(rdn))
577 #  define T2_LSL(rd,rn,rm)		torrr(THUMB2_LSL,rn,rd,rm)
578 #  define CC_LSLI(cc,rd,rn,im)		CC_SHIFT(cc,ARM_LSL,rd,0,rn,im)
579 #  define LSLI(rd,rn,im)		CC_LSLI(ARM_CC_AL,rd,rn,im)
580 #  define T1_LSLI(rd,rm,im)		is(THUMB_LSLI|(_u5(im)<<6)|(_u3(rm)<<3)|_u3(rd))
581 #  define T2_LSLI(rd,rm,im)		tshift(THUMB2_LSLI,rd,rm,im)
582 #  define CC_LSR(cc,rd,rn,rm)		CC_SHIFT(cc,ARM_LSR|ARM_R,rd,rm,rn,0)
583 #  define LSR(rd,rn,rm)			CC_LSR(ARM_CC_AL,rd,rn,rm)
584 #  define T1_LSR(rdn,rm)		is(THUMB_LSR|(_u3(rm)<<3)|_u3(rdn))
585 #  define T2_LSR(rd,rn,rm)		torrr(THUMB2_LSR,rn,rd,rm)
586 #  define CC_LSRI(cc,rd,rn,im)		CC_SHIFT(cc,ARM_LSR,rd,0,rn,im)
587 #  define LSRI(rd,rn,im)		CC_LSRI(ARM_CC_AL,rd,rn,im)
588 #  define T1_LSRI(rd,rm,im)		is(THUMB_LSRI|(_u5(im)<<6)|(_u3(rm)<<3)|_u3(rd))
589 #  define T2_LSRI(rd,rm,im)		tshift(THUMB2_LSRI,rd,rm,im)
590 #  define CC_ASR(cc,rd,rn,rm)		CC_SHIFT(cc,ARM_ASR|ARM_R,rd,rm,rn,0)
591 #  define ASR(rd,rn,rm)			CC_ASR(ARM_CC_AL,rd,rn,rm)
592 #  define T1_ASR(rdn,rm)		is(THUMB_ASR|(_u3(rm)<<3)|_u3(rdn))
593 #  define T2_ASR(rd,rn,rm)		torrr(THUMB2_ASR,rn,rd,rm)
594 #  define CC_ASRI(cc,rd,rn,im)		CC_SHIFT(cc,ARM_ASR,rd,0,rn,im)
595 #  define ASRI(rd,rn,im)		CC_ASRI(ARM_CC_AL,rd,rn,im)
596 #  define T1_ASRI(rd,rm,im)		is(THUMB_ASRI|(_u5(im)<<6)|(_u3(rm)<<3)|_u3(rd))
597 #  define T2_ASRI(rd,rm,im)		tshift(THUMB2_ASRI,rd,rm,im)
598 #  define CC_CMP(cc,rn,rm)		corrr(cc,ARM_CMP,rn,0,rm)
599 #  define CMP(rn,rm)			CC_CMP(ARM_CC_AL,rn,rm)
600 #  define T1_CMP(rn,rm)			is(THUMB_CMP|(_u3(rm)<<3)|_u3(rn))
/*
 * 16-bit Thumb CMP with 4-bit register numbers: bit 3 of rn goes to bit 7,
 * rm to bits 6..3 and the low three bits of rn to bits 2..0.  rn is masked
 * through _u3() so a compound argument expression stays intact.
 */
#  define T1_CMPX(rn,rm)		is(THUMB_CMPX|((_u4(rn)&8)<<4)|(_u4(rm)<<3)|_u3(rn))
602 #  define T2_CMP(rn,rm)			torrr(THUMB2_CMP,rn,_R15_REGNO,rm)
603 #  define CC_CMPI(cc,rn,im)		corri(cc,ARM_CMP|ARM_I,rn,0,im)
604 #  define CMPI(rn,im)			CC_CMPI(ARM_CC_AL,rn,im)
605 #  define T1_CMPI(rn,im)		is(THUMB_CMPI|(_u3(rn)<<8)|_u8(im))
606 #  define T2_CMPI(rn,im)		torri(THUMB2_CMPI,rn,_R15_REGNO,im)
607 #  define CC_CMN(cc,rn,rm)		corrr(cc,ARM_CMN,rn,0,rm)
608 #  define CMN(rn,rm)			CC_CMN(ARM_CC_AL,rn,rm)
/*
 * 16-bit Thumb CMN: rm is placed in bits 5..3 and rn in bits 2..0, the same
 * layout T1_CMP and T1_TST use.
 */
#  define T1_CMN(rn,rm)			is(THUMB_CMN|(_u3(rm)<<3)|_u3(rn))
610 #  define T2_CMN(rn,rm)			torrr(THUMB2_CMN,rn,_R15_REGNO,rm)
611 #  define CC_CMNI(cc,rn,im)		corri(cc,ARM_CMN|ARM_I,rn,0,im)
612 #  define CMNI(rn,im)			CC_CMNI(ARM_CC_AL,rn,im)
613 #  define T2_CMNI(rn,im)		torri(THUMB2_CMNI,rn,_R15_REGNO,im)
/*
 * Conditional TST (register).  The destination-register argument of
 * corrr() is passed as 0, as CC_CMP, CC_CMN and CC_TEQ do, instead of
 * picking up whatever identifier `r0' happens to be in scope at the
 * expansion site.
 */
#  define CC_TST(cc,rn,rm)		corrr(cc,ARM_TST,rn,0,rm)
615 #  define TST(rn,rm)			CC_TST(ARM_CC_AL,rn,rm)
616 #  define T1_TST(rn,rm)			is(THUMB_TST|(_u3(rm)<<3)|_u3(rn))
617 #  define T2_TST(rn,rm)			torrr(THUMB2_TST,rn,_R15_REGNO,rm)
618 #  define CC_TSTI(cc,rn,im)		corri(cc,ARM_TST|ARM_I,rn,0,im)
619 #  define TSTI(rn,im)			CC_TSTI(ARM_CC_AL,rn,im)
620 #  define T2_TSTI(rn,im)		torri(THUMB2_TSTI,rn,_R15_REGNO,im)
621 #  define CC_TEQ(cc,rn,rm)		corrr(cc,ARM_TEQ,rn,0,rm)
622 #  define TEQ(rn,rm)			CC_TEQ(ARM_CC_AL,rn,rm)
/*
 * Conditional TEQ (immediate).  The register parameter is named rn so that
 * it is the value forwarded to corri(); the destination argument is 0, as
 * in CC_CMPI and CC_TSTI.
 */
#  define CC_TEQI(cc,rn,im)		corri(cc,ARM_TEQ|ARM_I,rn,0,im)
624 #  define TEQI(rn,im)			CC_TEQI(ARM_CC_AL,rn,im)
625 #  define CC_BX(cc,rm)			cbx(cc,ARM_BX,rm)
626 #  define BX(rm)			CC_BX(ARM_CC_AL,rm)
627 #  define T1_BX(rm)			is(0x4700|(_u4(rm)<<3))
628 #  define CC_BLX(cc,rm)			cbx(cc,ARM_BLX,rm)
629 #  define BLX(rm)			CC_BLX(ARM_CC_AL,rm)
630 #  define T1_BLX(rm)			is(THUMB_BLX|(_u4(rm)<<3))
631 #  define BLXI(im)			blxi(im)
632 #  define T2_BLXI(im)			tb(THUMB2_BLXI,im)
633 #  define CC_B(cc,im)			cb(cc,ARM_B,im)
634 #  define B(im)				CC_B(ARM_CC_AL,im)
635 #  define T1_CC_B(cc,im)		tc8(cc,im)
636 #  define T1_B(im)			t11(im)
637 #  define T2_CC_B(cc,im)		tcb(cc,im)
638 #  define T2_B(im)			tb(THUMB2_B,im)
639 #  define CC_BLI(cc,im)			cb(cc,ARM_BLI,im)
640 #  define BLI(im)			CC_BLI(ARM_CC_AL,im)
641 #  define T2_BLI(im)			tb(THUMB2_BLI,im)
/*
 * Single-register load encoders (LDRSB, LDRB, LDRSH, LDRH, LDR).
 *
 * Naming, as visible in the expansions below:
 *   CC_x      explicit condition code; the unprefixed x passes ARM_CC_AL.
 *   xI        takes an immediate (im) instead of an index register (rm).
 *   xN / xIN  same opcode without ARM_P (ARM) or THUMB2_U (Thumb-2);
 *             presumably the subtracted-offset form -- confirm against
 *             the opcode definitions.
 *   T1_x      16-bit Thumb form emitted through is(); register fields are
 *             masked with _u3 and immediates with _u5/_u8.
 *   T2_x      Thumb-2 form; T2_xI goes through torri8, T2_xWI through
 *             torri12.
 * The ARM immediate forms of LDRSB/LDRSH/LDRH use corri8, those of
 * LDRB/LDR use corri.
 */
/* LDRSB */
#  define CC_LDRSB(cc,rt,rn,rm)		corrr(cc,ARM_LDRSB|ARM_P,rn,rt,rm)
#  define LDRSB(rt,rn,rm)		CC_LDRSB(ARM_CC_AL,rt,rn,rm)
#  define T1_LDRSB(rt,rn,rm)		is(THUMB_LDRSB|(_u3(rm)<<6)|(_u3(rn)<<3)|_u3(rt))
#  define T2_LDRSB(rt,rn,rm)		torxr(THUMB2_LDRSB,rn,rt,rm)
#  define CC_LDRSBN(cc,rt,rn,rm)	corrr(cc,ARM_LDRSB,rn,rt,rm)
#  define LDRSBN(rt,rn,rm)		CC_LDRSBN(ARM_CC_AL,rt,rn,rm)
#  define CC_LDRSBI(cc,rt,rn,im)	corri8(cc,ARM_LDRSBI|ARM_P,rn,rt,im)
#  define LDRSBI(rt,rn,im)		CC_LDRSBI(ARM_CC_AL,rt,rn,im)
#  define T2_LDRSBI(rt,rn,im)		torri8(THUMB2_LDRSBI|THUMB2_U,rn,rt,im)
#  define T2_LDRSBWI(rt,rn,im)		torri12(THUMB2_LDRSBWI,rn,rt,im)
#  define CC_LDRSBIN(cc,rt,rn,im)	corri8(cc,ARM_LDRSBI,rn,rt,im)
#  define LDRSBIN(rt,rn,im)		CC_LDRSBIN(ARM_CC_AL,rt,rn,im)
#  define T2_LDRSBIN(rt,rn,im)		torri8(THUMB2_LDRSBI,rn,rt,im)
/* LDRB */
#  define CC_LDRB(cc,rt,rn,rm)		corrr(cc,ARM_LDRB|ARM_P,rn,rt,rm)
#  define LDRB(rt,rn,rm)		CC_LDRB(ARM_CC_AL,rt,rn,rm)
#  define T1_LDRB(rt,rn,rm)		is(THUMB_LDRB|(_u3(rm)<<6)|(_u3(rn)<<3)|_u3(rt))
#  define T2_LDRB(rt,rn,rm)		torxr(THUMB2_LDRB,rn,rt,rm)
#  define CC_LDRBN(cc,rt,rn,rm)		corrr(cc,ARM_LDRB,rn,rt,rm)
#  define LDRBN(rt,rn,rm)		CC_LDRBN(ARM_CC_AL,rt,rn,rm)
#  define CC_LDRBI(cc,rt,rn,im)		corri(cc,ARM_LDRBI|ARM_P,rn,rt,im)
#  define LDRBI(rt,rn,im)		CC_LDRBI(ARM_CC_AL,rt,rn,im)
#  define T1_LDRBI(rt,rn,im)		is(THUMB_LDRBI|(_u5(im)<<6)|(_u3(rn)<<3)|_u3(rt))
#  define T2_LDRBI(rt,rn,im)		torri8(THUMB2_LDRBI|THUMB2_U,rn,rt,im)
#  define T2_LDRBWI(rt,rn,im)		torri12(THUMB2_LDRBWI,rn,rt,im)
#  define CC_LDRBIN(cc,rt,rn,im)	corri(cc,ARM_LDRBI,rn,rt,im)
#  define LDRBIN(rt,rn,im)		CC_LDRBIN(ARM_CC_AL,rt,rn,im)
#  define T2_LDRBIN(rt,rn,im)		torri8(THUMB2_LDRBI,rn,rt,im)
/* LDRSH */
#  define CC_LDRSH(cc,rt,rn,rm)		corrr(cc,ARM_LDRSH|ARM_P,rn,rt,rm)
#  define LDRSH(rt,rn,rm)		CC_LDRSH(ARM_CC_AL,rt,rn,rm)
#  define T1_LDRSH(rt,rn,rm)		is(THUMB_LDRSH|(_u3(rm)<<6)|(_u3(rn)<<3)|_u3(rt))
#  define T2_LDRSH(rt,rn,rm)		torxr(THUMB2_LDRSH,rn,rt,rm)
#  define CC_LDRSHN(cc,rt,rn,rm)	corrr(cc,ARM_LDRSH,rn,rt,rm)
#  define LDRSHN(rt,rn,rm)		CC_LDRSHN(ARM_CC_AL,rt,rn,rm)
#  define CC_LDRSHI(cc,rt,rn,im)	corri8(cc,ARM_LDRSHI|ARM_P,rn,rt,im)
#  define LDRSHI(rt,rn,im)		CC_LDRSHI(ARM_CC_AL,rt,rn,im)
#  define T2_LDRSHI(rt,rn,im)		torri8(THUMB2_LDRSHI|THUMB2_U,rn,rt,im)
#  define T2_LDRSHWI(rt,rn,im)		torri12(THUMB2_LDRSHWI,rn,rt,im)
#  define CC_LDRSHIN(cc,rt,rn,im)	corri8(cc,ARM_LDRSHI,rn,rt,im)
#  define LDRSHIN(rt,rn,im)		CC_LDRSHIN(ARM_CC_AL,rt,rn,im)
#  define T2_LDRSHIN(rt,rn,im)		torri8(THUMB2_LDRSHI,rn,rt,im)
/* LDRH */
#  define CC_LDRH(cc,rt,rn,rm)		corrr(cc,ARM_LDRH|ARM_P,rn,rt,rm)
#  define LDRH(rt,rn,rm)		CC_LDRH(ARM_CC_AL,rt,rn,rm)
#  define T1_LDRH(rt,rn,rm)		is(THUMB_LDRH|(_u3(rm)<<6)|(_u3(rn)<<3)|_u3(rt))
#  define T2_LDRH(rt,rn,rm)		torxr(THUMB2_LDRH,rn,rt,rm)
#  define CC_LDRHN(cc,rt,rn,rm)		corrr(cc,ARM_LDRH,rn,rt,rm)
#  define LDRHN(rt,rn,rm)		CC_LDRHN(ARM_CC_AL,rt,rn,rm)
#  define CC_LDRHI(cc,rt,rn,im)		corri8(cc,ARM_LDRHI|ARM_P,rn,rt,im)
#  define LDRHI(rt,rn,im)		CC_LDRHI(ARM_CC_AL,rt,rn,im)
#  define T1_LDRHI(rt,rn,im)		is(THUMB_LDRHI|(_u5(im)<<6)|(_u3(rn)<<3)|_u3(rt))
#  define T2_LDRHI(rt,rn,im)		torri8(THUMB2_LDRHI|THUMB2_U,rn,rt,im)
#  define T2_LDRHWI(rt,rn,im)		torri12(THUMB2_LDRHWI,rn,rt,im)
#  define CC_LDRHIN(cc,rt,rn,im)	corri8(cc,ARM_LDRHI,rn,rt,im)
#  define LDRHIN(rt,rn,im)		CC_LDRHIN(ARM_CC_AL,rt,rn,im)
#  define T2_LDRHIN(rt,rn,im)		torri8(THUMB2_LDRHI,rn,rt,im)
/* LDR */
#  define CC_LDR(cc,rt,rn,rm)		corrr(cc,ARM_LDR|ARM_P,rn,rt,rm)
#  define LDR(rt,rn,rm)			CC_LDR(ARM_CC_AL,rt,rn,rm)
#  define T1_LDR(rt,rn,rm)		is(THUMB_LDR|(_u3(rm)<<6)|(_u3(rn)<<3)|_u3(rt))
#  define T2_LDR(rt,rn,rm)		torxr(THUMB2_LDR,rn,rt,rm)
#  define CC_LDRN(cc,rt,rn,rm)		corrr(cc,ARM_LDR,rn,rt,rm)
#  define LDRN(rt,rn,rm)		CC_LDRN(ARM_CC_AL,rt,rn,rm)
#  define CC_LDRI(cc,rt,rn,im)		corri(cc,ARM_LDRI|ARM_P,rn,rt,im)
#  define LDRI(rt,rn,im)		CC_LDRI(ARM_CC_AL,rt,rn,im)
#  define T1_LDRI(rt,rn,im)		is(THUMB_LDRI|(_u5(im)<<6)|(_u3(rn)<<3)|_u3(rt))
/* No base-register operand: only rt (shifted to bit 8) and an 8-bit
 * immediate are encoded. */
#  define T1_LDRISP(rt,im)		is(THUMB_LDRISP|(_u3(rt)<<8)|_u8(im))
#  define T2_LDRI(rt,rn,im)		torri8(THUMB2_LDRI|THUMB2_U,rn,rt,im)
#  define T2_LDRWI(rt,rn,im)		torri12(THUMB2_LDRWI,rn,rt,im)
#  define CC_LDRIN(cc,rt,rn,im)		corri(cc,ARM_LDRI,rn,rt,im)
#  define LDRIN(rt,rn,im)		CC_LDRIN(ARM_CC_AL,rt,rn,im)
#  define T2_LDRIN(rt,rn,im)		torri8(THUMB2_LDRI,rn,rt,im)
/*
 * LDRD encoders.  CC_* forms take an explicit condition code, unprefixed
 * forms pass ARM_CC_AL.  The *N forms use the opcode without ARM_P.  The
 * Thumb-2 forms take a second transfer register (rt2) and go through
 * torrri8.  Each macro expands only its own parameters.
 */
#  define CC_LDRD(cc,rt,rn,rm)		corrr(cc,ARM_LDRD|ARM_P,rn,rt,rm)
#  define LDRD(rt,rn,rm)		CC_LDRD(ARM_CC_AL,rt,rn,rm)
#  define T2_LDRDI(rt,rt2,rn,im)	torrri8(THUMB2_LDRDI|ARM_P,rn,rt,rt2,im)
#  define CC_LDRDN(cc,rt,rn,rm)		corrr(cc,ARM_LDRD,rn,rt,rm)
#  define LDRDN(rt,rn,rm)		CC_LDRDN(ARM_CC_AL,rt,rn,rm)
#  define CC_LDRDI(cc,rt,rn,im)		corri8(cc,ARM_LDRDI|ARM_P,rn,rt,im)
#  define LDRDI(rt,rn,im)		CC_LDRDI(ARM_CC_AL,rt,rn,im)
#  define CC_LDRDIN(cc,rt,rn,im)	corri8(cc,ARM_LDRDI,rn,rt,im)
#  define LDRDIN(rt,rn,im)		CC_LDRDIN(ARM_CC_AL,rt,rn,im)
#  define T2_LDRDIN(rt,rt2,rn,im)	torrri8(THUMB2_LDRDI,rn,rt,rt2,im)
/*
 * Store encoders (STRB, STRH, STR, STRD).
 *
 * Naming, as visible in the expansions below:
 *   CC_x      explicit condition code; the unprefixed x passes ARM_CC_AL.
 *   xI        takes an immediate (im) instead of an index register (rm).
 *   xN / xIN  same opcode without ARM_P (ARM) or THUMB2_U (Thumb-2);
 *             presumably the subtracted-offset form -- confirm against
 *             the opcode definitions.
 *   T1_x      16-bit Thumb form emitted through is().
 *   T2_x      Thumb-2 form (torxr, torri8, torri12, torrri8).
 * The ARM immediate forms of STRH/STRD use corri8, those of STRB/STR use
 * corri.
 */
/* STRB */
#  define CC_STRB(cc,rt,rn,rm)		corrr(cc,ARM_STRB|ARM_P,rn,rt,rm)
#  define STRB(rt,rn,rm)		CC_STRB(ARM_CC_AL,rt,rn,rm)
#  define T1_STRB(rt,rn,rm)		is(THUMB_STRB|(_u3(rm)<<6)|(_u3(rn)<<3)|_u3(rt))
#  define T2_STRB(rt,rn,rm)		torxr(THUMB2_STRB,rn,rt,rm)
#  define CC_STRBN(cc,rt,rn,rm)		corrr(cc,ARM_STRB,rn,rt,rm)
#  define STRBN(rt,rn,rm)		CC_STRBN(ARM_CC_AL,rt,rn,rm)
#  define CC_STRBI(cc,rt,rn,im)		corri(cc,ARM_STRBI|ARM_P,rn,rt,im)
#  define STRBI(rt,rn,im)		CC_STRBI(ARM_CC_AL,rt,rn,im)
#  define T1_STRBI(rt,rn,im)		is(THUMB_STRBI|(_u5(im)<<6)|(_u3(rn)<<3)|_u3(rt))
#  define T2_STRBI(rt,rn,im)		torri8(THUMB2_STRBI|THUMB2_U,rn,rt,im)
#  define T2_STRBWI(rt,rn,im)		torri12(THUMB2_STRBWI,rn,rt,im)
#  define CC_STRBIN(cc,rt,rn,im)	corri(cc,ARM_STRBI,rn,rt,im)
#  define STRBIN(rt,rn,im)		CC_STRBIN(ARM_CC_AL,rt,rn,im)
#  define T2_STRBIN(rt,rn,im)		torri8(THUMB2_STRBI,rn,rt,im)
/* STRH */
#  define CC_STRH(cc,rt,rn,rm)		corrr(cc,ARM_STRH|ARM_P,rn,rt,rm)
#  define STRH(rt,rn,rm)		CC_STRH(ARM_CC_AL,rt,rn,rm)
#  define T1_STRH(rt,rn,rm)		is(THUMB_STRH|(_u3(rm)<<6)|(_u3(rn)<<3)|_u3(rt))
#  define T2_STRH(rt,rn,rm)		torxr(THUMB2_STRH,rn,rt,rm)
#  define CC_STRHN(cc,rt,rn,rm)		corrr(cc,ARM_STRH,rn,rt,rm)
#  define STRHN(rt,rn,rm)		CC_STRHN(ARM_CC_AL,rt,rn,rm)
#  define CC_STRHI(cc,rt,rn,im)		corri8(cc,ARM_STRHI|ARM_P,rn,rt,im)
#  define STRHI(rt,rn,im)		CC_STRHI(ARM_CC_AL,rt,rn,im)
#  define T1_STRHI(rt,rn,im)		is(THUMB_STRHI|(_u5(im)<<6)|(_u3(rn)<<3)|_u3(rt))
#  define T2_STRHI(rt,rn,im)		torri8(THUMB2_STRHI|THUMB2_U,rn,rt,im)
#  define T2_STRHWI(rt,rn,im)		torri12(THUMB2_STRHWI,rn,rt,im)
#  define CC_STRHIN(cc,rt,rn,im)	corri8(cc,ARM_STRHI,rn,rt,im)
#  define STRHIN(rt,rn,im)		CC_STRHIN(ARM_CC_AL,rt,rn,im)
#  define T2_STRHIN(rt,rn,im)		torri8(THUMB2_STRHI,rn,rt,im)
/* STR */
#  define CC_STR(cc,rt,rn,rm)		corrr(cc,ARM_STR|ARM_P,rn,rt,rm)
#  define STR(rt,rn,rm)			CC_STR(ARM_CC_AL,rt,rn,rm)
#  define T1_STR(rt,rn,rm)		is(THUMB_STR|(_u3(rm)<<6)|(_u3(rn)<<3)|_u3(rt))
#  define T2_STR(rt,rn,rm)		torxr(THUMB2_STR,rn,rt,rm)
#  define CC_STRN(cc,rt,rn,rm)		corrr(cc,ARM_STR,rn,rt,rm)
#  define STRN(rt,rn,rm)		CC_STRN(ARM_CC_AL,rt,rn,rm)
#  define CC_STRI(cc,rt,rn,im)		corri(cc,ARM_STRI|ARM_P,rn,rt,im)
#  define STRI(rt,rn,im)		CC_STRI(ARM_CC_AL,rt,rn,im)
#  define T1_STRI(rt,rn,im)		is(THUMB_STRI|(_u5(im)<<6)|(_u3(rn)<<3)|_u3(rt))
/* No base-register operand: only rt (shifted to bit 8) and an 8-bit
 * immediate are encoded. */
#  define T1_STRISP(rt,im)		is(THUMB_STRISP|(_u3(rt)<<8)|(_u8(im)))
#  define T2_STRI(rt,rn,im)		torri8(THUMB2_STRI|THUMB2_U,rn,rt,im)
#  define T2_STRWI(rt,rn,im)		torri12(THUMB2_STRWI,rn,rt,im)
#  define CC_STRIN(cc,rt,rn,im)		corri(cc,ARM_STRI,rn,rt,im)
#  define STRIN(rt,rn,im)		CC_STRIN(ARM_CC_AL,rt,rn,im)
#  define T2_STRIN(rt,rn,im)		torri8(THUMB2_STRI,rn,rt,im)
/* STRD; the Thumb-2 forms take a second transfer register (rt2). */
#  define CC_STRD(cc,rt,rn,rm)		corrr(cc,ARM_STRD|ARM_P,rn,rt,rm)
#  define STRD(rt,rn,rm)		CC_STRD(ARM_CC_AL,rt,rn,rm)
#  define CC_STRDN(cc,rt,rn,rm)		corrr(cc,ARM_STRD,rn,rt,rm)
#  define STRDN(rt,rn,rm)		CC_STRDN(ARM_CC_AL,rt,rn,rm)
#  define CC_STRDI(cc,rt,rn,im)		corri8(cc,ARM_STRDI|ARM_P,rn,rt,im)
#  define STRDI(rt,rn,im)		CC_STRDI(ARM_CC_AL,rt,rn,im)
#  define T2_STRDI(rt,rt2,rn,im)	torrri8(THUMB2_STRDI|ARM_P,rn,rt,rt2,im)
#  define CC_STRDIN(cc,rt,rn,im)	corri8(cc,ARM_STRDI,rn,rt,im)
#  define STRDIN(rt,rn,im)		CC_STRDIN(ARM_CC_AL,rt,rn,im)
#  define T2_STRDIN(rt,rt2,rn,im)	torrri8(THUMB2_STRDI,rn,rt,rt2,im)
/*
 * Load-multiple encoders.  The ARM forms go through corl with ARM_M|ARM_M_L
 * plus a combination of ARM_M_I, ARM_M_B and ARM_M_U selected by the
 * mnemonic suffix (IA, IB, DA, DB, and _U).  `im` is passed through to
 * corl/torl unchanged; in T1_LDMIA it is OR-ed directly into the
 * instruction word, so it is parenthesized to keep the expansion safe for
 * any argument expression.
 */
#  define CC_LDMIA(cc,rn,im)		corl(cc,ARM_M|ARM_M_L|ARM_M_I,rn,im)
#  define LDMIA(rn,im)			CC_LDMIA(ARM_CC_AL,rn,im)
#  define CC_LDM(cc,rn,im)		CC_LDMIA(cc,rn,im)
#  define LDM(rn,im)			LDMIA(rn,im)
#  define T1_LDMIA(rn,im)		is(THUMB_LDMIA|(_u3(rn)<<8)|(im))
#  define T2_LDMIA(rn,im)		torl(THUMB2_LDMIA,rn,im)
#  define CC_LDMIA_U(cc,rn,im)		corl(cc,ARM_M|ARM_M_L|ARM_M_I|ARM_M_U,rn,im)
#  define LDMIA_U(rn,im)		CC_LDMIA_U(ARM_CC_AL,rn,im)
#  define LDM_U(r0,i0)			LDMIA_U(r0,i0)
#  define CC_LDMIB(cc,rn,im)		corl(cc,ARM_M|ARM_M_L|ARM_M_I|ARM_M_B,rn,im)
#  define LDMIB(rn,im)			CC_LDMIB(ARM_CC_AL,rn,im)
#  define CC_LDMIB_U(cc,rn,im)		corl(cc,ARM_M|ARM_M_L|ARM_M_I|ARM_M_B|ARM_M_U,rn,im)
#  define LDMIB_U(rn,im)		CC_LDMIB_U(ARM_CC_AL,rn,im)
#  define CC_LDMDA(cc,rn,im)		corl(cc,ARM_M|ARM_M_L,rn,im)
#  define LDMDA(rn,im)			CC_LDMDA(ARM_CC_AL,rn,im)
#  define CC_LDMDA_U(cc,rn,im)		corl(cc,ARM_M|ARM_M_L|ARM_M_U,rn,im)
#  define LDMDA_U(rn,im)		CC_LDMDA_U(ARM_CC_AL,rn,im)
#  define CC_LDMDB(cc,rn,im)		corl(cc,ARM_M|ARM_M_L|ARM_M_B,rn,im)
#  define LDMDB(rn,im)			CC_LDMDB(ARM_CC_AL,rn,im)
#  define T2_LDMDB(rn,im)		torl(THUMB2_LDMDB,rn,im)
#  define CC_LDMDB_U(cc,rn,im)		corl(cc,ARM_M|ARM_M_L|ARM_M_B|ARM_M_U,rn,im)
#  define LDMDB_U(rn,im)		CC_LDMDB_U(ARM_CC_AL,rn,im)
/*
 * Store-multiple encoders.  All go through corl with ARM_M (without
 * ARM_M_L) plus a combination of ARM_M_I, ARM_M_B and ARM_M_U selected by
 * the mnemonic suffix (IA, IB, DA, DB, and _U).  CC_* forms take an
 * explicit condition code; unprefixed forms pass ARM_CC_AL.  STM/STM_U are
 * aliases for STMIA/STMIA_U.
 */
#  define CC_STMIA(cc,rn,im)		corl(cc,ARM_M|ARM_M_I,rn,im)
#  define STMIA(rn,im)			CC_STMIA(ARM_CC_AL,rn,im)
#  define CC_STM(cc,rn,im)		CC_STMIA(cc,rn,im)
#  define STM(rn,im)			STMIA(rn,im)
#  define CC_STMIA_U(cc,rn,im)		corl(cc,ARM_M|ARM_M_I|ARM_M_U,rn,im)
#  define STMIA_U(rn,im)		CC_STMIA_U(ARM_CC_AL,rn,im)
#  define CC_STM_U(cc,rn,im)		CC_STMIA_U(cc,rn,im)
#  define STM_U(rn,im)			STMIA_U(rn,im)
#  define CC_STMIB(cc,rn,im)		corl(cc,ARM_M|ARM_M_I|ARM_M_B,rn,im)
#  define STMIB(rn,im)			CC_STMIB(ARM_CC_AL,rn,im)
#  define CC_STMIB_U(cc,rn,im)		corl(cc,ARM_M|ARM_M_I|ARM_M_B|ARM_M_U,rn,im)
#  define STMIB_U(rn,im)		CC_STMIB_U(ARM_CC_AL,rn,im)
#  define CC_STMDA(cc,rn,im)		corl(cc,ARM_M,rn,im)
#  define STMDA(rn,im)			CC_STMDA(ARM_CC_AL,rn,im)
#  define CC_STMDA_U(cc,rn,im)		corl(cc,ARM_M|ARM_M_U,rn,im)
#  define STMDA_U(rn,im)		CC_STMDA_U(ARM_CC_AL,rn,im)
#  define CC_STMDB(cc,rn,im)		corl(cc,ARM_M|ARM_M_B,rn,im)
#  define STMDB(rn,im)			CC_STMDB(ARM_CC_AL,rn,im)
#  define CC_STMDB_U(cc,rn,im)		corl(cc,ARM_M|ARM_M_B|ARM_M_U,rn,im)
#  define STMDB_U(rn,im)		CC_STMDB_U(ARM_CC_AL,rn,im)
/*
 * PUSH/POP in terms of STMDB_U/LDMIA_U on _SP_REGNO.  `im` is the register
 * bit mask.  The conditional forms must expand to the CC_* multiple-transfer
 * macros, which are the ones that accept a condition code.
 * In the 16-bit Thumb forms bits 7:0 of the mask are kept and one high bit
 * is moved down to bit 8: bit 14 (r14) for PUSH, bit 15 (r15) for POP.
 */
#  define CC_PUSH(cc,im)		CC_STMDB_U(cc,_SP_REGNO,im)
#  define PUSH(im)			STMDB_U(_SP_REGNO,im)
#  define T1_PUSH(im)			is(THUMB_PUSH|(((im)&0x4000)>>6)|((im)&0xff))
#  define T2_PUSH(im)			tpp(THUMB2_PUSH,im)
#  define CC_POP(cc,im)			CC_LDMIA_U(cc,_SP_REGNO,im)
#  define POP(im)			LDMIA_U(_SP_REGNO,im)
#  define T1_POP(im)			is(THUMB_POP|(((im)&0x8000)>>7)|((im)&0xff))
#  define T2_POP(im)			tpp(THUMB2_POP,im)
/*
 * Call jit_get_reg() for _R0.._R3, each requested by name
 * (jit_class_named) in the gpr class, discarding the returned value.
 * Presumably this reserves the four argument registers around a helper
 * call -- confirm against jit_get_reg().
 */
#  define jit_get_reg_args()						\
    do {								\
	(void)jit_get_reg(_R0|jit_class_named|jit_class_gpr);		\
	(void)jit_get_reg(_R1|jit_class_named|jit_class_gpr);		\
	(void)jit_get_reg(_R2|jit_class_named|jit_class_gpr);		\
	(void)jit_get_reg(_R3|jit_class_named|jit_class_gpr);		\
    } while (0)
/*
 * Counterpart of jit_get_reg_args(): calls jit_unget_reg() for _R3 down to
 * _R0, i.e. in the reverse order.
 */
#  define jit_unget_reg_args()						\
    do {								\
	jit_unget_reg(_R3);						\
	jit_unget_reg(_R2);						\
	jit_unget_reg(_R1);						\
	jit_unget_reg(_R0);						\
    } while (0)
/*
 * Code-generation entry points.  Each lowercase macro forwards its
 * arguments, preceded by the in-scope `_jit`, to the static function
 * declared on the following line.  In the prototypes, jit_int32_t
 * parameters correspond to the macro's rN arguments and jit_word_t
 * parameters to its iN arguments.
 */
#  define nop(i0)			_nop(_jit,i0)
static void _nop(jit_state_t*,jit_int32_t);
/* Moves; movi_p is the only one here that returns a jit_word_t. */
#  define movr(r0,r1)			_movr(_jit,r0,r1)
static void _movr(jit_state_t*,jit_int32_t,jit_int32_t);
#  define movi(r0,i0)			_movi(_jit,r0,i0)
static void _movi(jit_state_t*,jit_int32_t,jit_word_t);
#  define movi_p(r0,i0)			_movi_p(_jit,r0,i0)
static jit_word_t _movi_p(jit_state_t*,jit_int32_t,jit_word_t);
/* Unary operations. */
#  define comr(r0,r1)			_comr(_jit,r0,r1)
static void _comr(jit_state_t*,jit_int32_t,jit_int32_t);
#  define negr(r0,r1)			_negr(_jit,r0,r1)
static void _negr(jit_state_t*,jit_int32_t,jit_int32_t);
/* Addition: plain, and the addc / addx variants. */
#  define addr(r0,r1,r2)		_addr(_jit,r0,r1,r2)
static void _addr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
#  define addi(r0,r1,i0)		_addi(_jit,r0,r1,i0)
static void _addi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
#  define addcr(r0,r1,r2)		_addcr(_jit,r0,r1,r2)
static void _addcr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
#  define addci(r0,r1,i0)		_addci(_jit,r0,r1,i0)
static void _addci(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
#  define addxr(r0,r1,r2)		_addxr(_jit,r0,r1,r2)
static void _addxr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
#  define addxi(r0,r1,i0)		_addxi(_jit,r0,r1,i0)
static void _addxi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
/* Subtraction: plain, the subc / subx variants, and rsbi. */
#  define subr(r0,r1,r2)		_subr(_jit,r0,r1,r2)
static void _subr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
#  define subi(r0,r1,i0)		_subi(_jit,r0,r1,i0)
static void _subi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
#  define subcr(r0,r1,r2)		_subcr(_jit,r0,r1,r2)
static void _subcr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
#  define subci(r0,r1,i0)		_subci(_jit,r0,r1,i0)
static void _subci(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
#  define subxr(r0,r1,r2)		_subxr(_jit,r0,r1,r2)
static void _subxr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
#  define subxi(r0,r1,i0)		_subxi(_jit,r0,r1,i0)
static void _subxi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
#  define rsbi(r0, r1, i0)		_rsbi(_jit, r0, r1, i0)
static void _rsbi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
/* Multiplication. */
#  define mulr(r0,r1,r2)		_mulr(_jit,r0,r1,r2)
static void _mulr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
#  define muli(r0,r1,i0)		_muli(_jit,r0,r1,i0)
static void _muli(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
/*
 * Two-result multiply.  qmulr/qmuli and their _u counterparts share one
 * implementation each (_iqmulr/_iqmuli) and differ only in the trailing
 * jit_bool_t argument: 1 for the plain names, 0 for the _u names
 * (presumably signed vs. unsigned -- confirm in the definitions).
 */
#  define qmulr(r0,r1,r2,r3)		iqmulr(r0,r1,r2,r3,1)
#  define qmulr_u(r0,r1,r2,r3)		iqmulr(r0,r1,r2,r3,0)
#  define iqmulr(r0,r1,r2,r3,cc)	_iqmulr(_jit,r0,r1,r2,r3,cc)
static void _iqmulr(jit_state_t*,jit_int32_t,jit_int32_t,
		    jit_int32_t,jit_int32_t,jit_bool_t);
#  define qmuli(r0,r1,r2,i0)		iqmuli(r0,r1,r2,i0,1)
#  define qmuli_u(r0,r1,r2,i0)		iqmuli(r0,r1,r2,i0,0)
#  define iqmuli(r0,r1,r2,i0,cc)	_iqmuli(_jit,r0,r1,r2,i0,cc)
static void _iqmuli(jit_state_t*,jit_int32_t,jit_int32_t,
		    jit_int32_t,jit_word_t,jit_bool_t);
/* divrem takes two leading int selectors (d, s) ahead of the three
 * register arguments; their meaning is defined by _divrem. */
#  define divrem(d,s,r0,r1,r2)		_divrem(_jit,d,s,r0,r1,r2)
static void _divrem(jit_state_t*,int,int,jit_int32_t,jit_int32_t,jit_int32_t);
/* Division, plain and _u variants. */
#  define divr(r0,r1,r2)		_divr(_jit,r0,r1,r2)
static void _divr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
#  define divi(r0,r1,i0)		_divi(_jit,r0,r1,i0)
static void _divi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
#  define divr_u(r0,r1,r2)		_divr_u(_jit,r0,r1,r2)
static void _divr_u(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
#  define divi_u(r0,r1,i0)		_divi_u(_jit,r0,r1,i0)
static void _divi_u(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
/* Two-result divide; same 1/0 trailing-flag scheme as qmulr/qmulr_u. */
#  define qdivr(r0,r1,r2,r3)		iqdivr(r0,r1,r2,r3,1)
#  define qdivr_u(r0,r1,r2,r3)		iqdivr(r0,r1,r2,r3,0)
#  define iqdivr(r0,r1,r2,r3,cc)	_iqdivr(_jit,r0,r1,r2,r3,cc)
static void _iqdivr(jit_state_t*,jit_int32_t,jit_int32_t,
		    jit_int32_t,jit_int32_t,jit_bool_t);
#  define qdivi(r0,r1,r2,i0)		iqdivi(r0,r1,r2,i0,1)
#  define qdivi_u(r0,r1,r2,i0)		iqdivi(r0,r1,r2,i0,0)
#  define iqdivi(r0,r1,r2,i0,cc)	_iqdivi(_jit,r0,r1,r2,i0,cc)
static void _iqdivi(jit_state_t*,jit_int32_t,jit_int32_t,
		    jit_int32_t,jit_word_t,jit_bool_t);
/* Remainder, plain and _u variants. */
#  define remr(r0,r1,r2)		_remr(_jit,r0,r1,r2)
static void _remr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
#  define remi(r0,r1,i0)		_remi(_jit,r0,r1,i0)
static void _remi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
#  define remr_u(r0,r1,r2)		_remr_u(_jit,r0,r1,r2)
static void _remr_u(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
#  define remi_u(r0,r1,i0)		_remi_u(_jit,r0,r1,i0)
static void _remi_u(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
/*
 * Bitwise and shift operations.  Each macro forwards to the static
 * function declared right after it, adding `_jit` as first argument; the
 * ...r forms take a register as last operand, the ...i forms a jit_word_t.
 */
#  define andr(r0,r1,r2)		_andr(_jit,r0,r1,r2)
static void _andr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
#  define andi(r0,r1,i0)		_andi(_jit,r0,r1,i0)
static void _andi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
#  define orr(r0,r1,r2)			_orr(_jit,r0,r1,r2)
static void _orr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
#  define ori(r0,r1,i0)			_ori(_jit,r0,r1,i0)
static void _ori(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
#  define xorr(r0,r1,r2)		_xorr(_jit,r0,r1,r2)
static void _xorr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
#  define xori(r0,r1,i0)		_xori(_jit,r0,r1,i0)
static void _xori(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
/* Shifts: lsh, rsh, and rsh _u variants. */
#  define lshr(r0,r1,r2)		_lshr(_jit,r0,r1,r2)
static void _lshr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
#  define lshi(r0,r1,i0)		_lshi(_jit,r0,r1,i0)
static void _lshi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
#  define rshr(r0,r1,r2)		_rshr(_jit,r0,r1,r2)
static void _rshr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
#  define rshi(r0,r1,i0)		_rshi(_jit,r0,r1,i0)
static void _rshi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
#  define rshr_u(r0,r1,r2)		_rshr_u(_jit,r0,r1,r2)
static void _rshr_u(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
#  define rshi_u(r0,r1,i0)		_rshi_u(_jit,r0,r1,i0)
static void _rshi_u(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
/* Generic compare helpers: take two condition codes (ct, cf) ahead of the
 * operands. */
#  define ccr(ct,cf,r0,r1,r2)		_ccr(_jit,ct,cf,r0,r1,r2)
static void _ccr(jit_state_t*,int,int,jit_int32_t,jit_int32_t,jit_int32_t);
#  define cci(ct,cf,r0,r1,i0)		_cci(_jit,ct,cf,r0,r1,i0)
static void _cci(jit_state_t*,int,int,jit_int32_t,jit_int32_t,jit_word_t);
/*
 * Comparison operations expressed through ccr/cci.  Each passes an ARM
 * condition code as `ct` and the opposite condition as `cf`
 * (LT/GE, LO/HS, LE/GT, LS/HI, EQ/NE).  The _u variants use the
 * LO/LS/HS/HI conditions instead of LT/LE/GE/GT.
 */
#  define ltr(r0, r1, r2)		ccr(ARM_CC_LT,ARM_CC_GE,r0,r1,r2)
#  define lti(r0, r1, i0)		cci(ARM_CC_LT,ARM_CC_GE,r0,r1,i0)
#  define ltr_u(r0, r1, r2)		ccr(ARM_CC_LO,ARM_CC_HS,r0,r1,r2)
#  define lti_u(r0, r1, i0)		cci(ARM_CC_LO,ARM_CC_HS,r0,r1,i0)
#  define ler(r0, r1, r2)		ccr(ARM_CC_LE,ARM_CC_GT,r0,r1,r2)
#  define lei(r0, r1, i0)		cci(ARM_CC_LE,ARM_CC_GT,r0,r1,i0)
#  define ler_u(r0, r1, r2)		ccr(ARM_CC_LS,ARM_CC_HI,r0,r1,r2)
#  define lei_u(r0, r1, i0)		cci(ARM_CC_LS,ARM_CC_HI,r0,r1,i0)
#  define eqr(r0, r1, r2)		ccr(ARM_CC_EQ,ARM_CC_NE,r0,r1,r2)
#  define eqi(r0, r1, i0)		cci(ARM_CC_EQ,ARM_CC_NE,r0,r1,i0)
#  define ger(r0, r1, r2)		ccr(ARM_CC_GE,ARM_CC_LT,r0,r1,r2)
#  define gei(r0, r1, i0)		cci(ARM_CC_GE,ARM_CC_LT,r0,r1,i0)
#  define ger_u(r0, r1, r2)		ccr(ARM_CC_HS,ARM_CC_LO,r0,r1,r2)
#  define gei_u(r0, r1, i0)		cci(ARM_CC_HS,ARM_CC_LO,r0,r1,i0)
#  define gtr(r0, r1, r2)		ccr(ARM_CC_GT,ARM_CC_LE,r0,r1,r2)
#  define gti(r0, r1, i0)		cci(ARM_CC_GT,ARM_CC_LE,r0,r1,i0)
#  define gtr_u(r0, r1, r2)		ccr(ARM_CC_HI,ARM_CC_LS,r0,r1,r2)
#  define gti_u(r0, r1, i0)		cci(ARM_CC_HI,ARM_CC_LS,r0,r1,i0)
/* "Not equal" has dedicated implementations instead of going through
 * ccr/cci. */
#  define ner(r0,r1,r2)			_ner(_jit,r0,r1,r2)
static void _ner(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
#  define nei(r0,r1,i0)			_nei(_jit,r0,r1,i0)
static void _nei(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
/*
 * Jumps.  jmpi_p takes an extra jit_bool_t and returns a jit_word_t
 * (presumably the address to patch later -- confirm in _jmpi_p).
 */
#  define jmpr(r0)			_jmpr(_jit,r0)
static void _jmpr(jit_state_t*,jit_int32_t);
#  define jmpi(i0)			_jmpi(_jit,i0)
static void _jmpi(jit_state_t*,jit_word_t);
#  define jmpi_p(i0, i1)		_jmpi_p(_jit,i0, i1)
static jit_word_t _jmpi_p(jit_state_t*,jit_word_t,jit_bool_t);
/*
 * Compare-and-branch.  bccr/bcci take the ARM condition code first, then
 * the jit_word_t i0, then the operands, and return a jit_word_t.  The
 * named branches below only select the condition code; the _u variants
 * use LO/LS/HS/HI instead of LT/LE/GE/GT.
 */
#  define bccr(cc,i0,r0,r1)		_bccr(_jit,cc,i0,r0,r1)
static jit_word_t _bccr(jit_state_t*,int,jit_word_t,jit_int32_t,jit_int32_t);
#  define bcci(cc,i0,r0,i1)		_bcci(_jit,cc,i0,r0,i1)
static jit_word_t _bcci(jit_state_t*,int,jit_word_t,jit_int32_t,jit_word_t);
#  define bltr(i0, r0, r1)		bccr(ARM_CC_LT,i0,r0,r1)
#  define blti(i0, r0, i1)		bcci(ARM_CC_LT,i0,r0,i1)
#  define bltr_u(i0, r0, r1)		bccr(ARM_CC_LO,i0,r0,r1)
#  define blti_u(i0, r0, i1)		bcci(ARM_CC_LO,i0,r0,i1)
#  define bler(i0, r0, r1)		bccr(ARM_CC_LE,i0,r0,r1)
#  define blei(i0, r0, i1)		bcci(ARM_CC_LE,i0,r0,i1)
#  define bler_u(i0, r0, r1)		bccr(ARM_CC_LS,i0,r0,r1)
#  define blei_u(i0, r0, i1)		bcci(ARM_CC_LS,i0,r0,i1)
#  define beqr(i0, r0, r1)		bccr(ARM_CC_EQ,i0,r0,r1)
#  define beqi(i0, r0, i1)		bcci(ARM_CC_EQ,i0,r0,i1)
#  define bger(i0, r0, r1)		bccr(ARM_CC_GE,i0,r0,r1)
#  define bgei(i0, r0, i1)		bcci(ARM_CC_GE,i0,r0,i1)
#  define bger_u(i0, r0, r1)		bccr(ARM_CC_HS,i0,r0,r1)
#  define bgei_u(i0, r0, i1)		bcci(ARM_CC_HS,i0,r0,i1)
#  define bgtr(i0, r0, r1)		bccr(ARM_CC_GT,i0,r0,r1)
#  define bgti(i0, r0, i1)		bcci(ARM_CC_GT,i0,r0,i1)
#  define bgtr_u(i0, r0, r1)		bccr(ARM_CC_HI,i0,r0,r1)
#  define bgti_u(i0, r0, i1)		bcci(ARM_CC_HI,i0,r0,i1)
#  define bner(i0, r0, r1)		bccr(ARM_CC_NE,i0,r0,r1)
#  define bnei(i0, r0, i1)		bcci(ARM_CC_NE,i0,r0,i1)
/*
 * Add-and-branch.  baddr/baddi take the condition code first and return a
 * jit_word_t.  boadd* select VS (signed) / HS (_u); bxadd* select the
 * opposite conditions VC / LO.
 * NOTE(review): the last parameter of the baddi macro is named r1 although
 * the prototype takes a jit_word_t there; arguments are forwarded
 * positionally so this is only a naming quirk.
 */
#  define baddr(cc,i0,r0,r1)		_baddr(_jit,cc,i0,r0,r1)
static jit_word_t _baddr(jit_state_t*,int,jit_word_t,jit_int32_t,jit_int32_t);
#  define baddi(cc,i0,r0,r1)		_baddi(_jit,cc,i0,r0,r1)
static jit_word_t _baddi(jit_state_t*,int,jit_word_t,jit_int32_t,jit_word_t);
#  define boaddr(i0,r0,r1)		baddr(ARM_CC_VS,i0,r0,r1)
#  define boaddi(i0,r0,i1)		baddi(ARM_CC_VS,i0,r0,i1)
#  define boaddr_u(i0,r0,r1)		baddr(ARM_CC_HS,i0,r0,r1)
#  define boaddi_u(i0,r0,i1)		baddi(ARM_CC_HS,i0,r0,i1)
#  define bxaddr(i0,r0,r1)		baddr(ARM_CC_VC,i0,r0,r1)
#  define bxaddi(i0,r0,i1)		baddi(ARM_CC_VC,i0,r0,i1)
#  define bxaddr_u(i0,r0,r1)		baddr(ARM_CC_LO,i0,r0,r1)
#  define bxaddi_u(i0,r0,i1)		baddi(ARM_CC_LO,i0,r0,i1)
/*
 * Subtract-and-branch.  Same layout as the add forms; note the unsigned
 * conditions are swapped relative to addition: bosub*_u select LO and
 * bxsub*_u select HS.
 */
#  define bsubr(cc,i0,r0,r1)		_bsubr(_jit,cc,i0,r0,r1)
static jit_word_t _bsubr(jit_state_t*,int,jit_word_t,jit_int32_t,jit_int32_t);
#  define bsubi(cc,i0,r0,r1)		_bsubi(_jit,cc,i0,r0,r1)
static jit_word_t _bsubi(jit_state_t*,int,jit_word_t,jit_int32_t,jit_word_t);
#  define bosubr(i0,r0,r1)		bsubr(ARM_CC_VS,i0,r0,r1)
#  define bosubi(i0,r0,i1)		bsubi(ARM_CC_VS,i0,r0,i1)
#  define bosubr_u(i0,r0,r1)		bsubr(ARM_CC_LO,i0,r0,r1)
#  define bosubi_u(i0,r0,i1)		bsubi(ARM_CC_LO,i0,r0,i1)
#  define bxsubr(i0,r0,r1)		bsubr(ARM_CC_VC,i0,r0,r1)
#  define bxsubi(i0,r0,i1)		bsubi(ARM_CC_VC,i0,r0,i1)
#  define bxsubr_u(i0,r0,r1)		bsubr(ARM_CC_HS,i0,r0,r1)
#  define bxsubi_u(i0,r0,i1)		bsubi(ARM_CC_HS,i0,r0,i1)
/*
 * Mask-test branches through bmxr/bmxi: bms* pass ARM_CC_NE and bmc* pass
 * ARM_CC_EQ.
 */
#  define bmxr(cc,i0,r0,r1)		_bmxr(_jit,cc,i0,r0,r1)
static jit_word_t _bmxr(jit_state_t*,int,jit_word_t,jit_int32_t,jit_int32_t);
#  define bmxi(cc,i0,r0,r1)		_bmxi(_jit,cc,i0,r0,r1)
static jit_word_t _bmxi(jit_state_t*,int,jit_word_t,jit_int32_t,jit_word_t);
#  define bmsr(i0,r0,r1)		bmxr(ARM_CC_NE,i0,r0,r1)
#  define bmsi(i0,r0,i1)		bmxi(ARM_CC_NE,i0,r0,i1)
#  define bmcr(i0,r0,r1)		bmxr(ARM_CC_EQ,i0,r0,r1)
#  define bmci(i0,r0,i1)		bmxi(ARM_CC_EQ,i0,r0,i1)
/*
 * Load operations for the _c, _uc, _s, _us and _i suffixes.  For each
 * suffix there are four forms:
 *   ldr_X(r0,r1)      two registers
 *   ldi_X(r0,i0)      register and jit_word_t
 *   ldxr_X(r0,r1,r2)  three registers
 *   ldxi_X(r0,r1,i0)  two registers and jit_word_t
 * Each macro forwards to the static function declared after it, adding
 * `_jit` as first argument.
 */
#  define ldr_c(r0,r1)			_ldr_c(_jit,r0,r1)
static void _ldr_c(jit_state_t*,jit_int32_t,jit_int32_t);
#  define ldi_c(r0,i0)			_ldi_c(_jit,r0,i0)
static void _ldi_c(jit_state_t*,jit_int32_t,jit_word_t);
#  define ldxr_c(r0,r1,r2)		_ldxr_c(_jit,r0,r1,r2)
static void _ldxr_c(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
#  define ldxi_c(r0,r1,i0)		_ldxi_c(_jit,r0,r1,i0)
static void _ldxi_c(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
#  define ldr_uc(r0,r1)			_ldr_uc(_jit,r0,r1)
static void _ldr_uc(jit_state_t*,jit_int32_t,jit_int32_t);
#  define ldi_uc(r0,i0)			_ldi_uc(_jit,r0,i0)
static void _ldi_uc(jit_state_t*,jit_int32_t,jit_word_t);
#  define ldxr_uc(r0,r1,r2)		_ldxr_uc(_jit,r0,r1,r2)
static void _ldxr_uc(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
#  define ldxi_uc(r0,r1,i0)		_ldxi_uc(_jit,r0,r1,i0)
static void _ldxi_uc(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
#  define ldr_s(r0,r1)			_ldr_s(_jit,r0,r1)
static void _ldr_s(jit_state_t*,jit_int32_t,jit_int32_t);
#  define ldi_s(r0,i0)			_ldi_s(_jit,r0,i0)
static void _ldi_s(jit_state_t*,jit_int32_t,jit_word_t);
#  define ldxr_s(r0,r1,r2)		_ldxr_s(_jit,r0,r1,r2)
static void _ldxr_s(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
#  define ldxi_s(r0,r1,i0)		_ldxi_s(_jit,r0,r1,i0)
static void _ldxi_s(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
#  define ldr_us(r0,r1)			_ldr_us(_jit,r0,r1)
static void _ldr_us(jit_state_t*,jit_int32_t,jit_int32_t);
#  define ldi_us(r0,i0)			_ldi_us(_jit,r0,i0)
static void _ldi_us(jit_state_t*,jit_int32_t,jit_word_t);
#  define ldxr_us(r0,r1,r2)		_ldxr_us(_jit,r0,r1,r2)
static void _ldxr_us(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
#  define ldxi_us(r0,r1,i0)		_ldxi_us(_jit,r0,r1,i0)
static void _ldxi_us(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
#  define ldr_i(r0,r1)			_ldr_i(_jit,r0,r1)
static void _ldr_i(jit_state_t*,jit_int32_t,jit_int32_t);
#  define ldi_i(r0,i0)			_ldi_i(_jit,r0,i0)
static void _ldi_i(jit_state_t*,jit_int32_t,jit_word_t);
#  define ldxr_i(r0,r1,r2)		_ldxr_i(_jit,r0,r1,r2)
static void _ldxr_i(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
#  define ldxi_i(r0,r1,i0)		_ldxi_i(_jit,r0,r1,i0)
static void _ldxi_i(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
/*
 * Store operations for the _c, _s and _i suffixes, in str/sti/stxr/stxi
 * forms.  Each macro forwards its arguments positionally, preceded by
 * `_jit`, to the static function declared after it.
 *
 * NOTE(review): the stxi_X macros name their parameters (r0,r1,i0) but the
 * prototypes take (jit_word_t, jit_int32_t, jit_int32_t), so the first
 * macro argument is the jit_word_t one.
 * NOTE(review): _stxr_i declares its first operand as jit_word_t, unlike
 * _stxr_c and _stxr_s which use jit_int32_t -- confirm against the
 * definition.
 */
#  define str_c(r0,r1)			_str_c(_jit,r0,r1)
static void _str_c(jit_state_t*,jit_int32_t,jit_int32_t);
#  define sti_c(i0,r0)			_sti_c(_jit,i0,r0)
static void _sti_c(jit_state_t*,jit_word_t,jit_int32_t);
#  define stxr_c(r0,r1,r2)		_stxr_c(_jit,r0,r1,r2)
static void _stxr_c(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
#  define stxi_c(r0,r1,i0)		_stxi_c(_jit,r0,r1,i0)
static void _stxi_c(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
#  define str_s(r0,r1)			_str_s(_jit,r0,r1)
static void _str_s(jit_state_t*,jit_int32_t,jit_int32_t);
#  define sti_s(i0,r0)			_sti_s(_jit,i0,r0)
static void _sti_s(jit_state_t*,jit_word_t,jit_int32_t);
#  define stxr_s(r0,r1,r2)		_stxr_s(_jit,r0,r1,r2)
static void _stxr_s(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
#  define stxi_s(r0,r1,i0)		_stxi_s(_jit,r0,r1,i0)
static void _stxi_s(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
#  define str_i(r0,r1)			_str_i(_jit,r0,r1)
static void _str_i(jit_state_t*,jit_int32_t,jit_int32_t);
#  define sti_i(i0,r0)			_sti_i(_jit,i0,r0)
static void _sti_i(jit_state_t*,jit_word_t,jit_int32_t);
#  define stxr_i(r0,r1,r2)		_stxr_i(_jit,r0,r1,r2)
static void _stxr_i(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
#  define stxi_i(r0,r1,i0)		_stxi_i(_jit,r0,r1,i0)
static void _stxi_i(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
1094 #  if __BYTE_ORDER == __LITTLE_ENDIAN
1095 #  define htonr_us(r0,r1)		_htonr_us(_jit,r0,r1)
1096 static void _htonr_us(jit_state_t*,jit_int32_t,jit_int32_t);
1097 #  define htonr_ui(r0,r1)		_htonr_ui(_jit,r0,r1)
1098 static void _htonr_ui(jit_state_t*,jit_int32_t,jit_int32_t);
1099 #  else
1100 #    define htonr_us(r0,r1)		extr_us(r0,r1)
1101 #    define htonr(r0,r1)		movr(r0,r1)
1102 #  endif
/*
 * Extension operations for the _c, _uc, _s and _us suffixes; each forwards
 * to the static function declared after it, adding `_jit`.
 */
#  define extr_c(r0,r1)			_extr_c(_jit,r0,r1)
static void _extr_c(jit_state_t*,jit_int32_t,jit_int32_t);
#  define extr_uc(r0,r1)		_extr_uc(_jit,r0,r1)
static void _extr_uc(jit_state_t*,jit_int32_t,jit_int32_t);
#  define extr_s(r0,r1)			_extr_s(_jit,r0,r1)
static void _extr_s(jit_state_t*,jit_int32_t,jit_int32_t);
#  define extr_us(r0,r1)		_extr_us(_jit,r0,r1)
static void _extr_us(jit_state_t*,jit_int32_t,jit_int32_t);
/* Function prolog/epilog; both take a jit_node_t pointer. */
#  define prolog(i0)			_prolog(_jit,i0)
static void _prolog(jit_state_t*,jit_node_t*);
#  define epilog(i0)			_epilog(_jit,i0)
static void _epilog(jit_state_t*,jit_node_t*);
/* Calls; calli_p is the only one that returns a jit_word_t. */
#  define callr(r0)			_callr(_jit,r0)
static void _callr(jit_state_t*,jit_int32_t);
#  define calli(i0)			_calli(_jit,i0)
static void _calli(jit_state_t*,jit_word_t);
#  define calli_p(i0)			_calli_p(_jit,i0)
static jit_word_t _calli_p(jit_state_t*,jit_word_t);
/* Variadic-argument support. */
#  define vastart(r0)			_vastart(_jit, r0)
static void _vastart(jit_state_t*, jit_int32_t);
#  define vaarg(r0, r1)			_vaarg(_jit, r0, r1)
static void _vaarg(jit_state_t*, jit_int32_t, jit_int32_t);
/* patch_at takes a kind plus two jit_word_t values (named jump and label
 * in the macro). */
#  define patch_at(kind,jump,label)	_patch_at(_jit,kind,jump,label)
static void _patch_at(jit_state_t*,jit_int32_t,jit_word_t,jit_word_t);
1127 #endif
1128 
1129 #if CODE
/* from binutils */
/*
 * Rotate the 32-bit value v left by n bits, 0 <= n < 32.  The right-shift
 * count is reduced modulo 32 so that n == 0 does not shift by the full
 * width of the type, which is undefined behaviour in C.
 */
#  define rotate_left(v, n)	(((v) << (n)) | ((v) >> ((32 - (n)) & 31)))
/*
 * Try to express v as an 8-bit value combined with an even rotation.
 * Every even left-rotation 0, 2, ..., 30 of v is tested in increasing
 * order; for the first one whose result fits in 8 bits the function
 * returns that byte in bits 7:0 with (rotation << 7) OR-ed in, i.e.
 * rotation/2 placed at bits 11:8.  Returns -1 when no rotation fits.
 */
static int
encode_arm_immediate(unsigned int v)
{
    unsigned int	a, i;

    for (i = 0; i < 32; i += 2)
	if ((a = rotate_left(v, i)) <= 0xff)
	    return (a | (i << 7));

    return (-1);
}
1143 
/*
 * Try to express v as a Thumb-2 "modified immediate".  On success the
 * return value holds the 8-bit payload in bits 7:0, a 3-bit selector in
 * bits 14:12 and one further selector bit at bit 26; -1 is returned when v
 * matches none of the patterns tried.
 *
 * The four replicated-byte patterns are tested first.  The final loop
 * handles an 8-bit value with its top bit set, placed so that this top bit
 * lands on bit 31 down to bit 17 (loop counter 8..22); placements further
 * right are not attempted here.
 */
static int
encode_thumb_immediate(unsigned int v)
{
    int			i;
    unsigned int	m;
    unsigned int	n;
    /* 00000000 00000000 00000000 abcdefgh */
    if ((v & 0xff) == v)
	return (v);
    /* 00000000 abcdefgh 00000000 abcdefgh */
    if ((v & 0xff00ff) == v && ((v & 0xff0000) >> 16) == (v & 0xff))
	return ((v & 0xff) | (1 << 12));
    /* abcdefgh 00000000 abcdefgh 00000000
     * Bits 7:0 were just checked to be zero; the payload byte lives in
     * bits 15:8 and has to be moved down into the low 8 bits. */
    if (((v & 0xffff0000) >> 16) == (v & 0xffff) && (v & 0xff) == 0)
	return (((v & 0x0000ff00) >> 8) | (2 << 12));
    /* abcdefgh abcdefgh abcdefgh abcdefgh */
    if ( (v &    0xff)        == ((v &     0xff00) >>  8) &&
	((v &   0xff00) >> 8) == ((v &   0xff0000) >> 16) &&
	((v & 0xff0000) << 8) ==  (v & 0xff000000))
	return ((v & 0xff) | (3 << 12));
    /* 1bcdefgh << 24 ... 1bcdefgh << 1 */
    for (i = 8, m = 0xff000000, n = 0x80000000;
	 i < 23; i++, m >>= 1,  n >>= 1) {
	/* m is the 8-bit window, n its top bit, which must be set. */
	if ((v & m) == v && (v & n)) {
	    v >>= 32 - i;
	    /* Bit 7 of the payload carries the low bit of i: it is left
	     * set (the leading 1) when i is odd and cleared when even. */
	    if (!(i & 1))
		v &= 0x7f;
	    /* The remaining four bits of i go to bits 14:12 and bit 26. */
	    i >>= 1;
	    return (((i & 7) << 12) | ((i & 8) << 23) | v);
	}
    }
    return (-1);
}
1177 
/*
 * Scatter a 12-bit unsigned value into three instruction fields: bit 11
 * goes to bit 26, bits 10:8 go to bits 14:12 and bits 7:0 stay in place.
 * Returns -1 if v does not fit in 12 bits.
 */
static int
encode_thumb_word_immediate(unsigned int v)
{
    unsigned int	top, mid, low;

    if (v & 0xfffff000)
	return (-1);

    top = (v & 0x800) << 15;
    mid = (v & 0x700) << 4;
    low = v & 0xff;
    return (top | mid | low);
}
1185 
/*
 * Pack a signed 24-bit displacement into branch instruction fields.
 * Bit 23 of v (the sign) goes to bit 26, bits 20:11 to bits 25:16 and
 * bits 10:0 stay in place.  Bits 22 and 21 are stored at bits 13 and 11
 * respectively, each set when it equals the sign bit.
 * Returns -1 when v is outside [-0x800000, 0x7fffff].
 */
static int
encode_thumb_jump(int v)
{
    int		sign, j1, j2;

    if (v < (int)-0x800000 || v > 0x7fffff)
	return (-1);

    sign = (v & 0x800000) != 0;
    /* Same as "sign ? bit : !bit" for a 0/1 bit. */
    j1 = ((v & 0x400000) != 0) == sign;
    j2 = ((v & 0x200000) != 0) == sign;

    return ((sign << 26) | ((v & 0x1ff800) << 5) |
	    (j1 << 13) | (j2 << 11) | (v & 0x7ff));
}
1200 
/*
 * Pack a signed 20-bit displacement into conditional-branch instruction
 * fields.  Bit 19 of v (the sign) goes to bit 26, bit 17 to bit 13, bit 18
 * to bit 11, bits 16:11 to bits 21:16, and bits 10:0 stay in place.
 * Returns -1 when v is outside [-0x80000, 0x7ffff].
 */
static int
encode_thumb_cc_jump(int v)
{
    int		sign, b17, b18;

    if (v < (int)-0x80000 || v > 0x7ffff)
	return (-1);

    sign = (v & 0x80000) != 0;
    b17  = (v & 0x20000) != 0;
    b18  = (v & 0x40000) != 0;

    return ((sign << 26) | ((v & 0x1f800) << 5) |
	    (b17 << 13) | (b18 << 11) | (v & 0x7ff));
}
1213 
1214 static int
encode_thumb_shift(int v,int type)1215 encode_thumb_shift(int v, int type)
1216 {
1217     switch (type) {
1218 	case ARM_ASR:
1219 	case ARM_LSL:
1220 	case ARM_LSR:		type >>= 1;	break;
1221 	default:		assert(!"handled shift");
1222     }
1223     assert(v >= 0 && v <= 31);
1224     return (((v & 0x1c) << 10) | ((v & 3) << 6) | type);
1225 }
1226 
1227 static void
_tcit(jit_state_t * _jit,unsigned int tc,int it)1228 _tcit(jit_state_t *_jit, unsigned int tc, int it)
1229 {
1230     int		c;
1231     int		m;
1232     c = (tc >> 28) & 1;
1233     assert(!(tc & 0xfffffff) && tc != ARM_CC_NV);
1234     switch (it) {
1235 	case THUMB2_IT:		m =   1<<3; 			break;
1236 	case THUMB2_ITT:	m =  (c<<3)| (1<<2);		break;
1237 	case THUMB2_ITE:	m = (!c<<3)| (1<<2);		break;
1238 	case THUMB2_ITTT:	m =  (c<<3)| (c<<2)| (1<<1);	break;
1239 	case THUMB2_ITET:	m = (!c<<3)| (c<<2)| (1<<1);	break;
1240 	case THUMB2_ITTE:	m =  (c<<3)|(!c<<2)| (1<<1);	break;
1241 	case THUMB2_ITEE:	m = (!c<<3)|(!c<<2)| (1<<1);	break;
1242 	case THUMB2_ITTTT:	m =  (c<<3)| (c<<2)| (c<<1)|1;	break;
1243 	case THUMB2_ITETT:	m = (!c<<3)| (c<<2)| (c<<1)|1;	break;
1244 	case THUMB2_ITTET:	m =  (c<<3)|(!c<<2)| (c<<1)|1;	break;
1245 	case THUMB2_ITEET:	m = (!c<<3)|(!c<<2)| (c<<1)|1;	break;
1246 	case THUMB2_ITTTE:	m =  (c<<3)| (c<<2)|(!c<<1)|1;	break;
1247 	case THUMB2_ITETE:	m = (!c<<3)| (c<<2)|(!c<<1)|1;	break;
1248 	case THUMB2_ITTEE:	m =  (c<<3)|(!c<<2)|(!c<<1)|1;	break;
1249 	case THUMB2_ITEEE:	m = (!c<<3)|(!c<<2)|(!c<<1)|1;	break;
1250 	default:		abort();
1251     }
1252     assert(m && (tc != ARM_CC_AL || !(m & (m - 1))));
1253     is(0xbf00 | (tc >> 24) | m);
1254 }
1255 
1256 static void
_corrr(jit_state_t * _jit,int cc,int o,int rn,int rd,int rm)1257 _corrr(jit_state_t *_jit, int cc, int o, int rn, int rd, int rm)
1258 {
1259     assert(!(cc & 0x0fffffff));
1260     assert(!(o  & 0xf00fff0f));
1261     ii(cc|o|(_u4(rn)<<16)|(_u4(rd)<<12)|_u4(rm));
1262 }
1263 
1264 static void
_corri(jit_state_t * _jit,int cc,int o,int rn,int rd,int im)1265 _corri(jit_state_t *_jit, int cc, int o, int rn, int rd, int im)
1266 {
1267     assert(!(cc & 0x0fffffff));
1268     assert(!(o  & 0xf00fffff));
1269     assert(!(im & 0xfffff000));
1270     ii(cc|o|(_u4(rn)<<16)|(_u4(rd)<<12)|_u12(im));
1271 }
1272 
1273 static void
_corri8(jit_state_t * _jit,int cc,int o,int rn,int rt,int im)1274 _corri8(jit_state_t *_jit, int cc, int o, int rn, int rt, int im)
1275 {
1276     assert(!(cc & 0x0fffffff));
1277     assert(!(o  & 0xf00fff0f));
1278     assert(!(im & 0xffffff00));
1279     ii(cc|o|(_u4(rn)<<16)|(_u4(rt)<<12)|((im&0xf0)<<4)|(im&0x0f));
1280 }
1281 
1282 static void
_coriw(jit_state_t * _jit,int cc,int o,int rd,int im)1283 _coriw(jit_state_t *_jit, int cc, int o, int rd, int im)
1284 {
1285     assert(!(cc & 0x0fffffff));
1286     assert(!(o  & 0xf00fffff));
1287     assert(!(im & 0xffff0000));
1288     ii(cc|o|((im&0xf000)<<4)|(_u4(rd)<<12)|(im&0xfff));
1289 }
1290 
1291 static void
_torrr(jit_state_t * _jit,int o,int rn,int rd,int rm)1292 _torrr(jit_state_t *_jit, int o, int rn, int rd, int rm)
1293 {
1294     jit_thumb_t	thumb;
1295     assert(!(o & 0xf0f0f));
1296     thumb.i = o|(_u4(rn)<<16)|(_u4(rd)<<8)|_u4(rm);
1297     iss(thumb.s[0], thumb.s[1]);
1298 }
1299 
1300 static void
_torrrs(jit_state_t * _jit,int o,int rn,int rd,int rm,int im)1301 _torrrs(jit_state_t *_jit, int o, int rn, int rd, int rm, int im)
1302 {
1303     jit_thumb_t	thumb;
1304     assert(!(o  & 0x000f0f0f));
1305     assert(!(im & 0xffff8f0f));
1306     thumb.i = o|(_u4(rn)<<16)|(_u4(rd)<<8)|im|_u4(rm);
1307     iss(thumb.s[0], thumb.s[1]);
1308 }
1309 
1310 static void
_torxr(jit_state_t * _jit,int o,int rn,int rt,int rm)1311 _torxr(jit_state_t *_jit, int o, int rn, int rt, int rm)
1312 {
1313     jit_thumb_t	thumb;
1314     assert(!(o & 0xf0f0f));
1315     thumb.i = o|(_u4(rn)<<16)|(_u4(rt)<<12)|_u4(rm);
1316     iss(thumb.s[0], thumb.s[1]);
1317 }
1318 
1319 static void
_torrrr(jit_state_t * _jit,int o,int rn,int rl,int rh,int rm)1320 _torrrr(jit_state_t *_jit, int o, int rn, int rl, int rh, int rm)
1321 {
1322     jit_thumb_t	thumb;
1323     assert(!(o & 0x000fff0f));
1324     thumb.i = o|(_u4(rn)<<16)|(_u4(rl)<<12)|(_u4(rh)<<8)|_u4(rm);
1325     iss(thumb.s[0], thumb.s[1]);
1326 }
1327 
1328 static void
_torrri8(jit_state_t * _jit,int o,int rn,int rt,int rt2,int im)1329 _torrri8(jit_state_t *_jit, int o, int rn, int rt, int rt2, int im)
1330 {
1331     jit_thumb_t	thumb;
1332     assert(!(o  & 0x000fffff));
1333     assert(!(im & 0xffffff00));
1334     thumb.i = o|(_u4(rn)<<16)|(_u4(rt)<<12)|(_u4(rt2)<<8)|im;
1335     iss(thumb.s[0], thumb.s[1]);
1336 }
1337 
1338 static void
_torri(jit_state_t * _jit,int o,int rn,int rd,int im)1339 _torri(jit_state_t *_jit, int o, int rn, int rd, int im)
1340 {
1341     jit_thumb_t	thumb;
1342     assert(!(o  & 0x0c0f7fff));
1343     assert(!(im & 0xfbff8f00));
1344     thumb.i = o|(_u4(rn)<<16)|(_u4(rd)<<8)|im;
1345     iss(thumb.s[0], thumb.s[1]);
1346 }
1347 
1348 static void
_torri8(jit_state_t * _jit,int o,int rn,int rt,int im)1349 _torri8(jit_state_t *_jit, int o, int rn, int rt, int im)
1350 {
1351     jit_thumb_t	thumb;
1352     assert(!(o  & 0x000ff0ff));
1353     assert(!(im & 0xffffff00));
1354     thumb.i = o|(_u4(rn)<<16)|(_u4(rt)<<12)|im;
1355     iss(thumb.s[0], thumb.s[1]);
1356 }
1357 
1358 static void
_torri12(jit_state_t * _jit,int o,int rn,int rt,int im)1359 _torri12(jit_state_t *_jit, int o, int rn, int rt, int im)
1360 {
1361     jit_thumb_t	thumb;
1362     assert(!(o  & 0x000fffff));
1363     assert(!(im & 0xfffff000));
1364     thumb.i = o|(_u4(rn)<<16)|(_u4(rt)<<12)|im;
1365     iss(thumb.s[0], thumb.s[1]);
1366 }
1367 
1368 static void
_tshift(jit_state_t * _jit,int o,int rd,int rm,int im)1369 _tshift(jit_state_t *_jit, int o, int rd, int rm, int im)
1370 {
1371     jit_thumb_t	thumb;
1372     assert(!(o & 0x7fcf));
1373     assert(im >= 0 && im < 32);
1374     thumb.i = o|((im&0x1c)<<10)|(_u4(rd)<<8)|((im&3)<<6)|_u4(rm);
1375     iss(thumb.s[0], thumb.s[1]);
1376 }
1377 
1378 static void
_toriw(jit_state_t * _jit,int o,int rd,int im)1379 _toriw(jit_state_t *_jit, int o, int rd, int im)
1380 {
1381     jit_thumb_t	thumb;
1382     assert(!(im & 0xffff0000));
1383     thumb.i = o|((im&0xf000)<<4)|((im&0x800)<<15)|((im&0x700)<<4)|(_u4(rd)<<8)|(im&0xff);
1384     iss(thumb.s[0], thumb.s[1]);
1385 }
1386 
1387 static void
_tc8(jit_state_t * _jit,int cc,int im)1388 _tc8(jit_state_t *_jit, int cc, int im)
1389 {
1390     assert(!(cc & 0x0fffffff));
1391     assert(cc != ARM_CC_AL && cc != ARM_CC_NV);
1392     assert(im >= -128 && im <= 127);
1393     is(THUMB_CC_B|(cc>>20)|(im&0xff));
1394 }
1395 
1396 static void
_t11(jit_state_t * _jit,int im)1397 _t11(jit_state_t *_jit, int im)
1398 {
1399     assert(!(im & 0xfffff800));
1400     is(THUMB_B|im);
1401 }
1402 
1403 static void
_tcb(jit_state_t * _jit,int cc,int im)1404 _tcb(jit_state_t *_jit, int cc, int im)
1405 {
1406     jit_thumb_t	thumb;
1407     assert(!(cc & 0xfffffff));
1408     assert(cc != ARM_CC_AL && cc != ARM_CC_NV);
1409     cc = ((jit_uint32_t)cc) >> 6;
1410     assert(!(im & (THUMB2_CC_B|cc)));
1411     thumb.i = THUMB2_CC_B|cc|im;
1412     iss(thumb.s[0], thumb.s[1]);
1413 }
1414 
1415 static void
_blxi(jit_state_t * _jit,int im)1416 _blxi(jit_state_t *_jit, int im)
1417 {
1418     assert(!(im & 0xfe000000));
1419     ii(ARM_BLXI|im);
1420 }
1421 
1422 static void
_tb(jit_state_t * _jit,int o,int im)1423 _tb(jit_state_t *_jit, int o, int im)
1424 {
1425     jit_thumb_t	thumb;
1426     assert(!(o & 0x07ff2fff));
1427     assert(!(o & im));
1428     thumb.i = o|im;
1429     iss(thumb.s[0], thumb.s[1]);
1430 }
1431 
1432 static void
_corrrr(jit_state_t * _jit,int cc,int o,int rh,int rl,int rm,int rn)1433 _corrrr(jit_state_t *_jit, int cc, int o, int rh, int rl, int rm, int rn)
1434 {
1435     assert(!(cc & 0x0fffffff));
1436     assert(!(o & 0xf00fff0f));
1437     ii(cc|o|(_u4(rh)<<16)|(_u4(rl)<<12)|(_u4(rm)<<8)|_u4(rn));
1438 }
1439 
1440 static void
_corrrs(jit_state_t * _jit,int cc,int o,int rn,int rd,int rm,int im)1441 _corrrs(jit_state_t *_jit, int cc, int o, int rn, int rd, int rm, int im)
1442 {
1443     assert(!(cc & 0x0fffffff));
1444     assert(!(o  & 0xf000ff8f));
1445     ii(cc|o|(_u4(rd)<<12)|(_u4(rn)<<16)|(im<<7)|_u4(rm));
1446 }
1447 
1448 static void
_cshift(jit_state_t * _jit,int cc,int o,int rd,int rm,int rn,int im)1449 _cshift(jit_state_t *_jit, int cc, int o, int rd, int rm, int rn, int im)
1450 {
1451     assert(!(cc & 0x0fffffff));
1452     assert(!(o  & 0xffe0ff8f));
1453     assert(((_u4(rm)<<8)&(im<<7)) == 0);
1454     ii(cc|ARM_SHIFT|o|(_u4(rd)<<12)|(_u4(rm)<<8)|(im<<7)|_u4(rn));
1455 }
1456 
1457 static void
_cb(jit_state_t * _jit,int cc,int o,int im)1458 _cb(jit_state_t *_jit, int cc, int o, int im)
1459 {
1460     assert(!(cc & 0x0fffffff));
1461     assert(!(o  & 0xf0ffffff));
1462     ii(cc|o|_u24(im));
1463 }
1464 
1465 static void
_cbx(jit_state_t * _jit,int cc,int o,int rm)1466 _cbx(jit_state_t *_jit, int cc, int o, int rm)
1467 {
1468     assert(!(cc & 0x0fffffff));
1469     assert(!(o  & 0xf000000f));
1470     ii(cc|o|_u4(rm));
1471 }
1472 
1473 static void
_corl(jit_state_t * _jit,int cc,int o,int r0,int i0)1474 _corl(jit_state_t *_jit, int cc, int o, int r0, int i0)
1475 {
1476     assert(!(cc & 0x0fffffff));
1477     assert(!(o  & 0xf00fffff));
1478     ii(cc|o|(_u4(r0)<<16)|_u16(i0));
1479 }
1480 
1481 static void
_c6orr(jit_state_t * _jit,int cc,int o,int rd,int rm)1482 _c6orr(jit_state_t *_jit, int cc, int o, int rd, int rm)
1483 {
1484     assert(!(cc & 0x0fffffff));
1485     assert(!(o  & 0xf000f00f));
1486     ii(cc|o|(_u4(rd)<<12)|_u4(rm));
1487 }
1488 
1489 static void
_tpp(jit_state_t * _jit,int o,int im)1490 _tpp(jit_state_t *_jit, int o, int im)
1491 {
1492     jit_thumb_t	thumb;
1493     assert(!(o & 0x0000ffff));
1494     if (o == THUMB2_PUSH)
1495 	assert(!(im & 0x8000));
1496     assert(__builtin_popcount(im & 0x1fff) > 1);
1497     thumb.i = o|im;
1498     iss(thumb.s[0], thumb.s[1]);
1499 }
1500 
1501 static void
_torl(jit_state_t * _jit,int o,int rn,int im)1502 _torl(jit_state_t *_jit, int o, int rn, int im)
1503 {
1504     jit_thumb_t	thumb;
1505     assert(!(o & 0xf1fff));
1506     assert(rn != _R15 || !im || ((o & 0xc000) == 0xc000));
1507     assert(!(o & THUMB2_LDM_W) || !(im & (1 << rn)));
1508     thumb.i = o | (_u4(rn)<<16)|_u13(im);
1509     iss(thumb.s[0], thumb.s[1]);
1510 }
1511 
1512 static void
_nop(jit_state_t * _jit,jit_int32_t i0)1513 _nop(jit_state_t *_jit, jit_int32_t i0)
1514 {
1515     if (jit_thumb_p()) {
1516 	for (; i0 > 0; i0 -= 2)
1517 	    T1_NOP();
1518     }
1519     else {
1520 	for (; i0 > 0; i0 -= 4)
1521 	    NOP();
1522     }
1523     assert(i0 == 0);
1524 }
1525 
1526 static void
_movr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)1527 _movr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
1528 {
1529     if (r0 != r1) {
1530 	if (jit_thumb_p())
1531 	    T1_MOV(r0, r1);
1532 	else
1533 	    MOV(r0, r1);
1534     }
1535 }
1536 
1537 static void
_movi(jit_state_t * _jit,jit_int32_t r0,jit_word_t i0)1538 _movi(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
1539 {
1540     int			i;
1541     if (jit_thumb_p()) {
1542 	if (!jit_no_set_flags() && r0 < 8 && !(i0 & 0xffffff80))
1543 	    T1_MOVI(r0, i0);
1544 	else if ((i = encode_thumb_immediate(i0)) != -1)
1545 	    T2_MOVI(r0, i);
1546 	else if ((i = encode_thumb_immediate(~i0)) != -1)
1547 	    T2_MVNI(r0, i);
1548 	else {
1549 	    T2_MOVWI(r0, (jit_uint16_t)i0);
1550 	    if (i0 & 0xffff0000)
1551 		T2_MOVTI(r0, (jit_uint16_t)((unsigned)i0 >> 16));
1552 	}
1553     }
1554     else {
1555 	if (jit_armv6_p() && !(i0 & 0xffff0000))
1556 	    MOVWI(r0, i0);
1557 	else if ((i = encode_arm_immediate(i0)) != -1)
1558 	    MOVI(r0, i);
1559 	else if ((i = encode_arm_immediate(~i0)) != -1)
1560 	    MVNI(r0, i);
1561 	else if (jit_armv6_p()) {
1562 	    MOVWI(r0, (jit_uint16_t)(i0));
1563 	    if ((i0 & 0xffff0000))
1564 		MOVTI(r0, (jit_uint16_t)((unsigned)i0 >> 16));
1565 	}
1566 	else
1567 	    load_const(0, r0, i0);
1568     }
1569 }
1570 
1571 static jit_word_t
_movi_p(jit_state_t * _jit,jit_int32_t r0,jit_word_t i0)1572 _movi_p(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
1573 {
1574     jit_word_t		w;
1575     w = _jit->pc.w;
1576     if (jit_thumb_p()) {
1577 	T2_MOVWI(r0, (jit_uint16_t)(i0));
1578 	T2_MOVTI(r0, (jit_uint16_t)((unsigned)i0 >> 16));
1579     }
1580     else
1581 	load_const(1, r0, 0);
1582     return (w);
1583 }
1584 
1585 static void
_comr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)1586 _comr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
1587 {
1588     if (jit_thumb_p()) {
1589 	if (!jit_no_set_flags() && (r0|r1) < 8)
1590 	    T1_NOT(r0, r1);
1591 	else
1592 	    T2_NOT(r0, r1);
1593     }
1594     else
1595 	NOT(r0, r1);
1596 }
1597 
1598 static void
_negr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)1599 _negr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
1600 {
1601     if (jit_thumb_p()) {
1602 	if (!jit_no_set_flags() && (r0|r1) < 8)
1603 	    T1_RSBI(r0, r1);
1604 	else
1605 	    T2_RSBI(r0, r1, 0);
1606     }
1607     else
1608 	RSBI(r0, r1, 0);
1609 }
1610 
1611 static void
_addr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)1612 _addr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1613 {
1614     if (jit_thumb_p()) {
1615 	if (!jit_no_set_flags() && (r0|r1|r2) < 8)
1616 	    T1_ADD(r0, r1, r2);
1617 	else if (r0 == r1 || r0 == r2)
1618 	    T1_ADDX(r0, r0 == r1 ? r2 : r1);
1619 	else
1620 	    T2_ADD(r0, r1, r2);
1621     }
1622     else
1623 	ADD(r0, r1, r2);
1624 }
1625 
1626 static void
_addi(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)1627 _addi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1628 {
1629     int			i;
1630     jit_int32_t		reg;
1631     if (jit_thumb_p()) {
1632 	if (!jit_no_set_flags() && (r0|r1) < 8 && !(i0 & ~7))
1633 	    T1_ADDI3(r0, r1, i0);
1634 	else if (!jit_no_set_flags() && (r0|r1) < 8 && !(-i0 & ~7))
1635 	    T1_SUBI3(r0, r1, -i0);
1636 	else if (!jit_no_set_flags() && r0 < 8 && r0 == r1 && !(i0 & ~0xff))
1637 	    T1_ADDI8(r0, i0);
1638 	else if (!jit_no_set_flags() && r0 < 8 && r0 == r1 && !(-i0 & ~0xff))
1639 	    T1_SUBI8(r0, -i0);
1640 	else if ((i = encode_thumb_immediate(i0)) != -1)
1641 	    T2_ADDI(r0, r1, i);
1642 	else if ((i = encode_thumb_immediate(-i0)) != -1)
1643 	    T2_SUBI(r0, r1, i);
1644 	else if ((i = encode_thumb_word_immediate(i0)) != -1)
1645 	    T2_ADDWI(r0, r1, i);
1646 	else if ((i = encode_thumb_word_immediate(-i0)) != -1)
1647 	    T2_SUBWI(r0, r1, i);
1648 	else {
1649 	    reg = jit_get_reg(jit_class_gpr);
1650 	    movi(rn(reg), i0);
1651 	    T2_ADD(r0, r1, rn(reg));
1652 	    jit_unget_reg(reg);
1653 	}
1654     }
1655     else {
1656 	if ((i = encode_arm_immediate(i0)) != -1)
1657 	    ADDI(r0, r1, i);
1658 	else if ((i = encode_arm_immediate(-i0)) != -1)
1659 	    SUBI(r0, r1, i);
1660 	else if (r0 != r1) {
1661 	    movi(r0, i0);
1662 	    ADD(r0, r1, r0);
1663 	}
1664 	else {
1665 	    reg = jit_get_reg(jit_class_gpr);
1666 	    movi(rn(reg), i0);
1667 	    ADD(r0, r1, rn(reg));
1668 	    jit_unget_reg(reg);
1669 	}
1670     }
1671 }
1672 
1673 static void
_addcr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)1674 _addcr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1675 {
1676     if (jit_thumb_p()) {
1677 	/* thumb auto set carry if not inside IT block */
1678 	if ((r0|r1|r2) < 8)
1679 	    T1_ADD(r0, r1, r2);
1680 	else
1681 	    T2_ADDS(r0, r1, r2);
1682     }
1683     else
1684 	ADDS(r0, r1, r2);
1685 }
1686 
1687 static void
_addci(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)1688 _addci(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1689 {
1690     int			i;
1691     jit_int32_t		reg;
1692     if (jit_thumb_p()) {
1693 	if ((r0|r1) < 8 && !(i0 & ~7))
1694 	    T1_ADDI3(r0, r1, i0);
1695 	else if ((r0|r1) < 8 && !(-i0 & ~7))
1696 	    T1_SUBI3(r0, r1, -i0);
1697 	else if (r0 < 8 && r0 == r1 && !(i0 & ~0xff))
1698 	    T1_ADDI8(r0, i0);
1699 	else if (r0 < 8 && r0 == r1 && !(-i0 & ~0xff))
1700 	    T1_SUBI8(r0, -i0);
1701 	else if ((i = encode_thumb_immediate(i0)) != -1)
1702 	    T2_ADDSI(r0, r1, i);
1703 	else if ((i = encode_thumb_immediate(-i0)) != -1)
1704 	    T2_SUBSI(r0, r1, i);
1705 	else {
1706 	    reg = jit_get_reg(jit_class_gpr);
1707 	    movi(rn(reg), i0);
1708 	    T2_ADDS(r0, r1, rn(reg));
1709 	    jit_unget_reg(reg);
1710 	}
1711     }
1712     else {
1713 	if ((i = encode_arm_immediate(i0)) != -1)
1714 	    ADDSI(r0, r1, i);
1715 	else if ((i = encode_arm_immediate(-i0)) != -1)
1716 	    SUBSI(r0, r1, i);
1717 	else if (r0 != r1) {
1718 	    movi(r0, i0);
1719 	    ADDS(r0, r1, r0);
1720 	}
1721 	else {
1722 	    reg = jit_get_reg(jit_class_gpr);
1723 	    movi(rn(reg), i0);
1724 	    ADDS(r0, r1, rn(reg));
1725 	    jit_unget_reg(reg);
1726 	}
1727     }
1728 }
1729 
1730 static void
_addxr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)1731 _addxr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1732 {
1733     /* keep setting carry because don't know last ADC */
1734     if (jit_thumb_p()) {
1735 	/* thumb auto set carry if not inside IT block */
1736 	if ((r0|r1|r2) < 8 && (r0 == r1 || r0 == r2))
1737 	    T1_ADC(r0, r0 == r1 ? r2 : r1);
1738 	else
1739 	    T2_ADCS(r0, r1, r2);
1740     }
1741     else
1742 	ADCS(r0, r1, r2);
1743 }
1744 
1745 static void
_addxi(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)1746 _addxi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1747 {
1748     int			i;
1749     jit_int32_t		reg;
1750     int			no_set_flags;
1751     if (jit_thumb_p()) {
1752 	no_set_flags = jit_no_set_flags();
1753 	jit_no_set_flags() = 1;
1754 	if ((i = encode_thumb_immediate(i0)) != -1)
1755 	    T2_ADCSI(r0, r1, i);
1756 	else if ((i = encode_thumb_immediate(-i0)) != -1)
1757 	    T2_SBCSI(r0, r1, i);
1758 	else if (r0 != r1) {
1759 	    movi(r0, i0);
1760 	    T2_ADCS(r0, r1, r0);
1761 	}
1762 	else {
1763 	    reg = jit_get_reg(jit_class_gpr);
1764 	    movi(rn(reg), i0);
1765 	    T2_ADCS(r0, r1, rn(reg));
1766 	    jit_unget_reg(reg);
1767 	}
1768 	jit_no_set_flags() = no_set_flags;
1769     }
1770     else {
1771 	if ((i = encode_arm_immediate(i0)) != -1)
1772 	    ADCSI(r0, r1, i);
1773 	else if ((i = encode_arm_immediate(-i0)) != -1)
1774 	    SBCSI(r0, r1, i);
1775 	else if (r0 != r1) {
1776 	    movi(r0, i0);
1777 	    ADCS(r0, r1, r0);
1778 	}
1779 	else {
1780 	    reg = jit_get_reg(jit_class_gpr);
1781 	    movi(rn(reg), i0);
1782 	    ADCS(r0, r1, rn(reg));
1783 	    jit_unget_reg(reg);
1784 	}
1785     }
1786 }
1787 
1788 static void
_subr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)1789 _subr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1790 {
1791     if (jit_thumb_p()) {
1792 	if (!jit_no_set_flags() && (r0|r1|r2) < 8)
1793 	    T1_SUB(r0, r1, r2);
1794 	else
1795 	    T2_SUB(r0, r1, r2);
1796     }
1797     else
1798 	SUB(r0, r1, r2);
1799 }
1800 
1801 static void
_subi(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)1802 _subi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1803 {
1804     int			i;
1805     jit_int32_t		reg;
1806     if (jit_thumb_p()) {
1807 	if (!jit_no_set_flags() && (r0|r1) < 8 && !(i0 & ~7))
1808 	    T1_SUBI3(r0, r1, i0);
1809 	else if (!jit_no_set_flags() && (r0|r1) < 8 && !(-i0 & ~7))
1810 	    T1_ADDI3(r0, r1, -i0);
1811 	else if (!jit_no_set_flags() && r0 < 8 && r0 == r1 && !(i0 & ~0xff))
1812 	    T1_SUBI8(r0, i0);
1813 	else if (!jit_no_set_flags() && r0 < 8 && r0 == r1 && !(-i0 & ~0xff))
1814 	    T1_ADDI8(r0, -i0);
1815 	else if ((i = encode_thumb_immediate(i0)) != -1)
1816 	    T2_SUBI(r0, r1, i);
1817 	else if ((i = encode_thumb_immediate(-i0)) != -1)
1818 	    T2_ADDI(r0, r1, i);
1819 	else if ((i = encode_thumb_word_immediate(i0)) != -1)
1820 	    T2_SUBWI(r0, r1, i);
1821 	else if ((i = encode_thumb_word_immediate(-i0)) != -1)
1822 	    T2_ADDWI(r0, r1, i);
1823 	else {
1824 	    reg = jit_get_reg(jit_class_gpr);
1825 	    movi(rn(reg), i0);
1826 	    T2_SUB(r0, r1, rn(reg));
1827 	    jit_unget_reg(reg);
1828 	}
1829     }
1830     else {
1831 	if ((i = encode_arm_immediate(i0)) != -1)
1832 	    SUBI(r0, r1, i);
1833 	else if ((i = encode_arm_immediate(-i0)) != -1)
1834 	    ADDI(r0, r1, i);
1835 	else if (r0 != r1) {
1836 	    movi(r0, i0);
1837 	    SUB(r0, r1, r0);
1838 	}
1839 	else {
1840 	    reg = jit_get_reg(jit_class_gpr);
1841 	    movi(rn(reg), i0);
1842 	    SUB(r0, r1, rn(reg));
1843 	    jit_unget_reg(reg);
1844 	}
1845     }
1846 }
1847 
1848 static void
_subcr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)1849 _subcr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1850 {
1851     if (jit_thumb_p()) {
1852 	/* thumb auto set carry if not inside IT block */
1853 	if ((r0|r1|r2) < 8)
1854 	    T1_SUB(r0, r1, r2);
1855 	else
1856 	    T2_SUBS(r0, r1, r2);
1857     }
1858     else
1859 	SUBS(r0, r1, r2);
1860 }
1861 
1862 static void
_subci(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)1863 _subci(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1864 {
1865     int			i;
1866     jit_int32_t		reg;
1867     if (jit_thumb_p()) {
1868 	if ((r0|r1) < 8 && !(i0 & ~7))
1869 	    T1_SUBI3(r0, r1, i0);
1870 	else if ((r0|r1) < 8 && !(-i0 & ~7))
1871 	    T1_ADDI3(r0, r1, -i0);
1872 	else if (r0 < 8 && r0 == r1 && !(i0 & ~0xff))
1873 	    T1_SUBI8(r0, i0);
1874 	else if (r0 < 8 && r0 == r1 && !(-i0 & ~0xff))
1875 	    T1_ADDI8(r0, -i0);
1876 	else if ((i = encode_thumb_immediate(i0)) != -1)
1877 	    T2_SUBSI(r0, r1, i);
1878 	else if ((i = encode_thumb_immediate(-i0)) != -1)
1879 	    T2_ADDSI(r0, r1, i);
1880 	else {
1881 	    reg = jit_get_reg(jit_class_gpr);
1882 	    movi(rn(reg), i0);
1883 	    T2_SUBS(r0, r1, rn(reg));
1884 	    jit_unget_reg(reg);
1885 	}
1886     }
1887     else {
1888 	if ((i = encode_arm_immediate(i0)) != -1)
1889 	    SUBSI(r0, r1, i);
1890 	else if ((i = encode_arm_immediate(-i0)) != -1)
1891 	    ADDSI(r0, r1, i);
1892 	else if (r0 != r1) {
1893 	    movi(r0, i0);
1894 	    SUBS(r0, r1, r0);
1895 	}
1896 	else {
1897 	    reg = jit_get_reg(jit_class_gpr);
1898 	    movi(rn(reg), i0);
1899 	    SUBS(r0, r1, rn(reg));
1900 	    jit_unget_reg(reg);
1901 	}
1902     }
1903 }
1904 
1905 static void
_subxr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)1906 _subxr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1907 {
1908     /* keep setting carry because don't know last SBC */
1909     if (jit_thumb_p()) {
1910 	/* thumb auto set carry if not inside IT block */
1911 	if ((r0|r1|r2) < 8 && r0 == r1)
1912 	    T1_SBC(r0, r2);
1913 	else
1914 	    T2_SBCS(r0, r1, r2);
1915     }
1916     else
1917 	SBCS(r0, r1, r2);
1918 }
1919 
1920 static void
_subxi(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)1921 _subxi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1922 {
1923     int			i;
1924     jit_int32_t		reg;
1925     int			no_set_flags;
1926     if (jit_thumb_p()) {
1927 	no_set_flags = jit_no_set_flags();
1928 	jit_no_set_flags() = 1;
1929 	if ((i = encode_arm_immediate(i0)) != -1)
1930 	    T2_SBCSI(r0, r1, i);
1931 	else if ((i = encode_arm_immediate(-i0)) != -1)
1932 	    T2_ADCSI(r0, r1, i);
1933 	else if (r0 != r1) {
1934 	    movi(r0, i0);
1935 	    T2_SBCS(r0, r1, r0);
1936 	}
1937 	else {
1938 	    reg = jit_get_reg(jit_class_gpr);
1939 	    movi(rn(reg), i0);
1940 	    SBCS(r0, r1, rn(reg));
1941 	    jit_unget_reg(reg);
1942 	}
1943 	jit_no_set_flags() = no_set_flags;
1944     }
1945     else {
1946 	if ((i = encode_arm_immediate(i0)) != -1)
1947 	    SBCSI(r0, r1, i);
1948 	else if ((i = encode_arm_immediate(-i0)) != -1)
1949 	    ADCSI(r0, r1, i);
1950 	else if (r0 != r1) {
1951 	    movi(r0, i0);
1952 	    SBCS(r0, r1, r0);
1953 	}
1954 	else {
1955 	    reg = jit_get_reg(jit_class_gpr);
1956 	    movi(rn(reg), i0);
1957 	    SBCS(r0, r1, rn(reg));
1958 	    jit_unget_reg(reg);
1959 	}
1960     }
1961 }
1962 
/*
 * Reverse subtract with a constant: r0 <- i0 - r1, generated as a
 * subi() of i0 from r1 followed by a negr() of the result in place.
 */
static void
_rsbi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
{
    subi(r0, r1, i0);
    negr(r0, r0);
}
1969 
1970 static void
_mulr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)1971 _mulr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1972 {
1973     jit_int32_t		reg;
1974     if (jit_thumb_p()) {
1975 	if (!jit_no_set_flags() && r0 == r2 && (r0|r1) < 8)
1976 	    T1_MUL(r0, r1);
1977 	else if (!jit_no_set_flags() && r0 == r1 && (r0|r2) < 8)
1978 	    T1_MUL(r0, r2);
1979 	else
1980 	    T2_MUL(r0, r1, r2);
1981     }
1982     else {
1983 	if (r0 == r1 && !jit_armv6_p()) {
1984 	    if (r0 != r2)
1985 		MUL(r0, r2, r1);
1986 	    else {
1987 		reg = jit_get_reg(jit_class_gpr);
1988 		MOV(rn(reg), r1);
1989 		MUL(r0, rn(reg), r2);
1990 		jit_unget_reg(reg);
1991 	    }
1992 	}
1993 	else
1994 	    MUL(r0, r1, r2);
1995     }
1996 }
1997 
1998 static void
_muli(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)1999 _muli(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2000 {
2001     jit_int32_t		reg;
2002     reg = jit_get_reg(jit_class_gpr);
2003     movi(rn(reg), i0);
2004     mulr(r0, r1, rn(reg));
2005     jit_unget_reg(reg);
2006 }
2007 
2008 static void
_iqmulr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2,jit_int32_t r3,jit_bool_t sign)2009 _iqmulr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1,
2010 	jit_int32_t r2, jit_int32_t r3, jit_bool_t sign)
2011 {
2012     jit_int32_t		reg;
2013     if (jit_thumb_p()) {
2014 	if (r2 == r3) {
2015 	    reg = jit_get_reg(jit_class_gpr);
2016 	    movr(rn(reg), r2);
2017 	    if (sign)
2018 		T2_SMULL(r0, r1, rn(reg), r2);
2019 	    else
2020 		T2_UMULL(r0, r1, rn(reg), r2);
2021 	    jit_unget_reg(reg);
2022 	}
2023 	else if (r0 != r2 && r1 != r2) {
2024 	    if (sign)
2025 		T2_SMULL(r0, r1, r2, r3);
2026 	    else
2027 		T2_UMULL(r0, r1, r2, r3);
2028 	}
2029 	else {
2030 	    if (sign)
2031 		T2_SMULL(r0, r1, r3, r2);
2032 	    else
2033 		T2_UMULL(r0, r1, r3, r2);
2034 	}
2035     }
2036     else {
2037 	if (r2 == r3) {
2038 	    reg = jit_get_reg(jit_class_gpr);
2039 	    movr(rn(reg), r2);
2040 	    if (sign)
2041 		SMULL(r0, r1, rn(reg), r2);
2042 	    else
2043 		UMULL(r0, r1, rn(reg), r2);
2044 	    jit_unget_reg(reg);
2045 	}
2046 	else if (r0 != r2 && r1 != r2) {
2047 	    if (sign)
2048 		SMULL(r0, r1, r2, r3);
2049 	    else
2050 		UMULL(r0, r1, r2, r3);
2051 	}
2052 	else {
2053 	    if (sign)
2054 		SMULL(r0, r1, r3, r2);
2055 	    else
2056 		UMULL(r0, r1, r3, r2);
2057 	}
2058     }
2059 }
2060 
2061 static void
_iqmuli(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2,jit_word_t i0,jit_bool_t sign)2062 _iqmuli(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1,
2063 	jit_int32_t r2, jit_word_t i0, jit_bool_t sign)
2064 {
2065     jit_int32_t		reg;
2066     reg = jit_get_reg(jit_class_gpr);
2067     movi(rn(reg), i0);
2068     iqmulr(r0, r1, r2, rn(reg), sign);
2069     jit_unget_reg(reg);
2070 }
2071 
2072 static void
_divrem(jit_state_t * _jit,int div,int sign,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)2073 _divrem(jit_state_t *_jit, int div, int sign,
2074 	jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2075 {
2076     jit_word_t		d;
2077     jit_word_t		w;
2078     jit_get_reg_args();
2079     movr(_R0_REGNO, r1);
2080     movr(_R1_REGNO, r2);
2081     if (sign)			w = (jit_word_t)__aeabi_idivmod;
2082     else			w = (jit_word_t)__aeabi_uidivmod;
2083     if (!jit_exchange_p()) {
2084 	if (jit_thumb_p())	d = ((w - _jit->pc.w) >> 1) - 2;
2085 	else			d = ((w - _jit->pc.w) >> 2) - 2;
2086 	if (_s24P(d)) {
2087 	    if (jit_thumb_p())	T2_BLI(encode_thumb_jump(d));
2088 	    else		BLI(d & 0x00ffffff);
2089 	}
2090 	else			goto fallback;
2091     }
2092     else {
2093     fallback:
2094 	movi(_R2_REGNO, w);
2095 	if (jit_thumb_p())	T1_BLX(_R2_REGNO);
2096 	else			BLX(_R2_REGNO);
2097     }
2098     if (div)			movr(r0, _R0_REGNO);
2099     else			movr(r0, _R1_REGNO);
2100     jit_unget_reg_args();
2101 }
2102 
2103 static void
_divr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)2104 _divr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2105 {
2106     if (jit_armv7r_p() && jit_thumb_p())
2107 	T2_SDIV(r0, r1, r2);
2108     else
2109 	divrem(1, 1, r0, r1, r2);
2110 }
2111 
2112 static void
_divi(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)2113 _divi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2114 {
2115     jit_int32_t		reg;
2116     reg = jit_get_reg(jit_class_gpr);
2117     movi(rn(reg), i0);
2118     divr(r0, r1, rn(reg));
2119     jit_unget_reg(reg);
2120 }
2121 
2122 static void
_divr_u(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)2123 _divr_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2124 {
2125     if (jit_armv7r_p() && jit_thumb_p())
2126 	T2_UDIV(r0, r1, r2);
2127     else
2128 	divrem(1, 0, r0, r1, r2);
2129 }
2130 
2131 static void
_divi_u(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)2132 _divi_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2133 {
2134     jit_int32_t		reg;
2135     reg = jit_get_reg(jit_class_gpr);
2136     movi(rn(reg), i0);
2137     divr_u(r0, r1, rn(reg));
2138     jit_unget_reg(reg);
2139 }
2140 
2141 static void
_iqdivr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2,jit_int32_t r3,jit_bool_t sign)2142 _iqdivr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1,
2143 	jit_int32_t r2, jit_int32_t r3,	jit_bool_t sign)
2144 {
2145     jit_word_t		d;
2146     jit_word_t		w;
2147     jit_get_reg_args();
2148     movr(_R0_REGNO, r2);
2149     movr(_R1_REGNO, r3);
2150     if (sign)			w = (jit_word_t)__aeabi_idivmod;
2151     else			w = (jit_word_t)__aeabi_uidivmod;
2152     if (!jit_exchange_p()) {
2153 	if (jit_thumb_p())	d = ((w - _jit->pc.w) >> 1) - 2;
2154 	else			d = ((w - _jit->pc.w) >> 2) - 2;
2155 	if (_s24P(d)) {
2156 	    if (jit_thumb_p())	T2_BLI(encode_thumb_jump(d));
2157 	    else		BLI(d & 0x00ffffff);
2158 	}
2159 	else			goto fallback;
2160     }
2161     else {
2162     fallback:
2163 	movi(_R2_REGNO, w);
2164 	if (jit_thumb_p())	T1_BLX(_R2_REGNO);
2165 	else			BLX(_R2_REGNO);
2166     }
2167     movr(r0, _R0_REGNO);
2168     movr(r1, _R1_REGNO);
2169     jit_unget_reg_args();
2170 }
2171 
2172 static void
_iqdivi(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2,jit_word_t i0,jit_bool_t sign)2173 _iqdivi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1,
2174 	jit_int32_t r2, jit_word_t i0, jit_bool_t sign)
2175 {
2176     jit_int32_t		reg;
2177     reg = jit_get_reg(jit_class_gpr);
2178     movi(rn(reg), i0);
2179     iqdivr(r0, r1, r2, rn(reg), sign);
2180     jit_unget_reg(reg);
2181 }
2182 
/*
 * Signed remainder of r1 by r2 into r0: delegates to divrem() with
 * div = 0 (take the R1 result) and sign = 1.
 */
static void
_remr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
{
    divrem(0, 1, r0, r1, r2);
}
2188 
2189 static void
_remi(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)2190 _remi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2191 {
2192     jit_int32_t		reg;
2193     reg = jit_get_reg(jit_class_gpr);
2194     movi(rn(reg), i0);
2195     remr(r0, r1, rn(reg));
2196     jit_unget_reg(reg);
2197 }
2198 
/*
 * Unsigned remainder of r1 by r2 into r0: delegates to divrem() with
 * div = 0 (take the R1 result) and sign = 0.
 */
static void
_remr_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
{
    divrem(0, 0, r0, r1, r2);
}
2204 
2205 static void
_remi_u(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)2206 _remi_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2207 {
2208     jit_int32_t		reg;
2209     reg = jit_get_reg(jit_class_gpr);
2210     movi(rn(reg), i0);
2211     remr_u(r0, r1,rn(reg));
2212     jit_unget_reg(reg);
2213 }
2214 
2215 static void
_andr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)2216 _andr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2217 {
2218     if (jit_thumb_p()) {
2219 	if (!jit_no_set_flags() && (r0|r1|r2) < 8 && (r0 == r1 || r0 == r2))
2220 	    T1_AND(r0, r0 == r1 ? r2 : r1);
2221 	else
2222 	    T2_AND(r0, r1, r2);
2223     }
2224     else
2225 	AND(r0, r1, r2);
2226 }
2227 
2228 static void
_andi(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)2229 _andi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2230 {
2231     int			i;
2232     jit_int32_t		reg;
2233     if (jit_thumb_p()) {
2234 	if ((i = encode_thumb_immediate(i0)) != -1)
2235 	    T2_ANDI(r0, r1, i);
2236 	else if ((i = encode_thumb_immediate(~i0)) != -1)
2237 	    T2_BICI(r0, r1, i);
2238 	else if (r0 != r1) {
2239 	    movi(r0, i0);
2240 	    T2_AND(r0, r1, r0);
2241 	}
2242 	else {
2243 	    reg = jit_get_reg(jit_class_gpr);
2244 	    movi(rn(reg), i0);
2245 	    T2_AND(r0, r1, rn(reg));
2246 	    jit_unget_reg(reg);
2247 	}
2248     }
2249     else {
2250 	if ((i = encode_arm_immediate(i0)) != -1)
2251 	    ANDI(r0, r1, i);
2252 	else if ((i = encode_arm_immediate(~i0)) != -1)
2253 	    BICI(r0, r1, i);
2254 	else if (r0 != r1) {
2255 	    movi(r0, i0);
2256 	    AND(r0, r1, r0);
2257 	}
2258 	else {
2259 	    reg = jit_get_reg(jit_class_gpr);
2260 	    movi(rn(reg), i0);
2261 	    AND(r0, r1, rn(reg));
2262 	    jit_unget_reg(reg);
2263 	}
2264     }
2265 }
2266 
2267 static void
_orr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)2268 _orr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2269 {
2270     if (jit_thumb_p()) {
2271 	if (!jit_no_set_flags() && (r0|r1|r2) < 8 && (r0 == r1 || r0 == r2))
2272 	    T1_ORR(r0, r0 == r1 ? r2 : r1);
2273 	else
2274 	    T2_ORR(r0, r1, r2);
2275     }
2276     else
2277 	ORR(r0, r1, r2);
2278 }
2279 
2280 static void
_ori(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)2281 _ori(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2282 {
2283     int			i;
2284     jit_int32_t		reg;
2285     if (jit_thumb_p()) {
2286 	if ((i = encode_thumb_immediate(i0)) != -1)
2287 	    T2_ORRI(r0, r1, i);
2288 	else if (r0 != r1) {
2289 	    movi(r0, i0);
2290 	    T2_ORR(r0, r1, r0);
2291 	}
2292 	else {
2293 	    reg = jit_get_reg(jit_class_gpr);
2294 	    movi(rn(reg), i0);
2295 	    T2_ORR(r0, r1, rn(reg));
2296 	    jit_unget_reg(reg);
2297 	}
2298     }
2299     else {
2300 	if ((i = encode_arm_immediate(i0)) != -1)
2301 	    ORRI(r0, r1, i);
2302 	else if (r0 != r1) {
2303 	    movi(r0, i0);
2304 	    ORR(r0, r1, r0);
2305 	}
2306 	else {
2307 	    reg = jit_get_reg(jit_class_gpr);
2308 	    movi(rn(reg), i0);
2309 	    ORR(r0, r1, rn(reg));
2310 	    jit_unget_reg(reg);
2311 	}
2312     }
2313 }
2314 
2315 static void
_xorr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)2316 _xorr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2317 {
2318     if (jit_thumb_p()) {
2319 	if (!jit_no_set_flags() && (r0|r1|r2) < 8 && (r0 == r1 || r0 == r2))
2320 	    T1_EOR(r0, r0 == r1 ? r2 : r1);
2321 	else
2322 	    T2_EOR(r0, r1, r2);
2323     }
2324     else
2325 	EOR(r0, r1, r2);
2326 }
2327 
2328 static void
_xori(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)2329 _xori(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2330 {
2331     int			i;
2332     jit_int32_t		reg;
2333     if (jit_thumb_p()) {
2334 	if ((i = encode_thumb_immediate(i0)) != -1)
2335 	    T2_EORI(r0, r1, i);
2336 	else if (r0 != r1) {
2337 	    movi(r0, i0);
2338 	    T2_EOR(r0, r1, r0);
2339 	}
2340 	else {
2341 	    reg = jit_get_reg(jit_class_gpr);
2342 	    movi(rn(reg), i0);
2343 	    T2_EOR(r0, r1, rn(reg));
2344 	    jit_unget_reg(reg);
2345 	}
2346     }
2347     else {
2348 	if ((i = encode_arm_immediate(i0)) != -1)
2349 	    EORI(r0, r1, i);
2350 	else if (r0 != r1) {
2351 	    movi(r0, i0);
2352 	    EOR(r0, r1, r0);
2353 	}
2354 	else {
2355 	    reg = jit_get_reg(jit_class_gpr);
2356 	    movi(rn(reg), i0);
2357 	    EOR(r0, r1, rn(reg));
2358 	    jit_unget_reg(reg);
2359 	}
2360     }
2361 }
2362 
2363 static void
_lshr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)2364 _lshr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2365 {
2366     if (jit_thumb_p()) {
2367 	if (!jit_no_set_flags() && (r0|r1|r2) < 8 && r0 == r1)
2368 	    T1_LSL(r0, r2);
2369 	else
2370 	    T2_LSL(r0, r1, r2);
2371     }
2372     else
2373 	LSL(r0, r1, r2);
2374 }
2375 
2376 static void
_lshi(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)2377 _lshi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2378 {
2379     assert(i0 >= 0 && i0 <= 31);
2380     if (i0 == 0)
2381 	movr(r0, r1);
2382     else if (jit_thumb_p()) {
2383 	if (!jit_no_set_flags() && (r0|r1) < 8)
2384 	    T1_LSLI(r0, r1, i0);
2385 	else
2386 	    T2_LSLI(r0, r1, i0);
2387     }
2388     else
2389 	LSLI(r0, r1, i0);
2390 }
2391 
2392 static void
_rshr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)2393 _rshr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2394 {
2395     if (jit_thumb_p()) {
2396 	if (!jit_no_set_flags() && (r0|r1|r2) < 8 && r0 == r1)
2397 	    T1_ASR(r0, r2);
2398 	else
2399 	    T2_ASR(r0, r1, r2);
2400     }
2401     else
2402 	ASR(r0, r1, r2);
2403 }
2404 
2405 static void
_rshi(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)2406 _rshi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2407 {
2408     assert(i0 >= 0 && i0 <= 31);
2409     if (i0 == 0)
2410 	movr(r0, r1);
2411     else if (jit_thumb_p()) {
2412 	if (!jit_no_set_flags() && (r0|r1) < 8)
2413 	    T1_ASRI(r0, r1, i0);
2414 	else
2415 	    T2_ASRI(r0, r1, i0);
2416     }
2417     else
2418 	ASRI(r0, r1, i0);
2419 }
2420 
2421 static void
_rshr_u(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)2422 _rshr_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2423 {
2424     if (jit_thumb_p()) {
2425 	if (!jit_no_set_flags() && (r0|r1|r2) < 8 && r0 == r1)
2426 	    T1_LSR(r0, r2);
2427 	else
2428 	    T2_LSR(r0, r1, r2);
2429     }
2430     else
2431 	LSR(r0, r1, r2);
2432 }
2433 
2434 static void
_rshi_u(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)2435 _rshi_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2436 {
2437     assert(i0 >= 0 && i0 <= 31);
2438     if (i0 == 0)
2439 	movr(r0, r1);
2440     else if (jit_thumb_p()) {
2441 	if (!jit_no_set_flags() && (r0|r1) < 8)
2442 	    T1_LSRI(r0, r1, i0);
2443 	else
2444 	    T2_LSRI(r0, r1, i0);
2445     }
2446     else
2447 	LSRI(r0, r1, i0);
2448 }
2449 
2450 static void
_ccr(jit_state_t * _jit,int ct,int cf,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)2451 _ccr(jit_state_t *_jit, int ct, int cf,
2452      jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2453 {
2454     if (jit_thumb_p()) {
2455 	assert((ct ^ cf) >> 28 == 1);
2456 	if ((r1|r2) < 8)
2457 	    T1_CMP(r1, r2);
2458 	else if ((r1&r2) & 8)
2459 	    T1_CMPX(r1, r2);
2460 	else
2461 	    T2_CMP(r1, r2);
2462 	ITE(ct);
2463 	if (r0 < 8) {
2464 	    T1_MOVI(r0, 1);
2465 	    T1_MOVI(r0, 0);
2466 	}
2467 	else {
2468 	    T2_MOVI(r0, 1);
2469 	    T2_MOVI(r0, 0);
2470 	}
2471     }
2472     else {
2473 	CMP(r1, r2);
2474 	CC_MOVI(ct, r0, 1);
2475 	CC_MOVI(cf, r0, 0);
2476     }
2477 }
2478 
2479 static void
_cci(jit_state_t * _jit,int ct,int cf,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)2480 _cci(jit_state_t *_jit, int ct, int cf,
2481      jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2482 {
2483     int			i;
2484     jit_int32_t		reg;
2485     if (jit_thumb_p()) {
2486 	if (r1 < 7 && !(i0 & 0xffffff00))
2487 	    T1_CMPI(r1, i0);
2488 	else if ((i = encode_thumb_immediate(i0)) != -1)
2489 	    T2_CMPI(r1, i);
2490 	else if ((i = encode_thumb_immediate(-i0)) != -1)
2491 	    T2_CMNI(r1, i);
2492 	else {
2493 	    reg = jit_get_reg(jit_class_gpr);
2494 	    movi(rn(reg), i0);
2495 	    ccr(ct, cf, r0, r1, rn(reg));
2496 	    jit_unget_reg(reg);
2497 	    return;
2498 	}
2499 	ITE(ct);
2500 	if (r0 < 8) {
2501 	    T1_MOVI(r0, 1);
2502 	    T1_MOVI(r0, 0);
2503 	}
2504 	else {
2505 	    T2_MOVI(r0, 1);
2506 	    T2_MOVI(r0, 0);
2507 	}
2508     }
2509     else {
2510 	if ((i = encode_arm_immediate(i0)) != -1)
2511 	    CMPI(r1, i);
2512 	else if ((i = encode_arm_immediate(-i0)) != -1)
2513 	    CMNI(r1, i);
2514 	else if (r0 != r1) {
2515 	    movi(r0, i0);
2516 	    CMP(r1, r0);
2517 	}
2518 	else {
2519 	    reg = jit_get_reg(jit_class_gpr);
2520 	    movi(rn(reg), i0);
2521 	    CMP(r1, rn(reg));
2522 	    jit_unget_reg(reg);
2523 	}
2524 	CC_MOVI(ct, r0, 1);
2525 	CC_MOVI(cf, r0, 0);
2526     }
2527 }
2528 
2529 static void
_ner(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)2530 _ner(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2531 {
2532     if (jit_thumb_p())
2533 	ccr(ARM_CC_NE, ARM_CC_EQ, r0, r1, r2);
2534     else {
2535 	SUBS(r0, r1, r2);
2536 	CC_MOVI(ARM_CC_NE, r0, 1);
2537     }
2538 }
2539 
2540 static void
_nei(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)2541 _nei(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2542 {
2543     int			i;
2544     jit_int32_t		reg;
2545     if (jit_thumb_p())
2546 	cci(ARM_CC_NE, ARM_CC_EQ, r0, r1, i0);
2547     else {
2548 	if ((i = encode_arm_immediate(i0)) != -1)
2549 	    SUBSI(r0, r1, i);
2550 	else if ((i = encode_arm_immediate(-i0)) != -1)
2551 	    ADDSI(r0, r1, i);
2552 	else if (r0 != r1) {
2553 	    movi(r0, i0);
2554 	    SUBS(r0, r1, r0);
2555 	}
2556 	else {
2557 	    reg = jit_get_reg(jit_class_gpr);
2558 	    movi(rn(reg), i0);
2559 	    SUBS(r0, r1, rn(reg));
2560 	    jit_unget_reg(reg);
2561 	}
2562 	CC_MOVI(ARM_CC_NE, r0, 1);
2563     }
2564 }
2565 
2566 static void
_jmpr(jit_state_t * _jit,jit_int32_t r0)2567 _jmpr(jit_state_t *_jit, jit_int32_t r0)
2568 {
2569     if (jit_thumb_p())
2570 	T1_MOV(_R15_REGNO, r0);
2571     else
2572 	MOV(_R15_REGNO, r0);
2573 }
2574 
2575 static void
_jmpi(jit_state_t * _jit,jit_word_t i0)2576 _jmpi(jit_state_t *_jit, jit_word_t i0)
2577 {
2578     jit_word_t		w;
2579     jit_word_t		d;
2580     jit_int32_t		reg;
2581     w = _jit->pc.w;
2582     /* if thumb and in thumb mode */
2583     if (jit_thumb_p() && _jitc->thumb) {
2584 	d = ((i0 - w) >> 1) - 2;
2585 	if (d >= -1024 && d <= 1023)
2586 	    T1_B(d & 0x7ff);
2587 	else if (_s24P(d))
2588 	    T2_B(encode_thumb_jump(d));
2589 	else {
2590 	    reg = jit_get_reg(jit_class_gpr|jit_class_nospill);
2591 	    movi(rn(reg), i0);
2592 	    jmpr(rn(reg));
2593 	    jit_unget_reg(reg);
2594 	}
2595     }
2596     else {
2597 	d = ((i0 - w) >> 2) - 2;
2598 	if (_s24P(d))
2599 	    B(d & 0x00ffffff);
2600 	else {
2601 	    reg = jit_get_reg(jit_class_gpr|jit_class_nospill);
2602 	    movi(rn(reg), i0);
2603 	    jmpr(rn(reg));
2604 	    jit_unget_reg(reg);
2605 	}
2606     }
2607 }
2608 
2609 static jit_word_t
_jmpi_p(jit_state_t * _jit,jit_word_t i0,jit_bool_t i1)2610 _jmpi_p(jit_state_t *_jit, jit_word_t i0, jit_bool_t i1)
2611 {
2612     jit_word_t		w;
2613     jit_word_t		d;
2614     jit_int32_t		reg;
2615     if (i1) {
2616 	/* Assume jump is not longer than 23 bits if inside jit */
2617 	w = _jit->pc.w;
2618 	/* if thumb and in thumb mode */
2619 	if (jit_thumb_p() && _jitc->thumb) {
2620 	    d = ((i0 - w) >> 1) - 2;
2621 	    assert(_s24P(d));
2622 	    T2_B(encode_thumb_jump(d));
2623 	}
2624 	else {
2625 	    d = ((i0 - w) >> 2) - 2;
2626 	    assert(_s24P(d));
2627 	    B(d & 0x00ffffff);
2628 	}
2629     }
2630     else {
2631 	reg = jit_get_reg(jit_class_gpr|jit_class_nospill);
2632 	w = movi_p(rn(reg), i0);
2633 	jmpr(rn(reg));
2634 	jit_unget_reg(reg);
2635     }
2636     return (w);
2637 }
2638 
2639 static jit_word_t
_bccr(jit_state_t * _jit,int cc,jit_word_t i0,jit_int32_t r0,jit_int32_t r1)2640 _bccr(jit_state_t *_jit, int cc, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
2641 {
2642     jit_word_t		w;
2643     jit_word_t		d;
2644     if (jit_thumb_p()) {
2645 	if ((r0|r1) < 8)
2646 	    T1_CMP(r0, r1);
2647 	else if ((r0&r1) & 8)
2648 	    T1_CMPX(r0, r1);
2649 	else
2650 	    T2_CMP(r0, r1);
2651 	/* use only thumb2 conditional as does not know if will be patched */
2652 	w = _jit->pc.w;
2653 	d = ((i0 - w) >> 1) - 2;
2654 	assert(_s20P(d));
2655 	T2_CC_B(cc, encode_thumb_cc_jump(d));
2656     }
2657     else {
2658 	CMP(r0, r1);
2659 	w = _jit->pc.w;
2660 	d = ((i0 - w) >> 2) - 2;
2661 	assert(_s24P(d));
2662 	CC_B(cc, d & 0x00ffffff);
2663     }
2664     return (w);
2665 }
2666 
2667 static jit_word_t
_bcci(jit_state_t * _jit,int cc,jit_word_t i0,jit_int32_t r0,jit_word_t i1)2668 _bcci(jit_state_t *_jit, int cc, jit_word_t i0, jit_int32_t r0, jit_word_t i1)
2669 {
2670     jit_word_t		w;
2671     jit_word_t		d;
2672     int			i;
2673     jit_int32_t		reg;
2674     if (jit_thumb_p()) {
2675 	if (r0 < 7 && !(i1 & 0xffffff00))
2676 	    T1_CMPI(r0, i1);
2677 	else if ((i = encode_thumb_immediate(i1)) != -1)
2678 	    T2_CMPI(r0, i);
2679 	else if ((i = encode_thumb_immediate(-i1)) != -1)
2680 	    T2_CMNI(r0, i);
2681 	else {
2682 	    reg = jit_get_reg(jit_class_gpr);
2683 	    movi(rn(reg), i1);
2684 	    T2_CMP(r0, rn(reg));
2685 	    jit_unget_reg(reg);
2686 	}
2687 	/* use only thumb2 conditional as does not know if will be patched */
2688 	w = _jit->pc.w;
2689 	d = ((i0 - w) >> 1) - 2;
2690 	assert(_s20P(d));
2691 	T2_CC_B(cc, encode_thumb_cc_jump(d));
2692     }
2693     else {
2694 	if ((i = encode_arm_immediate(i1)) != -1)
2695 	    CMPI(r0, i);
2696 	else if ((i = encode_arm_immediate(-i1)) != -1)
2697 	    CMNI(r0, i);
2698 	else {
2699 	    reg = jit_get_reg(jit_class_gpr);
2700 	    movi(rn(reg), i1);
2701 	    CMP(r0, rn(reg));
2702 	    jit_unget_reg(reg);
2703 	}
2704 	w = _jit->pc.w;
2705 	d = ((i0 - w) >> 2) - 2;
2706 	assert(_s24P(d));
2707 	CC_B(cc, d & 0x00ffffff);
2708     }
2709     return (w);
2710 }
2711 
2712 static jit_word_t
_baddr(jit_state_t * _jit,int cc,jit_word_t i0,jit_int32_t r0,jit_int32_t r1)2713 _baddr(jit_state_t *_jit, int cc, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
2714 {
2715     jit_word_t		w;
2716     jit_word_t		d;
2717     if (jit_thumb_p()) {
2718 	if ((r0|r1) < 8)
2719 	    T1_ADD(r0, r0, r1);
2720 	else
2721 	    T2_ADDS(r0, r0, r1);
2722 	w = _jit->pc.w;
2723 	d = ((i0 - w) >> 1) - 2;
2724 	assert(_s20P(d));
2725 	T2_CC_B(cc, encode_thumb_cc_jump(d));
2726     }
2727     else {
2728 	ADDS(r0, r0, r1);
2729 	w = _jit->pc.w;
2730 	d = ((i0 - w) >> 2) - 2;
2731 	assert(_s24P(d));
2732 	CC_B(cc, d & 0x00ffffff);
2733     }
2734     return (w);
2735 }
2736 
2737 static jit_word_t
_baddi(jit_state_t * _jit,int cc,jit_word_t i0,jit_int32_t r0,int i1)2738 _baddi(jit_state_t *_jit, int cc, jit_word_t i0, jit_int32_t r0, int i1)
2739 {
2740     int			i;
2741     jit_word_t		w;
2742     jit_word_t		d;
2743     jit_int32_t		reg;
2744     if (jit_thumb_p()) {
2745 	if (r0 < 8 && !(i1 & ~7))
2746 	    T1_ADDI3(r0, r0, i1);
2747 	else if (r0 < 8 && !(-i1 & ~7))
2748 	    T1_SUBI3(r0, r0, -i1);
2749 	else if (r0 < 8 && !(i1 & ~0xff))
2750 	    T1_ADDI8(r0, i1);
2751 	else if (r0 < 8 && !(-i1 & ~0xff))
2752 	    T1_SUBI8(r0, -i1);
2753 	else if ((i = encode_thumb_immediate(i1)) != -1)
2754 	    T2_ADDSI(r0, r0, i);
2755 	else if ((i = encode_thumb_immediate(-i1)) != -1)
2756 	    T2_SUBSI(r0, r0, i);
2757 	else {
2758 	    reg = jit_get_reg(jit_class_gpr);
2759 	    movi(rn(reg), i1);
2760 	    T2_ADDS(r0, r0, rn(reg));
2761 	    jit_unget_reg(reg);
2762 	}
2763 	w = _jit->pc.w;
2764 	d = ((i0 - w) >> 1) - 2;
2765 	assert(_s20P(d));
2766 	T2_CC_B(cc, encode_thumb_cc_jump(d));
2767     }
2768     else {
2769 	if ((i = encode_arm_immediate(i1)) != -1)
2770 	    ADDSI(r0, r0, i);
2771 	else if ((i = encode_arm_immediate(-i1)) != -1)
2772 	    SUBSI(r0, r0, i);
2773 	else {
2774 	    reg = jit_get_reg(jit_class_gpr);
2775 	    movi(rn(reg), i1);
2776 	    ADDS(r0, r0, rn(reg));
2777 	    jit_unget_reg(reg);
2778 	}
2779 	w = _jit->pc.w;
2780 	d = ((i0 - w) >> 2) - 2;
2781 	assert(_s24P(d));
2782 	CC_B(cc, d & 0x00ffffff);
2783     }
2784     return (w);
2785 }
2786 
2787 static jit_word_t
_bsubr(jit_state_t * _jit,int cc,jit_word_t i0,jit_int32_t r0,jit_int32_t r1)2788 _bsubr(jit_state_t *_jit, int cc, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
2789 {
2790     jit_word_t		w;
2791     jit_word_t		d;
2792     if (jit_thumb_p()) {
2793 	if ((r0|r1) < 8)
2794 	    T1_SUB(r0, r0, r1);
2795 	else
2796 	    T2_SUBS(r0, r0, r1);
2797 	w = _jit->pc.w;
2798 	d = ((i0 - w) >> 1) - 2;
2799 	assert(_s20P(d));
2800 	T2_CC_B(cc, encode_thumb_cc_jump(d));
2801     }
2802     else {
2803 	SUBS(r0, r0, r1);
2804 	w = _jit->pc.w;
2805 	d = ((i0 - w) >> 2) - 2;
2806 	assert(_s24P(d));
2807 	CC_B(cc, d & 0x00ffffff);
2808     }
2809     return (w);
2810 }
2811 
2812 static jit_word_t
_bsubi(jit_state_t * _jit,int cc,jit_word_t i0,jit_int32_t r0,int i1)2813 _bsubi(jit_state_t *_jit, int cc, jit_word_t i0, jit_int32_t r0, int i1)
2814 {
2815     int			i;
2816     jit_word_t		w;
2817     jit_word_t		d;
2818     jit_int32_t		reg;
2819     if (jit_thumb_p()) {
2820 	if (r0 < 8 && !(i1 & ~7))
2821 	    T1_SUBI3(r0, r0, i1);
2822 	else if (r0 < 8 && !(-i1 & ~7))
2823 	    T1_ADDI3(r0, r0, -i1);
2824 	else if (r0 < 8 && !(i1 & ~0xff))
2825 	    T1_SUBI8(r0, i1);
2826 	else if (r0 < 8 && !(-i1 & ~0xff))
2827 	    T1_ADDI8(r0, -i1);
2828 	else if ((i = encode_thumb_immediate(i1)) != -1)
2829 	    T2_SUBSI(r0, r0, i);
2830 	else if ((i = encode_thumb_immediate(-i1)) != -1)
2831 	    T2_SUBSI(r0, r0, i);
2832 	else {
2833 	    reg = jit_get_reg(jit_class_gpr);
2834 	    movi(rn(reg), i1);
2835 	    T2_SUBS(r0, r0, rn(reg));
2836 	    jit_unget_reg(reg);
2837 	}
2838 	w = _jit->pc.w;
2839 	d = ((i0 - w) >> 1) - 2;
2840 	assert(_s20P(d));
2841 	T2_CC_B(cc, encode_thumb_cc_jump(d));
2842     }
2843     else {
2844 	if ((i = encode_arm_immediate(i1)) != -1)
2845 	    SUBSI(r0, r0, i);
2846 	else if ((i = encode_arm_immediate(-i1)) != -1)
2847 	    ADDSI(r0, r0, i);
2848 	else {
2849 	    reg = jit_get_reg(jit_class_gpr);
2850 	    movi(rn(reg), i1);
2851 	    SUBS(r0, r0, rn(reg));
2852 	    jit_unget_reg(reg);
2853 	}
2854 	w = _jit->pc.w;
2855 	d = ((i0 - w) >> 2) - 2;
2856 	assert(_s24P(d));
2857 	CC_B(cc, d & 0x00ffffff);
2858     }
2859     return (w);
2860 }
2861 
2862 static jit_word_t
_bmxr(jit_state_t * _jit,int cc,jit_word_t i0,jit_int32_t r0,jit_int32_t r1)2863 _bmxr(jit_state_t *_jit, int cc, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
2864 {
2865     jit_word_t		w;
2866     jit_word_t		d;
2867     jit_int32_t		reg;
2868     if (jit_thumb_p()) {
2869 	if ((r0|r1) < 8)
2870 	    T1_TST(r0, r1);
2871 	else
2872 	    T2_TST(r0, r1);
2873 	w = _jit->pc.w;
2874 	d = ((i0 - w) >> 1) - 2;
2875 	assert(_s20P(d));
2876 	T2_CC_B(cc, encode_thumb_cc_jump(d));
2877     }
2878     else {
2879 	if (jit_armv5_p())
2880 	    TST(r0, r1);
2881 	else {
2882 	    reg = jit_get_reg(jit_class_gpr);
2883 	    ANDS(rn(reg), r0, r1);
2884 	    jit_unget_reg(reg);
2885 	}
2886 	w = _jit->pc.w;
2887 	d = ((i0 - w) >> 2) - 2;
2888 	assert(_s24P(d));
2889 	CC_B(cc, d & 0x00ffffff);
2890     }
2891     return (w);
2892 }
2893 
2894 static jit_word_t
_bmxi(jit_state_t * _jit,int cc,jit_word_t i0,jit_int32_t r0,jit_word_t i1)2895 _bmxi(jit_state_t *_jit, int cc, jit_word_t i0, jit_int32_t r0, jit_word_t i1)
2896 {
2897     int			i;
2898     jit_word_t		w;
2899     jit_word_t		d;
2900     jit_int32_t		reg;
2901     if (jit_thumb_p()) {
2902 	if ((i = encode_thumb_immediate(i1)) != -1)
2903 	    T2_TSTI(r0, i);
2904 	else {
2905 	    reg = jit_get_reg(jit_class_gpr);
2906 	    movi(rn(reg), i1);
2907 	    T2_TST(r0, rn(reg));
2908 	    jit_unget_reg(reg);
2909 	}
2910 	w = _jit->pc.w;
2911 	d = ((i0 - w) >> 1) - 2;
2912 	assert(_s20P(d));
2913 	T2_CC_B(cc, encode_thumb_cc_jump(d));
2914     }
2915     else {
2916 	if (jit_armv5_p()) {
2917 	    if ((i = encode_arm_immediate(i1)) != -1)
2918 		TSTI(r0, i);
2919 	    else {
2920 		reg = jit_get_reg(jit_class_gpr);
2921 		movi(rn(reg), i1);
2922 		TST(r0, rn(reg));
2923 		jit_unget_reg(reg);
2924 	    }
2925 	}
2926 	else {
2927 	    reg = jit_get_reg(jit_class_gpr);
2928 	    if ((i = encode_arm_immediate(i1)) != -1)
2929 		ANDSI(rn(reg), r0, i);
2930 	    else if ((i = encode_arm_immediate(~i1)) != -1)
2931 		BICSI(rn(reg), r0, i);
2932 	    else {
2933 		movi(rn(reg), i1);
2934 		ANDS(rn(reg), r0, rn(reg));
2935 	    }
2936 	    jit_unget_reg(reg);
2937 	}
2938 	w = _jit->pc.w;
2939 	d = ((i0 - w) >> 2) - 2;
2940 	assert(_s24P(d));
2941 	CC_B(cc, d & 0x00ffffff);
2942     }
2943     return (w);
2944 }
2945 
2946 static void
_ldr_c(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)2947 _ldr_c(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
2948 {
2949     if (jit_thumb_p())
2950 	T2_LDRSBI(r0, r1, 0);
2951     else
2952 	LDRSBI(r0, r1, 0);
2953 }
2954 
2955 static void
_ldi_c(jit_state_t * _jit,jit_int32_t r0,jit_word_t i0)2956 _ldi_c(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
2957 {
2958     jit_int32_t		reg;
2959     reg = jit_get_reg(jit_class_gpr);
2960     movi(rn(reg), i0);
2961     if (jit_thumb_p())
2962 	T2_LDRSBI(r0, rn(reg), 0);
2963     else
2964 	LDRSBI(r0, rn(reg), 0);
2965     jit_unget_reg(reg);
2966 }
2967 
2968 static void
_ldxr_c(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)2969 _ldxr_c(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2970 {
2971     if (jit_thumb_p()) {
2972 	if ((r0|r1|r2) < 8)
2973 	    T1_LDRSB(r0, r1, r2);
2974 	else
2975 	    T2_LDRSB(r0, r1, r2);
2976     }
2977     else
2978 	LDRSB(r0, r1, r2);
2979 }
2980 
2981 static void
_ldxi_c(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)2982 _ldxi_c(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2983 {
2984     jit_int32_t		reg;
2985     if (jit_thumb_p()) {
2986 	if (jit_ldrt_strt_p() && i0 >= 0 && i0 <= 255)
2987 	    T2_LDRSBI(r0, r1, i0);
2988 	else if (i0 < 0 && i0 >= -255)
2989 	    T2_LDRSBIN(r0, r1, -i0);
2990 	else if (i0 >= 0 && i0 <= 4095)
2991 	    T2_LDRSBWI(r0, r1, i0);
2992 	else if (r0 != r1) {
2993 	    movi(r0, i0);
2994 	    if ((r0|r1) < 8)
2995 		T1_LDRSB(r0, r1, r0);
2996 	    else
2997 		T2_LDRSB(r0, r1, r0);
2998 	}
2999 	else {
3000 	    reg = jit_get_reg(jit_class_gpr);
3001 	    movi(rn(reg), i0);
3002 	    if ((r0|r1|rn(reg)) < 8)
3003 		T1_LDRSB(r0, r1, rn(reg));
3004 	    else
3005 		T2_LDRSB(r0, r1, rn(reg));
3006 	    jit_unget_reg(reg);
3007 	}
3008     }
3009     else {
3010 	if (i0 >= 0 && i0 <= 255)
3011 	    LDRSBI(r0, r1, i0);
3012 	else if (i0 < 0 && i0 >= -255)
3013 	    LDRSBIN(r0, r1, -i0);
3014 	else if (r0 != r1) {
3015 	    movi(r0, i0);
3016 	    LDRSB(r0, r1, r0);
3017 	}
3018 	else {
3019 	    reg = jit_get_reg(jit_class_gpr);
3020 	    movi(rn(reg), i0);
3021 	    LDRSB(r0, r1, rn(reg));
3022 	    jit_unget_reg(reg);
3023 	}
3024     }
3025 }
3026 
3027 static void
_ldr_uc(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)3028 _ldr_uc(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3029 {
3030     if (jit_thumb_p())
3031 	T2_LDRBI(r0, r1, 0);
3032     else
3033 	LDRBI(r0, r1, 0);
3034 }
3035 
3036 static void
_ldi_uc(jit_state_t * _jit,jit_int32_t r0,jit_word_t i0)3037 _ldi_uc(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
3038 {
3039     jit_int32_t		reg;
3040     reg = jit_get_reg(jit_class_gpr);
3041     movi(rn(reg), i0);
3042     if (jit_thumb_p())
3043 	T2_LDRBI(r0, rn(reg), 0);
3044     else
3045 	LDRBI(r0, rn(reg), 0);
3046     jit_unget_reg(reg);
3047 }
3048 
3049 static void
_ldxr_uc(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)3050 _ldxr_uc(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
3051 {
3052     if (jit_thumb_p()) {
3053 	if ((r0|r1|r2) < 8)
3054 	    T1_LDRB(r0, r1, r2);
3055 	else
3056 	    T2_LDRB(r0, r1, r2);
3057     }
3058     else
3059 	LDRB(r0, r1, r2);
3060 }
3061 
3062 static void
_ldxi_uc(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)3063 _ldxi_uc(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
3064 {
3065     jit_int32_t		reg;
3066     if (jit_thumb_p()) {
3067 	if ((r0|r1) < 8 && i0 >= 0 && i0 < 0x20)
3068 	    T1_LDRBI(r0, r1, i0);
3069 	else if (jit_ldrt_strt_p() && i0 >= 0 && i0 <= 255)
3070 	    T2_LDRBI(r0, r1, i0);
3071 	else if (i0 < 0 && i0 >= -255)
3072 	    T2_LDRBIN(r0, r1, -i0);
3073 	else if (i0 >= 0 && i0 <= 4095)
3074 	    T2_LDRBWI(r0, r1, i0);
3075 	else if (r0 != r1) {
3076 	    movi(r0, i0);
3077 	    if ((r0|r1) < 8)
3078 		T1_LDRB(r0, r1, r0);
3079 	    else
3080 		T2_LDRB(r0, r1, r0);
3081 	}
3082 	else {
3083 	    reg = jit_get_reg(jit_class_gpr);
3084 	    movi(rn(reg), i0);
3085 	    if ((r0|r1|rn(reg)) < 8)
3086 		T1_LDRB(r0, r1, rn(reg));
3087 	    else
3088 		T2_LDRB(r0, r1, rn(reg));
3089 	    jit_unget_reg(reg);
3090 	}
3091     }
3092     else {
3093 	if (i0 >= 0 && i0 <= 4095)
3094 	    LDRBI(r0, r1, i0);
3095 	else if (i0 < 0 && i0 >= -4095)
3096 	    LDRBIN(r0, r1, -i0);
3097 	else if (r0 != r1) {
3098 	    movi(r0, i0);
3099 	    LDRB(r0, r1, r0);
3100 	}
3101 	else {
3102 	    reg = jit_get_reg(jit_class_gpr);
3103 	    movi(rn(reg), i0);
3104 	    LDRB(r0, r1, rn(reg));
3105 	    jit_unget_reg(reg);
3106 	}
3107     }
3108 }
3109 
3110 static void
_ldr_s(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)3111 _ldr_s(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3112 {
3113     if (jit_thumb_p())
3114 	T2_LDRSHI(r0, r1, 0);
3115     else
3116 	LDRSHI(r0, r1, 0);
3117 }
3118 
3119 static void
_ldi_s(jit_state_t * _jit,jit_int32_t r0,jit_word_t i0)3120 _ldi_s(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
3121 {
3122     jit_int32_t		reg;
3123     reg = jit_get_reg(jit_class_gpr);
3124     movi(rn(reg), i0);
3125     if (jit_thumb_p())
3126 	T2_LDRSHI(r0, rn(reg), 0);
3127     else
3128 	LDRSHI(r0, rn(reg), 0);
3129     jit_unget_reg(reg);
3130 }
3131 
3132 static void
_ldxr_s(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)3133 _ldxr_s(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
3134 {
3135     if (jit_thumb_p()) {
3136 	if ((r0|r1|r2) < 8)
3137 	    T1_LDRSH(r0, r1, r2);
3138 	else
3139 	    T2_LDRSH(r0, r1, r2);
3140     }
3141     else
3142 	LDRSH(r0, r1, r2);
3143 }
3144 
3145 static void
_ldxi_s(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)3146 _ldxi_s(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
3147 {
3148     jit_int32_t		reg;
3149     if (jit_thumb_p()) {
3150 	if (jit_ldrt_strt_p() && i0 >= 0 && i0 <= 255)
3151 	    T2_LDRSHI(r0, r1, i0);
3152 	else if (i0 < 0 && i0 >= -255)
3153 	    T2_LDRSHIN(r0, r1, -i0);
3154 	else if (i0 >= 0 && i0 <= 4095)
3155 	    T2_LDRSHWI(r0, r1, i0);
3156 	else if (r0 != r1) {
3157 	    movi(r0, i0);
3158 	    if ((r0|r1) < 8)
3159 		T1_LDRSH(r0, r1, r0);
3160 	    else
3161 		T2_LDRSH(r0, r1, r0);
3162 	}
3163 	else {
3164 	    reg = jit_get_reg(jit_class_gpr);
3165 	    movi(rn(reg), i0);
3166 	    if ((r0|r1|rn(reg)) < 8)
3167 		T1_LDRSH(r0, r1, rn(reg));
3168 	    else
3169 		T2_LDRSH(r0, r1, rn(reg));
3170 	    jit_unget_reg(reg);
3171 	}
3172     }
3173     else {
3174 	if (i0 >= 0 && i0 <= 255)
3175 	    LDRSHI(r0, r1, i0);
3176 	else if (i0 < 0 && i0 >= -255)
3177 	    LDRSHIN(r0, r1, -i0);
3178 	else if (r0 != r1) {
3179 	    movi(r0, i0);
3180 	    LDRSH(r0, r1, r0);
3181 	}
3182 	else {
3183 	    reg = jit_get_reg(jit_class_gpr);
3184 	    movi(rn(reg), i0);
3185 	    LDRSH(r0, r1, rn(reg));
3186 	    jit_unget_reg(reg);
3187 	}
3188     }
3189 }
3190 
3191 static void
_ldr_us(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)3192 _ldr_us(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3193 {
3194     if (jit_thumb_p())
3195 	T2_LDRHI(r0, r1, 0);
3196     else
3197 	LDRHI(r0, r1, 0);
3198 }
3199 
3200 static void
_ldi_us(jit_state_t * _jit,jit_int32_t r0,jit_word_t i0)3201 _ldi_us(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
3202 {
3203     jit_int32_t		reg;
3204     reg = jit_get_reg(jit_class_gpr);
3205     movi(rn(reg), i0);
3206     if (jit_thumb_p())
3207 	T2_LDRHI(r0, rn(reg), 0);
3208     else
3209 	LDRHI(r0, rn(reg), 0);
3210     jit_unget_reg(reg);
3211 }
3212 
3213 static void
_ldxr_us(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)3214 _ldxr_us(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
3215 {
3216     if (jit_thumb_p()) {
3217 	if ((r0|r1|r2) < 8)
3218 	    T1_LDRH(r0, r1, r2);
3219 	else
3220 	    T2_LDRH(r0, r1, r2);
3221     }
3222     else
3223 	LDRH(r0, r1, r2);
3224 }
3225 
3226 static void
_ldxi_us(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)3227 _ldxi_us(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
3228 {
3229     jit_int32_t		reg;
3230     if (jit_thumb_p()) {
3231 	if ((r0|r1) < 8 && i0 >= 0 && !(i0 & 1) && (i0 >> 1) < 0x20)
3232 	    T1_LDRHI(r0, r1, i0 >> 1);
3233 	else if (jit_ldrt_strt_p() && i0 >= 0 && i0 <= 255)
3234 	    T2_LDRHI(r0, r1, i0);
3235 	else if (i0 < 0 && i0 >= -255)
3236 	    T2_LDRHIN(r0, r1, -i0);
3237 	else if (i0 >= 0 && i0 <= 4095)
3238 	    T2_LDRHWI(r0, r1, i0);
3239 	else if (r0 != r1) {
3240 	    movi(r0, i0);
3241 	    if ((r0|r1) < 8)
3242 		T1_LDRH(r0, r1, r0);
3243 	    else
3244 		T2_LDRH(r0, r1, r0);
3245 	}
3246 	else {
3247 	    reg = jit_get_reg(jit_class_gpr);
3248 	    movi(rn(reg), i0);
3249 	    if ((r0|r1|rn(reg)) < 8)
3250 		T1_LDRH(r0, r1, rn(reg));
3251 	    else
3252 		T2_LDRH(r0, r1, rn(reg));
3253 	    jit_unget_reg(reg);
3254 	}
3255     }
3256     else {
3257 	if (i0 >= 0 && i0 <= 255)
3258 	    LDRHI(r0, r1, i0);
3259 	else if (i0 < 0 && i0 >= -255)
3260 	    LDRHIN(r0, r1, -i0);
3261 	else if (r0 != r1) {
3262 	    movi(r0, i0);
3263 	    LDRH(r0, r1, r0);
3264 	}
3265 	else {
3266 	    reg = jit_get_reg(jit_class_gpr);
3267 	    movi(rn(reg), i0);
3268 	    LDRH(r0, r1, rn(reg));
3269 	    jit_unget_reg(reg);
3270 	}
3271     }
3272 }
3273 
3274 static void
_ldr_i(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)3275 _ldr_i(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3276 {
3277     if (jit_thumb_p())
3278 	T2_LDRI(r0, r1, 0);
3279     else
3280 	LDRI(r0, r1, 0);
3281 }
3282 
3283 static void
_ldi_i(jit_state_t * _jit,jit_int32_t r0,jit_word_t i0)3284 _ldi_i(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
3285 {
3286     jit_int32_t		reg;
3287     reg = jit_get_reg(jit_class_gpr);
3288     movi(rn(reg), i0);
3289     if (jit_thumb_p())
3290 	T2_LDRI(r0, rn(reg), 0);
3291     else
3292 	LDRI(r0, rn(reg), 0);
3293     jit_unget_reg(reg);
3294 }
3295 
3296 static void
_ldxr_i(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)3297 _ldxr_i(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
3298 {
3299     if (jit_thumb_p()) {
3300 	if ((r0|r1|r2) < 8)
3301 	    T1_LDR(r0, r1, r2);
3302 	else
3303 	    T2_LDR(r0, r1, r2);
3304     }
3305     else
3306 	LDR(r0, r1, r2);
3307 }
3308 
3309 static void
_ldxi_i(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)3310 _ldxi_i(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
3311 {
3312     jit_int32_t		reg;
3313     if (jit_thumb_p()) {
3314 	if ((r0|r1) < 8 && i0 >= 0 && !(i0 & 3) && (i0 >> 2) < 0x20)
3315 	    T1_LDRI(r0, r1, i0 >> 2);
3316 	else if (r1 == _R13_REGNO && r0 < 8 &&
3317 		 i0 >= 0 && !(i0 & 3) && (i0 >> 2) <= 255)
3318 	    T1_LDRISP(r0, i0 >> 2);
3319 	else if (jit_ldrt_strt_p() && i0 >= 0 && i0 <= 255)
3320 	    T2_LDRI(r0, r1, i0);
3321 	else if (i0 < 0 && i0 > -255)
3322 	    T2_LDRIN(r0, r1, -i0);
3323 	else if (i0 >= 0 && i0 <= 4095)
3324 	    T2_LDRWI(r0, r1, i0);
3325 	else if (r0 != r1) {
3326 	    movi(r0, i0);
3327 	    if ((r0|r1) < 8)
3328 		T1_LDR(r0, r1, r0);
3329 	    else
3330 		T2_LDR(r0, r1, r0);
3331 	}
3332 	else {
3333 	    reg = jit_get_reg(jit_class_gpr);
3334 	    movi(rn(reg), i0);
3335 	    if ((r0|r1|rn(reg)) < 8)
3336 		T1_LDR(r0, r1, rn(reg));
3337 	    else
3338 		T2_LDR(r0, r1, rn(reg));
3339 	    jit_unget_reg(reg);
3340 	}
3341     }
3342     else {
3343 	if (i0 >= 0 && i0 <= 4095)
3344 	    LDRI(r0, r1, i0);
3345 	else if (i0 < 0 && i0 >= -4095)
3346 	    LDRIN(r0, r1, -i0);
3347 	else if (r0 != r1) {
3348 	    movi(r0, i0);
3349 	    LDR(r0, r1, r0);
3350 	}
3351 	else {
3352 	    reg = jit_get_reg(jit_class_gpr);
3353 	    movi(rn(reg), i0);
3354 	    LDR(r0, r1, rn(reg));
3355 	    jit_unget_reg(reg);
3356 	}
3357     }
3358 }
3359 
3360 static void
_str_c(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)3361 _str_c(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3362 {
3363     if (jit_thumb_p())
3364 	T2_STRBI(r1, r0, 0);
3365     else
3366 	STRBI(r1, r0, 0);
3367 }
3368 
3369 static void
_sti_c(jit_state_t * _jit,jit_word_t i0,jit_int32_t r0)3370 _sti_c(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0)
3371 {
3372     jit_int32_t		reg;
3373     reg = jit_get_reg(jit_class_gpr);
3374     movi(rn(reg), i0);
3375     if (jit_thumb_p())
3376 	T2_STRBI(r0, rn(reg), 0);
3377     else
3378 	STRBI(r0, rn(reg), 0);
3379     jit_unget_reg(reg);
3380 }
3381 
3382 static void
_stxr_c(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)3383 _stxr_c(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
3384 {
3385     if (jit_thumb_p()) {
3386 	if ((r0|r1|r2) < 8)
3387 	    T1_STRB(r2, r1, r0);
3388 	else
3389 	    T2_STRB(r2, r1, r0);
3390     }
3391     else
3392 	STRB(r2, r1, r0);
3393 }
3394 
3395 static void
_stxi_c(jit_state_t * _jit,jit_word_t i0,jit_int32_t r0,jit_int32_t r1)3396 _stxi_c(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
3397 {
3398     jit_int32_t		reg;
3399     if (jit_thumb_p()) {
3400 	if ((r0|r1) < 8 && i0 >= 0 && i0 < 0x20)
3401 	    T1_STRBI(r1, r0, i0);
3402 	else if (jit_ldrt_strt_p() && i0 >= 0 && i0 <= 255)
3403 	    T2_STRBI(r1, r0, i0);
3404 	else if (i0 < 0 && i0 >= -255)
3405 	    T2_STRBIN(r1, r0, -i0);
3406 	else if (i0 >= 0 && i0 <= 4095)
3407 	    T2_STRBWI(r1, r0, i0);
3408 	else {
3409 	    reg = jit_get_reg(jit_class_gpr);
3410 	    movi(rn(reg), i0);
3411 	    if ((r0|r1|rn(reg)) < 8)
3412 		T1_STRB(r1, r0, rn(reg));
3413 	    else
3414 		T2_STRB(r1, r0, rn(reg));
3415 	    jit_unget_reg(reg);
3416 	}
3417     }
3418     else {
3419 	if (i0 >= 0 && i0 <= 4095)
3420 	    STRBI(r1, r0, i0);
3421 	else if (i0 < 0 && i0 >= -4095)
3422 	    STRBIN(r1, r0, -i0);
3423 	else {
3424 	    reg = jit_get_reg(jit_class_gpr);
3425 	    movi(rn(reg), i0);
3426 	    STRB(r1, r0, rn(reg));
3427 	    jit_unget_reg(reg);
3428 	}
3429     }
3430 }
3431 
3432 static void
_str_s(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)3433 _str_s(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3434 {
3435     if (jit_thumb_p())
3436 	T2_STRHI(r1, r0, 0);
3437     else
3438 	STRHI(r1, r0, 0);
3439 }
3440 
3441 static void
_sti_s(jit_state_t * _jit,jit_word_t i0,jit_int32_t r0)3442 _sti_s(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0)
3443 {
3444     jit_int32_t		reg;
3445     reg = jit_get_reg(jit_class_gpr);
3446     movi(rn(reg), i0);
3447     if (jit_thumb_p())
3448 	T2_STRHI(r0, rn(reg), 0);
3449     else
3450 	STRHI(r0, rn(reg), 0);
3451     jit_unget_reg(reg);
3452 }
3453 
3454 static void
_stxr_s(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)3455 _stxr_s(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
3456 {
3457     if (jit_thumb_p()) {
3458 	if ((r0|r1|r2) < 8)
3459 	    T1_STRH(r2, r1, r0);
3460 	else
3461 	    T2_STRH(r2, r1, r0);
3462     }
3463     else
3464 	STRH(r2, r1, r0);
3465 }
3466 
3467 static void
_stxi_s(jit_state_t * _jit,jit_word_t i0,jit_int32_t r0,jit_int32_t r1)3468 _stxi_s(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
3469 {
3470     jit_int32_t		reg;
3471     if (jit_thumb_p()) {
3472 	if ((r0|r1) < 8 && i0 >= 0 && !(i0 & 1) && (i0 >> 1) < 0x20)
3473 	    T1_STRHI(r1, r0, i0 >> 1);
3474 	else if (jit_ldrt_strt_p() && i0 >= 0 && i0 <= 255)
3475 	    T2_STRHI(r1, r0, i0);
3476 	else if (i0 < 0 && i0 >= -255)
3477 	    T2_STRHIN(r1, r0, -i0);
3478 	else if (i0 >= 0 && i0 <= 4095)
3479 	    T2_STRHWI(r1, r0, i0);
3480 	else {
3481 	    reg = jit_get_reg(jit_class_gpr);
3482 	    movi(rn(reg), i0);
3483 	    if ((r0|r1|rn(reg)) < 8)
3484 		T1_STRH(r1, r0, rn(reg));
3485 	    else
3486 		T2_STRH(r1, r0, rn(reg));
3487 	    jit_unget_reg(reg);
3488 	}
3489     }
3490     else {
3491 	if (i0 >= 0 && i0 <= 255)
3492 	    STRHI(r1, r0, i0);
3493 	else if (i0 < 0 && i0 >= -255)
3494 	    STRHIN(r1, r0, -i0);
3495 	else {
3496 	    reg = jit_get_reg(jit_class_gpr);
3497 	    movi(rn(reg), i0);
3498 	    STRH(r1, r0, rn(reg));
3499 	    jit_unget_reg(reg);
3500 	}
3501     }
3502 }
3503 
3504 static void
_str_i(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)3505 _str_i(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3506 {
3507     if (jit_thumb_p())
3508 	T2_STRI(r1, r0, 0);
3509     else
3510 	STRI(r1, r0, 0);
3511 }
3512 
3513 static void
_sti_i(jit_state_t * _jit,jit_word_t i0,jit_int32_t r0)3514 _sti_i(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0)
3515 {
3516     jit_int32_t		reg;
3517     reg = jit_get_reg(jit_class_gpr);
3518     movi(rn(reg), i0);
3519     if (jit_thumb_p())
3520 	T2_STRI(r0, rn(reg), 0);
3521     else
3522 	STRI(r0, rn(reg), 0);
3523     jit_unget_reg(reg);
3524 }
3525 
3526 static void
_stxr_i(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)3527 _stxr_i(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
3528 {
3529     if (jit_thumb_p()) {
3530 	if ((r0|r1|r2) < 8)
3531 	    T1_STR(r2, r1, r0);
3532 	else
3533 	    T2_STR(r2, r1, r0);
3534     }
3535     else
3536 	STR(r2, r1, r0);
3537 }
3538 
3539 static void
_stxi_i(jit_state_t * _jit,jit_word_t i0,jit_int32_t r0,jit_int32_t r1)3540 _stxi_i(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
3541 {
3542     jit_int32_t		reg;
3543     if (jit_thumb_p()) {
3544 	if ((r0|r1) < 8 && i0 >= 0 && !(i0 & 3) && (i0 >> 2) < 0x20)
3545 	    T1_STRI(r1, r0, i0 >> 2);
3546 	else if (r0 == _R13_REGNO && r1 < 8 &&
3547 		 i0 >= 0 && !(i0 & 3) && (i0 >> 2) <= 255)
3548 	    T1_STRISP(r1, i0 >> 2);
3549 	else if (jit_ldrt_strt_p() && i0 >= 0 && i0 <= 255)
3550 	    T2_STRI(r1, r0, i0);
3551 	else if (i0 < 0 && i0 >= -255)
3552 	    T2_STRIN(r1, r0, -i0);
3553 	else if (i0 >= 0 && i0 <= 4095)
3554 	    T2_STRWI(r1, r0, i0);
3555 	else {
3556 	    reg = jit_get_reg(jit_class_gpr);
3557 	    movi(rn(reg), i0);
3558 	    if ((r0|r1|rn(reg)) < 8)
3559 		T1_STR(r1, r0, rn(reg));
3560 	    else
3561 		T2_STR(r1, r0, rn(reg));
3562 	    jit_unget_reg(reg);
3563 	}
3564     }
3565     else {
3566 	if (i0 >= 0 && i0 <= 4095)
3567 	    STRI(r1, r0, i0);
3568 	else if (i0 < 0 && i0 >= -4095)
3569 	    STRIN(r1, r0, -i0);
3570 	else {
3571 	    reg = jit_get_reg(jit_class_gpr);
3572 	    movi(rn(reg), i0);
3573 	    STR(r1, r0, rn(reg));
3574 	    jit_unget_reg(reg);
3575 	}
3576     }
3577 }
3578 
3579 #  if __BYTE_ORDER == __LITTLE_ENDIAN
3580 static void
_htonr_us(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)3581 _htonr_us(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3582 {
3583     jit_int32_t		t0;
3584     if (jit_thumb_p()) {
3585 	if ((r0|r1) < 8)
3586 	    T1_REV(r0, r1);
3587 	else
3588 	    T2_REV(r0, r1);
3589 	rshi_u(r0, r0, 16);
3590     }
3591     else {
3592 	if (jit_armv6_p()) {
3593 	    REV(r0, r1);
3594 	    rshi_u(r0, r0, 16);
3595 	}
3596 	else {
3597 	    t0 = jit_get_reg(jit_class_gpr);
3598 	    rshi(rn(t0), r1, 8);
3599 	    andi(r0, r1, 0xff);
3600 	    andi(rn(t0), rn(t0), 0xff);
3601 	    lshi(r0, r0, 8);
3602 	    orr(r0, r0, rn(t0));
3603 	    jit_unget_reg(t0);
3604 	}
3605     }
3606 }
3607 
3608 /* inline glibc htonl (without register clobber) */
3609 static void
_htonr_ui(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)3610 _htonr_ui(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3611 {
3612     jit_int32_t		reg;
3613     if (jit_thumb_p()) {
3614 	if ((r0|r1) < 8)
3615 	    T1_REV(r0, r1);
3616 	else
3617 	    T2_REV(r0, r1);
3618     }
3619     else {
3620 	if (jit_armv6_p())
3621 	    REV(r0, r1);
3622 	else {
3623 	    reg = jit_get_reg(jit_class_gpr);
3624 	    EOR_SI(rn(reg), r1, r1, ARM_ROR, 16);
3625 	    LSRI(rn(reg), rn(reg), 8);
3626 	    BICI(rn(reg), rn(reg), encode_arm_immediate(0xff00));
3627 	    EOR_SI(r0, rn(reg), r1, ARM_ROR, 8);
3628 	    jit_unget_reg(reg);
3629 	}
3630     }
3631 }
3632 #endif
3633 
3634 static void
_extr_c(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)3635 _extr_c(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3636 {
3637     if (jit_thumb_p()) {
3638 	if ((r0|r1) < 8)
3639 	    T1_SXTB(r0, r1);
3640 	else
3641 	    T2_SXTB(r0, r1);
3642     }
3643     else {
3644 	if (jit_armv6_p())
3645 	    SXTB(r0, r1);
3646 	else {
3647 	    LSLI(r0, r1, 24);
3648 	    ASRI(r0, r0, 24);
3649 	}
3650     }
3651 }
3652 
3653 static void
_extr_uc(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)3654 _extr_uc(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3655 {
3656     if (jit_thumb_p()) {
3657 	if ((r0|r1) < 8)
3658 	    T1_UXTB(r0, r1);
3659 	else
3660 	    T2_UXTB(r0, r1);
3661     }
3662     else {
3663 	if (jit_armv6_p())
3664 	    UXTB(r0, r1);
3665 	else
3666 	    ANDI(r0, r1, 0xff);
3667     }
3668 }
3669 
3670 static void
_extr_s(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)3671 _extr_s(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3672 {
3673     if (jit_thumb_p()) {
3674 	if ((r0|r1) < 8)
3675 	    T1_SXTH(r0, r1);
3676 	else
3677 	    T2_SXTH(r0, r1);
3678     }
3679     else {
3680 	if (jit_armv6_p())
3681 	    SXTH(r0, r1);
3682 	else {
3683 	    LSLI(r0, r1, 16);
3684 	    ASRI(r0, r0, 16);
3685 	}
3686     }
3687 }
3688 
3689 static void
_extr_us(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)3690 _extr_us(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3691 {
3692     if (jit_thumb_p()) {
3693 	if ((r0|r1) < 8)
3694 	    T1_UXTH(r0, r1);
3695 	else
3696 	    T2_UXTH(r0, r1);
3697     }
3698     else {
3699 	if (jit_armv6_p())
3700 	    UXTH(r0, r1);
3701 	else {
3702 	    LSLI(r0, r1, 16);
3703 	    LSRI(r0, r0, 16);
3704 	}
3705     }
3706 }
3707 
3708 static void
_callr(jit_state_t * _jit,jit_int32_t r0)3709 _callr(jit_state_t *_jit, jit_int32_t r0)
3710 {
3711     if (jit_thumb_p())
3712 	T1_BLX(r0);
3713     else
3714 	BLX(r0);
3715 }
3716 
3717 static void
_calli(jit_state_t * _jit,jit_word_t i0)3718 _calli(jit_state_t *_jit, jit_word_t i0)
3719 {
3720     jit_word_t		d;
3721     jit_int32_t		reg;
3722     d = ((i0 - _jit->pc.w) >> 2) - 2;
3723     if (!jit_exchange_p() && !jit_thumb_p() && _s24P(d))
3724 	BLI(d & 0x00ffffff);
3725     else {
3726 	reg = jit_get_reg(jit_class_gpr);
3727 	movi(rn(reg), i0);
3728 	if (jit_thumb_p())
3729 	    T1_BLX(rn(reg));
3730 	else
3731 	    BLX(rn(reg));
3732 	jit_unget_reg(reg);
3733     }
3734 }
3735 
3736 static jit_word_t
_calli_p(jit_state_t * _jit,jit_word_t i0)3737 _calli_p(jit_state_t *_jit, jit_word_t i0)
3738 {
3739     jit_word_t		w;
3740     jit_int32_t		reg;
3741     reg = jit_get_reg(jit_class_gpr);
3742     w = _jit->pc.w;
3743     movi_p(rn(reg), i0);
3744     if (jit_thumb_p())
3745 	T1_BLX(rn(reg));
3746     else
3747 	BLX(rn(reg));
3748     jit_unget_reg(reg);
3749     return (w);
3750 }
3751 
3752 static void
_prolog(jit_state_t * _jit,jit_node_t * node)3753 _prolog(jit_state_t *_jit, jit_node_t *node)
3754 {
3755     jit_int32_t		reg;
3756     if (_jitc->function->define_frame || _jitc->function->assume_frame) {
3757 	jit_int32_t	frame = -_jitc->function->frame;
3758 	assert(_jitc->function->self.aoff >= frame);
3759 	if (_jitc->function->assume_frame) {
3760 	    if (jit_thumb_p() && !_jitc->thumb)
3761 		_jitc->thumb = _jit->pc.w;
3762 	    return;
3763 	}
3764 	_jitc->function->self.aoff = frame;
3765     }
3766     if (_jitc->function->allocar)
3767 	_jitc->function->self.aoff &= -8;
3768     _jitc->function->stack = ((_jitc->function->self.alen -
3769 			      /* align stack at 8 bytes */
3770 			      _jitc->function->self.aoff) + 7) & -8;
3771 
3772     if (jit_thumb_p()) {
3773 	/*  switch to thumb mode (better approach would be to
3774 	 * ORR 1 address being called, but no clear distinction
3775 	 * of what is a pointer to a jit function, or if patching
3776 	 * a pointer to a jit function) */
3777 	ADDI(_R12_REGNO, _R15_REGNO, 1);
3778 	BX(_R12_REGNO);
3779 	if (!_jitc->thumb)
3780 	    _jitc->thumb = _jit->pc.w;
3781 	if (jit_cpu.abi) {
3782 	    T2_PUSH(0xf);
3783 	    T2_PUSH(0x3f0|(1<<_FP_REGNO)|(1<<_LR_REGNO));
3784 	    VPUSH_F64(_D8_REGNO, 8);
3785 	}
3786 	else {
3787 	    T2_PUSH(0xf);
3788 	    T2_PUSH(0x3f0|(1<<_FP_REGNO)|(1<<_LR_REGNO));
3789 	}
3790     }
3791     else {
3792 	if (jit_cpu.abi) {
3793 	    PUSH(0xf);
3794 	    PUSH(0x3f0|(1<<_FP_REGNO)|(1<<_LR_REGNO));
3795 	    VPUSH_F64(_D8_REGNO, 8);
3796 	}
3797 	else {
3798 	    PUSH(0xf);
3799 	    PUSH(0x3f0|(1<<_FP_REGNO)|(1<<_LR_REGNO));
3800 	}
3801     }
3802     movr(_FP_REGNO, _SP_REGNO);
3803     if (_jitc->function->stack)
3804 	subi(_SP_REGNO, _SP_REGNO, _jitc->function->stack);
3805     if (_jitc->function->allocar) {
3806 	reg = jit_get_reg(jit_class_gpr);
3807 	movi(rn(reg), _jitc->function->self.aoff);
3808 	stxi_i(_jitc->function->aoffoff, _FP_REGNO, rn(reg));
3809 	jit_unget_reg(reg);
3810     }
3811 }
3812 
3813 static void
_epilog(jit_state_t * _jit,jit_node_t * node)3814 _epilog(jit_state_t *_jit, jit_node_t *node)
3815 {
3816     if (_jitc->function->assume_frame)
3817 	return;
3818 
3819     movr(_SP_REGNO, _FP_REGNO);
3820     if (jit_cpu.abi)
3821 	VPOP_F64(_D8_REGNO, 8);
3822     if (jit_thumb_p())
3823 	T2_POP(0x3f0|(1<<_FP_REGNO)|(1<<_LR_REGNO));
3824     else
3825 	POP(0x3f0|(1<<_FP_REGNO)|(1<<_LR_REGNO));
3826     addi(_SP_REGNO, _SP_REGNO, 16);
3827     if (jit_thumb_p())
3828 	T1_BX(_LR_REGNO);
3829     else
3830 	BX(_LR_REGNO);
3831     if (jit_thumb_p() && (_jit->pc.w & 2))
3832 	T1_NOP();
3833 }
3834 
3835 static void
_vastart(jit_state_t * _jit,jit_int32_t r0)3836 _vastart(jit_state_t *_jit, jit_int32_t r0)
3837 {
3838     assert(_jitc->function->self.call & jit_call_varargs);
3839 
3840     /* Initialize stack pointer to the first stack argument.
3841      * The -16 is to account for the 4 argument registers
3842      * always saved, and _jitc->function->vagp is to account
3843      * for declared arguments. */
3844     addi(r0, _FP_REGNO, _jitc->function->self.size -
3845 	 16 + _jitc->function->vagp);
3846 }
3847 
3848 static void
_vaarg(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)3849 _vaarg(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3850 {
3851     assert(_jitc->function->self.call & jit_call_varargs);
3852 
3853     /* Load argument. */
3854     ldr(r0, r1);
3855 
3856     /* Update stack pointer. */
3857     addi(r1, r1, sizeof(jit_word_t));
3858 }
3859 
3860 static void
_patch_at(jit_state_t * _jit,jit_int32_t kind,jit_word_t instr,jit_word_t label)3861 _patch_at(jit_state_t *_jit,
3862 	  jit_int32_t kind, jit_word_t instr, jit_word_t label)
3863 {
3864     jit_word_t		 d;
3865     jit_thumb_t		 thumb;
3866     union {
3867 	jit_int16_t	*s;
3868 	jit_int32_t	*i;
3869 	jit_word_t	 w;
3870     } u;
3871     u.w = instr;
3872     if (kind == arm_patch_jump) {
3873 	if (jit_thumb_p() && (jit_uword_t)instr >= _jitc->thumb) {
3874 	    code2thumb(thumb.s[0], thumb.s[1], u.s[0], u.s[1]);
3875 	    if ((thumb.i & THUMB2_B) == THUMB2_B) {
3876 		d = ((label - instr) >> 1) - 2;
3877 		assert(_s24P(d));
3878 		thumb.i = THUMB2_B | encode_thumb_jump(d);
3879 		thumb2code(thumb.s[0], thumb.s[1], u.s[0], u.s[1]);
3880 	    }
3881 	    else if ((thumb.i & THUMB2_B) == THUMB2_CC_B) {
3882 		d = ((label - instr) >> 1) - 2;
3883 		assert(_s20P(d));
3884 		thumb.i = THUMB2_CC_B | (thumb.i & 0x3c00000) |
3885 			  encode_thumb_cc_jump(d);
3886 		thumb2code(thumb.s[0], thumb.s[1], u.s[0], u.s[1]);
3887 	    }
3888 	    else {
3889 		/* for the sake of simplicity in case choose to
3890 		 * movw+movt+[bx|blx], e.g. if changing to instead
3891 		 * of asserting target is reachable, load constant
3892 		 * and do indirect jump if not reachable */
3893 		if ((thumb.i & 0xfbf00000) == THUMB2_MOVWI)
3894 		    goto indirect_jump;
3895 		assert(!"handled branch opcode");
3896 	    }
3897 	}
3898 	else {
3899 	    thumb.i = u.i[0];
3900 	    /* 0x0e000000 because 0x01000000 is (branch&) link modifier */
3901 	    assert((thumb.i & 0x0e000000) == ARM_B);
3902 	    d = ((label - instr) >> 2) - 2;
3903 	    assert(_s24P(d));
3904 	    u.i[0] = (thumb.i & 0xff000000) | (d & 0x00ffffff);
3905 	}
3906     }
3907     else if (kind == arm_patch_load) {
3908 	/* offset may be negative for a forward patch because it
3909 	 * is relative to pc + 8, for example:
3910 	 *	    ldr r0, [pc, #-4]
3911 	 *	    bx r0		;; [pc, #-8]
3912 	 *	    .data ...		;; [pc, #-4]
3913 	 *	    ... 		;; [pc]
3914 	 */
3915 	assert(!jit_thumb_p());
3916 	thumb.i = u.i[0];
3917 	assert((thumb.i & 0x0f700000) == ARM_LDRI);
3918 	d = label - (instr + 8);
3919 	if (d < 0) {
3920 	    thumb.i &= ~ARM_P;
3921 	    d = -d;
3922 	}
3923 	else
3924 	    thumb.i |= ARM_P;
3925 	assert(!(d & 0xfffff000));
3926 	u.i[0] = (thumb.i & 0xfffff000) | d;
3927     }
3928     else if (kind == arm_patch_word) {
3929 	if (jit_thumb_p()) {
3930 	    code2thumb(thumb.s[0], thumb.s[1], u.s[0], u.s[1]);
3931 	    assert((thumb.i & 0xfbf00000) == THUMB2_MOVWI);
3932 	indirect_jump:
3933 	    thumb.i = ((thumb.i & 0xfbf00f00) |
3934 		       ( (label & 0x0000f000) <<  4) |
3935 		       ( (label & 0x00000800) << 15) |
3936 		       ( (label & 0x00000700) <<  4) |
3937 		       (  label & 0x000000ff));
3938 	    thumb2code(thumb.s[0], thumb.s[1], u.s[0], u.s[1]);
3939 	    label >>= 16;
3940 	    code2thumb(thumb.s[0], thumb.s[1], u.s[2], u.s[3]);
3941 	    assert((thumb.i & 0xfbf00000) == THUMB2_MOVTI);
3942 	    thumb.i = ((thumb.i & 0xfbf00f00) |
3943 		       ( (label & 0x0000f000) <<  4) |
3944 		       ( (label & 0x00000800) << 15) |
3945 		       ( (label & 0x00000700) <<  4) |
3946 		       (  label & 0x000000ff));
3947 	    thumb2code(thumb.s[0], thumb.s[1], u.s[2], u.s[3]);
3948 	}
3949 	else
3950 	    u.i[0] = label;
3951     }
3952     else
3953 	assert(!"handled patch");
3954 }
3955 #endif
3956