1 /*
2 * Copyright (C) 2012-2019 Free Software Foundation, Inc.
3 *
4 * This file is part of GNU lightning.
5 *
6 * GNU lightning is free software; you can redistribute it and/or modify it
7 * under the terms of the GNU Lesser General Public License as published
8 * by the Free Software Foundation; either version 3, or (at your option)
9 * any later version.
10 *
11 * GNU lightning is distributed in the hope that it will be useful, but
12 * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
13 * or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public
14 * License for more details.
15 *
16 * Authors:
17 * Paulo Cesar Pereira de Andrade
18 */
19
20 #if PROTO
/* Generic load/store names used in this file expand to the `_i` variants.
 * (Presumably the word-sized integer forms; their definitions are outside
 * this section -- confirm there.) */
21 # define stxi(i0,r0,r1) stxi_i(i0,r0,r1)
22 # define ldxi(r0,r1,i0) ldxi_i(r0,r1,i0)
23 # define ldr(r0,r1) ldr_i(r0,r1)
/*
 * Range predicates: evaluate to non-zero when d lies in
 *   _s20P: [-0x80000,  0x7ffff]   (fits a signed 20-bit field)
 *   _s24P: [-0x800000, 0x7fffff]  (fits a signed 24-bit field)
 *
 * The argument is parenthesized at every use so that an expression such as
 * `a & b` is compared as a whole instead of being re-associated with `<=`.
 * Note that d is evaluated twice; do not pass expressions with side effects.
 */
# define _s20P(d) ((d) >= -(int)0x80000 && (d) <= 0x7ffff)
# define _s24P(d) ((d) >= -(int)0x800000 && (d) <= 0x7fffff)
/* Bit-field helpers: _uN(v) keeps only the low N bits of v (N = 3, 4, 5, 8,
 * 12, 13, 16, 24). They truncate silently; no range check is performed. */
26 # define _u3(v) ((v) & 0x7)
27 # define _u4(v) ((v) & 0xf)
28 # define _u5(v) ((v) & 0x1f)
29 # define _u8(v) ((v) & 0xff)
30 # define _u12(v) ((v) & 0xfff)
31 # define _u13(v) ((v) & 0x1fff)
32 # define _u16(v) ((v) & 0xffff)
33 # define _u24(v) ((v) & 0xffffff)
/* Predicates over the global jit_cpu description and the per-compilation
 * state reached through _jitc. */
34 # define jit_thumb_p() jit_cpu.thumb
35 # define jit_no_set_flags() _jitc->no_set_flags
36 # define jit_armv5_p() (jit_cpu.version >= 5)
/* True for any version above 5, or for version 5 when jit_cpu.extend is set. */
37 # define jit_armv5e_p() (jit_cpu.version > 5 || (jit_cpu.version == 5 && jit_cpu.extend))
38 # define jit_armv6_p() (jit_cpu.version >= 6)
/* Hard-wired to 0 in this file. */
39 # define jit_armv7r_p() 0
/* Fixed frame size constant (presumably in bytes -- confirm at use sites). */
40 # define stack_framesize 48
/* External division helpers, signed and unsigned.
 * NOTE(review): by name these are the ARM EABI run-time divide-with-remainder
 * routines; the prototypes here expose only a single int/unsigned result --
 * confirm how the call sites consume them. */
41 extern int __aeabi_idivmod(int, int);
42 extern unsigned __aeabi_uidivmod(unsigned, unsigned);
/* Register numbers 0..15 as used in instruction register fields. */
43 # define _R0_REGNO 0x00
44 # define _R1_REGNO 0x01
45 # define _R2_REGNO 0x02
46 # define _R3_REGNO 0x03
47 # define _R4_REGNO 0x04
48 # define _R5_REGNO 0x05
49 # define _R6_REGNO 0x06
50 # define _R7_REGNO 0x07
51 # define _R8_REGNO 0x08
52 # define _R9_REGNO 0x09
53 # define _R10_REGNO 0x0a
54 # define _R11_REGNO 0x0b
55 # define _R12_REGNO 0x0c
56 # define _R13_REGNO 0x0d
57 # define _R14_REGNO 0x0e
58 # define _R15_REGNO 0x0f
/* Role aliases: FP = r11, SP = r13, LR = r14, PC = r15. */
59 # define _FP_REGNO _R11_REGNO
60 # define _SP_REGNO _R13_REGNO
61 # define _LR_REGNO _R14_REGNO
62 # define _PC_REGNO _R15_REGNO
/* Condition-code values, stored pre-shifted in the top four bits (31..28) of
 * a 32-bit word. The trailing comment on each line gives the flag state the
 * condition tests. CS and CC are aliases of HS and LO respectively. */
63 # define ARM_CC_EQ 0x00000000 /* Z=1 */
64 # define ARM_CC_NE 0x10000000 /* Z=0 */
65 # define ARM_CC_HS 0x20000000 /* C=1 */
66 # define ARM_CC_CS ARM_CC_HS
67 # define ARM_CC_LO 0x30000000 /* C=0 */
68 # define ARM_CC_CC ARM_CC_LO
69 # define ARM_CC_MI 0x40000000 /* N=1 */
70 # define ARM_CC_PL 0x50000000 /* N=0 */
71 # define ARM_CC_VS 0x60000000 /* V=1 */
72 # define ARM_CC_VC 0x70000000 /* V=0 */
73 # define ARM_CC_HI 0x80000000 /* C=1 && Z=0 */
74 # define ARM_CC_LS 0x90000000 /* C=0 || Z=1 */
75 # define ARM_CC_GE 0xa0000000 /* N=V */
76 # define ARM_CC_LT 0xb0000000 /* N!=V */
77 # define ARM_CC_GT 0xc0000000 /* Z=0 && N=V */
78 # define ARM_CC_LE 0xd0000000 /* Z=1 || N!=V */
79 # define ARM_CC_AL 0xe0000000 /* always */
80 # define ARM_CC_NV 0xf0000000 /* reserved */
/* Selector indices 0..14 naming the IT-block shapes (IT, ITT, ITE, ...).
 * Each is passed as the `it` argument of tcit() by the IT*() wrapper macros
 * later in this file; the value is an index, not an instruction encoding. */
81 # define THUMB2_IT 0
82 # define THUMB2_ITT 1
83 # define THUMB2_ITE 2
84 # define THUMB2_ITTT 3
85 # define THUMB2_ITET 4
86 # define THUMB2_ITTE 5
87 # define THUMB2_ITEE 6
88 # define THUMB2_ITTTT 7
89 # define THUMB2_ITETT 8
90 # define THUMB2_ITTET 9
91 # define THUMB2_ITEET 10
92 # define THUMB2_ITTTE 11
93 # define THUMB2_ITETE 12
94 # define THUMB2_ITTEE 13
95 # define THUMB2_ITEEE 14
/* Base opcode bit patterns, grouped by mnemonic. Naming convention visible
 * in the values: ARM_* and THUMB2_* are 32-bit patterns, THUMB_* fit in 16
 * bits. Register and immediate fields are OR-ed in by the instruction macros
 * and emitter functions. */
/* MOV / MOVW / MOVT */
96 # define ARM_MOV 0x01a00000
97 # define THUMB_MOV 0x4600
98 # define ARM_MOVWI 0x03000000 /* v6t2, v7 */
99 # define THUMB_MOVI 0x2000
100 # define THUMB2_MOVI 0xf0400000
101 # define THUMB2_MOVWI 0xf2400000
102 # define ARM_MOVTI 0x03400000
103 # define THUMB2_MOVTI 0xf2c00000
/* MVN */
104 # define ARM_MVN 0x01e00000
105 # define THUMB_MVN 0x43c0
106 # define THUMB2_MVN 0xea600000
107 # define THUMB2_MVNI 0xf0600000
/* Modifier bits OR-ed into an opcode (also combined with THUMB2_* opcodes by
 * the T2_*S macros in this file). */
108 # define ARM_I 0x02000000 /* immediate */
109 # define ARM_S 0x00100000 /* set flags */
/* ADD / ADC */
110 # define ARM_ADD 0x00800000
111 # define THUMB_ADD 0x1800
112 # define THUMB_ADDX 0x4400
113 # define THUMB2_ADD 0xeb000000
114 # define THUMB_ADDI3 0x1c00
115 # define THUMB_ADDI8 0x3000
116 # define THUMB2_ADDI 0xf1000000
117 # define THUMB2_ADDWI 0xf2000000
118 # define ARM_ADC 0x00a00000
119 # define THUMB_ADC 0x4140
120 # define THUMB2_ADC 0xeb400000
121 # define THUMB2_ADCI 0xf1400000
/* SUB / SBC */
122 # define ARM_SUB 0x00400000
123 # define THUMB_SUB 0x1a00
124 # define THUMB2_SUB 0xeba00000
125 # define THUMB_SUBI3 0x1e00
126 # define THUMB_SUBI8 0x3800
127 # define THUMB2_SUBI 0xf1a00000
128 # define THUMB2_SUBWI 0xf2a00000
129 # define ARM_SBC 0x00c00000
130 # define THUMB_SBC 0x4180
131 # define THUMB2_SBC 0xeb600000
132 # define THUMB2_SBCI 0xf1600000
/*
 * RSB (reverse subtract) base opcodes.
 *
 * THUMB2_RSB is the 32-bit Thumb-2 register form. The T2_RSB() instruction
 * macro in this file expands to it, so it must be defined here; without it
 * any use of T2_RSB() fails to compile. Its operation field matches
 * THUMB2_RSBI (bits 24..21 = 1110), in the same way THUMB2_SUB/THUMB2_SUBI
 * and THUMB2_SBC/THUMB2_SBCI pair up.
 */
# define ARM_RSB 0x00600000
# define THUMB2_RSB 0xebc00000
# define THUMB_RSBI 0x4240
# define THUMB2_RSBI 0xf1c00000
/* Base opcode bit patterns (continued): multiply/divide, logical, ARMv6
 * byte-reverse and extend, shifts, and compare/test. Same convention as the
 * other opcode tables: ARM_* / THUMB2_* are 32-bit, THUMB_* are 16-bit. */
/* MUL / UMULL / SMULL / SDIV / UDIV */
136 # define ARM_MUL 0x00000090
137 # define THUMB_MUL 0x4340
138 # define THUMB2_MUL 0xfb00f000
139 # define ARM_UMULL 0x00800090
140 # define THUMB2_UMULL 0xfba00000
141 # define ARM_SMULL 0x00c00090
142 # define THUMB2_SMULL 0xfb800000
143 # define THUMB2_SDIV 0xfb90f0f0
144 # define THUMB2_UDIV 0xfbb0f0f0
/* AND / BIC / ORR / EOR */
145 # define ARM_AND 0x00000000
146 # define THUMB_AND 0x4000
147 # define THUMB2_AND 0xea000000
148 # define THUMB2_ANDI 0xf0000000
149 # define ARM_BIC 0x01c00000
150 # define THUMB2_BIC 0xea200000
151 # define THUMB2_BICI 0xf0200000
152 # define ARM_ORR 0x01800000
153 # define THUMB_ORR 0x4300
154 # define THUMB2_ORR 0xea400000
155 # define THUMB2_ORRI 0xf0400000
156 # define ARM_EOR 0x00200000
157 # define THUMB_EOR 0x4040
158 # define THUMB2_EOR 0xea800000
159 # define THUMB2_EORI 0xf0800000
160 /* >> ARMv6* */
161 # define ARM_REV 0x06bf0f30
162 # define THUMB_REV 0xba00
163 # define THUMB2_REV 0xfa90f080
164 # define ARM_REV16 0x06bf0fb0
165 # define THUMB_REV16 0xba40
166 # define THUMB2_REV16 0xfa90f090
167 # define ARM_SXTB 0x06af0070
168 # define THUMB_SXTB 0xb240
169 # define THUMB2_SXTB 0xfa40f080
170 # define ARM_UXTB 0x06ef0070
171 # define THUMB_UXTB 0xb2c0
172 # define THUMB2_UXTB 0xfa50f080
173 # define ARM_SXTH 0x06bf0070
174 # define THUMB_SXTH 0xb200
175 # define THUMB2_SXTH 0xfa00f080
176 # define ARM_UXTH 0x06ff0070
177 # define THUMB_UXTH 0xb280
178 # define THUMB2_UXTH 0xfa10f080
179 # define ARM_XTR8 0x00000400 /* ?xt? rotate 8 bits */
180 # define ARM_XTR16 0x00000800 /* ?xt? rotate 16 bits */
181 # define ARM_XTR24 0x00000c00 /* ?xt? rotate 24 bits */
182 /* << ARMv6* */
/* Shifts. ARM_SHIFT has the same value as ARM_MOV; the ARM_LSL/LSR/ASR/ROR
 * values select the shift type and ARM_R selects a register-held amount. */
183 # define ARM_SHIFT 0x01a00000
184 # define ARM_R 0x00000010 /* register shift */
185 # define ARM_LSL 0x00000000
186 # define THUMB_LSL 0x4080
187 # define THUMB2_LSL 0xfa00f000
188 # define THUMB_LSLI 0x0000
189 # define THUMB2_LSLI 0xea4f0000
190 # define ARM_LSR 0x00000020
191 # define THUMB_LSR 0x40c0
192 # define THUMB2_LSR 0xfa20f000
193 # define THUMB_LSRI 0x0800
194 # define THUMB2_LSRI 0xea4f0010
195 # define ARM_ASR 0x00000040
196 # define THUMB_ASR 0x4100
197 # define THUMB2_ASR 0xfa40f000
198 # define THUMB_ASRI 0x1000
199 # define THUMB2_ASRI 0xea4f0020
200 # define ARM_ROR 0x00000060
/* CMP / CMN / TST / TEQ */
201 # define ARM_CMP 0x01500000
202 # define THUMB_CMP 0x4280
203 # define THUMB_CMPX 0x4500
204 # define THUMB2_CMP 0xebb00000
205 # define THUMB_CMPI 0x2800
206 # define THUMB2_CMPI 0xf1b00000
207 # define ARM_CMN 0x01700000
208 # define THUMB_CMN 0x42c0
209 # define THUMB2_CMN 0xeb100000
210 # define THUMB2_CMNI 0xf1100000
211 # define ARM_TST 0x01100000
212 # define THUMB_TST 0x4200
213 # define THUMB2_TST 0xea100000
214 # define THUMB2_TSTI 0xf0100000
215 # define ARM_TEQ 0x01300000
/* Base opcode patterns for branch instructions: register-indirect (BX/BLX),
 * immediate branch (B, conditional CC_B), and branch-with-link immediates
 * (BLI/BLXI). */
216 /* branch */
217 # define ARM_BX 0x012fff10
218 # define ARM_BLX 0x012fff30
219 # define THUMB_BLX 0x4780
220 # define ARM_BLXI 0xfa000000
221 # define THUMB2_BLXI 0xf000c000
222 # define ARM_B 0x0a000000
223 # define THUMB_CC_B 0xd000
224 # define THUMB_B 0xe000
225 # define THUMB2_CC_B 0xf0008000
226 # define THUMB2_B 0xf0009000
227 # define ARM_BLI 0x0b000000
228 # define THUMB2_BLI 0xf000d000
/* Base opcode patterns for single-register loads and stores.
 * Suffix convention in the names: no suffix = register offset, I = immediate
 * offset, WI = Thumb-2 wide-immediate form (emitted through torri12 by the
 * T2_*WI macros), ISP = 16-bit Thumb form with its own opcode (by name,
 * SP-relative -- confirm).
 * ARM_P and the THUMB2_P/U/W values are modifier bits OR-ed into the opcode
 * by the instruction macros. */
229 /* ldr/str */
230 # define ARM_P 0x00800000 /* positive offset */
231 # define THUMB2_P 0x00000400
232 # define THUMB2_U 0x00000200
233 # define THUMB2_W 0x00000100
/* signed byte load */
234 # define ARM_LDRSB 0x011000d0
235 # define THUMB_LDRSB 0x5600
236 # define THUMB2_LDRSB 0xf9100000
237 # define ARM_LDRSBI 0x015000d0
238 # define THUMB2_LDRSBI 0xf9100c00
239 # define THUMB2_LDRSBWI 0xf9900000
/* unsigned byte load */
240 # define ARM_LDRB 0x07500000
241 # define THUMB_LDRB 0x5c00
242 # define THUMB2_LDRB 0xf8100000
243 # define ARM_LDRBI 0x05500000
244 # define THUMB_LDRBI 0x7800
245 # define THUMB2_LDRBI 0xf8100c00
246 # define THUMB2_LDRBWI 0xf8900000
/* signed halfword load */
247 # define ARM_LDRSH 0x011000f0
248 # define THUMB_LDRSH 0x5e00
249 # define THUMB2_LDRSH 0xf9300000
250 # define ARM_LDRSHI 0x015000f0
251 # define THUMB2_LDRSHI 0xf9300c00
252 # define THUMB2_LDRSHWI 0xf9b00000
/* unsigned halfword load */
253 # define ARM_LDRH 0x011000b0
254 # define THUMB_LDRH 0x5a00
255 # define THUMB2_LDRH 0xf8300000
256 # define ARM_LDRHI 0x015000b0
257 # define THUMB_LDRHI 0x8800
258 # define THUMB2_LDRHI 0xf8300c00
259 # define THUMB2_LDRHWI 0xf8b00000
/* word load */
260 # define ARM_LDR 0x07100000
261 # define THUMB_LDR 0x5800
262 # define THUMB2_LDR 0xf8500000
263 # define ARM_LDRI 0x05100000
264 # define THUMB_LDRI 0x6800
265 # define THUMB_LDRISP 0x9800
266 # define THUMB2_LDRI 0xf8500c00
267 # define THUMB2_LDRWI 0xf8d00000
/* doubleword load */
268 # define ARM_LDRD 0x010000d0
269 # define ARM_LDRDI 0x014000d0
270 # define THUMB2_LDRDI 0xe8500000
/* byte store */
271 # define ARM_STRB 0x07400000
272 # define THUMB_STRB 0x5400
273 # define THUMB2_STRB 0xf8000000
274 # define ARM_STRBI 0x05400000
275 # define THUMB_STRBI 0x7000
276 # define THUMB2_STRBI 0xf8000c00
277 # define THUMB2_STRBWI 0xf8800000
/* halfword store */
278 # define ARM_STRH 0x010000b0
279 # define THUMB_STRH 0x5200
280 # define THUMB2_STRH 0xf8200000
281 # define ARM_STRHI 0x014000b0
282 # define THUMB_STRHI 0x8000
283 # define THUMB2_STRHI 0xf8200c00
284 # define THUMB2_STRHWI 0xf8a00000
/* word store */
285 # define ARM_STR 0x07000000
286 # define THUMB_STR 0x5000
287 # define THUMB2_STR 0xf8400000
288 # define ARM_STRI 0x05000000
289 # define THUMB_STRI 0x6000
290 # define THUMB2_STRWI 0xf8c00000
291 # define THUMB_STRISP 0x9000
292 # define THUMB2_STRI 0xf8400c00
/* doubleword store */
293 # define ARM_STRD 0x010000f0
294 # define ARM_STRDI 0x014000f0
295 # define THUMB2_STRDI 0xe8400000
/* Load/store-multiple opcodes. ARM_M is the base pattern; the ARM_M_* values
 * are option bits whose meaning is given by the comment on each line. The
 * THUMB2_LDM_* values are single-bit masks (NOTE(review): by name W is
 * write-back and P/M are the PC/LR bits of the register list -- confirm
 * against the emitter that consumes them). */
296 /* ldm/stm */
297 # define ARM_M 0x08000000
298 # define ARM_M_L 0x00100000 /* load; store if not set */
299 # define ARM_M_I 0x00800000 /* inc; dec if not set */
300 # define ARM_M_B 0x01000000 /* before; after if not set */
301 # define ARM_M_U 0x00200000 /* update Rn */
302 # define THUMB2_LDM_W 0x00200000
303 # define THUMB2_LDM_P 0x00008000
304 # define THUMB2_LDM_M 0x00004000
305 # define THUMB_LDMIA 0xc800
306 # define THUMB2_LDMIA 0xe8900000
307 # define THUMB2_LDMB 0xe9100000
308 # define THUMB_PUSH 0xb400
309 # define THUMB2_PUSH 0xe92d0000
310 # define THUMB_POP 0xbc00
311 # define THUMB2_POP 0xe8bd0000
/* Raw code emission. Both macros store `i` at the current output position
 * and advance it: ii() goes through the pc.ui view, is() through the pc.us
 * view (presumably unsigned int and unsigned short pointers -- the union is
 * declared outside this section). The expansions are bare assignment
 * expressions, so use them only as statements. */
312 # define ii(i) *_jit->pc.ui++ = i
313 # define is(i) *_jit->pc.us++ = i
/* iss(i, j) emits two halfwords; the order in which they are written depends
 * on the host byte order: j then i on little-endian, i then j otherwise.
 * code2thumb()/thumb2code() copy a (c0, c1) pair to/from a (t0, t1) pair,
 * swapping the two on little-endian and copying straight through otherwise. */
314 # if __BYTE_ORDER == __LITTLE_ENDIAN
315 # define iss(i, j) do { is(j); is(i); } while (0)
316 # define code2thumb(t0, t1, c0, c1) do { t1 = c0; t0 = c1; } while (0)
317 # define thumb2code(t0, t1, c0, c1) do { c0 = t1; c1 = t0; } while (0)
318 # else
319 # define iss(i, j) do { is(i); is(j); } while (0)
320 # define code2thumb(t0, t1, c0, c1) do { t0 = c0; t1 = c1; } while (0)
321 # define thumb2code(t0, t1, c0, c1) do { c0 = t0; c1 = t1; } while (0)
322 # endif
/* Immediate/offset encoders; each takes a value and returns an int. Their
 * definitions are outside this section.
 * NOTE(review): by name they convert a value to the instruction's immediate
 * or branch-displacement field; the failure convention (e.g. a negative
 * return when not encodable) is not visible here -- confirm at the
 * definitions. encode_thumb_shift is tagged maybe_unused (a macro defined
 * elsewhere). */
323 static int encode_arm_immediate(unsigned int v);
324 static int encode_thumb_immediate(unsigned int v);
325 static int encode_thumb_word_immediate(unsigned int v);
326 static int encode_thumb_jump(int v);
327 static int encode_thumb_cc_jump(int v);
328 static int encode_thumb_shift(int v, int type) maybe_unused;
/* Low-level instruction emitters. Each is a static function whose first
 * parameter is the jit_state_t*, paired with a wrapper macro of the same
 * name (without the leading underscore) that passes the in-scope `_jit`.
 * Macro parameter names document the operand roles: cc = condition code,
 * o = base opcode, rn/rd/rm/rt = register numbers, im = immediate.
 * Names starting with `c` take a condition code; names starting with `t` do
 * not. Prototypes tagged maybe_unused (a macro defined elsewhere) may have no
 * caller in some configurations. */
329 # define corrr(cc,o,rn,rd,rm) _corrr(_jit,cc,o,rn,rd,rm)
330 static void _corrr(jit_state_t*,int,int,int,int,int);
331 # define corri(cc,o,rn,rd,im) _corri(_jit,cc,o,rn,rd,im)
332 static void _corri(jit_state_t*,int,int,int,int,int);
333 #define corri8(cc,o,rn,rt,im) _corri8(_jit,cc,o,rn,rt,im)
334 static void _corri8(jit_state_t*,int,int,int,int,int);
335 # define torrr(o,rn,rd,rm) _torrr(_jit,o,rn,rd,rm)
336 static void _torrr(jit_state_t*,int,int,int,int);
337 # define torrrs(o,rn,rd,rm,im) _torrrs(_jit,o,rn,rd,rm,im)
338 static void _torrrs(jit_state_t*,int,int,int,int,int) maybe_unused;
339 # define torxr(o,rn,rt,rm) _torxr(_jit,o,rn,rt,rm)
340 static void _torxr(jit_state_t*,int,int,int,int);
341 # define torrrr(o,rn,rl,rh,rm) _torrrr(_jit,o,rn,rl,rh,rm)
342 static void _torrrr(jit_state_t*,int,int,int,int,int) maybe_unused;
343 # define torrri8(o,rn,rt,rt2,im) _torrri8(_jit,o,rn,rt,rt2,im)
344 static void _torrri8(jit_state_t*,int,int,int,int,int) maybe_unused;
345 # define coriw(cc,o,rd,im) _coriw(_jit,cc,o,rd,im)
346 static void _coriw(jit_state_t*,int,int,int,int);
/* NOTE(review): this wrapper names its parameters (o,rd,rn,im), but the
 * instruction macros in this file call torri(o,rn,rd,im). Arguments are
 * forwarded positionally, so only the names differ -- confirm the order
 * against the _torri definition. */
347 # define torri(o,rd,rn,im) _torri(_jit,o,rd,rn,im)
348 static void _torri(jit_state_t*,int,int,int,int);
349 # define torri8(o,rn,rt,im) _torri8(_jit,o,rn,rt,im)
350 static void _torri8(jit_state_t*,int,int,int,int);
351 # define torri12(o,rn,rt,im) _torri12(_jit,o,rn,rt,im)
352 static void _torri12(jit_state_t*,int,int,int,int);
353 # define tshift(o,rd,rm,im) _tshift(_jit,o,rd,rm,im)
354 static void _tshift(jit_state_t*,int,int,int,int);
355 # define toriw(o,rd,im) _toriw(_jit,o,rd,im)
356 static void _toriw(jit_state_t*,int,int,int);
357 # define tc8(cc,im) _tc8(_jit,cc,im)
358 static void _tc8(jit_state_t*,int,int) maybe_unused;
359 # define t11(im) _t11(_jit,im)
360 static void _t11(jit_state_t*,int);
361 # define tcb(cc,im) _tcb(_jit,cc,im)
362 static void _tcb(jit_state_t*,int,int);
363 # define blxi(im) _blxi(_jit,im)
364 static void _blxi(jit_state_t*,int) maybe_unused;
365 # define tb(o,im) _tb(_jit,o,im)
366 static void _tb(jit_state_t*,int,int);
367 # define corrrr(cc,o,rh,rl,rm,rn) _corrrr(_jit,cc,o,rh,rl,rm,rn)
368 static void _corrrr(jit_state_t*,int,int,int,int,int,int);
369 # define corrrs(cc,o,rn,rd,rm,im) _corrrs(_jit,cc,o,rn,rd,rm,im)
370 static void _corrrs(jit_state_t*,int,int,int,int,int,int);
371 # define cshift(cc,o,rd,rm,rn,im) _cshift(_jit,cc,o,rd,rm,rn,im)
372 static void _cshift(jit_state_t*,int,int,int,int,int,int);
373 # define cb(cc,o,im) _cb(_jit,cc,o,im)
374 static void _cb(jit_state_t*,int,int,int);
375 # define cbx(cc,o,rm) _cbx(_jit,cc,o,rm)
376 static void _cbx(jit_state_t*,int,int,int);
377 # define corl(cc,o,r0,i0) _corl(_jit,cc,o,r0,i0)
378 static void _corl(jit_state_t*,int,int,int,int);
379 # define c6orr(cc,o,r0,r1) _c6orr(_jit,cc,o,r0,r1)
380 static void _c6orr(jit_state_t*,int,int,int,int);
/* tcit takes the condition as unsigned int (the ARM_CC_* values use bit 31)
 * plus one of the THUMB2_IT* selector indices. */
381 # define tcit(cc,it) _tcit(_jit,cc,it)
382 static void _tcit(jit_state_t*,unsigned int,int);
/* One wrapper per IT-block shape: each calls tcit() with the given condition
 * and the matching THUMB2_IT* selector. */
383 # define IT(cc) tcit(cc,THUMB2_IT)
384 # define ITT(cc) tcit(cc,THUMB2_ITT)
385 # define ITE(cc) tcit(cc,THUMB2_ITE)
386 # define ITTT(cc) tcit(cc,THUMB2_ITTT)
387 # define ITTE(cc) tcit(cc,THUMB2_ITTE)
388 # define ITET(cc) tcit(cc,THUMB2_ITET)
389 # define ITEE(cc) tcit(cc,THUMB2_ITEE)
390 # define ITTTT(cc) tcit(cc,THUMB2_ITTTT)
391 # define ITETT(cc) tcit(cc,THUMB2_ITETT)
392 # define ITTET(cc) tcit(cc,THUMB2_ITTET)
393 # define ITEET(cc) tcit(cc,THUMB2_ITEET)
394 # define ITTTE(cc) tcit(cc,THUMB2_ITTTE)
395 # define ITETE(cc) tcit(cc,THUMB2_ITETE)
396 # define ITTEE(cc) tcit(cc,THUMB2_ITTEE)
397 # define ITEEE(cc) tcit(cc,THUMB2_ITEEE)
/* Two more emitters following the same wrapper-plus-static-function pattern.
 * NOTE(review): by name tpp serves the push/pop opcodes and torl a
 * register-list form -- confirm at their definitions. torl is tagged
 * maybe_unused. */
398 # define tpp(o,im) _tpp(_jit,o,im)
399 static void _tpp(jit_state_t*,int,int);
400 # define torl(o,rn,im) _torl(_jit,o,rn,im)
401 static void _torl(jit_state_t*,int,int,int) maybe_unused;
/* Register move. CC_MOV takes an explicit condition and passes 0 in the rn
 * position of corrr(); MOV is CC_MOV with ARM_CC_AL (always). */
402 # define CC_MOV(cc,rd,rm) corrr(cc,ARM_MOV,0,rd,rm)
403 # define MOV(rd,rm) CC_MOV(ARM_CC_AL,rd,rm)
/* 16-bit Thumb register move. Bit 3 of rd is placed at bit 7 of the halfword,
 * the low three bits of rd at bits 2..0, and the four bits of rm at bits
 * 6..3. Both uses of rd are parenthesized so an expression argument is
 * masked as a whole. */
# define T1_MOV(rd,rm) is(THUMB_MOV|((_u4(rd)&8)<<4)|(_u4(rm)<<3)|((rd)&7))
/* Instruction macros. Pattern used throughout:
 *   CC_X(cc,...)  form with an explicit condition, via a c* emitter
 *   X(...)        CC_X with ARM_CC_AL
 *   T1_X(...)     16-bit Thumb form, emitted directly as one halfword via is()
 *   T2_X(...)     32-bit Thumb-2 form, via a t* emitter
 * T1_* forms mask register operands with _u3()/_u4(), i.e. they silently
 * truncate register numbers that do not fit the field. */
/* T2_MOV is expressed as T2_ORR with _R15_REGNO in the rn position. */
405 # define T2_MOV(rd,rm) T2_ORR(rd,_R15_REGNO,rm)
/* move immediate / MOVW / MOVT */
406 # define CC_MOVI(cc,rd,im) corri(cc,ARM_MOV|ARM_I,0,rd,im)
407 # define MOVI(rd,im) CC_MOVI(ARM_CC_AL,rd,im)
408 # define CC_MOVWI(cc,rd,im) coriw(cc,ARM_MOVWI,rd,im)
409 # define MOVWI(rd,im) CC_MOVWI(ARM_CC_AL,rd,im)
410 # define T1_MOVI(rd,im) is(THUMB_MOVI|(_u3(rd)<<8)|_u8(im))
411 # define T2_MOVI(rd,im) torri(THUMB2_MOVI,_R15_REGNO,rd,im)
412 # define T2_MOVWI(rd,im) toriw(THUMB2_MOVWI,rd,im)
413 # define CC_MOVTI(cc,rd,im) coriw(cc,ARM_MOVTI,rd,im)
414 # define MOVTI(rd,im) CC_MOVTI(ARM_CC_AL,rd,im)
415 # define T2_MOVTI(rd,im) toriw(THUMB2_MOVTI,rd,im)
/* bitwise NOT (MVN); the NOT names are aliases of the MVN macros */
416 # define CC_MVN(cc,rd,rm) corrr(cc,ARM_MVN,0,rd,rm)
417 # define MVN(rd,rm) CC_MVN(ARM_CC_AL,rd,rm)
418 # define T1_MVN(rd,rm) is(THUMB_MVN|(_u3(rm)<<3)|_u3(rd))
419 # define T2_MVN(rd,rm) torrr(THUMB2_MVN,_R15_REGNO,rd,rm)
420 # define CC_MVNI(cc,rd,im) corri(cc,ARM_MVN|ARM_I,0,rd,im)
421 # define MVNI(rd,im) CC_MVNI(ARM_CC_AL,rd,im)
422 # define T2_MVNI(rd,im) torri(THUMB2_MVNI,_R15_REGNO,rd,im)
423 # define CC_NOT(cc,rd,rm) CC_MVN(cc,rd,rm)
424 # define NOT(rd,rm) CC_NOT(ARM_CC_AL,rd,rm)
425 # define T1_NOT(rd,rm) T1_MVN(rd,rm)
426 # define T2_NOT(rd,rm) T2_MVN(rd,rm)
/* NOP is encoded as MOV r0, r0; T1_NOP emits the fixed halfword 0xbf00. */
427 # define NOP() MOV(_R0_REGNO, _R0_REGNO)
428 # define T1_NOP() is(0xbf00)
/* ADD, register forms */
429 # define CC_ADD(cc,rd,rn,rm) corrr(cc,ARM_ADD,rn,rd,rm)
430 # define ADD(rd,rn,rm) CC_ADD(ARM_CC_AL,rd,rn,rm)
431 # define T1_ADD(rd,rn,rm) is(THUMB_ADD|(_u3(rm)<<6)|(_u3(rn)<<3)|_u3(rd))
/* 16-bit Thumb ADD where rdn is both source and destination. Bit 3 of rdn is
 * placed at bit 7 of the halfword, the low three bits of rdn at bits 2..0,
 * and the four bits of rm at bits 6..3. Both uses of rdn are parenthesized so
 * an expression argument is masked as a whole. */
# define T1_ADDX(rdn,rm) is(THUMB_ADDX|((_u4(rdn)&8)<<4)|(_u4(rm)<<3)|((rdn)&7))
/* Arithmetic and logical instruction macros (ADD .. AND).
 * Same naming pattern as the rest of the file: CC_X takes a condition, X uses
 * ARM_CC_AL, T1_X emits one 16-bit halfword via is(), T2_X goes through a
 * t* emitter. An `S` suffix ORs ARM_S (set flags) into the opcode; an `I`
 * suffix takes an immediate and, in the ARM forms, ORs in ARM_I. */
/* ADD (continued) and ADC */
433 # define T2_ADD(rd,rn,rm) torrr(THUMB2_ADD,rn,rd,rm)
434 # define CC_ADDI(cc,rd,rn,im) corri(cc,ARM_ADD|ARM_I,rn,rd,im)
435 # define ADDI(rd,rn,im) CC_ADDI(ARM_CC_AL,rd,rn,im)
436 # define T1_ADDI3(rd,rn,im) is(THUMB_ADDI3|(_u3(im)<<6)|(_u3(rn)<<3)|_u3(rd))
437 # define T1_ADDI8(rdn,im) is(THUMB_ADDI8|(_u3(rdn)<<8)|_u8(im))
438 # define T2_ADDI(rd,rn,im) torri(THUMB2_ADDI,rn,rd,im)
439 # define T2_ADDWI(rd,rn,im) torri(THUMB2_ADDWI,rn,rd,im)
440 # define CC_ADDS(cc,rd,rn,rm) corrr(cc,ARM_ADD|ARM_S,rn,rd,rm)
441 # define ADDS(rd,rn,rm) CC_ADDS(ARM_CC_AL,rd,rn,rm)
442 # define T2_ADDS(rd,rn,rm) torrr(THUMB2_ADD|ARM_S,rn,rd,rm)
443 # define ADDSI(rd,rn,im) corri(ARM_CC_AL,ARM_ADD|ARM_S|ARM_I,rn,rd,im)
444 # define T2_ADDSI(rd,rn,im) torri(THUMB2_ADDI|ARM_S,rn,rd,im)
445 # define CC_ADC(cc,rd,rn,rm) corrr(cc,ARM_ADC,rn,rd,rm)
446 # define ADC(rd,rn,rm) CC_ADC(ARM_CC_AL,rd,rn,rm)
447 # define T1_ADC(rdn,rm) is(THUMB_ADC|(_u3(rm)<<3)|_u3(rdn))
448 # define T2_ADC(rd,rn,rm) torrr(THUMB2_ADC,rn,rd,rm)
449 # define CC_ADCI(cc,rd,rn,im) corri(cc,ARM_ADC|ARM_I,rn,rd,im)
450 # define ADCI(rd,rn,im) CC_ADCI(ARM_CC_AL,rd,rn,im)
451 # define T2_ADCI(rd,rn,im) torri(THUMB2_ADCI,rn,rd,im)
452 # define CC_ADCS(cc,rd,rn,rm) corrr(cc,ARM_ADC|ARM_S,rn,rd,rm)
453 # define ADCS(rd,rn,rm) CC_ADCS(ARM_CC_AL,rd,rn,rm)
454 # define T2_ADCS(rd,rn,rm) torrr(THUMB2_ADC|ARM_S,rn,rd,rm)
455 # define CC_ADCSI(cc,rd,rn,im) corri(cc,ARM_ADC|ARM_S|ARM_I,rn,rd,im)
456 # define ADCSI(rd,rn,im) CC_ADCSI(ARM_CC_AL,rd,rn,im)
457 # define T2_ADCSI(rd,rn,im) torri(THUMB2_ADCI|ARM_S,rn,rd,im)
/* SUB and SBC */
458 # define CC_SUB(cc,rd,rn,rm) corrr(cc,ARM_SUB,rn,rd,rm)
459 # define SUB(rd,rn,rm) CC_SUB(ARM_CC_AL,rd,rn,rm)
460 # define T1_SUB(rd,rn,rm) is(THUMB_SUB|(_u3(rm)<<6)|(_u3(rn)<<3)|_u3(rd))
461 # define T2_SUB(rd,rn,rm) torrr(THUMB2_SUB,rn,rd,rm)
462 # define CC_SUBI(cc,rd,rn,im) corri(cc,ARM_SUB|ARM_I,rn,rd,im)
463 # define SUBI(rd,rn,im) CC_SUBI(ARM_CC_AL,rd,rn,im)
464 # define T1_SUBI3(rd,rn,im) is(THUMB_SUBI3|(_u3(im)<<6)|(_u3(rn)<<3)|_u3(rd))
465 # define T1_SUBI8(rdn,im) is(THUMB_SUBI8|(_u3(rdn)<<8)|_u8(im))
466 # define T2_SUBI(rd,rn,im) torri(THUMB2_SUBI,rn,rd,im)
467 # define T2_SUBWI(rd,rn,im) torri(THUMB2_SUBWI,rn,rd,im)
468 # define CC_SUBS(cc,rd,rn,rm) corrr(cc,ARM_SUB|ARM_S,rn,rd,rm)
469 # define SUBS(rd,rn,rm) CC_SUBS(ARM_CC_AL,rd,rn,rm)
470 # define T2_SUBS(rd,rn,rm) torrr(THUMB2_SUB|ARM_S,rn,rd,rm)
471 # define CC_SUBSI(cc,rd,rn,im) corri(cc,ARM_SUB|ARM_S|ARM_I,rn,rd,im)
472 # define SUBSI(rd,rn,im) CC_SUBSI(ARM_CC_AL,rd,rn,im)
473 # define T2_SUBSI(rd,rn,im) torri(THUMB2_SUBI|ARM_S,rn,rd,im)
474 # define CC_SBC(cc,rd,rn,rm) corrr(cc,ARM_SBC,rn,rd,rm)
475 # define SBC(rd,rn,rm) CC_SBC(ARM_CC_AL,rd,rn,rm)
476 # define T1_SBC(rdn,rm) is(THUMB_SBC|(_u3(rm)<<3)|_u3(rdn))
477 # define T2_SBC(rd,rn,rm) torrr(THUMB2_SBC,rn,rd,rm)
478 # define CC_SBCI(cc,rd,rn,im) corri(cc,ARM_SBC|ARM_I,rn,rd,im)
479 # define SBCI(rd,rn,im) CC_SBCI(ARM_CC_AL,rd,rn,im)
480 # define T2_SBCI(rd,rn,im) torri(THUMB2_SBCI,rn,rd,im)
481 # define CC_SBCS(cc,rd,rn,rm) corrr(cc,ARM_SBC|ARM_S,rn,rd,rm)
482 # define SBCS(rd,rn,rm) CC_SBCS(ARM_CC_AL,rd,rn,rm)
483 # define T2_SBCS(rd,rn,rm) torrr(THUMB2_SBC|ARM_S,rn,rd,rm)
484 # define CC_SBCSI(cc,rd,rn,im) corri(cc,ARM_SBC|ARM_S|ARM_I,rn,rd,im)
485 # define SBCSI(rd,rn,im) CC_SBCSI(ARM_CC_AL,rd,rn,im)
486 # define T2_SBCSI(rd,rn,im) torri(THUMB2_SBCI|ARM_S,rn,rd,im)
/* RSB (reverse subtract). T1_RSBI takes no immediate operand. */
487 # define CC_RSB(cc,rd,rn,rm) corrr(cc,ARM_RSB,rn,rd,rm)
488 # define RSB(rd,rn,rm) CC_RSB(ARM_CC_AL,rd,rn,rm)
489 # define T2_RSB(rd,rn,rm) torrr(THUMB2_RSB,rn,rd,rm)
490 # define CC_RSBI(cc,rd,rn,im) corri(cc,ARM_RSB|ARM_I,rn,rd,im)
491 # define RSBI(rd,rn,im) CC_RSBI(ARM_CC_AL,rd,rn,im)
492 # define T1_RSBI(rd,rn) is(THUMB_RSBI|(_u3(rn)<<3)|_u3(rd))
493 # define T2_RSBI(rd,rn,im) torri(THUMB2_RSBI,rn,rd,im)
/* Multiply and divide. The ARM forms go through corrrr(); note the argument
 * reordering relative to the macro parameters (CC_MUL passes rl,0,rm,rn). */
494 # define CC_MUL(cc,rl,rn,rm) corrrr(cc,ARM_MUL,rl,0,rm,rn)
495 # define MUL(rl,rn,rm) CC_MUL(ARM_CC_AL,rl,rn,rm)
496 # define T1_MUL(rdm,rn) is(THUMB_MUL|(_u3(rn)<<3)|_u3(rdm))
497 # define T2_MUL(rd,rn,rm) torrr(THUMB2_MUL,rn,rd,rm)
498 # define CC_SMULL(cc,rl,rh,rn,rm) corrrr(cc,ARM_SMULL,rh,rl,rm,rn)
499 # define SMULL(rl,rh,rn,rm) CC_SMULL(ARM_CC_AL,rl,rh,rn,rm)
500 # define T2_SMULL(rl,rh,rn,rm) torrrr(THUMB2_SMULL,rn,rl,rh,rm)
501 # define CC_UMULL(cc,rl,rh,rn,rm) corrrr(cc,ARM_UMULL,rh,rl,rm,rn)
502 # define UMULL(rl,rh,rn,rm) CC_UMULL(ARM_CC_AL,rl,rh,rn,rm)
503 # define T2_UMULL(rl,rh,rn,rm) torrrr(THUMB2_UMULL,rn,rl,rh,rm)
504 # define T2_SDIV(rd,rn,rm) torrr(THUMB2_SDIV,rn,rd,rm)
505 # define T2_UDIV(rd,rn,rm) torrr(THUMB2_UDIV,rn,rd,rm)
/* AND */
506 # define CC_AND(cc,rd,rn,rm) corrr(cc,ARM_AND,rn,rd,rm)
507 # define AND(rd,rn,rm) CC_AND(ARM_CC_AL,rd,rn,rm)
508 # define T1_AND(rdn,rm) is(THUMB_AND|(_u3(rm)<<3)|_u3(rdn))
509 # define T2_AND(rd,rn,rm) torrr(THUMB2_AND,rn,rd,rm)
510 # define CC_ANDI(cc,rd,rn,im) corri(cc,ARM_AND|ARM_I,rn,rd,im)
511 # define ANDI(rd,rn,im) CC_ANDI(ARM_CC_AL,rd,rn,im)
512 # define T2_ANDI(rd,rn,im) torri(THUMB2_ANDI,rn,rd,im)
513 # define CC_ANDS(cc,rd,rn,rm) corrr(cc,ARM_AND|ARM_S,rn,rd,rm)
514 # define ANDS(rd,rn,rm) CC_ANDS(ARM_CC_AL,rd,rn,rm)
515 # define T2_ANDS(rd,rn,rm) torrr(THUMB2_AND|ARM_S,rn,rd,rm)
516 # define CC_ANDSI(cc,rd,rn,im) corri(cc,ARM_AND|ARM_S|ARM_I,rn,rd,im)
517 # define ANDSI(rd,rn,im) CC_ANDSI(ARM_CC_AL,rd,rn,im)
/* Thumb-2 AND with immediate, setting flags. torri() takes four arguments
 * (opcode, rn, rd, immediate) and no condition code, matching every other
 * T2_*I macro in this file; the stray leading ARM_CC_AL made the call pass
 * five arguments and has been removed. */
# define T2_ANDSI(rd,rn,im) torri(THUMB2_ANDI|ARM_S,rn,rd,im)
/* BIC (bit clear): register and immediate forms, each with a flag-setting
 * `S` variant that ORs ARM_S into the opcode. */
519 # define CC_BIC(cc,rd,rn,rm) corrr(cc,ARM_BIC,rn,rd,rm)
520 # define BIC(rd,rn,rm) CC_BIC(ARM_CC_AL,rd,rn,rm)
521 # define T2_BIC(rd,rn,rm) torrr(THUMB2_BIC,rn,rd,rm)
522 # define CC_BICI(cc,rd,rn,im) corri(cc,ARM_BIC|ARM_I,rn,rd,im)
523 # define BICI(rd,rn,im) CC_BICI(ARM_CC_AL,rd,rn,im)
524 # define T2_BICI(rd,rn,im) torri(THUMB2_BICI,rn,rd,im)
525 # define CC_BICS(cc,rd,rn,rm) corrr(cc,ARM_BIC|ARM_S,rn,rd,rm)
526 # define BICS(rd,rn,rm) CC_BICS(ARM_CC_AL,rd,rn,rm)
527 # define T2_BICS(rd,rn,rm) torrr(THUMB2_BIC|ARM_S,rn,rd,rm)
528 # define CC_BICSI(cc,rd,rn,im) corri(cc,ARM_BIC|ARM_S|ARM_I,rn,rd,im)
529 # define BICSI(rd,rn,im) CC_BICSI(ARM_CC_AL,rd,rn,im)
/* Thumb-2 BIC with immediate, setting flags. torri() takes four arguments
 * (opcode, rn, rd, immediate) and no condition code, matching T2_BICI; the
 * stray leading ARM_CC_AL made the call pass five arguments and has been
 * removed. */
# define T2_BICSI(rd,rn,im) torri(THUMB2_BICI|ARM_S,rn,rd,im)
/* ORR, register forms. T2_ORR is also the building block of T2_MOV. */
531 # define CC_ORR(cc,rd,rn,rm) corrr(cc,ARM_ORR,rn,rd,rm)
532 # define ORR(rd,rn,rm) CC_ORR(ARM_CC_AL,rd,rn,rm)
533 # define T1_ORR(rdn,rm) is(THUMB_ORR|(_u3(rm)<<3)|_u3(rdn))
534 # define T2_ORR(rd,rn,rm) torrr(THUMB2_ORR,rn,rd,rm)
/* ORR with a shifted register operand: `sh` is a shift-type value (ARM_LSL,
 * ARM_LSR, ...) OR-ed into the opcode and `im` is the shift amount, both
 * handed to corrrs(). The third register parameter is named rm so that it is
 * the one actually forwarded; it was previously declared as `rt` while the
 * body referenced an unrelated `rm`. Mirrors CC_EOR_SI. */
# define CC_ORR_SI(cc,rd,rn,rm,sh,im) corrrs(cc,ARM_ORR|sh,rn,rd,rm,im)
# define ORR_SI(r0,r1,r2,sh,im) CC_ORR_SI(ARM_CC_AL,r0,r1,r2,sh,im)
/* Instruction macros: ORR immediate, EOR, byte-reverse, sign/zero extend,
 * shifts, and the first CMP forms. Same CC_X / X / T1_X / T2_X pattern as
 * elsewhere in this file. */
537 # define CC_ORRI(cc,rd,rn,im) corri(cc,ARM_ORR|ARM_I,rn,rd,im)
538 # define ORRI(rd,rn,im) CC_ORRI(ARM_CC_AL,rd,rn,im)
539 # define T2_ORRI(rd,rn,im) torri(THUMB2_ORRI,rn,rd,im)
/* EOR; the _SI form takes a shift type `sh` and shift amount `im` */
540 # define CC_EOR(cc,rd,rn,rm) corrr(cc,ARM_EOR,rn,rd,rm)
541 # define EOR(rd,rn,rm) CC_EOR(ARM_CC_AL,rd,rn,rm)
542 # define T1_EOR(rdn,rm) is(THUMB_EOR|(_u3(rm)<<3)|_u3(rdn))
543 # define T2_EOR(rd,rn,rm) torrr(THUMB2_EOR,rn,rd,rm)
544 # define CC_EOR_SI(cc,rd,rn,rm,sh,im) corrrs(cc,ARM_EOR|sh,rn,rd,rm,im)
545 # define EOR_SI(r0,r1,r2,sh,im) CC_EOR_SI(ARM_CC_AL,r0,r1,r2,sh,im)
546 # define CC_EORI(cc,rd,rn,im) corri(cc,ARM_EOR|ARM_I,rn,rd,im)
547 # define EORI(rd,rn,im) CC_EORI(ARM_CC_AL,rd,rn,im)
548 # define T2_EORI(rd,rn,im) torri(THUMB2_EORI,rn,rd,im)
/* REV / REV16 (ARM forms go through c6orr). The T2 forms pass rm in both the
 * rn and rm positions of torrr(). */
549 # define CC_REV(cc,rd,rm) c6orr(cc,ARM_REV,rd,rm)
550 # define REV(rd,rm) CC_REV(ARM_CC_AL,rd,rm)
551 # define T1_REV(rd,rm) is(THUMB_REV|(_u3(rm)<<3)|_u3(rd))
552 # define T2_REV(rd,rm) torrr(THUMB2_REV,rm,rd,rm)
553 # define CC_REV16(cc,rd,rm) c6orr(cc,ARM_REV16,rd,rm)
554 # define REV16(rd,rm) CC_REV16(ARM_CC_AL,rd,rm)
555 # define T1_REV16(rd,rm) is(THUMB_REV16|(_u3(rm)<<3)|_u3(rd))
556 # define T2_REV16(rd,rm) torrr(THUMB2_REV16,rm,rd,rm)
/* SXTB / UXTB / SXTH / UXTH. The T2 forms pass _R15_REGNO in the rn
 * position. */
557 # define CC_SXTB(cc,rd,rm) c6orr(cc,ARM_SXTB,rd,rm)
558 # define SXTB(rd,rm) CC_SXTB(ARM_CC_AL,rd,rm)
559 # define T1_SXTB(rd,rm) is(THUMB_SXTB|(_u3(rm)<<3)|_u3(rd))
560 # define T2_SXTB(rd,rm) torrr(THUMB2_SXTB,_R15_REGNO,rd,rm)
561 # define CC_UXTB(cc,rd,rm) c6orr(cc,ARM_UXTB,rd,rm)
562 # define UXTB(rd,rm) CC_UXTB(ARM_CC_AL,rd,rm)
563 # define T1_UXTB(rd,rm) is(THUMB_UXTB|(_u3(rm)<<3)|_u3(rd))
564 # define T2_UXTB(rd,rm) torrr(THUMB2_UXTB,_R15_REGNO,rd,rm)
565 # define CC_SXTH(cc,rd,rm) c6orr(cc,ARM_SXTH,rd,rm)
566 # define SXTH(rd,rm) CC_SXTH(ARM_CC_AL,rd,rm)
567 # define T1_SXTH(rd,rm) is(THUMB_SXTH|(_u3(rm)<<3)|_u3(rd))
568 # define T2_SXTH(rd,rm) torrr(THUMB2_SXTH,_R15_REGNO,rd,rm)
569 # define CC_UXTH(cc,rd,rm) c6orr(cc,ARM_UXTH,rd,rm)
570 # define UXTH(rd,rm) CC_UXTH(ARM_CC_AL,rd,rm)
571 # define T1_UXTH(rd,rm) is(THUMB_UXTH|(_u3(rm)<<3)|_u3(rd))
572 # define T2_UXTH(rd,rm) torrr(THUMB2_UXTH,_R15_REGNO,rd,rm)
/* Shifts. ARM forms go through cshift(): register-amount forms OR ARM_R into
 * the shift type and pass im = 0; immediate forms pass 0 in the rm position
 * and the amount in im. */
573 # define CC_SHIFT(cc,o,rd,rm,rn,im) cshift(cc,o,rd,rm,rn,im)
574 # define CC_LSL(cc,rd,rn,rm) CC_SHIFT(cc,ARM_LSL|ARM_R,rd,rm,rn,0)
575 # define LSL(rd,rn,rm) CC_LSL(ARM_CC_AL,rd,rn,rm)
576 # define T1_LSL(rdn,rm) is(THUMB_LSL|(_u3(rm)<<3)|_u3(rdn))
577 # define T2_LSL(rd,rn,rm) torrr(THUMB2_LSL,rn,rd,rm)
578 # define CC_LSLI(cc,rd,rn,im) CC_SHIFT(cc,ARM_LSL,rd,0,rn,im)
579 # define LSLI(rd,rn,im) CC_LSLI(ARM_CC_AL,rd,rn,im)
580 # define T1_LSLI(rd,rm,im) is(THUMB_LSLI|(_u5(im)<<6)|(_u3(rm)<<3)|_u3(rd))
581 # define T2_LSLI(rd,rm,im) tshift(THUMB2_LSLI,rd,rm,im)
582 # define CC_LSR(cc,rd,rn,rm) CC_SHIFT(cc,ARM_LSR|ARM_R,rd,rm,rn,0)
583 # define LSR(rd,rn,rm) CC_LSR(ARM_CC_AL,rd,rn,rm)
584 # define T1_LSR(rdn,rm) is(THUMB_LSR|(_u3(rm)<<3)|_u3(rdn))
585 # define T2_LSR(rd,rn,rm) torrr(THUMB2_LSR,rn,rd,rm)
586 # define CC_LSRI(cc,rd,rn,im) CC_SHIFT(cc,ARM_LSR,rd,0,rn,im)
587 # define LSRI(rd,rn,im) CC_LSRI(ARM_CC_AL,rd,rn,im)
588 # define T1_LSRI(rd,rm,im) is(THUMB_LSRI|(_u5(im)<<6)|(_u3(rm)<<3)|_u3(rd))
589 # define T2_LSRI(rd,rm,im) tshift(THUMB2_LSRI,rd,rm,im)
590 # define CC_ASR(cc,rd,rn,rm) CC_SHIFT(cc,ARM_ASR|ARM_R,rd,rm,rn,0)
591 # define ASR(rd,rn,rm) CC_ASR(ARM_CC_AL,rd,rn,rm)
592 # define T1_ASR(rdn,rm) is(THUMB_ASR|(_u3(rm)<<3)|_u3(rdn))
593 # define T2_ASR(rd,rn,rm) torrr(THUMB2_ASR,rn,rd,rm)
594 # define CC_ASRI(cc,rd,rn,im) CC_SHIFT(cc,ARM_ASR,rd,0,rn,im)
595 # define ASRI(rd,rn,im) CC_ASRI(ARM_CC_AL,rd,rn,im)
596 # define T1_ASRI(rd,rm,im) is(THUMB_ASRI|(_u5(im)<<6)|(_u3(rm)<<3)|_u3(rd))
597 # define T2_ASRI(rd,rm,im) tshift(THUMB2_ASRI,rd,rm,im)
/* CMP: no destination register, so the ARM form passes 0 in the rd
 * position. */
598 # define CC_CMP(cc,rn,rm) corrr(cc,ARM_CMP,rn,0,rm)
599 # define CMP(rn,rm) CC_CMP(ARM_CC_AL,rn,rm)
600 # define T1_CMP(rn,rm) is(THUMB_CMP|(_u3(rm)<<3)|_u3(rn))
/* 16-bit Thumb compare using 4-bit register numbers. Bit 3 of rn is placed
 * at bit 7 of the halfword, the low three bits of rn at bits 2..0, and the
 * four bits of rm at bits 6..3. Both uses of rn are parenthesized so an
 * expression argument is masked as a whole. */
# define T1_CMPX(rn,rm) is(THUMB_CMPX|((_u4(rn)&8)<<4)|(_u4(rm)<<3)|((rn)&7))
/* CMP (continued) and CMN. These write no destination register: ARM forms
 * pass 0 in the rd position, T2 forms pass _R15_REGNO there. */
602 # define T2_CMP(rn,rm) torrr(THUMB2_CMP,rn,_R15_REGNO,rm)
603 # define CC_CMPI(cc,rn,im) corri(cc,ARM_CMP|ARM_I,rn,0,im)
604 # define CMPI(rn,im) CC_CMPI(ARM_CC_AL,rn,im)
605 # define T1_CMPI(rn,im) is(THUMB_CMPI|(_u3(rn)<<8)|_u8(im))
606 # define T2_CMPI(rn,im) torri(THUMB2_CMPI,rn,_R15_REGNO,im)
607 # define CC_CMN(cc,rn,rm) corrr(cc,ARM_CMN,rn,0,rm)
608 # define CMN(rn,rm) CC_CMN(ARM_CC_AL,rn,rm)
/* 16-bit Thumb CMN (compare negative): rm goes in bits 5..3 and rn in bits
 * 2..0, the same layout as T1_CMP and T1_TST. The low field previously
 * encoded rm a second time, so rn was ignored. */
# define T1_CMN(rn,rm) is(THUMB_CMN|(_u3(rm)<<3)|_u3(rn))
/* CMN, Thumb-2 register form and immediate forms. No destination register:
 * the ARM form passes 0 in the rd position, T2 forms pass _R15_REGNO. */
610 # define T2_CMN(rn,rm) torrr(THUMB2_CMN,rn,_R15_REGNO,rm)
611 # define CC_CMNI(cc,rn,im) corri(cc,ARM_CMN|ARM_I,rn,0,im)
612 # define CMNI(rn,im) CC_CMNI(ARM_CC_AL,rn,im)
613 # define T2_CMNI(rn,im) torri(THUMB2_CMNI,rn,_R15_REGNO,im)
/* TST (bitwise test). It writes no destination register, so the rd position
 * of corrr() is the literal 0, exactly as in CC_CMP, CC_CMN and CC_TEQ. The
 * previous text passed the identifier `r0`, which picked up whatever variable
 * of that name was in scope at the use site (or failed to compile). */
# define CC_TST(cc,rn,rm) corrr(cc,ARM_TST,rn,0,rm)
# define TST(rn,rm) CC_TST(ARM_CC_AL,rn,rm)
/* TST (remaining forms) and TEQ register forms. No destination register:
 * ARM forms pass 0 in the rd position, T2 forms pass _R15_REGNO. Only ARM
 * forms of TEQ are defined here. */
616 # define T1_TST(rn,rm) is(THUMB_TST|(_u3(rm)<<3)|_u3(rn))
617 # define T2_TST(rn,rm) torrr(THUMB2_TST,rn,_R15_REGNO,rm)
618 # define CC_TSTI(cc,rn,im) corri(cc,ARM_TST|ARM_I,rn,0,im)
619 # define TSTI(rn,im) CC_TSTI(ARM_CC_AL,rn,im)
620 # define T2_TSTI(rn,im) torri(THUMB2_TSTI,rn,_R15_REGNO,im)
621 # define CC_TEQ(cc,rn,rm) corrr(cc,ARM_TEQ,rn,0,rm)
622 # define TEQ(rn,rm) CC_TEQ(ARM_CC_AL,rn,rm)
/* TEQ with immediate. The register parameter is named rn so that it is the
 * operand actually forwarded to corri(); it was previously declared as `rm`
 * while the body referenced an unrelated `rn`. No destination register, so
 * the rd position is 0. */
# define CC_TEQI(cc,rn,im) corri(cc,ARM_TEQ|ARM_I,rn,0,im)
# define TEQI(rn,im) CC_TEQI(ARM_CC_AL,rn,im)
/* Branch instruction macros.
 *   BX / BLX      register-indirect, via cbx(); T1 forms emit one halfword
 *                 with the 4-bit register number at bits 6..3 (T1_BX uses
 *                 the literal base 0x4700)
 *   B / BLI       immediate branch and branch-with-link, via cb()
 *   BLXI          via blxi() (ARM) or tb() (Thumb-2)
 *   T1_CC_B/T1_B  16-bit Thumb forms via tc8()/t11()
 *   T2_CC_B/T2_B  32-bit Thumb-2 forms via tcb()/tb()
 * How `im` is scaled or range-checked is decided by the emitters, which are
 * defined outside this section. */
625 # define CC_BX(cc,rm) cbx(cc,ARM_BX,rm)
626 # define BX(rm) CC_BX(ARM_CC_AL,rm)
627 # define T1_BX(rm) is(0x4700|(_u4(rm)<<3))
628 # define CC_BLX(cc,rm) cbx(cc,ARM_BLX,rm)
629 # define BLX(rm) CC_BLX(ARM_CC_AL,rm)
630 # define T1_BLX(rm) is(THUMB_BLX|(_u4(rm)<<3))
631 # define BLXI(im) blxi(im)
632 # define T2_BLXI(im) tb(THUMB2_BLXI,im)
633 # define CC_B(cc,im) cb(cc,ARM_B,im)
634 # define B(im) CC_B(ARM_CC_AL,im)
635 # define T1_CC_B(cc,im) tc8(cc,im)
636 # define T1_B(im) t11(im)
637 # define T2_CC_B(cc,im) tcb(cc,im)
638 # define T2_B(im) tb(THUMB2_B,im)
639 # define CC_BLI(cc,im) cb(cc,ARM_BLI,im)
640 # define BLI(im) CC_BLI(ARM_CC_AL,im)
641 # define T2_BLI(im) tb(THUMB2_BLI,im)
/* Load instruction macros (rt = register loaded, rn = base, rm = offset
 * register, im = immediate offset).
 * Naming, per access size (LDRSB, LDRB, LDRSH, LDRH, LDR):
 *   X / CC_X      register offset with ARM_P (positive offset) OR-ed in
 *   XN / CC_XN    same opcode without ARM_P
 *   XI / CC_XI    immediate offset with ARM_P; XIN omits ARM_P
 *   T1_X, T1_XI   16-bit Thumb forms, emitted directly via is()
 *   T2_X          Thumb-2 register-offset form via torxr()
 *   T2_XI         Thumb-2 8-bit-immediate form via torri8() with THUMB2_U
 *                 OR-ed in; T2_XIN omits THUMB2_U
 *   T2_XWI        Thumb-2 form via torri12()
 * The signed-byte and both halfword immediate forms use corri8(); the
 * unsigned-byte and word immediate forms use corri().
 * T1 immediate forms mask `im` with _u5()/_u8() without scaling it; whether
 * callers pre-scale the offset is not visible here. */
/* signed byte */
642 # define CC_LDRSB(cc,rt,rn,rm) corrr(cc,ARM_LDRSB|ARM_P,rn,rt,rm)
643 # define LDRSB(rt,rn,rm) CC_LDRSB(ARM_CC_AL,rt,rn,rm)
644 # define T1_LDRSB(rt,rn,rm) is(THUMB_LDRSB|(_u3(rm)<<6)|(_u3(rn)<<3)|_u3(rt))
645 # define T2_LDRSB(rt,rn,rm) torxr(THUMB2_LDRSB,rn,rt,rm)
646 # define CC_LDRSBN(cc,rt,rn,rm) corrr(cc,ARM_LDRSB,rn,rt,rm)
647 # define LDRSBN(rt,rn,rm) CC_LDRSBN(ARM_CC_AL,rt,rn,rm)
648 # define CC_LDRSBI(cc,rt,rn,im) corri8(cc,ARM_LDRSBI|ARM_P,rn,rt,im)
649 # define LDRSBI(rt,rn,im) CC_LDRSBI(ARM_CC_AL,rt,rn,im)
650 # define T2_LDRSBI(rt,rn,im) torri8(THUMB2_LDRSBI|THUMB2_U,rn,rt,im)
651 # define T2_LDRSBWI(rt,rn,im) torri12(THUMB2_LDRSBWI,rn,rt,im)
652 # define CC_LDRSBIN(cc,rt,rn,im) corri8(cc,ARM_LDRSBI,rn,rt,im)
653 # define LDRSBIN(rt,rn,im) CC_LDRSBIN(ARM_CC_AL,rt,rn,im)
654 # define T2_LDRSBIN(rt,rn,im) torri8(THUMB2_LDRSBI,rn,rt,im)
/* unsigned byte */
655 # define CC_LDRB(cc,rt,rn,rm) corrr(cc,ARM_LDRB|ARM_P,rn,rt,rm)
656 # define LDRB(rt,rn,rm) CC_LDRB(ARM_CC_AL,rt,rn,rm)
657 # define T1_LDRB(rt,rn,rm) is(THUMB_LDRB|(_u3(rm)<<6)|(_u3(rn)<<3)|_u3(rt))
658 # define T2_LDRB(rt,rn,rm) torxr(THUMB2_LDRB,rn,rt,rm)
659 # define CC_LDRBN(cc,rt,rn,rm) corrr(cc,ARM_LDRB,rn,rt,rm)
660 # define LDRBN(rt,rn,rm) CC_LDRBN(ARM_CC_AL,rt,rn,rm)
661 # define CC_LDRBI(cc,rt,rn,im) corri(cc,ARM_LDRBI|ARM_P,rn,rt,im)
662 # define LDRBI(rt,rn,im) CC_LDRBI(ARM_CC_AL,rt,rn,im)
663 # define T1_LDRBI(rt,rn,im) is(THUMB_LDRBI|(_u5(im)<<6)|(_u3(rn)<<3)|_u3(rt))
664 # define T2_LDRBI(rt,rn,im) torri8(THUMB2_LDRBI|THUMB2_U,rn,rt,im)
665 # define T2_LDRBWI(rt,rn,im) torri12(THUMB2_LDRBWI,rn,rt,im)
666 # define CC_LDRBIN(cc,rt,rn,im) corri(cc,ARM_LDRBI,rn,rt,im)
667 # define LDRBIN(rt,rn,im) CC_LDRBIN(ARM_CC_AL,rt,rn,im)
668 # define T2_LDRBIN(rt,rn,im) torri8(THUMB2_LDRBI,rn,rt,im)
/* signed halfword */
669 # define CC_LDRSH(cc,rt,rn,rm) corrr(cc,ARM_LDRSH|ARM_P,rn,rt,rm)
670 # define LDRSH(rt,rn,rm) CC_LDRSH(ARM_CC_AL,rt,rn,rm)
671 # define T1_LDRSH(rt,rn,rm) is(THUMB_LDRSH|(_u3(rm)<<6)|(_u3(rn)<<3)|_u3(rt))
672 # define T2_LDRSH(rt,rn,rm) torxr(THUMB2_LDRSH,rn,rt,rm)
673 # define CC_LDRSHN(cc,rt,rn,rm) corrr(cc,ARM_LDRSH,rn,rt,rm)
674 # define LDRSHN(rt,rn,rm) CC_LDRSHN(ARM_CC_AL,rt,rn,rm)
675 # define CC_LDRSHI(cc,rt,rn,im) corri8(cc,ARM_LDRSHI|ARM_P,rn,rt,im)
676 # define LDRSHI(rt,rn,im) CC_LDRSHI(ARM_CC_AL,rt,rn,im)
677 # define T2_LDRSHI(rt,rn,im) torri8(THUMB2_LDRSHI|THUMB2_U,rn,rt,im)
678 # define T2_LDRSHWI(rt,rn,im) torri12(THUMB2_LDRSHWI,rn,rt,im)
679 # define CC_LDRSHIN(cc,rt,rn,im) corri8(cc,ARM_LDRSHI,rn,rt,im)
680 # define LDRSHIN(rt,rn,im) CC_LDRSHIN(ARM_CC_AL,rt,rn,im)
681 # define T2_LDRSHIN(rt,rn,im) torri8(THUMB2_LDRSHI,rn,rt,im)
/* unsigned halfword */
682 # define CC_LDRH(cc,rt,rn,rm) corrr(cc,ARM_LDRH|ARM_P,rn,rt,rm)
683 # define LDRH(rt,rn,rm) CC_LDRH(ARM_CC_AL,rt,rn,rm)
684 # define T1_LDRH(rt,rn,rm) is(THUMB_LDRH|(_u3(rm)<<6)|(_u3(rn)<<3)|_u3(rt))
685 # define T2_LDRH(rt,rn,rm) torxr(THUMB2_LDRH,rn,rt,rm)
686 # define CC_LDRHN(cc,rt,rn,rm) corrr(cc,ARM_LDRH,rn,rt,rm)
687 # define LDRHN(rt,rn,rm) CC_LDRHN(ARM_CC_AL,rt,rn,rm)
688 # define CC_LDRHI(cc,rt,rn,im) corri8(cc,ARM_LDRHI|ARM_P,rn,rt,im)
689 # define LDRHI(rt,rn,im) CC_LDRHI(ARM_CC_AL,rt,rn,im)
690 # define T1_LDRHI(rt,rn,im) is(THUMB_LDRHI|(_u5(im)<<6)|(_u3(rn)<<3)|_u3(rt))
691 # define T2_LDRHI(rt,rn,im) torri8(THUMB2_LDRHI|THUMB2_U,rn,rt,im)
692 # define T2_LDRHWI(rt,rn,im) torri12(THUMB2_LDRHWI,rn,rt,im)
693 # define CC_LDRHIN(cc,rt,rn,im) corri8(cc,ARM_LDRHI,rn,rt,im)
694 # define LDRHIN(rt,rn,im) CC_LDRHIN(ARM_CC_AL,rt,rn,im)
695 # define T2_LDRHIN(rt,rn,im) torri8(THUMB2_LDRHI,rn,rt,im)
/* word; T1_LDRISP takes no base register operand */
696 # define CC_LDR(cc,rt,rn,rm) corrr(cc,ARM_LDR|ARM_P,rn,rt,rm)
697 # define LDR(rt,rn,rm) CC_LDR(ARM_CC_AL,rt,rn,rm)
698 # define T1_LDR(rt,rn,rm) is(THUMB_LDR|(_u3(rm)<<6)|(_u3(rn)<<3)|_u3(rt))
699 # define T2_LDR(rt,rn,rm) torxr(THUMB2_LDR,rn,rt,rm)
700 # define CC_LDRN(cc,rt,rn,rm) corrr(cc,ARM_LDR,rn,rt,rm)
701 # define LDRN(rt,rn,rm) CC_LDRN(ARM_CC_AL,rt,rn,rm)
702 # define CC_LDRI(cc,rt,rn,im) corri(cc,ARM_LDRI|ARM_P,rn,rt,im)
703 # define LDRI(rt,rn,im) CC_LDRI(ARM_CC_AL,rt,rn,im)
704 # define T1_LDRI(rt,rn,im) is(THUMB_LDRI|(_u5(im)<<6)|(_u3(rn)<<3)|_u3(rt))
705 # define T1_LDRISP(rt,im) is(THUMB_LDRISP|(_u3(rt)<<8)|_u8(im))
706 # define T2_LDRI(rt,rn,im) torri8(THUMB2_LDRI|THUMB2_U,rn,rt,im)
707 # define T2_LDRWI(rt,rn,im) torri12(THUMB2_LDRWI,rn,rt,im)
708 # define CC_LDRIN(cc,rt,rn,im) corri(cc,ARM_LDRI,rn,rt,im)
709 # define LDRIN(rt,rn,im) CC_LDRIN(ARM_CC_AL,rt,rn,im)
710 # define T2_LDRIN(rt,rn,im) torri8(THUMB2_LDRI,rn,rt,im)
711 # define CC_LDRD(cc,rt,rn,rm) corrr(cc,ARM_LDRD|ARM_P,rn,rt,rm)
712 # define LDRD(rt,rn,rm) CC_LDRD(ARM_CC_AL,rt,rn,rm)
713 # define T2_LDRDI(rt,rt2,rn,im) torrri8(THUMB2_LDRDI|ARM_P,rn,rt,rt2,im)
714 # define CC_LDRDN(cc,rt,rn,rm) corrr(cc,ARM_LDRD,rn,rt,rm)
/* Unconditional form of CC_LDRDN.  The first parameter was spelled `rd'
 * while the expansion referenced `rt', so every use failed to compile. */
# define LDRDN(rt,rn,rm) CC_LDRDN(ARM_CC_AL,rt,rn,rm)
716 # define CC_LDRDI(cc,rt,rn,im) corri8(cc,ARM_LDRDI|ARM_P,rn,rt,im)
717 # define LDRDI(rt,rn,im) CC_LDRDI(ARM_CC_AL,rt,rn,im)
718 # define CC_LDRDIN(cc,rt,rn,im) corri8(cc,ARM_LDRDI,rn,rt,im)
719 # define LDRDIN(rt,rn,im) CC_LDRDIN(ARM_CC_AL,rt,rn,im)
720 # define T2_LDRDIN(rt,rt2,rn,im) torrri8(THUMB2_LDRDI,rn,rt,rt2,im)
721 # define CC_STRB(cc,rt,rn,rm) corrr(cc,ARM_STRB|ARM_P,rn,rt,rm)
722 # define STRB(rt,rn,rm) CC_STRB(ARM_CC_AL,rt,rn,rm)
723 # define T1_STRB(rt,rn,rm) is(THUMB_STRB|(_u3(rm)<<6)|(_u3(rn)<<3)|_u3(rt))
724 # define T2_STRB(rt,rn,rm) torxr(THUMB2_STRB,rn,rt,rm)
725 # define CC_STRBN(cc,rt,rn,rm) corrr(cc,ARM_STRB,rn,rt,rm)
726 # define STRBN(rt,rn,rm) CC_STRBN(ARM_CC_AL,rt,rn,rm)
727 # define CC_STRBI(cc,rt,rn,im) corri(cc,ARM_STRBI|ARM_P,rn,rt,im)
728 # define STRBI(rt,rn,im) CC_STRBI(ARM_CC_AL,rt,rn,im)
729 # define T1_STRBI(rt,rn,im) is(THUMB_STRBI|(_u5(im)<<6)|(_u3(rn)<<3)|_u3(rt))
730 # define T2_STRBI(rt,rn,im) torri8(THUMB2_STRBI|THUMB2_U,rn,rt,im)
731 # define T2_STRBWI(rt,rn,im) torri12(THUMB2_STRBWI,rn,rt,im)
732 # define CC_STRBIN(cc,rt,rn,im) corri(cc,ARM_STRBI,rn,rt,im)
733 # define STRBIN(rt,rn,im) CC_STRBIN(ARM_CC_AL,rt,rn,im)
734 # define T2_STRBIN(rt,rn,im) torri8(THUMB2_STRBI,rn,rt,im)
735 # define CC_STRH(cc,rt,rn,rm) corrr(cc,ARM_STRH|ARM_P,rn,rt,rm)
736 # define STRH(rt,rn,rm) CC_STRH(ARM_CC_AL,rt,rn,rm)
737 # define T1_STRH(rt,rn,rm) is(THUMB_STRH|(_u3(rm)<<6)|(_u3(rn)<<3)|_u3(rt))
738 # define T2_STRH(rt,rn,rm) torxr(THUMB2_STRH,rn,rt,rm)
739 # define CC_STRHN(cc,rt,rn,rm) corrr(cc,ARM_STRH,rn,rt,rm)
740 # define STRHN(rt,rn,rm) CC_STRHN(ARM_CC_AL,rt,rn,rm)
741 # define CC_STRHI(cc,rt,rn,im) corri8(cc,ARM_STRHI|ARM_P,rn,rt,im)
742 # define STRHI(rt,rn,im) CC_STRHI(ARM_CC_AL,rt,rn,im)
743 # define T1_STRHI(rt,rn,im) is(THUMB_STRHI|(_u5(im)<<6)|(_u3(rn)<<3)|_u3(rt))
744 # define T2_STRHI(rt,rn,im) torri8(THUMB2_STRHI|THUMB2_U,rn,rt,im)
745 # define T2_STRHWI(rt,rn,im) torri12(THUMB2_STRHWI,rn,rt,im)
746 # define CC_STRHIN(cc,rt,rn,im) corri8(cc,ARM_STRHI,rn,rt,im)
747 # define STRHIN(rt,rn,im) CC_STRHIN(ARM_CC_AL,rt,rn,im)
748 # define T2_STRHIN(rt,rn,im) torri8(THUMB2_STRHI,rn,rt,im)
749 # define CC_STR(cc,rt,rn,rm) corrr(cc,ARM_STR|ARM_P,rn,rt,rm)
750 # define STR(rt,rn,rm) CC_STR(ARM_CC_AL,rt,rn,rm)
751 # define T1_STR(rt,rn,rm) is(THUMB_STR|(_u3(rm)<<6)|(_u3(rn)<<3)|_u3(rt))
752 # define T2_STR(rt,rn,rm) torxr(THUMB2_STR,rn,rt,rm)
753 # define CC_STRN(cc,rt,rn,rm) corrr(cc,ARM_STR,rn,rt,rm)
754 # define STRN(rt,rn,rm) CC_STRN(ARM_CC_AL,rt,rn,rm)
755 # define CC_STRI(cc,rt,rn,im) corri(cc,ARM_STRI|ARM_P,rn,rt,im)
756 # define STRI(rt,rn,im) CC_STRI(ARM_CC_AL,rt,rn,im)
757 # define T1_STRI(rt,rn,im) is(THUMB_STRI|(_u5(im)<<6)|(_u3(rn)<<3)|_u3(rt))
758 # define T1_STRISP(rt,im) is(THUMB_STRISP|(_u3(rt)<<8)|(_u8(im)))
759 # define T2_STRI(rt,rn,im) torri8(THUMB2_STRI|THUMB2_U,rn,rt,im)
760 # define T2_STRWI(rt,rn,im) torri12(THUMB2_STRWI,rn,rt,im)
761 # define CC_STRIN(cc,rt,rn,im) corri(cc,ARM_STRI,rn,rt,im)
762 # define STRIN(rt,rn,im) CC_STRIN(ARM_CC_AL,rt,rn,im)
763 # define T2_STRIN(rt,rn,im) torri8(THUMB2_STRI,rn,rt,im)
764 # define CC_STRD(cc,rt,rn,rm) corrr(cc,ARM_STRD|ARM_P,rn,rt,rm)
765 # define STRD(rt,rn,rm) CC_STRD(ARM_CC_AL,rt,rn,rm)
766 # define CC_STRDN(cc,rt,rn,rm) corrr(cc,ARM_STRD,rn,rt,rm)
767 # define STRDN(rt,rn,rm) CC_STRDN(ARM_CC_AL,rt,rn,rm)
768 # define CC_STRDI(cc,rt,rn,im) corri8(cc,ARM_STRDI|ARM_P,rn,rt,im)
769 # define STRDI(rt,rn,im) CC_STRDI(ARM_CC_AL,rt,rn,im)
770 # define T2_STRDI(rt,rt2,rn,im) torrri8(THUMB2_STRDI|ARM_P,rn,rt,rt2,im)
771 # define CC_STRDIN(cc,rt,rn,im) corri8(cc,ARM_STRDI,rn,rt,im)
772 # define STRDIN(rt,rn,im) CC_STRDIN(ARM_CC_AL,rt,rn,im)
773 # define T2_STRDIN(rt,rt2,rn,im) torrri8(THUMB2_STRDI,rn,rt,rt2,im)
774 # define CC_LDMIA(cc,rn,im) corl(cc,ARM_M|ARM_M_L|ARM_M_I,rn,im)
775 # define LDMIA(rn,im) CC_LDMIA(ARM_CC_AL,rn,im)
776 # define CC_LDM(cc,rn,im) CC_LDMIA(cc,rn,im)
777 # define LDM(rn,im) LDMIA(rn,im)
/* 16-bit LDMIA: rn (3 bits) goes in bits 10:8 and the register list im is
 * OR-ed into the low bits.  im is parenthesized so that an argument built
 * with a lower-precedence operator (e.g. ?:) cannot swallow the opcode. */
# define T1_LDMIA(rn,im) is(THUMB_LDMIA|(_u3(rn)<<8)|(im))
779 # define T2_LDMIA(rn,im) torl(THUMB2_LDMIA,rn,im)
780 # define CC_LDMIA_U(cc,rn,im) corl(cc,ARM_M|ARM_M_L|ARM_M_I|ARM_M_U,rn,im)
781 # define LDMIA_U(rn,im) CC_LDMIA_U(ARM_CC_AL,rn,im)
782 # define LDM_U(r0,i0) LDMIA_U(r0,i0)
783 # define CC_LDMIB(cc,rn,im) corl(cc,ARM_M|ARM_M_L|ARM_M_I|ARM_M_B,rn,im)
784 # define LDMIB(rn,im) CC_LDMIB(ARM_CC_AL,rn,im)
785 # define CC_LDMIB_U(cc,rn,im) corl(cc,ARM_M|ARM_M_L|ARM_M_I|ARM_M_B|ARM_M_U,rn,im)
786 # define LDMIB_U(rn,im) CC_LDMIB_U(ARM_CC_AL,rn,im)
787 # define CC_LDMDA(cc,rn,im) corl(cc,ARM_M|ARM_M_L,rn,im)
788 # define LDMDA(rn,im) CC_LDMDA(ARM_CC_AL,rn,im)
789 # define CC_LDMDA_U(cc,rn,im) corl(cc,ARM_M|ARM_M_L|ARM_M_U,rn,im)
790 # define LDMDA_U(rn,im) CC_LDMDA_U(ARM_CC_AL,rn,im)
791 # define CC_LDMDB(cc,rn,im) corl(cc,ARM_M|ARM_M_L|ARM_M_B,rn,im)
792 # define LDMDB(rn,im) CC_LDMDB(ARM_CC_AL,rn,im)
793 # define T2_LDMDB(rn,im) torl(THUMB2_LDMDB,rn,im)
794 # define CC_LDMDB_U(cc,rn,im) corl(cc,ARM_M|ARM_M_L|ARM_M_B|ARM_M_U,rn,im)
795 # define LDMDB_U(rn,im) CC_LDMDB_U(ARM_CC_AL,rn,im)
796 # define CC_STMIA(cc,rn,im) corl(cc,ARM_M|ARM_M_I,rn,im)
797 # define STMIA(rn,im) CC_STMIA(ARM_CC_AL,rn,im)
798 # define CC_STM(cc,rn,im) CC_STMIA(cc,rn,im)
799 # define STM(rn,im) STMIA(rn,im)
800 # define CC_STMIA_U(cc,rn,im) corl(cc,ARM_M|ARM_M_I|ARM_M_U,rn,im)
801 # define STMIA_U(rn,im) CC_STMIA_U(ARM_CC_AL,rn,im)
802 # define CC_STM_U(cc,rn,im) CC_STMIA_U(cc,rn,im)
803 # define STM_U(rn,im) STMIA_U(rn,im)
804 # define CC_STMIB(cc,rn,im) corl(cc,ARM_M|ARM_M_I|ARM_M_B,rn,im)
805 # define STMIB(rn,im) CC_STMIB(ARM_CC_AL,rn,im)
806 # define CC_STMIB_U(cc,rn,im) corl(cc,ARM_M|ARM_M_I|ARM_M_B|ARM_M_U,rn,im)
807 # define STMIB_U(rn,im) CC_STMIB_U(ARM_CC_AL,rn,im)
808 # define CC_STMDA(cc,rn,im) corl(cc,ARM_M,rn,im)
809 # define STMDA(rn,im) CC_STMDA(ARM_CC_AL,rn,im)
810 # define CC_STMDA_U(cc,rn,im) corl(cc,ARM_M|ARM_M_U,rn,im)
811 # define STMDA_U(rn,im) CC_STMDA_U(ARM_CC_AL,rn,im)
812 # define CC_STMDB(cc,rn,im) corl(cc,ARM_M|ARM_M_B,rn,im)
813 # define STMDB(rn,im) CC_STMDB(ARM_CC_AL,rn,im)
814 # define CC_STMDB_U(cc,rn,im) corl(cc,ARM_M|ARM_M_B|ARM_M_U,rn,im)
815 # define STMDB_U(rn,im) CC_STMDB_U(ARM_CC_AL,rn,im)
/*
 * PUSH/POP helpers; im is a register-list bit mask.
 *
 * - CC_POP previously expanded to LDMIA_U(cc,_SP_REGNO,im), passing three
 *   arguments to a two-argument macro; it now uses the conditional form
 *   CC_LDMIA_U, mirroring CC_PUSH -> CC_STMDB_U.
 * - T1_PUSH/T1_POP parenthesize im so that an argument such as `a|b' is
 *   masked as a whole instead of being re-associated by `&'.
 *   Bit 14 of im (T1_PUSH) or bit 15 of im (T1_POP) is moved down to bit 8;
 *   the low eight bits of im are kept in place.
 */
# define CC_PUSH(cc,im) CC_STMDB_U(cc,_SP_REGNO,im)
# define PUSH(im) STMDB_U(_SP_REGNO,im)
# define T1_PUSH(im) is(THUMB_PUSH|(((im)&0x4000)>>6)|((im)&0xff))
# define T2_PUSH(im) tpp(THUMB2_PUSH,im)
# define CC_POP(cc,im) CC_LDMIA_U(cc,_SP_REGNO,im)
# define POP(im) LDMIA_U(_SP_REGNO,im)
# define T1_POP(im) is(THUMB_POP|(((im)&0x8000)>>7)|((im)&0xff))
# define T2_POP(im) tpp(THUMB2_POP,im)
824 # define jit_get_reg_args() \
825 do { \
826 (void)jit_get_reg(_R0|jit_class_named|jit_class_gpr); \
827 (void)jit_get_reg(_R1|jit_class_named|jit_class_gpr); \
828 (void)jit_get_reg(_R2|jit_class_named|jit_class_gpr); \
829 (void)jit_get_reg(_R3|jit_class_named|jit_class_gpr); \
830 } while (0)
831 # define jit_unget_reg_args() \
832 do { \
833 jit_unget_reg(_R3); \
834 jit_unget_reg(_R2); \
835 jit_unget_reg(_R1); \
836 jit_unget_reg(_R0); \
837 } while (0)
838 # define nop(i0) _nop(_jit,i0)
839 static void _nop(jit_state_t*,jit_int32_t);
840 # define movr(r0,r1) _movr(_jit,r0,r1)
841 static void _movr(jit_state_t*,jit_int32_t,jit_int32_t);
842 # define movi(r0,i0) _movi(_jit,r0,i0)
843 static void _movi(jit_state_t*,jit_int32_t,jit_word_t);
844 # define movi_p(r0,i0) _movi_p(_jit,r0,i0)
845 static jit_word_t _movi_p(jit_state_t*,jit_int32_t,jit_word_t);
846 # define comr(r0,r1) _comr(_jit,r0,r1)
847 static void _comr(jit_state_t*,jit_int32_t,jit_int32_t);
848 # define negr(r0,r1) _negr(_jit,r0,r1)
849 static void _negr(jit_state_t*,jit_int32_t,jit_int32_t);
850 # define addr(r0,r1,r2) _addr(_jit,r0,r1,r2)
851 static void _addr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
852 # define addi(r0,r1,i0) _addi(_jit,r0,r1,i0)
853 static void _addi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
854 # define addcr(r0,r1,r2) _addcr(_jit,r0,r1,r2)
855 static void _addcr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
856 # define addci(r0,r1,i0) _addci(_jit,r0,r1,i0)
857 static void _addci(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
858 # define addxr(r0,r1,r2) _addxr(_jit,r0,r1,r2)
859 static void _addxr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
860 # define addxi(r0,r1,i0) _addxi(_jit,r0,r1,i0)
861 static void _addxi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
862 # define subr(r0,r1,r2) _subr(_jit,r0,r1,r2)
863 static void _subr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
864 # define subi(r0,r1,i0) _subi(_jit,r0,r1,i0)
865 static void _subi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
866 # define subcr(r0,r1,r2) _subcr(_jit,r0,r1,r2)
867 static void _subcr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
868 # define subci(r0,r1,i0) _subci(_jit,r0,r1,i0)
869 static void _subci(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
870 # define subxr(r0,r1,r2) _subxr(_jit,r0,r1,r2)
871 static void _subxr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
872 # define subxi(r0,r1,i0) _subxi(_jit,r0,r1,i0)
873 static void _subxi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
874 # define rsbi(r0, r1, i0) _rsbi(_jit, r0, r1, i0)
875 static void _rsbi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
876 # define mulr(r0,r1,r2) _mulr(_jit,r0,r1,r2)
877 static void _mulr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
878 # define muli(r0,r1,i0) _muli(_jit,r0,r1,i0)
879 static void _muli(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
880 # define qmulr(r0,r1,r2,r3) iqmulr(r0,r1,r2,r3,1)
881 # define qmulr_u(r0,r1,r2,r3) iqmulr(r0,r1,r2,r3,0)
882 # define iqmulr(r0,r1,r2,r3,cc) _iqmulr(_jit,r0,r1,r2,r3,cc)
883 static void _iqmulr(jit_state_t*,jit_int32_t,jit_int32_t,
884 jit_int32_t,jit_int32_t,jit_bool_t);
885 # define qmuli(r0,r1,r2,i0) iqmuli(r0,r1,r2,i0,1)
886 # define qmuli_u(r0,r1,r2,i0) iqmuli(r0,r1,r2,i0,0)
887 # define iqmuli(r0,r1,r2,i0,cc) _iqmuli(_jit,r0,r1,r2,i0,cc)
888 static void _iqmuli(jit_state_t*,jit_int32_t,jit_int32_t,
889 jit_int32_t,jit_word_t,jit_bool_t);
890 # define divrem(d,s,r0,r1,r2) _divrem(_jit,d,s,r0,r1,r2)
891 static void _divrem(jit_state_t*,int,int,jit_int32_t,jit_int32_t,jit_int32_t);
892 # define divr(r0,r1,r2) _divr(_jit,r0,r1,r2)
893 static void _divr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
894 # define divi(r0,r1,i0) _divi(_jit,r0,r1,i0)
895 static void _divi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
896 # define divr_u(r0,r1,r2) _divr_u(_jit,r0,r1,r2)
897 static void _divr_u(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
898 # define divi_u(r0,r1,i0) _divi_u(_jit,r0,r1,i0)
899 static void _divi_u(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
900 # define qdivr(r0,r1,r2,r3) iqdivr(r0,r1,r2,r3,1)
901 # define qdivr_u(r0,r1,r2,r3) iqdivr(r0,r1,r2,r3,0)
902 # define iqdivr(r0,r1,r2,r3,cc) _iqdivr(_jit,r0,r1,r2,r3,cc)
903 static void _iqdivr(jit_state_t*,jit_int32_t,jit_int32_t,
904 jit_int32_t,jit_int32_t,jit_bool_t);
905 # define qdivi(r0,r1,r2,i0) iqdivi(r0,r1,r2,i0,1)
906 # define qdivi_u(r0,r1,r2,i0) iqdivi(r0,r1,r2,i0,0)
907 # define iqdivi(r0,r1,r2,i0,cc) _iqdivi(_jit,r0,r1,r2,i0,cc)
908 static void _iqdivi(jit_state_t*,jit_int32_t,jit_int32_t,
909 jit_int32_t,jit_word_t,jit_bool_t);
910 # define remr(r0,r1,r2) _remr(_jit,r0,r1,r2)
911 static void _remr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
912 # define remi(r0,r1,i0) _remi(_jit,r0,r1,i0)
913 static void _remi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
914 # define remr_u(r0,r1,r2) _remr_u(_jit,r0,r1,r2)
915 static void _remr_u(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
916 # define remi_u(r0,r1,i0) _remi_u(_jit,r0,r1,i0)
917 static void _remi_u(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
918 # define andr(r0,r1,r2) _andr(_jit,r0,r1,r2)
919 static void _andr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
920 # define andi(r0,r1,i0) _andi(_jit,r0,r1,i0)
921 static void _andi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
922 # define orr(r0,r1,r2) _orr(_jit,r0,r1,r2)
923 static void _orr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
924 # define ori(r0,r1,i0) _ori(_jit,r0,r1,i0)
925 static void _ori(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
926 # define xorr(r0,r1,r2) _xorr(_jit,r0,r1,r2)
927 static void _xorr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
928 # define xori(r0,r1,i0) _xori(_jit,r0,r1,i0)
929 static void _xori(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
930 # define lshr(r0,r1,r2) _lshr(_jit,r0,r1,r2)
931 static void _lshr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
932 # define lshi(r0,r1,i0) _lshi(_jit,r0,r1,i0)
933 static void _lshi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
934 # define rshr(r0,r1,r2) _rshr(_jit,r0,r1,r2)
935 static void _rshr(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
936 # define rshi(r0,r1,i0) _rshi(_jit,r0,r1,i0)
937 static void _rshi(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
938 # define rshr_u(r0,r1,r2) _rshr_u(_jit,r0,r1,r2)
939 static void _rshr_u(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
940 # define rshi_u(r0,r1,i0) _rshi_u(_jit,r0,r1,i0)
941 static void _rshi_u(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
942 # define ccr(ct,cf,r0,r1,r2) _ccr(_jit,ct,cf,r0,r1,r2)
943 static void _ccr(jit_state_t*,int,int,jit_int32_t,jit_int32_t,jit_int32_t);
944 # define cci(ct,cf,r0,r1,i0) _cci(_jit,ct,cf,r0,r1,i0)
945 static void _cci(jit_state_t*,int,int,jit_int32_t,jit_int32_t,jit_word_t);
946 # define ltr(r0, r1, r2) ccr(ARM_CC_LT,ARM_CC_GE,r0,r1,r2)
947 # define lti(r0, r1, i0) cci(ARM_CC_LT,ARM_CC_GE,r0,r1,i0)
948 # define ltr_u(r0, r1, r2) ccr(ARM_CC_LO,ARM_CC_HS,r0,r1,r2)
949 # define lti_u(r0, r1, i0) cci(ARM_CC_LO,ARM_CC_HS,r0,r1,i0)
950 # define ler(r0, r1, r2) ccr(ARM_CC_LE,ARM_CC_GT,r0,r1,r2)
951 # define lei(r0, r1, i0) cci(ARM_CC_LE,ARM_CC_GT,r0,r1,i0)
952 # define ler_u(r0, r1, r2) ccr(ARM_CC_LS,ARM_CC_HI,r0,r1,r2)
953 # define lei_u(r0, r1, i0) cci(ARM_CC_LS,ARM_CC_HI,r0,r1,i0)
954 # define eqr(r0, r1, r2) ccr(ARM_CC_EQ,ARM_CC_NE,r0,r1,r2)
955 # define eqi(r0, r1, i0) cci(ARM_CC_EQ,ARM_CC_NE,r0,r1,i0)
956 # define ger(r0, r1, r2) ccr(ARM_CC_GE,ARM_CC_LT,r0,r1,r2)
957 # define gei(r0, r1, i0) cci(ARM_CC_GE,ARM_CC_LT,r0,r1,i0)
958 # define ger_u(r0, r1, r2) ccr(ARM_CC_HS,ARM_CC_LO,r0,r1,r2)
959 # define gei_u(r0, r1, i0) cci(ARM_CC_HS,ARM_CC_LO,r0,r1,i0)
960 # define gtr(r0, r1, r2) ccr(ARM_CC_GT,ARM_CC_LE,r0,r1,r2)
961 # define gti(r0, r1, i0) cci(ARM_CC_GT,ARM_CC_LE,r0,r1,i0)
962 # define gtr_u(r0, r1, r2) ccr(ARM_CC_HI,ARM_CC_LS,r0,r1,r2)
963 # define gti_u(r0, r1, i0) cci(ARM_CC_HI,ARM_CC_LS,r0,r1,i0)
964 # define ner(r0,r1,r2) _ner(_jit,r0,r1,r2)
965 static void _ner(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
966 # define nei(r0,r1,i0) _nei(_jit,r0,r1,i0)
967 static void _nei(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
968 # define jmpr(r0) _jmpr(_jit,r0)
969 static void _jmpr(jit_state_t*,jit_int32_t);
970 # define jmpi(i0) _jmpi(_jit,i0)
971 static void _jmpi(jit_state_t*,jit_word_t);
972 # define jmpi_p(i0, i1) _jmpi_p(_jit,i0, i1)
973 static jit_word_t _jmpi_p(jit_state_t*,jit_word_t,jit_bool_t);
974 # define bccr(cc,i0,r0,r1) _bccr(_jit,cc,i0,r0,r1)
975 static jit_word_t _bccr(jit_state_t*,int,jit_word_t,jit_int32_t,jit_int32_t);
976 # define bcci(cc,i0,r0,i1) _bcci(_jit,cc,i0,r0,i1)
977 static jit_word_t _bcci(jit_state_t*,int,jit_word_t,jit_int32_t,jit_word_t);
978 # define bltr(i0, r0, r1) bccr(ARM_CC_LT,i0,r0,r1)
979 # define blti(i0, r0, i1) bcci(ARM_CC_LT,i0,r0,i1)
980 # define bltr_u(i0, r0, r1) bccr(ARM_CC_LO,i0,r0,r1)
981 # define blti_u(i0, r0, i1) bcci(ARM_CC_LO,i0,r0,i1)
982 # define bler(i0, r0, r1) bccr(ARM_CC_LE,i0,r0,r1)
983 # define blei(i0, r0, i1) bcci(ARM_CC_LE,i0,r0,i1)
984 # define bler_u(i0, r0, r1) bccr(ARM_CC_LS,i0,r0,r1)
985 # define blei_u(i0, r0, i1) bcci(ARM_CC_LS,i0,r0,i1)
986 # define beqr(i0, r0, r1) bccr(ARM_CC_EQ,i0,r0,r1)
987 # define beqi(i0, r0, i1) bcci(ARM_CC_EQ,i0,r0,i1)
988 # define bger(i0, r0, r1) bccr(ARM_CC_GE,i0,r0,r1)
989 # define bgei(i0, r0, i1) bcci(ARM_CC_GE,i0,r0,i1)
990 # define bger_u(i0, r0, r1) bccr(ARM_CC_HS,i0,r0,r1)
991 # define bgei_u(i0, r0, i1) bcci(ARM_CC_HS,i0,r0,i1)
992 # define bgtr(i0, r0, r1) bccr(ARM_CC_GT,i0,r0,r1)
993 # define bgti(i0, r0, i1) bcci(ARM_CC_GT,i0,r0,i1)
994 # define bgtr_u(i0, r0, r1) bccr(ARM_CC_HI,i0,r0,r1)
995 # define bgti_u(i0, r0, i1) bcci(ARM_CC_HI,i0,r0,i1)
996 # define bner(i0, r0, r1) bccr(ARM_CC_NE,i0,r0,r1)
997 # define bnei(i0, r0, i1) bcci(ARM_CC_NE,i0,r0,i1)
998 # define baddr(cc,i0,r0,r1) _baddr(_jit,cc,i0,r0,r1)
999 static jit_word_t _baddr(jit_state_t*,int,jit_word_t,jit_int32_t,jit_int32_t);
1000 # define baddi(cc,i0,r0,r1) _baddi(_jit,cc,i0,r0,r1)
1001 static jit_word_t _baddi(jit_state_t*,int,jit_word_t,jit_int32_t,jit_word_t);
1002 # define boaddr(i0,r0,r1) baddr(ARM_CC_VS,i0,r0,r1)
1003 # define boaddi(i0,r0,i1) baddi(ARM_CC_VS,i0,r0,i1)
1004 # define boaddr_u(i0,r0,r1) baddr(ARM_CC_HS,i0,r0,r1)
1005 # define boaddi_u(i0,r0,i1) baddi(ARM_CC_HS,i0,r0,i1)
1006 # define bxaddr(i0,r0,r1) baddr(ARM_CC_VC,i0,r0,r1)
1007 # define bxaddi(i0,r0,i1) baddi(ARM_CC_VC,i0,r0,i1)
1008 # define bxaddr_u(i0,r0,r1) baddr(ARM_CC_LO,i0,r0,r1)
1009 # define bxaddi_u(i0,r0,i1) baddi(ARM_CC_LO,i0,r0,i1)
1010 # define bsubr(cc,i0,r0,r1) _bsubr(_jit,cc,i0,r0,r1)
1011 static jit_word_t _bsubr(jit_state_t*,int,jit_word_t,jit_int32_t,jit_int32_t);
1012 # define bsubi(cc,i0,r0,r1) _bsubi(_jit,cc,i0,r0,r1)
1013 static jit_word_t _bsubi(jit_state_t*,int,jit_word_t,jit_int32_t,jit_word_t);
1014 # define bosubr(i0,r0,r1) bsubr(ARM_CC_VS,i0,r0,r1)
1015 # define bosubi(i0,r0,i1) bsubi(ARM_CC_VS,i0,r0,i1)
1016 # define bosubr_u(i0,r0,r1) bsubr(ARM_CC_LO,i0,r0,r1)
1017 # define bosubi_u(i0,r0,i1) bsubi(ARM_CC_LO,i0,r0,i1)
1018 # define bxsubr(i0,r0,r1) bsubr(ARM_CC_VC,i0,r0,r1)
1019 # define bxsubi(i0,r0,i1) bsubi(ARM_CC_VC,i0,r0,i1)
1020 # define bxsubr_u(i0,r0,r1) bsubr(ARM_CC_HS,i0,r0,r1)
1021 # define bxsubi_u(i0,r0,i1) bsubi(ARM_CC_HS,i0,r0,i1)
1022 # define bmxr(cc,i0,r0,r1) _bmxr(_jit,cc,i0,r0,r1)
1023 static jit_word_t _bmxr(jit_state_t*,int,jit_word_t,jit_int32_t,jit_int32_t);
1024 # define bmxi(cc,i0,r0,r1) _bmxi(_jit,cc,i0,r0,r1)
1025 static jit_word_t _bmxi(jit_state_t*,int,jit_word_t,jit_int32_t,jit_word_t);
1026 # define bmsr(i0,r0,r1) bmxr(ARM_CC_NE,i0,r0,r1)
1027 # define bmsi(i0,r0,i1) bmxi(ARM_CC_NE,i0,r0,i1)
1028 # define bmcr(i0,r0,r1) bmxr(ARM_CC_EQ,i0,r0,r1)
1029 # define bmci(i0,r0,i1) bmxi(ARM_CC_EQ,i0,r0,i1)
1030 # define ldr_c(r0,r1) _ldr_c(_jit,r0,r1)
1031 static void _ldr_c(jit_state_t*,jit_int32_t,jit_int32_t);
1032 # define ldi_c(r0,i0) _ldi_c(_jit,r0,i0)
1033 static void _ldi_c(jit_state_t*,jit_int32_t,jit_word_t);
1034 # define ldxr_c(r0,r1,r2) _ldxr_c(_jit,r0,r1,r2)
1035 static void _ldxr_c(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
1036 # define ldxi_c(r0,r1,i0) _ldxi_c(_jit,r0,r1,i0)
1037 static void _ldxi_c(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
1038 # define ldr_uc(r0,r1) _ldr_uc(_jit,r0,r1)
1039 static void _ldr_uc(jit_state_t*,jit_int32_t,jit_int32_t);
1040 # define ldi_uc(r0,i0) _ldi_uc(_jit,r0,i0)
1041 static void _ldi_uc(jit_state_t*,jit_int32_t,jit_word_t);
1042 # define ldxr_uc(r0,r1,r2) _ldxr_uc(_jit,r0,r1,r2)
1043 static void _ldxr_uc(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
1044 # define ldxi_uc(r0,r1,i0) _ldxi_uc(_jit,r0,r1,i0)
1045 static void _ldxi_uc(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
1046 # define ldr_s(r0,r1) _ldr_s(_jit,r0,r1)
1047 static void _ldr_s(jit_state_t*,jit_int32_t,jit_int32_t);
1048 # define ldi_s(r0,i0) _ldi_s(_jit,r0,i0)
1049 static void _ldi_s(jit_state_t*,jit_int32_t,jit_word_t);
1050 # define ldxr_s(r0,r1,r2) _ldxr_s(_jit,r0,r1,r2)
1051 static void _ldxr_s(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
1052 # define ldxi_s(r0,r1,i0) _ldxi_s(_jit,r0,r1,i0)
1053 static void _ldxi_s(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
1054 # define ldr_us(r0,r1) _ldr_us(_jit,r0,r1)
1055 static void _ldr_us(jit_state_t*,jit_int32_t,jit_int32_t);
1056 # define ldi_us(r0,i0) _ldi_us(_jit,r0,i0)
1057 static void _ldi_us(jit_state_t*,jit_int32_t,jit_word_t);
1058 # define ldxr_us(r0,r1,r2) _ldxr_us(_jit,r0,r1,r2)
1059 static void _ldxr_us(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
1060 # define ldxi_us(r0,r1,i0) _ldxi_us(_jit,r0,r1,i0)
1061 static void _ldxi_us(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
1062 # define ldr_i(r0,r1) _ldr_i(_jit,r0,r1)
1063 static void _ldr_i(jit_state_t*,jit_int32_t,jit_int32_t);
1064 # define ldi_i(r0,i0) _ldi_i(_jit,r0,i0)
1065 static void _ldi_i(jit_state_t*,jit_int32_t,jit_word_t);
1066 # define ldxr_i(r0,r1,r2) _ldxr_i(_jit,r0,r1,r2)
1067 static void _ldxr_i(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
1068 # define ldxi_i(r0,r1,i0) _ldxi_i(_jit,r0,r1,i0)
1069 static void _ldxi_i(jit_state_t*,jit_int32_t,jit_int32_t,jit_word_t);
1070 # define str_c(r0,r1) _str_c(_jit,r0,r1)
1071 static void _str_c(jit_state_t*,jit_int32_t,jit_int32_t);
1072 # define sti_c(i0,r0) _sti_c(_jit,i0,r0)
1073 static void _sti_c(jit_state_t*,jit_word_t,jit_int32_t);
1074 # define stxr_c(r0,r1,r2) _stxr_c(_jit,r0,r1,r2)
1075 static void _stxr_c(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
1076 # define stxi_c(r0,r1,i0) _stxi_c(_jit,r0,r1,i0)
1077 static void _stxi_c(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
1078 # define str_s(r0,r1) _str_s(_jit,r0,r1)
1079 static void _str_s(jit_state_t*,jit_int32_t,jit_int32_t);
1080 # define sti_s(i0,r0) _sti_s(_jit,i0,r0)
1081 static void _sti_s(jit_state_t*,jit_word_t,jit_int32_t);
1082 # define stxr_s(r0,r1,r2) _stxr_s(_jit,r0,r1,r2)
1083 static void _stxr_s(jit_state_t*,jit_int32_t,jit_int32_t,jit_int32_t);
1084 # define stxi_s(r0,r1,i0) _stxi_s(_jit,r0,r1,i0)
1085 static void _stxi_s(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
1086 # define str_i(r0,r1) _str_i(_jit,r0,r1)
1087 static void _str_i(jit_state_t*,jit_int32_t,jit_int32_t);
1088 # define sti_i(i0,r0) _sti_i(_jit,i0,r0)
1089 static void _sti_i(jit_state_t*,jit_word_t,jit_int32_t);
1090 # define stxr_i(r0,r1,r2) _stxr_i(_jit,r0,r1,r2)
1091 static void _stxr_i(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
1092 # define stxi_i(r0,r1,i0) _stxi_i(_jit,r0,r1,i0)
1093 static void _stxi_i(jit_state_t*,jit_word_t,jit_int32_t,jit_int32_t);
1094 # if __BYTE_ORDER == __LITTLE_ENDIAN
1095 # define htonr_us(r0,r1) _htonr_us(_jit,r0,r1)
1096 static void _htonr_us(jit_state_t*,jit_int32_t,jit_int32_t);
1097 # define htonr_ui(r0,r1) _htonr_ui(_jit,r0,r1)
1098 static void _htonr_ui(jit_state_t*,jit_int32_t,jit_int32_t);
1099 # else
1100 # define htonr_us(r0,r1) extr_us(r0,r1)
1101 # define htonr(r0,r1) movr(r0,r1)
1102 # endif
1103 # define extr_c(r0,r1) _extr_c(_jit,r0,r1)
1104 static void _extr_c(jit_state_t*,jit_int32_t,jit_int32_t);
1105 # define extr_uc(r0,r1) _extr_uc(_jit,r0,r1)
1106 static void _extr_uc(jit_state_t*,jit_int32_t,jit_int32_t);
1107 # define extr_s(r0,r1) _extr_s(_jit,r0,r1)
1108 static void _extr_s(jit_state_t*,jit_int32_t,jit_int32_t);
1109 # define extr_us(r0,r1) _extr_us(_jit,r0,r1)
1110 static void _extr_us(jit_state_t*,jit_int32_t,jit_int32_t);
1111 # define prolog(i0) _prolog(_jit,i0)
1112 static void _prolog(jit_state_t*,jit_node_t*);
1113 # define epilog(i0) _epilog(_jit,i0)
1114 static void _epilog(jit_state_t*,jit_node_t*);
1115 # define callr(r0) _callr(_jit,r0)
1116 static void _callr(jit_state_t*,jit_int32_t);
1117 # define calli(i0) _calli(_jit,i0)
1118 static void _calli(jit_state_t*,jit_word_t);
1119 # define calli_p(i0) _calli_p(_jit,i0)
1120 static jit_word_t _calli_p(jit_state_t*,jit_word_t);
1121 # define vastart(r0) _vastart(_jit, r0)
1122 static void _vastart(jit_state_t*, jit_int32_t);
1123 # define vaarg(r0, r1) _vaarg(_jit, r0, r1)
1124 static void _vaarg(jit_state_t*, jit_int32_t, jit_int32_t);
1125 # define patch_at(kind,jump,label) _patch_at(_jit,kind,jump,label)
1126 static void _patch_at(jit_state_t*,jit_int32_t,jit_word_t,jit_word_t);
1127 #endif
1128
1129 #if CODE
/* from binutils */
/*
 * Rotate the 32-bit unsigned value v left by n bits, 0 <= n < 32.
 * The right-shift count is masked with 31 so that n == 0 yields v itself
 * instead of evaluating `v >> 32', which is undefined for a 32-bit type.
 */
# define rotate_left(v, n) (((v) << (n)) | ((v) >> ((32 - (n)) & 31)))

/*
 * Look for an even left rotation i (0, 2, ..., 30) that brings v into the
 * range 0..0xff.
 *
 * Returns the rotated 8-bit value OR-ed with (i << 7), i.e. i/2 stored in
 * bits 11:8, for the first such rotation; returns -1 if none exists.
 */
static int
encode_arm_immediate(unsigned int v)
{
    unsigned int a, i;

    for (i = 0; i < 32; i += 2)
        if ((a = rotate_left(v, i)) <= 0xff)
            return (a | (i << 7));

    return (-1);
}
1143
/*
 * Try to express v as a Thumb-2 modified immediate.
 *
 * Recognized shapes, tried in this order:
 *   - a plain byte                          -> selector 0 in bits 14:12
 *   - 00 XY 00 XY                           -> selector 1
 *   - XY 00 XY 00                           -> selector 2
 *   - XY XY XY XY                           -> selector 3
 *   - an 8-bit value with its top bit set, positioned by the loop below
 *
 * Returns the encoded field bits (byte in bits 7:0, selector/rotation in
 * bits 14:12 and bit 26), or -1 when v matches none of the shapes.
 */
static int
encode_thumb_immediate(unsigned int v)
{
    int i;
    unsigned int m;
    unsigned int n;

    /* 00000000 00000000 00000000 abcdefgh */
    if ((v & 0xff) == v)
        return (v);
    /* 00000000 abcdefgh 00000000 abcdefgh */
    if ((v & 0xff00ff) == v && ((v & 0xff0000) >> 16) == (v & 0xff))
        return ((v & 0xff) | (1 << 12));
    /* abcdefgh 00000000 abcdefgh 00000000 */
    if (((v & 0xffff0000) >> 16) == (v & 0xffff) && (v & 0xff) == 0)
        /* The low byte is zero in this shape, so abcdefgh must be taken
         * from bits 15:8; using (v & 0xff) always encoded a zero byte. */
        return (((v & 0x0000ff00) >> 8) | (2 << 12));
    /* abcdefgh abcdefgh abcdefgh abcdefgh */
    if ( (v & 0xff) == ((v & 0xff00) >> 8) &&
        ((v & 0xff00) >> 8) == ((v & 0xff0000) >> 16) &&
        ((v & 0xff0000) << 8) == (v & 0xff000000))
        return ((v & 0xff) | (3 << 12));
    /* 1bcdefgh << 24 ... 1bcdefgh << 1 */
    /* NOTE(review): the loop ends at i == 22, so windows below
     * 0xff << 10 are never tried and such values yield -1 even though the
     * comment above suggests going down to `<< 1'; confirm whether the
     * bound was meant to be 32. */
    for (i = 8, m = 0xff000000, n = 0x80000000;
         i < 23; i++, m >>= 1, n >>= 1) {
        /* v fits entirely in the 8-bit window m and its top bit n is set */
        if ((v & m) == v && (v & n)) {
            v >>= 32 - i;
            /* bit 7 of the byte doubles as the low bit of the rotation:
             * the leading 1 is kept for odd i and cleared for even i */
            if (!(i & 1))
                v &= 0x7f;
            i >>= 1;
            return (((i & 7) << 12) | ((i & 8) << 23) | v);
        }
    }
    return (-1);
}
1177
/*
 * Scatter a 12-bit value into three fields: bit 11 moves to bit 26,
 * bits 10:8 move to bits 14:12 and bits 7:0 stay in place.
 * Returns -1 when v does not fit in 12 bits.
 */
static int
encode_thumb_word_immediate(unsigned int v)
{
    unsigned int top, mid, low;

    if (v & 0xfffff000)
        return (-1);

    top = (v & 0x800) << 15;
    mid = (v & 0x700) << 4;
    low = v & 0xff;
    return (top | mid | low);
}
1185
/*
 * Encode a signed 24-bit displacement v into branch field bits.
 *
 * Bit 23 of v becomes the sign bit (bit 26 of the result), bits 20:11 go
 * to bits 25:16 and bits 10:0 stay in place.  Bits 22 and 21 are stored
 * in bits 13 and 11 as-is when the sign bit is set and inverted otherwise.
 * Returns -1 when v is outside -0x800000..0x7fffff.
 */
static int
encode_thumb_jump(int v)
{
    int sign, j1, j2;

    if (v < (int)-0x800000 || v > 0x7fffff)
        return (-1);

    sign = (v & 0x800000) != 0;
    /* equal to the sign bit <=> (sign ? bit : !bit) */
    j1 = ((v & 0x400000) != 0) == sign;
    j2 = ((v & 0x200000) != 0) == sign;

    return ((sign << 26) | ((v & 0x1ff800) << 5) |
            (j1 << 13) | (j2 << 11) | (v & 0x7ff));
}
1200
/*
 * Encode a signed 20-bit displacement v into conditional-branch field
 * bits: bit 19 -> bit 26, bit 17 -> bit 13, bit 18 -> bit 11,
 * bits 16:11 -> bits 21:16, bits 10:0 unchanged.
 * Returns -1 when v is outside -0x80000..0x7ffff.
 */
static int
encode_thumb_cc_jump(int v)
{
    int sign, j1, j2;

    if (v < (int)-0x80000 || v > 0x7ffff)
        return (-1);

    sign = (v & 0x80000) != 0;
    j1 = (v & 0x20000) != 0;
    j2 = (v & 0x40000) != 0;

    return ((sign << 26) | ((v & 0x1f800) << 5) |
            (j1 << 13) | (j2 << 11) | (v & 0x7ff));
}
1213
1214 static int
encode_thumb_shift(int v,int type)1215 encode_thumb_shift(int v, int type)
1216 {
1217 switch (type) {
1218 case ARM_ASR:
1219 case ARM_LSL:
1220 case ARM_LSR: type >>= 1; break;
1221 default: assert(!"handled shift");
1222 }
1223 assert(v >= 0 && v <= 31);
1224 return (((v & 0x1c) << 10) | ((v & 3) << 6) | type);
1225 }
1226
1227 static void
_tcit(jit_state_t * _jit,unsigned int tc,int it)1228 _tcit(jit_state_t *_jit, unsigned int tc, int it)
1229 {
1230 int c;
1231 int m;
1232 c = (tc >> 28) & 1;
1233 assert(!(tc & 0xfffffff) && tc != ARM_CC_NV);
1234 switch (it) {
1235 case THUMB2_IT: m = 1<<3; break;
1236 case THUMB2_ITT: m = (c<<3)| (1<<2); break;
1237 case THUMB2_ITE: m = (!c<<3)| (1<<2); break;
1238 case THUMB2_ITTT: m = (c<<3)| (c<<2)| (1<<1); break;
1239 case THUMB2_ITET: m = (!c<<3)| (c<<2)| (1<<1); break;
1240 case THUMB2_ITTE: m = (c<<3)|(!c<<2)| (1<<1); break;
1241 case THUMB2_ITEE: m = (!c<<3)|(!c<<2)| (1<<1); break;
1242 case THUMB2_ITTTT: m = (c<<3)| (c<<2)| (c<<1)|1; break;
1243 case THUMB2_ITETT: m = (!c<<3)| (c<<2)| (c<<1)|1; break;
1244 case THUMB2_ITTET: m = (c<<3)|(!c<<2)| (c<<1)|1; break;
1245 case THUMB2_ITEET: m = (!c<<3)|(!c<<2)| (c<<1)|1; break;
1246 case THUMB2_ITTTE: m = (c<<3)| (c<<2)|(!c<<1)|1; break;
1247 case THUMB2_ITETE: m = (!c<<3)| (c<<2)|(!c<<1)|1; break;
1248 case THUMB2_ITTEE: m = (c<<3)|(!c<<2)|(!c<<1)|1; break;
1249 case THUMB2_ITEEE: m = (!c<<3)|(!c<<2)|(!c<<1)|1; break;
1250 default: abort();
1251 }
1252 assert(m && (tc != ARM_CC_AL || !(m & (m - 1))));
1253 is(0xbf00 | (tc >> 24) | m);
1254 }
1255
1256 static void
_corrr(jit_state_t * _jit,int cc,int o,int rn,int rd,int rm)1257 _corrr(jit_state_t *_jit, int cc, int o, int rn, int rd, int rm)
1258 {
1259 assert(!(cc & 0x0fffffff));
1260 assert(!(o & 0xf00fff0f));
1261 ii(cc|o|(_u4(rn)<<16)|(_u4(rd)<<12)|_u4(rm));
1262 }
1263
1264 static void
_corri(jit_state_t * _jit,int cc,int o,int rn,int rd,int im)1265 _corri(jit_state_t *_jit, int cc, int o, int rn, int rd, int im)
1266 {
1267 assert(!(cc & 0x0fffffff));
1268 assert(!(o & 0xf00fffff));
1269 assert(!(im & 0xfffff000));
1270 ii(cc|o|(_u4(rn)<<16)|(_u4(rd)<<12)|_u12(im));
1271 }
1272
1273 static void
_corri8(jit_state_t * _jit,int cc,int o,int rn,int rt,int im)1274 _corri8(jit_state_t *_jit, int cc, int o, int rn, int rt, int im)
1275 {
1276 assert(!(cc & 0x0fffffff));
1277 assert(!(o & 0xf00fff0f));
1278 assert(!(im & 0xffffff00));
1279 ii(cc|o|(_u4(rn)<<16)|(_u4(rt)<<12)|((im&0xf0)<<4)|(im&0x0f));
1280 }
1281
1282 static void
_coriw(jit_state_t * _jit,int cc,int o,int rd,int im)1283 _coriw(jit_state_t *_jit, int cc, int o, int rd, int im)
1284 {
1285 assert(!(cc & 0x0fffffff));
1286 assert(!(o & 0xf00fffff));
1287 assert(!(im & 0xffff0000));
1288 ii(cc|o|((im&0xf000)<<4)|(_u4(rd)<<12)|(im&0xfff));
1289 }
1290
1291 static void
_torrr(jit_state_t * _jit,int o,int rn,int rd,int rm)1292 _torrr(jit_state_t *_jit, int o, int rn, int rd, int rm)
1293 {
1294 jit_thumb_t thumb;
1295 assert(!(o & 0xf0f0f));
1296 thumb.i = o|(_u4(rn)<<16)|(_u4(rd)<<8)|_u4(rm);
1297 iss(thumb.s[0], thumb.s[1]);
1298 }
1299
1300 static void
_torrrs(jit_state_t * _jit,int o,int rn,int rd,int rm,int im)1301 _torrrs(jit_state_t *_jit, int o, int rn, int rd, int rm, int im)
1302 {
1303 jit_thumb_t thumb;
1304 assert(!(o & 0x000f0f0f));
1305 assert(!(im & 0xffff8f0f));
1306 thumb.i = o|(_u4(rn)<<16)|(_u4(rd)<<8)|im|_u4(rm);
1307 iss(thumb.s[0], thumb.s[1]);
1308 }
1309
1310 static void
_torxr(jit_state_t * _jit,int o,int rn,int rt,int rm)1311 _torxr(jit_state_t *_jit, int o, int rn, int rt, int rm)
1312 {
1313 jit_thumb_t thumb;
1314 assert(!(o & 0xf0f0f));
1315 thumb.i = o|(_u4(rn)<<16)|(_u4(rt)<<12)|_u4(rm);
1316 iss(thumb.s[0], thumb.s[1]);
1317 }
1318
1319 static void
_torrrr(jit_state_t * _jit,int o,int rn,int rl,int rh,int rm)1320 _torrrr(jit_state_t *_jit, int o, int rn, int rl, int rh, int rm)
1321 {
1322 jit_thumb_t thumb;
1323 assert(!(o & 0x000fff0f));
1324 thumb.i = o|(_u4(rn)<<16)|(_u4(rl)<<12)|(_u4(rh)<<8)|_u4(rm);
1325 iss(thumb.s[0], thumb.s[1]);
1326 }
1327
1328 static void
_torrri8(jit_state_t * _jit,int o,int rn,int rt,int rt2,int im)1329 _torrri8(jit_state_t *_jit, int o, int rn, int rt, int rt2, int im)
1330 {
1331 jit_thumb_t thumb;
1332 assert(!(o & 0x000fffff));
1333 assert(!(im & 0xffffff00));
1334 thumb.i = o|(_u4(rn)<<16)|(_u4(rt)<<12)|(_u4(rt2)<<8)|im;
1335 iss(thumb.s[0], thumb.s[1]);
1336 }
1337
1338 static void
_torri(jit_state_t * _jit,int o,int rn,int rd,int im)1339 _torri(jit_state_t *_jit, int o, int rn, int rd, int im)
1340 {
1341 jit_thumb_t thumb;
1342 assert(!(o & 0x0c0f7fff));
1343 assert(!(im & 0xfbff8f00));
1344 thumb.i = o|(_u4(rn)<<16)|(_u4(rd)<<8)|im;
1345 iss(thumb.s[0], thumb.s[1]);
1346 }
1347
1348 static void
_torri8(jit_state_t * _jit,int o,int rn,int rt,int im)1349 _torri8(jit_state_t *_jit, int o, int rn, int rt, int im)
1350 {
1351 jit_thumb_t thumb;
1352 assert(!(o & 0x000ff0ff));
1353 assert(!(im & 0xffffff00));
1354 thumb.i = o|(_u4(rn)<<16)|(_u4(rt)<<12)|im;
1355 iss(thumb.s[0], thumb.s[1]);
1356 }
1357
1358 static void
_torri12(jit_state_t * _jit,int o,int rn,int rt,int im)1359 _torri12(jit_state_t *_jit, int o, int rn, int rt, int im)
1360 {
1361 jit_thumb_t thumb;
1362 assert(!(o & 0x000fffff));
1363 assert(!(im & 0xfffff000));
1364 thumb.i = o|(_u4(rn)<<16)|(_u4(rt)<<12)|im;
1365 iss(thumb.s[0], thumb.s[1]);
1366 }
1367
1368 static void
_tshift(jit_state_t * _jit,int o,int rd,int rm,int im)1369 _tshift(jit_state_t *_jit, int o, int rd, int rm, int im)
1370 {
1371 jit_thumb_t thumb;
1372 assert(!(o & 0x7fcf));
1373 assert(im >= 0 && im < 32);
1374 thumb.i = o|((im&0x1c)<<10)|(_u4(rd)<<8)|((im&3)<<6)|_u4(rm);
1375 iss(thumb.s[0], thumb.s[1]);
1376 }
1377
1378 static void
_toriw(jit_state_t * _jit,int o,int rd,int im)1379 _toriw(jit_state_t *_jit, int o, int rd, int im)
1380 {
1381 jit_thumb_t thumb;
1382 assert(!(im & 0xffff0000));
1383 thumb.i = o|((im&0xf000)<<4)|((im&0x800)<<15)|((im&0x700)<<4)|(_u4(rd)<<8)|(im&0xff);
1384 iss(thumb.s[0], thumb.s[1]);
1385 }
1386
1387 static void
_tc8(jit_state_t * _jit,int cc,int im)1388 _tc8(jit_state_t *_jit, int cc, int im)
1389 {
1390 assert(!(cc & 0x0fffffff));
1391 assert(cc != ARM_CC_AL && cc != ARM_CC_NV);
1392 assert(im >= -128 && im <= 127);
1393 is(THUMB_CC_B|(cc>>20)|(im&0xff));
1394 }
1395
1396 static void
_t11(jit_state_t * _jit,int im)1397 _t11(jit_state_t *_jit, int im)
1398 {
1399 assert(!(im & 0xfffff800));
1400 is(THUMB_B|im);
1401 }
1402
1403 static void
_tcb(jit_state_t * _jit,int cc,int im)1404 _tcb(jit_state_t *_jit, int cc, int im)
1405 {
1406 jit_thumb_t thumb;
1407 assert(!(cc & 0xfffffff));
1408 assert(cc != ARM_CC_AL && cc != ARM_CC_NV);
1409 cc = ((jit_uint32_t)cc) >> 6;
1410 assert(!(im & (THUMB2_CC_B|cc)));
1411 thumb.i = THUMB2_CC_B|cc|im;
1412 iss(thumb.s[0], thumb.s[1]);
1413 }
1414
1415 static void
_blxi(jit_state_t * _jit,int im)1416 _blxi(jit_state_t *_jit, int im)
1417 {
1418 assert(!(im & 0xfe000000));
1419 ii(ARM_BLXI|im);
1420 }
1421
1422 static void
_tb(jit_state_t * _jit,int o,int im)1423 _tb(jit_state_t *_jit, int o, int im)
1424 {
1425 jit_thumb_t thumb;
1426 assert(!(o & 0x07ff2fff));
1427 assert(!(o & im));
1428 thumb.i = o|im;
1429 iss(thumb.s[0], thumb.s[1]);
1430 }
1431
1432 static void
_corrrr(jit_state_t * _jit,int cc,int o,int rh,int rl,int rm,int rn)1433 _corrrr(jit_state_t *_jit, int cc, int o, int rh, int rl, int rm, int rn)
1434 {
1435 assert(!(cc & 0x0fffffff));
1436 assert(!(o & 0xf00fff0f));
1437 ii(cc|o|(_u4(rh)<<16)|(_u4(rl)<<12)|(_u4(rm)<<8)|_u4(rn));
1438 }
1439
1440 static void
_corrrs(jit_state_t * _jit,int cc,int o,int rn,int rd,int rm,int im)1441 _corrrs(jit_state_t *_jit, int cc, int o, int rn, int rd, int rm, int im)
1442 {
1443 assert(!(cc & 0x0fffffff));
1444 assert(!(o & 0xf000ff8f));
1445 ii(cc|o|(_u4(rd)<<12)|(_u4(rn)<<16)|(im<<7)|_u4(rm));
1446 }
1447
1448 static void
_cshift(jit_state_t * _jit,int cc,int o,int rd,int rm,int rn,int im)1449 _cshift(jit_state_t *_jit, int cc, int o, int rd, int rm, int rn, int im)
1450 {
1451 assert(!(cc & 0x0fffffff));
1452 assert(!(o & 0xffe0ff8f));
1453 assert(((_u4(rm)<<8)&(im<<7)) == 0);
1454 ii(cc|ARM_SHIFT|o|(_u4(rd)<<12)|(_u4(rm)<<8)|(im<<7)|_u4(rn));
1455 }
1456
1457 static void
_cb(jit_state_t * _jit,int cc,int o,int im)1458 _cb(jit_state_t *_jit, int cc, int o, int im)
1459 {
1460 assert(!(cc & 0x0fffffff));
1461 assert(!(o & 0xf0ffffff));
1462 ii(cc|o|_u24(im));
1463 }
1464
1465 static void
_cbx(jit_state_t * _jit,int cc,int o,int rm)1466 _cbx(jit_state_t *_jit, int cc, int o, int rm)
1467 {
1468 assert(!(cc & 0x0fffffff));
1469 assert(!(o & 0xf000000f));
1470 ii(cc|o|_u4(rm));
1471 }
1472
1473 static void
_corl(jit_state_t * _jit,int cc,int o,int r0,int i0)1474 _corl(jit_state_t *_jit, int cc, int o, int r0, int i0)
1475 {
1476 assert(!(cc & 0x0fffffff));
1477 assert(!(o & 0xf00fffff));
1478 ii(cc|o|(_u4(r0)<<16)|_u16(i0));
1479 }
1480
1481 static void
_c6orr(jit_state_t * _jit,int cc,int o,int rd,int rm)1482 _c6orr(jit_state_t *_jit, int cc, int o, int rd, int rm)
1483 {
1484 assert(!(cc & 0x0fffffff));
1485 assert(!(o & 0xf000f00f));
1486 ii(cc|o|(_u4(rd)<<12)|_u4(rm));
1487 }
1488
1489 static void
_tpp(jit_state_t * _jit,int o,int im)1490 _tpp(jit_state_t *_jit, int o, int im)
1491 {
1492 jit_thumb_t thumb;
1493 assert(!(o & 0x0000ffff));
1494 if (o == THUMB2_PUSH)
1495 assert(!(im & 0x8000));
1496 assert(__builtin_popcount(im & 0x1fff) > 1);
1497 thumb.i = o|im;
1498 iss(thumb.s[0], thumb.s[1]);
1499 }
1500
1501 static void
_torl(jit_state_t * _jit,int o,int rn,int im)1502 _torl(jit_state_t *_jit, int o, int rn, int im)
1503 {
1504 jit_thumb_t thumb;
1505 assert(!(o & 0xf1fff));
1506 assert(rn != _R15 || !im || ((o & 0xc000) == 0xc000));
1507 assert(!(o & THUMB2_LDM_W) || !(im & (1 << rn)));
1508 thumb.i = o | (_u4(rn)<<16)|_u13(im);
1509 iss(thumb.s[0], thumb.s[1]);
1510 }
1511
1512 static void
_nop(jit_state_t * _jit,jit_int32_t i0)1513 _nop(jit_state_t *_jit, jit_int32_t i0)
1514 {
1515 if (jit_thumb_p()) {
1516 for (; i0 > 0; i0 -= 2)
1517 T1_NOP();
1518 }
1519 else {
1520 for (; i0 > 0; i0 -= 4)
1521 NOP();
1522 }
1523 assert(i0 == 0);
1524 }
1525
1526 static void
_movr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)1527 _movr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
1528 {
1529 if (r0 != r1) {
1530 if (jit_thumb_p())
1531 T1_MOV(r0, r1);
1532 else
1533 MOV(r0, r1);
1534 }
1535 }
1536
1537 static void
_movi(jit_state_t * _jit,jit_int32_t r0,jit_word_t i0)1538 _movi(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
1539 {
1540 int i;
1541 if (jit_thumb_p()) {
1542 if (!jit_no_set_flags() && r0 < 8 && !(i0 & 0xffffff80))
1543 T1_MOVI(r0, i0);
1544 else if ((i = encode_thumb_immediate(i0)) != -1)
1545 T2_MOVI(r0, i);
1546 else if ((i = encode_thumb_immediate(~i0)) != -1)
1547 T2_MVNI(r0, i);
1548 else {
1549 T2_MOVWI(r0, (jit_uint16_t)i0);
1550 if (i0 & 0xffff0000)
1551 T2_MOVTI(r0, (jit_uint16_t)((unsigned)i0 >> 16));
1552 }
1553 }
1554 else {
1555 if (jit_armv6_p() && !(i0 & 0xffff0000))
1556 MOVWI(r0, i0);
1557 else if ((i = encode_arm_immediate(i0)) != -1)
1558 MOVI(r0, i);
1559 else if ((i = encode_arm_immediate(~i0)) != -1)
1560 MVNI(r0, i);
1561 else if (jit_armv6_p()) {
1562 MOVWI(r0, (jit_uint16_t)(i0));
1563 if ((i0 & 0xffff0000))
1564 MOVTI(r0, (jit_uint16_t)((unsigned)i0 >> 16));
1565 }
1566 else
1567 load_const(0, r0, i0);
1568 }
1569 }
1570
1571 static jit_word_t
_movi_p(jit_state_t * _jit,jit_int32_t r0,jit_word_t i0)1572 _movi_p(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
1573 {
1574 jit_word_t w;
1575 w = _jit->pc.w;
1576 if (jit_thumb_p()) {
1577 T2_MOVWI(r0, (jit_uint16_t)(i0));
1578 T2_MOVTI(r0, (jit_uint16_t)((unsigned)i0 >> 16));
1579 }
1580 else
1581 load_const(1, r0, 0);
1582 return (w);
1583 }
1584
1585 static void
_comr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)1586 _comr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
1587 {
1588 if (jit_thumb_p()) {
1589 if (!jit_no_set_flags() && (r0|r1) < 8)
1590 T1_NOT(r0, r1);
1591 else
1592 T2_NOT(r0, r1);
1593 }
1594 else
1595 NOT(r0, r1);
1596 }
1597
1598 static void
_negr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)1599 _negr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
1600 {
1601 if (jit_thumb_p()) {
1602 if (!jit_no_set_flags() && (r0|r1) < 8)
1603 T1_RSBI(r0, r1);
1604 else
1605 T2_RSBI(r0, r1, 0);
1606 }
1607 else
1608 RSBI(r0, r1, 0);
1609 }
1610
1611 static void
_addr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)1612 _addr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1613 {
1614 if (jit_thumb_p()) {
1615 if (!jit_no_set_flags() && (r0|r1|r2) < 8)
1616 T1_ADD(r0, r1, r2);
1617 else if (r0 == r1 || r0 == r2)
1618 T1_ADDX(r0, r0 == r1 ? r2 : r1);
1619 else
1620 T2_ADD(r0, r1, r2);
1621 }
1622 else
1623 ADD(r0, r1, r2);
1624 }
1625
1626 static void
_addi(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)1627 _addi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1628 {
1629 int i;
1630 jit_int32_t reg;
1631 if (jit_thumb_p()) {
1632 if (!jit_no_set_flags() && (r0|r1) < 8 && !(i0 & ~7))
1633 T1_ADDI3(r0, r1, i0);
1634 else if (!jit_no_set_flags() && (r0|r1) < 8 && !(-i0 & ~7))
1635 T1_SUBI3(r0, r1, -i0);
1636 else if (!jit_no_set_flags() && r0 < 8 && r0 == r1 && !(i0 & ~0xff))
1637 T1_ADDI8(r0, i0);
1638 else if (!jit_no_set_flags() && r0 < 8 && r0 == r1 && !(-i0 & ~0xff))
1639 T1_SUBI8(r0, -i0);
1640 else if ((i = encode_thumb_immediate(i0)) != -1)
1641 T2_ADDI(r0, r1, i);
1642 else if ((i = encode_thumb_immediate(-i0)) != -1)
1643 T2_SUBI(r0, r1, i);
1644 else if ((i = encode_thumb_word_immediate(i0)) != -1)
1645 T2_ADDWI(r0, r1, i);
1646 else if ((i = encode_thumb_word_immediate(-i0)) != -1)
1647 T2_SUBWI(r0, r1, i);
1648 else {
1649 reg = jit_get_reg(jit_class_gpr);
1650 movi(rn(reg), i0);
1651 T2_ADD(r0, r1, rn(reg));
1652 jit_unget_reg(reg);
1653 }
1654 }
1655 else {
1656 if ((i = encode_arm_immediate(i0)) != -1)
1657 ADDI(r0, r1, i);
1658 else if ((i = encode_arm_immediate(-i0)) != -1)
1659 SUBI(r0, r1, i);
1660 else if (r0 != r1) {
1661 movi(r0, i0);
1662 ADD(r0, r1, r0);
1663 }
1664 else {
1665 reg = jit_get_reg(jit_class_gpr);
1666 movi(rn(reg), i0);
1667 ADD(r0, r1, rn(reg));
1668 jit_unget_reg(reg);
1669 }
1670 }
1671 }
1672
1673 static void
_addcr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)1674 _addcr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1675 {
1676 if (jit_thumb_p()) {
1677 /* thumb auto set carry if not inside IT block */
1678 if ((r0|r1|r2) < 8)
1679 T1_ADD(r0, r1, r2);
1680 else
1681 T2_ADDS(r0, r1, r2);
1682 }
1683 else
1684 ADDS(r0, r1, r2);
1685 }
1686
1687 static void
_addci(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)1688 _addci(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1689 {
1690 int i;
1691 jit_int32_t reg;
1692 if (jit_thumb_p()) {
1693 if ((r0|r1) < 8 && !(i0 & ~7))
1694 T1_ADDI3(r0, r1, i0);
1695 else if ((r0|r1) < 8 && !(-i0 & ~7))
1696 T1_SUBI3(r0, r1, -i0);
1697 else if (r0 < 8 && r0 == r1 && !(i0 & ~0xff))
1698 T1_ADDI8(r0, i0);
1699 else if (r0 < 8 && r0 == r1 && !(-i0 & ~0xff))
1700 T1_SUBI8(r0, -i0);
1701 else if ((i = encode_thumb_immediate(i0)) != -1)
1702 T2_ADDSI(r0, r1, i);
1703 else if ((i = encode_thumb_immediate(-i0)) != -1)
1704 T2_SUBSI(r0, r1, i);
1705 else {
1706 reg = jit_get_reg(jit_class_gpr);
1707 movi(rn(reg), i0);
1708 T2_ADDS(r0, r1, rn(reg));
1709 jit_unget_reg(reg);
1710 }
1711 }
1712 else {
1713 if ((i = encode_arm_immediate(i0)) != -1)
1714 ADDSI(r0, r1, i);
1715 else if ((i = encode_arm_immediate(-i0)) != -1)
1716 SUBSI(r0, r1, i);
1717 else if (r0 != r1) {
1718 movi(r0, i0);
1719 ADDS(r0, r1, r0);
1720 }
1721 else {
1722 reg = jit_get_reg(jit_class_gpr);
1723 movi(rn(reg), i0);
1724 ADDS(r0, r1, rn(reg));
1725 jit_unget_reg(reg);
1726 }
1727 }
1728 }
1729
1730 static void
_addxr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)1731 _addxr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1732 {
1733 /* keep setting carry because don't know last ADC */
1734 if (jit_thumb_p()) {
1735 /* thumb auto set carry if not inside IT block */
1736 if ((r0|r1|r2) < 8 && (r0 == r1 || r0 == r2))
1737 T1_ADC(r0, r0 == r1 ? r2 : r1);
1738 else
1739 T2_ADCS(r0, r1, r2);
1740 }
1741 else
1742 ADCS(r0, r1, r2);
1743 }
1744
1745 static void
_addxi(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)1746 _addxi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1747 {
1748 int i;
1749 jit_int32_t reg;
1750 int no_set_flags;
1751 if (jit_thumb_p()) {
1752 no_set_flags = jit_no_set_flags();
1753 jit_no_set_flags() = 1;
1754 if ((i = encode_thumb_immediate(i0)) != -1)
1755 T2_ADCSI(r0, r1, i);
1756 else if ((i = encode_thumb_immediate(-i0)) != -1)
1757 T2_SBCSI(r0, r1, i);
1758 else if (r0 != r1) {
1759 movi(r0, i0);
1760 T2_ADCS(r0, r1, r0);
1761 }
1762 else {
1763 reg = jit_get_reg(jit_class_gpr);
1764 movi(rn(reg), i0);
1765 T2_ADCS(r0, r1, rn(reg));
1766 jit_unget_reg(reg);
1767 }
1768 jit_no_set_flags() = no_set_flags;
1769 }
1770 else {
1771 if ((i = encode_arm_immediate(i0)) != -1)
1772 ADCSI(r0, r1, i);
1773 else if ((i = encode_arm_immediate(-i0)) != -1)
1774 SBCSI(r0, r1, i);
1775 else if (r0 != r1) {
1776 movi(r0, i0);
1777 ADCS(r0, r1, r0);
1778 }
1779 else {
1780 reg = jit_get_reg(jit_class_gpr);
1781 movi(rn(reg), i0);
1782 ADCS(r0, r1, rn(reg));
1783 jit_unget_reg(reg);
1784 }
1785 }
1786 }
1787
1788 static void
_subr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)1789 _subr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1790 {
1791 if (jit_thumb_p()) {
1792 if (!jit_no_set_flags() && (r0|r1|r2) < 8)
1793 T1_SUB(r0, r1, r2);
1794 else
1795 T2_SUB(r0, r1, r2);
1796 }
1797 else
1798 SUB(r0, r1, r2);
1799 }
1800
1801 static void
_subi(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)1802 _subi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1803 {
1804 int i;
1805 jit_int32_t reg;
1806 if (jit_thumb_p()) {
1807 if (!jit_no_set_flags() && (r0|r1) < 8 && !(i0 & ~7))
1808 T1_SUBI3(r0, r1, i0);
1809 else if (!jit_no_set_flags() && (r0|r1) < 8 && !(-i0 & ~7))
1810 T1_ADDI3(r0, r1, -i0);
1811 else if (!jit_no_set_flags() && r0 < 8 && r0 == r1 && !(i0 & ~0xff))
1812 T1_SUBI8(r0, i0);
1813 else if (!jit_no_set_flags() && r0 < 8 && r0 == r1 && !(-i0 & ~0xff))
1814 T1_ADDI8(r0, -i0);
1815 else if ((i = encode_thumb_immediate(i0)) != -1)
1816 T2_SUBI(r0, r1, i);
1817 else if ((i = encode_thumb_immediate(-i0)) != -1)
1818 T2_ADDI(r0, r1, i);
1819 else if ((i = encode_thumb_word_immediate(i0)) != -1)
1820 T2_SUBWI(r0, r1, i);
1821 else if ((i = encode_thumb_word_immediate(-i0)) != -1)
1822 T2_ADDWI(r0, r1, i);
1823 else {
1824 reg = jit_get_reg(jit_class_gpr);
1825 movi(rn(reg), i0);
1826 T2_SUB(r0, r1, rn(reg));
1827 jit_unget_reg(reg);
1828 }
1829 }
1830 else {
1831 if ((i = encode_arm_immediate(i0)) != -1)
1832 SUBI(r0, r1, i);
1833 else if ((i = encode_arm_immediate(-i0)) != -1)
1834 ADDI(r0, r1, i);
1835 else if (r0 != r1) {
1836 movi(r0, i0);
1837 SUB(r0, r1, r0);
1838 }
1839 else {
1840 reg = jit_get_reg(jit_class_gpr);
1841 movi(rn(reg), i0);
1842 SUB(r0, r1, rn(reg));
1843 jit_unget_reg(reg);
1844 }
1845 }
1846 }
1847
1848 static void
_subcr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)1849 _subcr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1850 {
1851 if (jit_thumb_p()) {
1852 /* thumb auto set carry if not inside IT block */
1853 if ((r0|r1|r2) < 8)
1854 T1_SUB(r0, r1, r2);
1855 else
1856 T2_SUBS(r0, r1, r2);
1857 }
1858 else
1859 SUBS(r0, r1, r2);
1860 }
1861
1862 static void
_subci(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)1863 _subci(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1864 {
1865 int i;
1866 jit_int32_t reg;
1867 if (jit_thumb_p()) {
1868 if ((r0|r1) < 8 && !(i0 & ~7))
1869 T1_SUBI3(r0, r1, i0);
1870 else if ((r0|r1) < 8 && !(-i0 & ~7))
1871 T1_ADDI3(r0, r1, -i0);
1872 else if (r0 < 8 && r0 == r1 && !(i0 & ~0xff))
1873 T1_SUBI8(r0, i0);
1874 else if (r0 < 8 && r0 == r1 && !(-i0 & ~0xff))
1875 T1_ADDI8(r0, -i0);
1876 else if ((i = encode_thumb_immediate(i0)) != -1)
1877 T2_SUBSI(r0, r1, i);
1878 else if ((i = encode_thumb_immediate(-i0)) != -1)
1879 T2_ADDSI(r0, r1, i);
1880 else {
1881 reg = jit_get_reg(jit_class_gpr);
1882 movi(rn(reg), i0);
1883 T2_SUBS(r0, r1, rn(reg));
1884 jit_unget_reg(reg);
1885 }
1886 }
1887 else {
1888 if ((i = encode_arm_immediate(i0)) != -1)
1889 SUBSI(r0, r1, i);
1890 else if ((i = encode_arm_immediate(-i0)) != -1)
1891 ADDSI(r0, r1, i);
1892 else if (r0 != r1) {
1893 movi(r0, i0);
1894 SUBS(r0, r1, r0);
1895 }
1896 else {
1897 reg = jit_get_reg(jit_class_gpr);
1898 movi(rn(reg), i0);
1899 SUBS(r0, r1, rn(reg));
1900 jit_unget_reg(reg);
1901 }
1902 }
1903 }
1904
1905 static void
_subxr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)1906 _subxr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1907 {
1908 /* keep setting carry because don't know last SBC */
1909 if (jit_thumb_p()) {
1910 /* thumb auto set carry if not inside IT block */
1911 if ((r0|r1|r2) < 8 && r0 == r1)
1912 T1_SBC(r0, r2);
1913 else
1914 T2_SBCS(r0, r1, r2);
1915 }
1916 else
1917 SBCS(r0, r1, r2);
1918 }
1919
1920 static void
_subxi(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)1921 _subxi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1922 {
1923 int i;
1924 jit_int32_t reg;
1925 int no_set_flags;
1926 if (jit_thumb_p()) {
1927 no_set_flags = jit_no_set_flags();
1928 jit_no_set_flags() = 1;
1929 if ((i = encode_arm_immediate(i0)) != -1)
1930 T2_SBCSI(r0, r1, i);
1931 else if ((i = encode_arm_immediate(-i0)) != -1)
1932 T2_ADCSI(r0, r1, i);
1933 else if (r0 != r1) {
1934 movi(r0, i0);
1935 T2_SBCS(r0, r1, r0);
1936 }
1937 else {
1938 reg = jit_get_reg(jit_class_gpr);
1939 movi(rn(reg), i0);
1940 SBCS(r0, r1, rn(reg));
1941 jit_unget_reg(reg);
1942 }
1943 jit_no_set_flags() = no_set_flags;
1944 }
1945 else {
1946 if ((i = encode_arm_immediate(i0)) != -1)
1947 SBCSI(r0, r1, i);
1948 else if ((i = encode_arm_immediate(-i0)) != -1)
1949 ADCSI(r0, r1, i);
1950 else if (r0 != r1) {
1951 movi(r0, i0);
1952 SBCS(r0, r1, r0);
1953 }
1954 else {
1955 reg = jit_get_reg(jit_class_gpr);
1956 movi(rn(reg), i0);
1957 SBCS(r0, r1, rn(reg));
1958 jit_unget_reg(reg);
1959 }
1960 }
1961 }
1962
1963 static void
_rsbi(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)1964 _rsbi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
1965 {
1966 subi(r0, r1, i0);
1967 negr(r0, r0);
1968 }
1969
1970 static void
_mulr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)1971 _mulr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
1972 {
1973 jit_int32_t reg;
1974 if (jit_thumb_p()) {
1975 if (!jit_no_set_flags() && r0 == r2 && (r0|r1) < 8)
1976 T1_MUL(r0, r1);
1977 else if (!jit_no_set_flags() && r0 == r1 && (r0|r2) < 8)
1978 T1_MUL(r0, r2);
1979 else
1980 T2_MUL(r0, r1, r2);
1981 }
1982 else {
1983 if (r0 == r1 && !jit_armv6_p()) {
1984 if (r0 != r2)
1985 MUL(r0, r2, r1);
1986 else {
1987 reg = jit_get_reg(jit_class_gpr);
1988 MOV(rn(reg), r1);
1989 MUL(r0, rn(reg), r2);
1990 jit_unget_reg(reg);
1991 }
1992 }
1993 else
1994 MUL(r0, r1, r2);
1995 }
1996 }
1997
1998 static void
_muli(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)1999 _muli(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2000 {
2001 jit_int32_t reg;
2002 reg = jit_get_reg(jit_class_gpr);
2003 movi(rn(reg), i0);
2004 mulr(r0, r1, rn(reg));
2005 jit_unget_reg(reg);
2006 }
2007
2008 static void
_iqmulr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2,jit_int32_t r3,jit_bool_t sign)2009 _iqmulr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1,
2010 jit_int32_t r2, jit_int32_t r3, jit_bool_t sign)
2011 {
2012 jit_int32_t reg;
2013 if (jit_thumb_p()) {
2014 if (r2 == r3) {
2015 reg = jit_get_reg(jit_class_gpr);
2016 movr(rn(reg), r2);
2017 if (sign)
2018 T2_SMULL(r0, r1, rn(reg), r2);
2019 else
2020 T2_UMULL(r0, r1, rn(reg), r2);
2021 jit_unget_reg(reg);
2022 }
2023 else if (r0 != r2 && r1 != r2) {
2024 if (sign)
2025 T2_SMULL(r0, r1, r2, r3);
2026 else
2027 T2_UMULL(r0, r1, r2, r3);
2028 }
2029 else {
2030 if (sign)
2031 T2_SMULL(r0, r1, r3, r2);
2032 else
2033 T2_UMULL(r0, r1, r3, r2);
2034 }
2035 }
2036 else {
2037 if (r2 == r3) {
2038 reg = jit_get_reg(jit_class_gpr);
2039 movr(rn(reg), r2);
2040 if (sign)
2041 SMULL(r0, r1, rn(reg), r2);
2042 else
2043 UMULL(r0, r1, rn(reg), r2);
2044 jit_unget_reg(reg);
2045 }
2046 else if (r0 != r2 && r1 != r2) {
2047 if (sign)
2048 SMULL(r0, r1, r2, r3);
2049 else
2050 UMULL(r0, r1, r2, r3);
2051 }
2052 else {
2053 if (sign)
2054 SMULL(r0, r1, r3, r2);
2055 else
2056 UMULL(r0, r1, r3, r2);
2057 }
2058 }
2059 }
2060
2061 static void
_iqmuli(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2,jit_word_t i0,jit_bool_t sign)2062 _iqmuli(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1,
2063 jit_int32_t r2, jit_word_t i0, jit_bool_t sign)
2064 {
2065 jit_int32_t reg;
2066 reg = jit_get_reg(jit_class_gpr);
2067 movi(rn(reg), i0);
2068 iqmulr(r0, r1, r2, rn(reg), sign);
2069 jit_unget_reg(reg);
2070 }
2071
2072 static void
_divrem(jit_state_t * _jit,int div,int sign,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)2073 _divrem(jit_state_t *_jit, int div, int sign,
2074 jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2075 {
2076 jit_word_t d;
2077 jit_word_t w;
2078 jit_get_reg_args();
2079 movr(_R0_REGNO, r1);
2080 movr(_R1_REGNO, r2);
2081 if (sign) w = (jit_word_t)__aeabi_idivmod;
2082 else w = (jit_word_t)__aeabi_uidivmod;
2083 if (!jit_exchange_p()) {
2084 if (jit_thumb_p()) d = ((w - _jit->pc.w) >> 1) - 2;
2085 else d = ((w - _jit->pc.w) >> 2) - 2;
2086 if (_s24P(d)) {
2087 if (jit_thumb_p()) T2_BLI(encode_thumb_jump(d));
2088 else BLI(d & 0x00ffffff);
2089 }
2090 else goto fallback;
2091 }
2092 else {
2093 fallback:
2094 movi(_R2_REGNO, w);
2095 if (jit_thumb_p()) T1_BLX(_R2_REGNO);
2096 else BLX(_R2_REGNO);
2097 }
2098 if (div) movr(r0, _R0_REGNO);
2099 else movr(r0, _R1_REGNO);
2100 jit_unget_reg_args();
2101 }
2102
2103 static void
_divr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)2104 _divr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2105 {
2106 if (jit_armv7r_p() && jit_thumb_p())
2107 T2_SDIV(r0, r1, r2);
2108 else
2109 divrem(1, 1, r0, r1, r2);
2110 }
2111
2112 static void
_divi(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)2113 _divi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2114 {
2115 jit_int32_t reg;
2116 reg = jit_get_reg(jit_class_gpr);
2117 movi(rn(reg), i0);
2118 divr(r0, r1, rn(reg));
2119 jit_unget_reg(reg);
2120 }
2121
2122 static void
_divr_u(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)2123 _divr_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2124 {
2125 if (jit_armv7r_p() && jit_thumb_p())
2126 T2_UDIV(r0, r1, r2);
2127 else
2128 divrem(1, 0, r0, r1, r2);
2129 }
2130
2131 static void
_divi_u(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)2132 _divi_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2133 {
2134 jit_int32_t reg;
2135 reg = jit_get_reg(jit_class_gpr);
2136 movi(rn(reg), i0);
2137 divr_u(r0, r1, rn(reg));
2138 jit_unget_reg(reg);
2139 }
2140
2141 static void
_iqdivr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2,jit_int32_t r3,jit_bool_t sign)2142 _iqdivr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1,
2143 jit_int32_t r2, jit_int32_t r3, jit_bool_t sign)
2144 {
2145 jit_word_t d;
2146 jit_word_t w;
2147 jit_get_reg_args();
2148 movr(_R0_REGNO, r2);
2149 movr(_R1_REGNO, r3);
2150 if (sign) w = (jit_word_t)__aeabi_idivmod;
2151 else w = (jit_word_t)__aeabi_uidivmod;
2152 if (!jit_exchange_p()) {
2153 if (jit_thumb_p()) d = ((w - _jit->pc.w) >> 1) - 2;
2154 else d = ((w - _jit->pc.w) >> 2) - 2;
2155 if (_s24P(d)) {
2156 if (jit_thumb_p()) T2_BLI(encode_thumb_jump(d));
2157 else BLI(d & 0x00ffffff);
2158 }
2159 else goto fallback;
2160 }
2161 else {
2162 fallback:
2163 movi(_R2_REGNO, w);
2164 if (jit_thumb_p()) T1_BLX(_R2_REGNO);
2165 else BLX(_R2_REGNO);
2166 }
2167 movr(r0, _R0_REGNO);
2168 movr(r1, _R1_REGNO);
2169 jit_unget_reg_args();
2170 }
2171
2172 static void
_iqdivi(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2,jit_word_t i0,jit_bool_t sign)2173 _iqdivi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1,
2174 jit_int32_t r2, jit_word_t i0, jit_bool_t sign)
2175 {
2176 jit_int32_t reg;
2177 reg = jit_get_reg(jit_class_gpr);
2178 movi(rn(reg), i0);
2179 iqdivr(r0, r1, r2, rn(reg), sign);
2180 jit_unget_reg(reg);
2181 }
2182
2183 static void
_remr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)2184 _remr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2185 {
2186 divrem(0, 1, r0, r1, r2);
2187 }
2188
2189 static void
_remi(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)2190 _remi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2191 {
2192 jit_int32_t reg;
2193 reg = jit_get_reg(jit_class_gpr);
2194 movi(rn(reg), i0);
2195 remr(r0, r1, rn(reg));
2196 jit_unget_reg(reg);
2197 }
2198
2199 static void
_remr_u(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)2200 _remr_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2201 {
2202 divrem(0, 0, r0, r1, r2);
2203 }
2204
2205 static void
_remi_u(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)2206 _remi_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2207 {
2208 jit_int32_t reg;
2209 reg = jit_get_reg(jit_class_gpr);
2210 movi(rn(reg), i0);
2211 remr_u(r0, r1,rn(reg));
2212 jit_unget_reg(reg);
2213 }
2214
2215 static void
_andr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)2216 _andr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2217 {
2218 if (jit_thumb_p()) {
2219 if (!jit_no_set_flags() && (r0|r1|r2) < 8 && (r0 == r1 || r0 == r2))
2220 T1_AND(r0, r0 == r1 ? r2 : r1);
2221 else
2222 T2_AND(r0, r1, r2);
2223 }
2224 else
2225 AND(r0, r1, r2);
2226 }
2227
2228 static void
_andi(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)2229 _andi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2230 {
2231 int i;
2232 jit_int32_t reg;
2233 if (jit_thumb_p()) {
2234 if ((i = encode_thumb_immediate(i0)) != -1)
2235 T2_ANDI(r0, r1, i);
2236 else if ((i = encode_thumb_immediate(~i0)) != -1)
2237 T2_BICI(r0, r1, i);
2238 else if (r0 != r1) {
2239 movi(r0, i0);
2240 T2_AND(r0, r1, r0);
2241 }
2242 else {
2243 reg = jit_get_reg(jit_class_gpr);
2244 movi(rn(reg), i0);
2245 T2_AND(r0, r1, rn(reg));
2246 jit_unget_reg(reg);
2247 }
2248 }
2249 else {
2250 if ((i = encode_arm_immediate(i0)) != -1)
2251 ANDI(r0, r1, i);
2252 else if ((i = encode_arm_immediate(~i0)) != -1)
2253 BICI(r0, r1, i);
2254 else if (r0 != r1) {
2255 movi(r0, i0);
2256 AND(r0, r1, r0);
2257 }
2258 else {
2259 reg = jit_get_reg(jit_class_gpr);
2260 movi(rn(reg), i0);
2261 AND(r0, r1, rn(reg));
2262 jit_unget_reg(reg);
2263 }
2264 }
2265 }
2266
2267 static void
_orr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)2268 _orr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2269 {
2270 if (jit_thumb_p()) {
2271 if (!jit_no_set_flags() && (r0|r1|r2) < 8 && (r0 == r1 || r0 == r2))
2272 T1_ORR(r0, r0 == r1 ? r2 : r1);
2273 else
2274 T2_ORR(r0, r1, r2);
2275 }
2276 else
2277 ORR(r0, r1, r2);
2278 }
2279
2280 static void
_ori(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)2281 _ori(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2282 {
2283 int i;
2284 jit_int32_t reg;
2285 if (jit_thumb_p()) {
2286 if ((i = encode_thumb_immediate(i0)) != -1)
2287 T2_ORRI(r0, r1, i);
2288 else if (r0 != r1) {
2289 movi(r0, i0);
2290 T2_ORR(r0, r1, r0);
2291 }
2292 else {
2293 reg = jit_get_reg(jit_class_gpr);
2294 movi(rn(reg), i0);
2295 T2_ORR(r0, r1, rn(reg));
2296 jit_unget_reg(reg);
2297 }
2298 }
2299 else {
2300 if ((i = encode_arm_immediate(i0)) != -1)
2301 ORRI(r0, r1, i);
2302 else if (r0 != r1) {
2303 movi(r0, i0);
2304 ORR(r0, r1, r0);
2305 }
2306 else {
2307 reg = jit_get_reg(jit_class_gpr);
2308 movi(rn(reg), i0);
2309 ORR(r0, r1, rn(reg));
2310 jit_unget_reg(reg);
2311 }
2312 }
2313 }
2314
2315 static void
_xorr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)2316 _xorr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2317 {
2318 if (jit_thumb_p()) {
2319 if (!jit_no_set_flags() && (r0|r1|r2) < 8 && (r0 == r1 || r0 == r2))
2320 T1_EOR(r0, r0 == r1 ? r2 : r1);
2321 else
2322 T2_EOR(r0, r1, r2);
2323 }
2324 else
2325 EOR(r0, r1, r2);
2326 }
2327
2328 static void
_xori(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)2329 _xori(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2330 {
2331 int i;
2332 jit_int32_t reg;
2333 if (jit_thumb_p()) {
2334 if ((i = encode_thumb_immediate(i0)) != -1)
2335 T2_EORI(r0, r1, i);
2336 else if (r0 != r1) {
2337 movi(r0, i0);
2338 T2_EOR(r0, r1, r0);
2339 }
2340 else {
2341 reg = jit_get_reg(jit_class_gpr);
2342 movi(rn(reg), i0);
2343 T2_EOR(r0, r1, rn(reg));
2344 jit_unget_reg(reg);
2345 }
2346 }
2347 else {
2348 if ((i = encode_arm_immediate(i0)) != -1)
2349 EORI(r0, r1, i);
2350 else if (r0 != r1) {
2351 movi(r0, i0);
2352 EOR(r0, r1, r0);
2353 }
2354 else {
2355 reg = jit_get_reg(jit_class_gpr);
2356 movi(rn(reg), i0);
2357 EOR(r0, r1, rn(reg));
2358 jit_unget_reg(reg);
2359 }
2360 }
2361 }
2362
2363 static void
_lshr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)2364 _lshr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2365 {
2366 if (jit_thumb_p()) {
2367 if (!jit_no_set_flags() && (r0|r1|r2) < 8 && r0 == r1)
2368 T1_LSL(r0, r2);
2369 else
2370 T2_LSL(r0, r1, r2);
2371 }
2372 else
2373 LSL(r0, r1, r2);
2374 }
2375
2376 static void
_lshi(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)2377 _lshi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2378 {
2379 assert(i0 >= 0 && i0 <= 31);
2380 if (i0 == 0)
2381 movr(r0, r1);
2382 else if (jit_thumb_p()) {
2383 if (!jit_no_set_flags() && (r0|r1) < 8)
2384 T1_LSLI(r0, r1, i0);
2385 else
2386 T2_LSLI(r0, r1, i0);
2387 }
2388 else
2389 LSLI(r0, r1, i0);
2390 }
2391
2392 static void
_rshr(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)2393 _rshr(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2394 {
2395 if (jit_thumb_p()) {
2396 if (!jit_no_set_flags() && (r0|r1|r2) < 8 && r0 == r1)
2397 T1_ASR(r0, r2);
2398 else
2399 T2_ASR(r0, r1, r2);
2400 }
2401 else
2402 ASR(r0, r1, r2);
2403 }
2404
2405 static void
_rshi(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)2406 _rshi(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2407 {
2408 assert(i0 >= 0 && i0 <= 31);
2409 if (i0 == 0)
2410 movr(r0, r1);
2411 else if (jit_thumb_p()) {
2412 if (!jit_no_set_flags() && (r0|r1) < 8)
2413 T1_ASRI(r0, r1, i0);
2414 else
2415 T2_ASRI(r0, r1, i0);
2416 }
2417 else
2418 ASRI(r0, r1, i0);
2419 }
2420
2421 static void
_rshr_u(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)2422 _rshr_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2423 {
2424 if (jit_thumb_p()) {
2425 if (!jit_no_set_flags() && (r0|r1|r2) < 8 && r0 == r1)
2426 T1_LSR(r0, r2);
2427 else
2428 T2_LSR(r0, r1, r2);
2429 }
2430 else
2431 LSR(r0, r1, r2);
2432 }
2433
2434 static void
_rshi_u(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)2435 _rshi_u(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2436 {
2437 assert(i0 >= 0 && i0 <= 31);
2438 if (i0 == 0)
2439 movr(r0, r1);
2440 else if (jit_thumb_p()) {
2441 if (!jit_no_set_flags() && (r0|r1) < 8)
2442 T1_LSRI(r0, r1, i0);
2443 else
2444 T2_LSRI(r0, r1, i0);
2445 }
2446 else
2447 LSRI(r0, r1, i0);
2448 }
2449
2450 static void
_ccr(jit_state_t * _jit,int ct,int cf,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)2451 _ccr(jit_state_t *_jit, int ct, int cf,
2452 jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2453 {
2454 if (jit_thumb_p()) {
2455 assert((ct ^ cf) >> 28 == 1);
2456 if ((r1|r2) < 8)
2457 T1_CMP(r1, r2);
2458 else if ((r1&r2) & 8)
2459 T1_CMPX(r1, r2);
2460 else
2461 T2_CMP(r1, r2);
2462 ITE(ct);
2463 if (r0 < 8) {
2464 T1_MOVI(r0, 1);
2465 T1_MOVI(r0, 0);
2466 }
2467 else {
2468 T2_MOVI(r0, 1);
2469 T2_MOVI(r0, 0);
2470 }
2471 }
2472 else {
2473 CMP(r1, r2);
2474 CC_MOVI(ct, r0, 1);
2475 CC_MOVI(cf, r0, 0);
2476 }
2477 }
2478
2479 static void
_cci(jit_state_t * _jit,int ct,int cf,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)2480 _cci(jit_state_t *_jit, int ct, int cf,
2481 jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2482 {
2483 int i;
2484 jit_int32_t reg;
2485 if (jit_thumb_p()) {
2486 if (r1 < 7 && !(i0 & 0xffffff00))
2487 T1_CMPI(r1, i0);
2488 else if ((i = encode_thumb_immediate(i0)) != -1)
2489 T2_CMPI(r1, i);
2490 else if ((i = encode_thumb_immediate(-i0)) != -1)
2491 T2_CMNI(r1, i);
2492 else {
2493 reg = jit_get_reg(jit_class_gpr);
2494 movi(rn(reg), i0);
2495 ccr(ct, cf, r0, r1, rn(reg));
2496 jit_unget_reg(reg);
2497 return;
2498 }
2499 ITE(ct);
2500 if (r0 < 8) {
2501 T1_MOVI(r0, 1);
2502 T1_MOVI(r0, 0);
2503 }
2504 else {
2505 T2_MOVI(r0, 1);
2506 T2_MOVI(r0, 0);
2507 }
2508 }
2509 else {
2510 if ((i = encode_arm_immediate(i0)) != -1)
2511 CMPI(r1, i);
2512 else if ((i = encode_arm_immediate(-i0)) != -1)
2513 CMNI(r1, i);
2514 else if (r0 != r1) {
2515 movi(r0, i0);
2516 CMP(r1, r0);
2517 }
2518 else {
2519 reg = jit_get_reg(jit_class_gpr);
2520 movi(rn(reg), i0);
2521 CMP(r1, rn(reg));
2522 jit_unget_reg(reg);
2523 }
2524 CC_MOVI(ct, r0, 1);
2525 CC_MOVI(cf, r0, 0);
2526 }
2527 }
2528
2529 static void
_ner(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)2530 _ner(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2531 {
2532 if (jit_thumb_p())
2533 ccr(ARM_CC_NE, ARM_CC_EQ, r0, r1, r2);
2534 else {
2535 SUBS(r0, r1, r2);
2536 CC_MOVI(ARM_CC_NE, r0, 1);
2537 }
2538 }
2539
2540 static void
_nei(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)2541 _nei(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2542 {
2543 int i;
2544 jit_int32_t reg;
2545 if (jit_thumb_p())
2546 cci(ARM_CC_NE, ARM_CC_EQ, r0, r1, i0);
2547 else {
2548 if ((i = encode_arm_immediate(i0)) != -1)
2549 SUBSI(r0, r1, i);
2550 else if ((i = encode_arm_immediate(-i0)) != -1)
2551 ADDSI(r0, r1, i);
2552 else if (r0 != r1) {
2553 movi(r0, i0);
2554 SUBS(r0, r1, r0);
2555 }
2556 else {
2557 reg = jit_get_reg(jit_class_gpr);
2558 movi(rn(reg), i0);
2559 SUBS(r0, r1, rn(reg));
2560 jit_unget_reg(reg);
2561 }
2562 CC_MOVI(ARM_CC_NE, r0, 1);
2563 }
2564 }
2565
2566 static void
_jmpr(jit_state_t * _jit,jit_int32_t r0)2567 _jmpr(jit_state_t *_jit, jit_int32_t r0)
2568 {
2569 if (jit_thumb_p())
2570 T1_MOV(_R15_REGNO, r0);
2571 else
2572 MOV(_R15_REGNO, r0);
2573 }
2574
2575 static void
_jmpi(jit_state_t * _jit,jit_word_t i0)2576 _jmpi(jit_state_t *_jit, jit_word_t i0)
2577 {
2578 jit_word_t w;
2579 jit_word_t d;
2580 jit_int32_t reg;
2581 w = _jit->pc.w;
2582 /* if thumb and in thumb mode */
2583 if (jit_thumb_p() && _jitc->thumb) {
2584 d = ((i0 - w) >> 1) - 2;
2585 if (d >= -1024 && d <= 1023)
2586 T1_B(d & 0x7ff);
2587 else if (_s24P(d))
2588 T2_B(encode_thumb_jump(d));
2589 else {
2590 reg = jit_get_reg(jit_class_gpr|jit_class_nospill);
2591 movi(rn(reg), i0);
2592 jmpr(rn(reg));
2593 jit_unget_reg(reg);
2594 }
2595 }
2596 else {
2597 d = ((i0 - w) >> 2) - 2;
2598 if (_s24P(d))
2599 B(d & 0x00ffffff);
2600 else {
2601 reg = jit_get_reg(jit_class_gpr|jit_class_nospill);
2602 movi(rn(reg), i0);
2603 jmpr(rn(reg));
2604 jit_unget_reg(reg);
2605 }
2606 }
2607 }
2608
2609 static jit_word_t
_jmpi_p(jit_state_t * _jit,jit_word_t i0,jit_bool_t i1)2610 _jmpi_p(jit_state_t *_jit, jit_word_t i0, jit_bool_t i1)
2611 {
2612 jit_word_t w;
2613 jit_word_t d;
2614 jit_int32_t reg;
2615 if (i1) {
2616 /* Assume jump is not longer than 23 bits if inside jit */
2617 w = _jit->pc.w;
2618 /* if thumb and in thumb mode */
2619 if (jit_thumb_p() && _jitc->thumb) {
2620 d = ((i0 - w) >> 1) - 2;
2621 assert(_s24P(d));
2622 T2_B(encode_thumb_jump(d));
2623 }
2624 else {
2625 d = ((i0 - w) >> 2) - 2;
2626 assert(_s24P(d));
2627 B(d & 0x00ffffff);
2628 }
2629 }
2630 else {
2631 reg = jit_get_reg(jit_class_gpr|jit_class_nospill);
2632 w = movi_p(rn(reg), i0);
2633 jmpr(rn(reg));
2634 jit_unget_reg(reg);
2635 }
2636 return (w);
2637 }
2638
2639 static jit_word_t
_bccr(jit_state_t * _jit,int cc,jit_word_t i0,jit_int32_t r0,jit_int32_t r1)2640 _bccr(jit_state_t *_jit, int cc, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
2641 {
2642 jit_word_t w;
2643 jit_word_t d;
2644 if (jit_thumb_p()) {
2645 if ((r0|r1) < 8)
2646 T1_CMP(r0, r1);
2647 else if ((r0&r1) & 8)
2648 T1_CMPX(r0, r1);
2649 else
2650 T2_CMP(r0, r1);
2651 /* use only thumb2 conditional as does not know if will be patched */
2652 w = _jit->pc.w;
2653 d = ((i0 - w) >> 1) - 2;
2654 assert(_s20P(d));
2655 T2_CC_B(cc, encode_thumb_cc_jump(d));
2656 }
2657 else {
2658 CMP(r0, r1);
2659 w = _jit->pc.w;
2660 d = ((i0 - w) >> 2) - 2;
2661 assert(_s24P(d));
2662 CC_B(cc, d & 0x00ffffff);
2663 }
2664 return (w);
2665 }
2666
2667 static jit_word_t
_bcci(jit_state_t * _jit,int cc,jit_word_t i0,jit_int32_t r0,jit_word_t i1)2668 _bcci(jit_state_t *_jit, int cc, jit_word_t i0, jit_int32_t r0, jit_word_t i1)
2669 {
2670 jit_word_t w;
2671 jit_word_t d;
2672 int i;
2673 jit_int32_t reg;
2674 if (jit_thumb_p()) {
2675 if (r0 < 7 && !(i1 & 0xffffff00))
2676 T1_CMPI(r0, i1);
2677 else if ((i = encode_thumb_immediate(i1)) != -1)
2678 T2_CMPI(r0, i);
2679 else if ((i = encode_thumb_immediate(-i1)) != -1)
2680 T2_CMNI(r0, i);
2681 else {
2682 reg = jit_get_reg(jit_class_gpr);
2683 movi(rn(reg), i1);
2684 T2_CMP(r0, rn(reg));
2685 jit_unget_reg(reg);
2686 }
2687 /* use only thumb2 conditional as does not know if will be patched */
2688 w = _jit->pc.w;
2689 d = ((i0 - w) >> 1) - 2;
2690 assert(_s20P(d));
2691 T2_CC_B(cc, encode_thumb_cc_jump(d));
2692 }
2693 else {
2694 if ((i = encode_arm_immediate(i1)) != -1)
2695 CMPI(r0, i);
2696 else if ((i = encode_arm_immediate(-i1)) != -1)
2697 CMNI(r0, i);
2698 else {
2699 reg = jit_get_reg(jit_class_gpr);
2700 movi(rn(reg), i1);
2701 CMP(r0, rn(reg));
2702 jit_unget_reg(reg);
2703 }
2704 w = _jit->pc.w;
2705 d = ((i0 - w) >> 2) - 2;
2706 assert(_s24P(d));
2707 CC_B(cc, d & 0x00ffffff);
2708 }
2709 return (w);
2710 }
2711
2712 static jit_word_t
_baddr(jit_state_t * _jit,int cc,jit_word_t i0,jit_int32_t r0,jit_int32_t r1)2713 _baddr(jit_state_t *_jit, int cc, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
2714 {
2715 jit_word_t w;
2716 jit_word_t d;
2717 if (jit_thumb_p()) {
2718 if ((r0|r1) < 8)
2719 T1_ADD(r0, r0, r1);
2720 else
2721 T2_ADDS(r0, r0, r1);
2722 w = _jit->pc.w;
2723 d = ((i0 - w) >> 1) - 2;
2724 assert(_s20P(d));
2725 T2_CC_B(cc, encode_thumb_cc_jump(d));
2726 }
2727 else {
2728 ADDS(r0, r0, r1);
2729 w = _jit->pc.w;
2730 d = ((i0 - w) >> 2) - 2;
2731 assert(_s24P(d));
2732 CC_B(cc, d & 0x00ffffff);
2733 }
2734 return (w);
2735 }
2736
2737 static jit_word_t
_baddi(jit_state_t * _jit,int cc,jit_word_t i0,jit_int32_t r0,int i1)2738 _baddi(jit_state_t *_jit, int cc, jit_word_t i0, jit_int32_t r0, int i1)
2739 {
2740 int i;
2741 jit_word_t w;
2742 jit_word_t d;
2743 jit_int32_t reg;
2744 if (jit_thumb_p()) {
2745 if (r0 < 8 && !(i1 & ~7))
2746 T1_ADDI3(r0, r0, i1);
2747 else if (r0 < 8 && !(-i1 & ~7))
2748 T1_SUBI3(r0, r0, -i1);
2749 else if (r0 < 8 && !(i1 & ~0xff))
2750 T1_ADDI8(r0, i1);
2751 else if (r0 < 8 && !(-i1 & ~0xff))
2752 T1_SUBI8(r0, -i1);
2753 else if ((i = encode_thumb_immediate(i1)) != -1)
2754 T2_ADDSI(r0, r0, i);
2755 else if ((i = encode_thumb_immediate(-i1)) != -1)
2756 T2_SUBSI(r0, r0, i);
2757 else {
2758 reg = jit_get_reg(jit_class_gpr);
2759 movi(rn(reg), i1);
2760 T2_ADDS(r0, r0, rn(reg));
2761 jit_unget_reg(reg);
2762 }
2763 w = _jit->pc.w;
2764 d = ((i0 - w) >> 1) - 2;
2765 assert(_s20P(d));
2766 T2_CC_B(cc, encode_thumb_cc_jump(d));
2767 }
2768 else {
2769 if ((i = encode_arm_immediate(i1)) != -1)
2770 ADDSI(r0, r0, i);
2771 else if ((i = encode_arm_immediate(-i1)) != -1)
2772 SUBSI(r0, r0, i);
2773 else {
2774 reg = jit_get_reg(jit_class_gpr);
2775 movi(rn(reg), i1);
2776 ADDS(r0, r0, rn(reg));
2777 jit_unget_reg(reg);
2778 }
2779 w = _jit->pc.w;
2780 d = ((i0 - w) >> 2) - 2;
2781 assert(_s24P(d));
2782 CC_B(cc, d & 0x00ffffff);
2783 }
2784 return (w);
2785 }
2786
2787 static jit_word_t
_bsubr(jit_state_t * _jit,int cc,jit_word_t i0,jit_int32_t r0,jit_int32_t r1)2788 _bsubr(jit_state_t *_jit, int cc, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
2789 {
2790 jit_word_t w;
2791 jit_word_t d;
2792 if (jit_thumb_p()) {
2793 if ((r0|r1) < 8)
2794 T1_SUB(r0, r0, r1);
2795 else
2796 T2_SUBS(r0, r0, r1);
2797 w = _jit->pc.w;
2798 d = ((i0 - w) >> 1) - 2;
2799 assert(_s20P(d));
2800 T2_CC_B(cc, encode_thumb_cc_jump(d));
2801 }
2802 else {
2803 SUBS(r0, r0, r1);
2804 w = _jit->pc.w;
2805 d = ((i0 - w) >> 2) - 2;
2806 assert(_s24P(d));
2807 CC_B(cc, d & 0x00ffffff);
2808 }
2809 return (w);
2810 }
2811
2812 static jit_word_t
_bsubi(jit_state_t * _jit,int cc,jit_word_t i0,jit_int32_t r0,int i1)2813 _bsubi(jit_state_t *_jit, int cc, jit_word_t i0, jit_int32_t r0, int i1)
2814 {
2815 int i;
2816 jit_word_t w;
2817 jit_word_t d;
2818 jit_int32_t reg;
2819 if (jit_thumb_p()) {
2820 if (r0 < 8 && !(i1 & ~7))
2821 T1_SUBI3(r0, r0, i1);
2822 else if (r0 < 8 && !(-i1 & ~7))
2823 T1_ADDI3(r0, r0, -i1);
2824 else if (r0 < 8 && !(i1 & ~0xff))
2825 T1_SUBI8(r0, i1);
2826 else if (r0 < 8 && !(-i1 & ~0xff))
2827 T1_ADDI8(r0, -i1);
2828 else if ((i = encode_thumb_immediate(i1)) != -1)
2829 T2_SUBSI(r0, r0, i);
2830 else if ((i = encode_thumb_immediate(-i1)) != -1)
2831 T2_SUBSI(r0, r0, i);
2832 else {
2833 reg = jit_get_reg(jit_class_gpr);
2834 movi(rn(reg), i1);
2835 T2_SUBS(r0, r0, rn(reg));
2836 jit_unget_reg(reg);
2837 }
2838 w = _jit->pc.w;
2839 d = ((i0 - w) >> 1) - 2;
2840 assert(_s20P(d));
2841 T2_CC_B(cc, encode_thumb_cc_jump(d));
2842 }
2843 else {
2844 if ((i = encode_arm_immediate(i1)) != -1)
2845 SUBSI(r0, r0, i);
2846 else if ((i = encode_arm_immediate(-i1)) != -1)
2847 ADDSI(r0, r0, i);
2848 else {
2849 reg = jit_get_reg(jit_class_gpr);
2850 movi(rn(reg), i1);
2851 SUBS(r0, r0, rn(reg));
2852 jit_unget_reg(reg);
2853 }
2854 w = _jit->pc.w;
2855 d = ((i0 - w) >> 2) - 2;
2856 assert(_s24P(d));
2857 CC_B(cc, d & 0x00ffffff);
2858 }
2859 return (w);
2860 }
2861
2862 static jit_word_t
_bmxr(jit_state_t * _jit,int cc,jit_word_t i0,jit_int32_t r0,jit_int32_t r1)2863 _bmxr(jit_state_t *_jit, int cc, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
2864 {
2865 jit_word_t w;
2866 jit_word_t d;
2867 jit_int32_t reg;
2868 if (jit_thumb_p()) {
2869 if ((r0|r1) < 8)
2870 T1_TST(r0, r1);
2871 else
2872 T2_TST(r0, r1);
2873 w = _jit->pc.w;
2874 d = ((i0 - w) >> 1) - 2;
2875 assert(_s20P(d));
2876 T2_CC_B(cc, encode_thumb_cc_jump(d));
2877 }
2878 else {
2879 if (jit_armv5_p())
2880 TST(r0, r1);
2881 else {
2882 reg = jit_get_reg(jit_class_gpr);
2883 ANDS(rn(reg), r0, r1);
2884 jit_unget_reg(reg);
2885 }
2886 w = _jit->pc.w;
2887 d = ((i0 - w) >> 2) - 2;
2888 assert(_s24P(d));
2889 CC_B(cc, d & 0x00ffffff);
2890 }
2891 return (w);
2892 }
2893
2894 static jit_word_t
_bmxi(jit_state_t * _jit,int cc,jit_word_t i0,jit_int32_t r0,jit_word_t i1)2895 _bmxi(jit_state_t *_jit, int cc, jit_word_t i0, jit_int32_t r0, jit_word_t i1)
2896 {
2897 int i;
2898 jit_word_t w;
2899 jit_word_t d;
2900 jit_int32_t reg;
2901 if (jit_thumb_p()) {
2902 if ((i = encode_thumb_immediate(i1)) != -1)
2903 T2_TSTI(r0, i);
2904 else {
2905 reg = jit_get_reg(jit_class_gpr);
2906 movi(rn(reg), i1);
2907 T2_TST(r0, rn(reg));
2908 jit_unget_reg(reg);
2909 }
2910 w = _jit->pc.w;
2911 d = ((i0 - w) >> 1) - 2;
2912 assert(_s20P(d));
2913 T2_CC_B(cc, encode_thumb_cc_jump(d));
2914 }
2915 else {
2916 if (jit_armv5_p()) {
2917 if ((i = encode_arm_immediate(i1)) != -1)
2918 TSTI(r0, i);
2919 else {
2920 reg = jit_get_reg(jit_class_gpr);
2921 movi(rn(reg), i1);
2922 TST(r0, rn(reg));
2923 jit_unget_reg(reg);
2924 }
2925 }
2926 else {
2927 reg = jit_get_reg(jit_class_gpr);
2928 if ((i = encode_arm_immediate(i1)) != -1)
2929 ANDSI(rn(reg), r0, i);
2930 else if ((i = encode_arm_immediate(~i1)) != -1)
2931 BICSI(rn(reg), r0, i);
2932 else {
2933 movi(rn(reg), i1);
2934 ANDS(rn(reg), r0, rn(reg));
2935 }
2936 jit_unget_reg(reg);
2937 }
2938 w = _jit->pc.w;
2939 d = ((i0 - w) >> 2) - 2;
2940 assert(_s24P(d));
2941 CC_B(cc, d & 0x00ffffff);
2942 }
2943 return (w);
2944 }
2945
2946 static void
_ldr_c(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)2947 _ldr_c(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
2948 {
2949 if (jit_thumb_p())
2950 T2_LDRSBI(r0, r1, 0);
2951 else
2952 LDRSBI(r0, r1, 0);
2953 }
2954
2955 static void
_ldi_c(jit_state_t * _jit,jit_int32_t r0,jit_word_t i0)2956 _ldi_c(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
2957 {
2958 jit_int32_t reg;
2959 reg = jit_get_reg(jit_class_gpr);
2960 movi(rn(reg), i0);
2961 if (jit_thumb_p())
2962 T2_LDRSBI(r0, rn(reg), 0);
2963 else
2964 LDRSBI(r0, rn(reg), 0);
2965 jit_unget_reg(reg);
2966 }
2967
2968 static void
_ldxr_c(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)2969 _ldxr_c(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
2970 {
2971 if (jit_thumb_p()) {
2972 if ((r0|r1|r2) < 8)
2973 T1_LDRSB(r0, r1, r2);
2974 else
2975 T2_LDRSB(r0, r1, r2);
2976 }
2977 else
2978 LDRSB(r0, r1, r2);
2979 }
2980
2981 static void
_ldxi_c(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)2982 _ldxi_c(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
2983 {
2984 jit_int32_t reg;
2985 if (jit_thumb_p()) {
2986 if (jit_ldrt_strt_p() && i0 >= 0 && i0 <= 255)
2987 T2_LDRSBI(r0, r1, i0);
2988 else if (i0 < 0 && i0 >= -255)
2989 T2_LDRSBIN(r0, r1, -i0);
2990 else if (i0 >= 0 && i0 <= 4095)
2991 T2_LDRSBWI(r0, r1, i0);
2992 else if (r0 != r1) {
2993 movi(r0, i0);
2994 if ((r0|r1) < 8)
2995 T1_LDRSB(r0, r1, r0);
2996 else
2997 T2_LDRSB(r0, r1, r0);
2998 }
2999 else {
3000 reg = jit_get_reg(jit_class_gpr);
3001 movi(rn(reg), i0);
3002 if ((r0|r1|rn(reg)) < 8)
3003 T1_LDRSB(r0, r1, rn(reg));
3004 else
3005 T2_LDRSB(r0, r1, rn(reg));
3006 jit_unget_reg(reg);
3007 }
3008 }
3009 else {
3010 if (i0 >= 0 && i0 <= 255)
3011 LDRSBI(r0, r1, i0);
3012 else if (i0 < 0 && i0 >= -255)
3013 LDRSBIN(r0, r1, -i0);
3014 else if (r0 != r1) {
3015 movi(r0, i0);
3016 LDRSB(r0, r1, r0);
3017 }
3018 else {
3019 reg = jit_get_reg(jit_class_gpr);
3020 movi(rn(reg), i0);
3021 LDRSB(r0, r1, rn(reg));
3022 jit_unget_reg(reg);
3023 }
3024 }
3025 }
3026
3027 static void
_ldr_uc(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)3028 _ldr_uc(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3029 {
3030 if (jit_thumb_p())
3031 T2_LDRBI(r0, r1, 0);
3032 else
3033 LDRBI(r0, r1, 0);
3034 }
3035
3036 static void
_ldi_uc(jit_state_t * _jit,jit_int32_t r0,jit_word_t i0)3037 _ldi_uc(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
3038 {
3039 jit_int32_t reg;
3040 reg = jit_get_reg(jit_class_gpr);
3041 movi(rn(reg), i0);
3042 if (jit_thumb_p())
3043 T2_LDRBI(r0, rn(reg), 0);
3044 else
3045 LDRBI(r0, rn(reg), 0);
3046 jit_unget_reg(reg);
3047 }
3048
3049 static void
_ldxr_uc(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)3050 _ldxr_uc(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
3051 {
3052 if (jit_thumb_p()) {
3053 if ((r0|r1|r2) < 8)
3054 T1_LDRB(r0, r1, r2);
3055 else
3056 T2_LDRB(r0, r1, r2);
3057 }
3058 else
3059 LDRB(r0, r1, r2);
3060 }
3061
3062 static void
_ldxi_uc(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)3063 _ldxi_uc(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
3064 {
3065 jit_int32_t reg;
3066 if (jit_thumb_p()) {
3067 if ((r0|r1) < 8 && i0 >= 0 && i0 < 0x20)
3068 T1_LDRBI(r0, r1, i0);
3069 else if (jit_ldrt_strt_p() && i0 >= 0 && i0 <= 255)
3070 T2_LDRBI(r0, r1, i0);
3071 else if (i0 < 0 && i0 >= -255)
3072 T2_LDRBIN(r0, r1, -i0);
3073 else if (i0 >= 0 && i0 <= 4095)
3074 T2_LDRBWI(r0, r1, i0);
3075 else if (r0 != r1) {
3076 movi(r0, i0);
3077 if ((r0|r1) < 8)
3078 T1_LDRB(r0, r1, r0);
3079 else
3080 T2_LDRB(r0, r1, r0);
3081 }
3082 else {
3083 reg = jit_get_reg(jit_class_gpr);
3084 movi(rn(reg), i0);
3085 if ((r0|r1|rn(reg)) < 8)
3086 T1_LDRB(r0, r1, rn(reg));
3087 else
3088 T2_LDRB(r0, r1, rn(reg));
3089 jit_unget_reg(reg);
3090 }
3091 }
3092 else {
3093 if (i0 >= 0 && i0 <= 4095)
3094 LDRBI(r0, r1, i0);
3095 else if (i0 < 0 && i0 >= -4095)
3096 LDRBIN(r0, r1, -i0);
3097 else if (r0 != r1) {
3098 movi(r0, i0);
3099 LDRB(r0, r1, r0);
3100 }
3101 else {
3102 reg = jit_get_reg(jit_class_gpr);
3103 movi(rn(reg), i0);
3104 LDRB(r0, r1, rn(reg));
3105 jit_unget_reg(reg);
3106 }
3107 }
3108 }
3109
3110 static void
_ldr_s(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)3111 _ldr_s(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3112 {
3113 if (jit_thumb_p())
3114 T2_LDRSHI(r0, r1, 0);
3115 else
3116 LDRSHI(r0, r1, 0);
3117 }
3118
3119 static void
_ldi_s(jit_state_t * _jit,jit_int32_t r0,jit_word_t i0)3120 _ldi_s(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
3121 {
3122 jit_int32_t reg;
3123 reg = jit_get_reg(jit_class_gpr);
3124 movi(rn(reg), i0);
3125 if (jit_thumb_p())
3126 T2_LDRSHI(r0, rn(reg), 0);
3127 else
3128 LDRSHI(r0, rn(reg), 0);
3129 jit_unget_reg(reg);
3130 }
3131
3132 static void
_ldxr_s(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)3133 _ldxr_s(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
3134 {
3135 if (jit_thumb_p()) {
3136 if ((r0|r1|r2) < 8)
3137 T1_LDRSH(r0, r1, r2);
3138 else
3139 T2_LDRSH(r0, r1, r2);
3140 }
3141 else
3142 LDRSH(r0, r1, r2);
3143 }
3144
3145 static void
_ldxi_s(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)3146 _ldxi_s(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
3147 {
3148 jit_int32_t reg;
3149 if (jit_thumb_p()) {
3150 if (jit_ldrt_strt_p() && i0 >= 0 && i0 <= 255)
3151 T2_LDRSHI(r0, r1, i0);
3152 else if (i0 < 0 && i0 >= -255)
3153 T2_LDRSHIN(r0, r1, -i0);
3154 else if (i0 >= 0 && i0 <= 4095)
3155 T2_LDRSHWI(r0, r1, i0);
3156 else if (r0 != r1) {
3157 movi(r0, i0);
3158 if ((r0|r1) < 8)
3159 T1_LDRSH(r0, r1, r0);
3160 else
3161 T2_LDRSH(r0, r1, r0);
3162 }
3163 else {
3164 reg = jit_get_reg(jit_class_gpr);
3165 movi(rn(reg), i0);
3166 if ((r0|r1|rn(reg)) < 8)
3167 T1_LDRSH(r0, r1, rn(reg));
3168 else
3169 T2_LDRSH(r0, r1, rn(reg));
3170 jit_unget_reg(reg);
3171 }
3172 }
3173 else {
3174 if (i0 >= 0 && i0 <= 255)
3175 LDRSHI(r0, r1, i0);
3176 else if (i0 < 0 && i0 >= -255)
3177 LDRSHIN(r0, r1, -i0);
3178 else if (r0 != r1) {
3179 movi(r0, i0);
3180 LDRSH(r0, r1, r0);
3181 }
3182 else {
3183 reg = jit_get_reg(jit_class_gpr);
3184 movi(rn(reg), i0);
3185 LDRSH(r0, r1, rn(reg));
3186 jit_unget_reg(reg);
3187 }
3188 }
3189 }
3190
3191 static void
_ldr_us(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)3192 _ldr_us(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3193 {
3194 if (jit_thumb_p())
3195 T2_LDRHI(r0, r1, 0);
3196 else
3197 LDRHI(r0, r1, 0);
3198 }
3199
3200 static void
_ldi_us(jit_state_t * _jit,jit_int32_t r0,jit_word_t i0)3201 _ldi_us(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
3202 {
3203 jit_int32_t reg;
3204 reg = jit_get_reg(jit_class_gpr);
3205 movi(rn(reg), i0);
3206 if (jit_thumb_p())
3207 T2_LDRHI(r0, rn(reg), 0);
3208 else
3209 LDRHI(r0, rn(reg), 0);
3210 jit_unget_reg(reg);
3211 }
3212
3213 static void
_ldxr_us(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)3214 _ldxr_us(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
3215 {
3216 if (jit_thumb_p()) {
3217 if ((r0|r1|r2) < 8)
3218 T1_LDRH(r0, r1, r2);
3219 else
3220 T2_LDRH(r0, r1, r2);
3221 }
3222 else
3223 LDRH(r0, r1, r2);
3224 }
3225
3226 static void
_ldxi_us(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)3227 _ldxi_us(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
3228 {
3229 jit_int32_t reg;
3230 if (jit_thumb_p()) {
3231 if ((r0|r1) < 8 && i0 >= 0 && !(i0 & 1) && (i0 >> 1) < 0x20)
3232 T1_LDRHI(r0, r1, i0 >> 1);
3233 else if (jit_ldrt_strt_p() && i0 >= 0 && i0 <= 255)
3234 T2_LDRHI(r0, r1, i0);
3235 else if (i0 < 0 && i0 >= -255)
3236 T2_LDRHIN(r0, r1, -i0);
3237 else if (i0 >= 0 && i0 <= 4095)
3238 T2_LDRHWI(r0, r1, i0);
3239 else if (r0 != r1) {
3240 movi(r0, i0);
3241 if ((r0|r1) < 8)
3242 T1_LDRH(r0, r1, r0);
3243 else
3244 T2_LDRH(r0, r1, r0);
3245 }
3246 else {
3247 reg = jit_get_reg(jit_class_gpr);
3248 movi(rn(reg), i0);
3249 if ((r0|r1|rn(reg)) < 8)
3250 T1_LDRH(r0, r1, rn(reg));
3251 else
3252 T2_LDRH(r0, r1, rn(reg));
3253 jit_unget_reg(reg);
3254 }
3255 }
3256 else {
3257 if (i0 >= 0 && i0 <= 255)
3258 LDRHI(r0, r1, i0);
3259 else if (i0 < 0 && i0 >= -255)
3260 LDRHIN(r0, r1, -i0);
3261 else if (r0 != r1) {
3262 movi(r0, i0);
3263 LDRH(r0, r1, r0);
3264 }
3265 else {
3266 reg = jit_get_reg(jit_class_gpr);
3267 movi(rn(reg), i0);
3268 LDRH(r0, r1, rn(reg));
3269 jit_unget_reg(reg);
3270 }
3271 }
3272 }
3273
3274 static void
_ldr_i(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)3275 _ldr_i(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3276 {
3277 if (jit_thumb_p())
3278 T2_LDRI(r0, r1, 0);
3279 else
3280 LDRI(r0, r1, 0);
3281 }
3282
3283 static void
_ldi_i(jit_state_t * _jit,jit_int32_t r0,jit_word_t i0)3284 _ldi_i(jit_state_t *_jit, jit_int32_t r0, jit_word_t i0)
3285 {
3286 jit_int32_t reg;
3287 reg = jit_get_reg(jit_class_gpr);
3288 movi(rn(reg), i0);
3289 if (jit_thumb_p())
3290 T2_LDRI(r0, rn(reg), 0);
3291 else
3292 LDRI(r0, rn(reg), 0);
3293 jit_unget_reg(reg);
3294 }
3295
3296 static void
_ldxr_i(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)3297 _ldxr_i(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
3298 {
3299 if (jit_thumb_p()) {
3300 if ((r0|r1|r2) < 8)
3301 T1_LDR(r0, r1, r2);
3302 else
3303 T2_LDR(r0, r1, r2);
3304 }
3305 else
3306 LDR(r0, r1, r2);
3307 }
3308
3309 static void
_ldxi_i(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_word_t i0)3310 _ldxi_i(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_word_t i0)
3311 {
3312 jit_int32_t reg;
3313 if (jit_thumb_p()) {
3314 if ((r0|r1) < 8 && i0 >= 0 && !(i0 & 3) && (i0 >> 2) < 0x20)
3315 T1_LDRI(r0, r1, i0 >> 2);
3316 else if (r1 == _R13_REGNO && r0 < 8 &&
3317 i0 >= 0 && !(i0 & 3) && (i0 >> 2) <= 255)
3318 T1_LDRISP(r0, i0 >> 2);
3319 else if (jit_ldrt_strt_p() && i0 >= 0 && i0 <= 255)
3320 T2_LDRI(r0, r1, i0);
3321 else if (i0 < 0 && i0 > -255)
3322 T2_LDRIN(r0, r1, -i0);
3323 else if (i0 >= 0 && i0 <= 4095)
3324 T2_LDRWI(r0, r1, i0);
3325 else if (r0 != r1) {
3326 movi(r0, i0);
3327 if ((r0|r1) < 8)
3328 T1_LDR(r0, r1, r0);
3329 else
3330 T2_LDR(r0, r1, r0);
3331 }
3332 else {
3333 reg = jit_get_reg(jit_class_gpr);
3334 movi(rn(reg), i0);
3335 if ((r0|r1|rn(reg)) < 8)
3336 T1_LDR(r0, r1, rn(reg));
3337 else
3338 T2_LDR(r0, r1, rn(reg));
3339 jit_unget_reg(reg);
3340 }
3341 }
3342 else {
3343 if (i0 >= 0 && i0 <= 4095)
3344 LDRI(r0, r1, i0);
3345 else if (i0 < 0 && i0 >= -4095)
3346 LDRIN(r0, r1, -i0);
3347 else if (r0 != r1) {
3348 movi(r0, i0);
3349 LDR(r0, r1, r0);
3350 }
3351 else {
3352 reg = jit_get_reg(jit_class_gpr);
3353 movi(rn(reg), i0);
3354 LDR(r0, r1, rn(reg));
3355 jit_unget_reg(reg);
3356 }
3357 }
3358 }
3359
3360 static void
_str_c(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)3361 _str_c(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3362 {
3363 if (jit_thumb_p())
3364 T2_STRBI(r1, r0, 0);
3365 else
3366 STRBI(r1, r0, 0);
3367 }
3368
3369 static void
_sti_c(jit_state_t * _jit,jit_word_t i0,jit_int32_t r0)3370 _sti_c(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0)
3371 {
3372 jit_int32_t reg;
3373 reg = jit_get_reg(jit_class_gpr);
3374 movi(rn(reg), i0);
3375 if (jit_thumb_p())
3376 T2_STRBI(r0, rn(reg), 0);
3377 else
3378 STRBI(r0, rn(reg), 0);
3379 jit_unget_reg(reg);
3380 }
3381
3382 static void
_stxr_c(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)3383 _stxr_c(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
3384 {
3385 if (jit_thumb_p()) {
3386 if ((r0|r1|r2) < 8)
3387 T1_STRB(r2, r1, r0);
3388 else
3389 T2_STRB(r2, r1, r0);
3390 }
3391 else
3392 STRB(r2, r1, r0);
3393 }
3394
3395 static void
_stxi_c(jit_state_t * _jit,jit_word_t i0,jit_int32_t r0,jit_int32_t r1)3396 _stxi_c(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
3397 {
3398 jit_int32_t reg;
3399 if (jit_thumb_p()) {
3400 if ((r0|r1) < 8 && i0 >= 0 && i0 < 0x20)
3401 T1_STRBI(r1, r0, i0);
3402 else if (jit_ldrt_strt_p() && i0 >= 0 && i0 <= 255)
3403 T2_STRBI(r1, r0, i0);
3404 else if (i0 < 0 && i0 >= -255)
3405 T2_STRBIN(r1, r0, -i0);
3406 else if (i0 >= 0 && i0 <= 4095)
3407 T2_STRBWI(r1, r0, i0);
3408 else {
3409 reg = jit_get_reg(jit_class_gpr);
3410 movi(rn(reg), i0);
3411 if ((r0|r1|rn(reg)) < 8)
3412 T1_STRB(r1, r0, rn(reg));
3413 else
3414 T2_STRB(r1, r0, rn(reg));
3415 jit_unget_reg(reg);
3416 }
3417 }
3418 else {
3419 if (i0 >= 0 && i0 <= 4095)
3420 STRBI(r1, r0, i0);
3421 else if (i0 < 0 && i0 >= -4095)
3422 STRBIN(r1, r0, -i0);
3423 else {
3424 reg = jit_get_reg(jit_class_gpr);
3425 movi(rn(reg), i0);
3426 STRB(r1, r0, rn(reg));
3427 jit_unget_reg(reg);
3428 }
3429 }
3430 }
3431
3432 static void
_str_s(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)3433 _str_s(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3434 {
3435 if (jit_thumb_p())
3436 T2_STRHI(r1, r0, 0);
3437 else
3438 STRHI(r1, r0, 0);
3439 }
3440
3441 static void
_sti_s(jit_state_t * _jit,jit_word_t i0,jit_int32_t r0)3442 _sti_s(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0)
3443 {
3444 jit_int32_t reg;
3445 reg = jit_get_reg(jit_class_gpr);
3446 movi(rn(reg), i0);
3447 if (jit_thumb_p())
3448 T2_STRHI(r0, rn(reg), 0);
3449 else
3450 STRHI(r0, rn(reg), 0);
3451 jit_unget_reg(reg);
3452 }
3453
3454 static void
_stxr_s(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)3455 _stxr_s(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
3456 {
3457 if (jit_thumb_p()) {
3458 if ((r0|r1|r2) < 8)
3459 T1_STRH(r2, r1, r0);
3460 else
3461 T2_STRH(r2, r1, r0);
3462 }
3463 else
3464 STRH(r2, r1, r0);
3465 }
3466
3467 static void
_stxi_s(jit_state_t * _jit,jit_word_t i0,jit_int32_t r0,jit_int32_t r1)3468 _stxi_s(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
3469 {
3470 jit_int32_t reg;
3471 if (jit_thumb_p()) {
3472 if ((r0|r1) < 8 && i0 >= 0 && !(i0 & 1) && (i0 >> 1) < 0x20)
3473 T1_STRHI(r1, r0, i0 >> 1);
3474 else if (jit_ldrt_strt_p() && i0 >= 0 && i0 <= 255)
3475 T2_STRHI(r1, r0, i0);
3476 else if (i0 < 0 && i0 >= -255)
3477 T2_STRHIN(r1, r0, -i0);
3478 else if (i0 >= 0 && i0 <= 4095)
3479 T2_STRHWI(r1, r0, i0);
3480 else {
3481 reg = jit_get_reg(jit_class_gpr);
3482 movi(rn(reg), i0);
3483 if ((r0|r1|rn(reg)) < 8)
3484 T1_STRH(r1, r0, rn(reg));
3485 else
3486 T2_STRH(r1, r0, rn(reg));
3487 jit_unget_reg(reg);
3488 }
3489 }
3490 else {
3491 if (i0 >= 0 && i0 <= 255)
3492 STRHI(r1, r0, i0);
3493 else if (i0 < 0 && i0 >= -255)
3494 STRHIN(r1, r0, -i0);
3495 else {
3496 reg = jit_get_reg(jit_class_gpr);
3497 movi(rn(reg), i0);
3498 STRH(r1, r0, rn(reg));
3499 jit_unget_reg(reg);
3500 }
3501 }
3502 }
3503
3504 static void
_str_i(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)3505 _str_i(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3506 {
3507 if (jit_thumb_p())
3508 T2_STRI(r1, r0, 0);
3509 else
3510 STRI(r1, r0, 0);
3511 }
3512
3513 static void
_sti_i(jit_state_t * _jit,jit_word_t i0,jit_int32_t r0)3514 _sti_i(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0)
3515 {
3516 jit_int32_t reg;
3517 reg = jit_get_reg(jit_class_gpr);
3518 movi(rn(reg), i0);
3519 if (jit_thumb_p())
3520 T2_STRI(r0, rn(reg), 0);
3521 else
3522 STRI(r0, rn(reg), 0);
3523 jit_unget_reg(reg);
3524 }
3525
3526 static void
_stxr_i(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1,jit_int32_t r2)3527 _stxr_i(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1, jit_int32_t r2)
3528 {
3529 if (jit_thumb_p()) {
3530 if ((r0|r1|r2) < 8)
3531 T1_STR(r2, r1, r0);
3532 else
3533 T2_STR(r2, r1, r0);
3534 }
3535 else
3536 STR(r2, r1, r0);
3537 }
3538
3539 static void
_stxi_i(jit_state_t * _jit,jit_word_t i0,jit_int32_t r0,jit_int32_t r1)3540 _stxi_i(jit_state_t *_jit, jit_word_t i0, jit_int32_t r0, jit_int32_t r1)
3541 {
3542 jit_int32_t reg;
3543 if (jit_thumb_p()) {
3544 if ((r0|r1) < 8 && i0 >= 0 && !(i0 & 3) && (i0 >> 2) < 0x20)
3545 T1_STRI(r1, r0, i0 >> 2);
3546 else if (r0 == _R13_REGNO && r1 < 8 &&
3547 i0 >= 0 && !(i0 & 3) && (i0 >> 2) <= 255)
3548 T1_STRISP(r1, i0 >> 2);
3549 else if (jit_ldrt_strt_p() && i0 >= 0 && i0 <= 255)
3550 T2_STRI(r1, r0, i0);
3551 else if (i0 < 0 && i0 >= -255)
3552 T2_STRIN(r1, r0, -i0);
3553 else if (i0 >= 0 && i0 <= 4095)
3554 T2_STRWI(r1, r0, i0);
3555 else {
3556 reg = jit_get_reg(jit_class_gpr);
3557 movi(rn(reg), i0);
3558 if ((r0|r1|rn(reg)) < 8)
3559 T1_STR(r1, r0, rn(reg));
3560 else
3561 T2_STR(r1, r0, rn(reg));
3562 jit_unget_reg(reg);
3563 }
3564 }
3565 else {
3566 if (i0 >= 0 && i0 <= 4095)
3567 STRI(r1, r0, i0);
3568 else if (i0 < 0 && i0 >= -4095)
3569 STRIN(r1, r0, -i0);
3570 else {
3571 reg = jit_get_reg(jit_class_gpr);
3572 movi(rn(reg), i0);
3573 STR(r1, r0, rn(reg));
3574 jit_unget_reg(reg);
3575 }
3576 }
3577 }
3578
3579 # if __BYTE_ORDER == __LITTLE_ENDIAN
3580 static void
_htonr_us(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)3581 _htonr_us(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3582 {
3583 jit_int32_t t0;
3584 if (jit_thumb_p()) {
3585 if ((r0|r1) < 8)
3586 T1_REV(r0, r1);
3587 else
3588 T2_REV(r0, r1);
3589 rshi_u(r0, r0, 16);
3590 }
3591 else {
3592 if (jit_armv6_p()) {
3593 REV(r0, r1);
3594 rshi_u(r0, r0, 16);
3595 }
3596 else {
3597 t0 = jit_get_reg(jit_class_gpr);
3598 rshi(rn(t0), r1, 8);
3599 andi(r0, r1, 0xff);
3600 andi(rn(t0), rn(t0), 0xff);
3601 lshi(r0, r0, 8);
3602 orr(r0, r0, rn(t0));
3603 jit_unget_reg(t0);
3604 }
3605 }
3606 }
3607
3608 /* inline glibc htonl (without register clobber) */
3609 static void
_htonr_ui(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)3610 _htonr_ui(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3611 {
3612 jit_int32_t reg;
3613 if (jit_thumb_p()) {
3614 if ((r0|r1) < 8)
3615 T1_REV(r0, r1);
3616 else
3617 T2_REV(r0, r1);
3618 }
3619 else {
3620 if (jit_armv6_p())
3621 REV(r0, r1);
3622 else {
3623 reg = jit_get_reg(jit_class_gpr);
3624 EOR_SI(rn(reg), r1, r1, ARM_ROR, 16);
3625 LSRI(rn(reg), rn(reg), 8);
3626 BICI(rn(reg), rn(reg), encode_arm_immediate(0xff00));
3627 EOR_SI(r0, rn(reg), r1, ARM_ROR, 8);
3628 jit_unget_reg(reg);
3629 }
3630 }
3631 }
3632 #endif
3633
3634 static void
_extr_c(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)3635 _extr_c(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3636 {
3637 if (jit_thumb_p()) {
3638 if ((r0|r1) < 8)
3639 T1_SXTB(r0, r1);
3640 else
3641 T2_SXTB(r0, r1);
3642 }
3643 else {
3644 if (jit_armv6_p())
3645 SXTB(r0, r1);
3646 else {
3647 LSLI(r0, r1, 24);
3648 ASRI(r0, r0, 24);
3649 }
3650 }
3651 }
3652
3653 static void
_extr_uc(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)3654 _extr_uc(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3655 {
3656 if (jit_thumb_p()) {
3657 if ((r0|r1) < 8)
3658 T1_UXTB(r0, r1);
3659 else
3660 T2_UXTB(r0, r1);
3661 }
3662 else {
3663 if (jit_armv6_p())
3664 UXTB(r0, r1);
3665 else
3666 ANDI(r0, r1, 0xff);
3667 }
3668 }
3669
3670 static void
_extr_s(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)3671 _extr_s(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3672 {
3673 if (jit_thumb_p()) {
3674 if ((r0|r1) < 8)
3675 T1_SXTH(r0, r1);
3676 else
3677 T2_SXTH(r0, r1);
3678 }
3679 else {
3680 if (jit_armv6_p())
3681 SXTH(r0, r1);
3682 else {
3683 LSLI(r0, r1, 16);
3684 ASRI(r0, r0, 16);
3685 }
3686 }
3687 }
3688
3689 static void
_extr_us(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)3690 _extr_us(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3691 {
3692 if (jit_thumb_p()) {
3693 if ((r0|r1) < 8)
3694 T1_UXTH(r0, r1);
3695 else
3696 T2_UXTH(r0, r1);
3697 }
3698 else {
3699 if (jit_armv6_p())
3700 UXTH(r0, r1);
3701 else {
3702 LSLI(r0, r1, 16);
3703 LSRI(r0, r0, 16);
3704 }
3705 }
3706 }
3707
3708 static void
_callr(jit_state_t * _jit,jit_int32_t r0)3709 _callr(jit_state_t *_jit, jit_int32_t r0)
3710 {
3711 if (jit_thumb_p())
3712 T1_BLX(r0);
3713 else
3714 BLX(r0);
3715 }
3716
3717 static void
_calli(jit_state_t * _jit,jit_word_t i0)3718 _calli(jit_state_t *_jit, jit_word_t i0)
3719 {
3720 jit_word_t d;
3721 jit_int32_t reg;
3722 d = ((i0 - _jit->pc.w) >> 2) - 2;
3723 if (!jit_exchange_p() && !jit_thumb_p() && _s24P(d))
3724 BLI(d & 0x00ffffff);
3725 else {
3726 reg = jit_get_reg(jit_class_gpr);
3727 movi(rn(reg), i0);
3728 if (jit_thumb_p())
3729 T1_BLX(rn(reg));
3730 else
3731 BLX(rn(reg));
3732 jit_unget_reg(reg);
3733 }
3734 }
3735
3736 static jit_word_t
_calli_p(jit_state_t * _jit,jit_word_t i0)3737 _calli_p(jit_state_t *_jit, jit_word_t i0)
3738 {
3739 jit_word_t w;
3740 jit_int32_t reg;
3741 reg = jit_get_reg(jit_class_gpr);
3742 w = _jit->pc.w;
3743 movi_p(rn(reg), i0);
3744 if (jit_thumb_p())
3745 T1_BLX(rn(reg));
3746 else
3747 BLX(rn(reg));
3748 jit_unget_reg(reg);
3749 return (w);
3750 }
3751
3752 static void
_prolog(jit_state_t * _jit,jit_node_t * node)3753 _prolog(jit_state_t *_jit, jit_node_t *node)
3754 {
3755 jit_int32_t reg;
3756 if (_jitc->function->define_frame || _jitc->function->assume_frame) {
3757 jit_int32_t frame = -_jitc->function->frame;
3758 assert(_jitc->function->self.aoff >= frame);
3759 if (_jitc->function->assume_frame) {
3760 if (jit_thumb_p() && !_jitc->thumb)
3761 _jitc->thumb = _jit->pc.w;
3762 return;
3763 }
3764 _jitc->function->self.aoff = frame;
3765 }
3766 if (_jitc->function->allocar)
3767 _jitc->function->self.aoff &= -8;
3768 _jitc->function->stack = ((_jitc->function->self.alen -
3769 /* align stack at 8 bytes */
3770 _jitc->function->self.aoff) + 7) & -8;
3771
3772 if (jit_thumb_p()) {
3773 /* switch to thumb mode (better approach would be to
3774 * ORR 1 address being called, but no clear distinction
3775 * of what is a pointer to a jit function, or if patching
3776 * a pointer to a jit function) */
3777 ADDI(_R12_REGNO, _R15_REGNO, 1);
3778 BX(_R12_REGNO);
3779 if (!_jitc->thumb)
3780 _jitc->thumb = _jit->pc.w;
3781 if (jit_cpu.abi) {
3782 T2_PUSH(0xf);
3783 T2_PUSH(0x3f0|(1<<_FP_REGNO)|(1<<_LR_REGNO));
3784 VPUSH_F64(_D8_REGNO, 8);
3785 }
3786 else {
3787 T2_PUSH(0xf);
3788 T2_PUSH(0x3f0|(1<<_FP_REGNO)|(1<<_LR_REGNO));
3789 }
3790 }
3791 else {
3792 if (jit_cpu.abi) {
3793 PUSH(0xf);
3794 PUSH(0x3f0|(1<<_FP_REGNO)|(1<<_LR_REGNO));
3795 VPUSH_F64(_D8_REGNO, 8);
3796 }
3797 else {
3798 PUSH(0xf);
3799 PUSH(0x3f0|(1<<_FP_REGNO)|(1<<_LR_REGNO));
3800 }
3801 }
3802 movr(_FP_REGNO, _SP_REGNO);
3803 if (_jitc->function->stack)
3804 subi(_SP_REGNO, _SP_REGNO, _jitc->function->stack);
3805 if (_jitc->function->allocar) {
3806 reg = jit_get_reg(jit_class_gpr);
3807 movi(rn(reg), _jitc->function->self.aoff);
3808 stxi_i(_jitc->function->aoffoff, _FP_REGNO, rn(reg));
3809 jit_unget_reg(reg);
3810 }
3811 }
3812
3813 static void
_epilog(jit_state_t * _jit,jit_node_t * node)3814 _epilog(jit_state_t *_jit, jit_node_t *node)
3815 {
3816 if (_jitc->function->assume_frame)
3817 return;
3818
3819 movr(_SP_REGNO, _FP_REGNO);
3820 if (jit_cpu.abi)
3821 VPOP_F64(_D8_REGNO, 8);
3822 if (jit_thumb_p())
3823 T2_POP(0x3f0|(1<<_FP_REGNO)|(1<<_LR_REGNO));
3824 else
3825 POP(0x3f0|(1<<_FP_REGNO)|(1<<_LR_REGNO));
3826 addi(_SP_REGNO, _SP_REGNO, 16);
3827 if (jit_thumb_p())
3828 T1_BX(_LR_REGNO);
3829 else
3830 BX(_LR_REGNO);
3831 if (jit_thumb_p() && (_jit->pc.w & 2))
3832 T1_NOP();
3833 }
3834
3835 static void
_vastart(jit_state_t * _jit,jit_int32_t r0)3836 _vastart(jit_state_t *_jit, jit_int32_t r0)
3837 {
3838 assert(_jitc->function->self.call & jit_call_varargs);
3839
3840 /* Initialize stack pointer to the first stack argument.
3841 * The -16 is to account for the 4 argument registers
3842 * always saved, and _jitc->function->vagp is to account
3843 * for declared arguments. */
3844 addi(r0, _FP_REGNO, _jitc->function->self.size -
3845 16 + _jitc->function->vagp);
3846 }
3847
3848 static void
_vaarg(jit_state_t * _jit,jit_int32_t r0,jit_int32_t r1)3849 _vaarg(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
3850 {
3851 assert(_jitc->function->self.call & jit_call_varargs);
3852
3853 /* Load argument. */
3854 ldr(r0, r1);
3855
3856 /* Update stack pointer. */
3857 addi(r1, r1, sizeof(jit_word_t));
3858 }
3859
3860 static void
_patch_at(jit_state_t * _jit,jit_int32_t kind,jit_word_t instr,jit_word_t label)3861 _patch_at(jit_state_t *_jit,
3862 jit_int32_t kind, jit_word_t instr, jit_word_t label)
3863 {
3864 jit_word_t d;
3865 jit_thumb_t thumb;
3866 union {
3867 jit_int16_t *s;
3868 jit_int32_t *i;
3869 jit_word_t w;
3870 } u;
3871 u.w = instr;
3872 if (kind == arm_patch_jump) {
3873 if (jit_thumb_p() && (jit_uword_t)instr >= _jitc->thumb) {
3874 code2thumb(thumb.s[0], thumb.s[1], u.s[0], u.s[1]);
3875 if ((thumb.i & THUMB2_B) == THUMB2_B) {
3876 d = ((label - instr) >> 1) - 2;
3877 assert(_s24P(d));
3878 thumb.i = THUMB2_B | encode_thumb_jump(d);
3879 thumb2code(thumb.s[0], thumb.s[1], u.s[0], u.s[1]);
3880 }
3881 else if ((thumb.i & THUMB2_B) == THUMB2_CC_B) {
3882 d = ((label - instr) >> 1) - 2;
3883 assert(_s20P(d));
3884 thumb.i = THUMB2_CC_B | (thumb.i & 0x3c00000) |
3885 encode_thumb_cc_jump(d);
3886 thumb2code(thumb.s[0], thumb.s[1], u.s[0], u.s[1]);
3887 }
3888 else {
3889 /* for the sake of simplicity in case choose to
3890 * movw+movt+[bx|blx], e.g. if changing to instead
3891 * of asserting target is reachable, load constant
3892 * and do indirect jump if not reachable */
3893 if ((thumb.i & 0xfbf00000) == THUMB2_MOVWI)
3894 goto indirect_jump;
3895 assert(!"handled branch opcode");
3896 }
3897 }
3898 else {
3899 thumb.i = u.i[0];
3900 /* 0x0e000000 because 0x01000000 is (branch&) link modifier */
3901 assert((thumb.i & 0x0e000000) == ARM_B);
3902 d = ((label - instr) >> 2) - 2;
3903 assert(_s24P(d));
3904 u.i[0] = (thumb.i & 0xff000000) | (d & 0x00ffffff);
3905 }
3906 }
3907 else if (kind == arm_patch_load) {
3908 /* offset may be negative for a forward patch because it
3909 * is relative to pc + 8, for example:
3910 * ldr r0, [pc, #-4]
3911 * bx r0 ;; [pc, #-8]
3912 * .data ... ;; [pc, #-4]
3913 * ... ;; [pc]
3914 */
3915 assert(!jit_thumb_p());
3916 thumb.i = u.i[0];
3917 assert((thumb.i & 0x0f700000) == ARM_LDRI);
3918 d = label - (instr + 8);
3919 if (d < 0) {
3920 thumb.i &= ~ARM_P;
3921 d = -d;
3922 }
3923 else
3924 thumb.i |= ARM_P;
3925 assert(!(d & 0xfffff000));
3926 u.i[0] = (thumb.i & 0xfffff000) | d;
3927 }
3928 else if (kind == arm_patch_word) {
3929 if (jit_thumb_p()) {
3930 code2thumb(thumb.s[0], thumb.s[1], u.s[0], u.s[1]);
3931 assert((thumb.i & 0xfbf00000) == THUMB2_MOVWI);
3932 indirect_jump:
3933 thumb.i = ((thumb.i & 0xfbf00f00) |
3934 ( (label & 0x0000f000) << 4) |
3935 ( (label & 0x00000800) << 15) |
3936 ( (label & 0x00000700) << 4) |
3937 ( label & 0x000000ff));
3938 thumb2code(thumb.s[0], thumb.s[1], u.s[0], u.s[1]);
3939 label >>= 16;
3940 code2thumb(thumb.s[0], thumb.s[1], u.s[2], u.s[3]);
3941 assert((thumb.i & 0xfbf00000) == THUMB2_MOVTI);
3942 thumb.i = ((thumb.i & 0xfbf00f00) |
3943 ( (label & 0x0000f000) << 4) |
3944 ( (label & 0x00000800) << 15) |
3945 ( (label & 0x00000700) << 4) |
3946 ( label & 0x000000ff));
3947 thumb2code(thumb.s[0], thumb.s[1], u.s[2], u.s[3]);
3948 }
3949 else
3950 u.i[0] = label;
3951 }
3952 else
3953 assert(!"handled patch");
3954 }
3955 #endif
3956