1 /*
2 * Copyright (C) 2014-2020 Paul Cercueil <paul@crapouillou.net>
3 *
4 * This library is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU Lesser General Public
6 * License as published by the Free Software Foundation; either
7 * version 2.1 of the License, or (at your option) any later version.
8 *
9 * This library is distributed in the hope that it will be useful,
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
12 * Lesser General Public License for more details.
13 */
14
15 #include "blockcache.h"
16 #include "debug.h"
17 #include "disassembler.h"
18 #include "emitter.h"
19 #include "optimizer.h"
20 #include "regcache.h"
21
22 #include <lightning.h>
23 #include <stdbool.h>
24 #include <stddef.h>
25
26 typedef void (*lightrec_rec_func_t)(const struct block *,
27 const struct opcode *, u32);
28
29 /* Forward declarations */
30 static void rec_SPECIAL(const struct block *block,
31 const struct opcode *op, u32 pc);
32 static void rec_REGIMM(const struct block *block,
33 const struct opcode *op, u32 pc);
34 static void rec_CP0(const struct block *block, const struct opcode *op, u32 pc);
35 static void rec_CP2(const struct block *block, const struct opcode *op, u32 pc);
36
37
unknown_opcode(const struct block * block,const struct opcode * op,u32 pc)38 static void unknown_opcode(const struct block *block,
39 const struct opcode *op, u32 pc)
40 {
41 pr_warn("Unknown opcode: 0x%08x at PC 0x%08x\n", op->opcode, pc);
42 }
43
lightrec_emit_end_of_block(const struct block * block,const struct opcode * op,u32 pc,s8 reg_new_pc,u32 imm,u8 ra_reg,u32 link,bool update_cycles)44 static void lightrec_emit_end_of_block(const struct block *block,
45 const struct opcode *op, u32 pc,
46 s8 reg_new_pc, u32 imm, u8 ra_reg,
47 u32 link, bool update_cycles)
48 {
49 struct lightrec_state *state = block->state;
50 struct regcache *reg_cache = state->reg_cache;
51 u32 cycles = state->cycles;
52 jit_state_t *_jit = block->_jit;
53
54 jit_note(__FILE__, __LINE__);
55
56 if (link) {
57 /* Update the $ra register */
58 u8 link_reg = lightrec_alloc_reg_out(reg_cache, _jit, ra_reg);
59 jit_movi(link_reg, link);
60 lightrec_free_reg(reg_cache, link_reg);
61 }
62
63 if (reg_new_pc < 0) {
64 reg_new_pc = lightrec_alloc_reg(reg_cache, _jit, JIT_V0);
65 lightrec_lock_reg(reg_cache, _jit, reg_new_pc);
66
67 jit_movi(reg_new_pc, imm);
68 }
69
70 if (has_delay_slot(op->c) &&
71 !(op->flags & (LIGHTREC_NO_DS | LIGHTREC_LOCAL_BRANCH))) {
72 cycles += lightrec_cycles_of_opcode(op->next->c);
73
74 /* Recompile the delay slot */
75 if (op->next->c.opcode)
76 lightrec_rec_opcode(block, op->next, pc + 4);
77 }
78
79 /* Store back remaining registers */
80 lightrec_storeback_regs(reg_cache, _jit);
81
82 jit_movr(JIT_V0, reg_new_pc);
83
84 if (cycles && update_cycles) {
85 jit_subi(LIGHTREC_REG_CYCLE, LIGHTREC_REG_CYCLE, cycles);
86 pr_debug("EOB: %u cycles\n", cycles);
87 }
88
89 if (op->next && ((op->flags & LIGHTREC_NO_DS) || op->next->next))
90 state->branches[state->nb_branches++] = jit_jmpi();
91 }
92
lightrec_emit_eob(const struct block * block,const struct opcode * op,u32 pc)93 void lightrec_emit_eob(const struct block *block,
94 const struct opcode *op, u32 pc)
95 {
96 struct lightrec_state *state = block->state;
97 struct regcache *reg_cache = state->reg_cache;
98 jit_state_t *_jit = block->_jit;
99
100 lightrec_storeback_regs(reg_cache, _jit);
101
102 jit_movi(JIT_V0, pc);
103 jit_subi(LIGHTREC_REG_CYCLE, LIGHTREC_REG_CYCLE,
104 state->cycles - lightrec_cycles_of_opcode(op->c));
105
106 state->branches[state->nb_branches++] = jit_jmpi();
107 }
108
rec_special_JR(const struct block * block,const struct opcode * op,u32 pc)109 static void rec_special_JR(const struct block *block,
110 const struct opcode *op, u32 pc)
111 {
112 struct regcache *reg_cache = block->state->reg_cache;
113 jit_state_t *_jit = block->_jit;
114 u8 rs = lightrec_request_reg_in(reg_cache, _jit, op->r.rs, JIT_V0);
115
116 _jit_name(block->_jit, __func__);
117 lightrec_lock_reg(reg_cache, _jit, rs);
118 lightrec_emit_end_of_block(block, op, pc, rs, 0, 31, 0, true);
119 }
120
rec_special_JALR(const struct block * block,const struct opcode * op,u32 pc)121 static void rec_special_JALR(const struct block *block,
122 const struct opcode *op, u32 pc)
123 {
124 struct regcache *reg_cache = block->state->reg_cache;
125 jit_state_t *_jit = block->_jit;
126 u8 rs = lightrec_request_reg_in(reg_cache, _jit, op->r.rs, JIT_V0);
127
128 _jit_name(block->_jit, __func__);
129 lightrec_lock_reg(reg_cache, _jit, rs);
130 lightrec_emit_end_of_block(block, op, pc, rs, 0, op->r.rd, pc + 8, true);
131 }
132
rec_J(const struct block * block,const struct opcode * op,u32 pc)133 static void rec_J(const struct block *block, const struct opcode *op, u32 pc)
134 {
135 _jit_name(block->_jit, __func__);
136 lightrec_emit_end_of_block(block, op, pc, -1,
137 (pc & 0xf0000000) | (op->j.imm << 2), 31, 0, true);
138 }
139
rec_JAL(const struct block * block,const struct opcode * op,u32 pc)140 static void rec_JAL(const struct block *block, const struct opcode *op, u32 pc)
141 {
142 _jit_name(block->_jit, __func__);
143 lightrec_emit_end_of_block(block, op, pc, -1,
144 (pc & 0xf0000000) | (op->j.imm << 2),
145 31, pc + 8, true);
146 }
147
rec_b(const struct block * block,const struct opcode * op,u32 pc,jit_code_t code,u32 link,bool unconditional,bool bz)148 static void rec_b(const struct block *block, const struct opcode *op, u32 pc,
149 jit_code_t code, u32 link, bool unconditional, bool bz)
150 {
151 struct regcache *reg_cache = block->state->reg_cache;
152 struct native_register *regs_backup;
153 jit_state_t *_jit = block->_jit;
154 struct lightrec_branch *branch;
155 jit_node_t *addr;
156 u8 link_reg;
157 u32 offset, cycles = block->state->cycles;
158 bool is_forward = (s16)op->i.imm >= -1;
159
160 jit_note(__FILE__, __LINE__);
161
162 if (!(op->flags & LIGHTREC_NO_DS))
163 cycles += lightrec_cycles_of_opcode(op->next->c);
164
165 block->state->cycles = 0;
166
167 if (cycles)
168 jit_subi(LIGHTREC_REG_CYCLE, LIGHTREC_REG_CYCLE, cycles);
169
170 if (!unconditional) {
171 u8 rs = lightrec_alloc_reg_in_ext(reg_cache, _jit, op->i.rs),
172 rt = bz ? 0 : lightrec_alloc_reg_in_ext(reg_cache,
173 _jit, op->i.rt);
174
175 /* Generate the branch opcode */
176 addr = jit_new_node_pww(code, NULL, rs, rt);
177
178 lightrec_free_regs(reg_cache);
179 regs_backup = lightrec_regcache_enter_branch(reg_cache);
180 }
181
182 if (op->flags & LIGHTREC_LOCAL_BRANCH) {
183 if (op->next && !(op->flags & LIGHTREC_NO_DS)) {
184 /* Recompile the delay slot */
185 if (op->next->opcode)
186 lightrec_rec_opcode(block, op->next, pc + 4);
187 }
188
189 if (link) {
190 /* Update the $ra register */
191 link_reg = lightrec_alloc_reg_out(reg_cache, _jit, 31);
192 jit_movi(link_reg, link);
193 lightrec_free_reg(reg_cache, link_reg);
194 }
195
196 /* Store back remaining registers */
197 lightrec_storeback_regs(reg_cache, _jit);
198
199 offset = op->offset + 1 + (s16)op->i.imm;
200 pr_debug("Adding local branch to offset 0x%x\n", offset << 2);
201 branch = &block->state->local_branches[
202 block->state->nb_local_branches++];
203
204 branch->target = offset;
205 if (is_forward)
206 branch->branch = jit_jmpi();
207 else
208 branch->branch = jit_bgti(LIGHTREC_REG_CYCLE, 0);
209 }
210
211 if (!(op->flags & LIGHTREC_LOCAL_BRANCH) || !is_forward) {
212 lightrec_emit_end_of_block(block, op, pc, -1,
213 pc + 4 + ((s16)op->i.imm << 2),
214 31, link, false);
215 }
216
217 if (!unconditional) {
218 jit_patch(addr);
219 lightrec_regcache_leave_branch(reg_cache, regs_backup);
220
221 if (bz && link) {
222 /* Update the $ra register */
223 link_reg = lightrec_alloc_reg_out_ext(reg_cache,
224 _jit, 31);
225 jit_movi(link_reg, (s32)link);
226 lightrec_free_reg(reg_cache, link_reg);
227 }
228
229 if (!(op->flags & LIGHTREC_NO_DS) && op->next->opcode)
230 lightrec_rec_opcode(block, op->next, pc + 4);
231 }
232 }
233
rec_BNE(const struct block * block,const struct opcode * op,u32 pc)234 static void rec_BNE(const struct block *block, const struct opcode *op, u32 pc)
235 {
236 _jit_name(block->_jit, __func__);
237 rec_b(block, op, pc, jit_code_beqr, 0, false, false);
238 }
239
rec_BEQ(const struct block * block,const struct opcode * op,u32 pc)240 static void rec_BEQ(const struct block *block, const struct opcode *op, u32 pc)
241 {
242 _jit_name(block->_jit, __func__);
243 rec_b(block, op, pc, jit_code_bner, 0,
244 op->i.rs == op->i.rt, false);
245 }
246
rec_BLEZ(const struct block * block,const struct opcode * op,u32 pc)247 static void rec_BLEZ(const struct block *block, const struct opcode *op, u32 pc)
248 {
249 _jit_name(block->_jit, __func__);
250 rec_b(block, op, pc, jit_code_bgti, 0, op->i.rs == 0, true);
251 }
252
rec_BGTZ(const struct block * block,const struct opcode * op,u32 pc)253 static void rec_BGTZ(const struct block *block, const struct opcode *op, u32 pc)
254 {
255 _jit_name(block->_jit, __func__);
256 rec_b(block, op, pc, jit_code_blei, 0, false, true);
257 }
258
rec_regimm_BLTZ(const struct block * block,const struct opcode * op,u32 pc)259 static void rec_regimm_BLTZ(const struct block *block,
260 const struct opcode *op, u32 pc)
261 {
262 _jit_name(block->_jit, __func__);
263 rec_b(block, op, pc, jit_code_bgei, 0, false, true);
264 }
265
rec_regimm_BLTZAL(const struct block * block,const struct opcode * op,u32 pc)266 static void rec_regimm_BLTZAL(const struct block *block,
267 const struct opcode *op, u32 pc)
268 {
269 _jit_name(block->_jit, __func__);
270 rec_b(block, op, pc, jit_code_bgei, pc + 8, false, true);
271 }
272
rec_regimm_BGEZ(const struct block * block,const struct opcode * op,u32 pc)273 static void rec_regimm_BGEZ(const struct block *block,
274 const struct opcode *op, u32 pc)
275 {
276 _jit_name(block->_jit, __func__);
277 rec_b(block, op, pc, jit_code_blti, 0, !op->i.rs, true);
278 }
279
rec_regimm_BGEZAL(const struct block * block,const struct opcode * op,u32 pc)280 static void rec_regimm_BGEZAL(const struct block *block,
281 const struct opcode *op, u32 pc)
282 {
283 _jit_name(block->_jit, __func__);
284 rec_b(block, op, pc, jit_code_blti, pc + 8, !op->i.rs, true);
285 }
286
rec_alu_imm(const struct block * block,const struct opcode * op,jit_code_t code,bool sign_extend)287 static void rec_alu_imm(const struct block *block, const struct opcode *op,
288 jit_code_t code, bool sign_extend)
289 {
290 struct regcache *reg_cache = block->state->reg_cache;
291 jit_state_t *_jit = block->_jit;
292 u8 rs, rt;
293
294 jit_note(__FILE__, __LINE__);
295 rs = lightrec_alloc_reg_in_ext(reg_cache, _jit, op->i.rs);
296 rt = lightrec_alloc_reg_out_ext(reg_cache, _jit, op->i.rt);
297
298 if (sign_extend)
299 jit_new_node_www(code, rt, rs, (s32)(s16) op->i.imm);
300 else
301 jit_new_node_www(code, rt, rs, (u32)(u16) op->i.imm);
302
303 lightrec_free_reg(reg_cache, rs);
304 lightrec_free_reg(reg_cache, rt);
305 }
306
rec_alu_special(const struct block * block,const struct opcode * op,jit_code_t code,bool out_ext)307 static void rec_alu_special(const struct block *block, const struct opcode *op,
308 jit_code_t code, bool out_ext)
309 {
310 struct regcache *reg_cache = block->state->reg_cache;
311 jit_state_t *_jit = block->_jit;
312 u8 rd, rt, rs;
313
314 jit_note(__FILE__, __LINE__);
315 rs = lightrec_alloc_reg_in_ext(reg_cache, _jit, op->r.rs);
316 rt = lightrec_alloc_reg_in_ext(reg_cache, _jit, op->r.rt);
317
318 if (out_ext)
319 rd = lightrec_alloc_reg_out_ext(reg_cache, _jit, op->r.rd);
320 else
321 rd = lightrec_alloc_reg_out(reg_cache, _jit, op->r.rd);
322
323 jit_new_node_www(code, rd, rs, rt);
324
325 lightrec_free_reg(reg_cache, rs);
326 lightrec_free_reg(reg_cache, rt);
327 lightrec_free_reg(reg_cache, rd);
328 }
329
rec_alu_shiftv(const struct block * block,const struct opcode * op,jit_code_t code)330 static void rec_alu_shiftv(const struct block *block,
331 const struct opcode *op, jit_code_t code)
332 {
333 struct regcache *reg_cache = block->state->reg_cache;
334 jit_state_t *_jit = block->_jit;
335 u8 rd, rt, rs, temp;
336
337 jit_note(__FILE__, __LINE__);
338 rs = lightrec_alloc_reg_in(reg_cache, _jit, op->r.rs);
339 temp = lightrec_alloc_reg_temp(reg_cache, _jit);
340
341 if (code == jit_code_rshr) {
342 rt = lightrec_alloc_reg_in_ext(reg_cache, _jit, op->r.rt);
343 rd = lightrec_alloc_reg_out_ext(reg_cache, _jit, op->r.rd);
344 } else {
345 rt = lightrec_alloc_reg_in(reg_cache, _jit, op->r.rt);
346 rd = lightrec_alloc_reg_out(reg_cache, _jit, op->r.rd);
347 }
348
349 jit_andi(temp, rs, 0x1f);
350
351 #if __WORDSIZE == 64
352 if (code == jit_code_rshr_u) {
353 jit_extr_ui(rd, rt);
354 jit_new_node_www(code, rd, rd, temp);
355 }
356 #endif
357
358 if (__WORDSIZE == 32 || code != jit_code_rshr_u)
359 jit_new_node_www(code, rd, rt, temp);
360
361 lightrec_free_reg(reg_cache, rs);
362 lightrec_free_reg(reg_cache, temp);
363 lightrec_free_reg(reg_cache, rt);
364 lightrec_free_reg(reg_cache, rd);
365 }
366
rec_ADDIU(const struct block * block,const struct opcode * op,u32 pc)367 static void rec_ADDIU(const struct block *block,
368 const struct opcode *op, u32 pc)
369 {
370 _jit_name(block->_jit, __func__);
371 rec_alu_imm(block, op, jit_code_addi, true);
372 }
373
rec_ADDI(const struct block * block,const struct opcode * op,u32 pc)374 static void rec_ADDI(const struct block *block, const struct opcode *op, u32 pc)
375 {
376 /* TODO: Handle the exception? */
377 _jit_name(block->_jit, __func__);
378 rec_alu_imm(block, op, jit_code_addi, true);
379 }
380
rec_SLTIU(const struct block * block,const struct opcode * op,u32 pc)381 static void rec_SLTIU(const struct block *block,
382 const struct opcode *op, u32 pc)
383 {
384 _jit_name(block->_jit, __func__);
385 rec_alu_imm(block, op, jit_code_lti_u, true);
386 }
387
rec_SLTI(const struct block * block,const struct opcode * op,u32 pc)388 static void rec_SLTI(const struct block *block, const struct opcode *op, u32 pc)
389 {
390 _jit_name(block->_jit, __func__);
391 rec_alu_imm(block, op, jit_code_lti, true);
392 }
393
rec_ANDI(const struct block * block,const struct opcode * op,u32 pc)394 static void rec_ANDI(const struct block *block, const struct opcode *op, u32 pc)
395 {
396 struct regcache *reg_cache = block->state->reg_cache;
397 jit_state_t *_jit = block->_jit;
398 u8 rs, rt;
399
400 _jit_name(block->_jit, __func__);
401 jit_note(__FILE__, __LINE__);
402 rs = lightrec_alloc_reg_in(reg_cache, _jit, op->i.rs);
403 rt = lightrec_alloc_reg_out_ext(reg_cache, _jit, op->i.rt);
404
405 /* PSX code uses ANDI 0xff / ANDI 0xffff a lot, which are basically
406 * casts to uint8_t / uint16_t. */
407 if (op->i.imm == 0xff)
408 jit_extr_uc(rt, rs);
409 else if (op->i.imm == 0xffff)
410 jit_extr_us(rt, rs);
411 else
412 jit_andi(rt, rs, (u32)(u16) op->i.imm);
413
414 lightrec_free_reg(reg_cache, rs);
415 lightrec_free_reg(reg_cache, rt);
416 }
417
rec_ORI(const struct block * block,const struct opcode * op,u32 pc)418 static void rec_ORI(const struct block *block, const struct opcode *op, u32 pc)
419 {
420 _jit_name(block->_jit, __func__);
421 rec_alu_imm(block, op, jit_code_ori, false);
422 }
423
rec_XORI(const struct block * block,const struct opcode * op,u32 pc)424 static void rec_XORI(const struct block *block, const struct opcode *op, u32 pc)
425 {
426 _jit_name(block->_jit, __func__);
427 rec_alu_imm(block, op, jit_code_xori, false);
428 }
429
rec_LUI(const struct block * block,const struct opcode * op,u32 pc)430 static void rec_LUI(const struct block *block, const struct opcode *op, u32 pc)
431 {
432 struct regcache *reg_cache = block->state->reg_cache;
433 jit_state_t *_jit = block->_jit;
434 u8 rt;
435
436 jit_name(__func__);
437 jit_note(__FILE__, __LINE__);
438 rt = lightrec_alloc_reg_out_ext(reg_cache, _jit, op->i.rt);
439
440 jit_movi(rt, (s32)(op->i.imm << 16));
441
442 lightrec_free_reg(reg_cache, rt);
443 }
444
rec_special_ADDU(const struct block * block,const struct opcode * op,u32 pc)445 static void rec_special_ADDU(const struct block *block,
446 const struct opcode *op, u32 pc)
447 {
448 _jit_name(block->_jit, __func__);
449 rec_alu_special(block, op, jit_code_addr, false);
450 }
451
rec_special_ADD(const struct block * block,const struct opcode * op,u32 pc)452 static void rec_special_ADD(const struct block *block,
453 const struct opcode *op, u32 pc)
454 {
455 /* TODO: Handle the exception? */
456 _jit_name(block->_jit, __func__);
457 rec_alu_special(block, op, jit_code_addr, false);
458 }
459
rec_special_SUBU(const struct block * block,const struct opcode * op,u32 pc)460 static void rec_special_SUBU(const struct block *block,
461 const struct opcode *op, u32 pc)
462 {
463 _jit_name(block->_jit, __func__);
464 rec_alu_special(block, op, jit_code_subr, false);
465 }
466
rec_special_SUB(const struct block * block,const struct opcode * op,u32 pc)467 static void rec_special_SUB(const struct block *block,
468 const struct opcode *op, u32 pc)
469 {
470 /* TODO: Handle the exception? */
471 _jit_name(block->_jit, __func__);
472 rec_alu_special(block, op, jit_code_subr, false);
473 }
474
rec_special_AND(const struct block * block,const struct opcode * op,u32 pc)475 static void rec_special_AND(const struct block *block,
476 const struct opcode *op, u32 pc)
477 {
478 _jit_name(block->_jit, __func__);
479 rec_alu_special(block, op, jit_code_andr, false);
480 }
481
rec_special_OR(const struct block * block,const struct opcode * op,u32 pc)482 static void rec_special_OR(const struct block *block,
483 const struct opcode *op, u32 pc)
484 {
485 _jit_name(block->_jit, __func__);
486 rec_alu_special(block, op, jit_code_orr, false);
487 }
488
rec_special_XOR(const struct block * block,const struct opcode * op,u32 pc)489 static void rec_special_XOR(const struct block *block,
490 const struct opcode *op, u32 pc)
491 {
492 _jit_name(block->_jit, __func__);
493 rec_alu_special(block, op, jit_code_xorr, false);
494 }
495
rec_special_NOR(const struct block * block,const struct opcode * op,u32 pc)496 static void rec_special_NOR(const struct block *block,
497 const struct opcode *op, u32 pc)
498 {
499 struct regcache *reg_cache = block->state->reg_cache;
500 jit_state_t *_jit = block->_jit;
501 u8 rd;
502
503 jit_name(__func__);
504 rec_alu_special(block, op, jit_code_orr, false);
505 rd = lightrec_alloc_reg_out(reg_cache, _jit, op->r.rd);
506
507 jit_comr(rd, rd);
508
509 lightrec_free_reg(reg_cache, rd);
510 }
511
rec_special_SLTU(const struct block * block,const struct opcode * op,u32 pc)512 static void rec_special_SLTU(const struct block *block,
513 const struct opcode *op, u32 pc)
514 {
515 _jit_name(block->_jit, __func__);
516 rec_alu_special(block, op, jit_code_ltr_u, true);
517 }
518
rec_special_SLT(const struct block * block,const struct opcode * op,u32 pc)519 static void rec_special_SLT(const struct block *block,
520 const struct opcode *op, u32 pc)
521 {
522 _jit_name(block->_jit, __func__);
523 rec_alu_special(block, op, jit_code_ltr, true);
524 }
525
rec_special_SLLV(const struct block * block,const struct opcode * op,u32 pc)526 static void rec_special_SLLV(const struct block *block,
527 const struct opcode *op, u32 pc)
528 {
529 _jit_name(block->_jit, __func__);
530 rec_alu_shiftv(block, op, jit_code_lshr);
531 }
532
rec_special_SRLV(const struct block * block,const struct opcode * op,u32 pc)533 static void rec_special_SRLV(const struct block *block,
534 const struct opcode *op, u32 pc)
535 {
536 _jit_name(block->_jit, __func__);
537 rec_alu_shiftv(block, op, jit_code_rshr_u);
538 }
539
rec_special_SRAV(const struct block * block,const struct opcode * op,u32 pc)540 static void rec_special_SRAV(const struct block *block,
541 const struct opcode *op, u32 pc)
542 {
543 _jit_name(block->_jit, __func__);
544 rec_alu_shiftv(block, op, jit_code_rshr);
545 }
546
rec_alu_shift(const struct block * block,const struct opcode * op,jit_code_t code)547 static void rec_alu_shift(const struct block *block,
548 const struct opcode *op, jit_code_t code)
549 {
550 struct regcache *reg_cache = block->state->reg_cache;
551 jit_state_t *_jit = block->_jit;
552 u8 rd, rt;
553
554 jit_note(__FILE__, __LINE__);
555
556 if (code == jit_code_rshi) {
557 rt = lightrec_alloc_reg_in_ext(reg_cache, _jit, op->r.rt);
558 rd = lightrec_alloc_reg_out_ext(reg_cache, _jit, op->r.rd);
559 } else {
560 rt = lightrec_alloc_reg_in(reg_cache, _jit, op->r.rt);
561 rd = lightrec_alloc_reg_out(reg_cache, _jit, op->r.rd);
562 }
563
564 #if __WORDSIZE == 64
565 if (code == jit_code_rshi_u) {
566 jit_extr_ui(rd, rt);
567 jit_new_node_www(code, rd, rd, op->r.imm);
568 }
569 #endif
570 if (__WORDSIZE == 32 || code != jit_code_rshi_u)
571 jit_new_node_www(code, rd, rt, op->r.imm);
572
573 lightrec_free_reg(reg_cache, rt);
574 lightrec_free_reg(reg_cache, rd);
575 }
576
rec_special_SLL(const struct block * block,const struct opcode * op,u32 pc)577 static void rec_special_SLL(const struct block *block,
578 const struct opcode *op, u32 pc)
579 {
580 _jit_name(block->_jit, __func__);
581 rec_alu_shift(block, op, jit_code_lshi);
582 }
583
rec_special_SRL(const struct block * block,const struct opcode * op,u32 pc)584 static void rec_special_SRL(const struct block *block,
585 const struct opcode *op, u32 pc)
586 {
587 _jit_name(block->_jit, __func__);
588 rec_alu_shift(block, op, jit_code_rshi_u);
589 }
590
rec_special_SRA(const struct block * block,const struct opcode * op,u32 pc)591 static void rec_special_SRA(const struct block *block,
592 const struct opcode *op, u32 pc)
593 {
594 _jit_name(block->_jit, __func__);
595 rec_alu_shift(block, op, jit_code_rshi);
596 }
597
rec_alu_mult(const struct block * block,const struct opcode * op,bool is_signed)598 static void rec_alu_mult(const struct block *block,
599 const struct opcode *op, bool is_signed)
600 {
601 struct regcache *reg_cache = block->state->reg_cache;
602 jit_state_t *_jit = block->_jit;
603 u8 lo, hi, rs, rt;
604
605 jit_note(__FILE__, __LINE__);
606
607 lo = lightrec_alloc_reg_out(reg_cache, _jit, REG_LO);
608 if (!(op->flags & LIGHTREC_MULT32))
609 hi = lightrec_alloc_reg_out_ext(reg_cache, _jit, REG_HI);
610 else if (__WORDSIZE == 64)
611 hi = lightrec_alloc_reg_temp(reg_cache, _jit);
612
613 if (__WORDSIZE == 32 || !is_signed) {
614 rs = lightrec_alloc_reg_in(reg_cache, _jit, op->r.rs);
615 rt = lightrec_alloc_reg_in(reg_cache, _jit, op->r.rt);
616 } else {
617 rs = lightrec_alloc_reg_in_ext(reg_cache, _jit, op->r.rs);
618 rt = lightrec_alloc_reg_in_ext(reg_cache, _jit, op->r.rt);
619 }
620
621 #if __WORDSIZE == 32
622 /* On 32-bit systems, do a 32*32->64 bit operation, or a 32*32->32 bit
623 * operation if the MULT was detected a 32-bit only. */
624 if (!(op->flags & LIGHTREC_MULT32)) {
625 if (is_signed)
626 jit_qmulr(lo, hi, rs, rt);
627 else
628 jit_qmulr_u(lo, hi, rs, rt);
629 } else {
630 jit_mulr(lo, rs, rt);
631 }
632 #else
633 /* On 64-bit systems, do a 64*64->64 bit operation.
634 * The input registers must be 32 bits, so we first sign-extend (if
635 * mult) or clear (if multu) the input registers. */
636 if (is_signed) {
637 jit_mulr(lo, rs, rt);
638 } else {
639 jit_extr_ui(lo, rt);
640 jit_extr_ui(hi, rs);
641 jit_mulr(lo, hi, lo);
642 }
643
644 /* The 64-bit output value is in $lo, store the upper 32 bits in $hi */
645 if (!(op->flags & LIGHTREC_MULT32))
646 jit_rshi(hi, lo, 32);
647 #endif
648
649 lightrec_free_reg(reg_cache, rs);
650 lightrec_free_reg(reg_cache, rt);
651 lightrec_free_reg(reg_cache, lo);
652 if (__WORDSIZE == 64 || !(op->flags & LIGHTREC_MULT32))
653 lightrec_free_reg(reg_cache, hi);
654 }
655
rec_alu_div(const struct block * block,const struct opcode * op,bool is_signed)656 static void rec_alu_div(const struct block *block,
657 const struct opcode *op, bool is_signed)
658 {
659 struct regcache *reg_cache = block->state->reg_cache;
660 jit_state_t *_jit = block->_jit;
661 jit_node_t *branch, *to_end;
662 u8 lo, hi, rs, rt;
663
664 jit_note(__FILE__, __LINE__);
665 lo = lightrec_alloc_reg_out(reg_cache, _jit, REG_LO);
666 hi = lightrec_alloc_reg_out(reg_cache, _jit, REG_HI);
667
668 if (__WORDSIZE == 32 || !is_signed) {
669 rs = lightrec_alloc_reg_in(reg_cache, _jit, op->r.rs);
670 rt = lightrec_alloc_reg_in(reg_cache, _jit, op->r.rt);
671 } else {
672 rs = lightrec_alloc_reg_in_ext(reg_cache, _jit, op->r.rs);
673 rt = lightrec_alloc_reg_in_ext(reg_cache, _jit, op->r.rt);
674 }
675
676 /* Jump to special handler if dividing by zero */
677 branch = jit_beqi(rt, 0);
678
679 #if __WORDSIZE == 32
680 if (is_signed)
681 jit_qdivr(lo, hi, rs, rt);
682 else
683 jit_qdivr_u(lo, hi, rs, rt);
684 #else
685 /* On 64-bit systems, the input registers must be 32 bits, so we first sign-extend
686 * (if div) or clear (if divu) the input registers. */
687 if (is_signed) {
688 jit_qdivr(lo, hi, rs, rt);
689 } else {
690 jit_extr_ui(lo, rt);
691 jit_extr_ui(hi, rs);
692 jit_qdivr_u(lo, hi, hi, lo);
693 }
694 #endif
695
696 /* Jump above the div-by-zero handler */
697 to_end = jit_jmpi();
698
699 jit_patch(branch);
700
701 if (is_signed) {
702 jit_lti(lo, rs, 0);
703 jit_lshi(lo, lo, 1);
704 jit_subi(lo, lo, 1);
705 } else {
706 jit_movi(lo, 0xffffffff);
707 }
708
709 jit_movr(hi, rs);
710
711 jit_patch(to_end);
712
713 lightrec_free_reg(reg_cache, rs);
714 lightrec_free_reg(reg_cache, rt);
715 lightrec_free_reg(reg_cache, lo);
716 lightrec_free_reg(reg_cache, hi);
717 }
718
rec_special_MULT(const struct block * block,const struct opcode * op,u32 pc)719 static void rec_special_MULT(const struct block *block,
720 const struct opcode *op, u32 pc)
721 {
722 _jit_name(block->_jit, __func__);
723 rec_alu_mult(block, op, true);
724 }
725
rec_special_MULTU(const struct block * block,const struct opcode * op,u32 pc)726 static void rec_special_MULTU(const struct block *block,
727 const struct opcode *op, u32 pc)
728 {
729 _jit_name(block->_jit, __func__);
730 rec_alu_mult(block, op, false);
731 }
732
rec_special_DIV(const struct block * block,const struct opcode * op,u32 pc)733 static void rec_special_DIV(const struct block *block,
734 const struct opcode *op, u32 pc)
735 {
736 _jit_name(block->_jit, __func__);
737 rec_alu_div(block, op, true);
738 }
739
rec_special_DIVU(const struct block * block,const struct opcode * op,u32 pc)740 static void rec_special_DIVU(const struct block *block,
741 const struct opcode *op, u32 pc)
742 {
743 _jit_name(block->_jit, __func__);
744 rec_alu_div(block, op, false);
745 }
746
rec_alu_mv_lo_hi(const struct block * block,u8 dst,u8 src)747 static void rec_alu_mv_lo_hi(const struct block *block, u8 dst, u8 src)
748 {
749 struct regcache *reg_cache = block->state->reg_cache;
750 jit_state_t *_jit = block->_jit;
751
752 jit_note(__FILE__, __LINE__);
753 src = lightrec_alloc_reg_in(reg_cache, _jit, src);
754 dst = lightrec_alloc_reg_out_ext(reg_cache, _jit, dst);
755
756 #if __WORDSIZE == 32
757 jit_movr(dst, src);
758 #else
759 jit_extr_i(dst, src);
760 #endif
761
762 lightrec_free_reg(reg_cache, src);
763 lightrec_free_reg(reg_cache, dst);
764 }
765
rec_special_MFHI(const struct block * block,const struct opcode * op,u32 pc)766 static void rec_special_MFHI(const struct block *block,
767 const struct opcode *op, u32 pc)
768 {
769 _jit_name(block->_jit, __func__);
770 rec_alu_mv_lo_hi(block, op->r.rd, REG_HI);
771 }
772
rec_special_MTHI(const struct block * block,const struct opcode * op,u32 pc)773 static void rec_special_MTHI(const struct block *block,
774 const struct opcode *op, u32 pc)
775 {
776 _jit_name(block->_jit, __func__);
777 rec_alu_mv_lo_hi(block, REG_HI, op->r.rs);
778 }
779
rec_special_MFLO(const struct block * block,const struct opcode * op,u32 pc)780 static void rec_special_MFLO(const struct block *block,
781 const struct opcode *op, u32 pc)
782 {
783 _jit_name(block->_jit, __func__);
784 rec_alu_mv_lo_hi(block, op->r.rd, REG_LO);
785 }
786
rec_special_MTLO(const struct block * block,const struct opcode * op,u32 pc)787 static void rec_special_MTLO(const struct block *block,
788 const struct opcode *op, u32 pc)
789 {
790 _jit_name(block->_jit, __func__);
791 rec_alu_mv_lo_hi(block, REG_LO, op->r.rs);
792 }
793
rec_io(const struct block * block,const struct opcode * op,bool load_rt,bool read_rt)794 static void rec_io(const struct block *block, const struct opcode *op,
795 bool load_rt, bool read_rt)
796 {
797 struct regcache *reg_cache = block->state->reg_cache;
798 jit_state_t *_jit = block->_jit;
799 bool is_tagged = op->flags & (LIGHTREC_HW_IO | LIGHTREC_DIRECT_IO);
800 u32 offset;
801 u8 tmp, tmp2, tmp3;
802
803 jit_note(__FILE__, __LINE__);
804
805 tmp = lightrec_alloc_reg(reg_cache, _jit, JIT_R0);
806
807 if (is_tagged) {
808 offset = offsetof(struct lightrec_state, rw_func);
809 } else {
810 tmp3 = lightrec_alloc_reg(reg_cache, _jit, JIT_R1);
811 offset = offsetof(struct lightrec_state, rw_generic_func);
812 }
813
814 tmp2 = lightrec_alloc_reg_temp(reg_cache, _jit);
815 jit_ldxi(tmp2, LIGHTREC_REG_STATE, offset);
816
817 lightrec_clean_reg_if_loaded(reg_cache, _jit, op->i.rs, false);
818
819 if (read_rt && likely(op->i.rt))
820 lightrec_clean_reg_if_loaded(reg_cache, _jit, op->i.rt, true);
821 else if (load_rt)
822 lightrec_clean_reg_if_loaded(reg_cache, _jit, op->i.rt, false);
823
824 if (is_tagged) {
825 jit_movi(tmp, op->opcode);
826 } else {
827 jit_movi(tmp, (uintptr_t)op);
828 jit_movi(tmp3, (uintptr_t)block);
829 }
830
831 jit_callr(tmp2);
832
833 lightrec_free_reg(reg_cache, tmp);
834 lightrec_free_reg(reg_cache, tmp2);
835 if (!is_tagged)
836 lightrec_free_reg(reg_cache, tmp3);
837 lightrec_regcache_mark_live(reg_cache, _jit);
838 }
839
rec_store_direct_no_invalidate(const struct block * block,const struct opcode * op,jit_code_t code)840 static void rec_store_direct_no_invalidate(const struct block *block,
841 const struct opcode *op,
842 jit_code_t code)
843 {
844 struct lightrec_state *state = block->state;
845 struct regcache *reg_cache = state->reg_cache;
846 jit_state_t *_jit = block->_jit;
847 jit_node_t *to_not_ram, *to_end;
848 u8 tmp, tmp2, rs, rt;
849 s16 imm;
850
851 jit_note(__FILE__, __LINE__);
852 rs = lightrec_alloc_reg_in(reg_cache, _jit, op->i.rs);
853 tmp = lightrec_alloc_reg_temp(reg_cache, _jit);
854 tmp2 = lightrec_alloc_reg_temp(reg_cache, _jit);
855
856 /* Convert to KUNSEG and avoid RAM mirrors */
857 if (state->mirrors_mapped) {
858 imm = (s16)op->i.imm;
859 jit_andi(tmp, rs, 0x1f800000 | (4 * RAM_SIZE - 1));
860 } else if (op->i.imm) {
861 imm = 0;
862 jit_addi(tmp, rs, (s16)op->i.imm);
863 jit_andi(tmp, tmp, 0x1f800000 | (RAM_SIZE - 1));
864 } else {
865 imm = 0;
866 jit_andi(tmp, rs, 0x1f800000 | (RAM_SIZE - 1));
867 }
868
869 lightrec_free_reg(reg_cache, rs);
870
871 if (state->offset_ram != state->offset_scratch) {
872 to_not_ram = jit_bmsi(tmp, BIT(28));
873
874 jit_movi(tmp2, state->offset_ram);
875
876 to_end = jit_jmpi();
877 jit_patch(to_not_ram);
878
879 jit_movi(tmp2, state->offset_scratch);
880 jit_patch(to_end);
881 } else if (state->offset_ram) {
882 jit_movi(tmp2, state->offset_ram);
883 }
884
885 if (state->offset_ram || state->offset_scratch)
886 jit_addr(tmp, tmp, tmp2);
887
888 lightrec_free_reg(reg_cache, tmp2);
889
890 rt = lightrec_alloc_reg_in(reg_cache, _jit, op->i.rt);
891 jit_new_node_www(code, imm, tmp, rt);
892
893 lightrec_free_reg(reg_cache, rt);
894 lightrec_free_reg(reg_cache, tmp);
895 }
896
rec_store_direct(const struct block * block,const struct opcode * op,jit_code_t code)897 static void rec_store_direct(const struct block *block, const struct opcode *op,
898 jit_code_t code)
899 {
900 struct lightrec_state *state = block->state;
901 struct regcache *reg_cache = state->reg_cache;
902 jit_state_t *_jit = block->_jit;
903 jit_node_t *to_not_ram, *to_end;
904 u8 tmp, tmp2, tmp3, rs, rt;
905
906 jit_note(__FILE__, __LINE__);
907
908 rs = lightrec_alloc_reg_in(reg_cache, _jit, op->i.rs);
909 tmp2 = lightrec_alloc_reg_temp(reg_cache, _jit);
910 tmp3 = lightrec_alloc_reg_in(reg_cache, _jit, 0);
911
912 /* Convert to KUNSEG and avoid RAM mirrors */
913 if (op->i.imm) {
914 jit_addi(tmp2, rs, (s16)op->i.imm);
915 jit_andi(tmp2, tmp2, 0x1f800000 | (RAM_SIZE - 1));
916 } else {
917 jit_andi(tmp2, rs, 0x1f800000 | (RAM_SIZE - 1));
918 }
919
920 lightrec_free_reg(reg_cache, rs);
921 tmp = lightrec_alloc_reg_temp(reg_cache, _jit);
922
923 to_not_ram = jit_bgti(tmp2, RAM_SIZE);
924
925 /* Compute the offset to the code LUT */
926 jit_andi(tmp, tmp2, (RAM_SIZE - 1) & ~3);
927 #if __WORDSIZE == 64
928 jit_lshi(tmp, tmp, 1);
929 #endif
930 jit_addr(tmp, LIGHTREC_REG_STATE, tmp);
931
932 /* Write NULL to the code LUT to invalidate any block that's there */
933 jit_stxi(offsetof(struct lightrec_state, code_lut), tmp, tmp3);
934
935 if (state->offset_ram != state->offset_scratch) {
936 jit_movi(tmp, state->offset_ram);
937
938 to_end = jit_jmpi();
939 }
940
941 jit_patch(to_not_ram);
942
943 if (state->offset_ram || state->offset_scratch)
944 jit_movi(tmp, state->offset_scratch);
945
946 if (state->offset_ram != state->offset_scratch)
947 jit_patch(to_end);
948
949 if (state->offset_ram || state->offset_scratch)
950 jit_addr(tmp2, tmp2, tmp);
951
952 lightrec_free_reg(reg_cache, tmp);
953 lightrec_free_reg(reg_cache, tmp3);
954
955 rt = lightrec_alloc_reg_in(reg_cache, _jit, op->i.rt);
956 jit_new_node_www(code, 0, tmp2, rt);
957
958 lightrec_free_reg(reg_cache, rt);
959 lightrec_free_reg(reg_cache, tmp2);
960 }
961
rec_store(const struct block * block,const struct opcode * op,jit_code_t code)962 static void rec_store(const struct block *block, const struct opcode *op,
963 jit_code_t code)
964 {
965 if (op->flags & LIGHTREC_NO_INVALIDATE) {
966 rec_store_direct_no_invalidate(block, op, code);
967 } else if (op->flags & LIGHTREC_DIRECT_IO) {
968 if (block->state->invalidate_from_dma_only)
969 rec_store_direct_no_invalidate(block, op, code);
970 else
971 rec_store_direct(block, op, code);
972 } else {
973 rec_io(block, op, true, false);
974 }
975 }
976
rec_SB(const struct block * block,const struct opcode * op,u32 pc)977 static void rec_SB(const struct block *block, const struct opcode *op, u32 pc)
978 {
979 _jit_name(block->_jit, __func__);
980 rec_store(block, op, jit_code_stxi_c);
981 }
982
rec_SH(const struct block * block,const struct opcode * op,u32 pc)983 static void rec_SH(const struct block *block, const struct opcode *op, u32 pc)
984 {
985 _jit_name(block->_jit, __func__);
986 rec_store(block, op, jit_code_stxi_s);
987 }
988
rec_SW(const struct block * block,const struct opcode * op,u32 pc)989 static void rec_SW(const struct block *block, const struct opcode *op, u32 pc)
990 {
991 _jit_name(block->_jit, __func__);
992 rec_store(block, op, jit_code_stxi_i);
993 }
994
rec_SWL(const struct block * block,const struct opcode * op,u32 pc)995 static void rec_SWL(const struct block *block, const struct opcode *op, u32 pc)
996 {
997 _jit_name(block->_jit, __func__);
998 rec_io(block, op, true, false);
999 }
1000
rec_SWR(const struct block * block,const struct opcode * op,u32 pc)1001 static void rec_SWR(const struct block *block, const struct opcode *op, u32 pc)
1002 {
1003 _jit_name(block->_jit, __func__);
1004 rec_io(block, op, true, false);
1005 }
1006
rec_SWC2(const struct block * block,const struct opcode * op,u32 pc)1007 static void rec_SWC2(const struct block *block, const struct opcode *op, u32 pc)
1008 {
1009 _jit_name(block->_jit, __func__);
1010 rec_io(block, op, false, false);
1011 }
1012
rec_load_direct(const struct block * block,const struct opcode * op,jit_code_t code)1013 static void rec_load_direct(const struct block *block, const struct opcode *op,
1014 jit_code_t code)
1015 {
1016 struct lightrec_state *state = block->state;
1017 struct regcache *reg_cache = state->reg_cache;
1018 jit_state_t *_jit = block->_jit;
1019 jit_node_t *to_not_ram, *to_not_bios, *to_end, *to_end2;
1020 u8 tmp, rs, rt, addr_reg;
1021 s16 imm;
1022
1023 if (!op->i.rt)
1024 return;
1025
1026 jit_note(__FILE__, __LINE__);
1027 rs = lightrec_alloc_reg_in(reg_cache, _jit, op->i.rs);
1028 rt = lightrec_alloc_reg_out_ext(reg_cache, _jit, op->i.rt);
1029
1030 if ((state->offset_ram == state->offset_bios &&
1031 state->offset_ram == state->offset_scratch &&
1032 state->mirrors_mapped) || !op->i.imm) {
1033 addr_reg = rs;
1034 imm = (s16)op->i.imm;
1035 } else {
1036 jit_addi(rt, rs, (s16)op->i.imm);
1037 addr_reg = rt;
1038 imm = 0;
1039
1040 if (op->i.rs != op->i.rt)
1041 lightrec_free_reg(reg_cache, rs);
1042 }
1043
1044 tmp = lightrec_alloc_reg_temp(reg_cache, _jit);
1045
1046 if (state->offset_ram == state->offset_bios &&
1047 state->offset_ram == state->offset_scratch) {
1048 if (!state->mirrors_mapped) {
1049 jit_andi(tmp, addr_reg, BIT(28));
1050 jit_rshi_u(tmp, tmp, 28 - 22);
1051 jit_ori(tmp, tmp, 0x1f800000 | (RAM_SIZE - 1));
1052 jit_andr(rt, addr_reg, tmp);
1053 } else {
1054 jit_andi(rt, addr_reg, 0x1fffffff);
1055 }
1056
1057 if (state->offset_ram)
1058 jit_movi(tmp, state->offset_ram);
1059 } else {
1060 to_not_ram = jit_bmsi(addr_reg, BIT(28));
1061
1062 /* Convert to KUNSEG and avoid RAM mirrors */
1063 jit_andi(rt, addr_reg, RAM_SIZE - 1);
1064
1065 if (state->offset_ram)
1066 jit_movi(tmp, state->offset_ram);
1067
1068 to_end = jit_jmpi();
1069
1070 jit_patch(to_not_ram);
1071
1072 if (state->offset_bios != state->offset_scratch)
1073 to_not_bios = jit_bmci(addr_reg, BIT(22));
1074
1075 /* Convert to KUNSEG */
1076 jit_andi(rt, addr_reg, 0x1fc00000 | (BIOS_SIZE - 1));
1077
1078 jit_movi(tmp, state->offset_bios);
1079
1080 if (state->offset_bios != state->offset_scratch) {
1081 to_end2 = jit_jmpi();
1082
1083 jit_patch(to_not_bios);
1084
1085 /* Convert to KUNSEG */
1086 jit_andi(rt, addr_reg, 0x1f800fff);
1087
1088 if (state->offset_scratch)
1089 jit_movi(tmp, state->offset_scratch);
1090
1091 jit_patch(to_end2);
1092 }
1093
1094 jit_patch(to_end);
1095 }
1096
1097 if (state->offset_ram || state->offset_bios || state->offset_scratch)
1098 jit_addr(rt, rt, tmp);
1099
1100 jit_new_node_www(code, rt, rt, imm);
1101
1102 lightrec_free_reg(reg_cache, addr_reg);
1103 lightrec_free_reg(reg_cache, rt);
1104 lightrec_free_reg(reg_cache, tmp);
1105 }
1106
rec_load(const struct block * block,const struct opcode * op,jit_code_t code)1107 static void rec_load(const struct block *block, const struct opcode *op,
1108 jit_code_t code)
1109 {
1110 if (op->flags & LIGHTREC_DIRECT_IO)
1111 rec_load_direct(block, op, code);
1112 else
1113 rec_io(block, op, false, true);
1114 }
1115
rec_LB(const struct block * block,const struct opcode * op,u32 pc)1116 static void rec_LB(const struct block *block, const struct opcode *op, u32 pc)
1117 {
1118 _jit_name(block->_jit, __func__);
1119 rec_load(block, op, jit_code_ldxi_c);
1120 }
1121
rec_LBU(const struct block * block,const struct opcode * op,u32 pc)1122 static void rec_LBU(const struct block *block, const struct opcode *op, u32 pc)
1123 {
1124 _jit_name(block->_jit, __func__);
1125 rec_load(block, op, jit_code_ldxi_uc);
1126 }
1127
rec_LH(const struct block * block,const struct opcode * op,u32 pc)1128 static void rec_LH(const struct block *block, const struct opcode *op, u32 pc)
1129 {
1130 _jit_name(block->_jit, __func__);
1131 rec_load(block, op, jit_code_ldxi_s);
1132 }
1133
rec_LHU(const struct block * block,const struct opcode * op,u32 pc)1134 static void rec_LHU(const struct block *block, const struct opcode *op, u32 pc)
1135 {
1136 _jit_name(block->_jit, __func__);
1137 rec_load(block, op, jit_code_ldxi_us);
1138 }
1139
rec_LWL(const struct block * block,const struct opcode * op,u32 pc)1140 static void rec_LWL(const struct block *block, const struct opcode *op, u32 pc)
1141 {
1142 _jit_name(block->_jit, __func__);
1143 rec_io(block, op, true, true);
1144 }
1145
rec_LWR(const struct block * block,const struct opcode * op,u32 pc)1146 static void rec_LWR(const struct block *block, const struct opcode *op, u32 pc)
1147 {
1148 _jit_name(block->_jit, __func__);
1149 rec_io(block, op, true, true);
1150 }
1151
rec_LW(const struct block * block,const struct opcode * op,u32 pc)1152 static void rec_LW(const struct block *block, const struct opcode *op, u32 pc)
1153 {
1154 _jit_name(block->_jit, __func__);
1155 rec_load(block, op, jit_code_ldxi_i);
1156 }
1157
rec_LWC2(const struct block * block,const struct opcode * op,u32 pc)1158 static void rec_LWC2(const struct block *block, const struct opcode *op, u32 pc)
1159 {
1160 _jit_name(block->_jit, __func__);
1161 rec_io(block, op, false, false);
1162 }
1163
rec_break_syscall(const struct block * block,const struct opcode * op,u32 pc,bool is_break)1164 static void rec_break_syscall(const struct block *block,
1165 const struct opcode *op, u32 pc, bool is_break)
1166 {
1167 struct regcache *reg_cache = block->state->reg_cache;
1168 jit_state_t *_jit = block->_jit;
1169 u32 offset;
1170 u8 tmp;
1171
1172 jit_note(__FILE__, __LINE__);
1173
1174 if (is_break)
1175 offset = offsetof(struct lightrec_state, break_func);
1176 else
1177 offset = offsetof(struct lightrec_state, syscall_func);
1178
1179 tmp = lightrec_alloc_reg_temp(reg_cache, _jit);
1180 jit_ldxi(tmp, LIGHTREC_REG_STATE, offset);
1181 jit_callr(tmp);
1182 lightrec_free_reg(reg_cache, tmp);
1183
1184 lightrec_regcache_mark_live(reg_cache, _jit);
1185
1186 /* TODO: the return address should be "pc - 4" if we're a delay slot */
1187 lightrec_emit_end_of_block(block, op, pc, -1, pc, 31, 0, true);
1188 }
1189
rec_special_SYSCALL(const struct block * block,const struct opcode * op,u32 pc)1190 static void rec_special_SYSCALL(const struct block *block,
1191 const struct opcode *op, u32 pc)
1192 {
1193 _jit_name(block->_jit, __func__);
1194 rec_break_syscall(block, op, pc, false);
1195 }
1196
rec_special_BREAK(const struct block * block,const struct opcode * op,u32 pc)1197 static void rec_special_BREAK(const struct block *block,
1198 const struct opcode *op, u32 pc)
1199 {
1200 _jit_name(block->_jit, __func__);
1201 rec_break_syscall(block, op, pc, true);
1202 }
1203
rec_mfc(const struct block * block,const struct opcode * op)1204 static void rec_mfc(const struct block *block, const struct opcode *op)
1205 {
1206 u8 tmp, tmp2;
1207 struct lightrec_state *state = block->state;
1208 struct regcache *reg_cache = state->reg_cache;
1209 jit_state_t *_jit = block->_jit;
1210
1211 jit_note(__FILE__, __LINE__);
1212
1213 tmp = lightrec_alloc_reg(reg_cache, _jit, JIT_R0);
1214 tmp2 = lightrec_alloc_reg_temp(reg_cache, _jit);
1215
1216 jit_ldxi(tmp2, LIGHTREC_REG_STATE,
1217 offsetof(struct lightrec_state, mfc_func));
1218
1219 lightrec_clean_reg_if_loaded(reg_cache, _jit, op->i.rt, true);
1220
1221 jit_movi(tmp, op->opcode);
1222 jit_callr(tmp2);
1223 lightrec_free_reg(reg_cache, tmp);
1224 lightrec_free_reg(reg_cache, tmp2);
1225
1226 lightrec_regcache_mark_live(reg_cache, _jit);
1227 }
1228
rec_mtc(const struct block * block,const struct opcode * op,u32 pc)1229 static void rec_mtc(const struct block *block, const struct opcode *op, u32 pc)
1230 {
1231 struct lightrec_state *state = block->state;
1232 struct regcache *reg_cache = state->reg_cache;
1233 jit_state_t *_jit = block->_jit;
1234 u8 tmp, tmp2;
1235
1236 jit_note(__FILE__, __LINE__);
1237
1238 tmp = lightrec_alloc_reg(reg_cache, _jit, JIT_R0);
1239 tmp2 = lightrec_alloc_reg_temp(reg_cache, _jit);
1240 jit_ldxi(tmp2, LIGHTREC_REG_STATE,
1241 offsetof(struct lightrec_state, mtc_func));
1242
1243 lightrec_clean_reg_if_loaded(reg_cache, _jit, op->i.rs, false);
1244 lightrec_clean_reg_if_loaded(reg_cache, _jit, op->i.rt, false);
1245
1246 jit_movi(tmp, op->opcode);
1247 jit_callr(tmp2);
1248 lightrec_free_reg(reg_cache, tmp);
1249 lightrec_free_reg(reg_cache, tmp2);
1250
1251 lightrec_regcache_mark_live(reg_cache, _jit);
1252
1253 if (op->i.op == OP_CP0 && !(op->flags & LIGHTREC_NO_DS) &&
1254 (op->r.rd == 12 || op->r.rd == 13))
1255 lightrec_emit_end_of_block(block, op, pc, -1, pc + 4, 0, 0, true);
1256 }
1257
rec_cp0_MFC0(const struct block * block,const struct opcode * op,u32 pc)1258 static void rec_cp0_MFC0(const struct block *block,
1259 const struct opcode *op, u32 pc)
1260 {
1261 _jit_name(block->_jit, __func__);
1262 rec_mfc(block, op);
1263 }
1264
rec_cp0_CFC0(const struct block * block,const struct opcode * op,u32 pc)1265 static void rec_cp0_CFC0(const struct block *block,
1266 const struct opcode *op, u32 pc)
1267 {
1268 _jit_name(block->_jit, __func__);
1269 rec_mfc(block, op);
1270 }
1271
rec_cp0_MTC0(const struct block * block,const struct opcode * op,u32 pc)1272 static void rec_cp0_MTC0(const struct block *block,
1273 const struct opcode *op, u32 pc)
1274 {
1275 _jit_name(block->_jit, __func__);
1276 rec_mtc(block, op, pc);
1277 }
1278
rec_cp0_CTC0(const struct block * block,const struct opcode * op,u32 pc)1279 static void rec_cp0_CTC0(const struct block *block,
1280 const struct opcode *op, u32 pc)
1281 {
1282 _jit_name(block->_jit, __func__);
1283 rec_mtc(block, op, pc);
1284 }
1285
rec_cp2_basic_MFC2(const struct block * block,const struct opcode * op,u32 pc)1286 static void rec_cp2_basic_MFC2(const struct block *block,
1287 const struct opcode *op, u32 pc)
1288 {
1289 _jit_name(block->_jit, __func__);
1290 rec_mfc(block, op);
1291 }
1292
rec_cp2_basic_CFC2(const struct block * block,const struct opcode * op,u32 pc)1293 static void rec_cp2_basic_CFC2(const struct block *block,
1294 const struct opcode *op, u32 pc)
1295 {
1296 _jit_name(block->_jit, __func__);
1297 rec_mfc(block, op);
1298 }
1299
rec_cp2_basic_MTC2(const struct block * block,const struct opcode * op,u32 pc)1300 static void rec_cp2_basic_MTC2(const struct block *block,
1301 const struct opcode *op, u32 pc)
1302 {
1303 _jit_name(block->_jit, __func__);
1304 rec_mtc(block, op, pc);
1305 }
1306
rec_cp2_basic_CTC2(const struct block * block,const struct opcode * op,u32 pc)1307 static void rec_cp2_basic_CTC2(const struct block *block,
1308 const struct opcode *op, u32 pc)
1309 {
1310 _jit_name(block->_jit, __func__);
1311 rec_mtc(block, op, pc);
1312 }
1313
rec_cp0_RFE(const struct block * block,const struct opcode * op,u32 pc)1314 static void rec_cp0_RFE(const struct block *block,
1315 const struct opcode *op, u32 pc)
1316 {
1317 struct lightrec_state *state = block->state;
1318 jit_state_t *_jit = block->_jit;
1319 u8 tmp;
1320
1321 jit_name(__func__);
1322 jit_note(__FILE__, __LINE__);
1323
1324 tmp = lightrec_alloc_reg_temp(state->reg_cache, _jit);
1325 jit_ldxi(tmp, LIGHTREC_REG_STATE,
1326 offsetof(struct lightrec_state, rfe_func));
1327 jit_callr(tmp);
1328 lightrec_free_reg(state->reg_cache, tmp);
1329
1330 lightrec_regcache_mark_live(state->reg_cache, _jit);
1331 }
1332
rec_CP(const struct block * block,const struct opcode * op,u32 pc)1333 static void rec_CP(const struct block *block, const struct opcode *op, u32 pc)
1334 {
1335 struct regcache *reg_cache = block->state->reg_cache;
1336 jit_state_t *_jit = block->_jit;
1337 u8 tmp, tmp2;
1338
1339 jit_name(__func__);
1340 jit_note(__FILE__, __LINE__);
1341
1342 tmp = lightrec_alloc_reg(reg_cache, _jit, JIT_R0);
1343 tmp2 = lightrec_alloc_reg_temp(reg_cache, _jit);
1344
1345 jit_ldxi(tmp2, LIGHTREC_REG_STATE,
1346 offsetof(struct lightrec_state, cp_func));
1347
1348 jit_movi(tmp, op->opcode);
1349 jit_callr(tmp2);
1350 lightrec_free_reg(reg_cache, tmp);
1351 lightrec_free_reg(reg_cache, tmp2);
1352
1353 lightrec_regcache_mark_live(reg_cache, _jit);
1354 }
1355
rec_meta_unload(const struct block * block,const struct opcode * op,u32 pc)1356 static void rec_meta_unload(const struct block *block,
1357 const struct opcode *op, u32 pc)
1358 {
1359 struct lightrec_state *state = block->state;
1360 struct regcache *reg_cache = state->reg_cache;
1361 jit_state_t *_jit = block->_jit;
1362
1363 jit_name(__func__);
1364 jit_note(__FILE__, __LINE__);
1365
1366 pr_debug("Unloading reg %s\n", lightrec_reg_name(op->i.rs));
1367 lightrec_clean_reg_if_loaded(reg_cache, _jit, op->i.rs, true);
1368 }
1369
rec_meta_BEQZ(const struct block * block,const struct opcode * op,u32 pc)1370 static void rec_meta_BEQZ(const struct block *block,
1371 const struct opcode *op, u32 pc)
1372 {
1373 _jit_name(block->_jit, __func__);
1374 rec_b(block, op, pc, jit_code_bnei, 0, false, true);
1375 }
1376
rec_meta_BNEZ(const struct block * block,const struct opcode * op,u32 pc)1377 static void rec_meta_BNEZ(const struct block *block,
1378 const struct opcode *op, u32 pc)
1379 {
1380 _jit_name(block->_jit, __func__);
1381 rec_b(block, op, pc, jit_code_beqi, 0, false, true);
1382 }
1383
rec_meta_MOV(const struct block * block,const struct opcode * op,u32 pc)1384 static void rec_meta_MOV(const struct block *block,
1385 const struct opcode *op, u32 pc)
1386 {
1387 struct lightrec_state *state = block->state;
1388 struct regcache *reg_cache = state->reg_cache;
1389 jit_state_t *_jit = block->_jit;
1390 u8 rs, rd;
1391
1392 _jit_name(block->_jit, __func__);
1393 jit_note(__FILE__, __LINE__);
1394 rs = op->r.rs ? lightrec_alloc_reg_in(reg_cache, _jit, op->r.rs) : 0;
1395 rd = lightrec_alloc_reg_out_ext(reg_cache, _jit, op->r.rd);
1396
1397 if (op->r.rs == 0) {
1398 jit_movi(rd, 0);
1399 } else {
1400 #if __WORDSIZE == 32
1401 jit_movr(rd, rs);
1402 #else
1403 jit_extr_i(rd, rs);
1404 #endif
1405 }
1406
1407 lightrec_free_reg(state->reg_cache, rs);
1408 lightrec_free_reg(state->reg_cache, rd);
1409 }
1410
rec_meta_sync(const struct block * block,const struct opcode * op,u32 pc)1411 static void rec_meta_sync(const struct block *block,
1412 const struct opcode *op, u32 pc)
1413 {
1414 struct lightrec_state *state = block->state;
1415 struct lightrec_branch_target *target;
1416 jit_state_t *_jit = block->_jit;
1417
1418 jit_name(__func__);
1419 jit_note(__FILE__, __LINE__);
1420
1421 jit_subi(LIGHTREC_REG_CYCLE, LIGHTREC_REG_CYCLE, state->cycles);
1422 state->cycles = 0;
1423
1424 lightrec_storeback_regs(state->reg_cache, _jit);
1425 lightrec_regcache_reset(state->reg_cache);
1426
1427 pr_debug("Adding branch target at offset 0x%x\n",
1428 op->offset << 2);
1429 target = &state->targets[state->nb_targets++];
1430 target->offset = op->offset;
1431 target->label = jit_indirect();
1432 }
1433
1434 static const lightrec_rec_func_t rec_standard[64] = {
1435 [OP_SPECIAL] = rec_SPECIAL,
1436 [OP_REGIMM] = rec_REGIMM,
1437 [OP_J] = rec_J,
1438 [OP_JAL] = rec_JAL,
1439 [OP_BEQ] = rec_BEQ,
1440 [OP_BNE] = rec_BNE,
1441 [OP_BLEZ] = rec_BLEZ,
1442 [OP_BGTZ] = rec_BGTZ,
1443 [OP_ADDI] = rec_ADDI,
1444 [OP_ADDIU] = rec_ADDIU,
1445 [OP_SLTI] = rec_SLTI,
1446 [OP_SLTIU] = rec_SLTIU,
1447 [OP_ANDI] = rec_ANDI,
1448 [OP_ORI] = rec_ORI,
1449 [OP_XORI] = rec_XORI,
1450 [OP_LUI] = rec_LUI,
1451 [OP_CP0] = rec_CP0,
1452 [OP_CP2] = rec_CP2,
1453 [OP_LB] = rec_LB,
1454 [OP_LH] = rec_LH,
1455 [OP_LWL] = rec_LWL,
1456 [OP_LW] = rec_LW,
1457 [OP_LBU] = rec_LBU,
1458 [OP_LHU] = rec_LHU,
1459 [OP_LWR] = rec_LWR,
1460 [OP_SB] = rec_SB,
1461 [OP_SH] = rec_SH,
1462 [OP_SWL] = rec_SWL,
1463 [OP_SW] = rec_SW,
1464 [OP_SWR] = rec_SWR,
1465 [OP_LWC2] = rec_LWC2,
1466 [OP_SWC2] = rec_SWC2,
1467
1468 [OP_META_REG_UNLOAD] = rec_meta_unload,
1469 [OP_META_BEQZ] = rec_meta_BEQZ,
1470 [OP_META_BNEZ] = rec_meta_BNEZ,
1471 [OP_META_MOV] = rec_meta_MOV,
1472 [OP_META_SYNC] = rec_meta_sync,
1473 };
1474
1475 static const lightrec_rec_func_t rec_special[64] = {
1476 [OP_SPECIAL_SLL] = rec_special_SLL,
1477 [OP_SPECIAL_SRL] = rec_special_SRL,
1478 [OP_SPECIAL_SRA] = rec_special_SRA,
1479 [OP_SPECIAL_SLLV] = rec_special_SLLV,
1480 [OP_SPECIAL_SRLV] = rec_special_SRLV,
1481 [OP_SPECIAL_SRAV] = rec_special_SRAV,
1482 [OP_SPECIAL_JR] = rec_special_JR,
1483 [OP_SPECIAL_JALR] = rec_special_JALR,
1484 [OP_SPECIAL_SYSCALL] = rec_special_SYSCALL,
1485 [OP_SPECIAL_BREAK] = rec_special_BREAK,
1486 [OP_SPECIAL_MFHI] = rec_special_MFHI,
1487 [OP_SPECIAL_MTHI] = rec_special_MTHI,
1488 [OP_SPECIAL_MFLO] = rec_special_MFLO,
1489 [OP_SPECIAL_MTLO] = rec_special_MTLO,
1490 [OP_SPECIAL_MULT] = rec_special_MULT,
1491 [OP_SPECIAL_MULTU] = rec_special_MULTU,
1492 [OP_SPECIAL_DIV] = rec_special_DIV,
1493 [OP_SPECIAL_DIVU] = rec_special_DIVU,
1494 [OP_SPECIAL_ADD] = rec_special_ADD,
1495 [OP_SPECIAL_ADDU] = rec_special_ADDU,
1496 [OP_SPECIAL_SUB] = rec_special_SUB,
1497 [OP_SPECIAL_SUBU] = rec_special_SUBU,
1498 [OP_SPECIAL_AND] = rec_special_AND,
1499 [OP_SPECIAL_OR] = rec_special_OR,
1500 [OP_SPECIAL_XOR] = rec_special_XOR,
1501 [OP_SPECIAL_NOR] = rec_special_NOR,
1502 [OP_SPECIAL_SLT] = rec_special_SLT,
1503 [OP_SPECIAL_SLTU] = rec_special_SLTU,
1504 };
1505
1506 static const lightrec_rec_func_t rec_regimm[64] = {
1507 [OP_REGIMM_BLTZ] = rec_regimm_BLTZ,
1508 [OP_REGIMM_BGEZ] = rec_regimm_BGEZ,
1509 [OP_REGIMM_BLTZAL] = rec_regimm_BLTZAL,
1510 [OP_REGIMM_BGEZAL] = rec_regimm_BGEZAL,
1511 };
1512
1513 static const lightrec_rec_func_t rec_cp0[64] = {
1514 [OP_CP0_MFC0] = rec_cp0_MFC0,
1515 [OP_CP0_CFC0] = rec_cp0_CFC0,
1516 [OP_CP0_MTC0] = rec_cp0_MTC0,
1517 [OP_CP0_CTC0] = rec_cp0_CTC0,
1518 [OP_CP0_RFE] = rec_cp0_RFE,
1519 };
1520
1521 static const lightrec_rec_func_t rec_cp2_basic[64] = {
1522 [OP_CP2_BASIC_MFC2] = rec_cp2_basic_MFC2,
1523 [OP_CP2_BASIC_CFC2] = rec_cp2_basic_CFC2,
1524 [OP_CP2_BASIC_MTC2] = rec_cp2_basic_MTC2,
1525 [OP_CP2_BASIC_CTC2] = rec_cp2_basic_CTC2,
1526 };
1527
rec_SPECIAL(const struct block * block,const struct opcode * op,u32 pc)1528 static void rec_SPECIAL(const struct block *block,
1529 const struct opcode *op, u32 pc)
1530 {
1531 lightrec_rec_func_t f = rec_special[op->r.op];
1532 if (likely(f))
1533 (*f)(block, op, pc);
1534 else
1535 unknown_opcode(block, op, pc);
1536 }
1537
rec_REGIMM(const struct block * block,const struct opcode * op,u32 pc)1538 static void rec_REGIMM(const struct block *block,
1539 const struct opcode *op, u32 pc)
1540 {
1541 lightrec_rec_func_t f = rec_regimm[op->r.rt];
1542 if (likely(f))
1543 (*f)(block, op, pc);
1544 else
1545 unknown_opcode(block, op, pc);
1546 }
1547
rec_CP0(const struct block * block,const struct opcode * op,u32 pc)1548 static void rec_CP0(const struct block *block, const struct opcode *op, u32 pc)
1549 {
1550 lightrec_rec_func_t f = rec_cp0[op->r.rs];
1551 if (likely(f))
1552 (*f)(block, op, pc);
1553 else
1554 rec_CP(block, op, pc);
1555 }
1556
rec_CP2(const struct block * block,const struct opcode * op,u32 pc)1557 static void rec_CP2(const struct block *block, const struct opcode *op, u32 pc)
1558 {
1559 if (op->r.op == OP_CP2_BASIC) {
1560 lightrec_rec_func_t f = rec_cp2_basic[op->r.rs];
1561 if (likely(f)) {
1562 (*f)(block, op, pc);
1563 return;
1564 }
1565 }
1566
1567 rec_CP(block, op, pc);
1568 }
1569
lightrec_rec_opcode(const struct block * block,const struct opcode * op,u32 pc)1570 void lightrec_rec_opcode(const struct block *block,
1571 const struct opcode *op, u32 pc)
1572 {
1573 lightrec_rec_func_t f = rec_standard[op->i.op];
1574 if (likely(f))
1575 (*f)(block, op, pc);
1576 else
1577 unknown_opcode(block, op, pc);
1578 }
1579