From d16005f843cd28ae90f091bd4e39a90b355e1d45 Mon Sep 17 00:00:00 2001 From: Paul Cercueil Date: Thu, 30 Jan 2020 12:34:17 -0300 Subject: git subrepo clone https://github.com/pcercuei/lightrec.git deps/lightrec subrepo: subdir: "deps/lightrec" merged: "6c69e10" upstream: origin: "https://github.com/pcercuei/lightrec.git" branch: "master" commit: "6c69e10" git-subrepo: version: "0.4.1" origin: "https://github.com/ingydotnet/git-subrepo.git" commit: "a04d8c2" --- deps/lightrec/emitter.c | 1577 +++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 1577 insertions(+) create mode 100644 deps/lightrec/emitter.c (limited to 'deps/lightrec/emitter.c') diff --git a/deps/lightrec/emitter.c b/deps/lightrec/emitter.c new file mode 100644 index 0000000..b09dc94 --- /dev/null +++ b/deps/lightrec/emitter.c @@ -0,0 +1,1577 @@ +/* + * Copyright (C) 2014-2020 Paul Cercueil + * + * This library is free software; you can redistribute it and/or + * modify it under the terms of the GNU Lesser General Public + * License as published by the Free Software Foundation; either + * version 2.1 of the License, or (at your option) any later version. + * + * This library is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU + * Lesser General Public License for more details. + */ + +#include "blockcache.h" +#include "debug.h" +#include "disassembler.h" +#include "emitter.h" +#include "optimizer.h" +#include "regcache.h" + +#include +#include +#include + +typedef void (*lightrec_rec_func_t)(const struct block *, + const struct opcode *, u32); + +/* Forward declarations */ +static void rec_SPECIAL(const struct block *block, + const struct opcode *op, u32 pc); +static void rec_REGIMM(const struct block *block, + const struct opcode *op, u32 pc); +static void rec_CP0(const struct block *block, const struct opcode *op, u32 pc); +static void rec_CP2(const struct block *block, const struct opcode *op, u32 pc); + + +static void unknown_opcode(const struct block *block, + const struct opcode *op, u32 pc) +{ + pr_warn("Unknown opcode: 0x%08x at PC 0x%08x\n", op->opcode, pc); +} + +static void lightrec_emit_end_of_block(const struct block *block, + const struct opcode *op, u32 pc, + s8 reg_new_pc, u32 imm, u8 ra_reg, + u32 link, bool update_cycles) +{ + struct lightrec_state *state = block->state; + struct regcache *reg_cache = state->reg_cache; + u32 cycles = state->cycles; + jit_state_t *_jit = block->_jit; + + jit_note(__FILE__, __LINE__); + + if (link) { + /* Update the $ra register */ + u8 link_reg = lightrec_alloc_reg_out(reg_cache, _jit, ra_reg); + jit_movi(link_reg, link); + lightrec_free_reg(reg_cache, link_reg); + } + + if (reg_new_pc < 0) { + reg_new_pc = lightrec_alloc_reg(reg_cache, _jit, JIT_V0); + lightrec_lock_reg(reg_cache, _jit, reg_new_pc); + + jit_movi(reg_new_pc, imm); + } + + if (has_delay_slot(op->c) && + !(op->flags & (LIGHTREC_NO_DS | LIGHTREC_LOCAL_BRANCH))) { + cycles += lightrec_cycles_of_opcode(op->next->c); + + /* Recompile the delay slot */ + if (op->next->c.opcode) + lightrec_rec_opcode(block, op->next, pc + 4); + } + + /* Store back remaining registers */ + lightrec_storeback_regs(reg_cache, _jit); + + jit_movr(JIT_V0, reg_new_pc); + + if (cycles && update_cycles) { + jit_subi(LIGHTREC_REG_CYCLE, LIGHTREC_REG_CYCLE, cycles); + pr_debug("EOB: %u cycles\n", cycles); + } + + if (op->next && ((op->flags & LIGHTREC_NO_DS) || op->next->next)) + state->branches[state->nb_branches++] = jit_jmpi(); +} + +void lightrec_emit_eob(const struct block *block, + const struct opcode *op, u32 pc) +{ + struct lightrec_state *state = block->state; + struct regcache *reg_cache = state->reg_cache; + jit_state_t *_jit = block->_jit; + + lightrec_storeback_regs(reg_cache, _jit); + + jit_movi(JIT_V0, pc); + jit_subi(LIGHTREC_REG_CYCLE, LIGHTREC_REG_CYCLE, + state->cycles - lightrec_cycles_of_opcode(op->c)); + + state->branches[state->nb_branches++] = jit_jmpi(); +} + +static void rec_special_JR(const struct block *block, + const struct opcode *op, u32 pc) +{ + struct regcache *reg_cache = block->state->reg_cache; + jit_state_t *_jit = block->_jit; + u8 rs = lightrec_request_reg_in(reg_cache, _jit, op->r.rs, JIT_V0); + + _jit_name(block->_jit, __func__); + lightrec_lock_reg(reg_cache, _jit, rs); + lightrec_emit_end_of_block(block, op, pc, rs, 0, 31, 0, true); +} + +static void rec_special_JALR(const struct block *block, + const struct opcode *op, u32 pc) +{ + struct regcache *reg_cache = block->state->reg_cache; + jit_state_t *_jit = block->_jit; + u8 rs = lightrec_request_reg_in(reg_cache, _jit, op->r.rs, JIT_V0); + + _jit_name(block->_jit, __func__); + lightrec_lock_reg(reg_cache, _jit, rs); + lightrec_emit_end_of_block(block, op, pc, rs, 0, op->r.rd, pc + 8, true); +} + +static void rec_J(const struct block *block, const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + lightrec_emit_end_of_block(block, op, pc, -1, + (pc & 0xf0000000) | (op->j.imm << 2), 31, 0, true); +} + +static void rec_JAL(const struct block *block, const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + lightrec_emit_end_of_block(block, op, pc, -1, + (pc & 0xf0000000) | (op->j.imm << 2), + 31, pc + 8, true); +} + +static void rec_b(const struct block *block, const struct opcode *op, u32 pc, + jit_code_t code, u32 link, bool unconditional, bool bz) +{ + struct regcache *reg_cache = block->state->reg_cache; + struct native_register *regs_backup; + jit_state_t *_jit = block->_jit; + struct lightrec_branch *branch; + jit_node_t *addr; + u8 link_reg; + u32 offset, cycles = block->state->cycles; + bool is_forward = (s16)op->i.imm >= -1; + + jit_note(__FILE__, __LINE__); + + if (!(op->flags & LIGHTREC_NO_DS)) + cycles += lightrec_cycles_of_opcode(op->next->c); + + block->state->cycles = 0; + + if (cycles) + jit_subi(LIGHTREC_REG_CYCLE, LIGHTREC_REG_CYCLE, cycles); + + if (!unconditional) { + u8 rs = lightrec_alloc_reg_in_ext(reg_cache, _jit, op->i.rs), + rt = bz ? 0 : lightrec_alloc_reg_in_ext(reg_cache, + _jit, op->i.rt); + + /* Generate the branch opcode */ + addr = jit_new_node_pww(code, NULL, rs, rt); + + lightrec_free_regs(reg_cache); + regs_backup = lightrec_regcache_enter_branch(reg_cache); + } + + if (op->flags & LIGHTREC_LOCAL_BRANCH) { + if (op->next && !(op->flags & LIGHTREC_NO_DS)) { + /* Recompile the delay slot */ + if (op->next->opcode) + lightrec_rec_opcode(block, op->next, pc + 4); + } + + if (link) { + /* Update the $ra register */ + link_reg = lightrec_alloc_reg_out(reg_cache, _jit, 31); + jit_movi(link_reg, link); + lightrec_free_reg(reg_cache, link_reg); + } + + /* Store back remaining registers */ + lightrec_storeback_regs(reg_cache, _jit); + + offset = op->offset + 1 + (s16)op->i.imm; + pr_debug("Adding local branch to offset 0x%x\n", offset << 2); + branch = &block->state->local_branches[ + block->state->nb_local_branches++]; + + branch->target = offset; + if (is_forward) + branch->branch = jit_jmpi(); + else + branch->branch = jit_bgti(LIGHTREC_REG_CYCLE, 0); + } + + if (!(op->flags & LIGHTREC_LOCAL_BRANCH) || !is_forward) { + lightrec_emit_end_of_block(block, op, pc, -1, + pc + 4 + ((s16)op->i.imm << 2), + 31, link, false); + } + + if (!unconditional) { + jit_patch(addr); + lightrec_regcache_leave_branch(reg_cache, regs_backup); + + if (bz && link) { + /* Update the $ra register */ + link_reg = lightrec_alloc_reg_out_ext(reg_cache, + _jit, 31); + jit_movi(link_reg, (s32)link); + lightrec_free_reg(reg_cache, link_reg); + } + + if (!(op->flags & LIGHTREC_NO_DS) && op->next->opcode) + lightrec_rec_opcode(block, op->next, pc + 4); + } +} + +static void rec_BNE(const struct block *block, const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_b(block, op, pc, jit_code_beqr, 0, false, false); +} + +static void rec_BEQ(const struct block *block, const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_b(block, op, pc, jit_code_bner, 0, + op->i.rs == op->i.rt, false); +} + +static void rec_BLEZ(const struct block *block, const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_b(block, op, pc, jit_code_bgti, 0, op->i.rs == 0, true); +} + +static void rec_BGTZ(const struct block *block, const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_b(block, op, pc, jit_code_blei, 0, false, true); +} + +static void rec_regimm_BLTZ(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_b(block, op, pc, jit_code_bgei, 0, false, true); +} + +static void rec_regimm_BLTZAL(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_b(block, op, pc, jit_code_bgei, pc + 8, false, true); +} + +static void rec_regimm_BGEZ(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_b(block, op, pc, jit_code_blti, 0, !op->i.rs, true); +} + +static void rec_regimm_BGEZAL(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_b(block, op, pc, jit_code_blti, pc + 8, !op->i.rs, true); +} + +static void rec_alu_imm(const struct block *block, const struct opcode *op, + jit_code_t code, bool sign_extend) +{ + struct regcache *reg_cache = block->state->reg_cache; + jit_state_t *_jit = block->_jit; + u8 rs, rt; + + jit_note(__FILE__, __LINE__); + rs = lightrec_alloc_reg_in_ext(reg_cache, _jit, op->i.rs); + rt = lightrec_alloc_reg_out_ext(reg_cache, _jit, op->i.rt); + + if (sign_extend) + jit_new_node_www(code, rt, rs, (s32)(s16) op->i.imm); + else + jit_new_node_www(code, rt, rs, (u32)(u16) op->i.imm); + + lightrec_free_reg(reg_cache, rs); + lightrec_free_reg(reg_cache, rt); +} + +static void rec_alu_special(const struct block *block, const struct opcode *op, + jit_code_t code, bool out_ext) +{ + struct regcache *reg_cache = block->state->reg_cache; + jit_state_t *_jit = block->_jit; + u8 rd, rt, rs; + + jit_note(__FILE__, __LINE__); + rs = lightrec_alloc_reg_in_ext(reg_cache, _jit, op->r.rs); + rt = lightrec_alloc_reg_in_ext(reg_cache, _jit, op->r.rt); + + if (out_ext) + rd = lightrec_alloc_reg_out_ext(reg_cache, _jit, op->r.rd); + else + rd = lightrec_alloc_reg_out(reg_cache, _jit, op->r.rd); + + jit_new_node_www(code, rd, rs, rt); + + lightrec_free_reg(reg_cache, rs); + lightrec_free_reg(reg_cache, rt); + lightrec_free_reg(reg_cache, rd); +} + +static void rec_alu_shiftv(const struct block *block, + const struct opcode *op, jit_code_t code) +{ + struct regcache *reg_cache = block->state->reg_cache; + jit_state_t *_jit = block->_jit; + u8 rd, rt, rs, temp; + + jit_note(__FILE__, __LINE__); + rs = lightrec_alloc_reg_in(reg_cache, _jit, op->r.rs); + temp = lightrec_alloc_reg_temp(reg_cache, _jit); + + if (code == jit_code_rshr) { + rt = lightrec_alloc_reg_in_ext(reg_cache, _jit, op->r.rt); + rd = lightrec_alloc_reg_out_ext(reg_cache, _jit, op->r.rd); + } else { + rt = lightrec_alloc_reg_in(reg_cache, _jit, op->r.rt); + rd = lightrec_alloc_reg_out(reg_cache, _jit, op->r.rd); + } + + jit_andi(temp, rs, 0x1f); + +#if __WORDSIZE == 64 + if (code == jit_code_rshr_u) { + jit_extr_ui(rd, rt); + jit_new_node_www(code, rd, rd, temp); + } +#endif + + if (__WORDSIZE == 32 || code != jit_code_rshr_u) + jit_new_node_www(code, rd, rt, temp); + + lightrec_free_reg(reg_cache, rs); + lightrec_free_reg(reg_cache, temp); + lightrec_free_reg(reg_cache, rt); + lightrec_free_reg(reg_cache, rd); +} + +static void rec_ADDIU(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_alu_imm(block, op, jit_code_addi, true); +} + +static void rec_ADDI(const struct block *block, const struct opcode *op, u32 pc) +{ + /* TODO: Handle the exception? */ + _jit_name(block->_jit, __func__); + rec_alu_imm(block, op, jit_code_addi, true); +} + +static void rec_SLTIU(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_alu_imm(block, op, jit_code_lti_u, true); +} + +static void rec_SLTI(const struct block *block, const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_alu_imm(block, op, jit_code_lti, true); +} + +static void rec_ANDI(const struct block *block, const struct opcode *op, u32 pc) +{ + struct regcache *reg_cache = block->state->reg_cache; + jit_state_t *_jit = block->_jit; + u8 rs, rt; + + _jit_name(block->_jit, __func__); + jit_note(__FILE__, __LINE__); + rs = lightrec_alloc_reg_in(reg_cache, _jit, op->i.rs); + rt = lightrec_alloc_reg_out_ext(reg_cache, _jit, op->i.rt); + + /* PSX code uses ANDI 0xff / ANDI 0xffff a lot, which are basically + * casts to uint8_t / uint16_t. */ + if (op->i.imm == 0xff) + jit_extr_uc(rt, rs); + else if (op->i.imm == 0xffff) + jit_extr_us(rt, rs); + else + jit_andi(rt, rs, (u32)(u16) op->i.imm); + + lightrec_free_reg(reg_cache, rs); + lightrec_free_reg(reg_cache, rt); +} + +static void rec_ORI(const struct block *block, const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_alu_imm(block, op, jit_code_ori, false); +} + +static void rec_XORI(const struct block *block, const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_alu_imm(block, op, jit_code_xori, false); +} + +static void rec_LUI(const struct block *block, const struct opcode *op, u32 pc) +{ + struct regcache *reg_cache = block->state->reg_cache; + jit_state_t *_jit = block->_jit; + u8 rt; + + jit_name(__func__); + jit_note(__FILE__, __LINE__); + rt = lightrec_alloc_reg_out_ext(reg_cache, _jit, op->i.rt); + + jit_movi(rt, (s32)(op->i.imm << 16)); + + lightrec_free_reg(reg_cache, rt); +} + +static void rec_special_ADDU(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_alu_special(block, op, jit_code_addr, false); +} + +static void rec_special_ADD(const struct block *block, + const struct opcode *op, u32 pc) +{ + /* TODO: Handle the exception? */ + _jit_name(block->_jit, __func__); + rec_alu_special(block, op, jit_code_addr, false); +} + +static void rec_special_SUBU(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_alu_special(block, op, jit_code_subr, false); +} + +static void rec_special_SUB(const struct block *block, + const struct opcode *op, u32 pc) +{ + /* TODO: Handle the exception? */ + _jit_name(block->_jit, __func__); + rec_alu_special(block, op, jit_code_subr, false); +} + +static void rec_special_AND(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_alu_special(block, op, jit_code_andr, false); +} + +static void rec_special_OR(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_alu_special(block, op, jit_code_orr, false); +} + +static void rec_special_XOR(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_alu_special(block, op, jit_code_xorr, false); +} + +static void rec_special_NOR(const struct block *block, + const struct opcode *op, u32 pc) +{ + struct regcache *reg_cache = block->state->reg_cache; + jit_state_t *_jit = block->_jit; + u8 rd; + + jit_name(__func__); + rec_alu_special(block, op, jit_code_orr, false); + rd = lightrec_alloc_reg_out(reg_cache, _jit, op->r.rd); + + jit_comr(rd, rd); + + lightrec_free_reg(reg_cache, rd); +} + +static void rec_special_SLTU(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_alu_special(block, op, jit_code_ltr_u, true); +} + +static void rec_special_SLT(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_alu_special(block, op, jit_code_ltr, true); +} + +static void rec_special_SLLV(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_alu_shiftv(block, op, jit_code_lshr); +} + +static void rec_special_SRLV(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_alu_shiftv(block, op, jit_code_rshr_u); +} + +static void rec_special_SRAV(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_alu_shiftv(block, op, jit_code_rshr); +} + +static void rec_alu_shift(const struct block *block, + const struct opcode *op, jit_code_t code) +{ + struct regcache *reg_cache = block->state->reg_cache; + jit_state_t *_jit = block->_jit; + u8 rd, rt; + + jit_note(__FILE__, __LINE__); + + if (code == jit_code_rshi) { + rt = lightrec_alloc_reg_in_ext(reg_cache, _jit, op->r.rt); + rd = lightrec_alloc_reg_out_ext(reg_cache, _jit, op->r.rd); + } else { + rt = lightrec_alloc_reg_in(reg_cache, _jit, op->r.rt); + rd = lightrec_alloc_reg_out(reg_cache, _jit, op->r.rd); + } + +#if __WORDSIZE == 64 + if (code == jit_code_rshi_u) { + jit_extr_ui(rd, rt); + jit_new_node_www(code, rd, rd, op->r.imm); + } +#endif + if (__WORDSIZE == 32 || code != jit_code_rshi_u) + jit_new_node_www(code, rd, rt, op->r.imm); + + lightrec_free_reg(reg_cache, rt); + lightrec_free_reg(reg_cache, rd); +} + +static void rec_special_SLL(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_alu_shift(block, op, jit_code_lshi); +} + +static void rec_special_SRL(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_alu_shift(block, op, jit_code_rshi_u); +} + +static void rec_special_SRA(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_alu_shift(block, op, jit_code_rshi); +} + +static void rec_alu_mult(const struct block *block, + const struct opcode *op, bool is_signed) +{ + struct regcache *reg_cache = block->state->reg_cache; + jit_state_t *_jit = block->_jit; + u8 lo, hi, rs, rt; + + jit_note(__FILE__, __LINE__); + + lo = lightrec_alloc_reg_out(reg_cache, _jit, REG_LO); + if (!(op->flags & LIGHTREC_MULT32)) + hi = lightrec_alloc_reg_out_ext(reg_cache, _jit, REG_HI); + else if (__WORDSIZE == 64) + hi = lightrec_alloc_reg_temp(reg_cache, _jit); + + if (__WORDSIZE == 32 || !is_signed) { + rs = lightrec_alloc_reg_in(reg_cache, _jit, op->r.rs); + rt = lightrec_alloc_reg_in(reg_cache, _jit, op->r.rt); + } else { + rs = lightrec_alloc_reg_in_ext(reg_cache, _jit, op->r.rs); + rt = lightrec_alloc_reg_in_ext(reg_cache, _jit, op->r.rt); + } + +#if __WORDSIZE == 32 + /* On 32-bit systems, do a 32*32->64 bit operation, or a 32*32->32 bit + * operation if the MULT was detected a 32-bit only. */ + if (!(op->flags & LIGHTREC_MULT32)) { + if (is_signed) + jit_qmulr(lo, hi, rs, rt); + else + jit_qmulr_u(lo, hi, rs, rt); + } else { + jit_mulr(lo, rs, rt); + } +#else + /* On 64-bit systems, do a 64*64->64 bit operation. + * The input registers must be 32 bits, so we first sign-extend (if + * mult) or clear (if multu) the input registers. */ + if (is_signed) { + jit_mulr(lo, rs, rt); + } else { + jit_extr_ui(lo, rt); + jit_extr_ui(hi, rs); + jit_mulr(lo, hi, lo); + } + + /* The 64-bit output value is in $lo, store the upper 32 bits in $hi */ + if (!(op->flags & LIGHTREC_MULT32)) + jit_rshi(hi, lo, 32); +#endif + + lightrec_free_reg(reg_cache, rs); + lightrec_free_reg(reg_cache, rt); + lightrec_free_reg(reg_cache, lo); + if (__WORDSIZE == 64 || !(op->flags & LIGHTREC_MULT32)) + lightrec_free_reg(reg_cache, hi); +} + +static void rec_alu_div(const struct block *block, + const struct opcode *op, bool is_signed) +{ + struct regcache *reg_cache = block->state->reg_cache; + jit_state_t *_jit = block->_jit; + jit_node_t *branch, *to_end; + u8 lo, hi, rs, rt; + + jit_note(__FILE__, __LINE__); + lo = lightrec_alloc_reg_out(reg_cache, _jit, REG_LO); + hi = lightrec_alloc_reg_out(reg_cache, _jit, REG_HI); + + if (__WORDSIZE == 32 || !is_signed) { + rs = lightrec_alloc_reg_in(reg_cache, _jit, op->r.rs); + rt = lightrec_alloc_reg_in(reg_cache, _jit, op->r.rt); + } else { + rs = lightrec_alloc_reg_in_ext(reg_cache, _jit, op->r.rs); + rt = lightrec_alloc_reg_in_ext(reg_cache, _jit, op->r.rt); + } + + /* Jump to special handler if dividing by zero */ + branch = jit_beqi(rt, 0); + +#if __WORDSIZE == 32 + if (is_signed) + jit_qdivr(lo, hi, rs, rt); + else + jit_qdivr_u(lo, hi, rs, rt); +#else + /* On 64-bit systems, the input registers must be 32 bits, so we first sign-extend + * (if div) or clear (if divu) the input registers. */ + if (is_signed) { + jit_qdivr(lo, hi, rs, rt); + } else { + jit_extr_ui(lo, rt); + jit_extr_ui(hi, rs); + jit_qdivr_u(lo, hi, hi, lo); + } +#endif + + /* Jump above the div-by-zero handler */ + to_end = jit_jmpi(); + + jit_patch(branch); + + if (is_signed) { + jit_lti(lo, rs, 0); + jit_lshi(lo, lo, 1); + jit_subi(lo, lo, 1); + } else { + jit_movi(lo, 0xffffffff); + } + + jit_movr(hi, rs); + + jit_patch(to_end); + + lightrec_free_reg(reg_cache, rs); + lightrec_free_reg(reg_cache, rt); + lightrec_free_reg(reg_cache, lo); + lightrec_free_reg(reg_cache, hi); +} + +static void rec_special_MULT(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_alu_mult(block, op, true); +} + +static void rec_special_MULTU(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_alu_mult(block, op, false); +} + +static void rec_special_DIV(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_alu_div(block, op, true); +} + +static void rec_special_DIVU(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_alu_div(block, op, false); +} + +static void rec_alu_mv_lo_hi(const struct block *block, u8 dst, u8 src) +{ + struct regcache *reg_cache = block->state->reg_cache; + jit_state_t *_jit = block->_jit; + + jit_note(__FILE__, __LINE__); + src = lightrec_alloc_reg_in(reg_cache, _jit, src); + dst = lightrec_alloc_reg_out_ext(reg_cache, _jit, dst); + +#if __WORDSIZE == 32 + jit_movr(dst, src); +#else + jit_extr_i(dst, src); +#endif + + lightrec_free_reg(reg_cache, src); + lightrec_free_reg(reg_cache, dst); +} + +static void rec_special_MFHI(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_alu_mv_lo_hi(block, op->r.rd, REG_HI); +} + +static void rec_special_MTHI(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_alu_mv_lo_hi(block, REG_HI, op->r.rs); +} + +static void rec_special_MFLO(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_alu_mv_lo_hi(block, op->r.rd, REG_LO); +} + +static void rec_special_MTLO(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_alu_mv_lo_hi(block, REG_LO, op->r.rs); +} + +static void rec_io(const struct block *block, const struct opcode *op, + bool load_rt, bool read_rt) +{ + struct regcache *reg_cache = block->state->reg_cache; + jit_state_t *_jit = block->_jit; + bool is_tagged = op->flags & (LIGHTREC_HW_IO | LIGHTREC_DIRECT_IO); + u32 offset; + u8 tmp, tmp2, tmp3; + + jit_note(__FILE__, __LINE__); + + tmp = lightrec_alloc_reg(reg_cache, _jit, JIT_R0); + + if (is_tagged) { + offset = offsetof(struct lightrec_state, rw_func); + } else { + tmp3 = lightrec_alloc_reg(reg_cache, _jit, JIT_R1); + offset = offsetof(struct lightrec_state, rw_generic_func); + } + + tmp2 = lightrec_alloc_reg_temp(reg_cache, _jit); + jit_ldxi(tmp2, LIGHTREC_REG_STATE, offset); + + lightrec_clean_reg_if_loaded(reg_cache, _jit, op->i.rs, false); + + if (read_rt && likely(op->i.rt)) + lightrec_clean_reg_if_loaded(reg_cache, _jit, op->i.rt, true); + else if (load_rt) + lightrec_clean_reg_if_loaded(reg_cache, _jit, op->i.rt, false); + + if (is_tagged) { + jit_movi(tmp, op->opcode); + } else { + jit_movi(tmp, (uintptr_t)op); + jit_movi(tmp3, (uintptr_t)block); + } + + jit_callr(tmp2); + + lightrec_free_reg(reg_cache, tmp); + lightrec_free_reg(reg_cache, tmp2); + if (!is_tagged) + lightrec_free_reg(reg_cache, tmp3); + lightrec_regcache_mark_live(reg_cache, _jit); +} + +static void rec_store_direct_no_invalidate(const struct block *block, + const struct opcode *op, + jit_code_t code) +{ + struct lightrec_state *state = block->state; + struct regcache *reg_cache = state->reg_cache; + jit_state_t *_jit = block->_jit; + jit_node_t *to_not_ram, *to_end; + u8 tmp, tmp2, rs, rt; + s16 imm; + + jit_note(__FILE__, __LINE__); + rs = lightrec_alloc_reg_in(reg_cache, _jit, op->i.rs); + tmp = lightrec_alloc_reg_temp(reg_cache, _jit); + tmp2 = lightrec_alloc_reg_temp(reg_cache, _jit); + + /* Convert to KUNSEG and avoid RAM mirrors */ + if (state->mirrors_mapped) { + imm = (s16)op->i.imm; + jit_andi(tmp, rs, 0x1f800000 | (4 * RAM_SIZE - 1)); + } else if (op->i.imm) { + imm = 0; + jit_addi(tmp, rs, (s16)op->i.imm); + jit_andi(tmp, tmp, 0x1f800000 | (RAM_SIZE - 1)); + } else { + imm = 0; + jit_andi(tmp, rs, 0x1f800000 | (RAM_SIZE - 1)); + } + + lightrec_free_reg(reg_cache, rs); + + if (state->offset_ram != state->offset_scratch) { + to_not_ram = jit_bmsi(tmp, BIT(28)); + + jit_movi(tmp2, state->offset_ram); + + to_end = jit_jmpi(); + jit_patch(to_not_ram); + + jit_movi(tmp2, state->offset_scratch); + jit_patch(to_end); + } else if (state->offset_ram) { + jit_movi(tmp2, state->offset_ram); + } + + if (state->offset_ram || state->offset_scratch) + jit_addr(tmp, tmp, tmp2); + + lightrec_free_reg(reg_cache, tmp2); + + rt = lightrec_alloc_reg_in(reg_cache, _jit, op->i.rt); + jit_new_node_www(code, imm, tmp, rt); + + lightrec_free_reg(reg_cache, rt); + lightrec_free_reg(reg_cache, tmp); +} + +static void rec_store_direct(const struct block *block, const struct opcode *op, + jit_code_t code) +{ + struct lightrec_state *state = block->state; + struct regcache *reg_cache = state->reg_cache; + jit_state_t *_jit = block->_jit; + jit_node_t *to_not_ram, *to_end; + u8 tmp, tmp2, tmp3, rs, rt; + + jit_note(__FILE__, __LINE__); + + rs = lightrec_alloc_reg_in(reg_cache, _jit, op->i.rs); + tmp2 = lightrec_alloc_reg_temp(reg_cache, _jit); + tmp3 = lightrec_alloc_reg_in(reg_cache, _jit, 0); + + /* Convert to KUNSEG and avoid RAM mirrors */ + if (op->i.imm) { + jit_addi(tmp2, rs, (s16)op->i.imm); + jit_andi(tmp2, tmp2, 0x1f800000 | (RAM_SIZE - 1)); + } else { + jit_andi(tmp2, rs, 0x1f800000 | (RAM_SIZE - 1)); + } + + lightrec_free_reg(reg_cache, rs); + tmp = lightrec_alloc_reg_temp(reg_cache, _jit); + + to_not_ram = jit_bgti(tmp2, RAM_SIZE); + + /* Compute the offset to the code LUT */ + jit_andi(tmp, tmp2, (RAM_SIZE - 1) & ~3); +#if __WORDSIZE == 64 + jit_lshi(tmp, tmp, 1); +#endif + jit_addr(tmp, LIGHTREC_REG_STATE, tmp); + + /* Write NULL to the code LUT to invalidate any block that's there */ + jit_stxi(offsetof(struct lightrec_state, code_lut), tmp, tmp3); + + if (state->offset_ram != state->offset_scratch) { + jit_movi(tmp, state->offset_ram); + + to_end = jit_jmpi(); + } + + jit_patch(to_not_ram); + + if (state->offset_ram || state->offset_scratch) + jit_movi(tmp, state->offset_scratch); + + if (state->offset_ram != state->offset_scratch) + jit_patch(to_end); + + if (state->offset_ram || state->offset_scratch) + jit_addr(tmp2, tmp2, tmp); + + lightrec_free_reg(reg_cache, tmp); + lightrec_free_reg(reg_cache, tmp3); + + rt = lightrec_alloc_reg_in(reg_cache, _jit, op->i.rt); + jit_new_node_www(code, 0, tmp2, rt); + + lightrec_free_reg(reg_cache, rt); + lightrec_free_reg(reg_cache, tmp2); +} + +static void rec_store(const struct block *block, const struct opcode *op, + jit_code_t code) +{ + if (op->flags & LIGHTREC_NO_INVALIDATE) { + rec_store_direct_no_invalidate(block, op, code); + } else if (op->flags & LIGHTREC_DIRECT_IO) { + if (block->state->invalidate_from_dma_only) + rec_store_direct_no_invalidate(block, op, code); + else + rec_store_direct(block, op, code); + } else { + rec_io(block, op, true, false); + } +} + +static void rec_SB(const struct block *block, const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_store(block, op, jit_code_stxi_c); +} + +static void rec_SH(const struct block *block, const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_store(block, op, jit_code_stxi_s); +} + +static void rec_SW(const struct block *block, const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_store(block, op, jit_code_stxi_i); +} + +static void rec_SWL(const struct block *block, const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_io(block, op, true, false); +} + +static void rec_SWR(const struct block *block, const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_io(block, op, true, false); +} + +static void rec_SWC2(const struct block *block, const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_io(block, op, false, false); +} + +static void rec_load_direct(const struct block *block, const struct opcode *op, + jit_code_t code) +{ + struct lightrec_state *state = block->state; + struct regcache *reg_cache = state->reg_cache; + jit_state_t *_jit = block->_jit; + jit_node_t *to_not_ram, *to_not_bios, *to_end, *to_end2; + u8 tmp, rs, rt, addr_reg; + s16 imm; + + if (!op->i.rt) + return; + + jit_note(__FILE__, __LINE__); + rs = lightrec_alloc_reg_in(reg_cache, _jit, op->i.rs); + rt = lightrec_alloc_reg_out_ext(reg_cache, _jit, op->i.rt); + + if ((state->offset_ram == state->offset_bios && + state->offset_ram == state->offset_scratch && + state->mirrors_mapped) || !op->i.imm) { + addr_reg = rs; + imm = (s16)op->i.imm; + } else { + jit_addi(rt, rs, (s16)op->i.imm); + addr_reg = rt; + imm = 0; + + if (op->i.rs != op->i.rt) + lightrec_free_reg(reg_cache, rs); + } + + tmp = lightrec_alloc_reg_temp(reg_cache, _jit); + + if (state->offset_ram == state->offset_bios && + state->offset_ram == state->offset_scratch) { + if (!state->mirrors_mapped) { + jit_andi(tmp, addr_reg, BIT(28)); + jit_rshi_u(tmp, tmp, 28 - 22); + jit_ori(tmp, tmp, 0x1f800000 | (RAM_SIZE - 1)); + jit_andr(rt, addr_reg, tmp); + } else { + jit_andi(rt, addr_reg, 0x1fffffff); + } + + if (state->offset_ram) + jit_movi(tmp, state->offset_ram); + } else { + to_not_ram = jit_bmsi(addr_reg, BIT(28)); + + /* Convert to KUNSEG and avoid RAM mirrors */ + jit_andi(rt, addr_reg, RAM_SIZE - 1); + + if (state->offset_ram) + jit_movi(tmp, state->offset_ram); + + to_end = jit_jmpi(); + + jit_patch(to_not_ram); + + if (state->offset_bios != state->offset_scratch) + to_not_bios = jit_bmci(addr_reg, BIT(22)); + + /* Convert to KUNSEG */ + jit_andi(rt, addr_reg, 0x1fc00000 | (BIOS_SIZE - 1)); + + jit_movi(tmp, state->offset_bios); + + if (state->offset_bios != state->offset_scratch) { + to_end2 = jit_jmpi(); + + jit_patch(to_not_bios); + + /* Convert to KUNSEG */ + jit_andi(rt, addr_reg, 0x1f800fff); + + if (state->offset_scratch) + jit_movi(tmp, state->offset_scratch); + + jit_patch(to_end2); + } + + jit_patch(to_end); + } + + if (state->offset_ram || state->offset_bios || state->offset_scratch) + jit_addr(rt, rt, tmp); + + jit_new_node_www(code, rt, rt, imm); + + lightrec_free_reg(reg_cache, addr_reg); + lightrec_free_reg(reg_cache, rt); + lightrec_free_reg(reg_cache, tmp); +} + +static void rec_load(const struct block *block, const struct opcode *op, + jit_code_t code) +{ + if (op->flags & LIGHTREC_DIRECT_IO) + rec_load_direct(block, op, code); + else + rec_io(block, op, false, true); +} + +static void rec_LB(const struct block *block, const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_load(block, op, jit_code_ldxi_c); +} + +static void rec_LBU(const struct block *block, const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_load(block, op, jit_code_ldxi_uc); +} + +static void rec_LH(const struct block *block, const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_load(block, op, jit_code_ldxi_s); +} + +static void rec_LHU(const struct block *block, const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_load(block, op, jit_code_ldxi_us); +} + +static void rec_LWL(const struct block *block, const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_io(block, op, true, true); +} + +static void rec_LWR(const struct block *block, const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_io(block, op, true, true); +} + +static void rec_LW(const struct block *block, const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_load(block, op, jit_code_ldxi_i); +} + +static void rec_LWC2(const struct block *block, const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_io(block, op, false, false); +} + +static void rec_break_syscall(const struct block *block, + const struct opcode *op, u32 pc, bool is_break) +{ + struct regcache *reg_cache = block->state->reg_cache; + jit_state_t *_jit = block->_jit; + u32 offset; + u8 tmp; + + jit_note(__FILE__, __LINE__); + + if (is_break) + offset = offsetof(struct lightrec_state, break_func); + else + offset = offsetof(struct lightrec_state, syscall_func); + + tmp = lightrec_alloc_reg_temp(reg_cache, _jit); + jit_ldxi(tmp, LIGHTREC_REG_STATE, offset); + jit_callr(tmp); + lightrec_free_reg(reg_cache, tmp); + + lightrec_regcache_mark_live(reg_cache, _jit); + + /* TODO: the return address should be "pc - 4" if we're a delay slot */ + lightrec_emit_end_of_block(block, op, pc, -1, pc, 31, 0, true); +} + +static void rec_special_SYSCALL(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_break_syscall(block, op, pc, false); +} + +static void rec_special_BREAK(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_break_syscall(block, op, pc, true); +} + +static void rec_mfc(const struct block *block, const struct opcode *op) +{ + u8 tmp, tmp2; + struct lightrec_state *state = block->state; + struct regcache *reg_cache = state->reg_cache; + jit_state_t *_jit = block->_jit; + + jit_note(__FILE__, __LINE__); + + tmp = lightrec_alloc_reg(reg_cache, _jit, JIT_R0); + tmp2 = lightrec_alloc_reg_temp(reg_cache, _jit); + + jit_ldxi(tmp2, LIGHTREC_REG_STATE, + offsetof(struct lightrec_state, mfc_func)); + + lightrec_clean_reg_if_loaded(reg_cache, _jit, op->i.rt, true); + + jit_movi(tmp, op->opcode); + jit_callr(tmp2); + lightrec_free_reg(reg_cache, tmp); + lightrec_free_reg(reg_cache, tmp2); + + lightrec_regcache_mark_live(reg_cache, _jit); +} + +static void rec_mtc(const struct block *block, const struct opcode *op, u32 pc) +{ + struct lightrec_state *state = block->state; + struct regcache *reg_cache = state->reg_cache; + jit_state_t *_jit = block->_jit; + u8 tmp, tmp2; + + jit_note(__FILE__, __LINE__); + + tmp = lightrec_alloc_reg(reg_cache, _jit, JIT_R0); + tmp2 = lightrec_alloc_reg_temp(reg_cache, _jit); + jit_ldxi(tmp2, LIGHTREC_REG_STATE, + offsetof(struct lightrec_state, mtc_func)); + + lightrec_clean_reg_if_loaded(reg_cache, _jit, op->i.rs, false); + lightrec_clean_reg_if_loaded(reg_cache, _jit, op->i.rt, false); + + jit_movi(tmp, op->opcode); + jit_callr(tmp2); + lightrec_free_reg(reg_cache, tmp); + lightrec_free_reg(reg_cache, tmp2); + + lightrec_regcache_mark_live(reg_cache, _jit); + + if (op->i.op == OP_CP0 && (op->r.rd == 12 || op->r.rd == 13)) + lightrec_emit_end_of_block(block, op, pc, -1, pc + 4, 0, 0, true); +} + +static void rec_cp0_MFC0(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_mfc(block, op); +} + +static void rec_cp0_CFC0(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_mfc(block, op); +} + +static void rec_cp0_MTC0(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_mtc(block, op, pc); +} + +static void rec_cp0_CTC0(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_mtc(block, op, pc); +} + +static void rec_cp2_basic_MFC2(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_mfc(block, op); +} + +static void rec_cp2_basic_CFC2(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_mfc(block, op); +} + +static void rec_cp2_basic_MTC2(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_mtc(block, op, pc); +} + +static void rec_cp2_basic_CTC2(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_mtc(block, op, pc); +} + +static void rec_cp0_RFE(const struct block *block, + const struct opcode *op, u32 pc) +{ + struct lightrec_state *state = block->state; + jit_state_t *_jit = block->_jit; + u8 tmp; + + jit_name(__func__); + jit_note(__FILE__, __LINE__); + + tmp = lightrec_alloc_reg_temp(state->reg_cache, _jit); + jit_ldxi(tmp, LIGHTREC_REG_STATE, + offsetof(struct lightrec_state, rfe_func)); + jit_callr(tmp); + lightrec_free_reg(state->reg_cache, tmp); + + lightrec_regcache_mark_live(state->reg_cache, _jit); +} + +static void rec_CP(const struct block *block, const struct opcode *op, u32 pc) +{ + struct regcache *reg_cache = block->state->reg_cache; + jit_state_t *_jit = block->_jit; + u8 tmp, tmp2; + + jit_name(__func__); + jit_note(__FILE__, __LINE__); + + tmp = lightrec_alloc_reg(reg_cache, _jit, JIT_R0); + tmp2 = lightrec_alloc_reg_temp(reg_cache, _jit); + + jit_ldxi(tmp2, LIGHTREC_REG_STATE, + offsetof(struct lightrec_state, cp_func)); + + jit_movi(tmp, op->opcode); + jit_callr(tmp2); + lightrec_free_reg(reg_cache, tmp); + lightrec_free_reg(reg_cache, tmp2); + + lightrec_regcache_mark_live(reg_cache, _jit); +} + +static void rec_meta_unload(const struct block *block, + const struct opcode *op, u32 pc) +{ + struct lightrec_state *state = block->state; + struct regcache *reg_cache = state->reg_cache; + jit_state_t *_jit = block->_jit; + + jit_name(__func__); + jit_note(__FILE__, __LINE__); + + pr_debug("Unloading reg %s\n", lightrec_reg_name(op->i.rs)); + lightrec_clean_reg_if_loaded(reg_cache, _jit, op->i.rs, true); +} + +static void rec_meta_BEQZ(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_b(block, op, pc, jit_code_bnei, 0, false, true); +} + +static void rec_meta_BNEZ(const struct block *block, + const struct opcode *op, u32 pc) +{ + _jit_name(block->_jit, __func__); + rec_b(block, op, pc, jit_code_beqi, 0, false, true); +} + +static void rec_meta_MOV(const struct block *block, + const struct opcode *op, u32 pc) +{ + struct lightrec_state *state = block->state; + struct regcache *reg_cache = state->reg_cache; + jit_state_t *_jit = block->_jit; + u8 rs, rd; + + _jit_name(block->_jit, __func__); + jit_note(__FILE__, __LINE__); + rs = op->r.rs ? lightrec_alloc_reg_in(reg_cache, _jit, op->r.rs) : 0; + rd = lightrec_alloc_reg_out_ext(reg_cache, _jit, op->r.rd); + + if (op->r.rs == 0) { + jit_movi(rd, 0); + } else { +#if __WORDSIZE == 32 + jit_movr(rd, rs); +#else + jit_extr_i(rd, rs); +#endif + } + + lightrec_free_reg(state->reg_cache, rs); + lightrec_free_reg(state->reg_cache, rd); +} + +static void rec_meta_sync(const struct block *block, + const struct opcode *op, u32 pc) +{ + struct lightrec_state *state = block->state; + struct lightrec_branch_target *target; + jit_state_t *_jit = block->_jit; + + jit_name(__func__); + jit_note(__FILE__, __LINE__); + + jit_subi(LIGHTREC_REG_CYCLE, LIGHTREC_REG_CYCLE, state->cycles); + state->cycles = 0; + + lightrec_storeback_regs(state->reg_cache, _jit); + lightrec_regcache_reset(state->reg_cache); + + pr_debug("Adding branch target at offset 0x%x\n", + op->offset << 2); + target = &state->targets[state->nb_targets++]; + target->offset = op->offset; + target->label = jit_label(); +} + +static const lightrec_rec_func_t rec_standard[64] = { + [OP_SPECIAL] = rec_SPECIAL, + [OP_REGIMM] = rec_REGIMM, + [OP_J] = rec_J, + [OP_JAL] = rec_JAL, + [OP_BEQ] = rec_BEQ, + [OP_BNE] = rec_BNE, + [OP_BLEZ] = rec_BLEZ, + [OP_BGTZ] = rec_BGTZ, + [OP_ADDI] = rec_ADDI, + [OP_ADDIU] = rec_ADDIU, + [OP_SLTI] = rec_SLTI, + [OP_SLTIU] = rec_SLTIU, + [OP_ANDI] = rec_ANDI, + [OP_ORI] = rec_ORI, + [OP_XORI] = rec_XORI, + [OP_LUI] = rec_LUI, + [OP_CP0] = rec_CP0, + [OP_CP2] = rec_CP2, + [OP_LB] = rec_LB, + [OP_LH] = rec_LH, + [OP_LWL] = rec_LWL, + [OP_LW] = rec_LW, + [OP_LBU] = rec_LBU, + [OP_LHU] = rec_LHU, + [OP_LWR] = rec_LWR, + [OP_SB] = rec_SB, + [OP_SH] = rec_SH, + [OP_SWL] = rec_SWL, + [OP_SW] = rec_SW, + [OP_SWR] = rec_SWR, + [OP_LWC2] = rec_LWC2, + [OP_SWC2] = rec_SWC2, + + [OP_META_REG_UNLOAD] = rec_meta_unload, + [OP_META_BEQZ] = rec_meta_BEQZ, + [OP_META_BNEZ] = rec_meta_BNEZ, + [OP_META_MOV] = rec_meta_MOV, + [OP_META_SYNC] = rec_meta_sync, +}; + +static const lightrec_rec_func_t rec_special[64] = { + [OP_SPECIAL_SLL] = rec_special_SLL, + [OP_SPECIAL_SRL] = rec_special_SRL, + [OP_SPECIAL_SRA] = rec_special_SRA, + [OP_SPECIAL_SLLV] = rec_special_SLLV, + [OP_SPECIAL_SRLV] = rec_special_SRLV, + [OP_SPECIAL_SRAV] = rec_special_SRAV, + [OP_SPECIAL_JR] = rec_special_JR, + [OP_SPECIAL_JALR] = rec_special_JALR, + [OP_SPECIAL_SYSCALL] = rec_special_SYSCALL, + [OP_SPECIAL_BREAK] = rec_special_BREAK, + [OP_SPECIAL_MFHI] = rec_special_MFHI, + [OP_SPECIAL_MTHI] = rec_special_MTHI, + [OP_SPECIAL_MFLO] = rec_special_MFLO, + [OP_SPECIAL_MTLO] = rec_special_MTLO, + [OP_SPECIAL_MULT] = rec_special_MULT, + [OP_SPECIAL_MULTU] = rec_special_MULTU, + [OP_SPECIAL_DIV] = rec_special_DIV, + [OP_SPECIAL_DIVU] = rec_special_DIVU, + [OP_SPECIAL_ADD] = rec_special_ADD, + [OP_SPECIAL_ADDU] = rec_special_ADDU, + [OP_SPECIAL_SUB] = rec_special_SUB, + [OP_SPECIAL_SUBU] = rec_special_SUBU, + [OP_SPECIAL_AND] = rec_special_AND, + [OP_SPECIAL_OR] = rec_special_OR, + [OP_SPECIAL_XOR] = rec_special_XOR, + [OP_SPECIAL_NOR] = rec_special_NOR, + [OP_SPECIAL_SLT] = rec_special_SLT, + [OP_SPECIAL_SLTU] = rec_special_SLTU, +}; + +static const lightrec_rec_func_t rec_regimm[64] = { + [OP_REGIMM_BLTZ] = rec_regimm_BLTZ, + [OP_REGIMM_BGEZ] = rec_regimm_BGEZ, + [OP_REGIMM_BLTZAL] = rec_regimm_BLTZAL, + [OP_REGIMM_BGEZAL] = rec_regimm_BGEZAL, +}; + +static const lightrec_rec_func_t rec_cp0[64] = { + [OP_CP0_MFC0] = rec_cp0_MFC0, + [OP_CP0_CFC0] = rec_cp0_CFC0, + [OP_CP0_MTC0] = rec_cp0_MTC0, + [OP_CP0_CTC0] = rec_cp0_CTC0, + [OP_CP0_RFE] = rec_cp0_RFE, +}; + +static const lightrec_rec_func_t rec_cp2_basic[64] = { + [OP_CP2_BASIC_MFC2] = rec_cp2_basic_MFC2, + [OP_CP2_BASIC_CFC2] = rec_cp2_basic_CFC2, + [OP_CP2_BASIC_MTC2] = rec_cp2_basic_MTC2, + [OP_CP2_BASIC_CTC2] = rec_cp2_basic_CTC2, +}; + +static void rec_SPECIAL(const struct block *block, + const struct opcode *op, u32 pc) +{ + lightrec_rec_func_t f = rec_special[op->r.op]; + if (likely(f)) + (*f)(block, op, pc); + else + unknown_opcode(block, op, pc); +} + +static void rec_REGIMM(const struct block *block, + const struct opcode *op, u32 pc) +{ + lightrec_rec_func_t f = rec_regimm[op->r.rt]; + if (likely(f)) + (*f)(block, op, pc); + else + unknown_opcode(block, op, pc); +} + +static void rec_CP0(const struct block *block, const struct opcode *op, u32 pc) +{ + lightrec_rec_func_t f = rec_cp0[op->r.rs]; + if (likely(f)) + (*f)(block, op, pc); + else + rec_CP(block, op, pc); +} + +static void rec_CP2(const struct block *block, const struct opcode *op, u32 pc) +{ + if (op->r.op == OP_CP2_BASIC) { + lightrec_rec_func_t f = rec_cp2_basic[op->r.rs]; + if (likely(f)) { + (*f)(block, op, pc); + return; + } + } + + rec_CP(block, op, pc); +} + +void lightrec_rec_opcode(const struct block *block, + const struct opcode *op, u32 pc) +{ + lightrec_rec_func_t f = rec_standard[op->i.op]; + if (likely(f)) + (*f)(block, op, pc); + else + unknown_opcode(block, op, pc); +} -- cgit v1.2.3