aboutsummaryrefslogtreecommitdiff
path: root/deps/lightrec/emitter.c
diff options
context:
space:
mode:
Diffstat (limited to 'deps/lightrec/emitter.c')
-rw-r--r--deps/lightrec/emitter.c1577
1 files changed, 1577 insertions, 0 deletions
diff --git a/deps/lightrec/emitter.c b/deps/lightrec/emitter.c
new file mode 100644
index 0000000..b09dc94
--- /dev/null
+++ b/deps/lightrec/emitter.c
@@ -0,0 +1,1577 @@
+/*
+ * Copyright (C) 2014-2020 Paul Cercueil <paul@crapouillou.net>
+ *
+ * This library is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU Lesser General Public
+ * License as published by the Free Software Foundation; either
+ * version 2.1 of the License, or (at your option) any later version.
+ *
+ * This library is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ * Lesser General Public License for more details.
+ */
+
+#include "blockcache.h"
+#include "debug.h"
+#include "disassembler.h"
+#include "emitter.h"
+#include "optimizer.h"
+#include "regcache.h"
+
+#include <lightning.h>
+#include <stdbool.h>
+#include <stddef.h>
+
+typedef void (*lightrec_rec_func_t)(const struct block *,
+ const struct opcode *, u32);
+
+/* Forward declarations */
+static void rec_SPECIAL(const struct block *block,
+ const struct opcode *op, u32 pc);
+static void rec_REGIMM(const struct block *block,
+ const struct opcode *op, u32 pc);
+static void rec_CP0(const struct block *block, const struct opcode *op, u32 pc);
+static void rec_CP2(const struct block *block, const struct opcode *op, u32 pc);
+
+
+static void unknown_opcode(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ pr_warn("Unknown opcode: 0x%08x at PC 0x%08x\n", op->opcode, pc);
+}
+
+static void lightrec_emit_end_of_block(const struct block *block,
+ const struct opcode *op, u32 pc,
+ s8 reg_new_pc, u32 imm, u8 ra_reg,
+ u32 link, bool update_cycles)
+{
+ struct lightrec_state *state = block->state;
+ struct regcache *reg_cache = state->reg_cache;
+ u32 cycles = state->cycles;
+ jit_state_t *_jit = block->_jit;
+
+ jit_note(__FILE__, __LINE__);
+
+ if (link) {
+ /* Update the $ra register */
+ u8 link_reg = lightrec_alloc_reg_out(reg_cache, _jit, ra_reg);
+ jit_movi(link_reg, link);
+ lightrec_free_reg(reg_cache, link_reg);
+ }
+
+ if (reg_new_pc < 0) {
+ reg_new_pc = lightrec_alloc_reg(reg_cache, _jit, JIT_V0);
+ lightrec_lock_reg(reg_cache, _jit, reg_new_pc);
+
+ jit_movi(reg_new_pc, imm);
+ }
+
+ if (has_delay_slot(op->c) &&
+ !(op->flags & (LIGHTREC_NO_DS | LIGHTREC_LOCAL_BRANCH))) {
+ cycles += lightrec_cycles_of_opcode(op->next->c);
+
+ /* Recompile the delay slot */
+ if (op->next->c.opcode)
+ lightrec_rec_opcode(block, op->next, pc + 4);
+ }
+
+ /* Store back remaining registers */
+ lightrec_storeback_regs(reg_cache, _jit);
+
+ jit_movr(JIT_V0, reg_new_pc);
+
+ if (cycles && update_cycles) {
+ jit_subi(LIGHTREC_REG_CYCLE, LIGHTREC_REG_CYCLE, cycles);
+ pr_debug("EOB: %u cycles\n", cycles);
+ }
+
+ if (op->next && ((op->flags & LIGHTREC_NO_DS) || op->next->next))
+ state->branches[state->nb_branches++] = jit_jmpi();
+}
+
+void lightrec_emit_eob(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ struct lightrec_state *state = block->state;
+ struct regcache *reg_cache = state->reg_cache;
+ jit_state_t *_jit = block->_jit;
+
+ lightrec_storeback_regs(reg_cache, _jit);
+
+ jit_movi(JIT_V0, pc);
+ jit_subi(LIGHTREC_REG_CYCLE, LIGHTREC_REG_CYCLE,
+ state->cycles - lightrec_cycles_of_opcode(op->c));
+
+ state->branches[state->nb_branches++] = jit_jmpi();
+}
+
+static void rec_special_JR(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ struct regcache *reg_cache = block->state->reg_cache;
+ jit_state_t *_jit = block->_jit;
+ u8 rs = lightrec_request_reg_in(reg_cache, _jit, op->r.rs, JIT_V0);
+
+ _jit_name(block->_jit, __func__);
+ lightrec_lock_reg(reg_cache, _jit, rs);
+ lightrec_emit_end_of_block(block, op, pc, rs, 0, 31, 0, true);
+}
+
+static void rec_special_JALR(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ struct regcache *reg_cache = block->state->reg_cache;
+ jit_state_t *_jit = block->_jit;
+ u8 rs = lightrec_request_reg_in(reg_cache, _jit, op->r.rs, JIT_V0);
+
+ _jit_name(block->_jit, __func__);
+ lightrec_lock_reg(reg_cache, _jit, rs);
+ lightrec_emit_end_of_block(block, op, pc, rs, 0, op->r.rd, pc + 8, true);
+}
+
+static void rec_J(const struct block *block, const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ lightrec_emit_end_of_block(block, op, pc, -1,
+ (pc & 0xf0000000) | (op->j.imm << 2), 31, 0, true);
+}
+
+static void rec_JAL(const struct block *block, const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ lightrec_emit_end_of_block(block, op, pc, -1,
+ (pc & 0xf0000000) | (op->j.imm << 2),
+ 31, pc + 8, true);
+}
+
+static void rec_b(const struct block *block, const struct opcode *op, u32 pc,
+ jit_code_t code, u32 link, bool unconditional, bool bz)
+{
+ struct regcache *reg_cache = block->state->reg_cache;
+ struct native_register *regs_backup;
+ jit_state_t *_jit = block->_jit;
+ struct lightrec_branch *branch;
+ jit_node_t *addr;
+ u8 link_reg;
+ u32 offset, cycles = block->state->cycles;
+ bool is_forward = (s16)op->i.imm >= -1;
+
+ jit_note(__FILE__, __LINE__);
+
+ if (!(op->flags & LIGHTREC_NO_DS))
+ cycles += lightrec_cycles_of_opcode(op->next->c);
+
+ block->state->cycles = 0;
+
+ if (cycles)
+ jit_subi(LIGHTREC_REG_CYCLE, LIGHTREC_REG_CYCLE, cycles);
+
+ if (!unconditional) {
+ u8 rs = lightrec_alloc_reg_in_ext(reg_cache, _jit, op->i.rs),
+ rt = bz ? 0 : lightrec_alloc_reg_in_ext(reg_cache,
+ _jit, op->i.rt);
+
+ /* Generate the branch opcode */
+ addr = jit_new_node_pww(code, NULL, rs, rt);
+
+ lightrec_free_regs(reg_cache);
+ regs_backup = lightrec_regcache_enter_branch(reg_cache);
+ }
+
+ if (op->flags & LIGHTREC_LOCAL_BRANCH) {
+ if (op->next && !(op->flags & LIGHTREC_NO_DS)) {
+ /* Recompile the delay slot */
+ if (op->next->opcode)
+ lightrec_rec_opcode(block, op->next, pc + 4);
+ }
+
+ if (link) {
+ /* Update the $ra register */
+ link_reg = lightrec_alloc_reg_out(reg_cache, _jit, 31);
+ jit_movi(link_reg, link);
+ lightrec_free_reg(reg_cache, link_reg);
+ }
+
+ /* Store back remaining registers */
+ lightrec_storeback_regs(reg_cache, _jit);
+
+ offset = op->offset + 1 + (s16)op->i.imm;
+ pr_debug("Adding local branch to offset 0x%x\n", offset << 2);
+ branch = &block->state->local_branches[
+ block->state->nb_local_branches++];
+
+ branch->target = offset;
+ if (is_forward)
+ branch->branch = jit_jmpi();
+ else
+ branch->branch = jit_bgti(LIGHTREC_REG_CYCLE, 0);
+ }
+
+ if (!(op->flags & LIGHTREC_LOCAL_BRANCH) || !is_forward) {
+ lightrec_emit_end_of_block(block, op, pc, -1,
+ pc + 4 + ((s16)op->i.imm << 2),
+ 31, link, false);
+ }
+
+ if (!unconditional) {
+ jit_patch(addr);
+ lightrec_regcache_leave_branch(reg_cache, regs_backup);
+
+ if (bz && link) {
+ /* Update the $ra register */
+ link_reg = lightrec_alloc_reg_out_ext(reg_cache,
+ _jit, 31);
+ jit_movi(link_reg, (s32)link);
+ lightrec_free_reg(reg_cache, link_reg);
+ }
+
+ if (!(op->flags & LIGHTREC_NO_DS) && op->next->opcode)
+ lightrec_rec_opcode(block, op->next, pc + 4);
+ }
+}
+
+static void rec_BNE(const struct block *block, const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_b(block, op, pc, jit_code_beqr, 0, false, false);
+}
+
+static void rec_BEQ(const struct block *block, const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_b(block, op, pc, jit_code_bner, 0,
+ op->i.rs == op->i.rt, false);
+}
+
+static void rec_BLEZ(const struct block *block, const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_b(block, op, pc, jit_code_bgti, 0, op->i.rs == 0, true);
+}
+
+static void rec_BGTZ(const struct block *block, const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_b(block, op, pc, jit_code_blei, 0, false, true);
+}
+
+static void rec_regimm_BLTZ(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_b(block, op, pc, jit_code_bgei, 0, false, true);
+}
+
+static void rec_regimm_BLTZAL(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_b(block, op, pc, jit_code_bgei, pc + 8, false, true);
+}
+
+static void rec_regimm_BGEZ(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_b(block, op, pc, jit_code_blti, 0, !op->i.rs, true);
+}
+
+static void rec_regimm_BGEZAL(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_b(block, op, pc, jit_code_blti, pc + 8, !op->i.rs, true);
+}
+
+static void rec_alu_imm(const struct block *block, const struct opcode *op,
+ jit_code_t code, bool sign_extend)
+{
+ struct regcache *reg_cache = block->state->reg_cache;
+ jit_state_t *_jit = block->_jit;
+ u8 rs, rt;
+
+ jit_note(__FILE__, __LINE__);
+ rs = lightrec_alloc_reg_in_ext(reg_cache, _jit, op->i.rs);
+ rt = lightrec_alloc_reg_out_ext(reg_cache, _jit, op->i.rt);
+
+ if (sign_extend)
+ jit_new_node_www(code, rt, rs, (s32)(s16) op->i.imm);
+ else
+ jit_new_node_www(code, rt, rs, (u32)(u16) op->i.imm);
+
+ lightrec_free_reg(reg_cache, rs);
+ lightrec_free_reg(reg_cache, rt);
+}
+
+static void rec_alu_special(const struct block *block, const struct opcode *op,
+ jit_code_t code, bool out_ext)
+{
+ struct regcache *reg_cache = block->state->reg_cache;
+ jit_state_t *_jit = block->_jit;
+ u8 rd, rt, rs;
+
+ jit_note(__FILE__, __LINE__);
+ rs = lightrec_alloc_reg_in_ext(reg_cache, _jit, op->r.rs);
+ rt = lightrec_alloc_reg_in_ext(reg_cache, _jit, op->r.rt);
+
+ if (out_ext)
+ rd = lightrec_alloc_reg_out_ext(reg_cache, _jit, op->r.rd);
+ else
+ rd = lightrec_alloc_reg_out(reg_cache, _jit, op->r.rd);
+
+ jit_new_node_www(code, rd, rs, rt);
+
+ lightrec_free_reg(reg_cache, rs);
+ lightrec_free_reg(reg_cache, rt);
+ lightrec_free_reg(reg_cache, rd);
+}
+
+static void rec_alu_shiftv(const struct block *block,
+ const struct opcode *op, jit_code_t code)
+{
+ struct regcache *reg_cache = block->state->reg_cache;
+ jit_state_t *_jit = block->_jit;
+ u8 rd, rt, rs, temp;
+
+ jit_note(__FILE__, __LINE__);
+ rs = lightrec_alloc_reg_in(reg_cache, _jit, op->r.rs);
+ temp = lightrec_alloc_reg_temp(reg_cache, _jit);
+
+ if (code == jit_code_rshr) {
+ rt = lightrec_alloc_reg_in_ext(reg_cache, _jit, op->r.rt);
+ rd = lightrec_alloc_reg_out_ext(reg_cache, _jit, op->r.rd);
+ } else {
+ rt = lightrec_alloc_reg_in(reg_cache, _jit, op->r.rt);
+ rd = lightrec_alloc_reg_out(reg_cache, _jit, op->r.rd);
+ }
+
+ jit_andi(temp, rs, 0x1f);
+
+#if __WORDSIZE == 64
+ if (code == jit_code_rshr_u) {
+ jit_extr_ui(rd, rt);
+ jit_new_node_www(code, rd, rd, temp);
+ }
+#endif
+
+ if (__WORDSIZE == 32 || code != jit_code_rshr_u)
+ jit_new_node_www(code, rd, rt, temp);
+
+ lightrec_free_reg(reg_cache, rs);
+ lightrec_free_reg(reg_cache, temp);
+ lightrec_free_reg(reg_cache, rt);
+ lightrec_free_reg(reg_cache, rd);
+}
+
+static void rec_ADDIU(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_alu_imm(block, op, jit_code_addi, true);
+}
+
+static void rec_ADDI(const struct block *block, const struct opcode *op, u32 pc)
+{
+ /* TODO: Handle the exception? */
+ _jit_name(block->_jit, __func__);
+ rec_alu_imm(block, op, jit_code_addi, true);
+}
+
+static void rec_SLTIU(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_alu_imm(block, op, jit_code_lti_u, true);
+}
+
+static void rec_SLTI(const struct block *block, const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_alu_imm(block, op, jit_code_lti, true);
+}
+
+static void rec_ANDI(const struct block *block, const struct opcode *op, u32 pc)
+{
+ struct regcache *reg_cache = block->state->reg_cache;
+ jit_state_t *_jit = block->_jit;
+ u8 rs, rt;
+
+ _jit_name(block->_jit, __func__);
+ jit_note(__FILE__, __LINE__);
+ rs = lightrec_alloc_reg_in(reg_cache, _jit, op->i.rs);
+ rt = lightrec_alloc_reg_out_ext(reg_cache, _jit, op->i.rt);
+
+ /* PSX code uses ANDI 0xff / ANDI 0xffff a lot, which are basically
+ * casts to uint8_t / uint16_t. */
+ if (op->i.imm == 0xff)
+ jit_extr_uc(rt, rs);
+ else if (op->i.imm == 0xffff)
+ jit_extr_us(rt, rs);
+ else
+ jit_andi(rt, rs, (u32)(u16) op->i.imm);
+
+ lightrec_free_reg(reg_cache, rs);
+ lightrec_free_reg(reg_cache, rt);
+}
+
+static void rec_ORI(const struct block *block, const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_alu_imm(block, op, jit_code_ori, false);
+}
+
+static void rec_XORI(const struct block *block, const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_alu_imm(block, op, jit_code_xori, false);
+}
+
+static void rec_LUI(const struct block *block, const struct opcode *op, u32 pc)
+{
+ struct regcache *reg_cache = block->state->reg_cache;
+ jit_state_t *_jit = block->_jit;
+ u8 rt;
+
+ jit_name(__func__);
+ jit_note(__FILE__, __LINE__);
+ rt = lightrec_alloc_reg_out_ext(reg_cache, _jit, op->i.rt);
+
+ jit_movi(rt, (s32)(op->i.imm << 16));
+
+ lightrec_free_reg(reg_cache, rt);
+}
+
+static void rec_special_ADDU(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_alu_special(block, op, jit_code_addr, false);
+}
+
+static void rec_special_ADD(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ /* TODO: Handle the exception? */
+ _jit_name(block->_jit, __func__);
+ rec_alu_special(block, op, jit_code_addr, false);
+}
+
+static void rec_special_SUBU(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_alu_special(block, op, jit_code_subr, false);
+}
+
+static void rec_special_SUB(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ /* TODO: Handle the exception? */
+ _jit_name(block->_jit, __func__);
+ rec_alu_special(block, op, jit_code_subr, false);
+}
+
+static void rec_special_AND(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_alu_special(block, op, jit_code_andr, false);
+}
+
+static void rec_special_OR(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_alu_special(block, op, jit_code_orr, false);
+}
+
+static void rec_special_XOR(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_alu_special(block, op, jit_code_xorr, false);
+}
+
+static void rec_special_NOR(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ struct regcache *reg_cache = block->state->reg_cache;
+ jit_state_t *_jit = block->_jit;
+ u8 rd;
+
+ jit_name(__func__);
+ rec_alu_special(block, op, jit_code_orr, false);
+ rd = lightrec_alloc_reg_out(reg_cache, _jit, op->r.rd);
+
+ jit_comr(rd, rd);
+
+ lightrec_free_reg(reg_cache, rd);
+}
+
+static void rec_special_SLTU(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_alu_special(block, op, jit_code_ltr_u, true);
+}
+
+static void rec_special_SLT(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_alu_special(block, op, jit_code_ltr, true);
+}
+
+static void rec_special_SLLV(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_alu_shiftv(block, op, jit_code_lshr);
+}
+
+static void rec_special_SRLV(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_alu_shiftv(block, op, jit_code_rshr_u);
+}
+
+static void rec_special_SRAV(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_alu_shiftv(block, op, jit_code_rshr);
+}
+
+static void rec_alu_shift(const struct block *block,
+ const struct opcode *op, jit_code_t code)
+{
+ struct regcache *reg_cache = block->state->reg_cache;
+ jit_state_t *_jit = block->_jit;
+ u8 rd, rt;
+
+ jit_note(__FILE__, __LINE__);
+
+ if (code == jit_code_rshi) {
+ rt = lightrec_alloc_reg_in_ext(reg_cache, _jit, op->r.rt);
+ rd = lightrec_alloc_reg_out_ext(reg_cache, _jit, op->r.rd);
+ } else {
+ rt = lightrec_alloc_reg_in(reg_cache, _jit, op->r.rt);
+ rd = lightrec_alloc_reg_out(reg_cache, _jit, op->r.rd);
+ }
+
+#if __WORDSIZE == 64
+ if (code == jit_code_rshi_u) {
+ jit_extr_ui(rd, rt);
+ jit_new_node_www(code, rd, rd, op->r.imm);
+ }
+#endif
+ if (__WORDSIZE == 32 || code != jit_code_rshi_u)
+ jit_new_node_www(code, rd, rt, op->r.imm);
+
+ lightrec_free_reg(reg_cache, rt);
+ lightrec_free_reg(reg_cache, rd);
+}
+
+static void rec_special_SLL(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_alu_shift(block, op, jit_code_lshi);
+}
+
+static void rec_special_SRL(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_alu_shift(block, op, jit_code_rshi_u);
+}
+
+static void rec_special_SRA(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_alu_shift(block, op, jit_code_rshi);
+}
+
+static void rec_alu_mult(const struct block *block,
+ const struct opcode *op, bool is_signed)
+{
+ struct regcache *reg_cache = block->state->reg_cache;
+ jit_state_t *_jit = block->_jit;
+ u8 lo, hi, rs, rt;
+
+ jit_note(__FILE__, __LINE__);
+
+ lo = lightrec_alloc_reg_out(reg_cache, _jit, REG_LO);
+ if (!(op->flags & LIGHTREC_MULT32))
+ hi = lightrec_alloc_reg_out_ext(reg_cache, _jit, REG_HI);
+ else if (__WORDSIZE == 64)
+ hi = lightrec_alloc_reg_temp(reg_cache, _jit);
+
+ if (__WORDSIZE == 32 || !is_signed) {
+ rs = lightrec_alloc_reg_in(reg_cache, _jit, op->r.rs);
+ rt = lightrec_alloc_reg_in(reg_cache, _jit, op->r.rt);
+ } else {
+ rs = lightrec_alloc_reg_in_ext(reg_cache, _jit, op->r.rs);
+ rt = lightrec_alloc_reg_in_ext(reg_cache, _jit, op->r.rt);
+ }
+
+#if __WORDSIZE == 32
+ /* On 32-bit systems, do a 32*32->64 bit operation, or a 32*32->32 bit
+ * operation if the MULT was detected a 32-bit only. */
+ if (!(op->flags & LIGHTREC_MULT32)) {
+ if (is_signed)
+ jit_qmulr(lo, hi, rs, rt);
+ else
+ jit_qmulr_u(lo, hi, rs, rt);
+ } else {
+ jit_mulr(lo, rs, rt);
+ }
+#else
+ /* On 64-bit systems, do a 64*64->64 bit operation.
+ * The input registers must be 32 bits, so we first sign-extend (if
+ * mult) or clear (if multu) the input registers. */
+ if (is_signed) {
+ jit_mulr(lo, rs, rt);
+ } else {
+ jit_extr_ui(lo, rt);
+ jit_extr_ui(hi, rs);
+ jit_mulr(lo, hi, lo);
+ }
+
+ /* The 64-bit output value is in $lo, store the upper 32 bits in $hi */
+ if (!(op->flags & LIGHTREC_MULT32))
+ jit_rshi(hi, lo, 32);
+#endif
+
+ lightrec_free_reg(reg_cache, rs);
+ lightrec_free_reg(reg_cache, rt);
+ lightrec_free_reg(reg_cache, lo);
+ if (__WORDSIZE == 64 || !(op->flags & LIGHTREC_MULT32))
+ lightrec_free_reg(reg_cache, hi);
+}
+
+static void rec_alu_div(const struct block *block,
+ const struct opcode *op, bool is_signed)
+{
+ struct regcache *reg_cache = block->state->reg_cache;
+ jit_state_t *_jit = block->_jit;
+ jit_node_t *branch, *to_end;
+ u8 lo, hi, rs, rt;
+
+ jit_note(__FILE__, __LINE__);
+ lo = lightrec_alloc_reg_out(reg_cache, _jit, REG_LO);
+ hi = lightrec_alloc_reg_out(reg_cache, _jit, REG_HI);
+
+ if (__WORDSIZE == 32 || !is_signed) {
+ rs = lightrec_alloc_reg_in(reg_cache, _jit, op->r.rs);
+ rt = lightrec_alloc_reg_in(reg_cache, _jit, op->r.rt);
+ } else {
+ rs = lightrec_alloc_reg_in_ext(reg_cache, _jit, op->r.rs);
+ rt = lightrec_alloc_reg_in_ext(reg_cache, _jit, op->r.rt);
+ }
+
+ /* Jump to special handler if dividing by zero */
+ branch = jit_beqi(rt, 0);
+
+#if __WORDSIZE == 32
+ if (is_signed)
+ jit_qdivr(lo, hi, rs, rt);
+ else
+ jit_qdivr_u(lo, hi, rs, rt);
+#else
+ /* On 64-bit systems, the input registers must be 32 bits, so we first sign-extend
+ * (if div) or clear (if divu) the input registers. */
+ if (is_signed) {
+ jit_qdivr(lo, hi, rs, rt);
+ } else {
+ jit_extr_ui(lo, rt);
+ jit_extr_ui(hi, rs);
+ jit_qdivr_u(lo, hi, hi, lo);
+ }
+#endif
+
+ /* Jump above the div-by-zero handler */
+ to_end = jit_jmpi();
+
+ jit_patch(branch);
+
+ if (is_signed) {
+ jit_lti(lo, rs, 0);
+ jit_lshi(lo, lo, 1);
+ jit_subi(lo, lo, 1);
+ } else {
+ jit_movi(lo, 0xffffffff);
+ }
+
+ jit_movr(hi, rs);
+
+ jit_patch(to_end);
+
+ lightrec_free_reg(reg_cache, rs);
+ lightrec_free_reg(reg_cache, rt);
+ lightrec_free_reg(reg_cache, lo);
+ lightrec_free_reg(reg_cache, hi);
+}
+
+static void rec_special_MULT(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_alu_mult(block, op, true);
+}
+
+static void rec_special_MULTU(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_alu_mult(block, op, false);
+}
+
+static void rec_special_DIV(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_alu_div(block, op, true);
+}
+
+static void rec_special_DIVU(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_alu_div(block, op, false);
+}
+
+static void rec_alu_mv_lo_hi(const struct block *block, u8 dst, u8 src)
+{
+ struct regcache *reg_cache = block->state->reg_cache;
+ jit_state_t *_jit = block->_jit;
+
+ jit_note(__FILE__, __LINE__);
+ src = lightrec_alloc_reg_in(reg_cache, _jit, src);
+ dst = lightrec_alloc_reg_out_ext(reg_cache, _jit, dst);
+
+#if __WORDSIZE == 32
+ jit_movr(dst, src);
+#else
+ jit_extr_i(dst, src);
+#endif
+
+ lightrec_free_reg(reg_cache, src);
+ lightrec_free_reg(reg_cache, dst);
+}
+
+static void rec_special_MFHI(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_alu_mv_lo_hi(block, op->r.rd, REG_HI);
+}
+
+static void rec_special_MTHI(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_alu_mv_lo_hi(block, REG_HI, op->r.rs);
+}
+
+static void rec_special_MFLO(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_alu_mv_lo_hi(block, op->r.rd, REG_LO);
+}
+
+static void rec_special_MTLO(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_alu_mv_lo_hi(block, REG_LO, op->r.rs);
+}
+
+static void rec_io(const struct block *block, const struct opcode *op,
+ bool load_rt, bool read_rt)
+{
+ struct regcache *reg_cache = block->state->reg_cache;
+ jit_state_t *_jit = block->_jit;
+ bool is_tagged = op->flags & (LIGHTREC_HW_IO | LIGHTREC_DIRECT_IO);
+ u32 offset;
+ u8 tmp, tmp2, tmp3;
+
+ jit_note(__FILE__, __LINE__);
+
+ tmp = lightrec_alloc_reg(reg_cache, _jit, JIT_R0);
+
+ if (is_tagged) {
+ offset = offsetof(struct lightrec_state, rw_func);
+ } else {
+ tmp3 = lightrec_alloc_reg(reg_cache, _jit, JIT_R1);
+ offset = offsetof(struct lightrec_state, rw_generic_func);
+ }
+
+ tmp2 = lightrec_alloc_reg_temp(reg_cache, _jit);
+ jit_ldxi(tmp2, LIGHTREC_REG_STATE, offset);
+
+ lightrec_clean_reg_if_loaded(reg_cache, _jit, op->i.rs, false);
+
+ if (read_rt && likely(op->i.rt))
+ lightrec_clean_reg_if_loaded(reg_cache, _jit, op->i.rt, true);
+ else if (load_rt)
+ lightrec_clean_reg_if_loaded(reg_cache, _jit, op->i.rt, false);
+
+ if (is_tagged) {
+ jit_movi(tmp, op->opcode);
+ } else {
+ jit_movi(tmp, (uintptr_t)op);
+ jit_movi(tmp3, (uintptr_t)block);
+ }
+
+ jit_callr(tmp2);
+
+ lightrec_free_reg(reg_cache, tmp);
+ lightrec_free_reg(reg_cache, tmp2);
+ if (!is_tagged)
+ lightrec_free_reg(reg_cache, tmp3);
+ lightrec_regcache_mark_live(reg_cache, _jit);
+}
+
+static void rec_store_direct_no_invalidate(const struct block *block,
+ const struct opcode *op,
+ jit_code_t code)
+{
+ struct lightrec_state *state = block->state;
+ struct regcache *reg_cache = state->reg_cache;
+ jit_state_t *_jit = block->_jit;
+ jit_node_t *to_not_ram, *to_end;
+ u8 tmp, tmp2, rs, rt;
+ s16 imm;
+
+ jit_note(__FILE__, __LINE__);
+ rs = lightrec_alloc_reg_in(reg_cache, _jit, op->i.rs);
+ tmp = lightrec_alloc_reg_temp(reg_cache, _jit);
+ tmp2 = lightrec_alloc_reg_temp(reg_cache, _jit);
+
+ /* Convert to KUNSEG and avoid RAM mirrors */
+ if (state->mirrors_mapped) {
+ imm = (s16)op->i.imm;
+ jit_andi(tmp, rs, 0x1f800000 | (4 * RAM_SIZE - 1));
+ } else if (op->i.imm) {
+ imm = 0;
+ jit_addi(tmp, rs, (s16)op->i.imm);
+ jit_andi(tmp, tmp, 0x1f800000 | (RAM_SIZE - 1));
+ } else {
+ imm = 0;
+ jit_andi(tmp, rs, 0x1f800000 | (RAM_SIZE - 1));
+ }
+
+ lightrec_free_reg(reg_cache, rs);
+
+ if (state->offset_ram != state->offset_scratch) {
+ to_not_ram = jit_bmsi(tmp, BIT(28));
+
+ jit_movi(tmp2, state->offset_ram);
+
+ to_end = jit_jmpi();
+ jit_patch(to_not_ram);
+
+ jit_movi(tmp2, state->offset_scratch);
+ jit_patch(to_end);
+ } else if (state->offset_ram) {
+ jit_movi(tmp2, state->offset_ram);
+ }
+
+ if (state->offset_ram || state->offset_scratch)
+ jit_addr(tmp, tmp, tmp2);
+
+ lightrec_free_reg(reg_cache, tmp2);
+
+ rt = lightrec_alloc_reg_in(reg_cache, _jit, op->i.rt);
+ jit_new_node_www(code, imm, tmp, rt);
+
+ lightrec_free_reg(reg_cache, rt);
+ lightrec_free_reg(reg_cache, tmp);
+}
+
+static void rec_store_direct(const struct block *block, const struct opcode *op,
+ jit_code_t code)
+{
+ struct lightrec_state *state = block->state;
+ struct regcache *reg_cache = state->reg_cache;
+ jit_state_t *_jit = block->_jit;
+ jit_node_t *to_not_ram, *to_end;
+ u8 tmp, tmp2, tmp3, rs, rt;
+
+ jit_note(__FILE__, __LINE__);
+
+ rs = lightrec_alloc_reg_in(reg_cache, _jit, op->i.rs);
+ tmp2 = lightrec_alloc_reg_temp(reg_cache, _jit);
+ tmp3 = lightrec_alloc_reg_in(reg_cache, _jit, 0);
+
+ /* Convert to KUNSEG and avoid RAM mirrors */
+ if (op->i.imm) {
+ jit_addi(tmp2, rs, (s16)op->i.imm);
+ jit_andi(tmp2, tmp2, 0x1f800000 | (RAM_SIZE - 1));
+ } else {
+ jit_andi(tmp2, rs, 0x1f800000 | (RAM_SIZE - 1));
+ }
+
+ lightrec_free_reg(reg_cache, rs);
+ tmp = lightrec_alloc_reg_temp(reg_cache, _jit);
+
+ to_not_ram = jit_bgti(tmp2, RAM_SIZE);
+
+ /* Compute the offset to the code LUT */
+ jit_andi(tmp, tmp2, (RAM_SIZE - 1) & ~3);
+#if __WORDSIZE == 64
+ jit_lshi(tmp, tmp, 1);
+#endif
+ jit_addr(tmp, LIGHTREC_REG_STATE, tmp);
+
+ /* Write NULL to the code LUT to invalidate any block that's there */
+ jit_stxi(offsetof(struct lightrec_state, code_lut), tmp, tmp3);
+
+ if (state->offset_ram != state->offset_scratch) {
+ jit_movi(tmp, state->offset_ram);
+
+ to_end = jit_jmpi();
+ }
+
+ jit_patch(to_not_ram);
+
+ if (state->offset_ram || state->offset_scratch)
+ jit_movi(tmp, state->offset_scratch);
+
+ if (state->offset_ram != state->offset_scratch)
+ jit_patch(to_end);
+
+ if (state->offset_ram || state->offset_scratch)
+ jit_addr(tmp2, tmp2, tmp);
+
+ lightrec_free_reg(reg_cache, tmp);
+ lightrec_free_reg(reg_cache, tmp3);
+
+ rt = lightrec_alloc_reg_in(reg_cache, _jit, op->i.rt);
+ jit_new_node_www(code, 0, tmp2, rt);
+
+ lightrec_free_reg(reg_cache, rt);
+ lightrec_free_reg(reg_cache, tmp2);
+}
+
+static void rec_store(const struct block *block, const struct opcode *op,
+ jit_code_t code)
+{
+ if (op->flags & LIGHTREC_NO_INVALIDATE) {
+ rec_store_direct_no_invalidate(block, op, code);
+ } else if (op->flags & LIGHTREC_DIRECT_IO) {
+ if (block->state->invalidate_from_dma_only)
+ rec_store_direct_no_invalidate(block, op, code);
+ else
+ rec_store_direct(block, op, code);
+ } else {
+ rec_io(block, op, true, false);
+ }
+}
+
+static void rec_SB(const struct block *block, const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_store(block, op, jit_code_stxi_c);
+}
+
+static void rec_SH(const struct block *block, const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_store(block, op, jit_code_stxi_s);
+}
+
+static void rec_SW(const struct block *block, const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_store(block, op, jit_code_stxi_i);
+}
+
+static void rec_SWL(const struct block *block, const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_io(block, op, true, false);
+}
+
+static void rec_SWR(const struct block *block, const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_io(block, op, true, false);
+}
+
+static void rec_SWC2(const struct block *block, const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_io(block, op, false, false);
+}
+
+static void rec_load_direct(const struct block *block, const struct opcode *op,
+ jit_code_t code)
+{
+ struct lightrec_state *state = block->state;
+ struct regcache *reg_cache = state->reg_cache;
+ jit_state_t *_jit = block->_jit;
+ jit_node_t *to_not_ram, *to_not_bios, *to_end, *to_end2;
+ u8 tmp, rs, rt, addr_reg;
+ s16 imm;
+
+ if (!op->i.rt)
+ return;
+
+ jit_note(__FILE__, __LINE__);
+ rs = lightrec_alloc_reg_in(reg_cache, _jit, op->i.rs);
+ rt = lightrec_alloc_reg_out_ext(reg_cache, _jit, op->i.rt);
+
+ if ((state->offset_ram == state->offset_bios &&
+ state->offset_ram == state->offset_scratch &&
+ state->mirrors_mapped) || !op->i.imm) {
+ addr_reg = rs;
+ imm = (s16)op->i.imm;
+ } else {
+ jit_addi(rt, rs, (s16)op->i.imm);
+ addr_reg = rt;
+ imm = 0;
+
+ if (op->i.rs != op->i.rt)
+ lightrec_free_reg(reg_cache, rs);
+ }
+
+ tmp = lightrec_alloc_reg_temp(reg_cache, _jit);
+
+ if (state->offset_ram == state->offset_bios &&
+ state->offset_ram == state->offset_scratch) {
+ if (!state->mirrors_mapped) {
+ jit_andi(tmp, addr_reg, BIT(28));
+ jit_rshi_u(tmp, tmp, 28 - 22);
+ jit_ori(tmp, tmp, 0x1f800000 | (RAM_SIZE - 1));
+ jit_andr(rt, addr_reg, tmp);
+ } else {
+ jit_andi(rt, addr_reg, 0x1fffffff);
+ }
+
+ if (state->offset_ram)
+ jit_movi(tmp, state->offset_ram);
+ } else {
+ to_not_ram = jit_bmsi(addr_reg, BIT(28));
+
+ /* Convert to KUNSEG and avoid RAM mirrors */
+ jit_andi(rt, addr_reg, RAM_SIZE - 1);
+
+ if (state->offset_ram)
+ jit_movi(tmp, state->offset_ram);
+
+ to_end = jit_jmpi();
+
+ jit_patch(to_not_ram);
+
+ if (state->offset_bios != state->offset_scratch)
+ to_not_bios = jit_bmci(addr_reg, BIT(22));
+
+ /* Convert to KUNSEG */
+ jit_andi(rt, addr_reg, 0x1fc00000 | (BIOS_SIZE - 1));
+
+ jit_movi(tmp, state->offset_bios);
+
+ if (state->offset_bios != state->offset_scratch) {
+ to_end2 = jit_jmpi();
+
+ jit_patch(to_not_bios);
+
+ /* Convert to KUNSEG */
+ jit_andi(rt, addr_reg, 0x1f800fff);
+
+ if (state->offset_scratch)
+ jit_movi(tmp, state->offset_scratch);
+
+ jit_patch(to_end2);
+ }
+
+ jit_patch(to_end);
+ }
+
+ if (state->offset_ram || state->offset_bios || state->offset_scratch)
+ jit_addr(rt, rt, tmp);
+
+ jit_new_node_www(code, rt, rt, imm);
+
+ lightrec_free_reg(reg_cache, addr_reg);
+ lightrec_free_reg(reg_cache, rt);
+ lightrec_free_reg(reg_cache, tmp);
+}
+
+static void rec_load(const struct block *block, const struct opcode *op,
+ jit_code_t code)
+{
+ if (op->flags & LIGHTREC_DIRECT_IO)
+ rec_load_direct(block, op, code);
+ else
+ rec_io(block, op, false, true);
+}
+
+static void rec_LB(const struct block *block, const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_load(block, op, jit_code_ldxi_c);
+}
+
+static void rec_LBU(const struct block *block, const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_load(block, op, jit_code_ldxi_uc);
+}
+
+static void rec_LH(const struct block *block, const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_load(block, op, jit_code_ldxi_s);
+}
+
+static void rec_LHU(const struct block *block, const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_load(block, op, jit_code_ldxi_us);
+}
+
+static void rec_LWL(const struct block *block, const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_io(block, op, true, true);
+}
+
+static void rec_LWR(const struct block *block, const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_io(block, op, true, true);
+}
+
+static void rec_LW(const struct block *block, const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_load(block, op, jit_code_ldxi_i);
+}
+
+static void rec_LWC2(const struct block *block, const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_io(block, op, false, false);
+}
+
+static void rec_break_syscall(const struct block *block,
+ const struct opcode *op, u32 pc, bool is_break)
+{
+ struct regcache *reg_cache = block->state->reg_cache;
+ jit_state_t *_jit = block->_jit;
+ u32 offset;
+ u8 tmp;
+
+ jit_note(__FILE__, __LINE__);
+
+ if (is_break)
+ offset = offsetof(struct lightrec_state, break_func);
+ else
+ offset = offsetof(struct lightrec_state, syscall_func);
+
+ tmp = lightrec_alloc_reg_temp(reg_cache, _jit);
+ jit_ldxi(tmp, LIGHTREC_REG_STATE, offset);
+ jit_callr(tmp);
+ lightrec_free_reg(reg_cache, tmp);
+
+ lightrec_regcache_mark_live(reg_cache, _jit);
+
+ /* TODO: the return address should be "pc - 4" if we're a delay slot */
+ lightrec_emit_end_of_block(block, op, pc, -1, pc, 31, 0, true);
+}
+
+static void rec_special_SYSCALL(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_break_syscall(block, op, pc, false);
+}
+
+static void rec_special_BREAK(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_break_syscall(block, op, pc, true);
+}
+
+static void rec_mfc(const struct block *block, const struct opcode *op)
+{
+ u8 tmp, tmp2;
+ struct lightrec_state *state = block->state;
+ struct regcache *reg_cache = state->reg_cache;
+ jit_state_t *_jit = block->_jit;
+
+ jit_note(__FILE__, __LINE__);
+
+ tmp = lightrec_alloc_reg(reg_cache, _jit, JIT_R0);
+ tmp2 = lightrec_alloc_reg_temp(reg_cache, _jit);
+
+ jit_ldxi(tmp2, LIGHTREC_REG_STATE,
+ offsetof(struct lightrec_state, mfc_func));
+
+ lightrec_clean_reg_if_loaded(reg_cache, _jit, op->i.rt, true);
+
+ jit_movi(tmp, op->opcode);
+ jit_callr(tmp2);
+ lightrec_free_reg(reg_cache, tmp);
+ lightrec_free_reg(reg_cache, tmp2);
+
+ lightrec_regcache_mark_live(reg_cache, _jit);
+}
+
+static void rec_mtc(const struct block *block, const struct opcode *op, u32 pc)
+{
+ struct lightrec_state *state = block->state;
+ struct regcache *reg_cache = state->reg_cache;
+ jit_state_t *_jit = block->_jit;
+ u8 tmp, tmp2;
+
+ jit_note(__FILE__, __LINE__);
+
+ tmp = lightrec_alloc_reg(reg_cache, _jit, JIT_R0);
+ tmp2 = lightrec_alloc_reg_temp(reg_cache, _jit);
+ jit_ldxi(tmp2, LIGHTREC_REG_STATE,
+ offsetof(struct lightrec_state, mtc_func));
+
+ lightrec_clean_reg_if_loaded(reg_cache, _jit, op->i.rs, false);
+ lightrec_clean_reg_if_loaded(reg_cache, _jit, op->i.rt, false);
+
+ jit_movi(tmp, op->opcode);
+ jit_callr(tmp2);
+ lightrec_free_reg(reg_cache, tmp);
+ lightrec_free_reg(reg_cache, tmp2);
+
+ lightrec_regcache_mark_live(reg_cache, _jit);
+
+ if (op->i.op == OP_CP0 && (op->r.rd == 12 || op->r.rd == 13))
+ lightrec_emit_end_of_block(block, op, pc, -1, pc + 4, 0, 0, true);
+}
+
+static void rec_cp0_MFC0(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_mfc(block, op);
+}
+
+static void rec_cp0_CFC0(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_mfc(block, op);
+}
+
+static void rec_cp0_MTC0(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_mtc(block, op, pc);
+}
+
+static void rec_cp0_CTC0(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_mtc(block, op, pc);
+}
+
+static void rec_cp2_basic_MFC2(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_mfc(block, op);
+}
+
+static void rec_cp2_basic_CFC2(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_mfc(block, op);
+}
+
+static void rec_cp2_basic_MTC2(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_mtc(block, op, pc);
+}
+
+static void rec_cp2_basic_CTC2(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_mtc(block, op, pc);
+}
+
+static void rec_cp0_RFE(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ struct lightrec_state *state = block->state;
+ jit_state_t *_jit = block->_jit;
+ u8 tmp;
+
+ jit_name(__func__);
+ jit_note(__FILE__, __LINE__);
+
+ tmp = lightrec_alloc_reg_temp(state->reg_cache, _jit);
+ jit_ldxi(tmp, LIGHTREC_REG_STATE,
+ offsetof(struct lightrec_state, rfe_func));
+ jit_callr(tmp);
+ lightrec_free_reg(state->reg_cache, tmp);
+
+ lightrec_regcache_mark_live(state->reg_cache, _jit);
+}
+
+static void rec_CP(const struct block *block, const struct opcode *op, u32 pc)
+{
+ struct regcache *reg_cache = block->state->reg_cache;
+ jit_state_t *_jit = block->_jit;
+ u8 tmp, tmp2;
+
+ jit_name(__func__);
+ jit_note(__FILE__, __LINE__);
+
+ tmp = lightrec_alloc_reg(reg_cache, _jit, JIT_R0);
+ tmp2 = lightrec_alloc_reg_temp(reg_cache, _jit);
+
+ jit_ldxi(tmp2, LIGHTREC_REG_STATE,
+ offsetof(struct lightrec_state, cp_func));
+
+ jit_movi(tmp, op->opcode);
+ jit_callr(tmp2);
+ lightrec_free_reg(reg_cache, tmp);
+ lightrec_free_reg(reg_cache, tmp2);
+
+ lightrec_regcache_mark_live(reg_cache, _jit);
+}
+
+static void rec_meta_unload(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ struct lightrec_state *state = block->state;
+ struct regcache *reg_cache = state->reg_cache;
+ jit_state_t *_jit = block->_jit;
+
+ jit_name(__func__);
+ jit_note(__FILE__, __LINE__);
+
+ pr_debug("Unloading reg %s\n", lightrec_reg_name(op->i.rs));
+ lightrec_clean_reg_if_loaded(reg_cache, _jit, op->i.rs, true);
+}
+
+static void rec_meta_BEQZ(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_b(block, op, pc, jit_code_bnei, 0, false, true);
+}
+
+static void rec_meta_BNEZ(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ _jit_name(block->_jit, __func__);
+ rec_b(block, op, pc, jit_code_beqi, 0, false, true);
+}
+
+static void rec_meta_MOV(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ struct lightrec_state *state = block->state;
+ struct regcache *reg_cache = state->reg_cache;
+ jit_state_t *_jit = block->_jit;
+ u8 rs, rd;
+
+ _jit_name(block->_jit, __func__);
+ jit_note(__FILE__, __LINE__);
+ rs = op->r.rs ? lightrec_alloc_reg_in(reg_cache, _jit, op->r.rs) : 0;
+ rd = lightrec_alloc_reg_out_ext(reg_cache, _jit, op->r.rd);
+
+ if (op->r.rs == 0) {
+ jit_movi(rd, 0);
+ } else {
+#if __WORDSIZE == 32
+ jit_movr(rd, rs);
+#else
+ jit_extr_i(rd, rs);
+#endif
+ }
+
+ lightrec_free_reg(state->reg_cache, rs);
+ lightrec_free_reg(state->reg_cache, rd);
+}
+
+static void rec_meta_sync(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ struct lightrec_state *state = block->state;
+ struct lightrec_branch_target *target;
+ jit_state_t *_jit = block->_jit;
+
+ jit_name(__func__);
+ jit_note(__FILE__, __LINE__);
+
+ jit_subi(LIGHTREC_REG_CYCLE, LIGHTREC_REG_CYCLE, state->cycles);
+ state->cycles = 0;
+
+ lightrec_storeback_regs(state->reg_cache, _jit);
+ lightrec_regcache_reset(state->reg_cache);
+
+ pr_debug("Adding branch target at offset 0x%x\n",
+ op->offset << 2);
+ target = &state->targets[state->nb_targets++];
+ target->offset = op->offset;
+ target->label = jit_label();
+}
+
+static const lightrec_rec_func_t rec_standard[64] = {
+ [OP_SPECIAL] = rec_SPECIAL,
+ [OP_REGIMM] = rec_REGIMM,
+ [OP_J] = rec_J,
+ [OP_JAL] = rec_JAL,
+ [OP_BEQ] = rec_BEQ,
+ [OP_BNE] = rec_BNE,
+ [OP_BLEZ] = rec_BLEZ,
+ [OP_BGTZ] = rec_BGTZ,
+ [OP_ADDI] = rec_ADDI,
+ [OP_ADDIU] = rec_ADDIU,
+ [OP_SLTI] = rec_SLTI,
+ [OP_SLTIU] = rec_SLTIU,
+ [OP_ANDI] = rec_ANDI,
+ [OP_ORI] = rec_ORI,
+ [OP_XORI] = rec_XORI,
+ [OP_LUI] = rec_LUI,
+ [OP_CP0] = rec_CP0,
+ [OP_CP2] = rec_CP2,
+ [OP_LB] = rec_LB,
+ [OP_LH] = rec_LH,
+ [OP_LWL] = rec_LWL,
+ [OP_LW] = rec_LW,
+ [OP_LBU] = rec_LBU,
+ [OP_LHU] = rec_LHU,
+ [OP_LWR] = rec_LWR,
+ [OP_SB] = rec_SB,
+ [OP_SH] = rec_SH,
+ [OP_SWL] = rec_SWL,
+ [OP_SW] = rec_SW,
+ [OP_SWR] = rec_SWR,
+ [OP_LWC2] = rec_LWC2,
+ [OP_SWC2] = rec_SWC2,
+
+ [OP_META_REG_UNLOAD] = rec_meta_unload,
+ [OP_META_BEQZ] = rec_meta_BEQZ,
+ [OP_META_BNEZ] = rec_meta_BNEZ,
+ [OP_META_MOV] = rec_meta_MOV,
+ [OP_META_SYNC] = rec_meta_sync,
+};
+
+static const lightrec_rec_func_t rec_special[64] = {
+ [OP_SPECIAL_SLL] = rec_special_SLL,
+ [OP_SPECIAL_SRL] = rec_special_SRL,
+ [OP_SPECIAL_SRA] = rec_special_SRA,
+ [OP_SPECIAL_SLLV] = rec_special_SLLV,
+ [OP_SPECIAL_SRLV] = rec_special_SRLV,
+ [OP_SPECIAL_SRAV] = rec_special_SRAV,
+ [OP_SPECIAL_JR] = rec_special_JR,
+ [OP_SPECIAL_JALR] = rec_special_JALR,
+ [OP_SPECIAL_SYSCALL] = rec_special_SYSCALL,
+ [OP_SPECIAL_BREAK] = rec_special_BREAK,
+ [OP_SPECIAL_MFHI] = rec_special_MFHI,
+ [OP_SPECIAL_MTHI] = rec_special_MTHI,
+ [OP_SPECIAL_MFLO] = rec_special_MFLO,
+ [OP_SPECIAL_MTLO] = rec_special_MTLO,
+ [OP_SPECIAL_MULT] = rec_special_MULT,
+ [OP_SPECIAL_MULTU] = rec_special_MULTU,
+ [OP_SPECIAL_DIV] = rec_special_DIV,
+ [OP_SPECIAL_DIVU] = rec_special_DIVU,
+ [OP_SPECIAL_ADD] = rec_special_ADD,
+ [OP_SPECIAL_ADDU] = rec_special_ADDU,
+ [OP_SPECIAL_SUB] = rec_special_SUB,
+ [OP_SPECIAL_SUBU] = rec_special_SUBU,
+ [OP_SPECIAL_AND] = rec_special_AND,
+ [OP_SPECIAL_OR] = rec_special_OR,
+ [OP_SPECIAL_XOR] = rec_special_XOR,
+ [OP_SPECIAL_NOR] = rec_special_NOR,
+ [OP_SPECIAL_SLT] = rec_special_SLT,
+ [OP_SPECIAL_SLTU] = rec_special_SLTU,
+};
+
+static const lightrec_rec_func_t rec_regimm[64] = {
+ [OP_REGIMM_BLTZ] = rec_regimm_BLTZ,
+ [OP_REGIMM_BGEZ] = rec_regimm_BGEZ,
+ [OP_REGIMM_BLTZAL] = rec_regimm_BLTZAL,
+ [OP_REGIMM_BGEZAL] = rec_regimm_BGEZAL,
+};
+
+static const lightrec_rec_func_t rec_cp0[64] = {
+ [OP_CP0_MFC0] = rec_cp0_MFC0,
+ [OP_CP0_CFC0] = rec_cp0_CFC0,
+ [OP_CP0_MTC0] = rec_cp0_MTC0,
+ [OP_CP0_CTC0] = rec_cp0_CTC0,
+ [OP_CP0_RFE] = rec_cp0_RFE,
+};
+
+static const lightrec_rec_func_t rec_cp2_basic[64] = {
+ [OP_CP2_BASIC_MFC2] = rec_cp2_basic_MFC2,
+ [OP_CP2_BASIC_CFC2] = rec_cp2_basic_CFC2,
+ [OP_CP2_BASIC_MTC2] = rec_cp2_basic_MTC2,
+ [OP_CP2_BASIC_CTC2] = rec_cp2_basic_CTC2,
+};
+
+static void rec_SPECIAL(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ lightrec_rec_func_t f = rec_special[op->r.op];
+ if (likely(f))
+ (*f)(block, op, pc);
+ else
+ unknown_opcode(block, op, pc);
+}
+
+static void rec_REGIMM(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ lightrec_rec_func_t f = rec_regimm[op->r.rt];
+ if (likely(f))
+ (*f)(block, op, pc);
+ else
+ unknown_opcode(block, op, pc);
+}
+
+static void rec_CP0(const struct block *block, const struct opcode *op, u32 pc)
+{
+ lightrec_rec_func_t f = rec_cp0[op->r.rs];
+ if (likely(f))
+ (*f)(block, op, pc);
+ else
+ rec_CP(block, op, pc);
+}
+
+static void rec_CP2(const struct block *block, const struct opcode *op, u32 pc)
+{
+ if (op->r.op == OP_CP2_BASIC) {
+ lightrec_rec_func_t f = rec_cp2_basic[op->r.rs];
+ if (likely(f)) {
+ (*f)(block, op, pc);
+ return;
+ }
+ }
+
+ rec_CP(block, op, pc);
+}
+
+void lightrec_rec_opcode(const struct block *block,
+ const struct opcode *op, u32 pc)
+{
+ lightrec_rec_func_t f = rec_standard[op->i.op];
+ if (likely(f))
+ (*f)(block, op, pc);
+ else
+ unknown_opcode(block, op, pc);
+}