parallel-rsp/debug_rsp.cpp

1434 lines
44 KiB
C++
Raw Permalink Normal View History

#include "debug_rsp.hpp"
2020-02-01 00:42:56 +00:00
#include "rsp_disasm.hpp"
2020-01-29 13:58:56 +00:00
#include <utility>
using namespace std;
2020-02-01 11:27:00 +00:00
#define TRACE
2020-01-29 20:39:26 +00:00
extern "C"
2020-01-29 13:58:56 +00:00
{
2020-01-29 20:39:26 +00:00
#ifdef INTENSE_DEBUG
static uint64_t hash_imem(const uint8_t *data, size_t size)
{
uint64_t h = 0xcbf29ce484222325ull;
size_t i;
for (i = 0; i < size; i++)
h = (h * 0x100000001b3ull) ^ data[i];
if (h == BREAKVAL)
breakme();
return h;
}
void RSP_DEBUG(RSP::CPUState *rsp, const char *tag, unsigned pc, unsigned value)
{
uint64_t hash = hash_imem((const uint8_t *)rsp->cp2.regs, sizeof(rsp->cp2.regs));
fprintf(DUMP_FILE, "%s (PC: %u): %u, %llu\n", tag, pc, value, hash);
2020-01-29 20:39:26 +00:00
if (value)
fprintf(DUMP_FILE, " DMEM HASH: 0x%016llx\n", hash_imem((const uint8_t *)rsp->dmem, 0x1000));
2020-01-29 20:39:26 +00:00
}
2020-01-29 13:58:56 +00:00
#endif
}
namespace RSP
{
CPU::CPU()
#ifndef DEBUG_JIT
: jit_engine(symbol_table)
#endif
{
2020-01-29 20:39:26 +00:00
init_symbol_table();
2020-01-29 13:58:56 +00:00
}
CPU::~CPU()
2020-01-29 20:39:26 +00:00
{
}
2020-01-29 13:58:56 +00:00
void CPU::init_symbol_table()
{
#define S(sym) symbol_table["RSP_" #sym] = reinterpret_cast<uint64_t>(RSP_##sym)
2020-01-29 20:39:26 +00:00
S(EXIT);
S(CALL);
S(RETURN);
2020-02-01 00:42:56 +00:00
S(REPORT_PC);
2020-01-29 13:58:56 +00:00
#ifdef INTENSE_DEBUG
2020-01-29 20:39:26 +00:00
S(DEBUG);
2020-01-29 13:58:56 +00:00
#endif
2020-01-29 20:39:26 +00:00
S(MFC0);
S(MTC0);
S(MTC2);
S(MFC2);
S(CFC2);
S(CTC2);
S(LBV);
S(LSV);
S(LLV);
S(LDV);
S(LQV);
S(LRV);
S(LPV);
S(LUV);
S(LHV);
S(LTV);
S(SBV);
S(SSV);
S(SLV);
S(SDV);
S(SQV);
S(SRV);
S(SPV);
S(SUV);
S(SHV);
S(SFV);
S(STV);
S(VMULF);
S(VMULU);
S(VMUDL);
S(VMUDM);
S(VMUDN);
S(VMUDH);
S(VMACF);
S(VMACU);
//S(VMACQ);
S(VMADL);
S(VMADM);
S(VMADN);
S(VMADH);
S(VADD);
S(VSUB);
S(VABS);
S(VADDC);
S(VSUBC);
S(VSAR);
S(VLT);
S(VEQ);
S(VNE);
S(VGE);
S(VCL);
S(VCH);
S(VCR);
S(VMRG);
S(VAND);
S(VNAND);
S(VOR);
S(VNOR);
S(VXOR);
S(VNXOR);
S(VRCP);
S(VRCPL);
S(VRCPH);
S(VMOV);
S(VRSQ);
S(VRSQL);
S(VRSQH);
S(VNOP);
2020-01-29 13:58:56 +00:00
#undef S
}
void CPU::invalidate_imem()
{
2020-01-29 20:39:26 +00:00
for (unsigned i = 0; i < CODE_BLOCKS; i++)
if (memcmp(cached_imem + i * CODE_BLOCK_WORDS, state.imem + i * CODE_BLOCK_WORDS, CODE_BLOCK_SIZE))
state.dirty_blocks |= (0x3 << i) >> 1;
2020-01-29 13:58:56 +00:00
}
void CPU::invalidate_code()
{
2020-01-29 20:39:26 +00:00
if (!state.dirty_blocks)
return;
for (unsigned i = 0; i < CODE_BLOCKS; i++)
{
if (state.dirty_blocks & (1 << i))
{
memset(blocks + i * CODE_BLOCK_WORDS, 0, CODE_BLOCK_WORDS * sizeof(blocks[0]));
memcpy(cached_imem + i * CODE_BLOCK_WORDS, state.imem + i * CODE_BLOCK_WORDS, CODE_BLOCK_SIZE);
}
}
state.dirty_blocks = 0;
2020-01-29 13:58:56 +00:00
}
// Need super-fast hash here.
uint64_t CPU::hash_imem(unsigned pc, unsigned count) const
{
2020-01-29 20:39:26 +00:00
size_t size = count;
// FNV-1.
const auto *data = state.imem + pc;
uint64_t h = 0xcbf29ce484222325ull;
h = (h * 0x100000001b3ull) ^ pc;
h = (h * 0x100000001b3ull) ^ count;
for (size_t i = 0; i < size; i++)
h = (h * 0x100000001b3ull) ^ data[i];
return h;
2020-01-29 13:58:56 +00:00
}
unsigned CPU::analyze_static_end(unsigned pc, unsigned end)
{
2020-01-29 20:39:26 +00:00
// Scans through IMEM and finds the logical "end" of the instruction stream.
unsigned max_static_pc = pc;
unsigned count = end - pc;
for (unsigned i = 0; i < count; i++)
{
uint32_t instr = state.imem[pc + i];
uint32_t type = instr >> 26;
uint32_t target;
bool forward_goto;
if (pc + i + 1 >= max_static_pc)
{
forward_goto = false;
max_static_pc = pc + i + 1;
}
else
forward_goto = true;
// VU
if ((instr >> 25) == 0x25)
continue;
switch (type)
{
case 000:
switch (instr & 63)
{
case 010:
// JR always terminates either by returning or exiting.
// We execute the next instruction via delay slot and exit.
// Unless we can branch past the JR
// (max_static_pc will be higher than expected),
// this will be the static end.
if (!forward_goto)
{
max_static_pc = max(pc + i + 2, max_static_pc);
goto end;
}
break;
case 015:
// BREAK always terminates.
if (!forward_goto)
goto end;
break;
default:
break;
}
break;
case 001: // REGIMM
switch ((instr >> 16) & 31)
{
case 000: // BLTZ
case 001: // BGEZ
case 021: // BGEZAL
case 020: // BLTZAL
target = (pc + i + 1 + instr) & 0x3ff;
if (target >= pc && target < end) // goto
max_static_pc = max(max_static_pc, target + 1);
break;
default:
break;
}
break;
case 002:
// J is resolved by goto.
target = instr & 0x3ff;
if (target >= pc && target < end) // goto
{
// J is a static jump, so if we aren't branching
// past this instruction and we're branching backwards,
// we can end the block here.
if (!forward_goto && target < end)
{
max_static_pc = max(pc + i + 2, max_static_pc);
goto end;
}
else
max_static_pc = max(max_static_pc, target + 1);
}
else if (!forward_goto)
{
// If we have static branch outside our block,
// we terminate the block.
max_static_pc = max(pc + i + 2, max_static_pc);
goto end;
}
break;
case 004: // BEQ
case 005: // BNE
case 006: // BLEZ
case 007: // BGTZ
target = (pc + i + 1 + instr) & 0x3ff;
if (target >= pc && target < end) // goto
max_static_pc = max(max_static_pc, target + 1);
break;
default:
break;
}
}
2020-01-29 13:58:56 +00:00
end:
2020-01-29 20:39:26 +00:00
unsigned ret = min(max_static_pc, end);
return ret;
2020-01-29 13:58:56 +00:00
}
Func CPU::jit_region(uint64_t hash, unsigned pc, unsigned count)
{
2020-01-29 20:39:26 +00:00
full_code.clear();
body.clear();
full_code.reserve(16 * 1024);
body.reserve(16 * 1024);
// Local branch delays resolve to within the block, so we can use goto.
bool pending_local_branch_delay = false;
bool pending_branch_delay = false;
bool pending_call = false;
bool pending_indirect_call = false;
bool pending_return = false;
bool pipe_pending_local_branch_delay = false;
bool pipe_pending_branch_delay = false;
bool pipe_pending_call = false;
bool pipe_pending_indirect_call = false;
bool pipe_pending_return = false;
uint32_t branch_delay = 0;
uint32_t pipe_branch_delay = 0;
char buf[256];
#define APPEND(...) \
do \
{ \
sprintf(buf, __VA_ARGS__); \
body += buf; \
} while (0)
#define APPEND_RD_NOT_R0(...) \
if (rd != 0) \
do \
{ \
APPEND(__VA_ARGS__); \
} while (0)
#define APPEND_RT_NOT_R0(...) \
if (rt != 0) \
do \
{ \
APPEND(__VA_ARGS__); \
} while (0)
#define DISASM(...) \
do \
{ \
APPEND("// "); \
APPEND(__VA_ARGS__); \
} while (0)
#define PIPELINE_BRANCH() \
do \
{ \
pending_local_branch_delay = pipe_pending_local_branch_delay; \
pending_branch_delay = pipe_pending_branch_delay; \
pending_call = pipe_pending_call; \
pending_indirect_call = pipe_pending_indirect_call; \
pending_return = pipe_pending_return; \
branch_delay = pipe_branch_delay; \
pipe_pending_local_branch_delay = false; \
pipe_pending_branch_delay = false; \
pipe_pending_call = false; \
pipe_pending_indirect_call = false; \
pipe_pending_return = false; \
pipe_branch_delay = 0; \
APPEND("ADVANCE_DELAY_SLOT();\n"); \
} while (0)
#define PROMOTE_LOCAL_DELAY_SLOT() \
do \
{ \
APPEND("if (pipe_branch) {\n"); \
APPEND(" STATE->has_delay_slot = 1;\n"); \
APPEND(" STATE->branch_target = %u;\n", pipe_branch_delay * 4); \
APPEND("}\n"); \
} while (0)
#define PROMOTE_DELAY_SLOT() \
do \
{ \
if (pipe_pending_local_branch_delay) \
PROMOTE_LOCAL_DELAY_SLOT(); \
else if (pipe_pending_branch_delay) \
{ \
APPEND(" PROMOTE_DELAY_SLOT();\n"); \
} \
} while (0)
// Statically checks if we need to handle branch delay slots.
// Only relevant if the last instruction did anything branch related.
// Double branch delays are technically undefined, but I assume it works like this.
#define CHECK_BRANCH_DELAY() \
do \
{ \
if (pending_call && !pipe_pending_local_branch_delay && !pipe_pending_branch_delay) \
{ \
APPEND("if (LIKELY(branch)) {\n"); \
APPEND(" RSP_CALL(opaque, 0x%03x, 0x%03x);\n", branch_delay * 4, ((pc + i + 1) << 2) & (IMEM_SIZE - 1)); \
APPEND("}\n"); \
} \
else if (pending_indirect_call && !pipe_pending_local_branch_delay && !pipe_pending_branch_delay) \
{ \
APPEND("if (LIKELY(branch)) {\n"); \
APPEND(" RSP_CALL(opaque, (branch_delay << 2) & %u, 0x%03x);\n", IMEM_SIZE - 1, \
((pc + i + 1) << 2) & (IMEM_SIZE - 1)); \
APPEND("}\n"); \
} \
else if (pending_return && !pipe_pending_local_branch_delay && !pipe_pending_branch_delay) \
{ \
APPEND("if (LIKELY(branch)) {\n"); \
APPEND(" if (RSP_RETURN(opaque, (branch_delay << 2) & %u)) return;\n", IMEM_SIZE - 1); \
APPEND(" STATE->pc = (branch_delay << 2) & %u;\n", IMEM_SIZE - 1); \
APPEND(" EXIT(MODE_CONTINUE);\n"); \
APPEND("}\n"); \
} \
else if (pending_local_branch_delay) \
{ \
if (pipe_pending_local_branch_delay || pipe_pending_branch_delay) \
{ \
APPEND("if (branch && pipe_branch) {\n"); \
APPEND(" STATE->pc = %u;\n", branch_delay * 4); \
APPEND(" PROMOTE_DELAY_SLOT();\n"); \
APPEND(" EXIT(MODE_CONTINUE);\n"); \
APPEND("} else if (branch) {\n"); \
APPEND(" goto pc_%03x;\n", branch_delay * 4); \
APPEND("}\n"); \
} \
else \
{ \
APPEND("if (branch) goto pc_%03x;\n", branch_delay * 4); \
} \
} \
else if (pending_branch_delay) \
{ \
APPEND("if (branch) {\n"); \
APPEND(" STATE->pc = (branch_delay << 2) & %u;\n", IMEM_SIZE - 1); \
PROMOTE_DELAY_SLOT(); \
APPEND(" EXIT(MODE_CONTINUE);\n"); \
APPEND("}\n"); \
} \
pending_call = false; \
pending_indirect_call = false; \
pending_return = false; \
pending_branch_delay = false; \
pending_local_branch_delay = false; \
} while (0)
#define CHECK_INHERIT_BRANCH_DELAY() \
do \
{ \
APPEND("if (UNLIKELY(STATE->has_delay_slot)) {\n"); \
APPEND(" STATE->pc = STATE->branch_target;\n"); \
APPEND(" STATE->has_delay_slot = 0;\n"); \
PROMOTE_DELAY_SLOT(); \
APPEND(" EXIT(MODE_CONTINUE);\n"); \
APPEND("}\n"); \
} while (0)
#define EXIT_WITH_DELAY(mode) \
do \
{ \
if (pending_local_branch_delay) \
{ \
APPEND("STATE->pc = branch ? %u : %u;\n", branch_delay * 4, ((pc + i + 1) << 2) & (IMEM_SIZE - 1)); \
APPEND("EXIT(%s);\n", #mode); \
} \
else if (pending_branch_delay) \
{ \
APPEND("STATE->pc = branch ? ((branch_delay << 2) & %u) : %u;\n", IMEM_SIZE - 1, \
((pc + i + 1) << 2) & (IMEM_SIZE - 1)); \
APPEND("EXIT(%s);\n", #mode); \
} \
else \
{ \
APPEND("if (UNLIKELY(STATE->has_delay_slot)) {\n"); \
APPEND(" STATE->pc = STATE->branch_target;\n"); \
APPEND(" STATE->has_delay_slot = 0;\n"); \
APPEND(" EXIT(%s);\n", #mode); \
APPEND("} else {\n"); \
APPEND(" STATE->pc = %u;\n", ((pc + i + 1) << 2) & (IMEM_SIZE - 1)); \
APPEND(" EXIT(%s);\n", #mode); \
APPEND("}\n"); \
} \
} while (0)
auto set_pc = [&](uint32_t next_pc) {
next_pc &= (IMEM_SIZE >> 2) - 1;
if (next_pc >= pc && next_pc < (pc + count))
{
pipe_pending_local_branch_delay = true;
pipe_branch_delay = next_pc;
}
else
{
pipe_pending_branch_delay = true;
pipe_branch_delay = next_pc;
APPEND("pipe_branch_delay = %u;\n", next_pc);
}
};
auto set_pc_indirect = [&](uint32_t reg) {
pipe_pending_branch_delay = true;
APPEND("BRANCH_INDIRECT((r%u & 0xfff) >> 2);\n", reg);
};
APPEND("unsigned branch = 0;\n");
APPEND("unsigned branch_delay = 0;\n");
APPEND("unsigned pipe_branch = 0;\n");
APPEND("unsigned pipe_branch_delay = 0;\n");
APPEND("unsigned cp0_result;\n");
APPEND("unsigned addr;\n");
APPEND("unsigned *dmem = STATE->dmem;\n");
for (unsigned i = 0; i < count; i++)
{
2020-02-01 00:42:56 +00:00
uint32_t instr = state.imem[pc + i];
2020-01-29 20:39:26 +00:00
APPEND("pc_%03x:\n", (pc + i) * 4);
2020-02-01 11:27:00 +00:00
#ifdef TRACE
2020-02-01 00:42:56 +00:00
APPEND("RSP_REPORT_PC(STATE, %u, %u);\n", (pc + i) * 4, instr);
2020-02-01 01:17:07 +00:00
#endif
2020-01-29 20:39:26 +00:00
PIPELINE_BRANCH();
uint32_t type = instr >> 26;
uint32_t rd, rs, rt, shift, imm;
int16_t simm;
if ((instr >> 25) == 0x25)
{
// VU instruction.
uint32_t op = instr & 63;
uint32_t vd = (instr >> 6) & 31;
uint32_t vs = (instr >> 11) & 31;
uint32_t vt = (instr >> 16) & 31;
uint32_t e = (instr >> 21) & 15;
static const char *ops[64] = {
"VMULF", "VMULU", nullptr, nullptr, "VMUDL", "VMUDM", "VMUDN", "VMUDH", "VMACF", "VMACU", nullptr,
nullptr, "VMADL", "VMADM", "VMADN", "VMADH", "VADD", "VSUB", nullptr, "VABS", "VADDC", "VSUBC",
nullptr, nullptr, nullptr, nullptr, nullptr, nullptr, nullptr, "VSAR", nullptr, nullptr, "VLT",
"VEQ", "VNE", "VGE", "VCL", "VCH", "VCR", "VMRG", "VAND", "VNAND", "VOR", "VNOR",
"VXOR", "VNXOR", nullptr, nullptr, "VRCP", "VRCPL", "VRCPH", "VMOV", "VRSQ", "VRSQL", "VRSQH",
"VNOP", nullptr, nullptr, nullptr, nullptr, nullptr, nullptr, nullptr, nullptr,
};
auto vop = ops[op];
if (vop)
{
APPEND("RSP_%s(STATE, %u, %u, %u, %u);\n", vop, vd, vs, vt, e);
DISASM("%s v%u, v%u, v%u[%u]\n", vop, vd, vs, vt, e);
}
else
{
APPEND("RSP_RESERVED(STATE, %u, %u, %u, %u);\n", vd, vs, vt, e);
DISASM("RSP_RESERVED v%u, v%u, v%u[%u]\n", vd, vs, vt, e);
//fprintf(DUMP_FILE, "Unimplemented COP2 op %u.\n", op);
2020-01-29 20:39:26 +00:00
}
2020-01-29 13:58:56 +00:00
#ifdef INTENSE_DEBUG
2020-01-29 20:39:26 +00:00
APPEND("RSP_DEBUG(STATE, \"CP2\", %u, 0);\n", op);
2020-01-29 13:58:56 +00:00
#endif
2020-01-29 20:39:26 +00:00
}
else
{
// Everything else.
switch (type)
{
case 000:
{
rd = (instr & 0xffff) >> 11;
rt = (instr >> 16) & 31;
shift = (instr >> 6) & 31;
rs = instr >> 21;
switch (instr & 63)
{
case 000: // SLL
APPEND_RD_NOT_R0("r%u = r%u << %u;\n", rd, rt, shift);
if (instr)
2020-02-01 00:42:56 +00:00
DISASM("sll %s, %s, %u\n", register_name(rd), register_name(rt), shift);
2020-01-29 20:39:26 +00:00
else
DISASM("nop\n");
break;
case 002: // SRL
APPEND_RD_NOT_R0("r%u = r%u >> %u;\n", rd, rt, shift);
2020-02-01 00:42:56 +00:00
DISASM("srl %s, %s, %u\n", register_name(rd), register_name(rt), shift);
2020-01-29 20:39:26 +00:00
break;
case 003: // SRA
APPEND_RD_NOT_R0("r%u = (int)r%u >> (int)%u;\n", rd, rt, shift);
2020-02-01 00:42:56 +00:00
DISASM("sra %s, %s, %u\n", register_name(rd), register_name(rt), shift);
2020-01-29 20:39:26 +00:00
break;
case 004: // SLLV
APPEND_RD_NOT_R0("r%u = r%u << MASK_SA(r%u);\n", rd, rt, rs);
2020-02-01 00:42:56 +00:00
DISASM("sllv %s, %s, $%u\n", register_name(rd), register_name(rt), rs);
2020-01-29 20:39:26 +00:00
break;
case 006: // SRLV
APPEND_RD_NOT_R0("r%u = r%u >> MASK_SA(r%u);\n", rd, rt, rs);
2020-02-01 00:42:56 +00:00
DISASM("srlv %s, %s, $%u\n", register_name(rd), register_name(rt), rs);
2020-01-29 20:39:26 +00:00
break;
case 007: // SRAV
APPEND_RD_NOT_R0("r%u = (int)r%u >> (int)MASK_SA(r%u);\n", rd, rt, rs);
2020-02-01 00:42:56 +00:00
DISASM("srav %s, %s, $%u\n", register_name(rd), register_name(rt), rs);
2020-01-29 20:39:26 +00:00
break;
case 011: // JALR
if (rd != 0)
{
APPEND("r%u = %u;\n", rd, ((pc + i + 2) << 2) & 0xffc);
}
set_pc_indirect(rs);
pipe_pending_indirect_call = true;
2020-02-01 00:42:56 +00:00
DISASM("jalr %s\n", register_name(rs));
2020-01-29 13:58:56 +00:00
#ifdef INTENSE_DEBUG
2020-01-29 20:39:26 +00:00
APPEND("RSP_DEBUG(STATE, \"JALR\", pipe_branch_delay * 4, 0);\n");
2020-01-29 13:58:56 +00:00
#endif
2020-01-29 20:39:26 +00:00
break;
case 010: // JR
set_pc_indirect(rs);
pipe_pending_return = true;
2020-02-01 00:42:56 +00:00
DISASM("jr %s\n", register_name(rs));
2020-01-29 13:58:56 +00:00
#ifdef INTENSE_DEBUG
2020-01-29 20:39:26 +00:00
APPEND("RSP_DEBUG(STATE, \"JR\", pipe_branch_delay * 4, 0);\n");
2020-01-29 13:58:56 +00:00
#endif
2020-01-29 20:39:26 +00:00
break;
case 015: // BREAK
EXIT_WITH_DELAY(MODE_BREAK);
break;
case 040: // ADD
case 041: // ADDU
APPEND_RD_NOT_R0("r%u = r%u + r%u;\n", rd, rs, rt);
2020-02-01 00:42:56 +00:00
DISASM("add %s, %s, %s\n", register_name(rd), register_name(rs), register_name(rt));
2020-01-29 20:39:26 +00:00
break;
case 042: // SUB
case 043: // SUBU
APPEND_RD_NOT_R0("r%u = r%u - r%u;\n", rd, rs, rt);
2020-02-01 00:42:56 +00:00
DISASM("sub %s, %s, %s\n", register_name(rd), register_name(rs), register_name(rt));
2020-01-29 20:39:26 +00:00
break;
case 044: // AND
APPEND_RD_NOT_R0("r%u = r%u & r%u;\n", rd, rs, rt);
2020-02-01 00:42:56 +00:00
DISASM("and %s, %s, %s\n", register_name(rd), register_name(rs), register_name(rt));
2020-01-29 20:39:26 +00:00
break;
case 045: // OR
APPEND_RD_NOT_R0("r%u = r%u | r%u;\n", rd, rs, rt);
2020-02-01 00:42:56 +00:00
DISASM("or %s, %s, %s\n", register_name(rd), register_name(rs), register_name(rt));
2020-01-29 20:39:26 +00:00
break;
case 046: // XOR
APPEND_RD_NOT_R0("r%u = r%u ^ r%u;\n", rd, rs, rt);
2020-02-01 00:42:56 +00:00
DISASM("xor %s, %s, %s\n", register_name(rd), register_name(rs), register_name(rt));
2020-01-29 20:39:26 +00:00
break;
case 047: // NOR
APPEND_RD_NOT_R0("r%u = ~(r%u | r%u);\n", rd, rs, rt);
2020-02-01 00:42:56 +00:00
DISASM("nor %s, %s, %s\n", register_name(rd), register_name(rs), register_name(rt));
2020-01-29 20:39:26 +00:00
break;
case 052: // SLT
APPEND_RD_NOT_R0("r%u = (int)r%u < (int)r%u;\n", rd, rs, rt);
2020-02-01 00:42:56 +00:00
DISASM("slt %s, %s, %s\n", register_name(rd), register_name(rs), register_name(rt));
2020-01-29 20:39:26 +00:00
break;
case 053: // SLTU
APPEND_RD_NOT_R0("r%u = r%u < r%u;\n", rd, rs, rt);
2020-02-01 00:42:56 +00:00
DISASM("sltu %s, %s, %s\n", register_name(rd), register_name(rs), register_name(rt));
2020-01-29 20:39:26 +00:00
break;
default:
break;
}
break;
}
case 001: // REGIMM
rs = (instr >> 21) & 31;
rt = (instr >> 16) & 31;
switch (rt)
{
case 020: // BLTZAL
APPEND("r31 = %u;\n", ((pc + i + 2) << 2) & 0xffc);
rs = (instr >> 21) & 31;
set_pc(pc + i + 1 + instr);
APPEND("BRANCH_IF((int)r%u < 0);\n", rs);
2020-02-01 00:42:56 +00:00
DISASM("bltzal %s, 0x%x\n", register_name(rs), ((pc + i + 1 + instr) << 2) & 0xffc);
2020-01-29 20:39:26 +00:00
break;
case 000: // BLTZ
rs = (instr >> 21) & 31;
set_pc(pc + i + 1 + instr);
APPEND("BRANCH_IF((int)r%u < 0);\n", rs);
2020-02-01 00:42:56 +00:00
DISASM("bltz %s, 0x%x\n", register_name(rs), ((pc + i + 1 + instr) << 2) & 0xffc);
2020-01-29 20:39:26 +00:00
break;
case 021: // BGEZAL
APPEND("r31 = %u;\n", ((pc + i + 2) << 2) & 0xffc);
rs = (instr >> 21) & 31;
set_pc(pc + i + 1 + instr);
APPEND("BRANCH_IF((int)r%u >= 0);\n", rs);
2020-02-01 00:42:56 +00:00
DISASM("bgezal %s, 0x%x\n", register_name(rs), ((pc + i + 1 + instr) << 2) & 0xffc);
2020-01-29 20:39:26 +00:00
break;
case 001: // BGEZ
rs = (instr >> 21) & 31;
set_pc(pc + i + 1 + instr);
APPEND("BRANCH_IF((int)r%u >= 0);\n", rs);
2020-02-01 00:42:56 +00:00
DISASM("bgez %s, 0x%x\n", register_name(rs), ((pc + i + 1 + instr) << 2) & 0xffc);
2020-01-29 20:39:26 +00:00
break;
default:
break;
}
break;
case 003: // JAL
APPEND("r31 = %u;\n", ((pc + i + 2) << 2) & 0xffc);
imm = instr & 0x3ff;
set_pc(imm);
pipe_pending_call = true;
APPEND("BRANCH();\n");
DISASM("jal 0x%x\n", (instr & 0x3ff) << 2);
2020-01-29 13:58:56 +00:00
#ifdef INTENSE_DEBUG
2020-01-29 20:39:26 +00:00
APPEND("RSP_DEBUG(STATE, \"JAL\", %u, 0);\n", pipe_branch_delay * 4);
2020-01-29 13:58:56 +00:00
#endif
2020-01-29 20:39:26 +00:00
break;
case 002: // J
imm = instr & 0x3ff;
set_pc(imm);
APPEND("BRANCH();\n");
DISASM("j 0x%x\n", (instr & 0x3ff) << 2);
break;
case 004: // BEQ
rs = (instr >> 21) & 31;
rt = (instr >> 16) & 31;
set_pc(pc + i + 1 + instr);
APPEND("BRANCH_IF(r%u == r%u);\n", rs, rt);
2020-02-01 00:42:56 +00:00
DISASM("beq %s, %s, 0x%x\n", register_name(rs), register_name(rt), ((pc + i + 1 + instr) & 0x3ff) << 2);
2020-01-29 20:39:26 +00:00
break;
case 005: // BNE
rs = (instr >> 21) & 31;
rt = (instr >> 16) & 31;
set_pc(pc + i + 1 + instr);
APPEND("BRANCH_IF(r%u != r%u);\n", rs, rt);
2020-02-01 00:42:56 +00:00
DISASM("bne %s, %s, 0x%x\n", register_name(rs), register_name(rt), ((pc + i + 1 + instr) & 0x3ff) << 2);
2020-01-29 20:39:26 +00:00
break;
case 006: // BLEZ
rs = (instr >> 21) & 31;
set_pc(pc + i + 1 + instr);
APPEND("BRANCH_IF((int)r%u <= 0);\n", rs);
2020-02-01 00:42:56 +00:00
DISASM("blez %s, 0x%x\n", register_name(rs), ((pc + i + 1 + instr) & 0x3ff) << 2);
2020-01-29 20:39:26 +00:00
break;
case 007: // BGTZ
rs = (instr >> 21) & 31;
set_pc(pc + i + 1 + instr);
APPEND("BRANCH_IF((int)r%u > 0);\n", rs);
2020-02-01 00:42:56 +00:00
DISASM("bgtz %s, 0x%x\n", register_name(rs), ((pc + i + 1 + instr) & 0x3ff) << 2);
2020-01-29 20:39:26 +00:00
break;
case 010:
case 011: // ADDI
simm = instr;
rs = (instr >> 21) & 31;
rt = (instr >> 16) & 31;
APPEND_RT_NOT_R0("r%u = (int)r%u + %d;\n", rt, rs, simm);
if (rs != 0)
2020-02-01 00:42:56 +00:00
DISASM("addi %s, %s, %d\n", register_name(rt), register_name(rs), simm);
2020-01-29 20:39:26 +00:00
else
2020-02-01 00:42:56 +00:00
DISASM("li %s, %d\n", register_name(rt), simm);
2020-01-29 20:39:26 +00:00
break;
case 012: // SLTI
simm = instr;
rs = (instr >> 21) & 31;
rt = (instr >> 16) & 31;
APPEND_RT_NOT_R0("r%u = (int)r%u < %d;\n", rt, rs, simm);
2020-02-01 00:42:56 +00:00
DISASM("slti %s, %s, %d\n", register_name(rt), register_name(rs), simm);
2020-01-29 20:39:26 +00:00
break;
case 013: // SLTIU
imm = instr & 0xffff;
rs = (instr >> 21) & 31;
rt = (instr >> 16) & 31;
APPEND_RT_NOT_R0("r%u = r%u < %u;\n", rt, rs, imm);
2020-02-01 00:42:56 +00:00
DISASM("sltiu %s, %s, %u\n", register_name(rt), register_name(rs), imm);
2020-01-29 20:39:26 +00:00
break;
case 014: // ANDI
imm = instr & 0xffff;
rs = (instr >> 21) & 31;
rt = (instr >> 16) & 31;
APPEND_RT_NOT_R0("r%u = r%u & %u;\n", rt, rs, imm);
2020-02-01 00:42:56 +00:00
DISASM("andi %s, %s, 0x%x\n", register_name(rt), register_name(rs), imm);
2020-01-29 20:39:26 +00:00
break;
case 015: // ORI
imm = instr & 0xffff;
rs = (instr >> 21) & 31;
rt = (instr >> 16) & 31;
APPEND_RT_NOT_R0("r%u = r%u | %u;\n", rt, rs, imm);
2020-02-01 00:42:56 +00:00
DISASM("ori %s, %s, 0x%x\n", register_name(rt), register_name(rs), imm);
2020-01-29 20:39:26 +00:00
break;
case 016: // XORI
imm = instr & 0xffff;
rs = (instr >> 21) & 31;
rt = (instr >> 16) & 31;
APPEND_RT_NOT_R0("r%u = r%u ^ %u;\n", rt, rs, imm);
2020-02-01 00:42:56 +00:00
DISASM("xori %s, %s, 0x%x\n", register_name(rt), register_name(rs), imm);
2020-01-29 20:39:26 +00:00
break;
case 017: // LUI
imm = instr & 0xffff;
rt = (instr >> 16) & 31;
APPEND_RT_NOT_R0("r%u = %uu << 16u;\n", rt, imm);
2020-02-01 00:42:56 +00:00
DISASM("lui %s, 0x%x\n", register_name(rt), imm);
2020-01-29 20:39:26 +00:00
break;
case 020: // COP0
rd = (instr >> 11) & 31;
rs = (instr >> 21) & 31;
rt = (instr >> 16) & 31;
switch (rs)
{
case 000: // MFC0
APPEND("cp0_result = RSP_MFC0(STATE, %u, %u);\n", rt, rd);
DISASM("mfc0 %u, %u\n", rt, rd);
APPEND("if (UNLIKELY(cp0_result != MODE_CONTINUE)) {\n");
EXIT_WITH_DELAY(cp0_result);
APPEND("}\n");
break;
case 004: // MTC0
APPEND("cp0_result = RSP_MTC0(STATE, %u, %u);\n", rd, rt);
DISASM("mtc0 %u, %u\n", rd, rt);
APPEND("if (UNLIKELY(cp0_result != MODE_CONTINUE)) {\n");
EXIT_WITH_DELAY(cp0_result);
APPEND("}\n");
break;
default:
break;
}
break;
case 022: // COP2
rd = (instr >> 11) & 31;
rs = (instr >> 21) & 31;
rt = (instr >> 16) & 31;
imm = (instr >> 7) & 15;
switch (rs)
{
case 000: // MFC2
APPEND("RSP_MFC2(STATE, %u, %u, %u);\n", rt, rd, imm);
DISASM("mfc2 %u, %u, %u\n", rt, rd, imm);
break;
case 002: // CFC2
APPEND("RSP_CFC2(STATE, %u, %u);\n", rt, rd);
DISASM("cfc2 %u, %u\n", rt, rd);
break;
case 004: // MTC2
APPEND("RSP_MTC2(STATE, %u, %u, %u);\n", rt, rd, imm);
DISASM("mtc2 %u, %u, %u\n", rt, rd, imm);
2020-01-29 13:58:56 +00:00
#ifdef INTENSE_DEBUG
2020-01-29 20:39:26 +00:00
APPEND("RSP_DEBUG(STATE, \"MTC2\", %u, 0);\n", 0);
2020-01-29 13:58:56 +00:00
#endif
2020-01-29 20:39:26 +00:00
break;
case 006: // CTC2
APPEND("RSP_CTC2(STATE, %u, %u);\n", rt, rd);
2020-01-31 21:53:36 +00:00
DISASM("ctc2 %u, %u\n", rt, rd);
2020-01-29 20:39:26 +00:00
break;
default:
break;
}
break;
case 040: // LB
simm = instr;
rt = (instr >> 16) & 31;
rs = (instr >> 21) & 31;
if (rt != 0)
{
APPEND("r%u = (signed char)READ_MEM_U8(dmem, (r%u + (%d)) & 0xfff);\n", rt, rs, simm);
}
2020-02-01 00:42:56 +00:00
DISASM("lb %s, %d(%s)\n", register_name(rt), simm, register_name(rs));
2020-01-29 20:39:26 +00:00
break;
case 041: // LH
simm = instr;
rt = (instr >> 16) & 31;
rs = (instr >> 21) & 31;
if (rt != 0)
{
APPEND("addr = (r%u + (%d)) & 0xfff;\n", rs, simm);
APPEND("if (UNLIKELY(addr & 1))\n");
APPEND(" r%u = (signed short)READ_MEM_U16_UNALIGNED(dmem, addr);\n", rt);
APPEND("else\n");
APPEND(" r%u = (signed short)READ_MEM_U16(dmem, addr);\n", rt);
}
2020-02-01 00:42:56 +00:00
DISASM("lh %s, %d(%s)\n", register_name(rt), simm, register_name(rs));
2020-01-29 20:39:26 +00:00
break;
case 043: // LW
simm = instr;
rt = (instr >> 16) & 31;
rs = (instr >> 21) & 31;
if (rt != 0)
{
APPEND("addr = (r%u + (%d)) & 0xfff;\n", rs, simm);
APPEND("if (UNLIKELY(addr & 3))\n");
APPEND(" r%u = READ_MEM_U32_UNALIGNED(dmem, addr);\n", rt);
APPEND("else\n");
APPEND(" r%u = READ_MEM_U32(dmem, addr);\n", rt);
}
2020-02-01 00:42:56 +00:00
DISASM("lw %s, %d(%s)\n", register_name(rt), simm, register_name(rs));
2020-01-29 20:39:26 +00:00
break;
case 044: // LBU
simm = instr;
rt = (instr >> 16) & 31;
rs = (instr >> 21) & 31;
if (rt != 0)
{
APPEND("r%u = READ_MEM_U8(dmem, (r%u + (%d)) & 0xfff);\n", rt, rs, simm);
}
2020-02-01 00:42:56 +00:00
DISASM("lbu %s, %d(%s)\n", register_name(rt), simm, register_name(rs));
2020-01-29 20:39:26 +00:00
break;
case 045: // LHU
simm = instr;
rt = (instr >> 16) & 31;
rs = (instr >> 21) & 31;
if (rt != 0)
{
APPEND("addr = (r%u + (%d)) & 0xfff;\n", rs, simm);
APPEND("if (UNLIKELY(addr & 1))\n");
APPEND(" r%u = READ_MEM_U16_UNALIGNED(dmem, addr);\n", rt);
APPEND("else\n");
APPEND(" r%u = READ_MEM_U16(dmem, addr);\n", rt);
}
2020-02-01 00:42:56 +00:00
DISASM("lhu %s, %d(%s)\n", register_name(rt), simm, register_name(rs));
2020-01-29 20:39:26 +00:00
break;
case 050: // SB
simm = instr;
rt = (instr >> 16) & 31;
rs = (instr >> 21) & 31;
APPEND("WRITE_MEM_U8(dmem, ((r%u + (%d)) & 0xfff), r%u);\n", rs, simm, rt);
2020-02-01 00:42:56 +00:00
DISASM("sb %s, %d(%s)\n", register_name(rt), simm, register_name(rs));
2020-01-29 20:39:26 +00:00
break;
case 051: // SH
rt = (instr >> 16) & 31;
rs = (instr >> 21) & 31;
simm = instr;
APPEND("addr = (r%u + (%d)) & 0xfff;\n", rs, simm);
APPEND("if (UNLIKELY(addr & 1))\n");
APPEND(" WRITE_MEM_U16_UNALIGNED(dmem, addr, r%u);\n", rt);
APPEND("else\n");
APPEND(" WRITE_MEM_U16(dmem, addr, r%u);\n", rt);
2020-02-01 00:42:56 +00:00
DISASM("sh %s, %d(%s)\n", register_name(rt), simm, register_name(rs));
2020-01-29 20:39:26 +00:00
break;
case 053: // SW
rt = (instr >> 16) & 31;
rs = (instr >> 21) & 31;
simm = instr;
APPEND("addr = (r%u + (%d)) & 0xfff;\n", rs, simm);
APPEND("if (UNLIKELY(addr & 3))\n");
APPEND(" WRITE_MEM_U32_UNALIGNED(dmem, addr, r%u);\n", rt);
APPEND("else\n");
APPEND(" WRITE_MEM_U32(dmem, addr, r%u);\n", rt);
2020-02-01 00:42:56 +00:00
DISASM("sw %s, %d(%s)\n", register_name(rt), simm, register_name(rs));
2020-01-29 20:39:26 +00:00
break;
case 062: // LWC2
{
rt = (instr >> 16) & 31;
simm = instr;
// Sign extend.
simm <<= 9;
simm >>= 9;
rs = (instr >> 21) & 31;
rd = (instr >> 11) & 31;
imm = (instr >> 7) & 15;
static const char *lwc2_ops[32] = {
"LBV", "LSV", "LLV", "LDV", "LQV", "LRV", "LPV", "LUV", "LHV", nullptr, nullptr,
"LTV", nullptr, nullptr, nullptr, nullptr, nullptr, nullptr, nullptr, nullptr, nullptr, nullptr,
nullptr, nullptr, nullptr, nullptr, nullptr, nullptr, nullptr, nullptr, nullptr, nullptr,
};
auto *op = lwc2_ops[rd];
if (op)
{
APPEND("RSP_%s(STATE, %u, %u, %d, %u);\n", op, rt, imm, simm, rs);
DISASM("%s %u, %u, %d, %u\n", op, rt, imm, simm, rs);
}
2020-01-29 13:58:56 +00:00
#ifdef INTENSE_DEBUG
2020-01-29 20:39:26 +00:00
APPEND("RSP_DEBUG(STATE, \"LWC2\", %u, %u);\n", (pc + i + 1) << 2, instr);
2020-01-29 13:58:56 +00:00
#endif
2020-01-29 20:39:26 +00:00
break;
}
case 072: // SWC2
{
rt = (instr >> 16) & 31;
simm = instr;
// Sign extend.
simm <<= 9;
simm >>= 9;
rs = (instr >> 21) & 31;
rd = (instr >> 11) & 31;
imm = (instr >> 7) & 15;
static const char *swc2_ops[32] = {
"SBV", "SSV", "SLV", "SDV", "SQV", "SRV", "SPV", "SUV", "SHV", "SFV", nullptr,
"STV", nullptr, nullptr, nullptr, nullptr, nullptr, nullptr, nullptr, nullptr, nullptr, nullptr,
nullptr, nullptr, nullptr, nullptr, nullptr, nullptr, nullptr, nullptr, nullptr, nullptr,
};
auto *op = swc2_ops[rd];
if (op)
{
APPEND("RSP_%s(STATE, %u, %u, %d, %u);\n", op, rt, imm, simm, rs);
DISASM("%s %u, %u, %d, %u\n", op, rt, imm, simm, rs);
}
2020-01-29 13:58:56 +00:00
#ifdef INTENSE_DEBUG
2020-01-29 20:39:26 +00:00
APPEND("RSP_DEBUG(STATE, \"SWC2\", %u, %u);\n", (pc + i + 1) << 2, instr);
2020-01-29 13:58:56 +00:00
#endif
2020-01-29 20:39:26 +00:00
break;
}
default:
break;
}
}
if (i == 0)
CHECK_INHERIT_BRANCH_DELAY();
else
CHECK_BRANCH_DELAY();
APPEND("\n");
}
// Falling off end of block.
APPEND("STATE->pc = %u;\n", ((pc + count) << 2) & (IMEM_SIZE - 1));
PROMOTE_DELAY_SLOT();
APPEND("EXIT(MODE_CONTINUE);\n");
// Emit helper code.
full_code += R"DELIM(
2020-01-29 13:58:56 +00:00
struct cpu_state
{
unsigned pc;
unsigned dirty_blocks;
unsigned has_delay_slot;
unsigned branch_target;
unsigned sr[33];
2020-01-29 13:58:56 +00:00
unsigned *dmem;
unsigned *imem;
};
#define UNLIKELY(x) __builtin_expect(!!(x), 0)
#define LIKELY(x) __builtin_expect(!!(x), 1)
#define MASK_SA(x) ((x) & 31)
enum ReturnMode {
MODE_ENTER = 0,
MODE_CONTINUE = 1,
MODE_BREAK = 2,
MODE_DMA_READ = 3,
MODE_CHECK_FLAGS = 4
};
#define r0 0
#define ADVANCE_DELAY_SLOT() do { \
branch = pipe_branch; \
pipe_branch = 0; \
branch_delay = pipe_branch_delay; \
} while(0)
#define BRANCH() pipe_branch = 1
#define BRANCH_IF(x) if (x) BRANCH()
#define BRANCH_INDIRECT(pc) do { \
pipe_branch_delay = pc; \
pipe_branch = 1; \
} while(0)
#define PROMOTE_DELAY_SLOT() do { \
if (pipe_branch) { \
STATE->has_delay_slot = 1; \
STATE->branch_target = pipe_branch_delay * 4; \
} \
} while(0)
extern int RSP_MFC0(struct cpu_state *STATE, unsigned rt, unsigned rd);
extern int RSP_MTC0(struct cpu_state *STATE, unsigned rd, unsigned rt);
extern void RSP_MTC2(struct cpu_state *STATE, unsigned rt, unsigned vd, unsigned e);
extern void RSP_MFC2(struct cpu_state *STATE, unsigned rt, unsigned vs, unsigned e);
extern void RSP_CFC2(struct cpu_state *STATE, unsigned rt, unsigned rd);
extern void RSP_CTC2(struct cpu_state *STATE, unsigned rt, unsigned rd);
2020-02-01 00:42:56 +00:00
extern void RSP_REPORT_PC(struct cpu_state *STATE, unsigned pc, unsigned instr);
2020-01-29 13:58:56 +00:00
#define DECL_LS(op) \
extern void RSP_##op(struct cpu_state *STATE, unsigned rt, unsigned element, int offset, unsigned base)
DECL_LS(LBV);
DECL_LS(LSV);
DECL_LS(LLV);
DECL_LS(LDV);
DECL_LS(LQV);
DECL_LS(LRV);
DECL_LS(LPV);
DECL_LS(LUV);
DECL_LS(LHV);
DECL_LS(LTV);
DECL_LS(SBV);
DECL_LS(SSV);
DECL_LS(SLV);
DECL_LS(SDV);
DECL_LS(SQV);
DECL_LS(SRV);
DECL_LS(SPV);
DECL_LS(SUV);
DECL_LS(SHV);
DECL_LS(SFV);
DECL_LS(STV);
extern void RSP_CALL(void *opaque, unsigned target, unsigned ret);
extern int RSP_RETURN(void *opaque, unsigned pc);
extern void RSP_EXIT(void *opaque, enum ReturnMode mode);
#define EXIT(mode) RSP_EXIT(opaque, mode)
extern void RSP_DEBUG(struct cpu_state *STATE, const char *tag, unsigned pc, unsigned value);
#define DECL_COP2(op) \
extern void RSP_##op(struct cpu_state *STATE, unsigned vd, unsigned vs, unsigned vt, unsigned e)
DECL_COP2(VMULF);
DECL_COP2(VMULU);
DECL_COP2(VMUDL);
DECL_COP2(VMUDM);
DECL_COP2(VMUDN);
DECL_COP2(VMUDH);
DECL_COP2(VMACF);
DECL_COP2(VMACU);
//DECL_COP2(VMACQ);
DECL_COP2(VMADL);
DECL_COP2(VMADM);
DECL_COP2(VMADN);
DECL_COP2(VMADH);
DECL_COP2(VADD);
DECL_COP2(VSUB);
DECL_COP2(VABS);
DECL_COP2(VADDC);
DECL_COP2(VSUBC);
DECL_COP2(VSAR);
DECL_COP2(VLT);
DECL_COP2(VEQ);
DECL_COP2(VNE);
DECL_COP2(VGE);
DECL_COP2(VCL);
DECL_COP2(VCH);
DECL_COP2(VCR);
DECL_COP2(VMRG);
DECL_COP2(VAND);
DECL_COP2(VNAND);
DECL_COP2(VOR);
DECL_COP2(VNOR);
DECL_COP2(VXOR);
DECL_COP2(VNXOR);
DECL_COP2(VRCP);
DECL_COP2(VRCPL);
DECL_COP2(VRCPH);
DECL_COP2(VMOV);
DECL_COP2(VRSQ);
DECL_COP2(VRSQL);
DECL_COP2(VRSQH);
DECL_COP2(VNOP);
DECL_COP2(RESERVED);
#define HES(x) ((x) ^ 2)
#define BES(x) ((x) ^ 3)
#define MES(x) ((x) ^ 1)
#define READ_MEM_U8(mem, addr) \
(((const unsigned char*)(mem))[BES(addr)])
#define READ_MEM_U16(mem, addr) \
(((const unsigned short*)(mem))[HES(addr) >> 1])
#define READ_MEM_U32(mem, addr) \
(((const unsigned*)(mem))[addr >> 2])
#define READ_MEM_U16_UNALIGNED(mem, addr) \
(READ_MEM_U8(mem, addr) << 8) | READ_MEM_U8(mem, (addr + 1) & 0xfff)
#define READ_MEM_U32_UNALIGNED(mem, addr) \
(READ_MEM_U8(mem, addr) << 24) | (READ_MEM_U8(mem, (addr + 1) & 0xfff) << 16) | \
(READ_MEM_U8(mem, (addr + 2) & 0xfff) << 8) | READ_MEM_U8(mem, (addr + 3) & 0xfff)
#define WRITE_MEM_U8(mem, addr, data) \
(((unsigned char*)(mem))[BES(addr)] = data)
#define WRITE_MEM_U16_UNALIGNED(mem, addr, data) do { \
WRITE_MEM_U8(mem, addr, data >> 8); \
WRITE_MEM_U8(mem, (addr + 1) & 0xfff, data & 0xff); \
} while(0)
#define WRITE_MEM_U32_UNALIGNED(mem, addr, data) do { \
WRITE_MEM_U8(mem, addr, data >> 24); \
WRITE_MEM_U8(mem, (addr + 1) & 0xfff, (data >> 16) & 0xff); \
WRITE_MEM_U8(mem, (addr + 2) & 0xfff, (data >> 8) & 0xff); \
WRITE_MEM_U8(mem, (addr + 3) & 0xfff, data & 0xff); \
} while(0)
#define WRITE_MEM_U16(mem, addr, data) \
(((unsigned short*)(mem))[HES(addr) >> 1] = data)
#define WRITE_MEM_U32(mem, addr, data) \
(((unsigned*)(mem))[addr >> 2] = data)
)DELIM";
2020-01-29 20:39:26 +00:00
full_code += "void block_entry(void *opaque, struct cpu_state *STATE)\n";
full_code += "{\n";
2020-01-29 13:58:56 +00:00
2020-01-29 20:39:26 +00:00
for (unsigned i = 1; i < 32; i++)
{
char buf[32];
sprintf(buf, "#define r%u (STATE->sr[%u])\n", i, i);
full_code += buf;
}
2020-01-29 13:58:56 +00:00
2020-01-29 20:39:26 +00:00
// Emit fixup code.
2020-01-29 13:58:56 +00:00
2020-01-29 20:39:26 +00:00
full_code += body;
full_code += "}\n";
2020-01-29 13:58:56 +00:00
#ifdef DEBUG_JIT
2020-01-29 20:39:26 +00:00
unique_ptr<Block> block(new Block(symbol_table));
2020-01-29 13:58:56 +00:00
#else
2020-01-29 20:39:26 +00:00
unique_ptr<Block> block(new Block(jit_engine));
2020-01-29 13:58:56 +00:00
#endif
2020-01-29 20:39:26 +00:00
if (!block->compile(hash, full_code))
return nullptr;
2020-01-29 13:58:56 +00:00
2020-01-29 20:39:26 +00:00
auto ret = block->get_func();
cached_blocks[pc][hash] = move(block);
return ret;
2020-01-29 13:58:56 +00:00
}
void CPU::print_registers()
{
#define DUMP_FILE stdout
fprintf(DUMP_FILE, "RSP state:\n");
fprintf(DUMP_FILE, " PC: 0x%03x\n", state.pc);
2020-01-29 20:39:26 +00:00
for (unsigned i = 1; i < 32; i++)
2020-02-01 00:42:56 +00:00
fprintf(DUMP_FILE, " SR[%s] = 0x%08x\n", register_name(i), state.sr[i]);
fprintf(DUMP_FILE, "\n");
2020-01-29 20:39:26 +00:00
for (unsigned i = 0; i < 32; i++)
{
fprintf(DUMP_FILE, " VR[%02u] = { 0x%04x, 0x%04x, 0x%04x, 0x%04x, 0x%04x, 0x%04x, 0x%04x, 0x%04x }\n", i,
2020-01-29 20:39:26 +00:00
state.cp2.regs[i].e[0], state.cp2.regs[i].e[1], state.cp2.regs[i].e[2], state.cp2.regs[i].e[3],
state.cp2.regs[i].e[4], state.cp2.regs[i].e[5], state.cp2.regs[i].e[6], state.cp2.regs[i].e[7]);
}
fprintf(DUMP_FILE, "\n");
2020-01-29 20:39:26 +00:00
for (unsigned i = 0; i < 3; i++)
{
static const char *strings[] = { "ACC_HI", "ACC_MD", "ACC_LO" };
fprintf(DUMP_FILE, " %s = { 0x%04x, 0x%04x, 0x%04x, 0x%04x, 0x%04x, 0x%04x, 0x%04x, 0x%04x }\n", strings[i],
2020-01-29 20:39:26 +00:00
state.cp2.acc.e[8 * i + 0], state.cp2.acc.e[8 * i + 1], state.cp2.acc.e[8 * i + 2],
state.cp2.acc.e[8 * i + 3], state.cp2.acc.e[8 * i + 4], state.cp2.acc.e[8 * i + 5],
state.cp2.acc.e[8 * i + 6], state.cp2.acc.e[8 * i + 7]);
}
fprintf(DUMP_FILE, "\n");
2020-01-29 20:39:26 +00:00
for (unsigned i = 0; i < 3; i++)
{
static const char *strings[] = { "VCO", "VCC", "VCE" };
uint16_t flags = rsp_get_flags(state.cp2.flags[i].e);
fprintf(DUMP_FILE, " %s = 0x%04x\n", strings[i], flags);
2020-01-29 20:39:26 +00:00
}
fprintf(DUMP_FILE, "\n");
fprintf(DUMP_FILE, " Div Out = 0x%04x\n", state.cp2.div_out);
fprintf(DUMP_FILE, " Div In = 0x%04x\n", state.cp2.div_in);
fprintf(DUMP_FILE, " DP flag = 0x%04x\n", state.cp2.dp_flag);
2020-01-29 13:58:56 +00:00
}
void CPU::exit(ReturnMode mode)
{
#ifdef __GNUC__
2020-01-29 20:39:26 +00:00
// On Windows, setjmp/longjmp crashes since it uses exception unwinding semantics
// and our JIT-ed LLVM code does not emit that kind of information, so we have to use a non-standard unwinding mechanism.
// FWIW, this should also be the fastest possible way of doing it.
return_mode = mode;
__builtin_longjmp(env, 1);
2020-01-29 13:58:56 +00:00
#else
#error "Need __builtin_setjmp/longjmp support alternative for other compilers ..."
#endif
}
void CPU::call(uint32_t target, uint32_t ret)
{
2020-01-29 20:39:26 +00:00
if (call_stack_ptr < CALL_STACK_SIZE)
call_stack[call_stack_ptr++] = ret;
enter(target);
2020-01-29 13:58:56 +00:00
}
int CPU::ret(uint32_t pc)
{
2020-01-29 20:39:26 +00:00
if (call_stack_ptr == 0)
return 0;
2020-01-29 13:58:56 +00:00
2020-01-29 20:39:26 +00:00
uint32_t ret = call_stack[--call_stack_ptr];
return ret == pc;
2020-01-29 13:58:56 +00:00
}
2020-01-29 20:39:26 +00:00
extern "C"
2020-01-29 13:58:56 +00:00
{
2020-01-29 20:39:26 +00:00
void RSP_CALL(void *cpu, unsigned target, unsigned ret)
{
static_cast<CPU *>(cpu)->call(target, ret);
}
void RSP_RETURN(void *cpu, unsigned pc)
{
static_cast<CPU *>(cpu)->ret(pc);
}
void RSP_EXIT(void *cpu, int mode)
{
static_cast<CPU *>(cpu)->exit(static_cast<ReturnMode>(mode));
}
2020-02-01 00:42:56 +00:00
void RSP_REPORT_PC(void *cpu, unsigned pc, unsigned instr)
{
auto *state = static_cast<const CPUState *>(cpu);
auto disasm = disassemble(pc, instr);
puts(disasm.c_str());
for (unsigned i = 0; i < 32; i++)
{
if (i == 0)
printf(" ");
else
printf("[%s = 0x%08x] ", register_name(i), state->sr[i]);
if ((i & 7) == 7)
printf("\n");
}
printf("\n");
}
2020-01-29 13:58:56 +00:00
}
void CPU::enter(uint32_t pc)
{
2020-01-29 20:39:26 +00:00
pc &= IMEM_SIZE - 1;
uint32_t word_pc = pc >> 2;
auto &block = blocks[word_pc];
if (!block)
{
unsigned end = (pc + (CODE_BLOCK_SIZE * 2)) >> CODE_BLOCK_SIZE_LOG2;
end <<= CODE_BLOCK_SIZE_LOG2 - 2;
end = min(end, unsigned(IMEM_SIZE >> 2));
end = analyze_static_end(word_pc, end);
uint64_t hash = hash_imem(word_pc, end - word_pc);
auto itr = cached_blocks[word_pc].find(hash);
if (itr != cached_blocks[word_pc].end())
{
block = itr->second->get_func();
//fprintf(stdout, "jit reuse");
}
else
{
//static unsigned count;
//fprintf(DUMP_FILE, "JIT region #%u\n", ++count);
2020-01-29 20:39:26 +00:00
block = jit_region(hash, word_pc, end - word_pc);
//fprintf(stdout, "jit compile");
}
}
//fprintf(stdout, "jit execute");
block(this, &state);
2020-01-29 13:58:56 +00:00
}
ReturnMode CPU::run()
{
2020-01-29 20:39:26 +00:00
for (;;)
{
invalidate_code();
call_stack_ptr = 0;
2020-01-29 13:58:56 +00:00
#ifdef __GNUC__
2020-01-29 20:39:26 +00:00
// On Windows, setjmp/longjmp crashes since it uses exception unwinding semantics
// and our JIT-ed LLVM code does not emit that kind of information, so we have to use a non-standard unwinding mechanism.
// FWIW, this should also be the fastest possible way of doing it.
int setjmp_ret = __builtin_setjmp(env);
auto ret = setjmp_ret ? return_mode : MODE_ENTER;
2020-01-29 13:58:56 +00:00
#else
#error "Need __builtin_setjmp/longjmp support alternative for other compilers ..."
#endif
2020-01-29 20:39:26 +00:00
switch (ret)
{
case MODE_ENTER:
enter(state.pc);
break;
2020-01-29 13:58:56 +00:00
2020-01-29 20:39:26 +00:00
case MODE_BREAK:
*state.cp0.cr[CP0_REGISTER_SP_STATUS] |= SP_STATUS_BROKE | SP_STATUS_HALT;
if (*state.cp0.cr[CP0_REGISTER_SP_STATUS] & SP_STATUS_INTR_BREAK)
*state.cp0.irq |= 1;
2020-01-29 13:58:56 +00:00
#ifndef PARALLEL_INTEGRATION
2020-01-29 20:39:26 +00:00
print_registers();
2020-01-29 13:58:56 +00:00
#endif
2020-01-29 20:39:26 +00:00
return MODE_BREAK;
2020-01-29 13:58:56 +00:00
2020-01-29 20:39:26 +00:00
case MODE_CHECK_FLAGS:
case MODE_DMA_READ:
return ret;
2020-01-29 13:58:56 +00:00
2020-01-29 20:39:26 +00:00
default:
break;
}
}
2020-01-29 13:58:56 +00:00
}
2020-01-29 20:39:26 +00:00
} // namespace RSP