mirror of
https://github.com/libretro/mupen64plus-libretro-nx.git
synced 2024-11-23 08:10:05 +00:00
c5fe217f97
- For now lets just link those against GLN64 - They never run at the same time, are same type and it lowers maintenance efforts
2130 lines
70 KiB
C
2130 lines
70 KiB
C
/******************************************************************************\
|
|
* Project: MSP Simulation Layer for Scalar Unit Operations *
|
|
* Authors: Iconoclast *
|
|
* Release: 2016.03.26 *
|
|
* License: CC0 Public Domain Dedication *
|
|
* *
|
|
* To the extent possible under law, the author(s) have dedicated all copyright *
|
|
* and related and neighboring rights to this software to the public domain *
|
|
* worldwide. This software is distributed without any warranty. *
|
|
* *
|
|
* You should have received a copy of the CC0 Public Domain Dedication along *
|
|
* with this software. *
|
|
* If not, see <http://creativecommons.org/publicdomain/zero/1.0/>. *
|
|
\******************************************************************************/
|
|
|
|
#include "su.h"
|
|
|
|
/*
|
|
* including modular interface structure to access configuration settings...
|
|
* Some of the parallel timing features require perfect timing or configs.
|
|
*/
|
|
#include "module.h"
|
|
|
|
u32 inst_word;
|
|
|
|
u32 SR[32];
|
|
typedef VECTOR_OPERATION(*p_vector_func)(v16, v16);
|
|
|
|
pu8 DRAM;
|
|
|
|
// NOTE: Links against GLideN64\src\N64.cpp due to conflicts and maintenance efforts
|
|
extern pu8 DMEM;
|
|
extern pu8 IMEM;
|
|
|
|
NOINLINE void res_S(void)
|
|
{
|
|
message("RESERVED.");
|
|
return;
|
|
}
|
|
|
|
void set_PC(unsigned int address)
|
|
{
|
|
temp_PC = 0x04001000 + FIT_IMEM(address);
|
|
#ifndef EMULATE_STATIC_PC
|
|
stage = 1;
|
|
#endif
|
|
return;
|
|
}
|
|
|
|
pu32 CR[NUMBER_OF_CP0_REGISTERS];
|
|
u8 conf[32];
|
|
|
|
int MF_SP_STATUS_TIMEOUT;
|
|
|
|
void SP_CP0_MF(unsigned int rt, unsigned int rd)
|
|
{
|
|
SR[rt] = *(CR[rd %= NUMBER_OF_CP0_REGISTERS]);
|
|
SR[zero] = 0x00000000;
|
|
if (rd == 0x7) {
|
|
if (CFG_MEND_SEMAPHORE_LOCK == 0)
|
|
return;
|
|
if (CFG_HLE_GFX | CFG_HLE_AUD)
|
|
return;
|
|
GET_RCP_REG(SP_SEMAPHORE_REG) = 0x00000001;
|
|
GET_RCP_REG(SP_STATUS_REG) |= SP_STATUS_HALT; /* temporary hack */
|
|
return;
|
|
}
|
|
#ifdef WAIT_FOR_CPU_HOST
|
|
if (rd == 0x4) {
|
|
MFC0_count[rt] += 1;
|
|
GET_RCP_REG(SP_STATUS_REG) |= (MFC0_count[rt] >= MF_SP_STATUS_TIMEOUT);
|
|
}
|
|
#endif
|
|
return;
|
|
}
|
|
|
|
static void MT_DMA_CACHE(unsigned int rt)
|
|
{
|
|
*CR[0x0] = SR[rt] & 0xFFFFFFF8ul; /* & 0x00001FF8 */
|
|
return; /* Reserved upper bits are ignored during DMA R/W. */
|
|
}
|
|
static void MT_DMA_DRAM(unsigned int rt)
|
|
{
|
|
*CR[0x1] = SR[rt] & 0xFFFFFFF8ul; /* & 0x00FFFFF8 */
|
|
return; /* Let the reserved bits get sent, but the pointer is 24-bit. */
|
|
}
|
|
static void MT_DMA_READ_LENGTH(unsigned int rt)
|
|
{
|
|
*CR[0x2] = SR[rt] | 07;
|
|
SP_DMA_READ();
|
|
return;
|
|
}
|
|
static void MT_DMA_WRITE_LENGTH(unsigned int rt)
|
|
{
|
|
*CR[0x3] = SR[rt] | 07;
|
|
SP_DMA_WRITE();
|
|
return;
|
|
}
|
|
static void MT_SP_STATUS(unsigned int rt)
|
|
{
|
|
pu32 MI_INTR_REG;
|
|
pu32 SP_STATUS_REG;
|
|
|
|
if (SR[rt] & 0xFE000040)
|
|
message("MTC0\nSP_STATUS");
|
|
MI_INTR_REG = GET_RSP_INFO(MI_INTR_REG);
|
|
SP_STATUS_REG = GET_RSP_INFO(SP_STATUS_REG);
|
|
|
|
*SP_STATUS_REG &= ~(!!(SR[rt] & 0x00000001) << 0);
|
|
*SP_STATUS_REG |= (!!(SR[rt] & 0x00000002) << 0);
|
|
*SP_STATUS_REG &= ~(!!(SR[rt] & 0x00000004) << 1);
|
|
*MI_INTR_REG &= ~((SR[rt] & 0x00000008) >> 3); /* SP_CLR_INTR */
|
|
*MI_INTR_REG |= ((SR[rt] & 0x00000010) >> 4); /* SP_SET_INTR */
|
|
*SP_STATUS_REG |= (SR[rt] & 0x00000010) >> 4; /* int set halt */
|
|
*SP_STATUS_REG &= ~(!!(SR[rt] & 0x00000020) << 5);
|
|
/* *SP_STATUS_REG |= (!!(SR[rt] & 0x00000040) << 5); */
|
|
*SP_STATUS_REG &= ~(!!(SR[rt] & 0x00000080) << 6);
|
|
*SP_STATUS_REG |= (!!(SR[rt] & 0x00000100) << 6);
|
|
*SP_STATUS_REG &= ~(!!(SR[rt] & 0x00000200) << 7);
|
|
*SP_STATUS_REG |= (!!(SR[rt] & 0x00000400) << 7); /* yield request? */
|
|
*SP_STATUS_REG &= ~(!!(SR[rt] & 0x00000800) << 8);
|
|
*SP_STATUS_REG |= (!!(SR[rt] & 0x00001000) << 8); /* yielded? */
|
|
*SP_STATUS_REG &= ~(!!(SR[rt] & 0x00002000) << 9);
|
|
*SP_STATUS_REG |= (!!(SR[rt] & 0x00004000) << 9); /* task done? */
|
|
*SP_STATUS_REG &= ~(!!(SR[rt] & 0x00008000) << 10);
|
|
*SP_STATUS_REG |= (!!(SR[rt] & 0x00010000) << 10);
|
|
*SP_STATUS_REG &= ~(!!(SR[rt] & 0x00020000) << 11);
|
|
*SP_STATUS_REG |= (!!(SR[rt] & 0x00040000) << 11);
|
|
*SP_STATUS_REG &= ~(!!(SR[rt] & 0x00080000) << 12);
|
|
*SP_STATUS_REG |= (!!(SR[rt] & 0x00100000) << 12);
|
|
*SP_STATUS_REG &= ~(!!(SR[rt] & 0x00200000) << 13);
|
|
*SP_STATUS_REG |= (!!(SR[rt] & 0x00400000) << 13);
|
|
*SP_STATUS_REG &= ~(!!(SR[rt] & 0x00800000) << 14);
|
|
*SP_STATUS_REG |= (!!(SR[rt] & 0x01000000) << 14);
|
|
return;
|
|
}
|
|
static void MT_SP_RESERVED(unsigned int rt)
|
|
{
|
|
const u32 source = SR[rt] & 0x00000000ul; /* forced (zilmar, dox) */
|
|
|
|
GET_RCP_REG(SP_SEMAPHORE_REG) = source;
|
|
return;
|
|
}
|
|
static void MT_CMD_START(unsigned int rt)
|
|
{
|
|
const u32 source = SR[rt] & 0xFFFFFFF8ul; /* Funnelcube demo by marshallh */
|
|
|
|
if (GET_RCP_REG(DPC_BUFBUSY_REG)) /* lock hazards not implemented */
|
|
message("MTC0\nCMD_START");
|
|
GET_RCP_REG(DPC_END_REG)
|
|
= GET_RCP_REG(DPC_CURRENT_REG)
|
|
= GET_RCP_REG(DPC_START_REG)
|
|
= source;
|
|
return;
|
|
}
|
|
static void MT_CMD_END(unsigned int rt)
|
|
{
|
|
if (GET_RCP_REG(DPC_BUFBUSY_REG))
|
|
message("MTC0\nCMD_END"); /* This is just CA-related. */
|
|
GET_RCP_REG(DPC_END_REG) = SR[rt] & 0xFFFFFFF8ul;
|
|
if (GET_RSP_INFO(ProcessRdpList) == NULL) /* zilmar GFX #1.2 */
|
|
return;
|
|
GET_RSP_INFO(ProcessRdpList)();
|
|
return;
|
|
}
|
|
static void MT_CMD_STATUS(unsigned int rt)
|
|
{
|
|
pu32 DPC_STATUS_REG;
|
|
|
|
if (SR[rt] & 0xFFFFFD80ul) /* unsupported or reserved bits */
|
|
message("MTC0\nCMD_STATUS");
|
|
DPC_STATUS_REG = GET_RSP_INFO(DPC_STATUS_REG);
|
|
|
|
*DPC_STATUS_REG &= ~(!!(SR[rt] & 0x00000001) << 0);
|
|
*DPC_STATUS_REG |= (!!(SR[rt] & 0x00000002) << 0);
|
|
*DPC_STATUS_REG &= ~(!!(SR[rt] & 0x00000004) << 1);
|
|
*DPC_STATUS_REG |= (!!(SR[rt] & 0x00000008) << 1);
|
|
*DPC_STATUS_REG &= ~(!!(SR[rt] & 0x00000010) << 2);
|
|
*DPC_STATUS_REG |= (!!(SR[rt] & 0x00000020) << 2);
|
|
/* Some NUS-CIC-6105 SP tasks try to clear some DPC cycle timers. */
|
|
GET_RCP_REG(DPC_TMEM_REG) &= !(SR[rt] & 0x00000040) ? ~0u : 0u;
|
|
/* GET_RCP_REG(DPC_PIPEBUSY_REG) &= !(SR[rt] & 0x00000080) ? ~0u : 0u; */
|
|
/* GET_RCP_REG(DPC_BUFBUSY_REG) &= !(SR[rt] & 0x00000100) ? ~0u : 0u; */
|
|
GET_RCP_REG(DPC_CLOCK_REG) &= !(SR[rt] & 0x00000200) ? ~0u : 0u;
|
|
return;
|
|
}
|
|
static void MT_CMD_CLOCK(unsigned int rt)
|
|
{
|
|
message("MTC0\nCMD_CLOCK"); /* read-only?? */
|
|
GET_RCP_REG(DPC_CLOCK_REG) = SR[rt];
|
|
return; /* Appendix says this is RW; elsewhere it says R. */
|
|
}
|
|
static void MT_READ_ONLY(unsigned int rt)
|
|
{
|
|
static char write_to_read_only[] = "Invalid MTC0 from SR[00].";
|
|
|
|
write_to_read_only[21] = '0' + (unsigned char)rt/10;
|
|
write_to_read_only[22] = '0' + (unsigned char)rt%10;
|
|
message(write_to_read_only);
|
|
return;
|
|
}
|
|
|
|
static void (*SP_CP0_MT[NUMBER_OF_CP0_REGISTERS])(unsigned int) = {
|
|
MT_DMA_CACHE ,MT_DMA_DRAM ,MT_DMA_READ_LENGTH ,MT_DMA_WRITE_LENGTH,
|
|
MT_SP_STATUS ,MT_READ_ONLY ,MT_READ_ONLY ,MT_SP_RESERVED,
|
|
MT_CMD_START ,MT_CMD_END ,MT_READ_ONLY ,MT_CMD_STATUS,
|
|
MT_CMD_CLOCK ,MT_READ_ONLY ,MT_READ_ONLY ,MT_READ_ONLY
|
|
};
|
|
|
|
void SP_DMA_READ(void)
|
|
{
|
|
unsigned int offC, offD; /* SP cache and dynamic DMA pointers */
|
|
register unsigned int length;
|
|
register unsigned int count;
|
|
register unsigned int skip;
|
|
|
|
length = (GET_RCP_REG(SP_RD_LEN_REG) & 0x00000FFFul) >> 0;
|
|
count = (GET_RCP_REG(SP_RD_LEN_REG) & 0x000FF000ul) >> 12;
|
|
skip = (GET_RCP_REG(SP_RD_LEN_REG) & 0xFFF00000ul) >> 20;
|
|
#ifdef _DEBUG
|
|
length |= 07; /* already corrected by mtc0 */
|
|
#endif
|
|
++length;
|
|
++count;
|
|
skip += length;
|
|
do {
|
|
register unsigned int i;
|
|
|
|
i = 0;
|
|
--count;
|
|
do {
|
|
offC = (count*length + *CR[0x0] + i) & 0x00001FF8ul;
|
|
offD = (count*skip + *CR[0x1] + i) & 0x00FFFFF8ul;
|
|
*(pi64)(DMEM + offC) =
|
|
*(pi64)(DRAM + offD)
|
|
& (offD & ~MAX_DRAM_DMA_ADDR ? 0 : ~0) /* 0 if (addr > limit) */
|
|
;
|
|
i += 0x008;
|
|
} while (i < length);
|
|
} while (count);
|
|
|
|
if ((*CR[0x0] & 0x1000) ^ (offC & 0x1000))
|
|
message("DMA over the DMEM-to-IMEM gap.");
|
|
GET_RCP_REG(SP_DMA_BUSY_REG) = 0x00000000;
|
|
GET_RCP_REG(SP_STATUS_REG) &= ~SP_STATUS_DMA_BUSY;
|
|
return;
|
|
}
|
|
void SP_DMA_WRITE(void)
|
|
{
|
|
unsigned int offC, offD; /* SP cache and dynamic DMA pointers */
|
|
register unsigned int length;
|
|
register unsigned int count;
|
|
register unsigned int skip;
|
|
|
|
length = (GET_RCP_REG(SP_WR_LEN_REG) & 0x00000FFFul) >> 0;
|
|
count = (GET_RCP_REG(SP_WR_LEN_REG) & 0x000FF000ul) >> 12;
|
|
skip = (GET_RCP_REG(SP_WR_LEN_REG) & 0xFFF00000ul) >> 20;
|
|
|
|
#ifdef _DEBUG
|
|
length |= 07; /* already corrected by mtc0 */
|
|
#endif
|
|
++length;
|
|
++count;
|
|
skip += length;
|
|
do {
|
|
register unsigned int i;
|
|
|
|
i = 0;
|
|
--count;
|
|
do {
|
|
offC = (count*length + *CR[0x0] + i) & 0x00001FF8ul;
|
|
offD = (count*skip + *CR[0x1] + i) & 0x00FFFFF8ul;
|
|
*(pi64)(DRAM + offD) = *(pi64)(DMEM + offC);
|
|
i += 0x000008;
|
|
} while (i < length);
|
|
} while (count);
|
|
|
|
if ((*CR[0x0] & 0x1000) ^ (offC & 0x1000))
|
|
message("DMA over the DMEM-to-IMEM gap.");
|
|
GET_RCP_REG(SP_DMA_BUSY_REG) = 0x00000000;
|
|
GET_RCP_REG(SP_STATUS_REG) &= ~SP_STATUS_DMA_BUSY;
|
|
return;
|
|
}
|
|
|
|
/*** scalar, R4000 control flow manipulation ***/
|
|
|
|
static INLINE void J(u32 inst)
|
|
{
|
|
set_PC(4 * inst);
|
|
}
|
|
|
|
static INLINE void JAL(u32 inst, u32 PC)
|
|
{
|
|
SR[ra] = FIT_IMEM(PC + LINK_OFF);
|
|
set_PC(4 * inst);
|
|
}
|
|
|
|
static INLINE int BEQ(u32 inst, u32 PC)
|
|
{
|
|
const unsigned int rs = (inst >> 21) % (1 << 5);
|
|
const unsigned int rt = (inst >> 16) % (1 << 5);
|
|
|
|
if (!(SR[rs] == SR[rt]))
|
|
return 0;
|
|
set_PC(PC + 4*inst + SLOT_OFF);
|
|
return 1;
|
|
}
|
|
static INLINE int BNE(u32 inst, u32 PC)
|
|
{
|
|
const unsigned int rs = (inst >> 21) % (1 << 5);
|
|
const unsigned int rt = (inst >> 16) % (1 << 5);
|
|
|
|
if (!(SR[rs] != SR[rt]))
|
|
return 0;
|
|
set_PC(PC + 4*inst + SLOT_OFF);
|
|
return 1;
|
|
}
|
|
static INLINE int BLEZ(u32 inst, u32 PC)
|
|
{
|
|
const unsigned int rs = (inst >> 21) % (1 << 5);
|
|
|
|
if (!((s32)SR[rs] <= 0))
|
|
return 0;
|
|
set_PC(PC + 4*inst + SLOT_OFF);
|
|
return 1;
|
|
}
|
|
static INLINE int BGTZ(u32 inst, u32 PC)
|
|
{
|
|
const unsigned int rs = (inst >> 21) % (1 << 5);
|
|
|
|
if (!((s32)SR[rs] > 0))
|
|
return 0;
|
|
set_PC(PC + 4*inst + SLOT_OFF);
|
|
return 1;
|
|
}
|
|
|
|
/*** scalar, R4000 bit-wise logical operations ***/
|
|
|
|
static INLINE void ANDI(u32 inst)
|
|
{
|
|
const u16 immediate = (u16)(inst & 0x0000FFFFu);
|
|
const unsigned int rs = (inst >> 21) % (1 << 5);
|
|
const unsigned int rt = (inst >> 16) % (1 << 5);
|
|
|
|
SR[rt] = SR[rs] & immediate;
|
|
SR[zero] = 0x00000000;
|
|
}
|
|
static INLINE void ORI(u32 inst)
|
|
{
|
|
const u16 immediate = (u16)(inst & 0x0000FFFFu);
|
|
const unsigned int rs = (inst >> 21) % (1 << 5);
|
|
const unsigned int rt = (inst >> 16) % (1 << 5);
|
|
|
|
SR[rt] = SR[rs] | immediate;
|
|
SR[zero] = 0x00000000;
|
|
}
|
|
static INLINE void XORI(u32 inst)
|
|
{
|
|
const u16 immediate = (u16)(inst & 0x0000FFFFu);
|
|
const unsigned int rs = (inst >> 21) % (1 << 5);
|
|
const unsigned int rt = (inst >> 16) % (1 << 5);
|
|
|
|
SR[rt] = SR[rs] ^ immediate;
|
|
SR[zero] = 0x00000000;
|
|
}
|
|
static INLINE void LUI(u32 inst)
|
|
{
|
|
const u16 immediate = (u16)(inst & 0x0000FFFFu);
|
|
const unsigned int rt = (inst >> 16) % (1 << 5);
|
|
|
|
SR[rt] = (u32)immediate << 16; /* or: SR[rt] = 0; SR[rt]31..16 = imm; */
|
|
SR[zero] = 0x00000000;
|
|
}
|
|
|
|
/*** scalar, R4000 arithmetic operations ***/
|
|
|
|
static INLINE void ADDIU(u32 inst)
|
|
{
|
|
const u16 immediate = (u16)(inst & 0x0000FFFFu);
|
|
const unsigned int rs = (inst >> 21) % (1 << 5);
|
|
const unsigned int rt = (inst >> 16) % (1 << 5);
|
|
|
|
SR[rt] = SR[rs] + (s16)(immediate);
|
|
SR[zero] = 0x00000000;
|
|
}
|
|
static INLINE void SLTI(u32 inst)
|
|
{
|
|
const u16 immediate = (u16)(inst & 0x0000FFFFu);
|
|
const unsigned int rs = (inst >> 21) % (1 << 5);
|
|
const unsigned int rt = (inst >> 16) % (1 << 5);
|
|
|
|
SR[rt] = ((s32)(SR[rs]) < (s16)(immediate)) ? 1 : 0;
|
|
SR[zero] = 0x00000000;
|
|
}
|
|
static INLINE void SLTIU(u32 inst)
|
|
{
|
|
const u16 immediate = (u16)(inst & 0x0000FFFFu);
|
|
const unsigned int rs = (inst >> 21) % (1 << 5);
|
|
const unsigned int rt = (inst >> 16) % (1 << 5);
|
|
|
|
SR[rt] = ((u32)(SR[rs]) < (u16)(immediate)) ? 1 : 0;
|
|
SR[zero] = 0x00000000;
|
|
}
|
|
|
|
/*** scalar, R4000 memory loads and stores ***/
|
|
|
|
static INLINE void LB(u32 inst)
|
|
{
|
|
u32 addr;
|
|
const s16 offset = (s16)(inst & 0x0000FFFFul);
|
|
const unsigned int base = (inst >> 21) % (1 << 5);
|
|
const unsigned int rt = (inst >> 16) % (1 << 5);
|
|
|
|
addr = SR[base] + offset;
|
|
SR[rt] = DMEM[BES(addr) & 0x00000FFFul];
|
|
SR[rt] = (s8)SR[rt];
|
|
SR[zero] = 0x00000000;
|
|
}
|
|
static INLINE void LH(u32 inst)
|
|
{
|
|
u32 addr;
|
|
const s16 offset = (s16)(inst & 0x0000FFFFul);
|
|
const unsigned int base = (inst >> 21) % (1 << 5);
|
|
const unsigned int rt = (inst >> 16) % (1 << 5);
|
|
|
|
addr = SR[base] + offset;
|
|
SR[rt] = 0x00000000
|
|
| DMEM[BES(addr + 0) & 0x00000FFFul] << 8
|
|
| DMEM[BES(addr + 1) & 0x00000FFFul] << 0
|
|
;
|
|
SR[rt] = (s16)SR[rt];
|
|
SR[zero] = 0x00000000;
|
|
}
|
|
static INLINE void LW(u32 inst)
|
|
{
|
|
u32 addr;
|
|
const s16 offset = (s16)(inst & 0x0000FFFFul);
|
|
const unsigned int base = (inst >> 21) % (1 << 5);
|
|
const unsigned int rt = (inst >> 16) % (1 << 5);
|
|
|
|
addr = SR[base] + offset;
|
|
SR_B(rt, 0) = DMEM[BES(addr + 0) & 0x00000FFFul];
|
|
SR_B(rt, 1) = DMEM[BES(addr + 1) & 0x00000FFFul];
|
|
SR_B(rt, 2) = DMEM[BES(addr + 2) & 0x00000FFFul];
|
|
SR_B(rt, 3) = DMEM[BES(addr + 3) & 0x00000FFFul];
|
|
SR[zero] = 0x00000000;
|
|
}
|
|
static INLINE void LBU(u32 inst)
|
|
{
|
|
u32 addr;
|
|
const s16 offset = (s16)(inst & 0x0000FFFFul);
|
|
const unsigned int base = (inst >> 21) % (1 << 5);
|
|
const unsigned int rt = (inst >> 16) % (1 << 5);
|
|
|
|
addr = SR[base] + offset;
|
|
SR[rt] = DMEM[BES(addr) & 0x00000FFFul];
|
|
SR[zero] = 0x00000000;
|
|
}
|
|
static INLINE void LHU(u32 inst)
|
|
{
|
|
u32 addr;
|
|
const s16 offset = (s16)(inst & 0x0000FFFFul);
|
|
const unsigned int base = (inst >> 21) % (1 << 5);
|
|
const unsigned int rt = (inst >> 16) % (1 << 5);
|
|
|
|
addr = SR[base] + offset;
|
|
SR[rt] = 0x00000000
|
|
| DMEM[BES(addr + 0) & 0x00000FFFul] << 8
|
|
| DMEM[BES(addr + 1) & 0x00000FFFul] << 0
|
|
;
|
|
SR[zero] = 0x00000000;
|
|
}
|
|
|
|
static INLINE void SB(u32 inst)
|
|
{
|
|
u32 addr;
|
|
const s16 offset = (s16)(inst & 0x0000FFFFul);
|
|
const unsigned int base = (inst >> 21) % (1 << 5);
|
|
const unsigned int rt = (inst >> 16) % (1 << 5);
|
|
|
|
addr = SR[base] + offset;
|
|
DMEM[BES(addr) & 0x00000FFFul] = (u8)(SR[rt] & 0xFFu);
|
|
}
|
|
static INLINE void SH(u32 inst)
|
|
{
|
|
u32 addr;
|
|
const s16 offset = (s16)(inst & 0x0000FFFFul);
|
|
const unsigned int base = (inst >> 21) % (1 << 5);
|
|
const unsigned int rt = (inst >> 16) % (1 << 5);
|
|
|
|
addr = SR[base] + offset;
|
|
DMEM[BES(addr + 0) & 0x00000FFFul] = SR_B(rt, 2);
|
|
DMEM[BES(addr + 1) & 0x00000FFFul] = SR_B(rt, 3);
|
|
}
|
|
static INLINE void SW(u32 inst)
|
|
{
|
|
u32 addr;
|
|
const s16 offset = (s16)(inst & 0x0000FFFFul);
|
|
const unsigned int base = (inst >> 21) % (1 << 5);
|
|
const unsigned int rt = (inst >> 16) % (1 << 5);
|
|
|
|
addr = SR[base] + offset;
|
|
DMEM[BES(addr + 0) & 0x00000FFFul] = SR_B(rt, 0);
|
|
DMEM[BES(addr + 1) & 0x00000FFFul] = SR_B(rt, 1);
|
|
DMEM[BES(addr + 2) & 0x00000FFFul] = SR_B(rt, 2);
|
|
DMEM[BES(addr + 3) & 0x00000FFFul] = SR_B(rt, 3);
|
|
}
|
|
|
|
/*** scalar, coprocessor operations (vector unit) ***/
|
|
|
|
u16 rwR_VCE(void)
|
|
{ /* never saw a game try to read VCE out to a scalar GPR yet */
|
|
register u16 ret_slot;
|
|
|
|
ret_slot = 0x00 | (u16)get_VCE();
|
|
return (ret_slot);
|
|
}
|
|
void rwW_VCE(u16 vce)
|
|
{ /* never saw a game try to write VCE using a scalar GPR yet */
|
|
register int i;
|
|
|
|
vce = 0x00 | (vce & 0xFF);
|
|
for (i = 0; i < 8; i++)
|
|
cf_vce[i] = (vce >> i) & 1;
|
|
return;
|
|
}
|
|
|
|
static u16 (*R_VCF[4])(void) = {
|
|
get_VCO,get_VCC,rwR_VCE,rwR_VCE,
|
|
};
|
|
static void (*W_VCF[4])(u16) = {
|
|
set_VCO,set_VCC,rwW_VCE,rwW_VCE,
|
|
};
|
|
void MFC2(unsigned int rt, unsigned int vs, unsigned int e)
|
|
{
|
|
SR_B(rt, 2) = VR_B(vs, e);
|
|
e = (e + 0x1) & 0xF;
|
|
SR_B(rt, 3) = VR_B(vs, e);
|
|
SR[rt] = (s16)(SR[rt]);
|
|
SR[zero] = 0x00000000;
|
|
return;
|
|
}
|
|
void MTC2(unsigned int rt, unsigned int vd, unsigned int e)
|
|
{
|
|
VR_B(vd, e+0x0) = SR_B(rt, 2);
|
|
VR_B(vd, e+0x1) = SR_B(rt, 3);
|
|
return; /* If element == 0xF, it does not matter; loads do not wrap over. */
|
|
}
|
|
void CFC2(unsigned int rt, unsigned int rd)
|
|
{
|
|
SR[rt] = (s16)R_VCF[rd & 3]();
|
|
SR[zero] = 0x00000000;
|
|
return;
|
|
}
|
|
void CTC2(unsigned int rt, unsigned int rd)
|
|
{
|
|
W_VCF[rd & 3](SR[rt] & 0x0000FFFF);
|
|
return;
|
|
}
|
|
|
|
/*** scalar, coprocessor operations (vector unit, scalar cache transfers) ***/
|
|
|
|
void LBV(unsigned vt, unsigned element, signed offset, unsigned base)
|
|
{
|
|
register u32 addr;
|
|
const unsigned int e = element;
|
|
|
|
addr = (SR[base] + 1*offset) & 0x00000FFF;
|
|
VR_B(vt, e) = DMEM[BES(addr)];
|
|
return;
|
|
}
|
|
void LSV(unsigned vt, unsigned element, signed offset, unsigned base)
|
|
{
|
|
signed int correction;
|
|
register u32 addr;
|
|
const unsigned int e = element;
|
|
|
|
if (e & 0x1) {
|
|
message("LSV\nIllegal element.");
|
|
return;
|
|
}
|
|
addr = (SR[base] + 2*offset) & 0x00000FFF;
|
|
correction = (signed)(addr % 0x004);
|
|
if (correction == 0x003) {
|
|
message("LSV\nWeird addr.");
|
|
return;
|
|
}
|
|
correction = (correction - 1) * HES(0x000);
|
|
VR_S(vt, e) = *(pi16)(DMEM + addr - correction);
|
|
return;
|
|
}
|
|
void LLV(unsigned vt, unsigned element, signed offset, unsigned base)
|
|
{
|
|
signed int correction;
|
|
register u32 addr;
|
|
const unsigned int e = element;
|
|
|
|
if (e & 0x1) {
|
|
message("LLV\nOdd element.");
|
|
return;
|
|
} /* Illegal (but still even) elements are used by Boss Game Studios. */
|
|
addr = (SR[base] + 4*offset) & 0x00000FFF;
|
|
if (addr & 0x00000001) {
|
|
VR_A(vt, e+0x0) = DMEM[BES(addr)];
|
|
addr = (addr + 0x00000001) & 0x00000FFF;
|
|
VR_U(vt, e+0x1) = DMEM[BES(addr)];
|
|
addr = (addr + 0x00000001) & 0x00000FFF;
|
|
VR_A(vt, e+0x2) = DMEM[BES(addr)];
|
|
addr = (addr + 0x00000001) & 0x00000FFF;
|
|
VR_U(vt, e+0x3) = DMEM[BES(addr)];
|
|
return;
|
|
} /* branch very unlikely: "Star Wars: Battle for Naboo" unaligned addr */
|
|
correction = HES(0x000)*(addr%0x004 - 1);
|
|
VR_S(vt, e+0x0) = *(pi16)(DMEM + addr - correction);
|
|
addr = (addr + 0x00000002) & 0x00000FFF; /* F3DLX 1.23: addr%4 is 0x002. */
|
|
VR_S(vt, e+0x2) = *(pi16)(DMEM + addr + correction);
|
|
return;
|
|
}
|
|
void LDV(unsigned vt, unsigned element, signed offset, unsigned base)
|
|
{
|
|
register u32 addr;
|
|
const unsigned int e = element;
|
|
|
|
if (e & 0x1) {
|
|
message("LDV\nOdd element.");
|
|
return;
|
|
} /* Illegal (but still even) elements are used by Boss Game Studios. */
|
|
addr = (SR[base] + 8*offset) & 0x00000FFF;
|
|
|
|
switch (addr & 07) {
|
|
case 00:
|
|
VR_S(vt, e+0x0) = *(pi16)(DMEM + addr + HES(0x000));
|
|
VR_S(vt, e+0x2) = *(pi16)(DMEM + addr + HES(0x002));
|
|
VR_S(vt, e+0x4) = *(pi16)(DMEM + addr + HES(0x004));
|
|
VR_S(vt, e+0x6) = *(pi16)(DMEM + addr + HES(0x006));
|
|
break;
|
|
case 01: /* standard ABI ucodes (unlike e.g. MusyX w/ even addresses) */
|
|
VR_S(vt, e+0x0) = *(pi16)(DMEM + addr + 0x000);
|
|
VR_A(vt, e+0x2) = DMEM[addr + 0x002 - BES(0x000)];
|
|
VR_U(vt, e+0x3) = DMEM[addr + 0x003 + BES(0x000)];
|
|
VR_S(vt, e+0x4) = *(pi16)(DMEM + addr + 0x004);
|
|
VR_A(vt, e+0x6) = DMEM[addr + 0x006 - BES(0x000)];
|
|
addr += 0x007 + BES(00);
|
|
addr &= 0x00000FFF;
|
|
VR_U(vt, e+0x7) = DMEM[addr];
|
|
break;
|
|
case 02:
|
|
VR_S(vt, e+0x0) = *(pi16)(DMEM + addr + 0x000 - HES(0x000));
|
|
VR_S(vt, e+0x2) = *(pi16)(DMEM + addr + 0x002 + HES(0x000));
|
|
VR_S(vt, e+0x4) = *(pi16)(DMEM + addr + 0x004 - HES(0x000));
|
|
addr += 0x006 + HES(00);
|
|
addr &= 0x00000FFF;
|
|
VR_S(vt, e+0x6) = *(pi16)(DMEM + addr);
|
|
break;
|
|
case 03: /* standard ABI ucodes (unlike e.g. MusyX w/ even addresses) */
|
|
VR_A(vt, e+0x0) = DMEM[addr + 0x000 - BES(0x000)];
|
|
VR_U(vt, e+0x1) = DMEM[addr + 0x001 + BES(0x000)];
|
|
VR_S(vt, e+0x2) = *(pi16)(DMEM + addr + 0x002);
|
|
VR_A(vt, e+0x4) = DMEM[addr + 0x004 - BES(0x000)];
|
|
addr += 0x005 + BES(00);
|
|
addr &= 0x00000FFF;
|
|
VR_U(vt, e+0x5) = DMEM[addr];
|
|
VR_S(vt, e+0x6) = *(pi16)(DMEM + addr + 0x001 - BES(0x000));
|
|
break;
|
|
case 04:
|
|
VR_S(vt, e+0x0) = *(pi16)(DMEM + addr + HES(0x000));
|
|
VR_S(vt, e+0x2) = *(pi16)(DMEM + addr + HES(0x002));
|
|
addr += 0x004 + WES(00);
|
|
addr &= 0x00000FFF;
|
|
VR_S(vt, e+0x4) = *(pi16)(DMEM + addr + HES(0x000));
|
|
VR_S(vt, e+0x6) = *(pi16)(DMEM + addr + HES(0x002));
|
|
break;
|
|
case 05: /* standard ABI ucodes (unlike e.g. MusyX w/ even addresses) */
|
|
VR_S(vt, e+0x0) = *(pi16)(DMEM + addr + 0x000);
|
|
VR_A(vt, e+0x2) = DMEM[addr + 0x002 - BES(0x000)];
|
|
addr += 0x003;
|
|
addr &= 0x00000FFF;
|
|
VR_U(vt, e+0x3) = DMEM[addr + BES(0x000)];
|
|
VR_S(vt, e+0x4) = *(pi16)(DMEM + addr + 0x001);
|
|
VR_A(vt, e+0x6) = DMEM[addr + BES(0x003)];
|
|
VR_U(vt, e+0x7) = DMEM[addr + BES(0x004)];
|
|
break;
|
|
case 06:
|
|
VR_S(vt, e+0x0) = *(pi16)(DMEM + addr - HES(0x000));
|
|
addr += 0x002;
|
|
addr &= 0x00000FFF;
|
|
VR_S(vt, e+0x2) = *(pi16)(DMEM + addr + HES(0x000));
|
|
VR_S(vt, e+0x4) = *(pi16)(DMEM + addr + HES(0x002));
|
|
VR_S(vt, e+0x6) = *(pi16)(DMEM + addr + HES(0x004));
|
|
break;
|
|
case 07: /* standard ABI ucodes (unlike e.g. MusyX w/ even addresses) */
|
|
VR_A(vt, e+0x0) = DMEM[addr - BES(0x000)];
|
|
addr += 0x001;
|
|
addr &= 0x00000FFF;
|
|
VR_U(vt, e+0x1) = DMEM[addr + BES(0x000)];
|
|
VR_S(vt, e+0x2) = *(pi16)(DMEM + addr + 0x001);
|
|
VR_A(vt, e+0x4) = DMEM[addr + BES(0x003)];
|
|
VR_U(vt, e+0x5) = DMEM[addr + BES(0x004)];
|
|
VR_S(vt, e+0x6) = *(pi16)(DMEM + addr + 0x005);
|
|
break;
|
|
}
|
|
return;
|
|
}
|
|
void SBV(unsigned vt, unsigned element, signed offset, unsigned base)
|
|
{
|
|
register u32 addr;
|
|
const unsigned int e = element;
|
|
|
|
addr = (SR[base] + 1*offset) & 0x00000FFF;
|
|
DMEM[BES(addr)] = VR_B(vt, e);
|
|
return;
|
|
}
|
|
void SSV(unsigned vt, unsigned element, signed offset, unsigned base)
|
|
{
|
|
register u32 addr;
|
|
const unsigned int e = element;
|
|
|
|
addr = (SR[base] + 2*offset) & 0x00000FFF;
|
|
DMEM[BES(addr)] = VR_B(vt, (e + 0x0));
|
|
addr = (addr + 0x00000001) & 0x00000FFF;
|
|
DMEM[BES(addr)] = VR_B(vt, (e + 0x1) & 0xF);
|
|
return;
|
|
}
|
|
void SLV(unsigned vt, unsigned element, signed offset, unsigned base)
|
|
{
|
|
signed int correction;
|
|
register u32 addr;
|
|
const unsigned int e = element;
|
|
|
|
if ((e & 0x1) || e > 0xC) {
|
|
message("SLV\nIllegal element.");
|
|
return;
|
|
} /* must support illegal even elements in F3DEX2 */
|
|
addr = (SR[base] + 4*offset) & 0x00000FFF;
|
|
if (addr & 0x00000001) {
|
|
message("SLV\nOdd addr.");
|
|
return;
|
|
}
|
|
correction = HES(0x000)*(addr%0x004 - 1);
|
|
*(pi16)(DMEM + addr - correction) = VR_S(vt, e+0x0);
|
|
addr = (addr + 0x00000002) & 0x00000FFF; /* F3DLX 0.95: "Mario Kart 64" */
|
|
*(pi16)(DMEM + addr + correction) = VR_S(vt, e+0x2);
|
|
return;
|
|
}
|
|
void SDV(unsigned vt, unsigned element, signed offset, unsigned base)
|
|
{
|
|
register u32 addr;
|
|
const unsigned int e = element;
|
|
|
|
addr = (SR[base] + 8*offset) & 0x00000FFF;
|
|
if (e > 0x8 || (e & 0x1)) {
|
|
register unsigned int i;
|
|
|
|
#if (VR_STATIC_WRAPAROUND == 1)
|
|
vector_copy(VR[vt] + N, VR[vt]);
|
|
for (i = 0; i < 8; i++)
|
|
DMEM[BES(addr++ & 0x00000FFF)] = VR_B(vt, e + i);
|
|
#else
|
|
for (i = 0; i < 8; i++)
|
|
DMEM[BES(addr++ & 0x00000FFF)] = VR_B(vt, (e+i)&0xF);
|
|
#endif
|
|
return;
|
|
} /* Illegal elements with Boss Game Studios publications. */
|
|
switch (addr & 07) {
|
|
case 00:
|
|
*(pi16)(DMEM + addr + HES(0x000)) = VR_S(vt, e+0x0);
|
|
*(pi16)(DMEM + addr + HES(0x002)) = VR_S(vt, e+0x2);
|
|
*(pi16)(DMEM + addr + HES(0x004)) = VR_S(vt, e+0x4);
|
|
*(pi16)(DMEM + addr + HES(0x006)) = VR_S(vt, e+0x6);
|
|
break;
|
|
case 01: /* "Tetrisphere" audio ucode */
|
|
*(pi16)(DMEM + addr + 0x000) = VR_S(vt, e+0x0);
|
|
DMEM[addr + 0x002 - BES(0x000)] = VR_A(vt, e+0x2);
|
|
DMEM[addr + 0x003 + BES(0x000)] = VR_U(vt, e+0x3);
|
|
*(pi16)(DMEM + addr + 0x004) = VR_S(vt, e+0x4);
|
|
DMEM[addr + 0x006 - BES(0x000)] = VR_A(vt, e+0x6);
|
|
addr += 0x007 + BES(0x000);
|
|
addr &= 0x00000FFF;
|
|
DMEM[addr] = VR_U(vt, e+0x7);
|
|
break;
|
|
case 02:
|
|
*(pi16)(DMEM + addr + 0x000 - HES(0x000)) = VR_S(vt, e+0x0);
|
|
*(pi16)(DMEM + addr + 0x002 + HES(0x000)) = VR_S(vt, e+0x2);
|
|
*(pi16)(DMEM + addr + 0x004 - HES(0x000)) = VR_S(vt, e+0x4);
|
|
addr += 0x006 + HES(0x000);
|
|
addr &= 0x00000FFF;
|
|
*(pi16)(DMEM + addr) = VR_S(vt, e+0x6);
|
|
break;
|
|
case 03: /* "Tetrisphere" audio ucode */
|
|
DMEM[addr + 0x000 - BES(0x000)] = VR_A(vt, e+0x0);
|
|
DMEM[addr + 0x001 + BES(0x000)] = VR_U(vt, e+0x1);
|
|
*(pi16)(DMEM + addr + 0x002) = VR_S(vt, e+0x2);
|
|
DMEM[addr + 0x004 - BES(0x000)] = VR_A(vt, e+0x4);
|
|
addr += 0x005 + BES(0x000);
|
|
addr &= 0x00000FFF;
|
|
DMEM[addr] = VR_U(vt, e+0x5);
|
|
*(pi16)(DMEM + addr + 0x001 - BES(0x000)) = VR_S(vt, 0x6);
|
|
break;
|
|
case 04:
|
|
*(pi16)(DMEM + addr + HES(0x000)) = VR_S(vt, e+0x0);
|
|
*(pi16)(DMEM + addr + HES(0x002)) = VR_S(vt, e+0x2);
|
|
addr = (addr + 0x004) & 0x00000FFF;
|
|
*(pi16)(DMEM + addr + HES(0x000)) = VR_S(vt, e+0x4);
|
|
*(pi16)(DMEM + addr + HES(0x002)) = VR_S(vt, e+0x6);
|
|
break;
|
|
case 05: /* "Tetrisphere" audio ucode */
|
|
*(pi16)(DMEM + addr + 0x000) = VR_S(vt, e+0x0);
|
|
DMEM[addr + 0x002 - BES(0x000)] = VR_A(vt, e+0x2);
|
|
addr = (addr + 0x003) & 0x00000FFF;
|
|
DMEM[addr + BES(0x000)] = VR_U(vt, e+0x3);
|
|
*(pi16)(DMEM + addr + 0x001) = VR_S(vt, e+0x4);
|
|
DMEM[addr + BES(0x003)] = VR_A(vt, e+0x6);
|
|
DMEM[addr + BES(0x004)] = VR_U(vt, e+0x7);
|
|
break;
|
|
case 06:
|
|
*(pi16)(DMEM + addr - HES(0x000)) = VR_S(vt, e+0x0);
|
|
addr = (addr + 0x002) & 0x00000FFF;
|
|
*(pi16)(DMEM + addr + HES(0x000)) = VR_S(vt, e+0x2);
|
|
*(pi16)(DMEM + addr + HES(0x002)) = VR_S(vt, e+0x4);
|
|
*(pi16)(DMEM + addr + HES(0x004)) = VR_S(vt, e+0x6);
|
|
break;
|
|
case 07: /* "Tetrisphere" audio ucode */
|
|
DMEM[addr - BES(0x000)] = VR_A(vt, e+0x0);
|
|
addr = (addr + 0x001) & 0x00000FFF;
|
|
DMEM[addr + BES(0x000)] = VR_U(vt, e+0x1);
|
|
*(pi16)(DMEM + addr + 0x001) = VR_S(vt, e+0x2);
|
|
DMEM[addr + BES(0x003)] = VR_A(vt, e+0x4);
|
|
DMEM[addr + BES(0x004)] = VR_U(vt, e+0x5);
|
|
*(pi16)(DMEM + addr + 0x005) = VR_S(vt, e+0x6);
|
|
break;
|
|
}
|
|
return;
|
|
}
|
|
|
|
static char transfer_debug[32] = "?WC2 $v00[0x0], 0x000($00)";
|
|
static const char digits[16] = {
|
|
'0','1','2','3','4','5','6','7','8','9','A','B','C','D','E','F'
|
|
};
|
|
|
|
NOINLINE void res_lsw(
|
|
unsigned vt,
|
|
unsigned element,
|
|
signed offset,
|
|
unsigned base)
|
|
{
|
|
transfer_debug[10] = '0' + (unsigned char)vt/10;
|
|
transfer_debug[11] = '0' + (unsigned char)vt%10;
|
|
|
|
transfer_debug[15] = digits[element & 0xF];
|
|
|
|
transfer_debug[21] = digits[(offset & 0xFFF) >> 8];
|
|
transfer_debug[22] = digits[(offset & 0x0FF) >> 4];
|
|
transfer_debug[23] = digits[(offset & 0x00F) >> 0];
|
|
|
|
transfer_debug[26] = '0' + (unsigned char)base/10;
|
|
transfer_debug[27] = '0' + (unsigned char)base%10;
|
|
|
|
message(transfer_debug);
|
|
return;
|
|
}
|
|
|
|
/*
|
|
* Group II vector loads and stores:
|
|
* PV and UV (As of RCP implementation, XV and ZV are reserved opcodes.)
|
|
*/
|
|
void LPV(unsigned vt, unsigned element, signed offset, unsigned base)
|
|
{
|
|
register u32 addr;
|
|
register int b;
|
|
const unsigned int e = element;
|
|
|
|
if (e != 0x0) {
|
|
message("LPV\nIllegal element.");
|
|
return;
|
|
}
|
|
addr = (SR[base] + 8*offset) & 0x00000FFF;
|
|
b = addr & 07;
|
|
addr &= ~07;
|
|
switch (b) {
|
|
case 00:
|
|
VR[vt][07] = DMEM[addr + BES(0x007)] << 8;
|
|
VR[vt][06] = DMEM[addr + BES(0x006)] << 8;
|
|
VR[vt][05] = DMEM[addr + BES(0x005)] << 8;
|
|
VR[vt][04] = DMEM[addr + BES(0x004)] << 8;
|
|
VR[vt][03] = DMEM[addr + BES(0x003)] << 8;
|
|
VR[vt][02] = DMEM[addr + BES(0x002)] << 8;
|
|
VR[vt][01] = DMEM[addr + BES(0x001)] << 8;
|
|
VR[vt][00] = DMEM[addr + BES(0x000)] << 8;
|
|
break;
|
|
case 01: /* F3DZEX 2.08J "Doubutsu no Mori" (Animal Forest) CPU CFB */
|
|
VR[vt][00] = DMEM[addr + BES(0x001)] << 8;
|
|
VR[vt][01] = DMEM[addr + BES(0x002)] << 8;
|
|
VR[vt][02] = DMEM[addr + BES(0x003)] << 8;
|
|
VR[vt][03] = DMEM[addr + BES(0x004)] << 8;
|
|
VR[vt][04] = DMEM[addr + BES(0x005)] << 8;
|
|
VR[vt][05] = DMEM[addr + BES(0x006)] << 8;
|
|
VR[vt][06] = DMEM[addr + BES(0x007)] << 8;
|
|
addr += BES(0x008);
|
|
addr &= 0x00000FFF;
|
|
VR[vt][07] = DMEM[addr] << 8;
|
|
break;
|
|
case 02: /* F3DZEX 2.08J "Doubutsu no Mori" (Animal Forest) CPU CFB */
|
|
VR[vt][00] = DMEM[addr + BES(0x002)] << 8;
|
|
VR[vt][01] = DMEM[addr + BES(0x003)] << 8;
|
|
VR[vt][02] = DMEM[addr + BES(0x004)] << 8;
|
|
VR[vt][03] = DMEM[addr + BES(0x005)] << 8;
|
|
VR[vt][04] = DMEM[addr + BES(0x006)] << 8;
|
|
VR[vt][05] = DMEM[addr + BES(0x007)] << 8;
|
|
addr += 0x008;
|
|
addr &= 0x00000FFF;
|
|
VR[vt][06] = DMEM[addr + BES(0x000)] << 8;
|
|
VR[vt][07] = DMEM[addr + BES(0x001)] << 8;
|
|
break;
|
|
case 03: /* F3DZEX 2.08J "Doubutsu no Mori" (Animal Forest) CPU CFB */
|
|
VR[vt][00] = DMEM[addr + BES(0x003)] << 8;
|
|
VR[vt][01] = DMEM[addr + BES(0x004)] << 8;
|
|
VR[vt][02] = DMEM[addr + BES(0x005)] << 8;
|
|
VR[vt][03] = DMEM[addr + BES(0x006)] << 8;
|
|
VR[vt][04] = DMEM[addr + BES(0x007)] << 8;
|
|
addr += 0x008;
|
|
addr &= 0x00000FFF;
|
|
VR[vt][05] = DMEM[addr + BES(0x000)] << 8;
|
|
VR[vt][06] = DMEM[addr + BES(0x001)] << 8;
|
|
VR[vt][07] = DMEM[addr + BES(0x002)] << 8;
|
|
break;
|
|
case 04: /* "Resident Evil 2" in-game 3-D, F3DLX 2.08--"WWF No Mercy" */
|
|
VR[vt][00] = DMEM[addr + BES(0x004)] << 8;
|
|
VR[vt][01] = DMEM[addr + BES(0x005)] << 8;
|
|
VR[vt][02] = DMEM[addr + BES(0x006)] << 8;
|
|
VR[vt][03] = DMEM[addr + BES(0x007)] << 8;
|
|
addr += 0x008;
|
|
addr &= 0x00000FFF;
|
|
VR[vt][04] = DMEM[addr + BES(0x000)] << 8;
|
|
VR[vt][05] = DMEM[addr + BES(0x001)] << 8;
|
|
VR[vt][06] = DMEM[addr + BES(0x002)] << 8;
|
|
VR[vt][07] = DMEM[addr + BES(0x003)] << 8;
|
|
break;
|
|
case 05: /* F3DZEX 2.08J "Doubutsu no Mori" (Animal Forest) CPU CFB */
|
|
VR[vt][00] = DMEM[addr + BES(0x005)] << 8;
|
|
VR[vt][01] = DMEM[addr + BES(0x006)] << 8;
|
|
VR[vt][02] = DMEM[addr + BES(0x007)] << 8;
|
|
addr += 0x008;
|
|
addr &= 0x00000FFF;
|
|
VR[vt][03] = DMEM[addr + BES(0x000)] << 8;
|
|
VR[vt][04] = DMEM[addr + BES(0x001)] << 8;
|
|
VR[vt][05] = DMEM[addr + BES(0x002)] << 8;
|
|
VR[vt][06] = DMEM[addr + BES(0x003)] << 8;
|
|
VR[vt][07] = DMEM[addr + BES(0x004)] << 8;
|
|
break;
|
|
case 06: /* F3DZEX 2.08J "Doubutsu no Mori" (Animal Forest) CPU CFB */
|
|
VR[vt][00] = DMEM[addr + BES(0x006)] << 8;
|
|
VR[vt][01] = DMEM[addr + BES(0x007)] << 8;
|
|
addr += 0x008;
|
|
addr &= 0x00000FFF;
|
|
VR[vt][02] = DMEM[addr + BES(0x000)] << 8;
|
|
VR[vt][03] = DMEM[addr + BES(0x001)] << 8;
|
|
VR[vt][04] = DMEM[addr + BES(0x002)] << 8;
|
|
VR[vt][05] = DMEM[addr + BES(0x003)] << 8;
|
|
VR[vt][06] = DMEM[addr + BES(0x004)] << 8;
|
|
VR[vt][07] = DMEM[addr + BES(0x005)] << 8;
|
|
break;
|
|
case 07: /* F3DZEX 2.08J "Doubutsu no Mori" (Animal Forest) CPU CFB */
|
|
VR[vt][00] = DMEM[addr + BES(0x007)] << 8;
|
|
addr += 0x008;
|
|
addr &= 0x00000FFF;
|
|
VR[vt][01] = DMEM[addr + BES(0x000)] << 8;
|
|
VR[vt][02] = DMEM[addr + BES(0x001)] << 8;
|
|
VR[vt][03] = DMEM[addr + BES(0x002)] << 8;
|
|
VR[vt][04] = DMEM[addr + BES(0x003)] << 8;
|
|
VR[vt][05] = DMEM[addr + BES(0x004)] << 8;
|
|
VR[vt][06] = DMEM[addr + BES(0x005)] << 8;
|
|
VR[vt][07] = DMEM[addr + BES(0x006)] << 8;
|
|
break;
|
|
}
|
|
return;
|
|
}
|
|
void LUV(unsigned vt, unsigned element, signed offset, unsigned base)
|
|
{
|
|
register u32 addr;
|
|
register unsigned int b;
|
|
const unsigned int e = element;
|
|
|
|
addr = (SR[base] + 8*offset) & 0x00000FFF;
|
|
if (e != 0x0) {
|
|
addr += (~e + 0x1) & 0xF;
|
|
for (b = 0; b < 8; b++) {
|
|
VR[vt][b] = DMEM[BES(addr &= 0x00000FFF)] << 7;
|
|
addr -= 16 * (e - b - 1 == 0x0);
|
|
++addr;
|
|
}
|
|
return;
|
|
} /* "Mia Hamm Soccer 64" SP exception override (zilmar) */
|
|
b = addr & 07;
|
|
addr &= ~07;
|
|
switch (b) {
|
|
case 00:
|
|
VR[vt][07] = DMEM[addr + BES(0x007)] << 7;
|
|
VR[vt][06] = DMEM[addr + BES(0x006)] << 7;
|
|
VR[vt][05] = DMEM[addr + BES(0x005)] << 7;
|
|
VR[vt][04] = DMEM[addr + BES(0x004)] << 7;
|
|
VR[vt][03] = DMEM[addr + BES(0x003)] << 7;
|
|
VR[vt][02] = DMEM[addr + BES(0x002)] << 7;
|
|
VR[vt][01] = DMEM[addr + BES(0x001)] << 7;
|
|
VR[vt][00] = DMEM[addr + BES(0x000)] << 7;
|
|
break;
|
|
case 01: /* PKMN Puzzle League HVQM decoder */
|
|
VR[vt][00] = DMEM[addr + BES(0x001)] << 7;
|
|
VR[vt][01] = DMEM[addr + BES(0x002)] << 7;
|
|
VR[vt][02] = DMEM[addr + BES(0x003)] << 7;
|
|
VR[vt][03] = DMEM[addr + BES(0x004)] << 7;
|
|
VR[vt][04] = DMEM[addr + BES(0x005)] << 7;
|
|
VR[vt][05] = DMEM[addr + BES(0x006)] << 7;
|
|
VR[vt][06] = DMEM[addr + BES(0x007)] << 7;
|
|
addr += BES(0x008);
|
|
addr &= 0x00000FFF;
|
|
VR[vt][07] = DMEM[addr] << 7;
|
|
break;
|
|
case 02: /* PKMN Puzzle League HVQM decoder */
|
|
VR[vt][00] = DMEM[addr + BES(0x002)] << 7;
|
|
VR[vt][01] = DMEM[addr + BES(0x003)] << 7;
|
|
VR[vt][02] = DMEM[addr + BES(0x004)] << 7;
|
|
VR[vt][03] = DMEM[addr + BES(0x005)] << 7;
|
|
VR[vt][04] = DMEM[addr + BES(0x006)] << 7;
|
|
VR[vt][05] = DMEM[addr + BES(0x007)] << 7;
|
|
addr += 0x008;
|
|
addr &= 0x00000FFF;
|
|
VR[vt][06] = DMEM[addr + BES(0x000)] << 7;
|
|
VR[vt][07] = DMEM[addr + BES(0x001)] << 7;
|
|
break;
|
|
case 03: /* PKMN Puzzle League HVQM decoder */
|
|
VR[vt][00] = DMEM[addr + BES(0x003)] << 7;
|
|
VR[vt][01] = DMEM[addr + BES(0x004)] << 7;
|
|
VR[vt][02] = DMEM[addr + BES(0x005)] << 7;
|
|
VR[vt][03] = DMEM[addr + BES(0x006)] << 7;
|
|
VR[vt][04] = DMEM[addr + BES(0x007)] << 7;
|
|
addr += 0x008;
|
|
addr &= 0x00000FFF;
|
|
VR[vt][05] = DMEM[addr + BES(0x000)] << 7;
|
|
VR[vt][06] = DMEM[addr + BES(0x001)] << 7;
|
|
VR[vt][07] = DMEM[addr + BES(0x002)] << 7;
|
|
break;
|
|
case 04: /* PKMN Puzzle League HVQM decoder */
|
|
VR[vt][00] = DMEM[addr + BES(0x004)] << 7;
|
|
VR[vt][01] = DMEM[addr + BES(0x005)] << 7;
|
|
VR[vt][02] = DMEM[addr + BES(0x006)] << 7;
|
|
VR[vt][03] = DMEM[addr + BES(0x007)] << 7;
|
|
addr += 0x008;
|
|
addr &= 0x00000FFF;
|
|
VR[vt][04] = DMEM[addr + BES(0x000)] << 7;
|
|
VR[vt][05] = DMEM[addr + BES(0x001)] << 7;
|
|
VR[vt][06] = DMEM[addr + BES(0x002)] << 7;
|
|
VR[vt][07] = DMEM[addr + BES(0x003)] << 7;
|
|
break;
|
|
case 05: /* PKMN Puzzle League HVQM decoder */
|
|
VR[vt][00] = DMEM[addr + BES(0x005)] << 7;
|
|
VR[vt][01] = DMEM[addr + BES(0x006)] << 7;
|
|
VR[vt][02] = DMEM[addr + BES(0x007)] << 7;
|
|
addr += 0x008;
|
|
addr &= 0x00000FFF;
|
|
VR[vt][03] = DMEM[addr + BES(0x000)] << 7;
|
|
VR[vt][04] = DMEM[addr + BES(0x001)] << 7;
|
|
VR[vt][05] = DMEM[addr + BES(0x002)] << 7;
|
|
VR[vt][06] = DMEM[addr + BES(0x003)] << 7;
|
|
VR[vt][07] = DMEM[addr + BES(0x004)] << 7;
|
|
break;
|
|
case 06: /* PKMN Puzzle League HVQM decoder */
|
|
VR[vt][00] = DMEM[addr + BES(0x006)] << 7;
|
|
VR[vt][01] = DMEM[addr + BES(0x007)] << 7;
|
|
addr += 0x008;
|
|
addr &= 0x00000FFF;
|
|
VR[vt][02] = DMEM[addr + BES(0x000)] << 7;
|
|
VR[vt][03] = DMEM[addr + BES(0x001)] << 7;
|
|
VR[vt][04] = DMEM[addr + BES(0x002)] << 7;
|
|
VR[vt][05] = DMEM[addr + BES(0x003)] << 7;
|
|
VR[vt][06] = DMEM[addr + BES(0x004)] << 7;
|
|
VR[vt][07] = DMEM[addr + BES(0x005)] << 7;
|
|
break;
|
|
case 07: /* PKMN Puzzle League HVQM decoder */
|
|
VR[vt][00] = DMEM[addr + BES(0x007)] << 7;
|
|
addr += 0x008;
|
|
addr &= 0x00000FFF;
|
|
VR[vt][01] = DMEM[addr + BES(0x000)] << 7;
|
|
VR[vt][02] = DMEM[addr + BES(0x001)] << 7;
|
|
VR[vt][03] = DMEM[addr + BES(0x002)] << 7;
|
|
VR[vt][04] = DMEM[addr + BES(0x003)] << 7;
|
|
VR[vt][05] = DMEM[addr + BES(0x004)] << 7;
|
|
VR[vt][06] = DMEM[addr + BES(0x005)] << 7;
|
|
VR[vt][07] = DMEM[addr + BES(0x006)] << 7;
|
|
break;
|
|
}
|
|
return;
|
|
}
|
|
void SPV(unsigned vt, unsigned element, signed offset, unsigned base)
|
|
{
|
|
register u32 addr;
|
|
register unsigned int b;
|
|
const unsigned int e = element;
|
|
|
|
if (e != 0x0) {
|
|
message("SPV\nIllegal element.");
|
|
return;
|
|
}
|
|
addr = (SR[base] + 8*offset) & 0x00000FFF;
|
|
b = addr & 07;
|
|
addr &= ~07;
|
|
switch (b) {
|
|
case 00:
|
|
DMEM[addr + BES(0x007)] = (u8)(VR[vt][07] >> 8);
|
|
DMEM[addr + BES(0x006)] = (u8)(VR[vt][06] >> 8);
|
|
DMEM[addr + BES(0x005)] = (u8)(VR[vt][05] >> 8);
|
|
DMEM[addr + BES(0x004)] = (u8)(VR[vt][04] >> 8);
|
|
DMEM[addr + BES(0x003)] = (u8)(VR[vt][03] >> 8);
|
|
DMEM[addr + BES(0x002)] = (u8)(VR[vt][02] >> 8);
|
|
DMEM[addr + BES(0x001)] = (u8)(VR[vt][01] >> 8);
|
|
DMEM[addr + BES(0x000)] = (u8)(VR[vt][00] >> 8);
|
|
break;
|
|
case 01: /* F3DZEX 2.08J "Doubutsu no Mori" (Animal Forest) CPU CFB */
|
|
DMEM[addr + BES(0x001)] = (u8)(VR[vt][00] >> 8);
|
|
DMEM[addr + BES(0x002)] = (u8)(VR[vt][01] >> 8);
|
|
DMEM[addr + BES(0x003)] = (u8)(VR[vt][02] >> 8);
|
|
DMEM[addr + BES(0x004)] = (u8)(VR[vt][03] >> 8);
|
|
DMEM[addr + BES(0x005)] = (u8)(VR[vt][04] >> 8);
|
|
DMEM[addr + BES(0x006)] = (u8)(VR[vt][05] >> 8);
|
|
DMEM[addr + BES(0x007)] = (u8)(VR[vt][06] >> 8);
|
|
addr += BES(0x008);
|
|
addr &= 0x00000FFF;
|
|
DMEM[addr] = (u8)(VR[vt][07] >> 8);
|
|
break;
|
|
case 02: /* F3DZEX 2.08J "Doubutsu no Mori" (Animal Forest) CPU CFB */
|
|
DMEM[addr + BES(0x002)] = (u8)(VR[vt][00] >> 8);
|
|
DMEM[addr + BES(0x003)] = (u8)(VR[vt][01] >> 8);
|
|
DMEM[addr + BES(0x004)] = (u8)(VR[vt][02] >> 8);
|
|
DMEM[addr + BES(0x005)] = (u8)(VR[vt][03] >> 8);
|
|
DMEM[addr + BES(0x006)] = (u8)(VR[vt][04] >> 8);
|
|
DMEM[addr + BES(0x007)] = (u8)(VR[vt][05] >> 8);
|
|
addr += 0x008;
|
|
addr &= 0x00000FFF;
|
|
DMEM[addr + BES(0x000)] = (u8)(VR[vt][06] >> 8);
|
|
DMEM[addr + BES(0x001)] = (u8)(VR[vt][07] >> 8);
|
|
break;
|
|
case 03: /* F3DZEX 2.08J "Doubutsu no Mori" (Animal Forest) CPU CFB */
|
|
DMEM[addr + BES(0x003)] = (u8)(VR[vt][00] >> 8);
|
|
DMEM[addr + BES(0x004)] = (u8)(VR[vt][01] >> 8);
|
|
DMEM[addr + BES(0x005)] = (u8)(VR[vt][02] >> 8);
|
|
DMEM[addr + BES(0x006)] = (u8)(VR[vt][03] >> 8);
|
|
DMEM[addr + BES(0x007)] = (u8)(VR[vt][04] >> 8);
|
|
addr += 0x008;
|
|
addr &= 0x00000FFF;
|
|
DMEM[addr + BES(0x000)] = (u8)(VR[vt][05] >> 8);
|
|
DMEM[addr + BES(0x001)] = (u8)(VR[vt][06] >> 8);
|
|
DMEM[addr + BES(0x002)] = (u8)(VR[vt][07] >> 8);
|
|
break;
|
|
case 04: /* F3DZEX 2.08J "Doubutsu no Mori" (Animal Forest) CPU CFB */
|
|
DMEM[addr + BES(0x004)] = (u8)(VR[vt][00] >> 8);
|
|
DMEM[addr + BES(0x005)] = (u8)(VR[vt][01] >> 8);
|
|
DMEM[addr + BES(0x006)] = (u8)(VR[vt][02] >> 8);
|
|
DMEM[addr + BES(0x007)] = (u8)(VR[vt][03] >> 8);
|
|
addr += 0x008;
|
|
addr &= 0x00000FFF;
|
|
DMEM[addr + BES(0x000)] = (u8)(VR[vt][04] >> 8);
|
|
DMEM[addr + BES(0x001)] = (u8)(VR[vt][05] >> 8);
|
|
DMEM[addr + BES(0x002)] = (u8)(VR[vt][06] >> 8);
|
|
DMEM[addr + BES(0x003)] = (u8)(VR[vt][07] >> 8);
|
|
break;
|
|
case 05: /* F3DZEX 2.08J "Doubutsu no Mori" (Animal Forest) CPU CFB */
|
|
DMEM[addr + BES(0x005)] = (u8)(VR[vt][00] >> 8);
|
|
DMEM[addr + BES(0x006)] = (u8)(VR[vt][01] >> 8);
|
|
DMEM[addr + BES(0x007)] = (u8)(VR[vt][02] >> 8);
|
|
addr += 0x008;
|
|
addr &= 0x00000FFF;
|
|
DMEM[addr + BES(0x000)] = (u8)(VR[vt][03] >> 8);
|
|
DMEM[addr + BES(0x001)] = (u8)(VR[vt][04] >> 8);
|
|
DMEM[addr + BES(0x002)] = (u8)(VR[vt][05] >> 8);
|
|
DMEM[addr + BES(0x003)] = (u8)(VR[vt][06] >> 8);
|
|
DMEM[addr + BES(0x004)] = (u8)(VR[vt][07] >> 8);
|
|
break;
|
|
case 06: /* F3DZEX 2.08J "Doubutsu no Mori" (Animal Forest) CPU CFB */
|
|
DMEM[addr + BES(0x006)] = (u8)(VR[vt][00] >> 8);
|
|
DMEM[addr + BES(0x007)] = (u8)(VR[vt][01] >> 8);
|
|
addr += 0x008;
|
|
addr &= 0x00000FFF;
|
|
DMEM[addr + BES(0x000)] = (u8)(VR[vt][02] >> 8);
|
|
DMEM[addr + BES(0x001)] = (u8)(VR[vt][03] >> 8);
|
|
DMEM[addr + BES(0x002)] = (u8)(VR[vt][04] >> 8);
|
|
DMEM[addr + BES(0x003)] = (u8)(VR[vt][05] >> 8);
|
|
DMEM[addr + BES(0x004)] = (u8)(VR[vt][06] >> 8);
|
|
DMEM[addr + BES(0x005)] = (u8)(VR[vt][07] >> 8);
|
|
break;
|
|
case 07: /* F3DZEX 2.08J "Doubutsu no Mori" (Animal Forest) CPU CFB */
|
|
DMEM[addr + BES(0x007)] = (u8)(VR[vt][00] >> 8);
|
|
addr += 0x008;
|
|
addr &= 0x00000FFF;
|
|
DMEM[addr + BES(0x000)] = (u8)(VR[vt][01] >> 8);
|
|
DMEM[addr + BES(0x001)] = (u8)(VR[vt][02] >> 8);
|
|
DMEM[addr + BES(0x002)] = (u8)(VR[vt][03] >> 8);
|
|
DMEM[addr + BES(0x003)] = (u8)(VR[vt][04] >> 8);
|
|
DMEM[addr + BES(0x004)] = (u8)(VR[vt][05] >> 8);
|
|
DMEM[addr + BES(0x005)] = (u8)(VR[vt][06] >> 8);
|
|
DMEM[addr + BES(0x006)] = (u8)(VR[vt][07] >> 8);
|
|
break;
|
|
}
|
|
return;
|
|
}
|
|
void SUV(unsigned vt, unsigned element, signed offset, unsigned base)
|
|
{
|
|
register u32 addr;
|
|
register unsigned int b;
|
|
const unsigned int e = element;
|
|
|
|
if (e != 0x0) {
|
|
message("SUV\nIllegal element.");
|
|
return;
|
|
}
|
|
addr = (SR[base] + 8*offset) & 0x00000FFF;
|
|
b = addr & 07;
|
|
addr &= ~07;
|
|
switch (b) {
|
|
case 00:
|
|
DMEM[addr + BES(0x007)] = (u8)(VR[vt][07] >> 7);
|
|
DMEM[addr + BES(0x006)] = (u8)(VR[vt][06] >> 7);
|
|
DMEM[addr + BES(0x005)] = (u8)(VR[vt][05] >> 7);
|
|
DMEM[addr + BES(0x004)] = (u8)(VR[vt][04] >> 7);
|
|
DMEM[addr + BES(0x003)] = (u8)(VR[vt][03] >> 7);
|
|
DMEM[addr + BES(0x002)] = (u8)(VR[vt][02] >> 7);
|
|
DMEM[addr + BES(0x001)] = (u8)(VR[vt][01] >> 7);
|
|
DMEM[addr + BES(0x000)] = (u8)(VR[vt][00] >> 7);
|
|
break;
|
|
case 04: /* "Indiana Jones and the Infernal Machine" in-game */
|
|
DMEM[addr + BES(0x004)] = (u8)(VR[vt][00] >> 7);
|
|
DMEM[addr + BES(0x005)] = (u8)(VR[vt][01] >> 7);
|
|
DMEM[addr + BES(0x006)] = (u8)(VR[vt][02] >> 7);
|
|
DMEM[addr + BES(0x007)] = (u8)(VR[vt][03] >> 7);
|
|
addr += 0x008;
|
|
addr &= 0x00000FFF;
|
|
DMEM[addr + BES(0x000)] = (u8)(VR[vt][04] >> 7);
|
|
DMEM[addr + BES(0x001)] = (u8)(VR[vt][05] >> 7);
|
|
DMEM[addr + BES(0x002)] = (u8)(VR[vt][06] >> 7);
|
|
DMEM[addr + BES(0x003)] = (u8)(VR[vt][07] >> 7);
|
|
break;
|
|
default: /* Completely legal, just never seen it be done. */
|
|
message("SUV\nWeird addr.");
|
|
}
|
|
return;
|
|
}
|
|
|
|
/*
|
|
* Group III vector loads and stores:
|
|
* HV, FV, and AV (As of RCP implementation, AV opcodes are reserved.)
|
|
*/
|
|
void LHV(unsigned vt, unsigned element, signed offset, unsigned base)
|
|
{
|
|
register u32 addr;
|
|
const unsigned int e = element;
|
|
|
|
if (e != 0x0) {
|
|
message("LHV\nIllegal element.");
|
|
return;
|
|
}
|
|
addr = (SR[base] + 16*offset) & 0x00000FFF;
|
|
if (addr & 0x0000000E) {
|
|
message("LHV\nIllegal addr.");
|
|
return;
|
|
}
|
|
addr ^= MES(00);
|
|
VR[vt][07] = DMEM[addr + HES(0x00E)] << 7;
|
|
VR[vt][06] = DMEM[addr + HES(0x00C)] << 7;
|
|
VR[vt][05] = DMEM[addr + HES(0x00A)] << 7;
|
|
VR[vt][04] = DMEM[addr + HES(0x008)] << 7;
|
|
VR[vt][03] = DMEM[addr + HES(0x006)] << 7;
|
|
VR[vt][02] = DMEM[addr + HES(0x004)] << 7;
|
|
VR[vt][01] = DMEM[addr + HES(0x002)] << 7;
|
|
VR[vt][00] = DMEM[addr + HES(0x000)] << 7;
|
|
return;
|
|
}
|
|
void LFV(unsigned vt, unsigned element, signed offset, unsigned base)
|
|
{ /* Dummy implementation only: Do any games execute this? */
|
|
res_lsw(vt, element, offset, base);
|
|
return;
|
|
}
|
|
void SHV(unsigned vt, unsigned element, signed offset, unsigned base)
|
|
{
|
|
register u32 addr;
|
|
const unsigned int e = element;
|
|
|
|
if (e != 0x0) {
|
|
message("SHV\nIllegal element.");
|
|
return;
|
|
}
|
|
addr = (SR[base] + 16*offset) & 0x00000FFF;
|
|
if (addr & 0x0000000E) {
|
|
message("SHV\nIllegal addr.");
|
|
return;
|
|
}
|
|
addr ^= MES(00);
|
|
DMEM[addr + HES(0x00E)] = (u8)(VR[vt][07] >> 7);
|
|
DMEM[addr + HES(0x00C)] = (u8)(VR[vt][06] >> 7);
|
|
DMEM[addr + HES(0x00A)] = (u8)(VR[vt][05] >> 7);
|
|
DMEM[addr + HES(0x008)] = (u8)(VR[vt][04] >> 7);
|
|
DMEM[addr + HES(0x006)] = (u8)(VR[vt][03] >> 7);
|
|
DMEM[addr + HES(0x004)] = (u8)(VR[vt][02] >> 7);
|
|
DMEM[addr + HES(0x002)] = (u8)(VR[vt][01] >> 7);
|
|
DMEM[addr + HES(0x000)] = (u8)(VR[vt][00] >> 7);
|
|
return;
|
|
}
|
|
void SFV(unsigned vt, unsigned element, signed offset, unsigned base)
|
|
{
|
|
register u32 addr;
|
|
const unsigned int e = element;
|
|
|
|
addr = (SR[base] + 16*offset) & 0x00000FFF;
|
|
addr &= 0x00000FF3;
|
|
addr ^= BES(00);
|
|
switch (e) {
|
|
case 0x0:
|
|
DMEM[addr + 0x000] = (u8)(VR[vt][00] >> 7);
|
|
DMEM[addr + 0x004] = (u8)(VR[vt][01] >> 7);
|
|
DMEM[addr + 0x008] = (u8)(VR[vt][02] >> 7);
|
|
DMEM[addr + 0x00C] = (u8)(VR[vt][03] >> 7);
|
|
break;
|
|
case 0x8:
|
|
DMEM[addr + 0x000] = (u8)(VR[vt][04] >> 7);
|
|
DMEM[addr + 0x004] = (u8)(VR[vt][05] >> 7);
|
|
DMEM[addr + 0x008] = (u8)(VR[vt][06] >> 7);
|
|
DMEM[addr + 0x00C] = (u8)(VR[vt][07] >> 7);
|
|
break;
|
|
default:
|
|
message("SFV\nIllegal element.");
|
|
}
|
|
return;
|
|
}
|
|
|
|
/*
|
|
* Group IV vector loads and stores:
|
|
* QV and RV
|
|
*/
|
|
void LQV(unsigned vt, unsigned element, signed offset, unsigned base)
|
|
{
|
|
register u32 addr;
|
|
register unsigned int b;
|
|
const unsigned int e = element; /* Boss Game Studios illegal elements */
|
|
|
|
if (e & 0x1) {
|
|
message("LQV\nOdd element.");
|
|
return;
|
|
}
|
|
addr = (SR[base] + 16*offset) & 0x00000FFF;
|
|
if (addr & 0x00000001) {
|
|
message("LQV\nOdd addr.");
|
|
return;
|
|
}
|
|
b = addr & 0x0000000F;
|
|
|
|
addr &= ~0x0000000F;
|
|
switch (b/2) { /* mistake in SGI patent regarding LQV */
|
|
case 0x0/2:
|
|
VR_S(vt,e+0x0) = *(pi16)(DMEM + addr + HES(0x000));
|
|
VR_S(vt,e+0x2) = *(pi16)(DMEM + addr + HES(0x002));
|
|
VR_S(vt,e+0x4) = *(pi16)(DMEM + addr + HES(0x004));
|
|
VR_S(vt,e+0x6) = *(pi16)(DMEM + addr + HES(0x006));
|
|
VR_S(vt,e+0x8) = *(pi16)(DMEM + addr + HES(0x008));
|
|
VR_S(vt,e+0xA) = *(pi16)(DMEM + addr + HES(0x00A));
|
|
VR_S(vt,e+0xC) = *(pi16)(DMEM + addr + HES(0x00C));
|
|
VR_S(vt,e+0xE) = *(pi16)(DMEM + addr + HES(0x00E));
|
|
break;
|
|
case 0x2/2:
|
|
VR_S(vt,e+0x0) = *(pi16)(DMEM + addr + HES(0x002));
|
|
VR_S(vt,e+0x2) = *(pi16)(DMEM + addr + HES(0x004));
|
|
VR_S(vt,e+0x4) = *(pi16)(DMEM + addr + HES(0x006));
|
|
VR_S(vt,e+0x6) = *(pi16)(DMEM + addr + HES(0x008));
|
|
VR_S(vt,e+0x8) = *(pi16)(DMEM + addr + HES(0x00A));
|
|
VR_S(vt,e+0xA) = *(pi16)(DMEM + addr + HES(0x00C));
|
|
VR_S(vt,e+0xC) = *(pi16)(DMEM + addr + HES(0x00E));
|
|
break;
|
|
case 0x4/2:
|
|
VR_S(vt,e+0x0) = *(pi16)(DMEM + addr + HES(0x004));
|
|
VR_S(vt,e+0x2) = *(pi16)(DMEM + addr + HES(0x006));
|
|
VR_S(vt,e+0x4) = *(pi16)(DMEM + addr + HES(0x008));
|
|
VR_S(vt,e+0x6) = *(pi16)(DMEM + addr + HES(0x00A));
|
|
VR_S(vt,e+0x8) = *(pi16)(DMEM + addr + HES(0x00C));
|
|
VR_S(vt,e+0xA) = *(pi16)(DMEM + addr + HES(0x00E));
|
|
break;
|
|
case 0x6/2:
|
|
VR_S(vt,e+0x0) = *(pi16)(DMEM + addr + HES(0x006));
|
|
VR_S(vt,e+0x2) = *(pi16)(DMEM + addr + HES(0x008));
|
|
VR_S(vt,e+0x4) = *(pi16)(DMEM + addr + HES(0x00A));
|
|
VR_S(vt,e+0x6) = *(pi16)(DMEM + addr + HES(0x00C));
|
|
VR_S(vt,e+0x8) = *(pi16)(DMEM + addr + HES(0x00E));
|
|
break;
|
|
case 0x8/2: /* "Resident Evil 2" cinematics and Boss Game Studios */
|
|
VR_S(vt,e+0x0) = *(pi16)(DMEM + addr + HES(0x008));
|
|
VR_S(vt,e+0x2) = *(pi16)(DMEM + addr + HES(0x00A));
|
|
VR_S(vt,e+0x4) = *(pi16)(DMEM + addr + HES(0x00C));
|
|
VR_S(vt,e+0x6) = *(pi16)(DMEM + addr + HES(0x00E));
|
|
break;
|
|
case 0xA/2: /* "Conker's Bad Fur Day" audio microcode by Rareware */
|
|
VR_S(vt,e+0x0) = *(pi16)(DMEM + addr + HES(0x00A));
|
|
VR_S(vt,e+0x2) = *(pi16)(DMEM + addr + HES(0x00C));
|
|
VR_S(vt,e+0x4) = *(pi16)(DMEM + addr + HES(0x00E));
|
|
break;
|
|
case 0xC/2: /* "Conker's Bad Fur Day" audio microcode by Rareware */
|
|
VR_S(vt,e+0x0) = *(pi16)(DMEM + addr + HES(0x00C));
|
|
VR_S(vt,e+0x2) = *(pi16)(DMEM + addr + HES(0x00E));
|
|
break;
|
|
case 0xE/2: /* "Conker's Bad Fur Day" audio microcode by Rareware */
|
|
VR_S(vt,e+0x0) = *(pi16)(DMEM + addr + HES(0x00E));
|
|
break;
|
|
}
|
|
return;
|
|
}
|
|
void LRV(unsigned vt, unsigned element, signed offset, unsigned base)
|
|
{
|
|
register u32 addr;
|
|
register unsigned int b;
|
|
const unsigned int e = element;
|
|
|
|
if (e != 0x0) {
|
|
message("LRV\nIllegal element.");
|
|
return;
|
|
}
|
|
addr = (SR[base] + 16*offset) & 0x00000FFF;
|
|
if (addr & 0x00000001) {
|
|
message("LRV\nOdd addr.");
|
|
return;
|
|
}
|
|
b = addr & 0x0000000F;
|
|
addr &= ~0x0000000F;
|
|
switch (b/2) {
|
|
case 0xE/2:
|
|
VR[vt][01] = *(pi16)(DMEM + addr + HES(0x000));
|
|
VR[vt][02] = *(pi16)(DMEM + addr + HES(0x002));
|
|
VR[vt][03] = *(pi16)(DMEM + addr + HES(0x004));
|
|
VR[vt][04] = *(pi16)(DMEM + addr + HES(0x006));
|
|
VR[vt][05] = *(pi16)(DMEM + addr + HES(0x008));
|
|
VR[vt][06] = *(pi16)(DMEM + addr + HES(0x00A));
|
|
VR[vt][07] = *(pi16)(DMEM + addr + HES(0x00C));
|
|
break;
|
|
case 0xC/2:
|
|
VR[vt][02] = *(pi16)(DMEM + addr + HES(0x000));
|
|
VR[vt][03] = *(pi16)(DMEM + addr + HES(0x002));
|
|
VR[vt][04] = *(pi16)(DMEM + addr + HES(0x004));
|
|
VR[vt][05] = *(pi16)(DMEM + addr + HES(0x006));
|
|
VR[vt][06] = *(pi16)(DMEM + addr + HES(0x008));
|
|
VR[vt][07] = *(pi16)(DMEM + addr + HES(0x00A));
|
|
break;
|
|
case 0xA/2:
|
|
VR[vt][03] = *(pi16)(DMEM + addr + HES(0x000));
|
|
VR[vt][04] = *(pi16)(DMEM + addr + HES(0x002));
|
|
VR[vt][05] = *(pi16)(DMEM + addr + HES(0x004));
|
|
VR[vt][06] = *(pi16)(DMEM + addr + HES(0x006));
|
|
VR[vt][07] = *(pi16)(DMEM + addr + HES(0x008));
|
|
break;
|
|
case 0x8/2:
|
|
VR[vt][04] = *(pi16)(DMEM + addr + HES(0x000));
|
|
VR[vt][05] = *(pi16)(DMEM + addr + HES(0x002));
|
|
VR[vt][06] = *(pi16)(DMEM + addr + HES(0x004));
|
|
VR[vt][07] = *(pi16)(DMEM + addr + HES(0x006));
|
|
break;
|
|
case 0x6/2:
|
|
VR[vt][05] = *(pi16)(DMEM + addr + HES(0x000));
|
|
VR[vt][06] = *(pi16)(DMEM + addr + HES(0x002));
|
|
VR[vt][07] = *(pi16)(DMEM + addr + HES(0x004));
|
|
break;
|
|
case 0x4/2:
|
|
VR[vt][06] = *(pi16)(DMEM + addr + HES(0x000));
|
|
VR[vt][07] = *(pi16)(DMEM + addr + HES(0x002));
|
|
break;
|
|
case 0x2/2:
|
|
VR[vt][07] = *(pi16)(DMEM + addr + HES(0x000));
|
|
break;
|
|
case 0x0/2:
|
|
break;
|
|
}
|
|
return;
|
|
}
|
|
void SQV(unsigned vt, unsigned element, signed offset, unsigned base)
|
|
{
|
|
register u32 addr;
|
|
register unsigned int b;
|
|
const unsigned int e = element;
|
|
|
|
addr = (SR[base] + 16*offset) & 0x00000FFF;
|
|
if (e != 0x0) {
|
|
register unsigned int i;
|
|
|
|
#if (VR_STATIC_WRAPAROUND == 1)
|
|
vector_copy(VR[vt] + N, VR[vt]);
|
|
for (i = 0; i < 16 - addr%16; i++)
|
|
DMEM[BES((addr + i) & 0xFFF)] = VR_B(vt, e + i);
|
|
#else
|
|
for (i = 0; i < 16 - addr%16; i++)
|
|
DMEM[BES((addr + i) & 0xFFF)] = VR_B(vt, (e + i) & 0xF);
|
|
#endif
|
|
return;
|
|
} /* illegal SQV, happens with "Mia Hamm Soccer 64" */
|
|
b = addr & 0x0000000F;
|
|
addr &= ~0x0000000F;
|
|
switch (b) {
|
|
case 00:
|
|
*(pi16)(DMEM + addr + HES(0x000)) = VR[vt][00];
|
|
*(pi16)(DMEM + addr + HES(0x002)) = VR[vt][01];
|
|
*(pi16)(DMEM + addr + HES(0x004)) = VR[vt][02];
|
|
*(pi16)(DMEM + addr + HES(0x006)) = VR[vt][03];
|
|
*(pi16)(DMEM + addr + HES(0x008)) = VR[vt][04];
|
|
*(pi16)(DMEM + addr + HES(0x00A)) = VR[vt][05];
|
|
*(pi16)(DMEM + addr + HES(0x00C)) = VR[vt][06];
|
|
*(pi16)(DMEM + addr + HES(0x00E)) = VR[vt][07];
|
|
break;
|
|
case 02:
|
|
*(pi16)(DMEM + addr + HES(0x002)) = VR[vt][00];
|
|
*(pi16)(DMEM + addr + HES(0x004)) = VR[vt][01];
|
|
*(pi16)(DMEM + addr + HES(0x006)) = VR[vt][02];
|
|
*(pi16)(DMEM + addr + HES(0x008)) = VR[vt][03];
|
|
*(pi16)(DMEM + addr + HES(0x00A)) = VR[vt][04];
|
|
*(pi16)(DMEM + addr + HES(0x00C)) = VR[vt][05];
|
|
*(pi16)(DMEM + addr + HES(0x00E)) = VR[vt][06];
|
|
break;
|
|
case 04:
|
|
*(pi16)(DMEM + addr + HES(0x004)) = VR[vt][00];
|
|
*(pi16)(DMEM + addr + HES(0x006)) = VR[vt][01];
|
|
*(pi16)(DMEM + addr + HES(0x008)) = VR[vt][02];
|
|
*(pi16)(DMEM + addr + HES(0x00A)) = VR[vt][03];
|
|
*(pi16)(DMEM + addr + HES(0x00C)) = VR[vt][04];
|
|
*(pi16)(DMEM + addr + HES(0x00E)) = VR[vt][05];
|
|
break;
|
|
case 06:
|
|
*(pi16)(DMEM + addr + HES(0x006)) = VR[vt][00];
|
|
*(pi16)(DMEM + addr + HES(0x008)) = VR[vt][01];
|
|
*(pi16)(DMEM + addr + HES(0x00A)) = VR[vt][02];
|
|
*(pi16)(DMEM + addr + HES(0x00C)) = VR[vt][03];
|
|
*(pi16)(DMEM + addr + HES(0x00E)) = VR[vt][04];
|
|
break;
|
|
default:
|
|
message("SQV\nWeird addr.");
|
|
}
|
|
return;
|
|
}
|
|
void SRV(unsigned vt, unsigned element, signed offset, unsigned base)
|
|
{
|
|
register u32 addr;
|
|
register unsigned int b;
|
|
const unsigned int e = element;
|
|
|
|
if (e != 0x0) {
|
|
message("SRV\nIllegal element.");
|
|
return;
|
|
}
|
|
addr = (SR[base] + 16*offset) & 0x00000FFF;
|
|
if (addr & 0x00000001) {
|
|
message("SRV\nOdd addr.");
|
|
return;
|
|
}
|
|
b = addr & 0x0000000F;
|
|
|
|
addr &= ~0x0000000F;
|
|
switch (b/2) {
|
|
case 0xE/2:
|
|
*(pi16)(DMEM + addr + HES(0x000)) = VR[vt][01];
|
|
*(pi16)(DMEM + addr + HES(0x002)) = VR[vt][02];
|
|
*(pi16)(DMEM + addr + HES(0x004)) = VR[vt][03];
|
|
*(pi16)(DMEM + addr + HES(0x006)) = VR[vt][04];
|
|
*(pi16)(DMEM + addr + HES(0x008)) = VR[vt][05];
|
|
*(pi16)(DMEM + addr + HES(0x00A)) = VR[vt][06];
|
|
*(pi16)(DMEM + addr + HES(0x00C)) = VR[vt][07];
|
|
break;
|
|
case 0xC/2:
|
|
*(pi16)(DMEM + addr + HES(0x000)) = VR[vt][02];
|
|
*(pi16)(DMEM + addr + HES(0x002)) = VR[vt][03];
|
|
*(pi16)(DMEM + addr + HES(0x004)) = VR[vt][04];
|
|
*(pi16)(DMEM + addr + HES(0x006)) = VR[vt][05];
|
|
*(pi16)(DMEM + addr + HES(0x008)) = VR[vt][06];
|
|
*(pi16)(DMEM + addr + HES(0x00A)) = VR[vt][07];
|
|
break;
|
|
case 0xA/2:
|
|
*(pi16)(DMEM + addr + HES(0x000)) = VR[vt][03];
|
|
*(pi16)(DMEM + addr + HES(0x002)) = VR[vt][04];
|
|
*(pi16)(DMEM + addr + HES(0x004)) = VR[vt][05];
|
|
*(pi16)(DMEM + addr + HES(0x006)) = VR[vt][06];
|
|
*(pi16)(DMEM + addr + HES(0x008)) = VR[vt][07];
|
|
break;
|
|
case 0x8/2:
|
|
*(pi16)(DMEM + addr + HES(0x000)) = VR[vt][04];
|
|
*(pi16)(DMEM + addr + HES(0x002)) = VR[vt][05];
|
|
*(pi16)(DMEM + addr + HES(0x004)) = VR[vt][06];
|
|
*(pi16)(DMEM + addr + HES(0x006)) = VR[vt][07];
|
|
break;
|
|
case 0x6/2:
|
|
*(pi16)(DMEM + addr + HES(0x000)) = VR[vt][05];
|
|
*(pi16)(DMEM + addr + HES(0x002)) = VR[vt][06];
|
|
*(pi16)(DMEM + addr + HES(0x004)) = VR[vt][07];
|
|
break;
|
|
case 0x4/2:
|
|
*(pi16)(DMEM + addr + HES(0x000)) = VR[vt][06];
|
|
*(pi16)(DMEM + addr + HES(0x002)) = VR[vt][07];
|
|
break;
|
|
case 0x2/2:
|
|
*(pi16)(DMEM + addr + HES(0x000)) = VR[vt][07];
|
|
break;
|
|
case 0x0/2:
|
|
break;
|
|
}
|
|
return;
|
|
}
|
|
|
|
/*
|
|
* Group V vector loads and stores
|
|
* TV and SWV (As of RCP implementation, LTWV opcode was undesired.)
|
|
*/
|
|
void LTV(unsigned vt, unsigned element, signed offset, unsigned base)
|
|
{
|
|
register u32 addr;
|
|
register unsigned int i;
|
|
const unsigned int e = element;
|
|
|
|
if (e & 1) {
|
|
message("LTV\nIllegal element.");
|
|
return;
|
|
}
|
|
if (vt & 07) {
|
|
message("LTV\nUncertain case!");
|
|
return; /* For LTV I am not sure; for STV I have an idea. */
|
|
}
|
|
addr = (SR[base] + 16*offset) & 0x00000FFF;
|
|
if (addr & 0x0000000F) {
|
|
message("LTV\nIllegal addr.");
|
|
return;
|
|
}
|
|
for (i = 0; i < 8; i++) /* SGI screwed LTV up on N64. See STV instead. */
|
|
VR[vt + i][(i - e/2) & 07] = *(pi16)(DMEM + addr + HES(2*i));
|
|
return;
|
|
}
|
|
void SWV(unsigned vt, unsigned element, signed offset, unsigned base)
|
|
{ /* Dummy implementation only: Do any games execute this? */
|
|
res_lsw(vt, element, offset, base);
|
|
return;
|
|
}
|
|
void STV(unsigned vt, unsigned element, signed offset, unsigned base)
|
|
{
|
|
register u32 addr;
|
|
register unsigned int i;
|
|
const unsigned int e = element;
|
|
|
|
if (e & 1) {
|
|
message("STV\nIllegal element.");
|
|
return;
|
|
}
|
|
if (vt & 07) {
|
|
message("STV\nUncertain case!");
|
|
return; /* vt &= 030; */
|
|
}
|
|
addr = (SR[base] + 16*offset) & 0x00000FFF;
|
|
if (addr & 0x0000000F) {
|
|
message("STV\nIllegal addr.");
|
|
return;
|
|
}
|
|
for (i = 0; i < 8; i++)
|
|
*(pi16)(DMEM + addr + HES(2*i)) = VR[vt + (e/2 + i)%8][i];
|
|
return;
|
|
}
|
|
|
|
int temp_PC;
|
|
#ifdef WAIT_FOR_CPU_HOST
|
|
short MFC0_count[32];
|
|
#endif
|
|
|
|
mwc2_func LWC2[2 * 8*2] = {
|
|
LBV ,LSV ,LLV ,LDV ,LQV ,LRV ,LPV ,LUV ,
|
|
LHV ,LFV ,res_lsw,LTV ,res_lsw,res_lsw,res_lsw,res_lsw,
|
|
res_lsw,res_lsw,res_lsw,res_lsw,res_lsw,res_lsw,res_lsw,res_lsw,
|
|
res_lsw,res_lsw,res_lsw,res_lsw,res_lsw,res_lsw,res_lsw,res_lsw,
|
|
};
|
|
mwc2_func SWC2[2 * 8*2] = {
|
|
SBV ,SSV ,SLV ,SDV ,SQV ,SRV ,SPV ,SUV ,
|
|
SHV ,SFV ,SWV ,STV ,res_lsw,res_lsw,res_lsw,res_lsw,
|
|
res_lsw,res_lsw,res_lsw,res_lsw,res_lsw,res_lsw,res_lsw,res_lsw,
|
|
res_lsw,res_lsw,res_lsw,res_lsw,res_lsw,res_lsw,res_lsw,res_lsw,
|
|
};
|
|
|
|
static ALIGNED i16 shuffle_temporary[N];
|
|
#ifndef ARCH_MIN_SSE2
|
|
static const unsigned char ei[1 << 4][N] = {
|
|
{ 00, 01, 02, 03, 04, 05, 06, 07 }, /* none (vector-only operand) */
|
|
{ 00, 01, 02, 03, 04, 05, 06, 07 },
|
|
{ 00, 00, 02, 02, 04, 04, 06, 06 }, /* 0Q */
|
|
{ 01, 01, 03, 03, 05, 05, 07, 07 }, /* 1Q */
|
|
{ 00, 00, 00, 00, 04, 04, 04, 04 }, /* 0H */
|
|
{ 01, 01, 01, 01, 05, 05, 05, 05 }, /* 1H */
|
|
{ 02, 02, 02, 02, 06, 06, 06, 06 }, /* 2H */
|
|
{ 03, 03, 03, 03, 07, 07, 07, 07 }, /* 3H */
|
|
{ 00, 00, 00, 00, 00, 00, 00, 00 }, /* 0W */
|
|
{ 01, 01, 01, 01, 01, 01, 01, 01 }, /* 1W */
|
|
{ 02, 02, 02, 02, 02, 02, 02, 02 }, /* 2W */
|
|
{ 03, 03, 03, 03, 03, 03, 03, 03 }, /* 3W */
|
|
{ 04, 04, 04, 04, 04, 04, 04, 04 }, /* 4W */
|
|
{ 05, 05, 05, 05, 05, 05, 05, 05 }, /* 5W */
|
|
{ 06, 06, 06, 06, 06, 06, 06, 06 }, /* 6W */
|
|
{ 07, 07, 07, 07, 07, 07, 07, 07 }, /* 7W */
|
|
};
|
|
#endif
|
|
|
|
static INLINE int SPECIAL(u32 inst, u32 PC)
|
|
{
|
|
unsigned int rd, rs, rt;
|
|
|
|
rd = IW_RD(inst);
|
|
rt = (inst >> 16) % (1 << 5);
|
|
|
|
switch (inst % 64) {
|
|
case 000: /* SLL */
|
|
SR[rd] = SR[rt] << MASK_SA(inst >> 6);
|
|
SR[zero] = 0x00000000;
|
|
break;
|
|
case 002: /* SRL */
|
|
SR[rd] = (u32)(SR[rt]) >> MASK_SA(inst >> 6);
|
|
SR[zero] = 0x00000000;
|
|
break;
|
|
case 003: /* SRA */
|
|
SR[rd] = (s32)(SR[rt]) >> MASK_SA(inst >> 6);
|
|
SR[zero] = 0x00000000;
|
|
break;
|
|
case 004: /* SLLV */
|
|
rs = SPECIAL_DECODE_RS(inst);
|
|
SR[rd] = SR[rt] << MASK_SA(SR[rs]);
|
|
SR[zero] = 0x00000000;
|
|
break;
|
|
case 006: /* SRLV */
|
|
rs = SPECIAL_DECODE_RS(inst);
|
|
SR[rd] = (u32)(SR[rt]) >> MASK_SA(SR[rs]);
|
|
SR[zero] = 0x00000000;
|
|
break;
|
|
case 007: /* SRAV */
|
|
rs = SPECIAL_DECODE_RS(inst);
|
|
SR[rd] = (s32)(SR[rt]) >> MASK_SA(SR[rs]);
|
|
SR[zero] = 0x00000000;
|
|
break;
|
|
case 011: /* JALR */
|
|
SR[rd] = FIT_IMEM(PC + LINK_OFF);
|
|
SR[zero] = 0x00000000;
|
|
/* Fall through. */
|
|
case 010: /* JR */
|
|
rs = SPECIAL_DECODE_RS(inst);
|
|
set_PC(SR[rs]);
|
|
return 1;
|
|
case 015: /* BREAK */
|
|
*CR[0x4] |= SP_STATUS_BROKE | SP_STATUS_HALT;
|
|
if (*CR[0x4] & SP_STATUS_INTR_BREAK) {
|
|
GET_RCP_REG(MI_INTR_REG) |= 0x00000001;
|
|
GET_RSP_INFO(CheckInterrupts)();
|
|
}
|
|
return -1;
|
|
case 040: /* ADD */
|
|
case 041: /* ADDU */
|
|
rs = SPECIAL_DECODE_RS(inst);
|
|
SR[rd] = SR[rs] + SR[rt];
|
|
SR[zero] = 0x00000000; /* needed for Rareware micro-codes */
|
|
break;
|
|
case 042: /* SUB */
|
|
case 043: /* SUBU */
|
|
rs = SPECIAL_DECODE_RS(inst);
|
|
SR[rd] = SR[rs] - SR[rt];
|
|
SR[zero] = 0x00000000;
|
|
break;
|
|
case 044: /* AND */
|
|
rs = SPECIAL_DECODE_RS(inst);
|
|
SR[rd] = SR[rs] & SR[rt];
|
|
SR[zero] = 0x00000000; /* needed for Rareware micro-codes */
|
|
break;
|
|
case 045: /* OR */
|
|
rs = SPECIAL_DECODE_RS(inst);
|
|
SR[rd] = SR[rs] | SR[rt];
|
|
SR[zero] = 0x00000000;
|
|
break;
|
|
case 046: /* XOR */
|
|
rs = SPECIAL_DECODE_RS(inst);
|
|
SR[rd] = SR[rs] ^ SR[rt];
|
|
SR[zero] = 0x00000000;
|
|
break;
|
|
case 047: /* NOR */
|
|
rs = SPECIAL_DECODE_RS(inst);
|
|
SR[rd] = ~(SR[rs] | SR[rt]);
|
|
SR[zero] = 0x00000000;
|
|
break;
|
|
case 052: /* SLT */
|
|
rs = SPECIAL_DECODE_RS(inst);
|
|
SR[rd] = ((s32)(SR[rs]) < (s32)(SR[rt]));
|
|
SR[zero] = 0x00000000;
|
|
break;
|
|
case 053: /* SLTU */
|
|
rs = SPECIAL_DECODE_RS(inst);
|
|
SR[rd] = ((u32)(SR[rs]) < (u32)(SR[rt]));
|
|
SR[zero] = 0x00000000;
|
|
break;
|
|
default:
|
|
res_S();
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
static INLINE int REGIMM(u32 inst, u32 PC)
|
|
{
|
|
const unsigned int base = (inst >> 21) % (1 << 5);
|
|
const unsigned int rt = (inst >> 16) % (1 << 5);
|
|
|
|
switch (rt) {
|
|
case 020: /* BLTZAL */
|
|
SR[ra] = FIT_IMEM(PC + LINK_OFF);
|
|
/* Fall through. */
|
|
case 000: /* BLTZ */
|
|
if (!((s32)SR[base] < 0))
|
|
return 0;
|
|
set_PC(PC + 4*inst + SLOT_OFF);
|
|
break;
|
|
case 021: /* BGEZAL */
|
|
SR[ra] = FIT_IMEM(PC + LINK_OFF);
|
|
/* Fall through. */
|
|
case 001: /* BGEZ */
|
|
if (!((s32)SR[base] >= 0))
|
|
return 0;
|
|
set_PC(PC + 4*inst + SLOT_OFF);
|
|
break;
|
|
default:
|
|
res_S();
|
|
}
|
|
return 1;
|
|
}
|
|
|
|
static INLINE void MWC2_load(u32 inst)
|
|
{
|
|
s16 offset;
|
|
const unsigned int base = (inst >> 21) % (1 << 5);
|
|
const unsigned int vt = (inst >> 16) % (1 << 5);
|
|
const unsigned int element = (inst >> 7) % (1 << 4);
|
|
|
|
#if defined(ARCH_MIN_SSE2) && !defined(SSE2NEON)
|
|
offset = (s16)inst;
|
|
offset <<= 5 + 4; /* safe on x86, skips 5-bit rd, 4-bit element */
|
|
offset >>= 5 + 4;
|
|
#else
|
|
offset = (inst & 64) ? -(s16)(~inst%64 + 1) : inst % 64;
|
|
#endif
|
|
LWC2[IW_RD(inst)](vt, element, offset, base);
|
|
}
|
|
static INLINE void MWC2_store(u32 inst)
|
|
{
|
|
s16 offset;
|
|
const unsigned int base = (inst >> 21) % (1 << 5);
|
|
const unsigned int vt = (inst >> 16) % (1 << 5);
|
|
const unsigned int element = (inst >> 7) % (1 << 4);
|
|
|
|
#if defined(ARCH_MIN_SSE2) && !defined(SSE2NEON)
|
|
offset = (s16)inst;
|
|
offset <<= 5 + 4; /* safe on x86, skips 5-bit rd, 4-bit element */
|
|
offset >>= 5 + 4;
|
|
#else
|
|
offset = (inst & 64) ? -(s16)(~inst%64 + 1) : inst % 64;
|
|
#endif
|
|
SWC2[IW_RD(inst)](vt, element, offset, base);
|
|
}
|
|
|
|
static INLINE void COP0(u32 inst)
|
|
{
|
|
const unsigned int rd = IW_RD(inst);
|
|
const unsigned int rs = (inst >> 21) % (1 << 5);
|
|
const unsigned int rt = (inst >> 16) % (1 << 5);
|
|
|
|
switch (rs) {
|
|
case 000:
|
|
SP_CP0_MF(rt, rd);
|
|
break;
|
|
case 004:
|
|
SP_CP0_MT[rd % NUMBER_OF_CP0_REGISTERS](rt);
|
|
break;
|
|
default:
|
|
res_S();
|
|
}
|
|
}
|
|
|
|
static INLINE void COP2(u32 inst)
|
|
{
|
|
const unsigned int op = (inst >> 21) % (1 << 5); /* inst.R.rs */
|
|
const unsigned int vt = (inst >> 16) % (1 << 5); /* inst.R.rt */
|
|
const unsigned int vs = IW_RD(inst);
|
|
const unsigned int vd = (inst >> 6) % (1 << 5); /* inst.R.sa */
|
|
const unsigned int func = inst % (1 << 6);
|
|
#ifndef ARCH_MIN_SSE2
|
|
const unsigned int e = op & 0xF; /* With Intel, LEA offsets beat ANDing. */
|
|
#endif
|
|
|
|
switch (op) {
|
|
#ifdef ARCH_MIN_SSE2
|
|
v16 target;
|
|
#else
|
|
register unsigned int i;
|
|
#endif
|
|
|
|
case 000:
|
|
MFC2(vt, vs, vd >> 1);
|
|
break;
|
|
case 002:
|
|
CFC2(vt, vs);
|
|
break;
|
|
case 004:
|
|
MTC2(vt, vs, vd >> 1);
|
|
break;
|
|
case 006:
|
|
CTC2(vt, vs);
|
|
break;
|
|
case 020:
|
|
case 021:
|
|
#ifdef ARCH_MIN_SSE2
|
|
*(v16 *)(VR[vd]) = COP2_C2[func](*(v16 *)VR[vs], *(v16 *)VR[vt]);
|
|
#else
|
|
COP2_C2[func](&VR[vs][0], &VR[vt][0]);
|
|
vector_copy(&VR[vd][0], &V_result[0]);
|
|
#endif
|
|
break;
|
|
case 022:
|
|
case 023:
|
|
#ifdef ARCH_MIN_SSE2
|
|
#ifdef __ARM_NEON__
|
|
target = (v16)vld1q_u16(&VR[vt][0 + op - 0x12]);
|
|
target = (v16)vshlq_n_u32((uint32x4_t)target, 16);
|
|
target = (v16)vorrq_u16((uint16x8_t)target,
|
|
(uint16x8_t)vshrq_n_u32((uint32x4_t)target, 16));
|
|
#else
|
|
shuffle_temporary[0] = VR[vt][0 + op - 0x12];
|
|
shuffle_temporary[2] = VR[vt][2 + op - 0x12];
|
|
shuffle_temporary[4] = VR[vt][4 + op - 0x12];
|
|
shuffle_temporary[6] = VR[vt][6 + op - 0x12];
|
|
target = *(v16 *)(&shuffle_temporary[0]);
|
|
target = _mm_shufflehi_epi16(target, _MM_SHUFFLE(2, 2, 0, 0));
|
|
target = _mm_shufflelo_epi16(target, _MM_SHUFFLE(2, 2, 0, 0));
|
|
#endif
|
|
*(v16 *)(VR[vd]) = COP2_C2[func](*(v16 *)VR[vs], target);
|
|
#else
|
|
for (i = 0; i < N; i++)
|
|
shuffle_temporary[i] = VR[vt][(i & 0xE) + (e & 0x1)];
|
|
COP2_C2[func](&VR[vs][0], &shuffle_temporary[0]);
|
|
vector_copy(&VR[vd][0], &V_result[0]);
|
|
#endif
|
|
break;
|
|
case 024:
|
|
case 025:
|
|
case 026:
|
|
case 027:
|
|
#ifdef ARCH_MIN_SSE2
|
|
#ifdef __ARM_NEON__
|
|
target = (v16)vcombine_s16(vdup_n_s16(VR[vt][0 + op - 0x14]),
|
|
vdup_n_s16(VR[vt][4 + op - 0x14]));
|
|
#else
|
|
target = _mm_setzero_si128();
|
|
target = _mm_insert_epi16(target, VR[vt][0 + op - 0x14], 0);
|
|
target = _mm_insert_epi16(target, VR[vt][4 + op - 0x14], 4);
|
|
target = _mm_shufflehi_epi16(target, _MM_SHUFFLE(0, 0, 0, 0));
|
|
target = _mm_shufflelo_epi16(target, _MM_SHUFFLE(0, 0, 0, 0));
|
|
#endif
|
|
*(v16 *)(VR[vd]) = COP2_C2[func](*(v16 *)VR[vs], target);
|
|
#else
|
|
for (i = 0; i < N; i++)
|
|
shuffle_temporary[i] = VR[vt][(i & 0xC) + (e & 0x3)];
|
|
COP2_C2[func](&VR[vs][0], &shuffle_temporary[0]);
|
|
vector_copy(&VR[vd][0], &V_result[0]);
|
|
#endif
|
|
break;
|
|
case 030:
|
|
case 031:
|
|
case 032:
|
|
case 033:
|
|
case 034:
|
|
case 035:
|
|
case 036:
|
|
case 037:
|
|
#ifdef ARCH_MIN_SSE2
|
|
*(v16 *)(VR[vd]) = COP2_C2[func](
|
|
*(v16 *)VR[vs],
|
|
_mm_set1_epi16(VR[vt][op - 0x18])
|
|
);
|
|
#else
|
|
for (i = 0; i < N; i++)
|
|
shuffle_temporary[i] = VR[vt][e % N];
|
|
COP2_C2[func](&VR[vs][0], &shuffle_temporary[0]);
|
|
vector_copy(&VR[vd][0], &V_result[0]);
|
|
#endif
|
|
break;
|
|
default:
|
|
res_S();
|
|
}
|
|
}
|
|
|
|
NOINLINE void run_task(void)
|
|
{
|
|
register u32 PC;
|
|
|
|
PC = FIT_IMEM(GET_RCP_REG(SP_PC_REG));
|
|
for (;;) {
|
|
inst_word = *(pi32)(IMEM + FIT_IMEM(PC));
|
|
#ifdef EMULATE_STATIC_PC
|
|
PC = (PC + 0x004);
|
|
EX:
|
|
#endif
|
|
#ifdef SP_EXECUTE_LOG
|
|
step_SP_commands(inst_word);
|
|
#endif
|
|
|
|
#if (0 != 0)
|
|
if (GET_RCP_REG(SP_STATUS_REG) & SP_STATUS_HALT)
|
|
goto RSP_halted_CPU_exit_point; /* Only BREAK and COP0 set this. */
|
|
SR[zero] = 0x00000000; /* already handled on per-instruction basis */
|
|
#endif
|
|
switch (inst_word >> 26) {
|
|
case 000: /* SPECIAL */
|
|
switch (SPECIAL(inst_word, PC)) {
|
|
case -1: /* BREAK */
|
|
goto RSP_halted_CPU_exit_point;
|
|
case +1: /* JR and JALR */
|
|
JUMP;
|
|
}
|
|
break;
|
|
case 001: /* REGIMM */
|
|
if (REGIMM(inst_word, PC) != 0)
|
|
JUMP;
|
|
break;
|
|
case 002:
|
|
J(inst_word);
|
|
JUMP;
|
|
case 003:
|
|
JAL(inst_word, PC);
|
|
JUMP;
|
|
case 004:
|
|
if (BEQ(inst_word, PC) != 0)
|
|
JUMP;
|
|
break;
|
|
case 005:
|
|
if (BNE(inst_word, PC) != 0)
|
|
JUMP;
|
|
break;
|
|
case 006:
|
|
if (BLEZ(inst_word, PC) != 0)
|
|
JUMP;
|
|
break;
|
|
case 007:
|
|
if (BGTZ(inst_word, PC) != 0)
|
|
JUMP;
|
|
break;
|
|
case 010: /* ADDI: Traps don't exist on the RCP. */
|
|
case 011:
|
|
ADDIU(inst_word);
|
|
break;
|
|
case 012:
|
|
SLTI(inst_word);
|
|
break;
|
|
case 013:
|
|
SLTIU(inst_word);
|
|
break;
|
|
case 014:
|
|
ANDI(inst_word);
|
|
break;
|
|
case 015:
|
|
ORI(inst_word);
|
|
break;
|
|
case 016:
|
|
XORI(inst_word);
|
|
break;
|
|
case 017:
|
|
LUI(inst_word);
|
|
break;
|
|
case 020:
|
|
COP0(inst_word);
|
|
if (GET_RCP_REG(SP_STATUS_REG) & SP_STATUS_HALT)
|
|
goto RSP_halted_CPU_exit_point;
|
|
break;
|
|
case 022:
|
|
COP2(inst_word);
|
|
break;
|
|
case 040:
|
|
LB(inst_word);
|
|
break;
|
|
case 041:
|
|
LH(inst_word);
|
|
break;
|
|
case 043:
|
|
LW(inst_word);
|
|
break;
|
|
case 044:
|
|
LBU(inst_word);
|
|
break;
|
|
case 045:
|
|
LHU(inst_word);
|
|
break;
|
|
case 050:
|
|
SB(inst_word);
|
|
break;
|
|
case 051:
|
|
SH(inst_word);
|
|
break;
|
|
case 053:
|
|
SW(inst_word);
|
|
break;
|
|
case 062: /* LWC2 */
|
|
MWC2_load(inst_word);
|
|
break;
|
|
case 072: /* SWC2 */
|
|
MWC2_store(inst_word);
|
|
break;
|
|
default:
|
|
res_S();
|
|
}
|
|
|
|
#ifndef EMULATE_STATIC_PC
|
|
if (stage == 2) { /* branch phase of scheduler */
|
|
stage = 0*stage;
|
|
PC = FIT_IMEM(temp_PC);
|
|
GET_RCP_REG(SP_PC_REG) = temp_PC;
|
|
} else {
|
|
stage = 2*stage; /* next IW in branch delay slot? */
|
|
PC = FIT_IMEM(PC + 0x004);
|
|
GET_RCP_REG(SP_PC_REG) = 0x04001000 + PC;
|
|
}
|
|
#else
|
|
continue;
|
|
set_branch_delay:
|
|
inst_word = *(pi32)(IMEM + FIT_IMEM(PC));
|
|
PC = FIT_IMEM(temp_PC);
|
|
goto EX;
|
|
#endif
|
|
}
|
|
RSP_halted_CPU_exit_point:
|
|
GET_RCP_REG(SP_PC_REG) = 0x04001000 | FIT_IMEM(PC);
|
|
return;
|
|
}
|