mirror of
https://github.com/libretro/ppsspp.git
synced 2024-12-15 21:18:12 +00:00
0ca8f5c655
Mostly affects games with a lot of modules and exports.
534 lines
12 KiB
C++
534 lines
12 KiB
C++
// Copyright (c) 2012- PPSSPP Project.
|
|
|
|
// This program is free software: you can redistribute it and/or modify
|
|
// it under the terms of the GNU General Public License as published by
|
|
// the Free Software Foundation, version 2.0 or later versions.
|
|
|
|
// This program is distributed in the hope that it will be useful,
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
// GNU General Public License 2.0 for more details.
|
|
|
|
// A copy of the GPL 2.0 should have been included with the program.
|
|
// If not, see http://www.gnu.org/licenses/
|
|
|
|
// Official git repository and contact information can be found at
|
|
// https://github.com/hrydgard/ppsspp and http://www.ppsspp.org/.
|
|
|
|
#include <map>
|
|
#include "../../Globals.h"
|
|
|
|
#include "MIPS.h"
|
|
#include "MIPSTables.h"
|
|
#include "MIPSAnalyst.h"
|
|
#include "MIPSCodeUtils.h"
|
|
#include "../Debugger/SymbolMap.h"
|
|
|
|
using namespace MIPSCodeUtils;
|
|
using namespace std;
|
|
|
|
namespace MIPSAnalyst
|
|
{
|
|
RegisterAnalysisResults regAnal[32];
|
|
RegisterAnalysisResults total[32];
|
|
int numAnalysisDone=0;
|
|
|
|
int GetOutReg(u32 op)
|
|
{
|
|
u32 opinfo = MIPSGetInfo(op);
|
|
if (opinfo & OUT_RT)
|
|
return MIPS_GET_RT(op);
|
|
if (opinfo & OUT_RD)
|
|
return MIPS_GET_RD(op);
|
|
if (opinfo & OUT_RA)
|
|
return MIPS_REG_RA;
|
|
return -1;
|
|
}
|
|
|
|
bool ReadsFromReg(u32 op, u32 reg)
|
|
{
|
|
u32 opinfo = MIPSGetInfo(op);
|
|
if (opinfo & IN_RT)
|
|
{
|
|
if (MIPS_GET_RT(opinfo) == reg)
|
|
return true;
|
|
}
|
|
if (opinfo & (IN_RS | IN_RS_ADDR | IN_RS_SHIFT))
|
|
{
|
|
if (MIPS_GET_RS(opinfo) == reg)
|
|
return true;
|
|
}
|
|
return false; //TODO: there are more cases!
|
|
}
|
|
|
|
// TODO: Remove me?
|
|
bool IsDelaySlotNice(u32 branch, u32 delayslot)
|
|
{
|
|
int outReg = GetOutReg(delayslot);
|
|
if (outReg != -1)
|
|
{
|
|
if (ReadsFromReg(branch, outReg))
|
|
{
|
|
return false; //evil :(
|
|
}
|
|
else
|
|
{
|
|
return false; //aggh this should be true but doesn't work
|
|
}
|
|
}
|
|
else
|
|
{
|
|
// Check for FPU flag
|
|
if ((MIPSGetInfo(delayslot) & OUT_FPUFLAG) && (MIPSGetInfo(branch) & IN_FPUFLAG))
|
|
return false;
|
|
|
|
return true; //nice :)
|
|
}
|
|
}
|
|
|
|
// Temporary, returns true for common ops which have proper flags in the table.
|
|
bool IsDelaySlotInfoSafe(u32 op)
|
|
{
|
|
const char *safeOps[] = {
|
|
"addi", "addiu", "slti", "sltiu", "andi", "ori", "xori", "lui",
|
|
"lb", "lh", "lwl", "lw", "lbu", "lhu", "lwr",
|
|
"sb", "sh", "swl", "sw", "swr",
|
|
"sll", "srl", "sra", "sllv", "srlv", "srav",
|
|
"add", "addu", "sub", "subu", "and", "or", "xor", "nor",
|
|
"slt", "sltu",
|
|
};
|
|
const char *opName = MIPSGetName(op);
|
|
for (size_t i = 0; i < ARRAY_SIZE(safeOps); ++i)
|
|
{
|
|
if (!strcmp(safeOps[i], opName))
|
|
return true;
|
|
}
|
|
|
|
return false;
|
|
}
|
|
|
|
bool IsDelaySlotNiceReg(u32 branchOp, u32 op, int reg1, int reg2)
|
|
{
|
|
// NOOPs are always nice.
|
|
if (op == 0)
|
|
return true;
|
|
|
|
// TODO: Once the flags are all correct on the tables, remove this safety.
|
|
if (IsDelaySlotInfoSafe(op))
|
|
{
|
|
// $0 is never an out reg, it's always 0.
|
|
if (reg1 != 0 && GetOutReg(op) == reg1)
|
|
return false;
|
|
if (reg2 != 0 && GetOutReg(op) == reg2)
|
|
return false;
|
|
|
|
return true;
|
|
}
|
|
|
|
return false;
|
|
}
|
|
|
|
bool IsDelaySlotNiceVFPU(u32 branchOp, u32 op)
|
|
{
|
|
// NOOPs are always nice.
|
|
if (op == 0)
|
|
return true;
|
|
|
|
// TODO: Once the flags are all correct on the tables, remove this safety.
|
|
if (IsDelaySlotInfoSafe(op))
|
|
{
|
|
// TODO: There may be IS_VFPU cases which are safe...
|
|
return (MIPSGetInfo(op) & IS_VFPU) == 0;
|
|
}
|
|
|
|
return false;
|
|
}
|
|
|
|
bool IsDelaySlotNiceFPU(u32 branchOp, u32 op)
|
|
{
|
|
// NOOPs are always nice.
|
|
if (op == 0)
|
|
return true;
|
|
|
|
// TODO: Once the flags are all correct on the tables, remove this safety.
|
|
if (IsDelaySlotInfoSafe(op))
|
|
return (MIPSGetInfo(op) & OUT_FPUFLAG) == 0;
|
|
|
|
return false;
|
|
}
|
|
|
|
bool IsSyscall(u32 op)
|
|
{
|
|
// Syscalls look like this: 0000 00-- ---- ---- ---- --00 1100
|
|
return (op >> 26) == 0 && (op & 0x3f) == 12;
|
|
}
|
|
|
|
void Analyze(u32 address)
|
|
{
|
|
//set everything to -1 (FF)
|
|
memset(regAnal, 255, sizeof(AnalysisResults)*32);
|
|
for (int i=0; i<32; i++)
|
|
{
|
|
regAnal[i].used=false;
|
|
regAnal[i].readCount=0;
|
|
regAnal[i].writeCount=0;
|
|
regAnal[i].readAsAddrCount=0;
|
|
}
|
|
|
|
u32 addr = address;
|
|
bool exitFlag = false;
|
|
while (true)
|
|
{
|
|
u32 op = Memory::Read_Instruction(addr);
|
|
u32 info = MIPSGetInfo(op);
|
|
|
|
for (int reg=0; reg < 32; reg++)
|
|
{
|
|
int rs = MIPS_GET_RS(op);
|
|
int rt = MIPS_GET_RT(op);
|
|
int rd = MIPS_GET_RD(op);
|
|
|
|
if (
|
|
((info & IN_RS) && (rs == reg)) ||
|
|
((info & IN_RS_SHIFT) && (rs == reg)) ||
|
|
((info & IN_RT) && (rt == reg)))
|
|
{
|
|
if (regAnal[reg].firstRead == -1)
|
|
regAnal[reg].firstRead = addr;
|
|
regAnal[reg].lastRead = addr;
|
|
regAnal[reg].readCount++;
|
|
regAnal[reg].used=true;
|
|
}
|
|
if (
|
|
((info & IN_RS_ADDR) && (rs == reg))
|
|
)
|
|
{
|
|
if (regAnal[reg].firstReadAsAddr == -1)
|
|
regAnal[reg].firstReadAsAddr = addr;
|
|
regAnal[reg].lastReadAsAddr = addr;
|
|
regAnal[reg].readAsAddrCount++;
|
|
regAnal[reg].used=true;
|
|
}
|
|
if (
|
|
((info & OUT_RT) && (rt == reg)) ||
|
|
((info & OUT_RD) && (rd == reg)) ||
|
|
((info & OUT_RA) && (reg == MIPS_REG_RA))
|
|
)
|
|
{
|
|
if (regAnal[reg].firstWrite == -1)
|
|
regAnal[reg].firstWrite = addr;
|
|
regAnal[reg].lastWrite = addr;
|
|
regAnal[reg].writeCount++;
|
|
regAnal[reg].used=true;
|
|
}
|
|
}
|
|
|
|
if (exitFlag) //delay slot done, let's quit!
|
|
break;
|
|
|
|
if ((info & IS_JUMP) || (info & IS_CONDBRANCH))
|
|
{
|
|
exitFlag = true; // now do the delay slot
|
|
}
|
|
|
|
addr += 4;
|
|
}
|
|
|
|
int numUsedRegs=0;
|
|
static int totalUsedRegs=0;
|
|
static int numAnalyzings=0;
|
|
for (int i=0; i<32; i++)
|
|
{
|
|
if (regAnal[i].used)
|
|
numUsedRegs++;
|
|
}
|
|
totalUsedRegs+=numUsedRegs;
|
|
numAnalyzings++;
|
|
DEBUG_LOG(CPU,"[ %08x ] Used regs: %i Average: %f",address,numUsedRegs,(float)totalUsedRegs/(float)numAnalyzings);
|
|
}
|
|
|
|
|
|
struct Function
|
|
{
|
|
u32 start;
|
|
u32 end;
|
|
u32 hash;
|
|
u32 size;
|
|
bool isStraightLeaf;
|
|
bool hasHash;
|
|
bool usesVFPU;
|
|
char name[64];
|
|
};
|
|
|
|
vector<Function> functions;
|
|
|
|
map<u32, Function*> hashToFunction;
|
|
|
|
void Shutdown()
|
|
{
|
|
functions.clear();
|
|
hashToFunction.clear();
|
|
}
|
|
|
|
// hm pointless :P
|
|
void UpdateHashToFunctionMap()
|
|
{
|
|
hashToFunction.clear();
|
|
for (vector<Function>::iterator iter = functions.begin(); iter != functions.end(); iter++)
|
|
{
|
|
Function &f = *iter;
|
|
if (f.hasHash)
|
|
{
|
|
hashToFunction[f.hash] = &f;
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
bool IsRegisterUsed(u32 reg, u32 addr)
|
|
{
|
|
while (true)
|
|
{
|
|
u32 op = Memory::Read_Instruction(addr);
|
|
u32 info = MIPSGetInfo(op);
|
|
|
|
if (
|
|
((info & IN_RS) ||
|
|
(info & IN_RS_SHIFT) ||
|
|
(info & IN_RS_ADDR))
|
|
&&
|
|
(MIPS_GET_RS(op) == reg)
|
|
)
|
|
return true;
|
|
if ((info & IN_RT) && (MIPS_GET_RT(op) == reg))
|
|
return true;
|
|
if ((info & IS_CONDBRANCH))
|
|
return true; // could also follow both paths
|
|
if ((info & IS_JUMP))
|
|
return true; // could also follow the path
|
|
if ((info & OUT_RT) && (MIPS_GET_RT(op) == reg))
|
|
return false; //the reg got clobbed! yay!
|
|
if ((info & OUT_RD) && (MIPS_GET_RD(op) == reg))
|
|
return false; //the reg got clobbed! yay!
|
|
if ((info & OUT_RA) && (reg == MIPS_REG_RA))
|
|
return false; //the reg got clobbed! yay!
|
|
addr+=4;
|
|
}
|
|
return true;
|
|
}
|
|
|
|
void HashFunctions()
|
|
{
|
|
for (vector<Function>::iterator iter = functions.begin(); iter!=functions.end(); iter++)
|
|
{
|
|
Function &f=*iter;
|
|
u32 hash = 0x1337babe;
|
|
for (u32 addr = f.start; addr <= f.end; addr += 4)
|
|
{
|
|
u32 validbits = 0xFFFFFFFF;
|
|
u32 instr = Memory::Read_Instruction(addr);
|
|
u32 flags = MIPSGetInfo(instr);
|
|
if (flags & IN_IMM16)
|
|
validbits&=~0xFFFF;
|
|
if (flags & IN_IMM26)
|
|
validbits&=~0x3FFFFFF;
|
|
hash = __rotl(hash,13);
|
|
hash ^= (instr&validbits);
|
|
}
|
|
f.hash=hash;
|
|
f.hasHash=true;
|
|
}
|
|
}
|
|
|
|
void ScanForFunctions(u32 startAddr, u32 endAddr /*, std::vector<u32> knownEntries*/)
|
|
{
|
|
Function currentFunction = {startAddr};
|
|
|
|
u32 furthestBranch = 0;
|
|
bool looking = false;
|
|
bool end = false;
|
|
bool isStraightLeaf=true;
|
|
u32 addr;
|
|
for (addr = startAddr; addr<=endAddr; addr+=4)
|
|
{
|
|
SymbolInfo syminfo;
|
|
if (symbolMap.GetSymbolInfo(&syminfo, addr, ST_FUNCTION))
|
|
{
|
|
addr = syminfo.address + syminfo.size;
|
|
continue;
|
|
}
|
|
|
|
u32 op = Memory::Read_Instruction(addr);
|
|
u32 target = GetBranchTargetNoRA(addr);
|
|
if (target != INVALIDTARGET)
|
|
{
|
|
isStraightLeaf = false;
|
|
if (target > furthestBranch)
|
|
{
|
|
furthestBranch = target;
|
|
}
|
|
}
|
|
if (op == MIPS_MAKE_JR_RA())
|
|
{
|
|
if (furthestBranch >= addr)
|
|
{
|
|
looking = true;
|
|
addr+=4;
|
|
}
|
|
else
|
|
{
|
|
end = true;
|
|
}
|
|
}
|
|
|
|
if (looking)
|
|
{
|
|
if (addr >= furthestBranch)
|
|
{
|
|
u32 sureTarget = GetSureBranchTarget(addr);
|
|
if (sureTarget != INVALIDTARGET && sureTarget < addr)
|
|
{
|
|
end = true;
|
|
}
|
|
sureTarget = GetJumpTarget(addr);
|
|
if (sureTarget != INVALIDTARGET && sureTarget < addr && ((op&0xFC000000)==0x08000000))
|
|
{
|
|
end = true;
|
|
}
|
|
//end = true;
|
|
}
|
|
}
|
|
if (end)
|
|
{
|
|
currentFunction.end = addr + 4;
|
|
currentFunction.isStraightLeaf = isStraightLeaf;
|
|
functions.push_back(currentFunction);
|
|
furthestBranch = 0;
|
|
addr += 4;
|
|
looking = false;
|
|
end = false;
|
|
isStraightLeaf=true;
|
|
currentFunction.start = addr+4;
|
|
}
|
|
}
|
|
currentFunction.end = addr + 4;
|
|
functions.push_back(currentFunction);
|
|
|
|
for (vector<Function>::iterator iter = functions.begin(); iter!=functions.end(); iter++)
|
|
{
|
|
(*iter).size = ((*iter).end-(*iter).start+4);
|
|
char temp[256];
|
|
sprintf(temp,"z_un_%08x",(*iter).start);
|
|
symbolMap.AddSymbol(std::string(temp).c_str(), (*iter).start,(*iter).end-(*iter).start+4,ST_FUNCTION);
|
|
}
|
|
HashFunctions();
|
|
}
|
|
|
|
struct HashMapFunc
|
|
{
|
|
char name[64];
|
|
u32 hash;
|
|
u32 size; //number of bytes
|
|
};
|
|
|
|
void StoreHashMap(const char *filename)
|
|
{
|
|
FILE *file = fopen(filename,"wb");
|
|
u32 num = 0;
|
|
if(fwrite(&num,4,1,file) != 1) //fill in later
|
|
WARN_LOG(CPU, "Could not store hash map %s", filename);
|
|
|
|
for (vector<Function>::iterator iter = functions.begin(); iter!=functions.end(); iter++)
|
|
{
|
|
Function &f=*iter;
|
|
if (f.hasHash && f.size>=12)
|
|
{
|
|
HashMapFunc temp;
|
|
memset(&temp,0,sizeof(temp));
|
|
strcpy(temp.name, f.name);
|
|
temp.hash=f.hash;
|
|
temp.size=f.size;
|
|
if(fwrite((char*)&temp,sizeof(temp),1,file) != 1) {
|
|
WARN_LOG(CPU, "Could not store hash map %s", filename);
|
|
break;
|
|
}
|
|
num++;
|
|
}
|
|
}
|
|
fseek(file,0,SEEK_SET);
|
|
if(fwrite(&num,4,1,file) != 1) //fill in later
|
|
WARN_LOG(CPU, "Could not store hash map %s", filename);
|
|
fclose(file);
|
|
}
|
|
|
|
|
|
void LoadHashMap(const char *filename)
|
|
{
|
|
HashFunctions();
|
|
UpdateHashToFunctionMap();
|
|
|
|
FILE *file = fopen(filename, "rb");
|
|
int num;
|
|
if(fread(&num,4,1,file) == 1) {
|
|
for (int i=0; i<num; i++)
|
|
{
|
|
HashMapFunc temp;
|
|
if(fread(&temp,sizeof(temp),1,file) == 1) {
|
|
map<u32,Function*>::iterator iter = hashToFunction.find(temp.hash);
|
|
if (iter != hashToFunction.end())
|
|
{
|
|
//yay, found a function!
|
|
Function &f = *(iter->second);
|
|
if (f.size==temp.size)
|
|
{
|
|
strcpy(f.name, temp.name);
|
|
f.hash=temp.hash;
|
|
f.size=temp.size;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
fclose(file);
|
|
}
|
|
void CompileLeafs()
|
|
{
|
|
/*
|
|
int count=0;
|
|
for (vector<Function>::iterator iter = functions.begin(); iter!=functions.end(); iter++)
|
|
{
|
|
Function &f = *iter;
|
|
if (f.isStraightLeaf)
|
|
{
|
|
MIPSComp::CompileAt(f.start);
|
|
count++;
|
|
}
|
|
}
|
|
LOG(CPU,"Precompiled %i straight leaf functions",count);*/
|
|
}
|
|
|
|
std::vector<int> GetInputRegs(u32 op)
|
|
{
|
|
std::vector<int> vec;
|
|
u32 info = MIPSGetInfo(op);
|
|
if ((info & IS_VFPU) == 0)
|
|
{
|
|
if (info & IN_RS) vec.push_back(MIPS_GET_RS(op));
|
|
if (info & IN_RT) vec.push_back(MIPS_GET_RT(op));
|
|
}
|
|
return vec;
|
|
}
|
|
std::vector<int> GetOutputRegs(u32 op)
|
|
{
|
|
std::vector<int> vec;
|
|
u32 info = MIPSGetInfo(op);
|
|
if ((info & IS_VFPU) == 0)
|
|
{
|
|
if (info & OUT_RD) vec.push_back(MIPS_GET_RD(op));
|
|
if (info & OUT_RT) vec.push_back(MIPS_GET_RT(op));
|
|
if (info & OUT_RA) vec.push_back(MIPS_REG_RA);
|
|
}
|
|
return vec;
|
|
}
|
|
}
|