mirror of
https://github.com/libretro/ppsspp.git
synced 2025-01-23 09:34:55 +00:00
Add missing cases to simplify pass
This commit is contained in:
parent
f544364c4a
commit
dc772e6f3a
@ -520,6 +520,14 @@ bool PropagateConstants(const IRWriter &in, IRWriter &out) {
|
||||
case IROp::Vec4Shuffle:
|
||||
case IROp::Vec4Neg:
|
||||
case IROp::Vec4Abs:
|
||||
case IROp::Vec4Pack31To8:
|
||||
case IROp::Vec4Pack32To8:
|
||||
case IROp::Vec2Pack32To16:
|
||||
case IROp::Vec4Unpack8To32:
|
||||
case IROp::Vec2Unpack16To32:
|
||||
case IROp::Vec4DuplicateUpperBitsAndShift1:
|
||||
case IROp::Vec2ClampToZero:
|
||||
case IROp::Vec4ClampToZero:
|
||||
out.Write(inst);
|
||||
break;
|
||||
|
||||
|
294
Core/MIPS/x86/IRToX86.cpp
Normal file
294
Core/MIPS/x86/IRToX86.cpp
Normal file
@ -0,0 +1,294 @@
|
||||
#include "Core/MIPS/x86/IRToX86.h"
|
||||
|
||||
namespace MIPSComp {
|
||||
|
||||
// Initial attempt at converting IR directly to x86.
|
||||
// This is intended to be an easy way to benefit from the IR with the current infrastructure.
|
||||
// Later tries may go across multiple blocks and a different representation.
|
||||
|
||||
struct GPRMapping {
|
||||
Gen::OpArg dest;
|
||||
Gen::OpArg src1;
|
||||
Gen::OpArg src2;
|
||||
};
|
||||
|
||||
struct FPRMapping {
|
||||
Gen::OpArg dest;
|
||||
Gen::OpArg src1;
|
||||
Gen::OpArg src2;
|
||||
};
|
||||
|
||||
|
||||
class GreedyRegallocGPR {
|
||||
public:
|
||||
GPRMapping Map(IRInst inst, const IRMeta &meta);
|
||||
|
||||
private:
|
||||
|
||||
};
|
||||
|
||||
|
||||
GPRMapping GreedyRegallocGPR::Map(IRInst inst, const IRMeta &meta) {
|
||||
GPRMapping mapping;
|
||||
if (meta.types[0] == 'G') {
|
||||
|
||||
}
|
||||
// etc..
|
||||
return mapping;
|
||||
}
|
||||
|
||||
// Every 4 registers can also be mapped into an SSE register.
|
||||
// When changing from single to vec4 mapping, we'll just flush, for now.
|
||||
class GreedyRegallocFPR {
|
||||
public:
|
||||
FPRMapping Map(IRInst inst, const IRMeta &meta);
|
||||
};
|
||||
|
||||
FPRMapping GreedyRegallocFPR::Map(IRInst inst, const IRMeta &meta) {
|
||||
FPRMapping mapping;
|
||||
|
||||
return mapping;
|
||||
}
|
||||
|
||||
|
||||
// This requires that ThreeOpToTwoOp has been run as the last pass.
|
||||
void IRToX86::ConvertIRToNative(const IRInst *instructions, int count, const u32 *constants) {
|
||||
// Set up regcaches
|
||||
using namespace Gen;
|
||||
|
||||
GreedyRegallocGPR gprAlloc;
|
||||
GreedyRegallocFPR fprAlloc;
|
||||
|
||||
// Loop through all the instructions, emitting code as we go.
|
||||
// Note that we do need to implement them all - fallbacks are not permitted.
|
||||
for (int i = 0; i < count; i++) {
|
||||
const IRInst *inst = &instructions[i];
|
||||
const IRMeta &meta = *GetIRMeta(inst->op);
|
||||
GPRMapping gpr = gprAlloc.Map(*inst, meta);
|
||||
FPRMapping fpr = fprAlloc.Map(*inst, meta);
|
||||
|
||||
bool symmetric = false;
|
||||
switch (inst->op) {
|
||||
case IROp::Nop:
|
||||
_assert_(false);
|
||||
break;
|
||||
|
||||
// Output-only
|
||||
case IROp::SetConst:
|
||||
code_->MOV(32, gpr.dest, Imm32(constants[inst->src1]));
|
||||
break;
|
||||
case IROp::SetConstF:
|
||||
code_->MOV(32, gpr.dest, Imm32(constants[inst->src1]));
|
||||
break;
|
||||
|
||||
// Add gets to be special cased because we have LEA.
|
||||
case IROp::Add:
|
||||
if (gpr.dest.IsSimpleReg() && gpr.src1.IsSimpleReg() && gpr.src2.IsSimpleReg()) {
|
||||
code_->LEA(32, gpr.dest.GetSimpleReg(), MRegSum(gpr.src1.GetSimpleReg(), gpr.src2.GetSimpleReg()));
|
||||
break;
|
||||
}
|
||||
// Else fall through.
|
||||
// 3-op arithmetic that directly corresponds to x86
|
||||
// (often 2-op in practice if src1 == dst). x86 only does 2-op though so some of these will need splitting.
|
||||
case IROp::Sub:
|
||||
case IROp::And:
|
||||
case IROp::Or:
|
||||
case IROp::Xor:
|
||||
if (inst->src1 != inst->dest) {
|
||||
code_->MOV(32, gpr.dest, gpr.src1);
|
||||
}
|
||||
// Emit directly
|
||||
switch (inst->op) {
|
||||
case IROp::Add: code_->ADD(32, gpr.dest, gpr.src2); break;
|
||||
case IROp::Sub: code_->SUB(32, gpr.dest, gpr.src2); break;
|
||||
case IROp::And: code_->AND(32, gpr.dest, gpr.src2); break;
|
||||
case IROp::Or: code_->OR(32, gpr.dest, gpr.src2); break;
|
||||
case IROp::Xor: code_->XOR(32, gpr.dest, gpr.src2); break;
|
||||
}
|
||||
break;
|
||||
|
||||
// Variable shifts.
|
||||
case IROp::Shl:
|
||||
case IROp::Shr:
|
||||
case IROp::Sar:
|
||||
case IROp::Ror:
|
||||
|
||||
case IROp::Slt:
|
||||
case IROp::SltU:
|
||||
case IROp::MovZ:
|
||||
case IROp::MovNZ:
|
||||
case IROp::Max:
|
||||
case IROp::Min:
|
||||
break;
|
||||
|
||||
// 2-op arithmetic with constant
|
||||
case IROp::AddConst:
|
||||
case IROp::SubConst:
|
||||
case IROp::AndConst:
|
||||
case IROp::OrConst:
|
||||
case IROp::XorConst:
|
||||
case IROp::SltConst:
|
||||
case IROp::SltUConst:
|
||||
|
||||
// 2-op arithmetic with immediate
|
||||
case IROp::ShlImm:
|
||||
case IROp::ShrImm:
|
||||
case IROp::SarImm:
|
||||
case IROp::RorImm:
|
||||
|
||||
// 2-op arithmetic
|
||||
case IROp::Mov:
|
||||
code_->MOV(32, gpr.dest, gpr.src1);
|
||||
break;
|
||||
|
||||
case IROp::Neg:
|
||||
case IROp::Not:
|
||||
case IROp::Ext8to32:
|
||||
case IROp::Ext16to32:
|
||||
case IROp::ReverseBits:
|
||||
case IROp::BSwap16:
|
||||
case IROp::BSwap32:
|
||||
case IROp::Clz:
|
||||
if (inst->dest != inst->src1) {
|
||||
code_->NEG(32, gpr.dest); break;
|
||||
}
|
||||
break;
|
||||
// Multiplier control
|
||||
case IROp::MtLo:
|
||||
case IROp::MtHi:
|
||||
case IROp::MfLo:
|
||||
case IROp::MfHi:
|
||||
case IROp::Mult:
|
||||
case IROp::MultU:
|
||||
case IROp::Madd:
|
||||
case IROp::MaddU:
|
||||
case IROp::Msub:
|
||||
case IROp::MsubU:
|
||||
case IROp::Div:
|
||||
case IROp::DivU:
|
||||
|
||||
// Memory access
|
||||
case IROp::Load8:
|
||||
case IROp::Load8Ext:
|
||||
case IROp::Load16:
|
||||
case IROp::Load16Ext:
|
||||
case IROp::Load32:
|
||||
case IROp::LoadFloat:
|
||||
case IROp::Store8:
|
||||
case IROp::Store16:
|
||||
case IROp::Store32:
|
||||
case IROp::StoreFloat:
|
||||
case IROp::LoadVec4:
|
||||
case IROp::StoreVec4:
|
||||
|
||||
// Output-only SIMD functions
|
||||
case IROp::Vec4Init:
|
||||
case IROp::Vec4Shuffle:
|
||||
|
||||
// 2-op SIMD functions
|
||||
case IROp::Vec4Mov:
|
||||
code_->MOVAPS(fpr.dest.GetSimpleReg(), fpr.src1);
|
||||
break;
|
||||
case IROp::Vec4Neg:
|
||||
case IROp::Vec4Abs:
|
||||
break;
|
||||
case IROp::Vec4ClampToZero:
|
||||
code_->PXOR(XMM0, R(XMM0));
|
||||
code_->PMAXSW(XMM0, fpr.src1);
|
||||
code_->MOVAPD(fpr.dest, XMM0);
|
||||
break;
|
||||
case IROp::Vec4DuplicateUpperBitsAndShift1:
|
||||
case IROp::Vec2ClampToZero:
|
||||
|
||||
// 3-op SIMD functions
|
||||
case IROp::Vec4Add:
|
||||
case IROp::Vec4Sub:
|
||||
case IROp::Vec4Mul:
|
||||
case IROp::Vec4Div:
|
||||
|
||||
case IROp::Vec4Scale:
|
||||
case IROp::Vec4Dot:
|
||||
|
||||
// Pack-unpack
|
||||
case IROp::Vec2Unpack16To31:
|
||||
case IROp::Vec2Unpack16To32:
|
||||
case IROp::Vec4Unpack8To32:
|
||||
case IROp::Vec2Pack32To16:
|
||||
case IROp::Vec2Pack31To16:
|
||||
case IROp::Vec4Pack32To8:
|
||||
case IROp::Vec4Pack31To8:
|
||||
|
||||
case IROp::FCmpVfpuBit:
|
||||
case IROp::FCmpVfpuAggregate:
|
||||
case IROp::FCmovVfpuCC:
|
||||
|
||||
// Trancendental functions (non-simd)
|
||||
case IROp::FSin:
|
||||
case IROp::FCos:
|
||||
case IROp::FRSqrt:
|
||||
case IROp::FRecip:
|
||||
case IROp::FAsin:
|
||||
|
||||
// 3-Op FP
|
||||
case IROp::FAdd:
|
||||
case IROp::FSub:
|
||||
case IROp::FMul:
|
||||
case IROp::FDiv:
|
||||
case IROp::FMin:
|
||||
case IROp::FMax:
|
||||
|
||||
// 2-Op FP
|
||||
case IROp::FMov:
|
||||
case IROp::FAbs:
|
||||
case IROp::FSqrt:
|
||||
case IROp::FNeg:
|
||||
case IROp::FSat0_1:
|
||||
case IROp::FSatMinus1_1:
|
||||
case IROp::FSign:
|
||||
case IROp::FCeil:
|
||||
case IROp::FFloor:
|
||||
case IROp::FCmp:
|
||||
case IROp::FCvtSW:
|
||||
case IROp::FCvtWS:
|
||||
case IROp::FRound:
|
||||
case IROp::FTrunc:
|
||||
|
||||
// Cross moves
|
||||
case IROp::FMovFromGPR:
|
||||
case IROp::FMovToGPR:
|
||||
case IROp::FpCondToReg:
|
||||
case IROp::VfpuCtrlToReg:
|
||||
|
||||
// VFPU flag/control
|
||||
case IROp::SetCtrlVFPU:
|
||||
case IROp::SetCtrlVFPUReg:
|
||||
case IROp::SetCtrlVFPUFReg:
|
||||
case IROp::ZeroFpCond:
|
||||
|
||||
// Block Exits
|
||||
case IROp::ExitToConst:
|
||||
case IROp::ExitToReg:
|
||||
case IROp::ExitToConstIfEq:
|
||||
case IROp::ExitToConstIfNeq:
|
||||
case IROp::ExitToConstIfGtZ:
|
||||
case IROp::ExitToConstIfGeZ:
|
||||
case IROp::ExitToConstIfLtZ:
|
||||
case IROp::ExitToConstIfLeZ:
|
||||
case IROp::ExitToPC:
|
||||
|
||||
// Utilities
|
||||
case IROp::Downcount:
|
||||
case IROp::SetPC:
|
||||
case IROp::SetPCConst:
|
||||
case IROp::Syscall:
|
||||
case IROp::Interpret: // SLOW fallback. Can be made faster.
|
||||
case IROp::CallReplacement:
|
||||
case IROp::Break:
|
||||
default:
|
||||
break;
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
|
||||
} // namespace
|
23
Core/MIPS/x86/IRToX86.h
Normal file
23
Core/MIPS/x86/IRToX86.h
Normal file
@ -0,0 +1,23 @@
|
||||
#include "Core/MIPS/IR/IRInst.h"
|
||||
#include "Common/x64Emitter.h"
|
||||
|
||||
namespace MIPSComp {
|
||||
|
||||
class IRToNativeInterface {
|
||||
public:
|
||||
virtual ~IRToNativeInterface() {}
|
||||
|
||||
virtual void ConvertIRToNative(const IRInst *instructions, int count, const u32 *constants) = 0;
|
||||
};
|
||||
|
||||
|
||||
class IRToX86 : public IRToNativeInterface {
|
||||
public:
|
||||
void SetCodeBlock(Gen::XCodeBlock *code) { code_ = code; }
|
||||
virtual void ConvertIRToNative(const IRInst *instructions, int count, const u32 *constants) override;
|
||||
|
||||
private:
|
||||
Gen::XCodeBlock *code_;
|
||||
};
|
||||
|
||||
} // namespace
|
Loading…
x
Reference in New Issue
Block a user