mirror of
https://github.com/RPCSX/llvm.git
synced 2024-11-25 12:50:00 +00:00
LocalStackSlotAllocation improvements
First, taking advantage of the fact that the virtual base registers are allocated in order of the local frame offsets, remove the quadratic register-searching behavior. Because of the ordering, we only need to check the last virtual base register created. Second, store the frame index in the FrameRef structure, and get the frame index and the local offset from this structure at the top of the loop iteration. This allows us to de-nest the loops in insertFrameReferenceRegisters (and I think makes the code cleaner). I also moved the needsFrameBaseReg check into the first loop over instructions so that we don't bother pushing FrameRefs for instructions that don't want a virtual base register anyway. Lastly, and this is the only functionality change, avoid the creation of single-use virtual base registers. These are currently not useful because, in general, they end up replacing what would be one r+r instruction with an add and a r+i instruction. Committing this removes the XFAIL in CodeGen/PowerPC/2007-09-07-LoadStoreIdxForms.ll Jim has okayed this off-list. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@180799 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
parent
34f39841d3
commit
db31bd31d6
@ -46,13 +46,16 @@ namespace {
|
||||
class FrameRef {
|
||||
MachineBasicBlock::iterator MI; // Instr referencing the frame
|
||||
int64_t LocalOffset; // Local offset of the frame idx referenced
|
||||
int FrameIdx; // The frame index
|
||||
public:
|
||||
FrameRef(MachineBasicBlock::iterator I, int64_t Offset) :
|
||||
MI(I), LocalOffset(Offset) {}
|
||||
FrameRef(MachineBasicBlock::iterator I, int64_t Offset, int Idx) :
|
||||
MI(I), LocalOffset(Offset), FrameIdx(Idx) {}
|
||||
bool operator<(const FrameRef &RHS) const {
|
||||
return LocalOffset < RHS.LocalOffset;
|
||||
}
|
||||
MachineBasicBlock::iterator getMachineInstr() { return MI; }
|
||||
MachineBasicBlock::iterator getMachineInstr() const { return MI; }
|
||||
int64_t getLocalOffset() const { return LocalOffset; }
|
||||
int getFrameIndex() const { return FrameIdx; }
|
||||
};
|
||||
|
||||
class LocalStackSlotPass: public MachineFunctionPass {
|
||||
@ -194,22 +197,15 @@ void LocalStackSlotPass::calculateFrameObjectOffsets(MachineFunction &Fn) {
|
||||
}
|
||||
|
||||
static inline bool
|
||||
lookupCandidateBaseReg(const SmallVector<std::pair<unsigned, int64_t>, 8> &Regs,
|
||||
std::pair<unsigned, int64_t> &RegOffset,
|
||||
lookupCandidateBaseReg(int64_t BaseOffset,
|
||||
int64_t FrameSizeAdjust,
|
||||
int64_t LocalFrameOffset,
|
||||
const MachineInstr *MI,
|
||||
const TargetRegisterInfo *TRI) {
|
||||
unsigned e = Regs.size();
|
||||
for (unsigned i = 0; i < e; ++i) {
|
||||
RegOffset = Regs[i];
|
||||
// Check if the relative offset from the where the base register references
|
||||
// to the target address is in range for the instruction.
|
||||
int64_t Offset = FrameSizeAdjust + LocalFrameOffset - RegOffset.second;
|
||||
if (TRI->isFrameOffsetLegal(MI, Offset))
|
||||
return true;
|
||||
}
|
||||
return false;
|
||||
int64_t Offset = FrameSizeAdjust + LocalFrameOffset - BaseOffset;
|
||||
return TRI->isFrameOffsetLegal(MI, Offset);
|
||||
}
|
||||
|
||||
bool LocalStackSlotPass::insertFrameReferenceRegisters(MachineFunction &Fn) {
|
||||
@ -233,9 +229,6 @@ bool LocalStackSlotPass::insertFrameReferenceRegisters(MachineFunction &Fn) {
|
||||
// choose the first one).
|
||||
SmallVector<FrameRef, 64> FrameReferenceInsns;
|
||||
|
||||
// A base register definition is a register + offset pair.
|
||||
SmallVector<std::pair<unsigned, int64_t>, 8> BaseRegisters;
|
||||
|
||||
for (MachineFunction::iterator BB = Fn.begin(), E = Fn.end(); BB != E; ++BB) {
|
||||
for (MachineBasicBlock::iterator I = BB->begin(); I != BB->end(); ++I) {
|
||||
MachineInstr *MI = I;
|
||||
@ -258,8 +251,12 @@ bool LocalStackSlotPass::insertFrameReferenceRegisters(MachineFunction &Fn) {
|
||||
// Don't try this with values not in the local block.
|
||||
if (!MFI->isObjectPreAllocated(MI->getOperand(i).getIndex()))
|
||||
break;
|
||||
int Idx = MI->getOperand(i).getIndex();
|
||||
int64_t LocalOffset = LocalOffsets[Idx];
|
||||
if (!TRI->needsFrameBaseReg(MI, LocalOffset))
|
||||
break;
|
||||
FrameReferenceInsns.
|
||||
push_back(FrameRef(MI, LocalOffsets[MI->getOperand(i).getIndex()]));
|
||||
push_back(FrameRef(MI, LocalOffset, Idx));
|
||||
break;
|
||||
}
|
||||
}
|
||||
@ -271,26 +268,34 @@ bool LocalStackSlotPass::insertFrameReferenceRegisters(MachineFunction &Fn) {
|
||||
|
||||
MachineBasicBlock *Entry = Fn.begin();
|
||||
|
||||
unsigned BaseReg = 0;
|
||||
int64_t BaseOffset = 0;
|
||||
|
||||
// Loop through the frame references and allocate for them as necessary.
|
||||
for (int ref = 0, e = FrameReferenceInsns.size(); ref < e ; ++ref) {
|
||||
MachineBasicBlock::iterator I =
|
||||
FrameReferenceInsns[ref].getMachineInstr();
|
||||
FrameRef &FR = FrameReferenceInsns[ref];
|
||||
MachineBasicBlock::iterator I = FR.getMachineInstr();
|
||||
MachineInstr *MI = I;
|
||||
for (unsigned idx = 0, e = MI->getNumOperands(); idx != e; ++idx) {
|
||||
// Consider replacing all frame index operands that reference
|
||||
// an object allocated in the local block.
|
||||
if (MI->getOperand(idx).isFI()) {
|
||||
int FrameIdx = MI->getOperand(idx).getIndex();
|
||||
|
||||
int64_t LocalOffset = FR.getLocalOffset();
|
||||
int FrameIdx = FR.getFrameIndex();
|
||||
assert(MFI->isObjectPreAllocated(FrameIdx) &&
|
||||
"Only pre-allocated locals expected!");
|
||||
|
||||
DEBUG(dbgs() << "Considering: " << *MI);
|
||||
if (TRI->needsFrameBaseReg(MI, LocalOffsets[FrameIdx])) {
|
||||
unsigned BaseReg = 0;
|
||||
|
||||
unsigned idx = 0;
|
||||
for (unsigned f = MI->getNumOperands(); idx != f; ++idx) {
|
||||
if (!MI->getOperand(idx).isFI())
|
||||
continue;
|
||||
|
||||
if (FrameIdx == I->getOperand(idx).getIndex())
|
||||
break;
|
||||
}
|
||||
|
||||
assert(idx < MI->getNumOperands() && "Cannot find FI operand");
|
||||
|
||||
int64_t Offset = 0;
|
||||
int64_t FrameSizeAdjust =
|
||||
StackGrowsDown ? MFI->getLocalFrameSize() : 0;
|
||||
int64_t FrameSizeAdjust = StackGrowsDown ? MFI->getLocalFrameSize() : 0;
|
||||
|
||||
DEBUG(dbgs() << " Replacing FI in: " << *MI);
|
||||
|
||||
@ -299,28 +304,46 @@ bool LocalStackSlotPass::insertFrameReferenceRegisters(MachineFunction &Fn) {
|
||||
// instruction itself will be taken into account by the target,
|
||||
// so we don't have to adjust for it here when reusing a base
|
||||
// register.
|
||||
std::pair<unsigned, int64_t> RegOffset;
|
||||
if (lookupCandidateBaseReg(BaseRegisters, RegOffset,
|
||||
FrameSizeAdjust,
|
||||
LocalOffsets[FrameIdx],
|
||||
MI, TRI)) {
|
||||
DEBUG(dbgs() << " Reusing base register " <<
|
||||
RegOffset.first << "\n");
|
||||
if (UsedBaseReg && lookupCandidateBaseReg(BaseOffset, FrameSizeAdjust,
|
||||
LocalOffset, MI, TRI)) {
|
||||
DEBUG(dbgs() << " Reusing base register " << BaseReg << "\n");
|
||||
// We found a register to reuse.
|
||||
BaseReg = RegOffset.first;
|
||||
Offset = FrameSizeAdjust + LocalOffsets[FrameIdx] -
|
||||
RegOffset.second;
|
||||
Offset = FrameSizeAdjust + LocalOffset - BaseOffset;
|
||||
} else {
|
||||
// No previously defined register was in range, so create a
|
||||
// new one.
|
||||
// No previously defined register was in range, so create a // new one.
|
||||
|
||||
int64_t InstrOffset = TRI->getFrameIndexInstrOffset(MI, idx);
|
||||
|
||||
int64_t PrevBaseOffset = BaseOffset;
|
||||
BaseOffset = FrameSizeAdjust + LocalOffset + InstrOffset;
|
||||
|
||||
// We'd like to avoid creating single-use virtual base registers.
|
||||
// Because the FrameRefs are in sorted order, and we've already
|
||||
// processed all FrameRefs before this one, just check whether or not
|
||||
// the next FrameRef will be able to reuse this new register. If not,
|
||||
// then don't bother creating it.
|
||||
bool CanReuse = false;
|
||||
for (int refn = ref + 1; refn < e; ++refn) {
|
||||
FrameRef &FRN = FrameReferenceInsns[refn];
|
||||
MachineBasicBlock::iterator J = FRN.getMachineInstr();
|
||||
MachineInstr *MIN = J;
|
||||
|
||||
CanReuse = lookupCandidateBaseReg(BaseOffset, FrameSizeAdjust,
|
||||
FRN.getLocalOffset(), MIN, TRI);
|
||||
break;
|
||||
}
|
||||
|
||||
if (!CanReuse) {
|
||||
BaseOffset = PrevBaseOffset;
|
||||
continue;
|
||||
}
|
||||
|
||||
const MachineFunction *MF = MI->getParent()->getParent();
|
||||
const TargetRegisterClass *RC = TRI->getPointerRegClass(*MF);
|
||||
BaseReg = Fn.getRegInfo().createVirtualRegister(RC);
|
||||
|
||||
DEBUG(dbgs() << " Materializing base register " << BaseReg <<
|
||||
" at frame local offset " <<
|
||||
LocalOffsets[FrameIdx] + InstrOffset << "\n");
|
||||
" at frame local offset " << LocalOffset + InstrOffset << "\n");
|
||||
|
||||
// Tell the target to insert the instruction to initialize
|
||||
// the base register.
|
||||
@ -333,10 +356,6 @@ bool LocalStackSlotPass::insertFrameReferenceRegisters(MachineFunction &Fn) {
|
||||
// applied twice.
|
||||
Offset = -InstrOffset;
|
||||
|
||||
int64_t BaseOffset = FrameSizeAdjust + LocalOffsets[FrameIdx] +
|
||||
InstrOffset;
|
||||
BaseRegisters.push_back(
|
||||
std::pair<unsigned, int64_t>(BaseReg, BaseOffset));
|
||||
++NumBaseRegisters;
|
||||
UsedBaseReg = true;
|
||||
}
|
||||
@ -349,8 +368,6 @@ bool LocalStackSlotPass::insertFrameReferenceRegisters(MachineFunction &Fn) {
|
||||
|
||||
++NumReplacements;
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
return UsedBaseReg;
|
||||
}
|
||||
|
@ -1,9 +1,5 @@
|
||||
; RUN: llc < %s -march=ppc64 | FileCheck %s
|
||||
|
||||
; Temporarily XFAIL this test until LSA stops creating single-use
|
||||
; virtual base registers.
|
||||
; XFAIL: *
|
||||
|
||||
%struct.__db_region = type { %struct.__mutex_t, [4 x i8], %struct.anon, i32, [1 x i32] }
|
||||
%struct.__mutex_t = type { i32 }
|
||||
%struct.anon = type { i64, i64 }
|
||||
|
@ -20,8 +20,8 @@ define void @test2() {
|
||||
|
||||
define i32 @test3() {
|
||||
; CHECK: test3:
|
||||
; CHECK: ldr.n r2, LCPI
|
||||
; CHECK: add sp, r2
|
||||
; CHECK: ldr.n r1, LCPI
|
||||
; CHECK: add sp, r1
|
||||
; CHECK: ldr.n r1, LCPI
|
||||
; CHECK: add r1, sp
|
||||
; CHECK: subs r4, r7, #4
|
||||
|
Loading…
Reference in New Issue
Block a user