mirror of
https://github.com/RPCSX/llvm.git
synced 2024-12-11 21:57:55 +00:00
[PBQP] Tweak spill costs and coalescing benefits
This patch improves how the different costs (register, interference, spill and coalescing) relates together. The assumption is now that: - coalescing (or any other "side effect" of reg alloc) is negative, and instead of being derived from a spill cost, they use the block frequency info. - spill costs are in the [MinSpillCost:+inf( range - register or interference costs are in [0.0:MinSpillCost( or +inf The current MinSpillCost is set to 10.0, which is a random value high enough that the current constraint builders do not need to worry about when settings costs. It would however be worth adding a normalization step for register and interference costs as the last step in the constraint builder chain to ensure they are not greater than SpillMinCost (unless this has some sense for some architectures). This would work well with the current builder pipeline, where all costs are tweaked relatively to each others, but could grow above MinSpillCost if the pipeline is deep enough. The current heuristic is tuned to depend rather on the number of uses of a live interval rather than a density of uses, as used by the greedy allocator. This heuristic provides a few percent improvement on a number of benchmarks (eembc, spec, ...) and will definitely need to change once spill placement is implemented: the current spill placement is really ineficient, so making the cost proportionnal to the number of use is a clear win. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@221292 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
parent
e2463284fc
commit
8025a39d11
@ -30,8 +30,10 @@ namespace llvm {
|
|||||||
/// @param UseDefFreq Expected number of executed use and def instructions
|
/// @param UseDefFreq Expected number of executed use and def instructions
|
||||||
/// per function call. Derived from block frequencies.
|
/// per function call. Derived from block frequencies.
|
||||||
/// @param Size Size of live interval as returnexd by getSize()
|
/// @param Size Size of live interval as returnexd by getSize()
|
||||||
|
/// @param NumInstr Number of instructions using this live interval
|
||||||
///
|
///
|
||||||
static inline float normalizeSpillWeight(float UseDefFreq, unsigned Size) {
|
static inline float normalizeSpillWeight(float UseDefFreq, unsigned Size,
|
||||||
|
unsigned NumInstr) {
|
||||||
// The constant 25 instructions is added to avoid depending too much on
|
// The constant 25 instructions is added to avoid depending too much on
|
||||||
// accidental SlotIndex gaps for small intervals. The effect is that small
|
// accidental SlotIndex gaps for small intervals. The effect is that small
|
||||||
// intervals have a spill weight that is mostly proportional to the number
|
// intervals have a spill weight that is mostly proportional to the number
|
||||||
@ -44,7 +46,7 @@ namespace llvm {
|
|||||||
/// spill weight and allocation hint.
|
/// spill weight and allocation hint.
|
||||||
class VirtRegAuxInfo {
|
class VirtRegAuxInfo {
|
||||||
public:
|
public:
|
||||||
typedef float (*NormalizingFn)(float, unsigned);
|
typedef float (*NormalizingFn)(float, unsigned, unsigned);
|
||||||
|
|
||||||
private:
|
private:
|
||||||
MachineFunction &MF;
|
MachineFunction &MF;
|
||||||
|
@ -100,6 +100,7 @@ VirtRegAuxInfo::calculateSpillWeightAndHint(LiveInterval &li) {
|
|||||||
MachineLoop *loop = nullptr;
|
MachineLoop *loop = nullptr;
|
||||||
bool isExiting = false;
|
bool isExiting = false;
|
||||||
float totalWeight = 0;
|
float totalWeight = 0;
|
||||||
|
unsigned numInstr = 0; // Number of instructions using li
|
||||||
SmallPtrSet<MachineInstr*, 8> visited;
|
SmallPtrSet<MachineInstr*, 8> visited;
|
||||||
|
|
||||||
// Find the best physreg hint and the best virtreg hint.
|
// Find the best physreg hint and the best virtreg hint.
|
||||||
@ -116,6 +117,7 @@ VirtRegAuxInfo::calculateSpillWeightAndHint(LiveInterval &li) {
|
|||||||
I = mri.reg_instr_begin(li.reg), E = mri.reg_instr_end();
|
I = mri.reg_instr_begin(li.reg), E = mri.reg_instr_end();
|
||||||
I != E; ) {
|
I != E; ) {
|
||||||
MachineInstr *mi = &*(I++);
|
MachineInstr *mi = &*(I++);
|
||||||
|
numInstr++;
|
||||||
if (mi->isIdentityCopy() || mi->isImplicitDef() || mi->isDebugValue())
|
if (mi->isIdentityCopy() || mi->isImplicitDef() || mi->isDebugValue())
|
||||||
continue;
|
continue;
|
||||||
if (!visited.insert(mi))
|
if (!visited.insert(mi))
|
||||||
@ -189,5 +191,5 @@ VirtRegAuxInfo::calculateSpillWeightAndHint(LiveInterval &li) {
|
|||||||
if (isRematerializable(li, LIS, *MF.getSubtarget().getInstrInfo()))
|
if (isRematerializable(li, LIS, *MF.getSubtarget().getInstrInfo()))
|
||||||
totalWeight *= 0.5F;
|
totalWeight *= 0.5F;
|
||||||
|
|
||||||
li.weight = normalize(totalWeight, li.getSize());
|
li.weight = normalize(totalWeight, li.getSize(), numInstr);
|
||||||
}
|
}
|
||||||
|
@ -1789,9 +1789,11 @@ unsigned RAGreedy::tryLocalSplit(LiveInterval &VirtReg, AllocationOrder &Order,
|
|||||||
// instructions.
|
// instructions.
|
||||||
//
|
//
|
||||||
// Try to guess the size of the new interval.
|
// Try to guess the size of the new interval.
|
||||||
const float EstWeight = normalizeSpillWeight(blockFreq * (NewGaps + 1),
|
const float EstWeight = normalizeSpillWeight(
|
||||||
Uses[SplitBefore].distance(Uses[SplitAfter]) +
|
blockFreq * (NewGaps + 1),
|
||||||
(LiveBefore + LiveAfter)*SlotIndex::InstrDist);
|
Uses[SplitBefore].distance(Uses[SplitAfter]) +
|
||||||
|
(LiveBefore + LiveAfter) * SlotIndex::InstrDist,
|
||||||
|
1);
|
||||||
// Would this split be possible to allocate?
|
// Would this split be possible to allocate?
|
||||||
// Never allocate all gaps, we wouldn't be making progress.
|
// Never allocate all gaps, we wouldn't be making progress.
|
||||||
DEBUG(dbgs() << " w=" << EstWeight);
|
DEBUG(dbgs() << " w=" << EstWeight);
|
||||||
|
@ -150,11 +150,17 @@ public:
|
|||||||
void apply(PBQPRAGraph &G) override {
|
void apply(PBQPRAGraph &G) override {
|
||||||
LiveIntervals &LIS = G.getMetadata().LIS;
|
LiveIntervals &LIS = G.getMetadata().LIS;
|
||||||
|
|
||||||
|
// A minimum spill costs, so that register constraints can can be set
|
||||||
|
// without normalization in the [0.0:MinSpillCost( interval.
|
||||||
|
const PBQP::PBQPNum MinSpillCost = 10.0;
|
||||||
|
|
||||||
for (auto NId : G.nodeIds()) {
|
for (auto NId : G.nodeIds()) {
|
||||||
PBQP::PBQPNum SpillCost =
|
PBQP::PBQPNum SpillCost =
|
||||||
LIS.getInterval(G.getNodeMetadata(NId).getVReg()).weight;
|
LIS.getInterval(G.getNodeMetadata(NId).getVReg()).weight;
|
||||||
if (SpillCost == 0.0)
|
if (SpillCost == 0.0)
|
||||||
SpillCost = std::numeric_limits<PBQP::PBQPNum>::min();
|
SpillCost = std::numeric_limits<PBQP::PBQPNum>::min();
|
||||||
|
else
|
||||||
|
SpillCost += MinSpillCost;
|
||||||
PBQPRAGraph::RawVector NodeCosts(G.getNodeCosts(NId));
|
PBQPRAGraph::RawVector NodeCosts(G.getNodeCosts(NId));
|
||||||
NodeCosts[PBQP::RegAlloc::getSpillOptionIdx()] = SpillCost;
|
NodeCosts[PBQP::RegAlloc::getSpillOptionIdx()] = SpillCost;
|
||||||
G.setNodeCosts(NId, std::move(NodeCosts));
|
G.setNodeCosts(NId, std::move(NodeCosts));
|
||||||
@ -350,11 +356,8 @@ public:
|
|||||||
unsigned DstReg = CP.getDstReg();
|
unsigned DstReg = CP.getDstReg();
|
||||||
unsigned SrcReg = CP.getSrcReg();
|
unsigned SrcReg = CP.getSrcReg();
|
||||||
|
|
||||||
const float CopyFactor = 0.5; // Cost of copy relative to load. Current
|
const float Scale = 1.0f / MBFI.getEntryFreq();
|
||||||
// value plucked randomly out of the air.
|
PBQP::PBQPNum CBenefit = MBFI.getBlockFreq(&MBB).getFrequency() * Scale;
|
||||||
|
|
||||||
PBQP::PBQPNum CBenefit =
|
|
||||||
CopyFactor * LiveIntervals::getSpillWeight(false, true, &MBFI, &MI);
|
|
||||||
|
|
||||||
if (CP.isPhys()) {
|
if (CP.isPhys()) {
|
||||||
if (!MF.getRegInfo().isAllocatable(DstReg))
|
if (!MF.getRegInfo().isAllocatable(DstReg))
|
||||||
@ -607,12 +610,20 @@ void RegAllocPBQP::finalizeAlloc(MachineFunction &MF,
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
static inline float normalizePBQPSpillWeight(float UseDefFreq, unsigned Size,
|
||||||
|
unsigned NumInstr) {
|
||||||
|
// All intervals have a spill weight that is mostly proportional to the number
|
||||||
|
// of uses, with uses in loops having a bigger weight.
|
||||||
|
return NumInstr * normalizeSpillWeight(UseDefFreq, Size, 1);
|
||||||
|
}
|
||||||
|
|
||||||
bool RegAllocPBQP::runOnMachineFunction(MachineFunction &MF) {
|
bool RegAllocPBQP::runOnMachineFunction(MachineFunction &MF) {
|
||||||
LiveIntervals &LIS = getAnalysis<LiveIntervals>();
|
LiveIntervals &LIS = getAnalysis<LiveIntervals>();
|
||||||
MachineBlockFrequencyInfo &MBFI =
|
MachineBlockFrequencyInfo &MBFI =
|
||||||
getAnalysis<MachineBlockFrequencyInfo>();
|
getAnalysis<MachineBlockFrequencyInfo>();
|
||||||
|
|
||||||
calculateSpillWeightsAndHints(LIS, MF, getAnalysis<MachineLoopInfo>(), MBFI);
|
calculateSpillWeightsAndHints(LIS, MF, getAnalysis<MachineLoopInfo>(), MBFI,
|
||||||
|
normalizePBQPSpillWeight);
|
||||||
|
|
||||||
VirtRegMap &VRM = getAnalysis<VirtRegMap>();
|
VirtRegMap &VRM = getAnalysis<VirtRegMap>();
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user