mirror of
https://github.com/RPCS3/llvm.git
synced 2025-01-16 06:49:58 +00:00
9eb59ec548
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@22520 91177308-0d34-0410-b5e6-96231b3b80d8
285 lines
9.5 KiB
C++
285 lines
9.5 KiB
C++
//===-- SchedPriorities.h - Encapsulate scheduling heuristics -------------===//
|
|
//
|
|
// The LLVM Compiler Infrastructure
|
|
//
|
|
// This file was developed by the LLVM research group and is distributed under
|
|
// the University of Illinois Open Source License. See LICENSE.TXT for details.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
// Strategy:
|
|
// Priority ordering rules:
|
|
// (1) Max delay, which is the order of the heap S.candsAsHeap.
|
|
// (2) Instruction that frees up a register.
|
|
// (3) Instruction that has the maximum number of dependent instructions.
|
|
// Note that rules 2 and 3 are only used if issue conflicts prevent
|
|
// choosing a higher priority instruction by rule 1.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "SchedPriorities.h"
|
|
#include "../LiveVar/FunctionLiveVarInfo.h"
|
|
#include "llvm/CodeGen/MachineBasicBlock.h"
|
|
#include "llvm/Support/CFG.h"
|
|
#include "llvm/ADT/PostOrderIterator.h"
|
|
#include <iostream>
|
|
|
|
namespace llvm {
|
|
|
|
std::ostream &operator<<(std::ostream &os, const NodeDelayPair* nd) {
|
|
return os << "Delay for node " << nd->node->getNodeId()
|
|
<< " = " << (long)nd->delay << "\n";
|
|
}
|
|
|
|
|
|
SchedPriorities::SchedPriorities(const Function *, const SchedGraph *G,
|
|
FunctionLiveVarInfo &LVI)
|
|
: curTime(0), graph(G), methodLiveVarInfo(LVI),
|
|
nodeDelayVec(G->getNumNodes(), INVALID_LATENCY), // make errors obvious
|
|
earliestReadyTimeForNode(G->getNumNodes(), 0),
|
|
earliestReadyTime(0),
|
|
nextToTry(candsAsHeap.begin())
|
|
{
|
|
computeDelays(graph);
|
|
}
|
|
|
|
|
|
void
|
|
SchedPriorities::initialize() {
|
|
initializeReadyHeap(graph);
|
|
}
|
|
|
|
|
|
void
|
|
SchedPriorities::computeDelays(const SchedGraph* graph) {
|
|
po_iterator<const SchedGraph*> poIter = po_begin(graph), poEnd =po_end(graph);
|
|
for ( ; poIter != poEnd; ++poIter) {
|
|
const SchedGraphNode* node = *poIter;
|
|
CycleCount_t nodeDelay;
|
|
if (node->beginOutEdges() == node->endOutEdges())
|
|
nodeDelay = node->getLatency();
|
|
else {
|
|
// Iterate over the out-edges of the node to compute delay
|
|
nodeDelay = 0;
|
|
for (SchedGraphNode::const_iterator E=node->beginOutEdges();
|
|
E != node->endOutEdges(); ++E) {
|
|
CycleCount_t sinkDelay = getNodeDelay((SchedGraphNode*)(*E)->getSink());
|
|
nodeDelay = std::max(nodeDelay, sinkDelay + (*E)->getMinDelay());
|
|
}
|
|
}
|
|
getNodeDelayRef(node) = nodeDelay;
|
|
}
|
|
}
|
|
|
|
|
|
void
|
|
SchedPriorities::initializeReadyHeap(const SchedGraph* graph) {
|
|
const SchedGraphNode* graphRoot = (const SchedGraphNode*)graph->getRoot();
|
|
assert(graphRoot->getMachineInstr() == NULL && "Expect dummy root");
|
|
|
|
// Insert immediate successors of dummy root, which are the actual roots
|
|
sg_succ_const_iterator SEnd = succ_end(graphRoot);
|
|
for (sg_succ_const_iterator S = succ_begin(graphRoot); S != SEnd; ++S)
|
|
this->insertReady(*S);
|
|
|
|
#undef TEST_HEAP_CONVERSION
|
|
#ifdef TEST_HEAP_CONVERSION
|
|
std::cerr << "Before heap conversion:\n";
|
|
copy(candsAsHeap.begin(), candsAsHeap.end(),
|
|
ostream_iterator<NodeDelayPair*>(std::cerr,"\n"));
|
|
#endif
|
|
|
|
candsAsHeap.makeHeap();
|
|
|
|
nextToTry = candsAsHeap.begin();
|
|
|
|
#ifdef TEST_HEAP_CONVERSION
|
|
std::cerr << "After heap conversion:\n";
|
|
copy(candsAsHeap.begin(), candsAsHeap.end(),
|
|
ostream_iterator<NodeDelayPair*>(std::cerr,"\n"));
|
|
#endif
|
|
}
|
|
|
|
void
|
|
SchedPriorities::insertReady(const SchedGraphNode* node) {
|
|
candsAsHeap.insert(node, nodeDelayVec[node->getNodeId()]);
|
|
candsAsSet.insert(node);
|
|
mcands.clear(); // ensure reset choices is called before any more choices
|
|
earliestReadyTime = std::min(earliestReadyTime,
|
|
getEarliestReadyTimeForNode(node));
|
|
|
|
if (SchedDebugLevel >= Sched_PrintSchedTrace) {
|
|
std::cerr << " Node " << node->getNodeId() << " will be ready in Cycle "
|
|
<< getEarliestReadyTimeForNode(node) << "; "
|
|
<< " Delay = " <<(long)getNodeDelay(node) << "; Instruction: \n"
|
|
<< " " << *node->getMachineInstr() << "\n";
|
|
}
|
|
}
|
|
|
|
void
|
|
SchedPriorities::issuedReadyNodeAt(CycleCount_t curTime,
|
|
const SchedGraphNode* node) {
|
|
candsAsHeap.removeNode(node);
|
|
candsAsSet.erase(node);
|
|
mcands.clear(); // ensure reset choices is called before any more choices
|
|
|
|
if (earliestReadyTime == getEarliestReadyTimeForNode(node)) {
|
|
// earliestReadyTime may have been due to this node, so recompute it
|
|
earliestReadyTime = HUGE_LATENCY;
|
|
for (NodeHeap::const_iterator I=candsAsHeap.begin();
|
|
I != candsAsHeap.end(); ++I)
|
|
if (candsAsHeap.getNode(I)) {
|
|
earliestReadyTime =
|
|
std::min(earliestReadyTime,
|
|
getEarliestReadyTimeForNode(candsAsHeap.getNode(I)));
|
|
}
|
|
}
|
|
|
|
// Now update ready times for successors
|
|
for (SchedGraphNode::const_iterator E=node->beginOutEdges();
|
|
E != node->endOutEdges(); ++E) {
|
|
CycleCount_t& etime =
|
|
getEarliestReadyTimeForNodeRef((SchedGraphNode*)(*E)->getSink());
|
|
etime = std::max(etime, curTime + (*E)->getMinDelay());
|
|
}
|
|
}
|
|
|
|
|
|
//----------------------------------------------------------------------
|
|
// Priority ordering rules:
|
|
// (1) Max delay, which is the order of the heap S.candsAsHeap.
|
|
// (2) Instruction that frees up a register.
|
|
// (3) Instruction that has the maximum number of dependent instructions.
|
|
// Note that rules 2 and 3 are only used if issue conflicts prevent
|
|
// choosing a higher priority instruction by rule 1.
|
|
//----------------------------------------------------------------------
|
|
|
|
inline int
|
|
SchedPriorities::chooseByRule1(std::vector<candIndex>& mcands) {
|
|
return (mcands.size() == 1)? 0 // only one choice exists so take it
|
|
: -1; // -1 indicates multiple choices
|
|
}
|
|
|
|
inline int
|
|
SchedPriorities::chooseByRule2(std::vector<candIndex>& mcands) {
|
|
assert(mcands.size() >= 1 && "Should have at least one candidate here.");
|
|
for (unsigned i=0, N = mcands.size(); i < N; i++)
|
|
if (instructionHasLastUse(methodLiveVarInfo,
|
|
candsAsHeap.getNode(mcands[i])))
|
|
return i;
|
|
return -1;
|
|
}
|
|
|
|
inline int
|
|
SchedPriorities::chooseByRule3(std::vector<candIndex>& mcands) {
|
|
assert(mcands.size() >= 1 && "Should have at least one candidate here.");
|
|
int maxUses = candsAsHeap.getNode(mcands[0])->getNumOutEdges();
|
|
int indexWithMaxUses = 0;
|
|
for (unsigned i=1, N = mcands.size(); i < N; i++) {
|
|
int numUses = candsAsHeap.getNode(mcands[i])->getNumOutEdges();
|
|
if (numUses > maxUses) {
|
|
maxUses = numUses;
|
|
indexWithMaxUses = i;
|
|
}
|
|
}
|
|
return indexWithMaxUses;
|
|
}
|
|
|
|
const SchedGraphNode*
|
|
SchedPriorities::getNextHighest(const SchedulingManager& S,
|
|
CycleCount_t curTime) {
|
|
int nextIdx = -1;
|
|
const SchedGraphNode* nextChoice = NULL;
|
|
|
|
if (mcands.size() == 0)
|
|
findSetWithMaxDelay(mcands, S);
|
|
|
|
while (nextIdx < 0 && mcands.size() > 0) {
|
|
nextIdx = chooseByRule1(mcands); // rule 1
|
|
|
|
if (nextIdx == -1)
|
|
nextIdx = chooseByRule2(mcands); // rule 2
|
|
|
|
if (nextIdx == -1)
|
|
nextIdx = chooseByRule3(mcands); // rule 3
|
|
|
|
if (nextIdx == -1)
|
|
nextIdx = 0; // default to first choice by delays
|
|
|
|
// We have found the next best candidate. Check if it ready in
|
|
// the current cycle, and if it is feasible.
|
|
// If not, remove it from mcands and continue. Refill mcands if
|
|
// it becomes empty.
|
|
nextChoice = candsAsHeap.getNode(mcands[nextIdx]);
|
|
if (getEarliestReadyTimeForNode(nextChoice) > curTime
|
|
|| ! instrIsFeasible(S, nextChoice->getMachineInstr()->getOpcode()))
|
|
{
|
|
mcands.erase(mcands.begin() + nextIdx);
|
|
nextIdx = -1;
|
|
if (mcands.size() == 0)
|
|
findSetWithMaxDelay(mcands, S);
|
|
}
|
|
}
|
|
|
|
if (nextIdx >= 0) {
|
|
mcands.erase(mcands.begin() + nextIdx);
|
|
return nextChoice;
|
|
} else
|
|
return NULL;
|
|
}
|
|
|
|
|
|
void
|
|
SchedPriorities::findSetWithMaxDelay(std::vector<candIndex>& mcands,
|
|
const SchedulingManager& S)
|
|
{
|
|
if (mcands.size() == 0 && nextToTry != candsAsHeap.end())
|
|
{ // out of choices at current maximum delay;
|
|
// put nodes with next highest delay in mcands
|
|
candIndex next = nextToTry;
|
|
CycleCount_t maxDelay = candsAsHeap.getDelay(next);
|
|
for (; next != candsAsHeap.end()
|
|
&& candsAsHeap.getDelay(next) == maxDelay; ++next)
|
|
mcands.push_back(next);
|
|
|
|
nextToTry = next;
|
|
|
|
if (SchedDebugLevel >= Sched_PrintSchedTrace) {
|
|
std::cerr << " Cycle " << (long)getTime() << ": "
|
|
<< "Next highest delay = " << (long)maxDelay << " : "
|
|
<< mcands.size() << " Nodes with this delay: ";
|
|
for (unsigned i=0; i < mcands.size(); i++)
|
|
std::cerr << candsAsHeap.getNode(mcands[i])->getNodeId() << ", ";
|
|
std::cerr << "\n";
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
bool
|
|
SchedPriorities::instructionHasLastUse(FunctionLiveVarInfo &LVI,
|
|
const SchedGraphNode* graphNode) {
|
|
const MachineInstr *MI = graphNode->getMachineInstr();
|
|
|
|
hash_map<const MachineInstr*, bool>::const_iterator
|
|
ui = lastUseMap.find(MI);
|
|
if (ui != lastUseMap.end())
|
|
return ui->second;
|
|
|
|
// else check if instruction is a last use and save it in the hash_map
|
|
bool hasLastUse = false;
|
|
const BasicBlock* bb = graphNode->getMachineBasicBlock().getBasicBlock();
|
|
const ValueSet &LVs = LVI.getLiveVarSetBeforeMInst(MI, bb);
|
|
|
|
for (MachineInstr::const_val_op_iterator OI = MI->begin(), OE = MI->end();
|
|
OI != OE; ++OI)
|
|
if (!LVs.count(*OI)) {
|
|
hasLastUse = true;
|
|
break;
|
|
}
|
|
|
|
return lastUseMap[MI] = hasLastUse;
|
|
}
|
|
|
|
} // End llvm namespace
|