mirror of
https://github.com/RPCSX/llvm.git
synced 2024-12-05 02:16:46 +00:00
63e04f3ccb
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@5859 91177308-0d34-0410-b5e6-96231b3b80d8
1347 lines
43 KiB
C++
1347 lines
43 KiB
C++
//===- ModuloSchedGraph.cpp - Graph datastructure for Modulo Scheduling ---===//
|
|
//
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "llvm/CodeGen/InstrSelection.h"
|
|
#include "llvm/Function.h"
|
|
#include "llvm/Instructions.h"
|
|
#include "llvm/Type.h"
|
|
#include "llvm/CodeGen/MachineCodeForInstruction.h"
|
|
#include "llvm/CodeGen/MachineInstr.h"
|
|
#include "llvm/Target/TargetSchedInfo.h"
|
|
#include "Support/StringExtras.h"
|
|
#include "Support/STLExtras.h"
|
|
#include "Support/hash_map"
|
|
#include "Support/Statistic.h"
|
|
#include "ModuloScheduling.h"
|
|
#include "ModuloSchedGraph.h"
|
|
#include <algorithm>
|
|
#include <ostream>
|
|
#include <vector>
|
|
// FIXME: Should be using #include <cmath>
|
|
#include <math.h>
|
|
//#include <swig.h>
|
|
|
|
#define UNIDELAY 1
|
|
|
|
//*********************** Internal Data Structures *************************/
|
|
|
|
// The following two types need to be classes, not typedefs, so we can use
|
|
// opaque declarations in SchedGraph.h
|
|
//
|
|
struct RefVec:public std::vector<std::pair<ModuloSchedGraphNode*,int> > {
|
|
typedef std::vector<std::pair<ModuloSchedGraphNode*,
|
|
int> >::iterator iterator;
|
|
typedef std::vector<std::pair<ModuloSchedGraphNode*,
|
|
int> >::const_iterator const_iterator;
|
|
};
|
|
|
|
struct RegToRefVecMap:public hash_map<int,RefVec> {
|
|
typedef hash_map<int,RefVec>::iterator iterator;
|
|
typedef hash_map<int,RefVec>::const_iterator const_iterator;
|
|
};
|
|
|
|
struct ValueToDefVecMap:public hash_map<const Instruction*,RefVec> {
|
|
typedef hash_map<const Instruction*, RefVec>::iterator iterator;
|
|
typedef hash_map<const Instruction*,
|
|
RefVec>::const_iterator const_iterator;
|
|
};
|
|
|
|
// class Modulo SchedGraphNode
|
|
|
|
ModuloSchedGraphNode::ModuloSchedGraphNode(unsigned int _nodeId,
|
|
const BasicBlock * _bb,
|
|
const Instruction * _inst,
|
|
int indexInBB,
|
|
const TargetMachine & target)
|
|
:SchedGraphNodeCommon(_nodeId, _bb, indexInBB), inst(_inst)
|
|
{
|
|
if (inst) {
|
|
//FIXME: find the latency
|
|
//currently setthe latency to zero
|
|
latency = 0;
|
|
}
|
|
}
|
|
|
|
//class ModuloScheGraph
|
|
|
|
void ModuloSchedGraph::addDummyEdges()
|
|
{
|
|
assert(graphRoot->outEdges.size() == 0);
|
|
|
|
for (const_iterator I = begin(); I != end(); ++I) {
|
|
ModuloSchedGraphNode *node = (ModuloSchedGraphNode *) ((*I).second);
|
|
assert(node != graphRoot && node != graphLeaf);
|
|
if (node->beginInEdges() == node->endInEdges())
|
|
(void) new SchedGraphEdge(graphRoot, node, SchedGraphEdge::CtrlDep,
|
|
SchedGraphEdge::NonDataDep, 0);
|
|
if (node->beginOutEdges() == node->endOutEdges())
|
|
(void) new SchedGraphEdge(node, graphLeaf, SchedGraphEdge::CtrlDep,
|
|
SchedGraphEdge::NonDataDep, 0);
|
|
}
|
|
}
|
|
|
|
bool isDefinition(const Instruction *I)
|
|
{
|
|
//if(TerminatorInst::classof(I)||FreeInst::classof(I) || StoreInst::classof(I) || CallInst::classof(I))
|
|
if (!I->hasName())
|
|
return false;
|
|
else
|
|
return true;
|
|
}
|
|
|
|
void ModuloSchedGraph::addDefUseEdges(const BasicBlock *bb)
|
|
{
|
|
//collect def instructions, store them in vector
|
|
// const TargetInstrInfo& mii = target.getInstrInfo();
|
|
const TargetInstrInfo & mii = target.getInstrInfo();
|
|
|
|
typedef std::vector < ModuloSchedGraphNode * >DefVec;
|
|
DefVec defVec;
|
|
|
|
//find those def instructions
|
|
for (BasicBlock::const_iterator I = bb->begin(), E = bb->end(); I != E; ++I) {
|
|
if (I->getType() != Type::VoidTy) {
|
|
defVec.push_back(this->getGraphNodeForInst(I));
|
|
}
|
|
}
|
|
|
|
for (unsigned int i = 0; i < defVec.size(); i++) {
|
|
for (Value::use_const_iterator I = defVec[i]->getInst()->use_begin();
|
|
I != defVec[i]->getInst()->use_end(); I++) {
|
|
//for each use of a def, add a flow edge from the def instruction to the
|
|
//ref instruction
|
|
|
|
const Instruction *value = defVec[i]->getInst();
|
|
Instruction *inst = (Instruction *) (*I);
|
|
ModuloSchedGraphNode *node = NULL;
|
|
|
|
for (BasicBlock::const_iterator I = bb->begin(), E = bb->end();
|
|
I != E; ++I)
|
|
if ((const Instruction *) I == inst) {
|
|
node = (*this)[inst];
|
|
break;
|
|
}
|
|
|
|
assert(inst != NULL && " Use not an Instruction ?");
|
|
|
|
if (node == NULL) //inst is not an instruction in this block
|
|
{
|
|
} else {
|
|
// Add a flow edge from the def instruction to the ref instruction
|
|
|
|
// self loop will not happen in SSA form
|
|
assert(defVec[i] != node && "same node?");
|
|
|
|
// This is a true dependence, so the delay is equal to the delay of the
|
|
// pred node.
|
|
int delay = 0;
|
|
MachineCodeForInstruction & tempMvec =
|
|
MachineCodeForInstruction::get(value);
|
|
for (unsigned j = 0; j < tempMvec.size(); j++) {
|
|
MachineInstr *temp = tempMvec[j];
|
|
//delay +=mii.minLatency(temp->getOpCode());
|
|
delay = std::max(delay, mii.minLatency(temp->getOpCode()));
|
|
}
|
|
|
|
SchedGraphEdge *trueEdge =
|
|
new SchedGraphEdge(defVec[i], node, value,
|
|
SchedGraphEdge::TrueDep, delay);
|
|
|
|
// if the ref instruction is before the def instrution
|
|
// then the def instruction must be a phi instruction
|
|
// add an anti-dependence edge to from the ref instruction to the def
|
|
// instruction
|
|
if (node->getOrigIndexInBB() < defVec[i]->getOrigIndexInBB()) {
|
|
assert(PHINode::classof(inst)
|
|
&& "the ref instruction befre def is not PHINode?");
|
|
trueEdge->setIteDiff(1);
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
}
|
|
}
|
|
|
|
void ModuloSchedGraph::addCDEdges(const BasicBlock * bb) {
|
|
// find the last instruction in the basic block
|
|
// see if it is an branch instruction.
|
|
// If yes, then add an edge from each node expcept the last node to the last
|
|
// node
|
|
const Instruction *inst = &(bb->back());
|
|
ModuloSchedGraphNode *lastNode = (*this)[inst];
|
|
if (TerminatorInst::classof(inst))
|
|
for (BasicBlock::const_iterator I = bb->begin(), E = bb->end(); I != E;
|
|
I++) {
|
|
if (inst != I) {
|
|
ModuloSchedGraphNode *node = (*this)[I];
|
|
//use latency of 0
|
|
(void) new SchedGraphEdge(node, lastNode, SchedGraphEdge::CtrlDep,
|
|
SchedGraphEdge::NonDataDep, 0);
|
|
}
|
|
|
|
}
|
|
}
|
|
|
|
static const int SG_LOAD_REF = 0;
|
|
static const int SG_STORE_REF = 1;
|
|
static const int SG_CALL_REF = 2;
|
|
|
|
static const unsigned int SG_DepOrderArray[][3] = {
|
|
{SchedGraphEdge::NonDataDep,
|
|
SchedGraphEdge::AntiDep,
|
|
SchedGraphEdge::AntiDep},
|
|
{SchedGraphEdge::TrueDep,
|
|
SchedGraphEdge::OutputDep,
|
|
SchedGraphEdge::TrueDep | SchedGraphEdge::OutputDep},
|
|
{SchedGraphEdge::TrueDep,
|
|
SchedGraphEdge::AntiDep | SchedGraphEdge::OutputDep,
|
|
SchedGraphEdge::TrueDep | SchedGraphEdge::AntiDep
|
|
| SchedGraphEdge::OutputDep}
|
|
};
|
|
|
|
|
|
// Add a dependence edge between every pair of machine load/store/call
|
|
// instructions, where at least one is a store or a call.
|
|
// Use latency 1 just to ensure that memory operations are ordered;
|
|
// latency does not otherwise matter (true dependences enforce that).
|
|
//
|
|
void ModuloSchedGraph::addMemEdges(const BasicBlock * bb) {
|
|
|
|
std::vector<ModuloSchedGraphNode*> memNodeVec;
|
|
|
|
//construct the memNodeVec
|
|
for (BasicBlock::const_iterator I = bb->begin(), E = bb->end(); I != E; ++I) {
|
|
if (LoadInst::classof(I) || StoreInst::classof(I)
|
|
|| CallInst::classof(I)) {
|
|
ModuloSchedGraphNode *node = (*this)[(const Instruction *) I];
|
|
memNodeVec.push_back(node);
|
|
}
|
|
}
|
|
|
|
// Instructions in memNodeVec are in execution order within the basic block,
|
|
// so simply look at all pairs <memNodeVec[i], memNodeVec[j: j > i]>.
|
|
//
|
|
for (unsigned im = 0, NM = memNodeVec.size(); im < NM; im++) {
|
|
const Instruction *fromInst = memNodeVec[im]->getInst();
|
|
int fromType = CallInst::classof(fromInst) ? SG_CALL_REF
|
|
: LoadInst::classof(fromInst) ? SG_LOAD_REF : SG_STORE_REF;
|
|
for (unsigned jm = im + 1; jm < NM; jm++) {
|
|
const Instruction *toInst = memNodeVec[jm]->getInst();
|
|
int toType = CallInst::classof(toInst) ? SG_CALL_REF
|
|
: LoadInst::classof(toInst) ? SG_LOAD_REF : SG_STORE_REF;
|
|
if (fromType != SG_LOAD_REF || toType != SG_LOAD_REF) {
|
|
(void) new SchedGraphEdge(memNodeVec[im], memNodeVec[jm],
|
|
SchedGraphEdge::MemoryDep,
|
|
SG_DepOrderArray[fromType][toType], 1);
|
|
|
|
SchedGraphEdge *edge =
|
|
new SchedGraphEdge(memNodeVec[jm], memNodeVec[im],
|
|
SchedGraphEdge::MemoryDep,
|
|
SG_DepOrderArray[toType][fromType], 1);
|
|
edge->setIteDiff(1);
|
|
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
|
|
void ModuloSchedGraph::buildNodesforBB(const TargetMachine &target,
|
|
const BasicBlock *bb,
|
|
std::vector<ModuloSchedGraphNode*> &memNode,
|
|
RegToRefVecMap ®ToRefVecMap,
|
|
ValueToDefVecMap &valueToDefVecMap)
|
|
{
|
|
//const TargetInstrInfo& mii=target.getInstrInfo();
|
|
|
|
//Build graph nodes for each LLVM instruction and gather def/use info.
|
|
//Do both together in a single pass over all machine instructions.
|
|
|
|
int i = 0;
|
|
for (BasicBlock::const_iterator I = bb->begin(), E = bb->end(); I != E;
|
|
++I) {
|
|
ModuloSchedGraphNode *node =
|
|
new ModuloSchedGraphNode(getNumNodes(), bb, I, i, target);
|
|
i++;
|
|
this->noteModuloSchedGraphNodeForInst(I, node);
|
|
}
|
|
|
|
//this function finds some info about instruction in basic block for later use
|
|
//findDefUseInfoAtInstr(target, node,
|
|
//memNode,regToRefVecMap,valueToDefVecMap);
|
|
}
|
|
|
|
|
|
bool ModuloSchedGraph::isLoop(const BasicBlock *bb) {
|
|
//only if the last instruction in the basicblock is branch instruction and
|
|
//there is at least an option to branch itself
|
|
|
|
const Instruction *inst = &(bb->back());
|
|
if (BranchInst::classof(inst)) {
|
|
for (unsigned i = 0; i < ((BranchInst *) inst)->getNumSuccessors();
|
|
i++) {
|
|
BasicBlock *sb = ((BranchInst *) inst)->getSuccessor(i);
|
|
if (sb == bb)
|
|
return true;
|
|
}
|
|
}
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
bool ModuloSchedGraph::isLoop() {
|
|
//only if the last instruction in the basicblock is branch instruction and
|
|
//there is at least an option to branch itself
|
|
|
|
assert(bbVec.size() == 1 && "only 1 basicblock in a graph");
|
|
const BasicBlock *bb = bbVec[0];
|
|
const Instruction *inst = &(bb->back());
|
|
if (BranchInst::classof(inst))
|
|
for (unsigned i = 0; i < ((BranchInst *) inst)->getNumSuccessors();
|
|
i++) {
|
|
BasicBlock *sb = ((BranchInst *) inst)->getSuccessor(i);
|
|
if (sb == bb)
|
|
return true;
|
|
}
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
void ModuloSchedGraph::computeNodeASAP(const BasicBlock *bb) {
|
|
|
|
//FIXME: now assume the only backward edges come from the edges from other
|
|
//nodes to the phi Node so i will ignore all edges to the phi node; after
|
|
//this, there shall be no recurrence.
|
|
|
|
unsigned numNodes = bb->size();
|
|
for (unsigned i = 2; i < numNodes + 2; i++) {
|
|
ModuloSchedGraphNode *node = getNode(i);
|
|
node->setPropertyComputed(false);
|
|
}
|
|
|
|
for (unsigned i = 2; i < numNodes + 2; i++) {
|
|
ModuloSchedGraphNode *node = getNode(i);
|
|
node->ASAP = 0;
|
|
if (i == 2 || node->getNumInEdges() == 0) {
|
|
node->setPropertyComputed(true);
|
|
continue;
|
|
}
|
|
for (ModuloSchedGraphNode::const_iterator I = node->beginInEdges(), E =
|
|
node->endInEdges(); I != E; I++) {
|
|
SchedGraphEdge *edge = *I;
|
|
ModuloSchedGraphNode *pred =
|
|
(ModuloSchedGraphNode *) (edge->getSrc());
|
|
assert(pred->getPropertyComputed()
|
|
&& "pred node property is not computed!");
|
|
int temp =
|
|
pred->ASAP + edge->getMinDelay() -
|
|
edge->getIteDiff() * this->MII;
|
|
node->ASAP = std::max(node->ASAP, temp);
|
|
}
|
|
node->setPropertyComputed(true);
|
|
}
|
|
}
|
|
|
|
void ModuloSchedGraph::computeNodeALAP(const BasicBlock *bb) {
|
|
unsigned numNodes = bb->size();
|
|
int maxASAP = 0;
|
|
for (unsigned i = numNodes + 1; i >= 2; i--) {
|
|
ModuloSchedGraphNode *node = getNode(i);
|
|
node->setPropertyComputed(false);
|
|
//cerr<< " maxASAP= " <<maxASAP<<" node->ASAP= "<< node->ASAP<<"\n";
|
|
maxASAP = std::max(maxASAP, node->ASAP);
|
|
}
|
|
|
|
//cerr<<"maxASAP is "<<maxASAP<<"\n";
|
|
|
|
for (unsigned i = numNodes + 1; i >= 2; i--) {
|
|
ModuloSchedGraphNode *node = getNode(i);
|
|
node->ALAP = maxASAP;
|
|
for (ModuloSchedGraphNode::const_iterator I =
|
|
node->beginOutEdges(), E = node->endOutEdges(); I != E; I++) {
|
|
SchedGraphEdge *edge = *I;
|
|
ModuloSchedGraphNode *succ =
|
|
(ModuloSchedGraphNode *) (edge->getSink());
|
|
if (PHINode::classof(succ->getInst()))
|
|
continue;
|
|
assert(succ->getPropertyComputed()
|
|
&& "succ node property is not computed!");
|
|
int temp =
|
|
succ->ALAP - edge->getMinDelay() +
|
|
edge->getIteDiff() * this->MII;
|
|
node->ALAP = std::min(node->ALAP, temp);
|
|
}
|
|
node->setPropertyComputed(true);
|
|
}
|
|
}
|
|
|
|
void ModuloSchedGraph::computeNodeMov(const BasicBlock *bb)
|
|
{
|
|
unsigned numNodes = bb->size();
|
|
for (unsigned i = 2; i < numNodes + 2; i++) {
|
|
ModuloSchedGraphNode *node = getNode(i);
|
|
node->mov = node->ALAP - node->ASAP;
|
|
assert(node->mov >= 0
|
|
&& "move freedom for this node is less than zero? ");
|
|
}
|
|
}
|
|
|
|
|
|
void ModuloSchedGraph::computeNodeDepth(const BasicBlock * bb)
|
|
{
|
|
|
|
unsigned numNodes = bb->size();
|
|
for (unsigned i = 2; i < numNodes + 2; i++) {
|
|
ModuloSchedGraphNode *node = getNode(i);
|
|
node->setPropertyComputed(false);
|
|
}
|
|
|
|
for (unsigned i = 2; i < numNodes + 2; i++) {
|
|
ModuloSchedGraphNode *node = getNode(i);
|
|
node->depth = 0;
|
|
if (i == 2 || node->getNumInEdges() == 0) {
|
|
node->setPropertyComputed(true);
|
|
continue;
|
|
}
|
|
for (ModuloSchedGraphNode::const_iterator I = node->beginInEdges(), E =
|
|
node->endInEdges(); I != E; I++) {
|
|
SchedGraphEdge *edge = *I;
|
|
ModuloSchedGraphNode *pred =
|
|
(ModuloSchedGraphNode *) (edge->getSrc());
|
|
assert(pred->getPropertyComputed()
|
|
&& "pred node property is not computed!");
|
|
int temp = pred->depth + edge->getMinDelay();
|
|
node->depth = std::max(node->depth, temp);
|
|
}
|
|
node->setPropertyComputed(true);
|
|
}
|
|
|
|
}
|
|
|
|
|
|
void ModuloSchedGraph::computeNodeHeight(const BasicBlock *bb)
|
|
{
|
|
unsigned numNodes = bb->size();
|
|
for (unsigned i = numNodes + 1; i >= 2; i--) {
|
|
ModuloSchedGraphNode *node = getNode(i);
|
|
node->setPropertyComputed(false);
|
|
}
|
|
|
|
for (unsigned i = numNodes + 1; i >= 2; i--) {
|
|
ModuloSchedGraphNode *node = getNode(i);
|
|
node->height = 0;
|
|
for (ModuloSchedGraphNode::const_iterator I =
|
|
node->beginOutEdges(), E = node->endOutEdges(); I != E; ++I) {
|
|
SchedGraphEdge *edge = *I;
|
|
ModuloSchedGraphNode *succ =
|
|
(ModuloSchedGraphNode *) (edge->getSink());
|
|
if (PHINode::classof(succ->getInst()))
|
|
continue;
|
|
assert(succ->getPropertyComputed()
|
|
&& "succ node property is not computed!");
|
|
node->height = std::max(node->height, succ->height + edge->getMinDelay());
|
|
|
|
}
|
|
node->setPropertyComputed(true);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
void ModuloSchedGraph::computeNodeProperty(const BasicBlock * bb)
|
|
{
|
|
//FIXME: now assume the only backward edges come from the edges from other
|
|
//nodes to the phi Node so i will ignore all edges to the phi node; after
|
|
//this, there shall be no recurrence.
|
|
|
|
this->computeNodeASAP(bb);
|
|
this->computeNodeALAP(bb);
|
|
this->computeNodeMov(bb);
|
|
this->computeNodeDepth(bb);
|
|
this->computeNodeHeight(bb);
|
|
}
|
|
|
|
|
|
//do not consider the backedge in these two functions:
|
|
// i.e. don't consider the edge with destination in phi node
|
|
std::vector<ModuloSchedGraphNode*>
|
|
ModuloSchedGraph::predSet(std::vector<ModuloSchedGraphNode*> set,
|
|
unsigned backEdgeSrc,
|
|
unsigned
|
|
backEdgeSink)
|
|
{
|
|
std::vector<ModuloSchedGraphNode*> predS;
|
|
for (unsigned i = 0; i < set.size(); i++) {
|
|
ModuloSchedGraphNode *node = set[i];
|
|
for (ModuloSchedGraphNode::const_iterator I = node->beginInEdges(), E =
|
|
node->endInEdges(); I != E; I++) {
|
|
SchedGraphEdge *edge = *I;
|
|
if (edge->getSrc()->getNodeId() == backEdgeSrc
|
|
&& edge->getSink()->getNodeId() == backEdgeSink)
|
|
continue;
|
|
ModuloSchedGraphNode *pred =
|
|
(ModuloSchedGraphNode *) (edge->getSrc());
|
|
//if pred is not in the predSet, push it in vector
|
|
bool alreadyInset = false;
|
|
for (unsigned j = 0; j < predS.size(); ++j)
|
|
if (predS[j]->getNodeId() == pred->getNodeId()) {
|
|
alreadyInset = true;
|
|
break;
|
|
}
|
|
|
|
for (unsigned j = 0; j < set.size(); ++j)
|
|
if (set[j]->getNodeId() == pred->getNodeId()) {
|
|
alreadyInset = true;
|
|
break;
|
|
}
|
|
|
|
if (!alreadyInset)
|
|
predS.push_back(pred);
|
|
}
|
|
}
|
|
return predS;
|
|
}
|
|
|
|
ModuloSchedGraph::NodeVec ModuloSchedGraph::predSet(NodeVec set)
|
|
{
|
|
//node number increases from 2
|
|
return predSet(set, 0, 0);
|
|
}
|
|
|
|
std::vector <ModuloSchedGraphNode*>
|
|
ModuloSchedGraph::predSet(ModuloSchedGraphNode *_node,
|
|
unsigned backEdgeSrc, unsigned backEdgeSink)
|
|
{
|
|
std::vector<ModuloSchedGraphNode*> set;
|
|
set.push_back(_node);
|
|
return predSet(set, backEdgeSrc, backEdgeSink);
|
|
}
|
|
|
|
std::vector <ModuloSchedGraphNode*>
|
|
ModuloSchedGraph::predSet(ModuloSchedGraphNode * _node)
|
|
{
|
|
return predSet(_node, 0, 0);
|
|
}
|
|
|
|
std::vector<ModuloSchedGraphNode*>
|
|
ModuloSchedGraph::succSet(std::vector<ModuloSchedGraphNode*> set,
|
|
unsigned src, unsigned sink)
|
|
{
|
|
std::vector<ModuloSchedGraphNode*> succS;
|
|
for (unsigned i = 0; i < set.size(); i++) {
|
|
ModuloSchedGraphNode *node = set[i];
|
|
for (ModuloSchedGraphNode::const_iterator I =
|
|
node->beginOutEdges(), E = node->endOutEdges(); I != E; I++) {
|
|
SchedGraphEdge *edge = *I;
|
|
if (edge->getSrc()->getNodeId() == src
|
|
&& edge->getSink()->getNodeId() == sink)
|
|
continue;
|
|
ModuloSchedGraphNode *succ =
|
|
(ModuloSchedGraphNode *) (edge->getSink());
|
|
//if pred is not in the predSet, push it in vector
|
|
bool alreadyInset = false;
|
|
for (unsigned j = 0; j < succS.size(); j++)
|
|
if (succS[j]->getNodeId() == succ->getNodeId()) {
|
|
alreadyInset = true;
|
|
break;
|
|
}
|
|
|
|
for (unsigned j = 0; j < set.size(); j++)
|
|
if (set[j]->getNodeId() == succ->getNodeId()) {
|
|
alreadyInset = true;
|
|
break;
|
|
}
|
|
if (!alreadyInset)
|
|
succS.push_back(succ);
|
|
}
|
|
}
|
|
return succS;
|
|
}
|
|
|
|
ModuloSchedGraph::NodeVec ModuloSchedGraph::succSet(NodeVec set)
|
|
{
|
|
return succSet(set, 0, 0);
|
|
}
|
|
|
|
|
|
std::vector<ModuloSchedGraphNode*>
|
|
ModuloSchedGraph::succSet(ModuloSchedGraphNode *_node,
|
|
unsigned src, unsigned sink)
|
|
{
|
|
std::vector<ModuloSchedGraphNode*>set;
|
|
set.push_back(_node);
|
|
return succSet(set, src, sink);
|
|
}
|
|
|
|
std::vector<ModuloSchedGraphNode*>
|
|
ModuloSchedGraph::succSet(ModuloSchedGraphNode * _node)
|
|
{
|
|
return succSet(_node, 0, 0);
|
|
}
|
|
|
|
SchedGraphEdge *ModuloSchedGraph::getMaxDelayEdge(unsigned srcId,
|
|
unsigned sinkId)
|
|
{
|
|
ModuloSchedGraphNode *node = getNode(srcId);
|
|
SchedGraphEdge *maxDelayEdge = NULL;
|
|
int maxDelay = -1;
|
|
for (ModuloSchedGraphNode::const_iterator I = node->beginOutEdges(), E =
|
|
node->endOutEdges(); I != E; I++) {
|
|
SchedGraphEdge *edge = *I;
|
|
if (edge->getSink()->getNodeId() == sinkId)
|
|
if (edge->getMinDelay() > maxDelay) {
|
|
maxDelayEdge = edge;
|
|
maxDelay = edge->getMinDelay();
|
|
}
|
|
}
|
|
assert(maxDelayEdge != NULL && "no edge between the srcId and sinkId?");
|
|
return maxDelayEdge;
|
|
}
|
|
|
|
void ModuloSchedGraph::dumpCircuits()
|
|
{
|
|
DEBUG(std::cerr << "dumping circuits for graph:\n");
|
|
int j = -1;
|
|
while (circuits[++j][0] != 0) {
|
|
int k = -1;
|
|
while (circuits[j][++k] != 0)
|
|
DEBUG(std::cerr << circuits[j][k] << "\t");
|
|
DEBUG(std::cerr << "\n");
|
|
}
|
|
}
|
|
|
|
void ModuloSchedGraph::dumpSet(std::vector < ModuloSchedGraphNode * >set)
|
|
{
|
|
for (unsigned i = 0; i < set.size(); i++)
|
|
DEBUG(std::cerr << set[i]->getNodeId() << "\t");
|
|
DEBUG(std::cerr << "\n");
|
|
}
|
|
|
|
std::vector<ModuloSchedGraphNode*>
|
|
ModuloSchedGraph::vectorUnion(std::vector<ModuloSchedGraphNode*> set1,
|
|
std::vector<ModuloSchedGraphNode*> set2)
|
|
{
|
|
std::vector<ModuloSchedGraphNode*> unionVec;
|
|
for (unsigned i = 0; i < set1.size(); i++)
|
|
unionVec.push_back(set1[i]);
|
|
for (unsigned j = 0; j < set2.size(); j++) {
|
|
bool inset = false;
|
|
for (unsigned i = 0; i < unionVec.size(); i++)
|
|
if (set2[j] == unionVec[i])
|
|
inset = true;
|
|
if (!inset)
|
|
unionVec.push_back(set2[j]);
|
|
}
|
|
return unionVec;
|
|
}
|
|
|
|
std::vector<ModuloSchedGraphNode*>
|
|
ModuloSchedGraph::vectorConj(std::vector<ModuloSchedGraphNode*> set1,
|
|
std::vector<ModuloSchedGraphNode*> set2)
|
|
{
|
|
std::vector<ModuloSchedGraphNode*> conjVec;
|
|
for (unsigned i = 0; i < set1.size(); i++)
|
|
for (unsigned j = 0; j < set2.size(); j++)
|
|
if (set1[i] == set2[j])
|
|
conjVec.push_back(set1[i]);
|
|
return conjVec;
|
|
}
|
|
|
|
ModuloSchedGraph::NodeVec ModuloSchedGraph::vectorSub(NodeVec set1,
|
|
NodeVec set2)
|
|
{
|
|
NodeVec newVec;
|
|
for (NodeVec::iterator I = set1.begin(); I != set1.end(); I++) {
|
|
bool inset = false;
|
|
for (NodeVec::iterator II = set2.begin(); II != set2.end(); II++)
|
|
if ((*I)->getNodeId() == (*II)->getNodeId()) {
|
|
inset = true;
|
|
break;
|
|
}
|
|
if (!inset)
|
|
newVec.push_back(*I);
|
|
}
|
|
return newVec;
|
|
}
|
|
|
|
void ModuloSchedGraph::orderNodes() {
|
|
oNodes.clear();
|
|
|
|
std::vector < ModuloSchedGraphNode * >set;
|
|
const BasicBlock *bb = bbVec[0];
|
|
unsigned numNodes = bb->size();
|
|
|
|
// first order all the sets
|
|
int j = -1;
|
|
int totalDelay = -1;
|
|
int preDelay = -1;
|
|
while (circuits[++j][0] != 0) {
|
|
int k = -1;
|
|
preDelay = totalDelay;
|
|
|
|
while (circuits[j][++k] != 0) {
|
|
ModuloSchedGraphNode *node = getNode(circuits[j][k]);
|
|
unsigned nextNodeId;
|
|
nextNodeId =
|
|
circuits[j][k + 1] != 0 ? circuits[j][k + 1] : circuits[j][0];
|
|
SchedGraphEdge *edge = getMaxDelayEdge(circuits[j][k], nextNodeId);
|
|
totalDelay += edge->getMinDelay();
|
|
}
|
|
if (preDelay != -1 && totalDelay > preDelay) {
|
|
// swap circuits[j][] and cuicuits[j-1][]
|
|
unsigned temp[MAXNODE];
|
|
for (int k = 0; k < MAXNODE; k++) {
|
|
temp[k] = circuits[j - 1][k];
|
|
circuits[j - 1][k] = circuits[j][k];
|
|
circuits[j][k] = temp[k];
|
|
}
|
|
//restart
|
|
j = -1;
|
|
}
|
|
}
|
|
|
|
// build the first set
|
|
int backEdgeSrc;
|
|
int backEdgeSink;
|
|
if (ModuloScheduling::printScheduleProcess())
|
|
DEBUG(std::cerr << "building the first set" << "\n");
|
|
int setSeq = -1;
|
|
int k = -1;
|
|
setSeq++;
|
|
while (circuits[setSeq][++k] != 0)
|
|
set.push_back(getNode(circuits[setSeq][k]));
|
|
if (circuits[setSeq][0] != 0) {
|
|
backEdgeSrc = circuits[setSeq][k - 1];
|
|
backEdgeSink = circuits[setSeq][0];
|
|
}
|
|
if (ModuloScheduling::printScheduleProcess()) {
|
|
DEBUG(std::cerr << "the first set is:");
|
|
dumpSet(set);
|
|
}
|
|
// implement the ordering algorithm
|
|
enum OrderSeq { bottom_up, top_down };
|
|
OrderSeq order;
|
|
std::vector<ModuloSchedGraphNode*> R;
|
|
while (!set.empty()) {
|
|
std::vector<ModuloSchedGraphNode*> pset = predSet(oNodes);
|
|
std::vector<ModuloSchedGraphNode*> sset = succSet(oNodes);
|
|
|
|
if (!pset.empty() && !vectorConj(pset, set).empty()) {
|
|
R = vectorConj(pset, set);
|
|
order = bottom_up;
|
|
} else if (!sset.empty() && !vectorConj(sset, set).empty()) {
|
|
R = vectorConj(sset, set);
|
|
order = top_down;
|
|
} else {
|
|
int maxASAP = -1;
|
|
int position = -1;
|
|
for (unsigned i = 0; i < set.size(); i++) {
|
|
int temp = set[i]->getASAP();
|
|
if (temp > maxASAP) {
|
|
maxASAP = temp;
|
|
position = i;
|
|
}
|
|
}
|
|
R.push_back(set[position]);
|
|
order = bottom_up;
|
|
}
|
|
|
|
while (!R.empty()) {
|
|
if (order == top_down) {
|
|
if (ModuloScheduling::printScheduleProcess())
|
|
DEBUG(std::cerr << "in top_down round\n");
|
|
while (!R.empty()) {
|
|
int maxHeight = -1;
|
|
NodeVec::iterator chosenI;
|
|
for (NodeVec::iterator I = R.begin(); I != R.end(); I++) {
|
|
int temp = (*I)->height;
|
|
if ((temp > maxHeight)
|
|
|| (temp == maxHeight && (*I)->mov <= (*chosenI)->mov)) {
|
|
|
|
if ((temp > maxHeight)
|
|
|| (temp == maxHeight && (*I)->mov < (*chosenI)->mov)) {
|
|
maxHeight = temp;
|
|
chosenI = I;
|
|
continue;
|
|
}
|
|
//possible case: instruction A and B has the same height and mov,
|
|
//but A has dependence to B e.g B is the branch instruction in the
|
|
//end, or A is the phi instruction at the beginning
|
|
if ((*I)->mov == (*chosenI)->mov)
|
|
for (ModuloSchedGraphNode::const_iterator oe =
|
|
(*I)->beginOutEdges(), end = (*I)->endOutEdges();
|
|
oe != end; oe++) {
|
|
if ((*oe)->getSink() == (*chosenI)) {
|
|
maxHeight = temp;
|
|
chosenI = I;
|
|
continue;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
ModuloSchedGraphNode *mu = *chosenI;
|
|
oNodes.push_back(mu);
|
|
R.erase(chosenI);
|
|
std::vector<ModuloSchedGraphNode*> succ_mu =
|
|
succSet(mu, backEdgeSrc, backEdgeSink);
|
|
std::vector<ModuloSchedGraphNode*> comm =
|
|
vectorConj(succ_mu, set);
|
|
comm = vectorSub(comm, oNodes);
|
|
R = vectorUnion(comm, R);
|
|
}
|
|
order = bottom_up;
|
|
R = vectorConj(predSet(oNodes), set);
|
|
} else {
|
|
if (ModuloScheduling::printScheduleProcess())
|
|
DEBUG(std::cerr << "in bottom up round\n");
|
|
while (!R.empty()) {
|
|
int maxDepth = -1;
|
|
NodeVec::iterator chosenI;
|
|
for (NodeVec::iterator I = R.begin(); I != R.end(); I++) {
|
|
int temp = (*I)->depth;
|
|
if ((temp > maxDepth)
|
|
|| (temp == maxDepth && (*I)->mov < (*chosenI)->mov)) {
|
|
maxDepth = temp;
|
|
chosenI = I;
|
|
}
|
|
}
|
|
ModuloSchedGraphNode *mu = *chosenI;
|
|
oNodes.push_back(mu);
|
|
R.erase(chosenI);
|
|
std::vector<ModuloSchedGraphNode*> pred_mu =
|
|
predSet(mu, backEdgeSrc, backEdgeSink);
|
|
std::vector<ModuloSchedGraphNode*> comm =
|
|
vectorConj(pred_mu, set);
|
|
comm = vectorSub(comm, oNodes);
|
|
R = vectorUnion(comm, R);
|
|
}
|
|
order = top_down;
|
|
R = vectorConj(succSet(oNodes), set);
|
|
}
|
|
}
|
|
if (ModuloScheduling::printScheduleProcess()) {
|
|
DEBUG(std::cerr << "order finished\n");
|
|
DEBUG(std::cerr << "dumping the ordered nodes:\n");
|
|
dumpSet(oNodes);
|
|
dumpCircuits();
|
|
}
|
|
//create a new set
|
|
//FIXME: the nodes between onodes and this circuit should also be include in
|
|
//this set
|
|
if (ModuloScheduling::printScheduleProcess())
|
|
DEBUG(std::cerr << "building the next set\n");
|
|
set.clear();
|
|
int k = -1;
|
|
setSeq++;
|
|
while (circuits[setSeq][++k] != 0)
|
|
set.push_back(getNode(circuits[setSeq][k]));
|
|
if (circuits[setSeq][0] != 0) {
|
|
backEdgeSrc = circuits[setSeq][k - 1];
|
|
backEdgeSink = circuits[setSeq][0];
|
|
}
|
|
if (set.empty()) {
|
|
//no circuits any more
|
|
//collect all other nodes
|
|
if (ModuloScheduling::printScheduleProcess())
|
|
DEBUG(std::cerr << "no circuits any more, collect the rest nodes\n");
|
|
for (unsigned i = 2; i < numNodes + 2; i++) {
|
|
bool inset = false;
|
|
for (unsigned j = 0; j < oNodes.size(); j++)
|
|
if (oNodes[j]->getNodeId() == i) {
|
|
inset = true;
|
|
break;
|
|
}
|
|
if (!inset)
|
|
set.push_back(getNode(i));
|
|
}
|
|
}
|
|
if (ModuloScheduling::printScheduleProcess()) {
|
|
DEBUG(std::cerr << "next set is:\n");
|
|
dumpSet(set);
|
|
}
|
|
} //while(!set.empty())
|
|
|
|
}
|
|
|
|
|
|
|
|
void ModuloSchedGraph::buildGraph(const TargetMachine & target)
|
|
{
|
|
const BasicBlock *bb = bbVec[0];
|
|
|
|
assert(bbVec.size() == 1 && "only handling a single basic block here");
|
|
|
|
// Use this data structure to note all machine operands that compute
|
|
// ordinary LLVM values. These must be computed defs (i.e., instructions).
|
|
// Note that there may be multiple machine instructions that define
|
|
// each Value.
|
|
ValueToDefVecMap valueToDefVecMap;
|
|
|
|
// Use this data structure to note all memory instructions.
|
|
// We use this to add memory dependence edges without a second full walk.
|
|
//
|
|
// vector<const Instruction*> memVec;
|
|
std::vector<ModuloSchedGraphNode*> memNodeVec;
|
|
|
|
// Use this data structure to note any uses or definitions of
|
|
// machine registers so we can add edges for those later without
|
|
// extra passes over the nodes.
|
|
// The vector holds an ordered list of references to the machine reg,
|
|
// ordered according to control-flow order. This only works for a
|
|
// single basic block, hence the assertion. Each reference is identified
|
|
// by the pair: <node, operand-number>.
|
|
//
|
|
RegToRefVecMap regToRefVecMap;
|
|
|
|
// Make a dummy root node. We'll add edges to the real roots later.
|
|
graphRoot = new ModuloSchedGraphNode(0, NULL, NULL, -1, target);
|
|
graphLeaf = new ModuloSchedGraphNode(1, NULL, NULL, -1, target);
|
|
|
|
//----------------------------------------------------------------
|
|
// First add nodes for all the LLVM instructions in the basic block because
|
|
// this greatly simplifies identifying which edges to add. Do this one VM
|
|
// instruction at a time since the ModuloSchedGraphNode needs that.
|
|
// Also, remember the load/store instructions to add memory deps later.
|
|
//----------------------------------------------------------------
|
|
|
|
//FIXME:if there is call instruction, then we shall quit somewhere
|
|
// currently we leave call instruction and continue construct graph
|
|
|
|
//dump only the blocks which are from loops
|
|
|
|
|
|
if (ModuloScheduling::printScheduleProcess())
|
|
this->dump(bb);
|
|
|
|
if (!isLoop(bb)) {
|
|
DEBUG(std::cerr << " dumping non-loop BB:\n");
|
|
dump(bb);
|
|
}
|
|
if (isLoop(bb)) {
|
|
buildNodesforBB(target, bb, memNodeVec, regToRefVecMap,
|
|
valueToDefVecMap);
|
|
|
|
this->addDefUseEdges(bb);
|
|
this->addCDEdges(bb);
|
|
this->addMemEdges(bb);
|
|
|
|
//this->dump();
|
|
|
|
int ResII = this->computeResII(bb);
|
|
if (ModuloScheduling::printScheduleProcess())
|
|
DEBUG(std::cerr << "ResII is " << ResII << "\n");
|
|
int RecII = this->computeRecII(bb);
|
|
if (ModuloScheduling::printScheduleProcess())
|
|
DEBUG(std::cerr << "RecII is " << RecII << "\n");
|
|
|
|
this->MII = std::max(ResII, RecII);
|
|
|
|
this->computeNodeProperty(bb);
|
|
if (ModuloScheduling::printScheduleProcess())
|
|
this->dumpNodeProperty();
|
|
|
|
this->orderNodes();
|
|
|
|
if (ModuloScheduling::printScheduleProcess())
|
|
this->dump();
|
|
//this->instrScheduling();
|
|
|
|
//this->dumpScheduling();
|
|
}
|
|
}
|
|
|
|
ModuloSchedGraphNode *ModuloSchedGraph::getNode(const unsigned nodeId) const
|
|
{
|
|
for (const_iterator I = begin(), E = end(); I != E; I++)
|
|
if ((*I).second->getNodeId() == nodeId)
|
|
return (ModuloSchedGraphNode *) (*I).second;
|
|
return NULL;
|
|
}
|
|
|
|
int ModuloSchedGraph::computeRecII(const BasicBlock *bb)
|
|
{
|
|
int RecII = 0;
|
|
|
|
//os<<"begining computerRecII()"<<"\n";
|
|
|
|
//FIXME: only deal with circuits starting at the first node: the phi node
|
|
//nodeId=2;
|
|
|
|
//search all elementary circuits in the dependance graph
|
|
//assume maximum number of nodes is MAXNODE
|
|
|
|
unsigned path[MAXNODE];
|
|
unsigned stack[MAXNODE][MAXNODE];
|
|
|
|
for (int j = 0; j < MAXNODE; j++) {
|
|
path[j] = 0;
|
|
for (int k = 0; k < MAXNODE; k++)
|
|
stack[j][k] = 0;
|
|
}
|
|
//in our graph, the node number starts at 2
|
|
|
|
//number of nodes, because each instruction will result in one node
|
|
const unsigned numNodes = bb->size();
|
|
|
|
int i = 0;
|
|
path[i] = 2;
|
|
|
|
ModuloSchedGraphNode *initNode = getNode(path[0]);
|
|
unsigned initNodeId = initNode->getNodeId();
|
|
ModuloSchedGraphNode *currentNode = initNode;
|
|
|
|
while (currentNode != NULL) {
|
|
unsigned currentNodeId = currentNode->getNodeId();
|
|
// DEBUG(std::cerr<<"current node is "<<currentNodeId<<"\n");
|
|
|
|
ModuloSchedGraphNode *nextNode = NULL;
|
|
for (ModuloSchedGraphNode::const_iterator I =
|
|
currentNode->beginOutEdges(), E = currentNode->endOutEdges();
|
|
I != E; I++) {
|
|
//DEBUG(std::cerr <<" searching in outgoint edges of node
|
|
//"<<currentNodeId<<"\n";
|
|
unsigned nodeId = ((SchedGraphEdge *) * I)->getSink()->getNodeId();
|
|
bool inpath = false, instack = false;
|
|
int k;
|
|
|
|
//DEBUG(std::cerr<<"nodeId is "<<nodeId<<"\n");
|
|
|
|
k = -1;
|
|
while (path[++k] != 0)
|
|
if (nodeId == path[k]) {
|
|
inpath = true;
|
|
break;
|
|
}
|
|
|
|
k = -1;
|
|
while (stack[i][++k] != 0)
|
|
if (nodeId == stack[i][k]) {
|
|
instack = true;
|
|
break;
|
|
}
|
|
|
|
if (nodeId > currentNodeId && !inpath && !instack) {
|
|
nextNode =
|
|
(ModuloSchedGraphNode *) ((SchedGraphEdge *) * I)->getSink();
|
|
break;
|
|
}
|
|
}
|
|
|
|
if (nextNode != NULL) {
|
|
//DEBUG(std::cerr<<"find the next Node "<<nextNode->getNodeId()<<"\n");
|
|
|
|
int j = 0;
|
|
while (stack[i][j] != 0)
|
|
j++;
|
|
stack[i][j] = nextNode->getNodeId();
|
|
|
|
i++;
|
|
path[i] = nextNode->getNodeId();
|
|
currentNode = nextNode;
|
|
} else {
|
|
//DEBUG(std::cerr<<"no expansion any more"<<"\n");
|
|
//confirmCircuit();
|
|
for (ModuloSchedGraphNode::const_iterator I =
|
|
currentNode->beginOutEdges(), E = currentNode->endOutEdges();
|
|
I != E; I++) {
|
|
unsigned nodeId = ((SchedGraphEdge *) * I)->getSink()->getNodeId();
|
|
if (nodeId == initNodeId) {
|
|
|
|
int j = -1;
|
|
while (circuits[++j][0] != 0);
|
|
for (int k = 0; k < MAXNODE; k++)
|
|
circuits[j][k] = path[k];
|
|
|
|
}
|
|
}
|
|
//remove this node in the path and clear the corresponding entries in the
|
|
//stack
|
|
path[i] = 0;
|
|
int j = 0;
|
|
for (j = 0; j < MAXNODE; j++)
|
|
stack[i][j] = 0;
|
|
i--;
|
|
currentNode = getNode(path[i]);
|
|
}
|
|
if (i == 0) {
|
|
|
|
if (ModuloScheduling::printScheduleProcess())
|
|
DEBUG(std::cerr << "circuits found are:\n");
|
|
int j = -1;
|
|
while (circuits[++j][0] != 0) {
|
|
int k = -1;
|
|
while (circuits[j][++k] != 0)
|
|
if (ModuloScheduling::printScheduleProcess())
|
|
DEBUG(std::cerr << circuits[j][k] << "\t");
|
|
if (ModuloScheduling::printScheduleProcess())
|
|
DEBUG(std::cerr << "\n");
|
|
|
|
//for this circuit, compute the sum of all edge delay
|
|
int sumDelay = 0;
|
|
k = -1;
|
|
while (circuits[j][++k] != 0) {
|
|
//ModuloSchedGraphNode* node =getNode(circuits[j][k]);
|
|
unsigned nextNodeId;
|
|
nextNodeId =
|
|
circuits[j][k + 1] !=
|
|
0 ? circuits[j][k + 1] : circuits[j][0];
|
|
|
|
/*
|
|
for(ModuloSchedGraphNode::const_iterator I=node->beginOutEdges(),
|
|
E=node->endOutEdges();I !=E; I++)
|
|
{
|
|
SchedGraphEdge* edge= *I;
|
|
if(edge->getSink()->getNodeId() == nextNodeId)
|
|
{sumDelay += edge->getMinDelay();break;}
|
|
}
|
|
*/
|
|
|
|
sumDelay +=
|
|
getMaxDelayEdge(circuits[j][k], nextNodeId)->getMinDelay();
|
|
|
|
}
|
|
// assume we have distance 1, in this case the sumDelay is RecII
|
|
// this is correct for SSA form only
|
|
//
|
|
if (ModuloScheduling::printScheduleProcess())
|
|
DEBUG(std::cerr << "The total Delay in the circuit is " << sumDelay
|
|
<< "\n");
|
|
|
|
RecII = RecII > sumDelay ? RecII : sumDelay;
|
|
|
|
}
|
|
return RecII;
|
|
}
|
|
|
|
}
|
|
|
|
return -1;
|
|
}
|
|
|
|
void ModuloSchedGraph::addResourceUsage(std::vector<std::pair<int,int> > &ruVec,
|
|
int rid)
|
|
{
|
|
//DEBUG(std::cerr<<"\nadding a resouce , current resouceUsage vector size is
|
|
//"<<ruVec.size()<<"\n";
|
|
bool alreadyExists = false;
|
|
for (unsigned i = 0; i < ruVec.size(); i++) {
|
|
if (rid == ruVec[i].first) {
|
|
ruVec[i].second++;
|
|
alreadyExists = true;
|
|
break;
|
|
}
|
|
}
|
|
if (!alreadyExists)
|
|
ruVec.push_back(std::make_pair(rid, 1));
|
|
//DEBUG(std::cerr<<"current resouceUsage vector size is "<<ruVec.size()<<"\n";
|
|
|
|
}
|
|
void ModuloSchedGraph::dumpResourceUsage(std::vector<std::pair<int,int> > &ru)
|
|
{
|
|
TargetSchedInfo & msi = (TargetSchedInfo &) target.getSchedInfo();
|
|
|
|
std::vector<std::pair<int,int> > resourceNumVector = msi.resourceNumVector;
|
|
DEBUG(std::cerr << "resourceID\t" << "resourceNum\n");
|
|
for (unsigned i = 0; i < resourceNumVector.size(); i++)
|
|
DEBUG(std::cerr << resourceNumVector[i].
|
|
first << "\t" << resourceNumVector[i].second << "\n");
|
|
|
|
DEBUG(std::cerr << " maxNumIssueTotal(issue slot in one cycle) = " << msi.
|
|
maxNumIssueTotal << "\n");
|
|
DEBUG(std::cerr << "resourceID\t resourceUsage\t ResourceNum\n");
|
|
for (unsigned i = 0; i < ru.size(); i++) {
|
|
DEBUG(std::cerr << ru[i].first << "\t" << ru[i].second);
|
|
const unsigned resNum = msi.getCPUResourceNum(ru[i].first);
|
|
DEBUG(std::cerr << "\t" << resNum << "\n");
|
|
}
|
|
}
|
|
|
|
int ModuloSchedGraph::computeResII(const BasicBlock * bb)
|
|
{
|
|
|
|
const TargetInstrInfo & mii = target.getInstrInfo();
|
|
const TargetSchedInfo & msi = target.getSchedInfo();
|
|
|
|
int ResII;
|
|
std::vector<std::pair<int,int> > resourceUsage;
|
|
//pair<int resourceid, int resourceUsageTimes_in_the_whole_block>
|
|
|
|
//FIXME: number of functional units the target machine can provide should be
|
|
//get from Target here I temporary hardcode it
|
|
|
|
for (BasicBlock::const_iterator I = bb->begin(), E = bb->end(); I != E;
|
|
I++) {
|
|
if (ModuloScheduling::printScheduleProcess()) {
|
|
DEBUG(std::cerr << "machine instruction for llvm instruction( node " <<
|
|
getGraphNodeForInst(I)->getNodeId() << ")\n");
|
|
DEBUG(std::cerr << "\t" << *I);
|
|
}
|
|
MachineCodeForInstruction & tempMvec =
|
|
MachineCodeForInstruction::get(I);
|
|
if (ModuloScheduling::printScheduleProcess())
|
|
DEBUG(std::cerr << "size =" << tempMvec.size() << "\n");
|
|
for (unsigned i = 0; i < tempMvec.size(); i++) {
|
|
MachineInstr *minstr = tempMvec[i];
|
|
|
|
unsigned minDelay = mii.minLatency(minstr->getOpCode());
|
|
InstrRUsage rUsage = msi.getInstrRUsage(minstr->getOpCode());
|
|
InstrClassRUsage classRUsage =
|
|
msi.getClassRUsage(mii.getSchedClass(minstr->getOpCode()));
|
|
unsigned totCycles = classRUsage.totCycles;
|
|
|
|
std::vector<std::vector<resourceId_t> > resources=rUsage.resourcesByCycle;
|
|
assert(totCycles == resources.size());
|
|
if (ModuloScheduling::printScheduleProcess())
|
|
DEBUG(std::cerr << "resources Usage for this Instr(totCycles="
|
|
<< totCycles << ",mindLatency="
|
|
<< mii.minLatency(minstr->getOpCode()) << "): " << *minstr
|
|
<< "\n");
|
|
for (unsigned j = 0; j < resources.size(); j++) {
|
|
if (ModuloScheduling::printScheduleProcess())
|
|
DEBUG(std::cerr << "cycle " << j << ": ");
|
|
for (unsigned k = 0; k < resources[j].size(); k++) {
|
|
if (ModuloScheduling::printScheduleProcess())
|
|
DEBUG(std::cerr << "\t" << resources[j][k]);
|
|
addResourceUsage(resourceUsage, resources[j][k]);
|
|
}
|
|
if (ModuloScheduling::printScheduleProcess())
|
|
DEBUG(std::cerr << "\n");
|
|
}
|
|
}
|
|
}
|
|
if (ModuloScheduling::printScheduleProcess())
|
|
this->dumpResourceUsage(resourceUsage);
|
|
|
|
//compute ResII
|
|
ResII = 0;
|
|
int issueSlots = msi.maxNumIssueTotal;
|
|
for (unsigned i = 0; i < resourceUsage.size(); i++) {
|
|
int resourceNum = msi.getCPUResourceNum(resourceUsage[i].first);
|
|
int useNum = resourceUsage[i].second;
|
|
double tempII;
|
|
if (resourceNum <= issueSlots)
|
|
tempII = ceil(1.0 * useNum / resourceNum);
|
|
else
|
|
tempII = ceil(1.0 * useNum / issueSlots);
|
|
ResII = std::max((int) tempII, ResII);
|
|
}
|
|
return ResII;
|
|
}
|
|
|
|
ModuloSchedGraphSet::ModuloSchedGraphSet(const Function *function,
|
|
const TargetMachine &target)
|
|
: method(function)
|
|
{
|
|
buildGraphsForMethod(method, target);
|
|
}
|
|
|
|
|
|
ModuloSchedGraphSet::~ModuloSchedGraphSet()
|
|
{
|
|
//delete all the graphs
|
|
for (iterator I = begin(), E = end(); I != E; ++I)
|
|
delete *I;
|
|
}
|
|
|
|
void ModuloSchedGraphSet::dump() const
|
|
{
|
|
DEBUG(std::cerr << " ====== ModuloSched graphs for function `" <<
|
|
method->getName() << "' =========\n\n");
|
|
for (const_iterator I = begin(); I != end(); ++I)
|
|
(*I)->dump();
|
|
|
|
DEBUG(std::cerr << "\n=========End graphs for function `" << method->getName()
|
|
<< "' ==========\n\n");
|
|
}
|
|
|
|
void ModuloSchedGraph::dump(const BasicBlock * bb)
|
|
{
|
|
DEBUG(std::cerr << "dumping basic block:");
|
|
DEBUG(std::cerr << (bb->hasName()? bb->getName() : "block")
|
|
<< " (" << bb << ")" << "\n");
|
|
}
|
|
|
|
void ModuloSchedGraph::dump(const BasicBlock * bb, std::ostream & os)
|
|
{
|
|
os << "dumping basic block:";
|
|
os << (bb->hasName()? bb->getName() : "block")
|
|
<< " (" << bb << ")" << "\n";
|
|
}
|
|
|
|
void ModuloSchedGraph::dump() const
|
|
{
|
|
DEBUG(std::cerr << " ModuloSchedGraph for basic Blocks:");
|
|
for (unsigned i = 0, N = bbVec.size(); i < N; i++) {
|
|
DEBUG(std::cerr << (bbVec[i]->hasName()? bbVec[i]->getName() : "block")
|
|
<< " (" << bbVec[i] << ")" << ((i == N - 1) ? "" : ", "));
|
|
}
|
|
|
|
DEBUG(std::cerr << "\n\n Actual Root nodes : ");
|
|
for (unsigned i = 0, N = graphRoot->outEdges.size(); i < N; i++)
|
|
DEBUG(std::cerr << graphRoot->outEdges[i]->getSink()->getNodeId()
|
|
<< ((i == N - 1) ? "" : ", "));
|
|
|
|
DEBUG(std::cerr << "\n Graph Nodes:\n");
|
|
//for (const_iterator I=begin(); I != end(); ++I)
|
|
//DEBUG(std::cerr << "\n" << *I->second;
|
|
unsigned numNodes = bbVec[0]->size();
|
|
for (unsigned i = 2; i < numNodes + 2; i++) {
|
|
ModuloSchedGraphNode *node = getNode(i);
|
|
DEBUG(std::cerr << "\n" << *node);
|
|
}
|
|
|
|
DEBUG(std::cerr << "\n");
|
|
}
|
|
|
|
void ModuloSchedGraph::dumpNodeProperty() const
|
|
{
|
|
const BasicBlock *bb = bbVec[0];
|
|
unsigned numNodes = bb->size();
|
|
for (unsigned i = 2; i < numNodes + 2; i++) {
|
|
ModuloSchedGraphNode *node = getNode(i);
|
|
DEBUG(std::cerr << "NodeId " << node->getNodeId() << "\t");
|
|
DEBUG(std::cerr << "ASAP " << node->getASAP() << "\t");
|
|
DEBUG(std::cerr << "ALAP " << node->getALAP() << "\t");
|
|
DEBUG(std::cerr << "mov " << node->getMov() << "\t");
|
|
DEBUG(std::cerr << "depth " << node->getDepth() << "\t");
|
|
DEBUG(std::cerr << "height " << node->getHeight() << "\t\n");
|
|
}
|
|
}
|
|
|
|
void ModuloSchedGraphSet::buildGraphsForMethod(const Function *F,
|
|
const TargetMachine &target)
|
|
{
|
|
for (Function::const_iterator BI = F->begin(); BI != F->end(); ++BI)
|
|
addGraph(new ModuloSchedGraph(BI, target));
|
|
}
|
|
|
|
std::ostream& operator<<(std::ostream &os,
|
|
const ModuloSchedGraphNode &node)
|
|
{
|
|
os << std::string(8, ' ')
|
|
<< "Node " << node.nodeId << " : "
|
|
<< "latency = " << node.latency << "\n" << std::string(12, ' ');
|
|
|
|
if (node.getInst() == NULL)
|
|
os << "(Dummy node)\n";
|
|
else {
|
|
os << *node.getInst() << "\n" << std::string(12, ' ');
|
|
os << node.inEdges.size() << " Incoming Edges:\n";
|
|
for (unsigned i = 0, N = node.inEdges.size(); i < N; i++)
|
|
os << std::string(16, ' ') << *node.inEdges[i];
|
|
|
|
os << std::string(12, ' ') << node.outEdges.size()
|
|
<< " Outgoing Edges:\n";
|
|
for (unsigned i = 0, N = node.outEdges.size(); i < N; i++)
|
|
os << std::string(16, ' ') << *node.outEdges[i];
|
|
}
|
|
|
|
return os;
|
|
}
|