mirror of
https://github.com/RPCS3/llvm.git
synced 2025-04-03 05:41:42 +00:00
Simplify names of lattice values. SGTUNE becomes SGT, for example.
Fix initializeConstant, now initializeInt. Fixes major performance bottleneck. X == Y || X->DominatedBy(Y) is redundant. Remove the X == Y part. Fix crasher in makeEqual where getOrInsertNode would add a new constant, producing an NE relationship between the two members we're trying to make equal. This now allows us to mark more BBs as unreachable. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@33612 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
parent
ec9bfdc152
commit
6a08f918b6
@ -52,14 +52,14 @@
|
||||
// responsible for analyzing the variable and seeing what new inferences
|
||||
// can be made from each property. For example:
|
||||
//
|
||||
// %P = seteq int* %ptr, null
|
||||
// %a = or bool %P, %Q
|
||||
// %P = setne int* %ptr, null
|
||||
// %a = and bool %P, %Q
|
||||
// br bool %a label %cond_true, label %cond_false
|
||||
//
|
||||
// For the true branch, the VRPSolver will start with %a EQ true and look at
|
||||
// the definition of %a and find that it can infer that %P and %Q are both
|
||||
// true. From %P being true, it can infer that %ptr NE null. For the false
|
||||
// branch it can't infer anything from the "or" instruction.
|
||||
// branch it can't infer anything from the "and" instruction.
|
||||
//
|
||||
// Besides branches, we can also infer properties from instruction that may
|
||||
// have undefined behaviour in certain cases. For example, the dividend of
|
||||
@ -102,18 +102,18 @@ namespace {
|
||||
// 0 1 0 1 1 -- GE 11
|
||||
// 0 1 1 0 0 -- SGTULT 12
|
||||
// 0 1 1 0 1 -- SGEULE 13
|
||||
// 0 1 1 1 0 -- SGTUNE 14
|
||||
// 0 1 1 1 1 -- SGEUANY 15
|
||||
// 0 1 1 1 0 -- SGT 14
|
||||
// 0 1 1 1 1 -- SGE 15
|
||||
// 1 0 0 1 0 -- SLTUGT 18
|
||||
// 1 0 0 1 1 -- SLEUGE 19
|
||||
// 1 0 1 0 0 -- LT 20
|
||||
// 1 0 1 0 1 -- LE 21
|
||||
// 1 0 1 1 0 -- SLTUNE 22
|
||||
// 1 0 1 1 1 -- SLEUANY 23
|
||||
// 1 1 0 1 0 -- SNEUGT 26
|
||||
// 1 1 0 1 1 -- SANYUGE 27
|
||||
// 1 1 1 0 0 -- SNEULT 28
|
||||
// 1 1 1 0 1 -- SANYULE 29
|
||||
// 1 0 1 1 0 -- SLT 22
|
||||
// 1 0 1 1 1 -- SLE 23
|
||||
// 1 1 0 1 0 -- UGT 26
|
||||
// 1 1 0 1 1 -- UGE 27
|
||||
// 1 1 1 0 0 -- ULT 28
|
||||
// 1 1 1 0 1 -- ULE 29
|
||||
// 1 1 1 1 0 -- NE 30
|
||||
enum LatticeBits {
|
||||
EQ_BIT = 1, UGT_BIT = 2, ULT_BIT = 4, SGT_BIT = 8, SLT_BIT = 16
|
||||
@ -128,23 +128,23 @@ namespace {
|
||||
SGEULE = SGTULT | EQ_BIT,
|
||||
SLTUGT = SLT_BIT | UGT_BIT,
|
||||
SLEUGE = SLTUGT | EQ_BIT,
|
||||
SNEULT = SLT_BIT | SGT_BIT | ULT_BIT,
|
||||
SNEUGT = SLT_BIT | SGT_BIT | UGT_BIT,
|
||||
SLTUNE = SLT_BIT | ULT_BIT | UGT_BIT,
|
||||
SGTUNE = SGT_BIT | ULT_BIT | UGT_BIT,
|
||||
SLEUANY = SLT_BIT | ULT_BIT | UGT_BIT | EQ_BIT,
|
||||
SGEUANY = SGT_BIT | ULT_BIT | UGT_BIT | EQ_BIT,
|
||||
SANYULE = SLT_BIT | SGT_BIT | ULT_BIT | EQ_BIT,
|
||||
SANYUGE = SLT_BIT | SGT_BIT | UGT_BIT | EQ_BIT
|
||||
ULT = SLT_BIT | SGT_BIT | ULT_BIT,
|
||||
UGT = SLT_BIT | SGT_BIT | UGT_BIT,
|
||||
SLT = SLT_BIT | ULT_BIT | UGT_BIT,
|
||||
SGT = SGT_BIT | ULT_BIT | UGT_BIT,
|
||||
SLE = SLT | EQ_BIT,
|
||||
SGE = SGT | EQ_BIT,
|
||||
ULE = ULT | EQ_BIT,
|
||||
UGE = UGT | EQ_BIT
|
||||
};
|
||||
|
||||
static bool validPredicate(LatticeVal LV) {
|
||||
switch (LV) {
|
||||
case GT: case GE: case LT: case LE: case NE:
|
||||
case SGTULT: case SGTUNE: case SGEULE:
|
||||
case SLTUGT: case SLTUNE: case SLEUGE:
|
||||
case SNEULT: case SNEUGT:
|
||||
case SLEUANY: case SGEUANY: case SANYULE: case SANYUGE:
|
||||
case SGTULT: case SGT: case SGEULE:
|
||||
case SLTUGT: case SLT: case SLEUGE:
|
||||
case ULT: case UGT:
|
||||
case SLE: case SGE: case ULE: case UGE:
|
||||
return true;
|
||||
default:
|
||||
return false;
|
||||
@ -366,36 +366,91 @@ namespace {
|
||||
|
||||
std::vector<Node> Nodes;
|
||||
|
||||
std::vector<std::pair<ConstantInt *, unsigned> > Constants;
|
||||
void initializeConstant(Constant *C, unsigned index) {
|
||||
ConstantInt *CI = dyn_cast<ConstantInt>(C);
|
||||
if (!CI) return;
|
||||
std::vector<std::pair<ConstantInt *, unsigned> > Ints;
|
||||
|
||||
// XXX: instead of O(n) calls to addInequality, just find the 2, 3 or 4
|
||||
// nodes that are nearest less than or greater than (signed or unsigned).
|
||||
for (std::vector<std::pair<ConstantInt *, unsigned> >::iterator
|
||||
I = Constants.begin(), E = Constants.end(); I != E; ++I) {
|
||||
ConstantInt *Other = I->first;
|
||||
if (CI->getType() == Other->getType()) {
|
||||
unsigned lv = 0;
|
||||
|
||||
if (CI->getZExtValue() < Other->getZExtValue())
|
||||
lv |= ULT_BIT;
|
||||
else
|
||||
lv |= UGT_BIT;
|
||||
|
||||
if (CI->getSExtValue() < Other->getSExtValue())
|
||||
lv |= SLT_BIT;
|
||||
else
|
||||
lv |= SGT_BIT;
|
||||
|
||||
LatticeVal LV = static_cast<LatticeVal>(lv);
|
||||
assert(validPredicate(LV) && "Not a valid predicate.");
|
||||
if (!isRelatedBy(index, I->second, TreeRoot, LV))
|
||||
addInequality(index, I->second, TreeRoot, LV);
|
||||
}
|
||||
/// This is used to keep the ConstantInts list in unsigned ascending order.
|
||||
/// If the bitwidths don't match, this sorts smaller values ahead.
|
||||
struct SortByZExt {
|
||||
bool operator()(const std::pair<ConstantInt *, unsigned> &LHS,
|
||||
const std::pair<ConstantInt *, unsigned> &RHS) const {
|
||||
if (LHS.first->getType()->getBitWidth() !=
|
||||
RHS.first->getType()->getBitWidth())
|
||||
return LHS.first->getType()->getBitWidth() <
|
||||
RHS.first->getType()->getBitWidth();
|
||||
return LHS.first->getZExtValue() < RHS.first->getZExtValue();
|
||||
}
|
||||
Constants.push_back(std::make_pair(CI, index));
|
||||
};
|
||||
|
||||
/// True when the bitwidth of LHS < bitwidth of RHS.
|
||||
struct FindByIntegerWidth {
|
||||
bool operator()(const std::pair<ConstantInt *, unsigned> &LHS,
|
||||
const std::pair<ConstantInt *, unsigned> &RHS) const {
|
||||
return LHS.first->getType()->getBitWidth() <
|
||||
RHS.first->getType()->getBitWidth();
|
||||
}
|
||||
};
|
||||
|
||||
void initializeInt(ConstantInt *CI, unsigned index) {
|
||||
std::vector<std::pair<ConstantInt *, unsigned> >::iterator begin, end,
|
||||
last, iULT, iUGT, iSLT, iSGT;
|
||||
|
||||
std::pair<ConstantInt *, unsigned> pair = std::make_pair(CI, index);
|
||||
|
||||
begin = std::lower_bound(Ints.begin(), Ints.end(), pair,
|
||||
FindByIntegerWidth());
|
||||
end = std::upper_bound(begin, Ints.end(), pair, FindByIntegerWidth());
|
||||
|
||||
if (begin == end) last = end;
|
||||
else last = end - 1;
|
||||
|
||||
iUGT = std::lower_bound(begin, end, pair, SortByZExt());
|
||||
iULT = (iUGT == begin || begin == end) ? end : iUGT - 1;
|
||||
|
||||
if (iUGT != end && iULT != end &&
|
||||
(iULT->first->getSExtValue() >> 63) ==
|
||||
(iUGT->first->getSExtValue() >> 63)) { // signs match
|
||||
iSGT = iUGT;
|
||||
iSLT = iULT;
|
||||
} else {
|
||||
if (iULT == end || iUGT == end) {
|
||||
if (iULT == end) iSLT = last; else iSLT = iULT;
|
||||
if (iUGT == end) iSGT = begin; else iSGT = iUGT;
|
||||
} else if (iULT->first->getSExtValue() < 0) {
|
||||
assert(iUGT->first->getSExtValue() >= 0 && "Bad sign comparison.");
|
||||
iSGT = iUGT;
|
||||
iSLT = iULT;
|
||||
} else {
|
||||
assert(iULT->first->getSExtValue() >= 0 &&
|
||||
iUGT->first->getSExtValue() < 0 && "Bad sign comparison.");
|
||||
iSGT = iULT;
|
||||
iSLT = iUGT;
|
||||
}
|
||||
|
||||
if (iSGT != end &&
|
||||
iSGT->first->getSExtValue() < CI->getSExtValue()) iSGT = end;
|
||||
if (iSLT != end &&
|
||||
iSLT->first->getSExtValue() > CI->getSExtValue()) iSLT = end;
|
||||
|
||||
if (begin != end) {
|
||||
if (begin->first->getSExtValue() < CI->getSExtValue())
|
||||
if (iSLT == end ||
|
||||
begin->first->getSExtValue() > iSLT->first->getSExtValue())
|
||||
iSLT = begin;
|
||||
}
|
||||
if (last != end) {
|
||||
if (last->first->getSExtValue() > CI->getSExtValue())
|
||||
if (iSGT == end ||
|
||||
last->first->getSExtValue() < iSGT->first->getSExtValue())
|
||||
iSGT = last;
|
||||
}
|
||||
}
|
||||
|
||||
if (iULT != end) addInequality(iULT->second, index, TreeRoot, ULT);
|
||||
if (iUGT != end) addInequality(iUGT->second, index, TreeRoot, UGT);
|
||||
if (iSLT != end) addInequality(iSLT->second, index, TreeRoot, SLT);
|
||||
if (iSGT != end) addInequality(iSGT->second, index, TreeRoot, SGT);
|
||||
|
||||
Ints.insert(iUGT, pair);
|
||||
}
|
||||
|
||||
public:
|
||||
@ -441,8 +496,8 @@ namespace {
|
||||
NodeMap.insert(std::lower_bound(NodeMap.begin(), NodeMap.end(),
|
||||
MapEntry), MapEntry);
|
||||
|
||||
if (Constant *C = dyn_cast<Constant>(V))
|
||||
initializeConstant(C, MapEntry.index);
|
||||
if (ConstantInt *CI = dyn_cast<ConstantInt>(V))
|
||||
initializeInt(CI, MapEntry.index);
|
||||
|
||||
return MapEntry.index;
|
||||
}
|
||||
@ -485,11 +540,7 @@ namespace {
|
||||
ToRepoint.push_back(V);
|
||||
|
||||
if (unsigned Conflict = getNode(V, Subtree)) {
|
||||
// XXX: NodeMap.size() exceeds 68000 entries compiling kimwitu++!
|
||||
// This adds 57 seconds to the otherwise 3 second build. Unacceptable.
|
||||
//
|
||||
// IDEA: could we iterate 1..Nodes.size() calling getNode? It's
|
||||
// O(n log n) but kimwitu++ only has about 300 nodes.
|
||||
// XXX: NodeMap.size() exceeds 68,000 entries compiling kimwitu++!
|
||||
for (NodeMapType::iterator I = NodeMap.begin(), E = NodeMap.end();
|
||||
I != E; ++I) {
|
||||
if (I->index == Conflict && Subtree->DominatedBy(I->Subtree))
|
||||
@ -541,7 +592,7 @@ namespace {
|
||||
// add %a < %n2 too. This keeps the graph fully connected.
|
||||
if (LV1 != NE) {
|
||||
// Someone with a head for this sort of logic, please review this.
|
||||
// Given that %x SLTUGT %y and %a SLEUANY %x, what is the relationship
|
||||
// Given that %x SLTUGT %y and %a SLE %x, what is the relationship
|
||||
// between %a and %y? I believe the below code is correct, but I don't
|
||||
// think it's the most efficient solution.
|
||||
|
||||
@ -795,7 +846,7 @@ namespace {
|
||||
return IdomI(TopInst, I);
|
||||
else {
|
||||
ETNode *Node = Forest->getNodeForBlock(I->getParent());
|
||||
return Node == Top || Node->DominatedBy(Top);
|
||||
return Node->DominatedBy(Top);
|
||||
}
|
||||
}
|
||||
|
||||
@ -945,7 +996,12 @@ namespace {
|
||||
// Create N1.
|
||||
// XXX: this should call newNode, but instead the node might be created
|
||||
// in isRelatedBy. That's also a fixme.
|
||||
if (!n1) n1 = IG.getOrInsertNode(V1, Top);
|
||||
if (!n1) {
|
||||
n1 = IG.getOrInsertNode(V1, Top);
|
||||
|
||||
if (isa<ConstantInt>(V1))
|
||||
if (IG.isRelatedBy(n1, n2, Top, NE)) return false;
|
||||
}
|
||||
|
||||
// Migrate relationships from removed nodes to N1.
|
||||
Node *N1 = IG.node(n1);
|
||||
@ -954,7 +1010,7 @@ namespace {
|
||||
unsigned n = *I;
|
||||
Node *N = IG.node(n);
|
||||
for (Node::iterator NI = N->begin(), NE = N->end(); NI != NE; ++NI) {
|
||||
if (Top == NI->Subtree || NI->Subtree->DominatedBy(Top)) {
|
||||
if (NI->Subtree->DominatedBy(Top)) {
|
||||
if (NI->To == n1) {
|
||||
assert((NI->LV & EQ_BIT) && "Node inequal to itself.");
|
||||
continue;
|
||||
@ -1016,21 +1072,21 @@ namespace {
|
||||
case ICmpInst::ICMP_NE:
|
||||
return NE;
|
||||
case ICmpInst::ICMP_UGT:
|
||||
return SNEUGT;
|
||||
return UGT;
|
||||
case ICmpInst::ICMP_UGE:
|
||||
return SANYUGE;
|
||||
return UGE;
|
||||
case ICmpInst::ICMP_ULT:
|
||||
return SNEULT;
|
||||
return ULT;
|
||||
case ICmpInst::ICMP_ULE:
|
||||
return SANYULE;
|
||||
return ULE;
|
||||
case ICmpInst::ICMP_SGT:
|
||||
return SGTUNE;
|
||||
return SGT;
|
||||
case ICmpInst::ICMP_SGE:
|
||||
return SGEUANY;
|
||||
return SGE;
|
||||
case ICmpInst::ICMP_SLT:
|
||||
return SLTUNE;
|
||||
return SLT;
|
||||
case ICmpInst::ICMP_SLE:
|
||||
return SLEUANY;
|
||||
return SLE;
|
||||
}
|
||||
}
|
||||
|
||||
|
Loading…
x
Reference in New Issue
Block a user