mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-12-04 17:56:53 +00:00
Start removing the use of an ad-hoc 'never inline' set and instead
directly query the function information which this set was representing. This simplifies the interface of the inline cost analysis, and makes the always-inline pass significantly more efficient. Previously, always-inline would first make a single set of every function in the module *except* those marked with the always-inline attribute. It would then query this set at every call site to see if the function was a member of the set, and if so, refuse to inline it. This is quite wasteful. Instead, simply check the function attribute directly when looking at the callsite. The normal inliner also had similar redundancy. It added every function in the module with the noinline attribute to its set to ignore, even though inside the cost analysis function we *already tested* the noinline attribute and produced the same result. The only tricky part of removing this is that we have to be able to correctly remove only the functions inlined by the always-inline pass when finalizing, which requires a bit of a hack. Still, much less of a hack than the set of all non-always-inline functions was. While I was touching this function, I switched a heavy-weight set to a vector with sort+unique. The algorithm already had a two-phase insert and removal pattern, we were just needlessly paying the uniquing cost on every insert. This probably speeds up some compiles by a small amount (-O0 compiles with lots of always-inline, so potentially heavy libc++ users), but I've not tried to measure it. I believe there is no functional change here, but yell if you spot one. None are intended. Finally, the direction this is going in is to greatly simplify the inline cost query interface so that we can replace its implementation with a much more clever one. Along the way, all the APIs get simplified, so it seems incrementally good. llvm-svn: 152903
This commit is contained in:
parent
7eb05588b8
commit
1d0b0955da
@ -166,16 +166,13 @@ namespace llvm {
|
||||
/// getInlineCost - The heuristic used to determine if we should inline the
|
||||
/// function call or not.
|
||||
///
|
||||
InlineCost getInlineCost(CallSite CS,
|
||||
SmallPtrSet<const Function *, 16> &NeverInline);
|
||||
InlineCost getInlineCost(CallSite CS);
|
||||
/// getCalledFunction - The heuristic used to determine if we should inline
|
||||
/// the function call or not. The callee is explicitly specified, to allow
|
||||
/// you to calculate the cost of inlining a function via a pointer. The
|
||||
/// result assumes that the inlined version will always be used. You should
|
||||
/// weight it yourself in cases where this callee will not always be called.
|
||||
InlineCost getInlineCost(CallSite CS,
|
||||
Function *Callee,
|
||||
SmallPtrSet<const Function *, 16> &NeverInline);
|
||||
InlineCost getInlineCost(CallSite CS, Function *Callee);
|
||||
|
||||
/// getInlineFudgeFactor - Return a > 1.0 factor if the inliner should use a
|
||||
/// higher threshold to determine if the function call should be inlined.
|
||||
|
@ -79,10 +79,14 @@ struct Inliner : public CallGraphSCCPass {
|
||||
/// has been inlined.
|
||||
virtual void growCachedCostInfo(Function *Caller, Function *Callee) = 0;
|
||||
|
||||
/// removeDeadFunctions - Remove dead functions that are not included in
|
||||
/// DNR (Do Not Remove) list.
|
||||
bool removeDeadFunctions(CallGraph &CG,
|
||||
SmallPtrSet<const Function *, 16> *DNR = NULL);
|
||||
/// removeDeadFunctions - Remove dead functions.
|
||||
///
|
||||
/// This also includes a hack in the form of the 'AlwaysInlineOnly' flag
|
||||
/// which restricts it to deleting functions with an 'AlwaysInline'
|
||||
/// attribute. This is useful for the InlineAlways pass that only wants to
|
||||
/// deal with that subset of the functions.
|
||||
bool removeDeadFunctions(CallGraph &CG, bool AlwaysInlineOnly = false);
|
||||
|
||||
private:
|
||||
// InlineThreshold - Cache the value here for easy access.
|
||||
unsigned InlineThreshold;
|
||||
|
@ -520,22 +520,18 @@ int InlineCostAnalyzer::getInlineBonuses(CallSite CS, Function *Callee) {
|
||||
// getInlineCost - The heuristic used to determine if we should inline the
|
||||
// function call or not.
|
||||
//
|
||||
InlineCost InlineCostAnalyzer::getInlineCost(CallSite CS,
|
||||
SmallPtrSet<const Function*, 16> &NeverInline) {
|
||||
return getInlineCost(CS, CS.getCalledFunction(), NeverInline);
|
||||
InlineCost InlineCostAnalyzer::getInlineCost(CallSite CS) {
|
||||
return getInlineCost(CS, CS.getCalledFunction());
|
||||
}
|
||||
|
||||
InlineCost InlineCostAnalyzer::getInlineCost(CallSite CS,
|
||||
Function *Callee,
|
||||
SmallPtrSet<const Function*, 16> &NeverInline) {
|
||||
InlineCost InlineCostAnalyzer::getInlineCost(CallSite CS, Function *Callee) {
|
||||
Instruction *TheCall = CS.getInstruction();
|
||||
Function *Caller = TheCall->getParent()->getParent();
|
||||
|
||||
// Don't inline functions which can be redefined at link-time to mean
|
||||
// something else. Don't inline functions marked noinline or call sites
|
||||
// marked noinline.
|
||||
if (Callee->mayBeOverridden() ||
|
||||
Callee->hasFnAttr(Attribute::NoInline) || NeverInline.count(Callee) ||
|
||||
if (Callee->mayBeOverridden() || Callee->hasFnAttr(Attribute::NoInline) ||
|
||||
CS.isNoInline())
|
||||
return llvm::InlineCost::getNever();
|
||||
|
||||
|
@ -32,8 +32,6 @@ namespace {
|
||||
|
||||
// AlwaysInliner only inlines functions that are mark as "always inline".
|
||||
class AlwaysInliner : public Inliner {
|
||||
// Functions that are never inlined
|
||||
SmallPtrSet<const Function*, 16> NeverInline;
|
||||
InlineCostAnalyzer CA;
|
||||
public:
|
||||
// Use extremely low threshold.
|
||||
@ -46,7 +44,22 @@ namespace {
|
||||
}
|
||||
static char ID; // Pass identification, replacement for typeid
|
||||
InlineCost getInlineCost(CallSite CS) {
|
||||
return CA.getInlineCost(CS, NeverInline);
|
||||
Function *Callee = CS.getCalledFunction();
|
||||
// We assume indirect calls aren't calling an always-inline function.
|
||||
if (!Callee) return InlineCost::getNever();
|
||||
|
||||
// We can't inline calls to external functions.
|
||||
// FIXME: We shouldn't even get here.
|
||||
if (Callee->isDeclaration()) return InlineCost::getNever();
|
||||
|
||||
// Return never for anything not marked as always inline.
|
||||
if (!Callee->hasFnAttr(Attribute::AlwaysInline))
|
||||
return InlineCost::getNever();
|
||||
|
||||
// We still have to check the inline cost in case there are reasons to
|
||||
// not inline which trump the always-inline attribute such as setjmp and
|
||||
// indirectbr.
|
||||
return CA.getInlineCost(CS);
|
||||
}
|
||||
float getInlineFudgeFactor(CallSite CS) {
|
||||
return CA.getInlineFudgeFactor(CS);
|
||||
@ -58,7 +71,7 @@ namespace {
|
||||
CA.growCachedCostInfo(Caller, Callee);
|
||||
}
|
||||
virtual bool doFinalization(CallGraph &CG) {
|
||||
return removeDeadFunctions(CG, &NeverInline);
|
||||
return removeDeadFunctions(CG, /*AlwaysInlineOnly=*/true);
|
||||
}
|
||||
virtual bool doInitialization(CallGraph &CG);
|
||||
void releaseMemory() {
|
||||
@ -84,12 +97,5 @@ Pass *llvm::createAlwaysInlinerPass(bool InsertLifetime) {
|
||||
// been annotated with the "always inline" attribute.
|
||||
bool AlwaysInliner::doInitialization(CallGraph &CG) {
|
||||
CA.setTargetData(getAnalysisIfAvailable<TargetData>());
|
||||
|
||||
Module &M = CG.getModule();
|
||||
|
||||
for (Module::iterator I = M.begin(), E = M.end(); I != E; ++I)
|
||||
if (!I->isDeclaration() && !I->hasFnAttr(Attribute::AlwaysInline))
|
||||
NeverInline.insert(I);
|
||||
|
||||
return false;
|
||||
}
|
||||
|
@ -43,7 +43,16 @@ namespace {
|
||||
}
|
||||
static char ID; // Pass identification, replacement for typeid
|
||||
InlineCost getInlineCost(CallSite CS) {
|
||||
return CA.getInlineCost(CS, NeverInline);
|
||||
// Filter out functions which should never be inlined due to the global
|
||||
// 'llvm.noinline'.
|
||||
// FIXME: I'm 99% certain that this is an ancient bit of legacy that we
|
||||
// no longer need to support, but I don't want to blindly nuke it just
|
||||
// yet.
|
||||
if (Function *Callee = CS.getCalledFunction())
|
||||
if (NeverInline.count(Callee))
|
||||
return InlineCost::getNever();
|
||||
|
||||
return CA.getInlineCost(CS);
|
||||
}
|
||||
float getInlineFudgeFactor(CallSite CS) {
|
||||
return CA.getInlineFudgeFactor(CS);
|
||||
@ -81,11 +90,6 @@ bool SimpleInliner::doInitialization(CallGraph &CG) {
|
||||
|
||||
Module &M = CG.getModule();
|
||||
|
||||
for (Module::iterator I = M.begin(), E = M.end();
|
||||
I != E; ++I)
|
||||
if (!I->isDeclaration() && I->hasFnAttr(Attribute::NoInline))
|
||||
NeverInline.insert(I);
|
||||
|
||||
// Get llvm.noinline
|
||||
GlobalVariable *GV = M.getNamedGlobal("llvm.noinline");
|
||||
|
||||
|
@ -556,25 +556,27 @@ bool Inliner::doFinalization(CallGraph &CG) {
|
||||
|
||||
/// removeDeadFunctions - Remove dead functions that are not included in
|
||||
/// DNR (Do Not Remove) list.
|
||||
bool Inliner::removeDeadFunctions(CallGraph &CG,
|
||||
SmallPtrSet<const Function *, 16> *DNR) {
|
||||
SmallPtrSet<CallGraphNode*, 16> FunctionsToRemove;
|
||||
bool Inliner::removeDeadFunctions(CallGraph &CG, bool AlwaysInlineOnly) {
|
||||
SmallVector<CallGraphNode*, 16> FunctionsToRemove;
|
||||
|
||||
// Scan for all of the functions, looking for ones that should now be removed
|
||||
// from the program. Insert the dead ones in the FunctionsToRemove set.
|
||||
for (CallGraph::iterator I = CG.begin(), E = CG.end(); I != E; ++I) {
|
||||
CallGraphNode *CGN = I->second;
|
||||
if (CGN->getFunction() == 0)
|
||||
continue;
|
||||
|
||||
Function *F = CGN->getFunction();
|
||||
|
||||
if (!F || F->isDeclaration())
|
||||
continue;
|
||||
|
||||
// Handle the case when this function is called and we only want to care
|
||||
// about always-inline functions. This is a bit of a hack to share code
|
||||
// between here and the InlineAlways pass.
|
||||
if (AlwaysInlineOnly && !F->hasFnAttr(Attribute::AlwaysInline))
|
||||
continue;
|
||||
|
||||
// If the only remaining users of the function are dead constants, remove
|
||||
// them.
|
||||
F->removeDeadConstantUsers();
|
||||
|
||||
if (DNR && DNR->count(F))
|
||||
continue;
|
||||
if (!F->isDefTriviallyDead())
|
||||
continue;
|
||||
|
||||
@ -587,24 +589,28 @@ bool Inliner::removeDeadFunctions(CallGraph &CG,
|
||||
CG.getExternalCallingNode()->removeAnyCallEdgeTo(CGN);
|
||||
|
||||
// Removing the node for callee from the call graph and delete it.
|
||||
FunctionsToRemove.insert(CGN);
|
||||
FunctionsToRemove.push_back(CGN);
|
||||
}
|
||||
if (FunctionsToRemove.empty())
|
||||
return false;
|
||||
|
||||
// Now that we know which functions to delete, do so. We didn't want to do
|
||||
// this inline, because that would invalidate our CallGraph::iterator
|
||||
// objects. :(
|
||||
//
|
||||
// Note that it doesn't matter that we are iterating over a non-stable set
|
||||
// Note that it doesn't matter that we are iterating over a non-stable order
|
||||
// here to do this, it doesn't matter which order the functions are deleted
|
||||
// in.
|
||||
bool Changed = false;
|
||||
for (SmallPtrSet<CallGraphNode*, 16>::iterator I = FunctionsToRemove.begin(),
|
||||
E = FunctionsToRemove.end(); I != E; ++I) {
|
||||
std::sort(FunctionsToRemove.begin(), FunctionsToRemove.end());
|
||||
FunctionsToRemove.erase(std::unique(FunctionsToRemove.begin(),
|
||||
FunctionsToRemove.end()),
|
||||
FunctionsToRemove.end());
|
||||
for (SmallVectorImpl<CallGraphNode *>::iterator I = FunctionsToRemove.begin(),
|
||||
E = FunctionsToRemove.end();
|
||||
I != E; ++I) {
|
||||
resetCachedCostInfo((*I)->getFunction());
|
||||
delete CG.removeFunctionFromModule(*I);
|
||||
++NumDeleted;
|
||||
Changed = true;
|
||||
}
|
||||
|
||||
return Changed;
|
||||
return true;
|
||||
}
|
||||
|
Loading…
Reference in New Issue
Block a user