mirror of
https://github.com/capstone-engine/llvm-capstone.git
synced 2025-01-09 01:29:52 +00:00
[CodeExtractor] Factor out and reuse shrinkwrap analysis
Factor out CodeExtractor's analysis of allocas (for shrinkwrapping purposes), and allow the analysis to be reused. This resolves a quadratic compile-time bug observed when compiling AMDGPUDisassembler.cpp.o. Pre-patch (Release + LTO clang): ``` ---User Time--- --System Time-- --User+System-- ---Wall Time--- --- Name --- 176.5278 ( 57.8%) 0.4915 ( 18.5%) 177.0192 ( 57.4%) 177.4112 ( 57.3%) Hot Cold Splitting ``` Post-patch (ReleaseAsserts clang): ``` ---User Time--- --System Time-- --User+System-- ---Wall Time--- --- Name --- 1.4051 ( 3.3%) 0.0079 ( 0.3%) 1.4129 ( 3.2%) 1.4129 ( 3.2%) Hot Cold Splitting ``` Testing: check-llvm, and comparing the AMDGPUDisassembler.cpp.o binary pre- vs. post-patch. An alternate approach is to hide CodeExtractorAnalysisCache from clients of CodeExtractor, and to recompute the analysis from scratch inside of CodeExtractor::extractCodeRegion(). This eliminates some redundant work in the shrinkwrapping legality check. However, some clients continue to exhibit O(n^2) compile time behavior as computing the analysis is O(n). rdar://55912966 Differential Revision: https://reviews.llvm.org/D68616 llvm-svn: 374089
This commit is contained in:
parent
d8245e7a36
commit
9852699dcb
@ -23,6 +23,7 @@ class TargetTransformInfo;
|
||||
class OptimizationRemarkEmitter;
|
||||
class AssumptionCache;
|
||||
class DominatorTree;
|
||||
class CodeExtractorAnalysisCache;
|
||||
|
||||
/// A sequence of basic blocks.
|
||||
///
|
||||
@ -43,8 +44,10 @@ private:
|
||||
bool isFunctionCold(const Function &F) const;
|
||||
bool shouldOutlineFrom(const Function &F) const;
|
||||
bool outlineColdRegions(Function &F, bool HasProfileSummary);
|
||||
Function *extractColdRegion(const BlockSequence &Region, DominatorTree &DT,
|
||||
BlockFrequencyInfo *BFI, TargetTransformInfo &TTI,
|
||||
Function *extractColdRegion(const BlockSequence &Region,
|
||||
const CodeExtractorAnalysisCache &CEAC,
|
||||
DominatorTree &DT, BlockFrequencyInfo *BFI,
|
||||
TargetTransformInfo &TTI,
|
||||
OptimizationRemarkEmitter &ORE,
|
||||
AssumptionCache *AC, unsigned Count);
|
||||
ProfileSummaryInfo *PSI;
|
||||
|
@ -22,6 +22,7 @@
|
||||
|
||||
namespace llvm {
|
||||
|
||||
class AllocaInst;
|
||||
class BasicBlock;
|
||||
class BlockFrequency;
|
||||
class BlockFrequencyInfo;
|
||||
@ -36,6 +37,38 @@ class Module;
|
||||
class Type;
|
||||
class Value;
|
||||
|
||||
/// A cache for the CodeExtractor analysis. The operation \ref
|
||||
/// CodeExtractor::extractCodeRegion is guaranteed not to invalidate this
|
||||
/// object. This object should conservatively be considered invalid if any
|
||||
/// other mutating operations on the IR occur.
|
||||
///
|
||||
/// Constructing this object is O(n) in the size of the function.
|
||||
class CodeExtractorAnalysisCache {
|
||||
/// The allocas in the function.
|
||||
SmallVector<AllocaInst *, 16> Allocas;
|
||||
|
||||
/// Base memory addresses of load/store instructions, grouped by block.
|
||||
DenseMap<BasicBlock *, DenseSet<Value *>> BaseMemAddrs;
|
||||
|
||||
/// Blocks which contain instructions which may have unknown side-effects
|
||||
/// on memory.
|
||||
DenseSet<BasicBlock *> SideEffectingBlocks;
|
||||
|
||||
void findSideEffectInfoForBlock(BasicBlock &BB);
|
||||
|
||||
public:
|
||||
CodeExtractorAnalysisCache(Function &F);
|
||||
|
||||
/// Get the allocas in the function at the time the analysis was created.
|
||||
/// Note that some of these allocas may no longer be present in the function,
|
||||
/// due to \ref CodeExtractor::extractCodeRegion.
|
||||
ArrayRef<AllocaInst *> getAllocas() const { return Allocas; }
|
||||
|
||||
/// Check whether \p BB contains an instruction thought to load from, store
|
||||
/// to, or otherwise clobber the alloca \p Addr.
|
||||
bool doesBlockContainClobberOfAddr(BasicBlock &BB, AllocaInst *Addr) const;
|
||||
};
|
||||
|
||||
/// Utility class for extracting code into a new function.
|
||||
///
|
||||
/// This utility provides a simple interface for extracting some sequence of
|
||||
@ -104,7 +137,7 @@ class Value;
|
||||
///
|
||||
/// Returns zero when called on a CodeExtractor instance where isEligible
|
||||
/// returns false.
|
||||
Function *extractCodeRegion();
|
||||
Function *extractCodeRegion(const CodeExtractorAnalysisCache &CEAC);
|
||||
|
||||
/// Verify that assumption cache isn't stale after a region is extracted.
|
||||
/// Returns false when verifier finds errors. AssumptionCache is passed as
|
||||
@ -135,7 +168,9 @@ class Value;
|
||||
/// region.
|
||||
///
|
||||
/// Returns true if it is safe to do the code motion.
|
||||
bool isLegalToShrinkwrapLifetimeMarkers(Instruction *AllocaAddr) const;
|
||||
bool
|
||||
isLegalToShrinkwrapLifetimeMarkers(const CodeExtractorAnalysisCache &CEAC,
|
||||
Instruction *AllocaAddr) const;
|
||||
|
||||
/// Find the set of allocas whose life ranges are contained within the
|
||||
/// outlined region.
|
||||
@ -145,7 +180,8 @@ class Value;
|
||||
/// are used by the lifetime markers are also candidates for shrink-
|
||||
/// wrapping. The instructions that need to be sunk are collected in
|
||||
/// 'Allocas'.
|
||||
void findAllocas(ValueSet &SinkCands, ValueSet &HoistCands,
|
||||
void findAllocas(const CodeExtractorAnalysisCache &CEAC,
|
||||
ValueSet &SinkCands, ValueSet &HoistCands,
|
||||
BasicBlock *&ExitBlock) const;
|
||||
|
||||
/// Find or create a block within the outline region for placing hoisted
|
||||
@ -166,8 +202,9 @@ class Value;
|
||||
Instruction *LifeEnd = nullptr;
|
||||
};
|
||||
|
||||
LifetimeMarkerInfo getLifetimeMarkers(Instruction *Addr,
|
||||
BasicBlock *ExitBlock) const;
|
||||
LifetimeMarkerInfo
|
||||
getLifetimeMarkers(const CodeExtractorAnalysisCache &CEAC,
|
||||
Instruction *Addr, BasicBlock *ExitBlock) const;
|
||||
|
||||
void severSplitPHINodesOfEntry(BasicBlock *&Header);
|
||||
void severSplitPHINodesOfExits(const SmallPtrSetImpl<BasicBlock *> &Exits);
|
||||
|
@ -206,7 +206,8 @@ bool BlockExtractor::runOnModule(Module &M) {
|
||||
++NumExtracted;
|
||||
Changed = true;
|
||||
}
|
||||
Function *F = CodeExtractor(BlocksToExtractVec).extractCodeRegion();
|
||||
CodeExtractorAnalysisCache CEAC(*BBs[0]->getParent());
|
||||
Function *F = CodeExtractor(BlocksToExtractVec).extractCodeRegion(CEAC);
|
||||
if (F)
|
||||
LLVM_DEBUG(dbgs() << "Extracted group '" << (*BBs.begin())->getName()
|
||||
<< "' in: " << F->getName() << '\n');
|
||||
|
@ -290,13 +290,10 @@ static int getOutliningPenalty(ArrayRef<BasicBlock *> Region,
|
||||
return Penalty;
|
||||
}
|
||||
|
||||
Function *HotColdSplitting::extractColdRegion(const BlockSequence &Region,
|
||||
DominatorTree &DT,
|
||||
BlockFrequencyInfo *BFI,
|
||||
TargetTransformInfo &TTI,
|
||||
OptimizationRemarkEmitter &ORE,
|
||||
AssumptionCache *AC,
|
||||
unsigned Count) {
|
||||
Function *HotColdSplitting::extractColdRegion(
|
||||
const BlockSequence &Region, const CodeExtractorAnalysisCache &CEAC,
|
||||
DominatorTree &DT, BlockFrequencyInfo *BFI, TargetTransformInfo &TTI,
|
||||
OptimizationRemarkEmitter &ORE, AssumptionCache *AC, unsigned Count) {
|
||||
assert(!Region.empty());
|
||||
|
||||
// TODO: Pass BFI and BPI to update profile information.
|
||||
@ -318,7 +315,7 @@ Function *HotColdSplitting::extractColdRegion(const BlockSequence &Region,
|
||||
return nullptr;
|
||||
|
||||
Function *OrigF = Region[0]->getParent();
|
||||
if (Function *OutF = CE.extractCodeRegion()) {
|
||||
if (Function *OutF = CE.extractCodeRegion(CEAC)) {
|
||||
User *U = *OutF->user_begin();
|
||||
CallInst *CI = cast<CallInst>(U);
|
||||
CallSite CS(CI);
|
||||
@ -606,9 +603,14 @@ bool HotColdSplitting::outlineColdRegions(Function &F, bool HasProfileSummary) {
|
||||
}
|
||||
}
|
||||
|
||||
if (OutliningWorklist.empty())
|
||||
return Changed;
|
||||
|
||||
// Outline single-entry cold regions, splitting up larger regions as needed.
|
||||
unsigned OutlinedFunctionID = 1;
|
||||
while (!OutliningWorklist.empty()) {
|
||||
// Cache and recycle the CodeExtractor analysis to avoid O(n^2) compile-time.
|
||||
CodeExtractorAnalysisCache CEAC(F);
|
||||
do {
|
||||
OutliningRegion Region = OutliningWorklist.pop_back_val();
|
||||
assert(!Region.empty() && "Empty outlining region in worklist");
|
||||
do {
|
||||
@ -619,14 +621,14 @@ bool HotColdSplitting::outlineColdRegions(Function &F, bool HasProfileSummary) {
|
||||
BB->dump();
|
||||
});
|
||||
|
||||
Function *Outlined = extractColdRegion(SubRegion, *DT, BFI, TTI, ORE, AC,
|
||||
OutlinedFunctionID);
|
||||
Function *Outlined = extractColdRegion(SubRegion, CEAC, *DT, BFI, TTI,
|
||||
ORE, AC, OutlinedFunctionID);
|
||||
if (Outlined) {
|
||||
++OutlinedFunctionID;
|
||||
Changed = true;
|
||||
}
|
||||
} while (!Region.empty());
|
||||
}
|
||||
} while (!OutliningWorklist.empty());
|
||||
|
||||
return Changed;
|
||||
}
|
||||
|
@ -141,10 +141,12 @@ bool LoopExtractor::runOnLoop(Loop *L, LPPassManager &LPM) {
|
||||
if (NumLoops == 0) return Changed;
|
||||
--NumLoops;
|
||||
AssumptionCache *AC = nullptr;
|
||||
Function &Func = *L->getHeader()->getParent();
|
||||
if (auto *ACT = getAnalysisIfAvailable<AssumptionCacheTracker>())
|
||||
AC = ACT->lookupAssumptionCache(*L->getHeader()->getParent());
|
||||
AC = ACT->lookupAssumptionCache(Func);
|
||||
CodeExtractorAnalysisCache CEAC(Func);
|
||||
CodeExtractor Extractor(DT, *L, false, nullptr, nullptr, AC);
|
||||
if (Extractor.extractCodeRegion() != nullptr) {
|
||||
if (Extractor.extractCodeRegion(CEAC) != nullptr) {
|
||||
Changed = true;
|
||||
// After extraction, the loop is replaced by a function call, so
|
||||
// we shouldn't try to run any more loop passes on it.
|
||||
|
@ -1122,6 +1122,9 @@ bool PartialInlinerImpl::FunctionCloner::doMultiRegionFunctionOutlining() {
|
||||
BranchProbabilityInfo BPI(*ClonedFunc, LI);
|
||||
ClonedFuncBFI.reset(new BlockFrequencyInfo(*ClonedFunc, BPI, LI));
|
||||
|
||||
// Cache and recycle the CodeExtractor analysis to avoid O(n^2) compile-time.
|
||||
CodeExtractorAnalysisCache CEAC(*ClonedFunc);
|
||||
|
||||
SetVector<Value *> Inputs, Outputs, Sinks;
|
||||
for (FunctionOutliningMultiRegionInfo::OutlineRegionInfo RegionInfo :
|
||||
ClonedOMRI->ORI) {
|
||||
@ -1148,7 +1151,7 @@ bool PartialInlinerImpl::FunctionCloner::doMultiRegionFunctionOutlining() {
|
||||
if (Outputs.size() > 0 && !ForceLiveExit)
|
||||
continue;
|
||||
|
||||
Function *OutlinedFunc = CE.extractCodeRegion();
|
||||
Function *OutlinedFunc = CE.extractCodeRegion(CEAC);
|
||||
|
||||
if (OutlinedFunc) {
|
||||
CallSite OCS = PartialInlinerImpl::getOneCallSiteTo(OutlinedFunc);
|
||||
@ -1210,11 +1213,12 @@ PartialInlinerImpl::FunctionCloner::doSingleRegionFunctionOutlining() {
|
||||
}
|
||||
|
||||
// Extract the body of the if.
|
||||
CodeExtractorAnalysisCache CEAC(*ClonedFunc);
|
||||
Function *OutlinedFunc =
|
||||
CodeExtractor(ToExtract, &DT, /*AggregateArgs*/ false,
|
||||
ClonedFuncBFI.get(), &BPI, LookupAC(*ClonedFunc),
|
||||
/* AllowVarargs */ true)
|
||||
.extractCodeRegion();
|
||||
.extractCodeRegion(CEAC);
|
||||
|
||||
if (OutlinedFunc) {
|
||||
BasicBlock *OutliningCallBB =
|
||||
|
@ -305,52 +305,79 @@ static BasicBlock *getCommonExitBlock(const SetVector<BasicBlock *> &Blocks) {
|
||||
return CommonExitBlock;
|
||||
}
|
||||
|
||||
CodeExtractorAnalysisCache::CodeExtractorAnalysisCache(Function &F) {
|
||||
for (BasicBlock &BB : F) {
|
||||
for (Instruction &II : BB.instructionsWithoutDebug())
|
||||
if (auto *AI = dyn_cast<AllocaInst>(&II))
|
||||
Allocas.push_back(AI);
|
||||
|
||||
findSideEffectInfoForBlock(BB);
|
||||
}
|
||||
}
|
||||
|
||||
void CodeExtractorAnalysisCache::findSideEffectInfoForBlock(BasicBlock &BB) {
|
||||
for (Instruction &II : BB.instructionsWithoutDebug()) {
|
||||
unsigned Opcode = II.getOpcode();
|
||||
Value *MemAddr = nullptr;
|
||||
switch (Opcode) {
|
||||
case Instruction::Store:
|
||||
case Instruction::Load: {
|
||||
if (Opcode == Instruction::Store) {
|
||||
StoreInst *SI = cast<StoreInst>(&II);
|
||||
MemAddr = SI->getPointerOperand();
|
||||
} else {
|
||||
LoadInst *LI = cast<LoadInst>(&II);
|
||||
MemAddr = LI->getPointerOperand();
|
||||
}
|
||||
// Global variable can not be aliased with locals.
|
||||
if (dyn_cast<Constant>(MemAddr))
|
||||
break;
|
||||
Value *Base = MemAddr->stripInBoundsConstantOffsets();
|
||||
if (!isa<AllocaInst>(Base)) {
|
||||
SideEffectingBlocks.insert(&BB);
|
||||
return;
|
||||
}
|
||||
BaseMemAddrs[&BB].insert(Base);
|
||||
break;
|
||||
}
|
||||
default: {
|
||||
IntrinsicInst *IntrInst = dyn_cast<IntrinsicInst>(&II);
|
||||
if (IntrInst) {
|
||||
if (IntrInst->isLifetimeStartOrEnd())
|
||||
break;
|
||||
SideEffectingBlocks.insert(&BB);
|
||||
return;
|
||||
}
|
||||
// Treat all the other cases conservatively if it has side effects.
|
||||
if (II.mayHaveSideEffects()) {
|
||||
SideEffectingBlocks.insert(&BB);
|
||||
return;
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
bool CodeExtractorAnalysisCache::doesBlockContainClobberOfAddr(
|
||||
BasicBlock &BB, AllocaInst *Addr) const {
|
||||
if (SideEffectingBlocks.count(&BB))
|
||||
return true;
|
||||
auto It = BaseMemAddrs.find(&BB);
|
||||
if (It != BaseMemAddrs.end())
|
||||
return It->second.count(Addr);
|
||||
return false;
|
||||
}
|
||||
|
||||
bool CodeExtractor::isLegalToShrinkwrapLifetimeMarkers(
|
||||
Instruction *Addr) const {
|
||||
const CodeExtractorAnalysisCache &CEAC, Instruction *Addr) const {
|
||||
AllocaInst *AI = cast<AllocaInst>(Addr->stripInBoundsConstantOffsets());
|
||||
Function *Func = (*Blocks.begin())->getParent();
|
||||
for (BasicBlock &BB : *Func) {
|
||||
if (Blocks.count(&BB))
|
||||
continue;
|
||||
for (Instruction &II : BB) {
|
||||
if (isa<DbgInfoIntrinsic>(II))
|
||||
continue;
|
||||
|
||||
unsigned Opcode = II.getOpcode();
|
||||
Value *MemAddr = nullptr;
|
||||
switch (Opcode) {
|
||||
case Instruction::Store:
|
||||
case Instruction::Load: {
|
||||
if (Opcode == Instruction::Store) {
|
||||
StoreInst *SI = cast<StoreInst>(&II);
|
||||
MemAddr = SI->getPointerOperand();
|
||||
} else {
|
||||
LoadInst *LI = cast<LoadInst>(&II);
|
||||
MemAddr = LI->getPointerOperand();
|
||||
}
|
||||
// Global variable can not be aliased with locals.
|
||||
if (dyn_cast<Constant>(MemAddr))
|
||||
break;
|
||||
Value *Base = MemAddr->stripInBoundsConstantOffsets();
|
||||
if (!isa<AllocaInst>(Base) || Base == AI)
|
||||
return false;
|
||||
break;
|
||||
}
|
||||
default: {
|
||||
IntrinsicInst *IntrInst = dyn_cast<IntrinsicInst>(&II);
|
||||
if (IntrInst) {
|
||||
if (IntrInst->isLifetimeStartOrEnd())
|
||||
break;
|
||||
return false;
|
||||
}
|
||||
// Treat all the other cases conservatively if it has side effects.
|
||||
if (II.mayHaveSideEffects())
|
||||
return false;
|
||||
}
|
||||
}
|
||||
}
|
||||
if (CEAC.doesBlockContainClobberOfAddr(BB, AI))
|
||||
return false;
|
||||
}
|
||||
|
||||
return true;
|
||||
}
|
||||
|
||||
@ -413,7 +440,8 @@ CodeExtractor::findOrCreateBlockForHoisting(BasicBlock *CommonExitBlock) {
|
||||
// outline region. If there are not other untracked uses of the address, return
|
||||
// the pair of markers if found; otherwise return a pair of nullptr.
|
||||
CodeExtractor::LifetimeMarkerInfo
|
||||
CodeExtractor::getLifetimeMarkers(Instruction *Addr,
|
||||
CodeExtractor::getLifetimeMarkers(const CodeExtractorAnalysisCache &CEAC,
|
||||
Instruction *Addr,
|
||||
BasicBlock *ExitBlock) const {
|
||||
LifetimeMarkerInfo Info;
|
||||
|
||||
@ -445,7 +473,7 @@ CodeExtractor::getLifetimeMarkers(Instruction *Addr,
|
||||
Info.HoistLifeEnd = !definedInRegion(Blocks, Info.LifeEnd);
|
||||
// Do legality check.
|
||||
if ((Info.SinkLifeStart || Info.HoistLifeEnd) &&
|
||||
!isLegalToShrinkwrapLifetimeMarkers(Addr))
|
||||
!isLegalToShrinkwrapLifetimeMarkers(CEAC, Addr))
|
||||
return {};
|
||||
|
||||
// Check to see if we have a place to do hoisting, if not, bail.
|
||||
@ -455,7 +483,8 @@ CodeExtractor::getLifetimeMarkers(Instruction *Addr,
|
||||
return Info;
|
||||
}
|
||||
|
||||
void CodeExtractor::findAllocas(ValueSet &SinkCands, ValueSet &HoistCands,
|
||||
void CodeExtractor::findAllocas(const CodeExtractorAnalysisCache &CEAC,
|
||||
ValueSet &SinkCands, ValueSet &HoistCands,
|
||||
BasicBlock *&ExitBlock) const {
|
||||
Function *Func = (*Blocks.begin())->getParent();
|
||||
ExitBlock = getCommonExitBlock(Blocks);
|
||||
@ -476,61 +505,65 @@ void CodeExtractor::findAllocas(ValueSet &SinkCands, ValueSet &HoistCands,
|
||||
return true;
|
||||
};
|
||||
|
||||
for (BasicBlock &BB : *Func) {
|
||||
if (Blocks.count(&BB))
|
||||
// Look up allocas in the original function in CodeExtractorAnalysisCache, as
|
||||
// this is much faster than walking all the instructions.
|
||||
for (AllocaInst *AI : CEAC.getAllocas()) {
|
||||
BasicBlock *BB = AI->getParent();
|
||||
if (Blocks.count(BB))
|
||||
continue;
|
||||
for (Instruction &II : BB) {
|
||||
auto *AI = dyn_cast<AllocaInst>(&II);
|
||||
if (!AI)
|
||||
continue;
|
||||
|
||||
LifetimeMarkerInfo MarkerInfo = getLifetimeMarkers(AI, ExitBlock);
|
||||
bool Moved = moveOrIgnoreLifetimeMarkers(MarkerInfo);
|
||||
if (Moved) {
|
||||
LLVM_DEBUG(dbgs() << "Sinking alloca: " << *AI << "\n");
|
||||
SinkCands.insert(AI);
|
||||
continue;
|
||||
}
|
||||
// As a prior call to extractCodeRegion() may have shrinkwrapped the alloca,
|
||||
// check whether it is actually still in the original function.
|
||||
Function *AIFunc = BB->getParent();
|
||||
if (AIFunc != Func)
|
||||
continue;
|
||||
|
||||
// Follow any bitcasts.
|
||||
SmallVector<Instruction *, 2> Bitcasts;
|
||||
SmallVector<LifetimeMarkerInfo, 2> BitcastLifetimeInfo;
|
||||
for (User *U : AI->users()) {
|
||||
if (U->stripInBoundsConstantOffsets() == AI) {
|
||||
Instruction *Bitcast = cast<Instruction>(U);
|
||||
LifetimeMarkerInfo LMI = getLifetimeMarkers(Bitcast, ExitBlock);
|
||||
if (LMI.LifeStart) {
|
||||
Bitcasts.push_back(Bitcast);
|
||||
BitcastLifetimeInfo.push_back(LMI);
|
||||
continue;
|
||||
}
|
||||
}
|
||||
|
||||
// Found unknown use of AI.
|
||||
if (!definedInRegion(Blocks, U)) {
|
||||
Bitcasts.clear();
|
||||
break;
|
||||
}
|
||||
}
|
||||
|
||||
// Either no bitcasts reference the alloca or there are unknown uses.
|
||||
if (Bitcasts.empty())
|
||||
continue;
|
||||
|
||||
LLVM_DEBUG(dbgs() << "Sinking alloca (via bitcast): " << *AI << "\n");
|
||||
LifetimeMarkerInfo MarkerInfo = getLifetimeMarkers(CEAC, AI, ExitBlock);
|
||||
bool Moved = moveOrIgnoreLifetimeMarkers(MarkerInfo);
|
||||
if (Moved) {
|
||||
LLVM_DEBUG(dbgs() << "Sinking alloca: " << *AI << "\n");
|
||||
SinkCands.insert(AI);
|
||||
for (unsigned I = 0, E = Bitcasts.size(); I != E; ++I) {
|
||||
Instruction *BitcastAddr = Bitcasts[I];
|
||||
const LifetimeMarkerInfo &LMI = BitcastLifetimeInfo[I];
|
||||
assert(LMI.LifeStart &&
|
||||
"Unsafe to sink bitcast without lifetime markers");
|
||||
moveOrIgnoreLifetimeMarkers(LMI);
|
||||
if (!definedInRegion(Blocks, BitcastAddr)) {
|
||||
LLVM_DEBUG(dbgs() << "Sinking bitcast-of-alloca: " << *BitcastAddr
|
||||
<< "\n");
|
||||
SinkCands.insert(BitcastAddr);
|
||||
continue;
|
||||
}
|
||||
|
||||
// Follow any bitcasts.
|
||||
SmallVector<Instruction *, 2> Bitcasts;
|
||||
SmallVector<LifetimeMarkerInfo, 2> BitcastLifetimeInfo;
|
||||
for (User *U : AI->users()) {
|
||||
if (U->stripInBoundsConstantOffsets() == AI) {
|
||||
Instruction *Bitcast = cast<Instruction>(U);
|
||||
LifetimeMarkerInfo LMI = getLifetimeMarkers(CEAC, Bitcast, ExitBlock);
|
||||
if (LMI.LifeStart) {
|
||||
Bitcasts.push_back(Bitcast);
|
||||
BitcastLifetimeInfo.push_back(LMI);
|
||||
continue;
|
||||
}
|
||||
}
|
||||
|
||||
// Found unknown use of AI.
|
||||
if (!definedInRegion(Blocks, U)) {
|
||||
Bitcasts.clear();
|
||||
break;
|
||||
}
|
||||
}
|
||||
|
||||
// Either no bitcasts reference the alloca or there are unknown uses.
|
||||
if (Bitcasts.empty())
|
||||
continue;
|
||||
|
||||
LLVM_DEBUG(dbgs() << "Sinking alloca (via bitcast): " << *AI << "\n");
|
||||
SinkCands.insert(AI);
|
||||
for (unsigned I = 0, E = Bitcasts.size(); I != E; ++I) {
|
||||
Instruction *BitcastAddr = Bitcasts[I];
|
||||
const LifetimeMarkerInfo &LMI = BitcastLifetimeInfo[I];
|
||||
assert(LMI.LifeStart &&
|
||||
"Unsafe to sink bitcast without lifetime markers");
|
||||
moveOrIgnoreLifetimeMarkers(LMI);
|
||||
if (!definedInRegion(Blocks, BitcastAddr)) {
|
||||
LLVM_DEBUG(dbgs() << "Sinking bitcast-of-alloca: " << *BitcastAddr
|
||||
<< "\n");
|
||||
SinkCands.insert(BitcastAddr);
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
@ -1349,7 +1382,8 @@ void CodeExtractor::calculateNewCallTerminatorWeights(
|
||||
MDBuilder(TI->getContext()).createBranchWeights(BranchWeights));
|
||||
}
|
||||
|
||||
Function *CodeExtractor::extractCodeRegion() {
|
||||
Function *
|
||||
CodeExtractor::extractCodeRegion(const CodeExtractorAnalysisCache &CEAC) {
|
||||
if (!isEligible())
|
||||
return nullptr;
|
||||
|
||||
@ -1435,7 +1469,7 @@ Function *CodeExtractor::extractCodeRegion() {
|
||||
|
||||
ValueSet inputs, outputs, SinkingCands, HoistingCands;
|
||||
BasicBlock *CommonExit = nullptr;
|
||||
findAllocas(SinkingCands, HoistingCands, CommonExit);
|
||||
findAllocas(CEAC, SinkingCands, HoistingCands, CommonExit);
|
||||
assert(HoistingCands.empty() || CommonExit);
|
||||
|
||||
// Find inputs to, outputs from the code region.
|
||||
|
@ -62,7 +62,8 @@ TEST(CodeExtractor, ExitStub) {
|
||||
CodeExtractor CE(Candidates);
|
||||
EXPECT_TRUE(CE.isEligible());
|
||||
|
||||
Function *Outlined = CE.extractCodeRegion();
|
||||
CodeExtractorAnalysisCache CEAC(*Func);
|
||||
Function *Outlined = CE.extractCodeRegion(CEAC);
|
||||
EXPECT_TRUE(Outlined);
|
||||
BasicBlock *Exit = getBlockByName(Func, "notExtracted");
|
||||
BasicBlock *ExitSplit = getBlockByName(Outlined, "notExtracted.split");
|
||||
@ -112,7 +113,8 @@ TEST(CodeExtractor, ExitPHIOnePredFromRegion) {
|
||||
CodeExtractor CE(ExtractedBlocks);
|
||||
EXPECT_TRUE(CE.isEligible());
|
||||
|
||||
Function *Outlined = CE.extractCodeRegion();
|
||||
CodeExtractorAnalysisCache CEAC(*Func);
|
||||
Function *Outlined = CE.extractCodeRegion(CEAC);
|
||||
EXPECT_TRUE(Outlined);
|
||||
BasicBlock *Exit1 = getBlockByName(Func, "exit1");
|
||||
BasicBlock *Exit2 = getBlockByName(Func, "exit2");
|
||||
@ -186,7 +188,8 @@ TEST(CodeExtractor, StoreOutputInvokeResultAfterEHPad) {
|
||||
CodeExtractor CE(ExtractedBlocks);
|
||||
EXPECT_TRUE(CE.isEligible());
|
||||
|
||||
Function *Outlined = CE.extractCodeRegion();
|
||||
CodeExtractorAnalysisCache CEAC(*Func);
|
||||
Function *Outlined = CE.extractCodeRegion(CEAC);
|
||||
EXPECT_TRUE(Outlined);
|
||||
EXPECT_FALSE(verifyFunction(*Outlined, &errs()));
|
||||
EXPECT_FALSE(verifyFunction(*Func, &errs()));
|
||||
@ -220,7 +223,8 @@ TEST(CodeExtractor, StoreOutputInvokeResultInExitStub) {
|
||||
CodeExtractor CE(Blocks);
|
||||
EXPECT_TRUE(CE.isEligible());
|
||||
|
||||
Function *Outlined = CE.extractCodeRegion();
|
||||
CodeExtractorAnalysisCache CEAC(*Func);
|
||||
Function *Outlined = CE.extractCodeRegion(CEAC);
|
||||
EXPECT_TRUE(Outlined);
|
||||
EXPECT_FALSE(verifyFunction(*Outlined));
|
||||
EXPECT_FALSE(verifyFunction(*Func));
|
||||
@ -271,7 +275,8 @@ TEST(CodeExtractor, ExtractAndInvalidateAssumptionCache) {
|
||||
CodeExtractor CE(Blocks, nullptr, false, nullptr, nullptr, &AC);
|
||||
EXPECT_TRUE(CE.isEligible());
|
||||
|
||||
Function *Outlined = CE.extractCodeRegion();
|
||||
CodeExtractorAnalysisCache CEAC(*Func);
|
||||
Function *Outlined = CE.extractCodeRegion(CEAC);
|
||||
EXPECT_TRUE(Outlined);
|
||||
EXPECT_FALSE(verifyFunction(*Outlined));
|
||||
EXPECT_FALSE(verifyFunction(*Func));
|
||||
|
Loading…
Reference in New Issue
Block a user