mirror of
https://github.com/RPCSX/llvm.git
synced 2025-01-17 18:03:49 +00:00
[NVPTX] fix a crash bug in NVPTXFavorNonGenericAddrSpaces
Summary: We used to assume V->RAUW only modifies the operand list of V's user. However, if V and V's user are Constants, RAUW may replace and invalidate V's user entirely. This patch fixes the above issue by letting the caller replace the operand instead of calling RAUW on Constants. Test Plan: @nested_const_expr and @rauw in access-non-generic.ll Reviewers: broune, jholewinski Reviewed By: broune, jholewinski Subscribers: jholewinski, llvm-commits Differential Revision: http://reviews.llvm.org/D10345 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@239435 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
parent
1d815cac84
commit
95355e6498
@ -98,15 +98,14 @@ private:
|
||||
/// This reordering exposes to optimizeMemoryInstruction more
|
||||
/// optimization opportunities on loads and stores.
|
||||
///
|
||||
/// Returns true if this function succesfully hoists an eliminable
|
||||
/// addrspacecast or V is already such an addrspacecast.
|
||||
/// Transforms "gep (addrspacecast X), indices" into "addrspacecast (gep X,
|
||||
/// indices)".
|
||||
bool hoistAddrSpaceCastFrom(Value *V, int Depth = 0);
|
||||
/// If this function succesfully hoists an eliminable addrspacecast or V is
|
||||
/// already such an addrspacecast, it returns the transformed value (which is
|
||||
/// guaranteed to be an addrspacecast); otherwise, it returns nullptr.
|
||||
Value *hoistAddrSpaceCastFrom(Value *V, int Depth = 0);
|
||||
/// Helper function for GEPs.
|
||||
bool hoistAddrSpaceCastFromGEP(GEPOperator *GEP, int Depth);
|
||||
Value *hoistAddrSpaceCastFromGEP(GEPOperator *GEP, int Depth);
|
||||
/// Helper function for bitcasts.
|
||||
bool hoistAddrSpaceCastFromBitCast(BitCastOperator *BC, int Depth);
|
||||
Value *hoistAddrSpaceCastFromBitCast(BitCastOperator *BC, int Depth);
|
||||
};
|
||||
}
|
||||
|
||||
@ -143,17 +142,19 @@ static bool isEliminableAddrSpaceCast(Value *V) {
|
||||
DestTy->getAddressSpace() == AddressSpace::ADDRESS_SPACE_GENERIC);
|
||||
}
|
||||
|
||||
bool NVPTXFavorNonGenericAddrSpaces::hoistAddrSpaceCastFromGEP(GEPOperator *GEP,
|
||||
int Depth) {
|
||||
if (!hoistAddrSpaceCastFrom(GEP->getPointerOperand(), Depth + 1))
|
||||
return false;
|
||||
Value *NVPTXFavorNonGenericAddrSpaces::hoistAddrSpaceCastFromGEP(
|
||||
GEPOperator *GEP, int Depth) {
|
||||
Value *NewOperand =
|
||||
hoistAddrSpaceCastFrom(GEP->getPointerOperand(), Depth + 1);
|
||||
if (NewOperand == nullptr)
|
||||
return nullptr;
|
||||
|
||||
// That hoistAddrSpaceCastFrom succeeds implies GEP's pointer operand is now
|
||||
// an eliminable addrspacecast.
|
||||
assert(isEliminableAddrSpaceCast(GEP->getPointerOperand()));
|
||||
Operator *Cast = cast<Operator>(GEP->getPointerOperand());
|
||||
// hoistAddrSpaceCastFrom returns an eliminable addrspacecast or nullptr.
|
||||
assert(isEliminableAddrSpaceCast(NewOperand));
|
||||
Operator *Cast = cast<Operator>(NewOperand);
|
||||
|
||||
SmallVector<Value *, 8> Indices(GEP->idx_begin(), GEP->idx_end());
|
||||
Value *NewASC;
|
||||
if (Instruction *GEPI = dyn_cast<Instruction>(GEP)) {
|
||||
// GEP = gep (addrspacecast X), indices
|
||||
// =>
|
||||
@ -163,30 +164,31 @@ bool NVPTXFavorNonGenericAddrSpaces::hoistAddrSpaceCastFromGEP(GEPOperator *GEP,
|
||||
GEP->getSourceElementType(), Cast->getOperand(0), Indices,
|
||||
"", GEPI);
|
||||
NewGEP->setIsInBounds(GEP->isInBounds());
|
||||
Value *NewASC = new AddrSpaceCastInst(NewGEP, GEP->getType(), "", GEPI);
|
||||
NewASC = new AddrSpaceCastInst(NewGEP, GEP->getType(), "", GEPI);
|
||||
NewASC->takeName(GEP);
|
||||
// Without RAUWing GEP, the compiler would visit GEP again and emit
|
||||
// redundant instructions. This is exercised in test @rauw in
|
||||
// access-non-generic.ll.
|
||||
GEP->replaceAllUsesWith(NewASC);
|
||||
} else {
|
||||
// GEP is a constant expression.
|
||||
Constant *NewGEP = ConstantExpr::getGetElementPtr(
|
||||
GEP->getSourceElementType(), cast<Constant>(Cast->getOperand(0)),
|
||||
Indices, GEP->isInBounds());
|
||||
GEP->replaceAllUsesWith(
|
||||
ConstantExpr::getAddrSpaceCast(NewGEP, GEP->getType()));
|
||||
NewASC = ConstantExpr::getAddrSpaceCast(NewGEP, GEP->getType());
|
||||
}
|
||||
|
||||
return true;
|
||||
return NewASC;
|
||||
}
|
||||
|
||||
bool NVPTXFavorNonGenericAddrSpaces::hoistAddrSpaceCastFromBitCast(
|
||||
Value *NVPTXFavorNonGenericAddrSpaces::hoistAddrSpaceCastFromBitCast(
|
||||
BitCastOperator *BC, int Depth) {
|
||||
if (!hoistAddrSpaceCastFrom(BC->getOperand(0), Depth + 1))
|
||||
return false;
|
||||
Value *NewOperand = hoistAddrSpaceCastFrom(BC->getOperand(0), Depth + 1);
|
||||
if (NewOperand == nullptr)
|
||||
return nullptr;
|
||||
|
||||
// That hoistAddrSpaceCastFrom succeeds implies BC's source operand is now
|
||||
// an eliminable addrspacecast.
|
||||
assert(isEliminableAddrSpaceCast(BC->getOperand(0)));
|
||||
Operator *Cast = cast<Operator>(BC->getOperand(0));
|
||||
// hoistAddrSpaceCastFrom returns an eliminable addrspacecast or nullptr.
|
||||
assert(isEliminableAddrSpaceCast(NewOperand));
|
||||
Operator *Cast = cast<Operator>(NewOperand);
|
||||
|
||||
// Cast = addrspacecast Src
|
||||
// BC = bitcast Cast
|
||||
@ -197,31 +199,34 @@ bool NVPTXFavorNonGenericAddrSpaces::hoistAddrSpaceCastFromBitCast(
|
||||
Type *TypeOfNewCast =
|
||||
PointerType::get(BC->getType()->getPointerElementType(),
|
||||
Src->getType()->getPointerAddressSpace());
|
||||
Value *NewBC;
|
||||
if (BitCastInst *BCI = dyn_cast<BitCastInst>(BC)) {
|
||||
Value *NewCast = new BitCastInst(Src, TypeOfNewCast, "", BCI);
|
||||
Value *NewBC = new AddrSpaceCastInst(NewCast, BC->getType(), "", BCI);
|
||||
NewBC = new AddrSpaceCastInst(NewCast, BC->getType(), "", BCI);
|
||||
NewBC->takeName(BC);
|
||||
// Without RAUWing BC, the compiler would visit BC again and emit
|
||||
// redundant instructions. This is exercised in test @rauw in
|
||||
// access-non-generic.ll.
|
||||
BC->replaceAllUsesWith(NewBC);
|
||||
} else {
|
||||
// BC is a constant expression.
|
||||
Constant *NewCast =
|
||||
ConstantExpr::getBitCast(cast<Constant>(Src), TypeOfNewCast);
|
||||
Constant *NewBC = ConstantExpr::getAddrSpaceCast(NewCast, BC->getType());
|
||||
BC->replaceAllUsesWith(NewBC);
|
||||
NewBC = ConstantExpr::getAddrSpaceCast(NewCast, BC->getType());
|
||||
}
|
||||
return true;
|
||||
return NewBC;
|
||||
}
|
||||
|
||||
bool NVPTXFavorNonGenericAddrSpaces::hoistAddrSpaceCastFrom(Value *V,
|
||||
int Depth) {
|
||||
// Returns true if V is already an eliminable addrspacecast.
|
||||
Value *NVPTXFavorNonGenericAddrSpaces::hoistAddrSpaceCastFrom(Value *V,
|
||||
int Depth) {
|
||||
// Returns V if V is already an eliminable addrspacecast.
|
||||
if (isEliminableAddrSpaceCast(V))
|
||||
return true;
|
||||
return V;
|
||||
|
||||
// Limit the depth to prevent this recursive function from running too long.
|
||||
const int MaxDepth = 20;
|
||||
if (Depth >= MaxDepth)
|
||||
return false;
|
||||
return nullptr;
|
||||
|
||||
// If V is a GEP or bitcast, hoist the addrspacecast if any from its pointer
|
||||
// operand. This enables optimizeMemoryInstruction to shortcut addrspacecasts
|
||||
@ -232,28 +237,29 @@ bool NVPTXFavorNonGenericAddrSpaces::hoistAddrSpaceCastFrom(Value *V,
|
||||
if (BitCastOperator *BC = dyn_cast<BitCastOperator>(V))
|
||||
return hoistAddrSpaceCastFromBitCast(BC, Depth);
|
||||
|
||||
return false;
|
||||
return nullptr;
|
||||
}
|
||||
|
||||
bool NVPTXFavorNonGenericAddrSpaces::optimizeMemoryInstruction(Instruction *MI,
|
||||
unsigned Idx) {
|
||||
if (hoistAddrSpaceCastFrom(MI->getOperand(Idx))) {
|
||||
// load/store (addrspacecast X) => load/store X if shortcutting the
|
||||
// addrspacecast is valid and can improve performance.
|
||||
//
|
||||
// e.g.,
|
||||
// %1 = addrspacecast float addrspace(3)* %0 to float*
|
||||
// %2 = load float* %1
|
||||
// ->
|
||||
// %2 = load float addrspace(3)* %0
|
||||
//
|
||||
// Note: the addrspacecast can also be a constant expression.
|
||||
assert(isEliminableAddrSpaceCast(MI->getOperand(Idx)));
|
||||
Operator *ASC = dyn_cast<Operator>(MI->getOperand(Idx));
|
||||
MI->setOperand(Idx, ASC->getOperand(0));
|
||||
return true;
|
||||
}
|
||||
return false;
|
||||
Value *NewOperand = hoistAddrSpaceCastFrom(MI->getOperand(Idx));
|
||||
if (NewOperand == nullptr)
|
||||
return false;
|
||||
|
||||
// load/store (addrspacecast X) => load/store X if shortcutting the
|
||||
// addrspacecast is valid and can improve performance.
|
||||
//
|
||||
// e.g.,
|
||||
// %1 = addrspacecast float addrspace(3)* %0 to float*
|
||||
// %2 = load float* %1
|
||||
// ->
|
||||
// %2 = load float addrspace(3)* %0
|
||||
//
|
||||
// Note: the addrspacecast can also be a constant expression.
|
||||
assert(isEliminableAddrSpaceCast(NewOperand));
|
||||
Operator *ASC = dyn_cast<Operator>(NewOperand);
|
||||
MI->setOperand(Idx, ASC->getOperand(0));
|
||||
return true;
|
||||
}
|
||||
|
||||
bool NVPTXFavorNonGenericAddrSpaces::runOnFunction(Function &F) {
|
||||
|
@ -101,6 +101,28 @@ define i32 @ld_int_from_global_float(float addrspace(1)* %input, i32 %i, i32 %j)
|
||||
ret i32 %5
|
||||
}
|
||||
|
||||
define void @nested_const_expr() {
|
||||
; PTX-LABEL: nested_const_expr(
|
||||
; store 1 to bitcast(gep(addrspacecast(array), 0, 1))
|
||||
store i32 1, i32* bitcast (float* getelementptr ([10 x float], [10 x float]* addrspacecast ([10 x float] addrspace(3)* @array to [10 x float]*), i64 0, i64 1) to i32*), align 4
|
||||
; PTX: mov.u32 %r1, 1;
|
||||
; PTX-NEXT: st.shared.u32 [array+4], %r1;
|
||||
ret void
|
||||
}
|
||||
|
||||
define void @rauw(float addrspace(1)* %input) {
|
||||
%generic_input = addrspacecast float addrspace(1)* %input to float*
|
||||
%addr = getelementptr float, float* %generic_input, i64 10
|
||||
%v = load float, float* %addr
|
||||
store float %v, float* %addr
|
||||
ret void
|
||||
; IR-LABEL: @rauw(
|
||||
; IR-NEXT: %1 = getelementptr float, float addrspace(1)* %input, i64 10
|
||||
; IR-NEXT: %v = load float, float addrspace(1)* %1
|
||||
; IR-NEXT: store float %v, float addrspace(1)* %1
|
||||
; IR-NEXT: ret void
|
||||
}
|
||||
|
||||
declare void @llvm.cuda.syncthreads() #3
|
||||
|
||||
attributes #3 = { noduplicate nounwind }
|
||||
|
Loading…
x
Reference in New Issue
Block a user