mirror of
https://github.com/RPCSX/llvm.git
synced 2025-01-19 02:42:58 +00:00
Fixed optimization of combining two shuffles where the first shuffle's inputs
have a different number of elements than the output. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@62998 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
parent
e7852d0144
commit
fe6d2cd9d1
@ -12179,9 +12179,11 @@ Instruction *InstCombiner::visitShuffleVectorInst(ShuffleVectorInst &SVI) {
|
||||
// If the result mask is equal to the src shuffle or this shuffle mask, do
|
||||
// the replacement.
|
||||
if (NewMask == LHSMask || NewMask == Mask) {
|
||||
unsigned LHSInNElts =
|
||||
cast<VectorType>(LHSSVI->getOperand(0)->getType())->getNumElements();
|
||||
std::vector<Constant*> Elts;
|
||||
for (unsigned i = 0, e = NewMask.size(); i != e; ++i) {
|
||||
if (NewMask[i] >= e*2) {
|
||||
if (NewMask[i] >= LHSInNElts*2) {
|
||||
Elts.push_back(UndefValue::get(Type::Int32Ty));
|
||||
} else {
|
||||
Elts.push_back(ConstantInt::get(Type::Int32Ty, NewMask[i]));
|
||||
|
19
test/Transforms/InstCombine/vec_shuffle2.ll
Normal file
19
test/Transforms/InstCombine/vec_shuffle2.ll
Normal file
@ -0,0 +1,19 @@
|
||||
; RUN: llvm-as < %s | opt -instcombine | llvm-dis | grep undef | count 1
|
||||
; END.
|
||||
|
||||
; Test fold of two shuffles where the first shuffle's vector inputs are a
|
||||
; different length than the second.
|
||||
|
||||
define void @test_cl(<4 x i8> addrspace(1)* %dest, <16 x i8> addrspace(1)* %old) nounwind {
|
||||
entry:
|
||||
%arrayidx = getelementptr <4 x i8> addrspace(1)* %dest, i32 0 ; <<4 x i8> addrspace(1)*> [#uses=1]
|
||||
%arrayidx5 = getelementptr <16 x i8> addrspace(1)* %old, i32 0 ; <<16 x i8> addrspace(1)*> [#uses=1]
|
||||
%tmp6 = load <16 x i8> addrspace(1)* %arrayidx5 ; <<16 x i8>> [#uses=1]
|
||||
%tmp7 = shufflevector <16 x i8> %tmp6, <16 x i8> undef, <4 x i32> < i32 13, i32 9, i32 4, i32 13 > ; <<4 x i8>> [#uses=1]
|
||||
%tmp9 = shufflevector <4 x i8> %tmp7, <4 x i8> undef, <4 x i32> < i32 3, i32 1, i32 2, i32 0 > ; <<4 x i8>> [#uses=1]
|
||||
store <4 x i8> %tmp9, <4 x i8> addrspace(1)* %arrayidx
|
||||
ret void
|
||||
|
||||
return: ; preds = %entry
|
||||
ret void
|
||||
}
|
Loading…
x
Reference in New Issue
Block a user