mirror of
https://github.com/RPCS3/llvm.git
synced 2025-05-20 20:36:11 +00:00

The patch was reverted due to a bug. The bug was that if the IV is the 2nd operand of the icmp instruction, then the "Pred" variable gets swapped and differs from the instruction's predicate. In this patch we use the original predicate to do the transformation. Also added a test case that exercises this situation. Differentian Revision: https://reviews.llvm.org/D35107 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@307477 91177308-0d34-0410-b5e6-96231b3b80d8
356 lines
9.2 KiB
LLVM
356 lines
9.2 KiB
LLVM
; RUN: opt < %s -indvars -S | FileCheck %s
|
|
target triple = "aarch64--linux-gnu"
|
|
|
|
; Provide legal integer types.
|
|
target datalayout = "n8:16:32:64"
|
|
|
|
|
|
; Check the loop exit i32 compare instruction and operand are widened to i64
|
|
; instead of truncating IV before its use in the i32 compare instruction.
|
|
|
|
@idx = common global i32 0, align 4
|
|
@e = common global i32 0, align 4
|
|
@ptr = common global i32* null, align 8
|
|
|
|
; CHECK-LABEL: @test1
|
|
; CHECK: for.body.lr.ph:
|
|
; CHECK: sext i32
|
|
; CHECK: for.cond:
|
|
; CHECK: icmp slt i64
|
|
; CHECK: for.body:
|
|
; CHECK: phi i64
|
|
|
|
define i32 @test1() {
|
|
entry:
|
|
store i32 -1, i32* @idx, align 4
|
|
%0 = load i32, i32* @e, align 4
|
|
%cmp4 = icmp slt i32 %0, 0
|
|
br i1 %cmp4, label %for.end.loopexit, label %for.body.lr.ph
|
|
|
|
for.body.lr.ph:
|
|
%1 = load i32*, i32** @ptr, align 8
|
|
%2 = load i32, i32* @e, align 4
|
|
br label %for.body
|
|
|
|
for.cond:
|
|
%inc = add nsw i32 %i.05, 1
|
|
%cmp = icmp slt i32 %i.05, %2
|
|
br i1 %cmp, label %for.body, label %for.cond.for.end.loopexit_crit_edge
|
|
|
|
for.body:
|
|
%i.05 = phi i32 [ 0, %for.body.lr.ph ], [ %inc, %for.cond ]
|
|
%idxprom = sext i32 %i.05 to i64
|
|
%arrayidx = getelementptr inbounds i32, i32* %1, i64 %idxprom
|
|
%3 = load i32, i32* %arrayidx, align 4
|
|
%tobool = icmp eq i32 %3, 0
|
|
br i1 %tobool, label %if.then, label %for.cond
|
|
|
|
if.then:
|
|
%i.05.lcssa = phi i32 [ %i.05, %for.body ]
|
|
store i32 %i.05.lcssa, i32* @idx, align 4
|
|
br label %for.end
|
|
|
|
for.cond.for.end.loopexit_crit_edge:
|
|
br label %for.end.loopexit
|
|
|
|
for.end.loopexit:
|
|
br label %for.end
|
|
|
|
for.end:
|
|
%4 = load i32, i32* @idx, align 4
|
|
ret i32 %4
|
|
}
|
|
|
|
; CHECK-LABEL: @test2
|
|
; CHECK: for.body4.us
|
|
; CHECK: %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
; CHECK: %cmp2.us = icmp ult i64
|
|
; CHECK-NOT: %2 = trunc i64 %indvars.iv.next to i32
|
|
; CHECK-NOT: %cmp2.us = icmp slt i32
|
|
|
|
define void @test2([8 x i8]* %a, i8* %b, i8 %limit) {
|
|
entry:
|
|
%conv = zext i8 %limit to i32
|
|
br i1 undef, label %for.cond1.preheader, label %for.cond1.preheader.us
|
|
|
|
for.cond1.preheader.us:
|
|
%storemerge5.us = phi i32 [ 0, %entry ], [ %inc14.us, %for.inc13.us ]
|
|
br i1 true, label %for.body4.lr.ph.us, label %for.inc13.us
|
|
|
|
for.inc13.us:
|
|
%inc14.us = add nsw i32 %storemerge5.us, 1
|
|
%cmp.us = icmp slt i32 %inc14.us, 4
|
|
br i1 %cmp.us, label %for.cond1.preheader.us, label %for.end
|
|
|
|
for.body4.us:
|
|
%storemerge14.us = phi i32 [ 0, %for.body4.lr.ph.us ], [ %inc.us, %for.body4.us ]
|
|
%idxprom.us = sext i32 %storemerge14.us to i64
|
|
%arrayidx6.us = getelementptr inbounds [8 x i8], [8 x i8]* %a, i64 %idxprom5.us, i64 %idxprom.us
|
|
%0 = load i8, i8* %arrayidx6.us, align 1
|
|
%idxprom7.us = zext i8 %0 to i64
|
|
%arrayidx8.us = getelementptr inbounds i8, i8* %b, i64 %idxprom7.us
|
|
%1 = load i8, i8* %arrayidx8.us, align 1
|
|
store i8 %1, i8* %arrayidx6.us, align 1
|
|
%inc.us = add nsw i32 %storemerge14.us, 1
|
|
%cmp2.us = icmp slt i32 %inc.us, %conv
|
|
br i1 %cmp2.us, label %for.body4.us, label %for.inc13.us
|
|
|
|
for.body4.lr.ph.us:
|
|
%idxprom5.us = sext i32 %storemerge5.us to i64
|
|
br label %for.body4.us
|
|
|
|
for.cond1.preheader:
|
|
%storemerge5 = phi i32 [ 0, %entry ], [ %inc14, %for.inc13 ]
|
|
br i1 false, label %for.inc13, label %for.inc13
|
|
|
|
for.inc13:
|
|
%inc14 = add nsw i32 %storemerge5, 1
|
|
%cmp = icmp slt i32 %inc14, 4
|
|
br i1 %cmp, label %for.cond1.preheader, label %for.end
|
|
|
|
for.end:
|
|
ret void
|
|
}
|
|
|
|
; CHECK-LABEL: @test3
|
|
; CHECK: sext i32 %b
|
|
; CHECK: for.cond:
|
|
; CHECK: phi i64
|
|
; CHECK: icmp slt i64
|
|
|
|
define i32 @test3(i32* %a, i32 %b) {
|
|
entry:
|
|
br label %for.cond
|
|
|
|
for.cond:
|
|
%sum.0 = phi i32 [ 0, %entry ], [ %add, %for.body ]
|
|
%i.0 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
|
|
%cmp = icmp slt i32 %i.0, %b
|
|
br i1 %cmp, label %for.body, label %for.end
|
|
|
|
for.body:
|
|
%idxprom = sext i32 %i.0 to i64
|
|
%arrayidx = getelementptr inbounds i32, i32* %a, i64 %idxprom
|
|
%0 = load i32, i32* %arrayidx, align 4
|
|
%add = add nsw i32 %sum.0, %0
|
|
%inc = add nsw i32 %i.0, 1
|
|
br label %for.cond
|
|
|
|
for.end:
|
|
ret i32 %sum.0
|
|
}
|
|
|
|
declare i32 @fn1(i8 signext)
|
|
|
|
; PR21030
|
|
; CHECK-LABEL: @test4
|
|
; CHECK: for.body:
|
|
; CHECK: phi i32
|
|
; CHECK: icmp sgt i8
|
|
|
|
define i32 @test4(i32 %a) {
|
|
entry:
|
|
br label %for.body
|
|
|
|
for.body:
|
|
%c.07 = phi i8 [ -3, %entry ], [ %dec, %for.body ]
|
|
%conv6 = zext i8 %c.07 to i32
|
|
%or = or i32 %a, %conv6
|
|
%conv3 = trunc i32 %or to i8
|
|
%call = call i32 @fn1(i8 signext %conv3)
|
|
%dec = add i8 %c.07, -1
|
|
%cmp = icmp sgt i8 %dec, -14
|
|
br i1 %cmp, label %for.body, label %for.end
|
|
|
|
for.end:
|
|
ret i32 0
|
|
}
|
|
|
|
; CHECK-LABEL: @test5
|
|
; CHECK: zext i32 %b
|
|
; CHECK: for.cond:
|
|
; CHECK: phi i64
|
|
; CHECK: icmp ule i64
|
|
|
|
define i32 @test5(i32* %a, i32 %b) {
|
|
entry:
|
|
br label %for.cond
|
|
|
|
for.cond:
|
|
%sum.0 = phi i32 [ 0, %entry ], [ %add, %for.body ]
|
|
%i.0 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
|
|
%cmp = icmp ule i32 %i.0, %b
|
|
br i1 %cmp, label %for.body, label %for.end
|
|
|
|
for.body:
|
|
%idxprom = zext i32 %i.0 to i64
|
|
%arrayidx = getelementptr inbounds i32, i32* %a, i64 %idxprom
|
|
%0 = load i32, i32* %arrayidx, align 4
|
|
%add = add nsw i32 %sum.0, %0
|
|
%inc = add nsw i32 %i.0, 1
|
|
br label %for.cond
|
|
|
|
for.end:
|
|
ret i32 %sum.0
|
|
}
|
|
|
|
define i32 @test6(i32* %a, i32 %b) {
|
|
; CHECK-LABEL: @test6(
|
|
; CHECK: [[B_SEXT:%[a-z0-9]+]] = sext i32 %b to i64
|
|
; CHECK: for.cond:
|
|
; CHECK: icmp sle i64 %indvars.iv, [[B_SEXT]]
|
|
|
|
entry:
|
|
br label %for.cond
|
|
|
|
for.cond:
|
|
%sum.0 = phi i32 [ 0, %entry ], [ %add, %for.body ]
|
|
%i.0 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
|
|
%cmp = icmp sle i32 %i.0, %b
|
|
br i1 %cmp, label %for.body, label %for.end
|
|
|
|
for.body:
|
|
%idxprom = zext i32 %i.0 to i64
|
|
%arrayidx = getelementptr inbounds i32, i32* %a, i64 %idxprom
|
|
%0 = load i32, i32* %arrayidx, align 4
|
|
%add = add nsw i32 %sum.0, %0
|
|
%inc = add nsw i32 %i.0, 1
|
|
br label %for.cond
|
|
|
|
for.end:
|
|
ret i32 %sum.0
|
|
}
|
|
|
|
define i32 @test7(i32* %a, i32 %b) {
|
|
; CHECK-LABEL: @test7(
|
|
; CHECK: [[B_ZEXT:%[a-z0-9]+]] = zext i32 %b to i64
|
|
; CHECK: [[B_SEXT:%[a-z0-9]+]] = sext i32 %b to i64
|
|
; CHECK: for.cond:
|
|
; CHECK: icmp ule i64 %indvars.iv, [[B_ZEXT]]
|
|
; CHECK: for.body:
|
|
; CHECK: icmp sle i64 %indvars.iv, [[B_SEXT]]
|
|
|
|
entry:
|
|
br label %for.cond
|
|
|
|
for.cond:
|
|
%sum.0 = phi i32 [ 0, %entry ], [ %add, %for.body ]
|
|
%i.0 = phi i32 [ 0, %entry ], [ %inc, %for.body ]
|
|
%cmp = icmp ule i32 %i.0, %b
|
|
br i1 %cmp, label %for.body, label %for.end
|
|
|
|
for.body:
|
|
%idxprom = sext i32 %i.0 to i64
|
|
%arrayidx = getelementptr inbounds i32, i32* %a, i64 %idxprom
|
|
%0 = load i32, i32* %arrayidx, align 4
|
|
%add = add nsw i32 %sum.0, %0
|
|
%inc = add nsw i32 %i.0, 1
|
|
%cmp2 = icmp sle i32 %i.0, %b
|
|
br i1 %cmp2, label %for.cond, label %for.end
|
|
|
|
for.end:
|
|
ret i32 %sum.0
|
|
}
|
|
|
|
define i32 @test8(i32* %a, i32 %b, i32 %init) {
|
|
; CHECK-LABEL: @test8(
|
|
; CHECK: [[INIT_SEXT:%[a-z0-9]+]] = sext i32 %init to i64
|
|
; CHECK: [[B_ZEXT:%[a-z0-9]+]] = zext i32 %b to i64
|
|
; CHECK: for.cond:
|
|
; Note: %indvars.iv is the sign extension of %i.0
|
|
; CHECK: %indvars.iv = phi i64 [ [[INIT_SEXT]], %for.cond.preheader ], [ %indvars.iv.next, %for.body ]
|
|
; CHECK: icmp ule i64 %indvars.iv, [[B_ZEXT]]
|
|
|
|
entry:
|
|
%e = icmp sgt i32 %init, 0
|
|
br i1 %e, label %for.cond, label %leave
|
|
|
|
for.cond:
|
|
%sum.0 = phi i32 [ 0, %entry ], [ %add, %for.body ]
|
|
%i.0 = phi i32 [ %init, %entry ], [ %inc, %for.body ]
|
|
%cmp = icmp ule i32 %i.0, %b
|
|
br i1 %cmp, label %for.body, label %for.end
|
|
|
|
for.body:
|
|
%idxprom = sext i32 %i.0 to i64
|
|
%arrayidx = getelementptr inbounds i32, i32* %a, i64 %idxprom
|
|
%0 = load i32, i32* %arrayidx, align 4
|
|
%add = add nsw i32 %sum.0, %0
|
|
%inc = add nsw i32 %i.0, 1
|
|
%cmp2 = icmp slt i32 0, %inc
|
|
br i1 %cmp2, label %for.cond, label %for.end
|
|
|
|
for.end:
|
|
ret i32 %sum.0
|
|
|
|
leave:
|
|
ret i32 0
|
|
}
|
|
|
|
define i32 @test9(i32* %a, i32 %b, i32 %init) {
|
|
; CHECK-LABEL: @test9(
|
|
; CHECK: [[INIT_ZEXT:%[a-z0-9]+]] = zext i32 %init to i64
|
|
; CHECK: [[B_SEXT:%[a-z0-9]+]] = sext i32 %b to i64
|
|
; CHECK: for.cond:
|
|
; Note: %indvars.iv is the zero extension of %i.0
|
|
; CHECK: %indvars.iv = phi i64 [ [[INIT_ZEXT]], %for.cond.preheader ], [ %indvars.iv.next, %for.body ]
|
|
; CHECK: icmp slt i64 %indvars.iv, [[B_SEXT]]
|
|
|
|
entry:
|
|
%e = icmp sgt i32 %init, 0
|
|
br i1 %e, label %for.cond, label %leave
|
|
|
|
for.cond:
|
|
%sum.0 = phi i32 [ 0, %entry ], [ %add, %for.body ]
|
|
%i.0 = phi i32 [ %init, %entry ], [ %inc, %for.body ]
|
|
%cmp = icmp slt i32 %i.0, %b
|
|
br i1 %cmp, label %for.body, label %for.end
|
|
|
|
for.body:
|
|
%idxprom = zext i32 %i.0 to i64
|
|
%arrayidx = getelementptr inbounds i32, i32* %a, i64 %idxprom
|
|
%0 = load i32, i32* %arrayidx, align 4
|
|
%add = add nsw i32 %sum.0, %0
|
|
%inc = add nsw i32 %i.0, 1
|
|
%cmp2 = icmp slt i32 0, %inc
|
|
br i1 %cmp2, label %for.cond, label %for.end
|
|
|
|
for.end:
|
|
ret i32 %sum.0
|
|
|
|
leave:
|
|
ret i32 0
|
|
}
|
|
|
|
declare void @consume.i64(i64)
|
|
declare void @consume.i1(i1)
|
|
|
|
define i32 @test10(i32 %v) {
|
|
; CHECK-LABEL: @test10(
|
|
entry:
|
|
; CHECK-NOT: zext
|
|
br label %loop
|
|
|
|
loop:
|
|
; CHECK: loop:
|
|
; CHECK: %indvars.iv = phi i64 [ %indvars.iv.next, %loop ], [ 0, %entry ]
|
|
; CHECK: %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
|
|
; CHECK: [[MUL:%[a-z0-9]+]] = mul nsw i64 %indvars.iv, -1
|
|
; CHECK: [[MUL_TRUNC:%[a-z0-9]+]] = trunc i64 [[MUL]] to i32
|
|
; CHECK: [[CMP:%[a-z0-9]+]] = icmp eq i32 [[MUL_TRUNC]], %v
|
|
; CHECK: call void @consume.i1(i1 [[CMP]])
|
|
|
|
%i = phi i32 [ 0, %entry ], [ %i.inc, %loop ]
|
|
%i.inc = add i32 %i, 1
|
|
%iv = mul i32 %i, -1
|
|
%cmp = icmp eq i32 %iv, %v
|
|
call void @consume.i1(i1 %cmp)
|
|
%be.cond = icmp slt i32 %i.inc, 11
|
|
%ext = sext i32 %iv to i64
|
|
call void @consume.i64(i64 %ext)
|
|
br i1 %be.cond, label %loop, label %leave
|
|
|
|
leave:
|
|
ret i32 22
|
|
}
|