mirror of
https://github.com/RPCS3/llvm.git
synced 2025-01-25 12:04:36 +00:00
35c93e4e42
This allows us to make more use of the many compare reg,mem instructions. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@189099 91177308-0d34-0410-b5e6-96231b3b80d8
197 lines
5.2 KiB
LLVM
197 lines
5.2 KiB
LLVM
; Test 32-bit signed comparison in which the second operand is a variable.
|
|
;
|
|
; RUN: llc < %s -mtriple=s390x-linux-gnu | FileCheck %s
|
|
|
|
declare i32 @foo()
|
|
|
|
; Check register comparison.
|
|
define double @f1(double %a, double %b, i32 %i1, i32 %i2) {
|
|
; CHECK-LABEL: f1:
|
|
; CHECK: crjl %r2, %r3
|
|
; CHECK: ldr %f0, %f2
|
|
; CHECK: br %r14
|
|
%cond = icmp slt i32 %i1, %i2
|
|
%res = select i1 %cond, double %a, double %b
|
|
ret double %res
|
|
}
|
|
|
|
; Check the low end of the C range.
|
|
define double @f2(double %a, double %b, i32 %i1, i32 *%ptr) {
|
|
; CHECK-LABEL: f2:
|
|
; CHECK: c %r2, 0(%r3)
|
|
; CHECK-NEXT: jl
|
|
; CHECK: ldr %f0, %f2
|
|
; CHECK: br %r14
|
|
%i2 = load i32 *%ptr
|
|
%cond = icmp slt i32 %i1, %i2
|
|
%res = select i1 %cond, double %a, double %b
|
|
ret double %res
|
|
}
|
|
|
|
; Check the high end of the aligned C range.
|
|
define double @f3(double %a, double %b, i32 %i1, i32 *%base) {
|
|
; CHECK-LABEL: f3:
|
|
; CHECK: c %r2, 4092(%r3)
|
|
; CHECK-NEXT: jl
|
|
; CHECK: ldr %f0, %f2
|
|
; CHECK: br %r14
|
|
%ptr = getelementptr i32 *%base, i64 1023
|
|
%i2 = load i32 *%ptr
|
|
%cond = icmp slt i32 %i1, %i2
|
|
%res = select i1 %cond, double %a, double %b
|
|
ret double %res
|
|
}
|
|
|
|
; Check the next word up, which should use CY instead of C.
|
|
define double @f4(double %a, double %b, i32 %i1, i32 *%base) {
|
|
; CHECK-LABEL: f4:
|
|
; CHECK: cy %r2, 4096(%r3)
|
|
; CHECK-NEXT: jl
|
|
; CHECK: ldr %f0, %f2
|
|
; CHECK: br %r14
|
|
%ptr = getelementptr i32 *%base, i64 1024
|
|
%i2 = load i32 *%ptr
|
|
%cond = icmp slt i32 %i1, %i2
|
|
%res = select i1 %cond, double %a, double %b
|
|
ret double %res
|
|
}
|
|
|
|
; Check the high end of the aligned CY range.
|
|
define double @f5(double %a, double %b, i32 %i1, i32 *%base) {
|
|
; CHECK-LABEL: f5:
|
|
; CHECK: cy %r2, 524284(%r3)
|
|
; CHECK-NEXT: jl
|
|
; CHECK: ldr %f0, %f2
|
|
; CHECK: br %r14
|
|
%ptr = getelementptr i32 *%base, i64 131071
|
|
%i2 = load i32 *%ptr
|
|
%cond = icmp slt i32 %i1, %i2
|
|
%res = select i1 %cond, double %a, double %b
|
|
ret double %res
|
|
}
|
|
|
|
; Check the next word up, which needs separate address logic.
|
|
; Other sequences besides this one would be OK.
|
|
define double @f6(double %a, double %b, i32 %i1, i32 *%base) {
|
|
; CHECK-LABEL: f6:
|
|
; CHECK: agfi %r3, 524288
|
|
; CHECK: c %r2, 0(%r3)
|
|
; CHECK-NEXT: jl
|
|
; CHECK: ldr %f0, %f2
|
|
; CHECK: br %r14
|
|
%ptr = getelementptr i32 *%base, i64 131072
|
|
%i2 = load i32 *%ptr
|
|
%cond = icmp slt i32 %i1, %i2
|
|
%res = select i1 %cond, double %a, double %b
|
|
ret double %res
|
|
}
|
|
|
|
; Check the high end of the negative aligned CY range.
|
|
define double @f7(double %a, double %b, i32 %i1, i32 *%base) {
|
|
; CHECK-LABEL: f7:
|
|
; CHECK: cy %r2, -4(%r3)
|
|
; CHECK-NEXT: jl
|
|
; CHECK: ldr %f0, %f2
|
|
; CHECK: br %r14
|
|
%ptr = getelementptr i32 *%base, i64 -1
|
|
%i2 = load i32 *%ptr
|
|
%cond = icmp slt i32 %i1, %i2
|
|
%res = select i1 %cond, double %a, double %b
|
|
ret double %res
|
|
}
|
|
|
|
; Check the low end of the CY range.
|
|
define double @f8(double %a, double %b, i32 %i1, i32 *%base) {
|
|
; CHECK-LABEL: f8:
|
|
; CHECK: cy %r2, -524288(%r3)
|
|
; CHECK-NEXT: jl
|
|
; CHECK: ldr %f0, %f2
|
|
; CHECK: br %r14
|
|
%ptr = getelementptr i32 *%base, i64 -131072
|
|
%i2 = load i32 *%ptr
|
|
%cond = icmp slt i32 %i1, %i2
|
|
%res = select i1 %cond, double %a, double %b
|
|
ret double %res
|
|
}
|
|
|
|
; Check the next word down, which needs separate address logic.
|
|
; Other sequences besides this one would be OK.
|
|
define double @f9(double %a, double %b, i32 %i1, i32 *%base) {
|
|
; CHECK-LABEL: f9:
|
|
; CHECK: agfi %r3, -524292
|
|
; CHECK: c %r2, 0(%r3)
|
|
; CHECK-NEXT: jl
|
|
; CHECK: ldr %f0, %f2
|
|
; CHECK: br %r14
|
|
%ptr = getelementptr i32 *%base, i64 -131073
|
|
%i2 = load i32 *%ptr
|
|
%cond = icmp slt i32 %i1, %i2
|
|
%res = select i1 %cond, double %a, double %b
|
|
ret double %res
|
|
}
|
|
|
|
; Check that C allows an index.
|
|
define double @f10(double %a, double %b, i32 %i1, i64 %base, i64 %index) {
|
|
; CHECK-LABEL: f10:
|
|
; CHECK: c %r2, 4092({{%r4,%r3|%r3,%r4}})
|
|
; CHECK-NEXT: jl
|
|
; CHECK: ldr %f0, %f2
|
|
; CHECK: br %r14
|
|
%add1 = add i64 %base, %index
|
|
%add2 = add i64 %add1, 4092
|
|
%ptr = inttoptr i64 %add2 to i32 *
|
|
%i2 = load i32 *%ptr
|
|
%cond = icmp slt i32 %i1, %i2
|
|
%res = select i1 %cond, double %a, double %b
|
|
ret double %res
|
|
}
|
|
|
|
; Check that CY allows an index.
|
|
define double @f11(double %a, double %b, i32 %i1, i64 %base, i64 %index) {
|
|
; CHECK-LABEL: f11:
|
|
; CHECK: cy %r2, 4096({{%r4,%r3|%r3,%r4}})
|
|
; CHECK-NEXT: jl
|
|
; CHECK: ldr %f0, %f2
|
|
; CHECK: br %r14
|
|
%add1 = add i64 %base, %index
|
|
%add2 = add i64 %add1, 4096
|
|
%ptr = inttoptr i64 %add2 to i32 *
|
|
%i2 = load i32 *%ptr
|
|
%cond = icmp slt i32 %i1, %i2
|
|
%res = select i1 %cond, double %a, double %b
|
|
ret double %res
|
|
}
|
|
|
|
; The first branch here got recreated by InsertBranch while splitting the
|
|
; critical edge %entry->%while.body, which lost the kills information for CC.
|
|
define void @f12(i32 %a, i32 %b) {
|
|
; CHECK-LABEL: f12:
|
|
; CHECK: cije %r2, 0
|
|
; CHECK: crjlh %r2,
|
|
; CHECK: br %r14
|
|
entry:
|
|
%cmp11 = icmp eq i32 %a, 0
|
|
br i1 %cmp11, label %while.end, label %while.body
|
|
|
|
while.body:
|
|
%c = call i32 @foo()
|
|
%cmp12 = icmp eq i32 %c, %b
|
|
br i1 %cmp12, label %while.end, label %while.body
|
|
|
|
while.end:
|
|
ret void
|
|
}
|
|
|
|
; Check the comparison can be reversed if that allows C to be used.
|
|
define double @f13(double %a, double %b, i32 %i2, i32 *%ptr) {
|
|
; CHECK-LABEL: f13:
|
|
; CHECK: c %r2, 0(%r3)
|
|
; CHECK-NEXT: jh {{\.L.*}}
|
|
; CHECK: ldr %f0, %f2
|
|
; CHECK: br %r14
|
|
%i1 = load i32 *%ptr
|
|
%cond = icmp slt i32 %i1, %i2
|
|
%res = select i1 %cond, double %a, double %b
|
|
ret double %res
|
|
}
|