llvm/test/CodeGen/NVPTX/combine-min-max.ll
Bjarke Hammersholt Roune 935e1b6640 [NVPTX] Let NVPTX backend detect integer min and max patterns.
Summary:
Let NVPTX backend detect integer min and max patterns during isel and emit intrinsics that enable hardware support.


Reviewers: jholewinski, meheff, jingyue

Subscribers: arsenm, llvm-commits, meheff, jingyue, eliben, jholewinski

Differential Revision: http://reviews.llvm.org/D12377

git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@246107 91177308-0d34-0410-b5e6-96231b3b80d8
2015-08-26 23:22:02 +00:00

308 lines
6.4 KiB
LLVM

; RUN: llc < %s -march=nvptx -mcpu=sm_20 -O2 | FileCheck %s
; *************************************
; * Cases with no min/max
define i32 @ab_eq_i32(i32 %a, i32 %b) {
; LABEL: @ab_slt_i32
; CHECK-NOT: min
; CHECK-NOT: max
%cmp = icmp eq i32 %a, %b
%sel = select i1 %cmp, i32 %a, i32 %b
ret i32 %sel
}
define i64 @ba_ne_i64(i64 %a, i64 %b) {
; LABEL: @ab_ne_i64
; CHECK-NOT: min
; CHECK-NOT: max
%cmp = icmp ne i64 %a, %b
%sel = select i1 %cmp, i64 %b, i64 %a
ret i64 %sel
}
; PTX does have e.g. max.s16, but at least as of Kepler (sm_3x) that
; gets compiled to SASS that converts the 16 bit parameters to 32 bit
; before using a 32 bit instruction. That is probably not a win and
; NVCC 7.5 does not emit 16 bit min/max either, presumably for that
; reason.
define i16 @ab_ugt_i16(i16 %a, i16 %b) {
; LABEL: @ab_ugt_i16
; CHECK-NOT: min
; CHECK-NOT: max
%cmp = icmp ugt i16 %a, %b
%sel = select i1 %cmp, i16 %a, i16 %b
ret i16 %sel
}
; *************************************
; * All variations with i32
; *** ab, unsigned, i32
define i32 @ab_ugt_i32(i32 %a, i32 %b) {
; LABEL: @ab_ugt_i32
; CHECK: max.u32
%cmp = icmp ugt i32 %a, %b
%sel = select i1 %cmp, i32 %a, i32 %b
ret i32 %sel
}
define i32 @ab_uge_i32(i32 %a, i32 %b) {
; LABEL: @ab_uge_i32
; CHECK: max.u32
%cmp = icmp uge i32 %a, %b
%sel = select i1 %cmp, i32 %a, i32 %b
ret i32 %sel
}
define i32 @ab_ult_i32(i32 %a, i32 %b) {
; LABEL: @ab_ult_i32
; CHECK: min.u32
%cmp = icmp ult i32 %a, %b
%sel = select i1 %cmp, i32 %a, i32 %b
ret i32 %sel
}
define i32 @ab_ule_i32(i32 %a, i32 %b) {
; LABEL: @ab_ule_i32
; CHECK: min.u32
%cmp = icmp ule i32 %a, %b
%sel = select i1 %cmp, i32 %a, i32 %b
ret i32 %sel
}
; *** ab, signed, i32
define i32 @ab_sgt_i32(i32 %a, i32 %b) {
; LABEL: @ab_ugt_i32
; CHECK: max.s32
%cmp = icmp sgt i32 %a, %b
%sel = select i1 %cmp, i32 %a, i32 %b
ret i32 %sel
}
define i32 @ab_sge_i32(i32 %a, i32 %b) {
; LABEL: @ab_sge_i32
; CHECK: max.s32
%cmp = icmp sge i32 %a, %b
%sel = select i1 %cmp, i32 %a, i32 %b
ret i32 %sel
}
define i32 @ab_slt_i32(i32 %a, i32 %b) {
; LABEL: @ab_slt_i32
; CHECK: min.s32
%cmp = icmp slt i32 %a, %b
%sel = select i1 %cmp, i32 %a, i32 %b
ret i32 %sel
}
define i32 @ab_sle_i32(i32 %a, i32 %b) {
; LABEL: @ab_sle_i32
; CHECK: min.s32
%cmp = icmp sle i32 %a, %b
%sel = select i1 %cmp, i32 %a, i32 %b
ret i32 %sel
}
; *** ba, unsigned, i32
define i32 @ba_ugt_i32(i32 %a, i32 %b) {
; LABEL: @ba_ugt_i32
; CHECK: min.u32
%cmp = icmp ugt i32 %a, %b
%sel = select i1 %cmp, i32 %b, i32 %a
ret i32 %sel
}
define i32 @ba_uge_i32(i32 %a, i32 %b) {
; LABEL: @ba_uge_i32
; CHECK: min.u32
%cmp = icmp uge i32 %a, %b
%sel = select i1 %cmp, i32 %b, i32 %a
ret i32 %sel
}
define i32 @ba_ult_i32(i32 %a, i32 %b) {
; LABEL: @ba_ult_i32
; CHECK: max.u32
%cmp = icmp ult i32 %a, %b
%sel = select i1 %cmp, i32 %b, i32 %a
ret i32 %sel
}
define i32 @ba_ule_i32(i32 %a, i32 %b) {
; LABEL: @ba_ule_i32
; CHECK: max.u32
%cmp = icmp ule i32 %a, %b
%sel = select i1 %cmp, i32 %b, i32 %a
ret i32 %sel
}
; *** ba, signed, i32
define i32 @ba_sgt_i32(i32 %a, i32 %b) {
; LBAEL: @ba_ugt_i32
; CHECK: min.s32
%cmp = icmp sgt i32 %a, %b
%sel = select i1 %cmp, i32 %b, i32 %a
ret i32 %sel
}
define i32 @ba_sge_i32(i32 %a, i32 %b) {
; LABEL: @ba_sge_i32
; CHECK: min.s32
%cmp = icmp sge i32 %a, %b
%sel = select i1 %cmp, i32 %b, i32 %a
ret i32 %sel
}
define i32 @ba_slt_i32(i32 %a, i32 %b) {
; LABEL: @ba_slt_i32
; CHECK: max.s32
%cmp = icmp slt i32 %a, %b
%sel = select i1 %cmp, i32 %b, i32 %a
ret i32 %sel
}
define i32 @ba_sle_i32(i32 %a, i32 %b) {
; LABEL: @ba_sle_i32
; CHECK: max.s32
%cmp = icmp sle i32 %a, %b
%sel = select i1 %cmp, i32 %b, i32 %a
ret i32 %sel
}
; *************************************
; * All variations with i64
; *** ab, unsigned, i64
define i64 @ab_ugt_i64(i64 %a, i64 %b) {
; LABEL: @ab_ugt_i64
; CHECK: max.u64
%cmp = icmp ugt i64 %a, %b
%sel = select i1 %cmp, i64 %a, i64 %b
ret i64 %sel
}
define i64 @ab_uge_i64(i64 %a, i64 %b) {
; LABEL: @ab_uge_i64
; CHECK: max.u64
%cmp = icmp uge i64 %a, %b
%sel = select i1 %cmp, i64 %a, i64 %b
ret i64 %sel
}
define i64 @ab_ult_i64(i64 %a, i64 %b) {
; LABEL: @ab_ult_i64
; CHECK: min.u64
%cmp = icmp ult i64 %a, %b
%sel = select i1 %cmp, i64 %a, i64 %b
ret i64 %sel
}
define i64 @ab_ule_i64(i64 %a, i64 %b) {
; LABEL: @ab_ule_i64
; CHECK: min.u64
%cmp = icmp ule i64 %a, %b
%sel = select i1 %cmp, i64 %a, i64 %b
ret i64 %sel
}
; *** ab, signed, i64
define i64 @ab_sgt_i64(i64 %a, i64 %b) {
; LABEL: @ab_ugt_i64
; CHECK: max.s64
%cmp = icmp sgt i64 %a, %b
%sel = select i1 %cmp, i64 %a, i64 %b
ret i64 %sel
}
define i64 @ab_sge_i64(i64 %a, i64 %b) {
; LABEL: @ab_sge_i64
; CHECK: max.s64
%cmp = icmp sge i64 %a, %b
%sel = select i1 %cmp, i64 %a, i64 %b
ret i64 %sel
}
define i64 @ab_slt_i64(i64 %a, i64 %b) {
; LABEL: @ab_slt_i64
; CHECK: min.s64
%cmp = icmp slt i64 %a, %b
%sel = select i1 %cmp, i64 %a, i64 %b
ret i64 %sel
}
define i64 @ab_sle_i64(i64 %a, i64 %b) {
; LABEL: @ab_sle_i64
; CHECK: min.s64
%cmp = icmp sle i64 %a, %b
%sel = select i1 %cmp, i64 %a, i64 %b
ret i64 %sel
}
; *** ba, unsigned, i64
define i64 @ba_ugt_i64(i64 %a, i64 %b) {
; LABEL: @ba_ugt_i64
; CHECK: min.u64
%cmp = icmp ugt i64 %a, %b
%sel = select i1 %cmp, i64 %b, i64 %a
ret i64 %sel
}
define i64 @ba_uge_i64(i64 %a, i64 %b) {
; LABEL: @ba_uge_i64
; CHECK: min.u64
%cmp = icmp uge i64 %a, %b
%sel = select i1 %cmp, i64 %b, i64 %a
ret i64 %sel
}
define i64 @ba_ult_i64(i64 %a, i64 %b) {
; LABEL: @ba_ult_i64
; CHECK: max.u64
%cmp = icmp ult i64 %a, %b
%sel = select i1 %cmp, i64 %b, i64 %a
ret i64 %sel
}
define i64 @ba_ule_i64(i64 %a, i64 %b) {
; LABEL: @ba_ule_i64
; CHECK: max.u64
%cmp = icmp ule i64 %a, %b
%sel = select i1 %cmp, i64 %b, i64 %a
ret i64 %sel
}
; *** ba, signed, i64
define i64 @ba_sgt_i64(i64 %a, i64 %b) {
; LBAEL: @ba_ugt_i64
; CHECK: min.s64
%cmp = icmp sgt i64 %a, %b
%sel = select i1 %cmp, i64 %b, i64 %a
ret i64 %sel
}
define i64 @ba_sge_i64(i64 %a, i64 %b) {
; LABEL: @ba_sge_i64
; CHECK: min.s64
%cmp = icmp sge i64 %a, %b
%sel = select i1 %cmp, i64 %b, i64 %a
ret i64 %sel
}
define i64 @ba_slt_i64(i64 %a, i64 %b) {
; LABEL: @ba_slt_i64
; CHECK: max.s64
%cmp = icmp slt i64 %a, %b
%sel = select i1 %cmp, i64 %b, i64 %a
ret i64 %sel
}
define i64 @ba_sle_i64(i64 %a, i64 %b) {
; LABEL: @ba_sle_i64
; CHECK: max.s64
%cmp = icmp sle i64 %a, %b
%sel = select i1 %cmp, i64 %b, i64 %a
ret i64 %sel
}