mirror of
https://github.com/RPCSX/llvm.git
synced 2025-01-27 07:12:06 +00:00
944f96975b
This handles the case in: https://llvm.org/bugs/show_bug.cgi?id=28895 ...but we are not yet getting all of the possibilities. E.g., we use 'X86::FANDN' for scalar FP select combines. That enhancement is filed as: https://llvm.org/bugs/show_bug.cgi?id=28925 Differential Revision: https://reviews.llvm.org/D23337 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@278270 91177308-0d34-0410-b5e6-96231b3b80d8
172 lines
5.3 KiB
LLVM
172 lines
5.3 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
|
|
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+avx | FileCheck %s
|
|
|
|
; Select %c in the lanes where "a ult b" holds and zero in the others.
; The expected assembly is one vector compare whose mask is ANDed with %c.
define <4 x i32> @test1(<4 x float> %a, <4 x float> %b, <4 x i32> %c) {
; CHECK-LABEL: test1:
; CHECK: # BB#0:
; CHECK-NEXT: vcmpnleps %xmm0, %xmm1, %xmm0
; CHECK-NEXT: vandps %xmm2, %xmm0, %xmm0
; CHECK-NEXT: retq
;
  %cmp = fcmp ult <4 x float> %a, %b
  %sel = select <4 x i1> %cmp, <4 x i32> %c, <4 x i32> zeroinitializer
  ret <4 x i32> %sel
}
|
|
|
|
; Select all-ones in the lanes where "a ult b" holds and %c in the others.
; The expected assembly is one vector compare whose mask is ORed with %c.
define <4 x i32> @test2(<4 x float> %a, <4 x float> %b, <4 x i32> %c) {
; CHECK-LABEL: test2:
; CHECK: # BB#0:
; CHECK-NEXT: vcmpnleps %xmm0, %xmm1, %xmm0
; CHECK-NEXT: vorps %xmm2, %xmm0, %xmm0
; CHECK-NEXT: retq
;
  %cmp = fcmp ult <4 x float> %a, %b
  %sel = select <4 x i1> %cmp, <4 x i32> <i32 -1, i32 -1, i32 -1, i32 -1>, <4 x i32> %c
  ret <4 x i32> %sel
}
|
|
|
|
; Select zero in the lanes where "a ult b" holds and %c in the others.
; The expected assembly is a vcmpleps compare followed by a plain AND with %c.
define <4 x i32> @test3(<4 x float> %a, <4 x float> %b, <4 x i32> %c) {
; CHECK-LABEL: test3:
; CHECK: # BB#0:
; CHECK-NEXT: vcmpleps %xmm0, %xmm1, %xmm0
; CHECK-NEXT: vandps %xmm2, %xmm0, %xmm0
; CHECK-NEXT: retq
;
  %cmp = fcmp ult <4 x float> %a, %b
  %sel = select <4 x i1> %cmp, <4 x i32> zeroinitializer, <4 x i32> %c
  ret <4 x i32> %sel
}
|
|
|
|
; Select %c in the lanes where "a ult b" holds and all-ones in the others.
; The expected assembly is a vcmpleps compare followed by a plain OR with %c.
define <4 x i32> @test4(<4 x float> %a, <4 x float> %b, <4 x i32> %c) {
; CHECK-LABEL: test4:
; CHECK: # BB#0:
; CHECK-NEXT: vcmpleps %xmm0, %xmm1, %xmm0
; CHECK-NEXT: vorps %xmm2, %xmm0, %xmm0
; CHECK-NEXT: retq
;
  %cmp = fcmp ult <4 x float> %a, %b
  %sel = select <4 x i1> %cmp, <4 x i32> %c, <4 x i32> <i32 -1, i32 -1, i32 -1, i32 -1>
  ret <4 x i32> %sel
}
|
|
|
|
; Sign-extend the "a ult b" lane mask to <4 x i32>; %c is unused.
; The expected assembly is the vector compare alone, with no extra mask op.
define <4 x i32> @test5(<4 x float> %a, <4 x float> %b, <4 x i32> %c) {
; CHECK-LABEL: test5:
; CHECK: # BB#0:
; CHECK-NEXT: vcmpnleps %xmm0, %xmm1, %xmm0
; CHECK-NEXT: retq
;
  %cmp = fcmp ult <4 x float> %a, %b
  %ext = sext <4 x i1> %cmp to <4 x i32>
  ret <4 x i32> %ext
}
|
|
|
|
; Sign-extend the "a oge b" lane mask to <4 x i32>; %c is unused.
; The expected assembly is the vector compare alone, with no extra mask op.
define <4 x i32> @test6(<4 x float> %a, <4 x float> %b, <4 x i32> %c) {
; CHECK-LABEL: test6:
; CHECK: # BB#0:
; CHECK-NEXT: vcmpleps %xmm0, %xmm1, %xmm0
; CHECK-NEXT: retq
;
  %cmp = fcmp oge <4 x float> %a, %b
  %ext = sext <4 x i1> %cmp to <4 x i32>
  ret <4 x i32> %ext
}
|
|
|
|
; Same shape as a select-against-zero, but the selected vector is loaded from
; %p (16-byte aligned). The expected assembly uses (%rdi) directly as the
; memory operand of the AND instead of a separate load.
define <4 x i32> @test7(<4 x float> %a, <4 x float> %b, <4 x i32>* %p) {
; CHECK-LABEL: test7:
; CHECK: # BB#0:
; CHECK-NEXT: vcmpnleps %xmm0, %xmm1, %xmm0
; CHECK-NEXT: vandps (%rdi), %xmm0, %xmm0
; CHECK-NEXT: retq
;
  %cmp = fcmp ult <4 x float> %a, %b
  %vec = load <4 x i32>, <4 x i32>* %p, align 16
  %sel = select <4 x i1> %cmp, <4 x i32> %vec, <4 x i32> zeroinitializer
  ret <4 x i32> %sel
}
|
|
|
|
; Repeat all with FP types for the select operands. Also, use different comparison predicates for better test coverage.
|
|
|
|
; FP variant: select %c in the lanes where "a ogt b" holds, zero elsewhere.
; The expected assembly is one vector compare whose mask is ANDed with %c.
define <2 x double> @test1f(<2 x double> %a, <2 x double> %b, <2 x double> %c) {
; CHECK-LABEL: test1f:
; CHECK: # BB#0:
; CHECK-NEXT: vcmpltpd %xmm0, %xmm1, %xmm0
; CHECK-NEXT: vandpd %xmm2, %xmm0, %xmm0
; CHECK-NEXT: retq
;
  %cmp = fcmp ogt <2 x double> %a, %b
  %sel = select <2 x i1> %cmp, <2 x double> %c, <2 x double> zeroinitializer
  ret <2 x double> %sel
}
|
|
|
|
; FP variant: select the all-ones bit pattern in the lanes where "a oge b"
; holds and %c elsewhere. The expected assembly is one vector compare whose
; mask is ORed with %c.
define <2 x double> @test2f(<2 x double> %a, <2 x double> %b, <2 x double> %c) {
; CHECK-LABEL: test2f:
; CHECK: # BB#0:
; CHECK-NEXT: vcmplepd %xmm0, %xmm1, %xmm0
; CHECK-NEXT: vorpd %xmm2, %xmm0, %xmm0
; CHECK-NEXT: retq
;
  %cmp = fcmp oge <2 x double> %a, %b
  %sel = select <2 x i1> %cmp, <2 x double> <double 0xffffffffffffffff, double 0xffffffffffffffff>, <2 x double> %c
  ret <2 x double> %sel
}
|
|
|
|
; FP variant: select zero in the lanes where "a olt b" holds, %c elsewhere.
; The expected assembly is a vcmpnltpd compare followed by a plain AND with %c.
define <2 x double> @test3f(<2 x double> %a, <2 x double> %b, <2 x double> %c) {
; CHECK-LABEL: test3f:
; CHECK: # BB#0:
; CHECK-NEXT: vcmpnltpd %xmm1, %xmm0, %xmm0
; CHECK-NEXT: vandpd %xmm2, %xmm0, %xmm0
; CHECK-NEXT: retq
;
  %cmp = fcmp olt <2 x double> %a, %b
  %sel = select <2 x i1> %cmp, <2 x double> zeroinitializer, <2 x double> %c
  ret <2 x double> %sel
}
|
|
|
|
; FP variant: select %c in the lanes where "a ole b" holds and the all-ones
; bit pattern elsewhere. The expected assembly is a vcmpnlepd compare followed
; by a plain OR with %c.
define <2 x double> @test4f(<2 x double> %a, <2 x double> %b, <2 x double> %c) {
; CHECK-LABEL: test4f:
; CHECK: # BB#0:
; CHECK-NEXT: vcmpnlepd %xmm1, %xmm0, %xmm0
; CHECK-NEXT: vorpd %xmm2, %xmm0, %xmm0
; CHECK-NEXT: retq
;
  %cmp = fcmp ole <2 x double> %a, %b
  %sel = select <2 x i1> %cmp, <2 x double> %c, <2 x double> <double 0xffffffffffffffff, double 0xffffffffffffffff>
  ret <2 x double> %sel
}
|
|
|
|
; FP variant: select between the all-ones bit pattern (where "a ugt b" holds)
; and zero; %c is unused. The expected assembly is the vector compare alone,
; with no extra mask op.
define <2 x double> @test5f(<2 x double> %a, <2 x double> %b, <2 x double> %c) {
; CHECK-LABEL: test5f:
; CHECK: # BB#0:
; CHECK-NEXT: vcmpnlepd %xmm1, %xmm0, %xmm0
; CHECK-NEXT: retq
;
  %cmp = fcmp ugt <2 x double> %a, %b
  %sel = select <2 x i1> %cmp, <2 x double> <double 0xffffffffffffffff, double 0xffffffffffffffff>, <2 x double> zeroinitializer
  ret <2 x double> %sel
}
|
|
|
|
; FP variant: select between zero (where "a ule b" holds) and the all-ones
; bit pattern; %c is unused. The expected assembly is a single vcmpltpd
; compare, with no extra mask op.
define <2 x double> @test6f(<2 x double> %a, <2 x double> %b, <2 x double> %c) {
; CHECK-LABEL: test6f:
; CHECK: # BB#0:
; CHECK-NEXT: vcmpltpd %xmm0, %xmm1, %xmm0
; CHECK-NEXT: retq
;
  %cmp = fcmp ule <2 x double> %a, %b
  %sel = select <2 x i1> %cmp, <2 x double> zeroinitializer, <2 x double> <double 0xffffffffffffffff, double 0xffffffffffffffff>
  ret <2 x double> %sel
}
|
|
|
|
; FP variant with the selected vector loaded from %p (16-byte aligned): keep
; the loaded value in the lanes where "a oeq b" holds, zero elsewhere. The
; expected assembly uses (%rdi) directly as the memory operand of the AND.
define <2 x double> @test7f(<2 x double> %a, <2 x double> %b, <2 x double>* %p) {
; CHECK-LABEL: test7f:
; CHECK: # BB#0:
; CHECK-NEXT: vcmpeqpd %xmm1, %xmm0, %xmm0
; CHECK-NEXT: vandpd (%rdi), %xmm0, %xmm0
; CHECK-NEXT: retq
;
  %cmp = fcmp oeq <2 x double> %a, %b
  %vec = load <2 x double>, <2 x double>* %p, align 16
  %sel = select <2 x i1> %cmp, <2 x double> %vec, <2 x double> zeroinitializer
  ret <2 x double> %sel
}
|
|
|