mirror of
https://github.com/RPCS3/llvm.git
synced 2025-01-10 06:03:52 +00:00
[AVX-512] Fix the execution domain for scalar FMA instructions.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@296271 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
parent
5d138fe5d3
commit
955b35337f
@ -5599,7 +5599,7 @@ multiclass avx512_fma3s_common<bits<8> opc, string OpcodeStr, X86VectorVTInfo _,
|
||||
multiclass avx512_fma3s_all<bits<8> opc213, bits<8> opc231, bits<8> opc132,
|
||||
string OpcodeStr, SDNode OpNode, SDNode OpNodeRnds1,
|
||||
SDNode OpNodeRnds3, X86VectorVTInfo _ , string SUFF> {
|
||||
|
||||
let ExeDomain = _.ExeDomain in {
|
||||
defm NAME#213#SUFF#Z: avx512_fma3s_common<opc213, OpcodeStr#"213"#_.Suffix , _ ,
|
||||
// Operands for intrinsic are in 123 order to preserve passthu
|
||||
// semantics.
|
||||
@ -5634,6 +5634,7 @@ multiclass avx512_fma3s_all<bits<8> opc213, bits<8> opc231, bits<8> opc132,
|
||||
_.FRC:$src2))),
|
||||
(set _.FRC:$dst, (_.EltVT (OpNode _.FRC:$src1,
|
||||
(_.ScalarLdFrag addr:$src3), _.FRC:$src2)))>;
|
||||
}
|
||||
}
|
||||
|
||||
multiclass avx512_fma3s<bits<8> opc213, bits<8> opc231, bits<8> opc132,
|
||||
|
@ -4738,11 +4738,11 @@ define <2 x double>@test_int_x86_avx512_mask_vfmadd_sd(<2 x double> %x0, <2 x do
|
||||
; CHECK: ## BB#0:
|
||||
; CHECK-NEXT: andl $1, %edi
|
||||
; CHECK-NEXT: kmovw %edi, %k1
|
||||
; CHECK-NEXT: vmovaps %xmm0, %xmm3
|
||||
; CHECK-NEXT: vmovapd %xmm0, %xmm3
|
||||
; CHECK-NEXT: vfmadd213sd %xmm2, %xmm1, %xmm3 {%k1}
|
||||
; CHECK-NEXT: vmovaps %xmm0, %xmm4
|
||||
; CHECK-NEXT: vmovapd %xmm0, %xmm4
|
||||
; CHECK-NEXT: vfmadd213sd %xmm2, %xmm1, %xmm4
|
||||
; CHECK-NEXT: vmovaps %xmm0, %xmm5
|
||||
; CHECK-NEXT: vmovapd %xmm0, %xmm5
|
||||
; CHECK-NEXT: vfmadd213sd {rz-sae}, %xmm2, %xmm1, %xmm5 {%k1}
|
||||
; CHECK-NEXT: vfmadd213sd {rz-sae}, %xmm2, %xmm1, %xmm0
|
||||
; CHECK-NEXT: vaddpd %xmm3, %xmm4, %xmm1
|
||||
@ -4794,7 +4794,7 @@ define <2 x double>@test_int_x86_avx512_maskz_vfmadd_sd(<2 x double> %x0, <2 x d
|
||||
; CHECK: ## BB#0:
|
||||
; CHECK-NEXT: andl $1, %edi
|
||||
; CHECK-NEXT: kmovw %edi, %k1
|
||||
; CHECK-NEXT: vmovaps %xmm0, %xmm3
|
||||
; CHECK-NEXT: vmovapd %xmm0, %xmm3
|
||||
; CHECK-NEXT: vfmadd213sd %xmm2, %xmm1, %xmm3 {%k1} {z}
|
||||
; CHECK-NEXT: vfmadd213sd {rz-sae}, %xmm2, %xmm1, %xmm0 {%k1} {z}
|
||||
; CHECK-NEXT: vaddpd %xmm0, %xmm3, %xmm0
|
||||
@ -4826,11 +4826,11 @@ define <2 x double>@test_int_x86_avx512_mask3_vfmadd_sd(<2 x double> %x0, <2 x d
|
||||
; CHECK: ## BB#0:
|
||||
; CHECK-NEXT: andl $1, %edi
|
||||
; CHECK-NEXT: kmovw %edi, %k1
|
||||
; CHECK-NEXT: vmovaps %xmm2, %xmm3
|
||||
; CHECK-NEXT: vmovapd %xmm2, %xmm3
|
||||
; CHECK-NEXT: vfmadd231sd %xmm1, %xmm0, %xmm3 {%k1}
|
||||
; CHECK-NEXT: vmovaps %xmm2, %xmm4
|
||||
; CHECK-NEXT: vmovapd %xmm2, %xmm4
|
||||
; CHECK-NEXT: vfmadd231sd %xmm1, %xmm0, %xmm4
|
||||
; CHECK-NEXT: vmovaps %xmm2, %xmm5
|
||||
; CHECK-NEXT: vmovapd %xmm2, %xmm5
|
||||
; CHECK-NEXT: vfmadd231sd {rz-sae}, %xmm1, %xmm0, %xmm5 {%k1}
|
||||
; CHECK-NEXT: vfmadd231sd {rz-sae}, %xmm1, %xmm0, %xmm2
|
||||
; CHECK-NEXT: vaddpd %xmm3, %xmm4, %xmm0
|
||||
@ -4938,7 +4938,7 @@ define void @fmadd_sd_mask_memfold(double* %a, double* %b, i8 %c) {
|
||||
; CHECK-NEXT: andl $1, %edx
|
||||
; CHECK-NEXT: kmovw %edx, %k1
|
||||
; CHECK-NEXT: vfmadd132sd (%rsi), %xmm0, %xmm0 {%k1}
|
||||
; CHECK-NEXT: vmovlps %xmm0, (%rdi)
|
||||
; CHECK-NEXT: vmovlpd %xmm0, (%rdi)
|
||||
; CHECK-NEXT: retq
|
||||
%a.val = load double, double* %a
|
||||
%av0 = insertelement <2 x double> undef, double %a.val, i32 0
|
||||
@ -4962,7 +4962,7 @@ define void @fmadd_sd_maskz_memfold(double* %a, double* %b, i8 %c) {
|
||||
; CHECK-NEXT: andl $1, %edx
|
||||
; CHECK-NEXT: kmovw %edx, %k1
|
||||
; CHECK-NEXT: vfmadd132sd (%rsi), %xmm0, %xmm0 {%k1} {z}
|
||||
; CHECK-NEXT: vmovlps %xmm0, (%rdi)
|
||||
; CHECK-NEXT: vmovlpd %xmm0, (%rdi)
|
||||
; CHECK-NEXT: retq
|
||||
%a.val = load double, double* %a
|
||||
%av0 = insertelement <2 x double> undef, double %a.val, i32 0
|
||||
@ -4986,11 +4986,11 @@ define <2 x double>@test_int_x86_avx512_mask3_vfmsub_sd(<2 x double> %x0, <2 x d
|
||||
; CHECK: ## BB#0:
|
||||
; CHECK-NEXT: andl $1, %edi
|
||||
; CHECK-NEXT: kmovw %edi, %k1
|
||||
; CHECK-NEXT: vmovaps %xmm2, %xmm3
|
||||
; CHECK-NEXT: vmovapd %xmm2, %xmm3
|
||||
; CHECK-NEXT: vfmsub231sd %xmm1, %xmm0, %xmm3 {%k1}
|
||||
; CHECK-NEXT: vmovaps %xmm2, %xmm4
|
||||
; CHECK-NEXT: vmovapd %xmm2, %xmm4
|
||||
; CHECK-NEXT: vfmsub231sd %xmm1, %xmm0, %xmm4
|
||||
; CHECK-NEXT: vmovaps %xmm2, %xmm5
|
||||
; CHECK-NEXT: vmovapd %xmm2, %xmm5
|
||||
; CHECK-NEXT: vfmsub231sd {rz-sae}, %xmm1, %xmm0, %xmm5 {%k1}
|
||||
; CHECK-NEXT: vfmsub231sd {rz-sae}, %xmm1, %xmm0, %xmm2
|
||||
; CHECK-NEXT: vaddpd %xmm3, %xmm4, %xmm0
|
||||
@ -5042,11 +5042,11 @@ define <2 x double>@test_int_x86_avx512_mask3_vfnmsub_sd(<2 x double> %x0, <2 x
|
||||
; CHECK: ## BB#0:
|
||||
; CHECK-NEXT: andl $1, %edi
|
||||
; CHECK-NEXT: kmovw %edi, %k1
|
||||
; CHECK-NEXT: vmovaps %xmm2, %xmm3
|
||||
; CHECK-NEXT: vmovapd %xmm2, %xmm3
|
||||
; CHECK-NEXT: vfnmsub231sd %xmm1, %xmm0, %xmm3 {%k1}
|
||||
; CHECK-NEXT: vmovaps %xmm2, %xmm4
|
||||
; CHECK-NEXT: vmovapd %xmm2, %xmm4
|
||||
; CHECK-NEXT: vfnmsub231sd %xmm1, %xmm0, %xmm4
|
||||
; CHECK-NEXT: vmovaps %xmm2, %xmm5
|
||||
; CHECK-NEXT: vmovapd %xmm2, %xmm5
|
||||
; CHECK-NEXT: vfnmsub231sd {rz-sae}, %xmm1, %xmm0, %xmm5 {%k1}
|
||||
; CHECK-NEXT: vfnmsub231sd {rz-sae}, %xmm1, %xmm0, %xmm2
|
||||
; CHECK-NEXT: vaddpd %xmm3, %xmm4, %xmm0
|
||||
|
@ -127,7 +127,7 @@ define <2 x double> @test10(<2 x double> %a, <2 x double> %b, <2 x double> %c) {
|
||||
; CHECK-LABEL: test10:
|
||||
; CHECK: # BB#0: # %entry
|
||||
; CHECK-NEXT: vfmadd213sd %xmm2, %xmm1, %xmm0
|
||||
; CHECK-NEXT: vxorps {{.*}}(%rip), %xmm0, %xmm0
|
||||
; CHECK-NEXT: vxorpd {{.*}}(%rip), %xmm0, %xmm0
|
||||
; CHECK-NEXT: retq
|
||||
entry:
|
||||
%0 = tail call <2 x double> @llvm.x86.avx512.mask.vfmadd.sd(<2 x double> %a, <2 x double> %b, <2 x double> %c, i8 -1, i32 4) #2
|
||||
@ -185,7 +185,7 @@ entry:
|
||||
define <2 x double> @test13(<2 x double> %a, <2 x double> %b, <2 x double> %c, i8 %mask) {
|
||||
; CHECK-LABEL: test13:
|
||||
; CHECK: # BB#0: # %entry
|
||||
; CHECK-NEXT: vxorps {{.*}}(%rip), %xmm0, %xmm0
|
||||
; CHECK-NEXT: vxorpd {{.*}}(%rip), %xmm0, %xmm0
|
||||
; CHECK-NEXT: andl $1, %edi
|
||||
; CHECK-NEXT: kmovw %edi, %k1
|
||||
; CHECK-NEXT: vfmadd213sd %xmm2, %xmm1, %xmm0 {%k1}
|
||||
|
@ -1483,7 +1483,7 @@ define double @test_f64_fneg_fmul(double %x, double %y) #0 {
|
||||
;
|
||||
; AVX512-LABEL: test_f64_fneg_fmul:
|
||||
; AVX512: # BB#0:
|
||||
; AVX512-NEXT: vxorps %xmm2, %xmm2, %xmm2
|
||||
; AVX512-NEXT: vxorpd %xmm2, %xmm2, %xmm2
|
||||
; AVX512-NEXT: vfnmsub213sd %xmm2, %xmm1, %xmm0
|
||||
; AVX512-NEXT: retq
|
||||
%m = fmul nsz double %x, %y
|
||||
|
Loading…
Reference in New Issue
Block a user