mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2025-01-16 16:48:02 +00:00
PTX: Fix disabling of MAD instruction selection
llvm-svn: 142352
This commit is contained in:
parent
2faab7dd2a
commit
361b3c9ff2
@ -885,19 +885,26 @@ def : Pat<(f64 (fdiv RegF64:$a, fpimm:$b)),
|
||||
|
||||
// FMUL+FADD
|
||||
def : Pat<(f32 (fadd (fmul RegF32:$a, RegF32:$b), RegF32:$c)),
|
||||
(FMADrrr32 RndDefault, RegF32:$a, RegF32:$b, RegF32:$c)>;
|
||||
(FMADrrr32 RndDefault, RegF32:$a, RegF32:$b, RegF32:$c)>,
|
||||
Requires<[SupportsFMA]>;
|
||||
def : Pat<(f32 (fadd (fmul RegF32:$a, RegF32:$b), fpimm:$c)),
|
||||
(FMADrri32 RndDefault, RegF32:$a, RegF32:$b, fpimm:$c)>;
|
||||
(FMADrri32 RndDefault, RegF32:$a, RegF32:$b, fpimm:$c)>,
|
||||
Requires<[SupportsFMA]>;
|
||||
def : Pat<(f32 (fadd (fmul RegF32:$a, fpimm:$b), fpimm:$c)),
|
||||
(FMADrrr32 RndDefault, RegF32:$a, fpimm:$b, fpimm:$c)>;
|
||||
(FMADrrr32 RndDefault, RegF32:$a, fpimm:$b, fpimm:$c)>,
|
||||
Requires<[SupportsFMA]>;
|
||||
def : Pat<(f32 (fadd (fmul RegF32:$a, RegF32:$b), fpimm:$c)),
|
||||
(FMADrri32 RndDefault, RegF32:$a, RegF32:$b, fpimm:$c)>;
|
||||
(FMADrri32 RndDefault, RegF32:$a, RegF32:$b, fpimm:$c)>,
|
||||
Requires<[SupportsFMA]>;
|
||||
def : Pat<(f64 (fadd (fmul RegF64:$a, RegF64:$b), RegF64:$c)),
|
||||
(FMADrrr64 RndDefault, RegF64:$a, RegF64:$b, RegF64:$c)>;
|
||||
(FMADrrr64 RndDefault, RegF64:$a, RegF64:$b, RegF64:$c)>,
|
||||
Requires<[SupportsFMA]>;
|
||||
def : Pat<(f64 (fadd (fmul RegF64:$a, RegF64:$b), fpimm:$c)),
|
||||
(FMADrri64 RndDefault, RegF64:$a, RegF64:$b, fpimm:$c)>;
|
||||
(FMADrri64 RndDefault, RegF64:$a, RegF64:$b, fpimm:$c)>,
|
||||
Requires<[SupportsFMA]>;
|
||||
def : Pat<(f64 (fadd (fmul RegF64:$a, fpimm:$b), fpimm:$c)),
|
||||
(FMADrri64 RndDefault, RegF64:$a, fpimm:$b, fpimm:$c)>;
|
||||
(FMADrri64 RndDefault, RegF64:$a, fpimm:$b, fpimm:$c)>,
|
||||
Requires<[SupportsFMA]>;
|
||||
|
||||
// FNEG
|
||||
def : Pat<(f32 (fneg RegF32:$a)), (FNEGrr32 RndDefault, RegF32:$a)>;
|
||||
|
@ -1,8 +1,13 @@
|
||||
; RUN: llc < %s -march=ptx32 -mattr=+ptx20,+sm20 | grep "mad"
|
||||
; RUN: llc < %s -march=ptx32 -mattr=+ptx20,+sm20,+no-fma | grep -v "mad"
|
||||
; RUN: llc < %s -march=ptx32 -mattr=+ptx20,+sm20 | FileCheck %s -check-prefix=FMA
|
||||
; RUN: llc < %s -march=ptx32 -mattr=+ptx20,+sm20,+no-fma | FileCheck %s -check-prefix=MUL
|
||||
; RUN: llc < %s -march=ptx64 -mattr=+ptx20,+sm20 | FileCheck %s -check-prefix=FMA
|
||||
; RUN: llc < %s -march=ptx64 -mattr=+ptx20,+sm20,+no-fma | FileCheck %s -check-prefix=MUL
|
||||
|
||||
define ptx_device float @test_mul_add_f(float %x, float %y, float %z) {
|
||||
entry:
|
||||
; FMA: mad.rn.f32
|
||||
; MUL: mul.rn.f32
|
||||
; MUL: add.rn.f32
|
||||
%a = fmul float %x, %y
|
||||
%b = fadd float %a, %z
|
||||
ret float %b
|
||||
@ -10,6 +15,9 @@ entry:
|
||||
|
||||
define ptx_device double @test_mul_add_d(double %x, double %y, double %z) {
|
||||
entry:
|
||||
; FMA: mad.rn.f64
|
||||
; MUL: mul.rn.f64
|
||||
; MUL: add.rn.f64
|
||||
%a = fmul double %x, %y
|
||||
%b = fadd double %a, %z
|
||||
ret double %b
|
||||
|
Loading…
x
Reference in New Issue
Block a user