mirror of
https://github.com/RPCSX/llvm.git
synced 2025-01-11 23:16:11 +00:00
63be72069d
If 2.5 ulp is acceptable, denormals are not required, and isn't a reciprocal which will already be handled, replace with a faster fdiv. Simplify the lowering tests by using per function subtarget features. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@276051 91177308-0d34-0410-b5e6-96231b3b80d8
19 lines
583 B
LLVM
19 lines
583 B
LLVM
; RUN: llc -march=amdgcn -verify-machineinstrs < %s | FileCheck %s
|
|
|
|
declare float @llvm.amdgcn.fdiv.fast(float, float) #0
|
|
|
|
; CHECK-LABEL: {{^}}test_fdiv_fast:
|
|
; CHECK: v_cndmask_b32_e32 v{{[0-9]+}}, 1.0, v{{[0-9]+}}, vcc
|
|
; CHECK: v_mul_f32_e32
|
|
; CHECK: v_rcp_f32_e32
|
|
; CHECK: v_mul_f32_e32
|
|
; CHECK: v_mul_f32_e32
|
|
define void @test_fdiv_fast(float addrspace(1)* %out, float %a, float %b) #1 {
|
|
%fdiv = call float @llvm.amdgcn.fdiv.fast(float %a, float %b)
|
|
store float %fdiv, float addrspace(1)* %out
|
|
ret void
|
|
}
|
|
|
|
attributes #0 = { nounwind readnone }
|
|
attributes #1 = { nounwind }
|