mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2025-02-21 21:11:36 +00:00
R600: support f16 -> f64 conversion intrinsic.
Unfortunately, we don't seem to have a direct truncation, but the extension can be legally split into two operations so we should support that. llvm-svn: 213357
This commit is contained in:
parent
86458323c0
commit
de7867151d
@ -242,6 +242,8 @@ AMDGPUTargetLowering::AMDGPUTargetLowering(TargetMachine &TM) :
|
||||
setOperationAction(ISD::FCOPYSIGN, MVT::f64, Expand);
|
||||
}
|
||||
|
||||
setOperationAction(ISD::FP16_TO_FP, MVT::f64, Expand);
|
||||
|
||||
const MVT ScalarIntVTs[] = { MVT::i32, MVT::i64 };
|
||||
for (MVT VT : ScalarIntVTs) {
|
||||
setOperationAction(ISD::SREM, VT, Expand);
|
||||
|
@ -1,6 +1,7 @@
|
||||
; RUN: llc -march=r600 -mcpu=SI -verify-machineinstrs < %s | FileCheck -check-prefix=SI %s
|
||||
|
||||
declare float @llvm.convert.from.fp16.f32(i16) nounwind readnone
|
||||
declare double @llvm.convert.from.fp16.f64(i16) nounwind readnone
|
||||
|
||||
; SI-LABEL: @test_convert_fp16_to_fp32:
|
||||
; SI: BUFFER_LOAD_USHORT [[VAL:v[0-9]+]]
|
||||
@ -12,3 +13,16 @@ define void @test_convert_fp16_to_fp32(float addrspace(1)* noalias %out, i16 add
|
||||
store float %cvt, float addrspace(1)* %out, align 4
|
||||
ret void
|
||||
}
|
||||
|
||||
|
||||
; SI-LABEL: @test_convert_fp16_to_fp64:
|
||||
; SI: BUFFER_LOAD_USHORT [[VAL:v[0-9]+]]
|
||||
; SI: V_CVT_F32_F16_e32 [[RESULT32:v[0-9]+]], [[VAL]]
|
||||
; SI: V_CVT_F64_F32_e32 [[RESULT:v\[[0-9]+:[0-9]+\]]], [[RESULT32]]
|
||||
; SI: BUFFER_STORE_DWORDX2 [[RESULT]]
|
||||
define void @test_convert_fp16_to_fp64(double addrspace(1)* noalias %out, i16 addrspace(1)* noalias %in) nounwind {
|
||||
%val = load i16 addrspace(1)* %in, align 2
|
||||
%cvt = call double @llvm.convert.from.fp16.f64(i16 %val) nounwind readnone
|
||||
store double %cvt, double addrspace(1)* %out, align 4
|
||||
ret void
|
||||
}
|
Loading…
x
Reference in New Issue
Block a user