mirror of
https://github.com/RPCS3/llvm.git
synced 2025-03-04 00:29:28 +00:00
AMDGPU/GlobalISel: legalize and select 32-bit G_SITOFP
Reviewers: arsenm, nhaehnle
Reviewed By: arsenm
Subscribers: kzhuravl, wdng, yaxunl, rovka, kristof.beyls, dstuttard, tpr, t-tye, llvm-commits
Differential Revision: https://reviews.llvm.org/D48195
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@335316 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
parent
b93460fa62
commit
20f413f83a
@ -26,6 +26,10 @@ def gi_vop3mods :
|
|||||||
GIComplexOperandMatcher<s32, "selectVOP3Mods">,
|
GIComplexOperandMatcher<s32, "selectVOP3Mods">,
|
||||||
GIComplexPatternEquiv<VOP3Mods>;
|
GIComplexPatternEquiv<VOP3Mods>;
|
||||||
|
|
||||||
|
// Complex operand matcher for s32 operands. The matcher is given the name
// "selectVOP3OMods" and is declared as the equivalent of the VOP3OMods
// pattern via GIComplexPatternEquiv.
def gi_vop3omods :
|
||||||
|
GIComplexOperandMatcher<s32, "selectVOP3OMods">,
|
||||||
|
GIComplexPatternEquiv<VOP3OMods>;
|
||||||
|
|
||||||
class GISelSop2Pat <
|
class GISelSop2Pat <
|
||||||
SDPatternOperator node,
|
SDPatternOperator node,
|
||||||
Instruction inst,
|
Instruction inst,
|
||||||
|
@ -537,6 +537,7 @@ bool AMDGPUInstructionSelector::select(MachineInstr &I,
|
|||||||
switch (I.getOpcode()) {
|
switch (I.getOpcode()) {
|
||||||
default:
|
default:
|
||||||
break;
|
break;
|
||||||
|
case TargetOpcode::G_SITOFP:
|
||||||
case TargetOpcode::G_FMUL:
|
case TargetOpcode::G_FMUL:
|
||||||
case TargetOpcode::G_FADD:
|
case TargetOpcode::G_FADD:
|
||||||
case TargetOpcode::G_FPTOUI:
|
case TargetOpcode::G_FPTOUI:
|
||||||
@ -582,6 +583,14 @@ AMDGPUInstructionSelector::selectVOP3Mods0(MachineOperand &Root) const {
|
|||||||
[=](MachineInstrBuilder &MIB) { MIB.addImm(0); } // omod
|
[=](MachineInstrBuilder &MIB) { MIB.addImm(0); } // omod
|
||||||
}};
|
}};
|
||||||
}
|
}
|
||||||
|
/// Builds the renderer list for the "selectVOP3OMods" complex operand.
///
/// Three renderers are returned, in order: one that adds \p Root to the
/// instruction being built, then two that each add an immediate 0 (labelled
/// clamp and omod below). \p Root is not inspected or matched against
/// anything here, so this function always returns a populated renderer list.
InstructionSelector::ComplexRendererFns
|
||||||
|
AMDGPUInstructionSelector::selectVOP3OMods(MachineOperand &Root) const {
|
||||||
|
return {{
|
||||||
|
// Source operand: forwarded unchanged.
[=](MachineInstrBuilder &MIB) { MIB.add(Root); },
|
||||||
|
[=](MachineInstrBuilder &MIB) { MIB.addImm(0); }, // clamp
|
||||||
|
[=](MachineInstrBuilder &MIB) { MIB.addImm(0); } // omod
|
||||||
|
}};
|
||||||
|
}
|
||||||
|
|
||||||
InstructionSelector::ComplexRendererFns
|
InstructionSelector::ComplexRendererFns
|
||||||
AMDGPUInstructionSelector::selectVOP3Mods(MachineOperand &Root) const {
|
AMDGPUInstructionSelector::selectVOP3Mods(MachineOperand &Root) const {
|
||||||
|
@ -78,6 +78,8 @@ private:
|
|||||||
InstructionSelector::ComplexRendererFns
|
InstructionSelector::ComplexRendererFns
|
||||||
selectVOP3Mods0(MachineOperand &Root) const;
|
selectVOP3Mods0(MachineOperand &Root) const;
|
||||||
InstructionSelector::ComplexRendererFns
|
InstructionSelector::ComplexRendererFns
|
||||||
|
selectVOP3OMods(MachineOperand &Root) const;
|
||||||
|
InstructionSelector::ComplexRendererFns
|
||||||
selectVOP3Mods(MachineOperand &Root) const;
|
selectVOP3Mods(MachineOperand &Root) const;
|
||||||
|
|
||||||
const SIInstrInfo &TII;
|
const SIInstrInfo &TII;
|
||||||
|
@ -91,6 +91,9 @@ AMDGPULegalizerInfo::AMDGPULegalizerInfo(const SISubtarget &ST,
|
|||||||
setAction({G_FPTOSI, S32}, Legal);
|
setAction({G_FPTOSI, S32}, Legal);
|
||||||
setAction({G_FPTOSI, 1, S32}, Legal);
|
setAction({G_FPTOSI, 1, S32}, Legal);
|
||||||
|
|
||||||
|
setAction({G_SITOFP, S32}, Legal);
|
||||||
|
setAction({G_SITOFP, 1, S32}, Legal);
|
||||||
|
|
||||||
setAction({G_FPTOUI, S32}, Legal);
|
setAction({G_FPTOUI, S32}, Legal);
|
||||||
setAction({G_FPTOUI, 1, S32}, Legal);
|
setAction({G_FPTOUI, 1, S32}, Legal);
|
||||||
|
|
||||||
|
36
test/CodeGen/AMDGPU/GlobalISel/inst-select-sitofp.mir
Normal file
36
test/CodeGen/AMDGPU/GlobalISel/inst-select-sitofp.mir
Normal file
@ -0,0 +1,36 @@
|
|||||||
|
# RUN: llc -march=amdgcn -run-pass=instruction-select -verify-machineinstrs -global-isel %s -o - | FileCheck %s -check-prefixes=GCN
|
||||||
|
|
||||||
|
--- |
|
||||||
|
define amdgpu_kernel void @sitofp(i32 addrspace(1)* %global0) {ret void}
|
||||||
|
...
|
||||||
|
---
|
||||||
|
|
||||||
|
name: sitofp
|
||||||
|
legalized: true
|
||||||
|
regBankSelected: true
|
||||||
|
|
||||||
|
# GCN-LABEL: name: sitofp
|
||||||
|
body: |
|
||||||
|
bb.0:
|
||||||
|
liveins: $sgpr0, $vgpr0, $vgpr3_vgpr4
|
||||||
|
|
||||||
|
; GCN: [[SGPR:%[0-9]+]]:sreg_32_xm0 = COPY $sgpr0
|
||||||
|
%0:sgpr(s32) = COPY $sgpr0
|
||||||
|
|
||||||
|
; GCN: [[VGPR:%[0-9]+]]:vgpr_32 = COPY $vgpr0
|
||||||
|
%1:vgpr(s32) = COPY $vgpr0
|
||||||
|
|
||||||
|
%2:vgpr(s64) = COPY $vgpr3_vgpr4
|
||||||
|
|
||||||
|
; sitofp s
|
||||||
|
; GCN: V_CVT_F32_I32_e64 [[SGPR]], 0, 0
|
||||||
|
%3:vgpr(s32) = G_SITOFP %0
|
||||||
|
|
||||||
|
; sitofp v
|
||||||
|
; GCN: V_CVT_F32_I32_e64 [[VGPR]], 0, 0
|
||||||
|
%4:vgpr(s32) = G_SITOFP %1
|
||||||
|
|
||||||
|
G_STORE %3, %2 :: (store 4 into %ir.global0)
|
||||||
|
G_STORE %4, %2 :: (store 4 into %ir.global0)
|
||||||
|
...
|
||||||
|
---
|
14
test/CodeGen/AMDGPU/GlobalISel/legalize-sitofp.mir
Normal file
14
test/CodeGen/AMDGPU/GlobalISel/legalize-sitofp.mir
Normal file
@ -0,0 +1,14 @@
|
|||||||
|
# NOTE: Assertions have been autogenerated by utils/update_mir_test_checks.py
|
||||||
|
# RUN: llc -mtriple=amdgcn-mesa-mesa3d -mcpu=fiji -run-pass=legalizer -global-isel %s -o - | FileCheck %s
|
||||||
|
|
||||||
|
---
# Legalizer test: an s32 value copied from $vgpr0 is fed to G_SITOFP producing
# an s32 result.
# NOTE(review): the test name reads as "f32 to i32", but the instruction under
# test is G_SITOFP with an s32 input -- presumably an int-to-float conversion;
# consider renaming (the CHECK-LABEL below must be kept in sync). Also note
# that no CHECK line covers the G_SITOFP result itself -- confirm intended.
|
||||||
|
name: test_sitofp_f32_to_i32
|
||||||
|
body: |
|
||||||
|
bb.0:
|
||||||
|
liveins: $vgpr0
|
||||||
|
|
||||||
|
; CHECK-LABEL: name: test_sitofp_f32_to_i32
|
||||||
|
; CHECK: [[COPY:%[0-9]+]]:_(s32) = COPY $vgpr0
|
||||||
|
%0:_(s32) = COPY $vgpr0
|
||||||
|
%1:_(s32) = G_SITOFP %0
|
||||||
|
...
|
Loading…
x
Reference in New Issue
Block a user