mirror of
https://github.com/RPCSX/llvm.git
synced 2025-02-06 04:19:10 +00:00
[AMDGPU] Disassembler: fix for disaasembling v_mac_f32/16_dpp/sdwa
Summary: Real instruction should copy constraints from real instruction. This allows auto-generated disassembler to correctly process tied operands. Reviewers: nhaustov, vpykhtin, tstellarAMD Subscribers: arsenm, kzhuravl, wdng, nhaehnle, yaxunl, tony-tye Differential Revision: https://reviews.llvm.org/D27847 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@290336 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
parent
64a0af2928
commit
b94ac0f1d9
@ -56,6 +56,9 @@ class VOP1_Real <VOP1_Pseudo ps, int EncodingFamily> :
|
||||
let isPseudo = 0;
|
||||
let isCodeGenOnly = 0;
|
||||
|
||||
let Constraints = ps.Constraints;
|
||||
let DisableEncoding = ps.DisableEncoding;
|
||||
|
||||
// copy relevant pseudo op flags
|
||||
let SubtargetPredicate = ps.SubtargetPredicate;
|
||||
let AsmMatchConverter = ps.AsmMatchConverter;
|
||||
@ -212,7 +215,6 @@ def VOP_MOVRELD : VOPProfile<[untyped, i32, untyped, untyped]> {
|
||||
let Outs = (outs);
|
||||
let Ins32 = (ins Src0RC32:$vdst, VSrc_b32:$src0);
|
||||
let Ins64 = (ins Src0RC64:$vdst, VSrc_b32:$src0);
|
||||
|
||||
let InsDPP = (ins Src0RC32:$vdst, Src0RC32:$src0, dpp_ctrl:$dpp_ctrl, row_mask:$row_mask,
|
||||
bank_mask:$bank_mask, bound_ctrl:$bound_ctrl);
|
||||
let InsSDWA = (ins Src0RC32:$vdst, Int32InputMods:$src0_modifiers, VCSrc_b32:$src0,
|
||||
@ -426,6 +428,8 @@ class VOP1_SDWA <bits<8> op, VOP1_Pseudo ps, VOPProfile P = ps.Pfl> :
|
||||
let Uses = ps.Uses;
|
||||
let SchedRW = ps.SchedRW;
|
||||
let hasSideEffects = ps.hasSideEffects;
|
||||
let Constraints = ps.Constraints;
|
||||
let DisableEncoding = ps.DisableEncoding;
|
||||
let AsmMatchConverter = "cvtSdwaVOP1";
|
||||
|
||||
bits<8> vdst;
|
||||
@ -441,6 +445,8 @@ class VOP1_DPP <bits<8> op, VOP1_Pseudo ps, VOPProfile P = ps.Pfl> :
|
||||
let Uses = ps.Uses;
|
||||
let SchedRW = ps.SchedRW;
|
||||
let hasSideEffects = ps.hasSideEffects;
|
||||
let Constraints = ps.Constraints;
|
||||
let DisableEncoding = ps.DisableEncoding;
|
||||
|
||||
bits<8> vdst;
|
||||
let Inst{8-0} = 0xfa; // dpp
|
||||
|
@ -72,6 +72,9 @@ class VOP2_Real <VOP2_Pseudo ps, int EncodingFamily> :
|
||||
let isPseudo = 0;
|
||||
let isCodeGenOnly = 0;
|
||||
|
||||
let Constraints = ps.Constraints;
|
||||
let DisableEncoding = ps.DisableEncoding;
|
||||
|
||||
// copy relevant pseudo op flags
|
||||
let SubtargetPredicate = ps.SubtargetPredicate;
|
||||
let AsmMatchConverter = ps.AsmMatchConverter;
|
||||
@ -157,13 +160,13 @@ class VOP_MAC <ValueType vt> : VOPProfile <[vt, vt, vt, vt]> {
|
||||
let Ins32 = (ins Src0RC32:$src0, Src1RC32:$src1, VGPR_32:$src2);
|
||||
let Ins64 = getIns64<Src0RC64, Src1RC64, RegisterOperand<VGPR_32>, 3,
|
||||
HasModifiers, Src0Mod, Src1Mod, Src2Mod>.ret;
|
||||
let InsDPP = (ins FP32InputMods:$src0_modifiers, Src0RC32:$src0,
|
||||
FP32InputMods:$src1_modifiers, Src1RC32:$src1,
|
||||
let InsDPP = (ins FP32InputMods:$src0_modifiers, Src0DPP:$src0,
|
||||
FP32InputMods:$src1_modifiers, Src1DPP:$src1,
|
||||
VGPR_32:$src2, // stub argument
|
||||
dpp_ctrl:$dpp_ctrl, row_mask:$row_mask,
|
||||
bank_mask:$bank_mask, bound_ctrl:$bound_ctrl);
|
||||
let InsSDWA = (ins FP32InputMods:$src0_modifiers, Src0RC32:$src0,
|
||||
FP32InputMods:$src1_modifiers, Src1RC32:$src1,
|
||||
let InsSDWA = (ins FP32InputMods:$src0_modifiers, Src0SDWA:$src0,
|
||||
FP32InputMods:$src1_modifiers, Src1SDWA:$src1,
|
||||
VGPR_32:$src2, // stub argument
|
||||
clampmod:$clamp, dst_sel:$dst_sel, dst_unused:$dst_unused,
|
||||
src0_sel:$src0_sel, src1_sel:$src1_sel);
|
||||
@ -557,6 +560,8 @@ class VOP2_SDWA <bits<6> op, VOP2_Pseudo ps, VOPProfile P = ps.Pfl> :
|
||||
let Uses = ps.Uses;
|
||||
let SchedRW = ps.SchedRW;
|
||||
let hasSideEffects = ps.hasSideEffects;
|
||||
let Constraints = ps.Constraints;
|
||||
let DisableEncoding = ps.DisableEncoding;
|
||||
let AsmMatchConverter = "cvtSdwaVOP2";
|
||||
|
||||
bits<8> vdst;
|
||||
@ -574,6 +579,8 @@ class VOP2_DPP <bits<6> op, VOP2_Pseudo ps, VOPProfile P = ps.Pfl> :
|
||||
let Uses = ps.Uses;
|
||||
let SchedRW = ps.SchedRW;
|
||||
let hasSideEffects = ps.hasSideEffects;
|
||||
let Constraints = ps.Constraints;
|
||||
let DisableEncoding = ps.DisableEncoding;
|
||||
|
||||
bits<8> vdst;
|
||||
bits<8> src1;
|
||||
|
@ -71,6 +71,9 @@ class VOPC_Real <VOPC_Pseudo ps, int EncodingFamily> :
|
||||
let isPseudo = 0;
|
||||
let isCodeGenOnly = 0;
|
||||
|
||||
let Constraints = ps.Constraints;
|
||||
let DisableEncoding = ps.DisableEncoding;
|
||||
|
||||
// copy relevant pseudo op flags
|
||||
let SubtargetPredicate = ps.SubtargetPredicate;
|
||||
let AsmMatchConverter = ps.AsmMatchConverter;
|
||||
@ -826,6 +829,8 @@ class VOPC_SDWA<bits<8> op, VOPC_Pseudo ps, VOPProfile P = ps.Pfl> :
|
||||
let AsmMatchConverter = "cvtSdwaVOPC";
|
||||
let isCompare = ps.isCompare;
|
||||
let isCommutable = ps.isCommutable;
|
||||
let Constraints = ps.Constraints;
|
||||
let DisableEncoding = ps.DisableEncoding;
|
||||
|
||||
bits<8> src1;
|
||||
let Inst{8-0} = 0xf9; // sdwa
|
||||
|
@ -118,6 +118,9 @@ class VOP3_Real <VOP3_Pseudo ps, int EncodingFamily> :
|
||||
let isPseudo = 0;
|
||||
let isCodeGenOnly = 0;
|
||||
|
||||
let Constraints = ps.Constraints;
|
||||
let DisableEncoding = ps.DisableEncoding;
|
||||
|
||||
// copy relevant pseudo op flags
|
||||
let SubtargetPredicate = ps.SubtargetPredicate;
|
||||
let AsmMatchConverter = ps.AsmMatchConverter;
|
||||
|
@ -85,5 +85,10 @@
|
||||
0xfa 0x00 0x00 0x02 0x00 0x01 0x99 0xa1
|
||||
|
||||
# VI: v_add_f32_dpp v0, |v0|, -v0 row_shl:1 row_mask:0xa bank_mask:0x1 bound_ctrl:0 ; encoding: [0xfa,0x00,0x00,0x02,0x00,0x01,0x69,0xa1]
|
||||
0xfa 0x00 0x00 0x02 0x00 0x01 0x69 0xa1
|
||||
|
||||
0xfa 0x00 0x00 0x02 0x00 0x01 0x69 0xa1
|
||||
# VI: v_mac_f32_dpp v76, v76, v114 quad_perm:[2,3,0,1] row_mask:0xf bank_mask:0xf ; encoding: [0xfa,0xe4,0x98,0x2c,0x4c,0x4e,0x00,0xff]
|
||||
0xfa 0xe4 0x98 0x2c 0x4c 0x4e 0x00 0xff
|
||||
|
||||
# VI: v_mac_f16_dpp v1, v2, v3 row_shl:1 row_mask:0xa bank_mask:0x1 bound_ctrl:0 ; encoding: [0xfa,0x06,0x02,0x46,0x02,0x01,0x09,0xa1]
|
||||
0xfa 0x06 0x02 0x46 0x02 0x01 0x09 0xa1
|
@ -300,8 +300,11 @@
|
||||
# VI: v_mul_f16_sdwa v1, v2, v3 dst_sel:DWORD dst_unused:UNUSED_PAD src0_sel:WORD_1 src1_sel:BYTE_2 ; encoding: [0xf9,0x06,0x02,0x44,0x02,0x06,0x05,0x02]
|
||||
0xf9 0x06 0x02 0x44 0x02 0x06 0x05 0x02
|
||||
|
||||
# VI: v_mac_f16_e32 v1, v2, v3 ; encoding: [0x02,0x07,0x02,0x46]
|
||||
0x02,0x07,0x02,0x46
|
||||
# VI: v_mac_f32_sdwa v15, v99, v194 dst_sel:DWORD dst_unused:UNUSED_SEXT src0_sel:WORD_0 src1_sel:DWORD ; encoding: [0xf9,0x84,0x1f,0x2c,0x63,0x0e,0x04,0x06]
|
||||
0xf9 0x84 0x1f 0x2c 0x63 0x0e 0x04 0x06
|
||||
|
||||
# VI: v_mac_f16_sdwa v1, v2, v3 dst_sel:DWORD dst_unused:UNUSED_PAD src0_sel:WORD_1 src1_sel:BYTE_2 ; encoding: [0xf9,0x06,0x02,0x46,0x02,0x06,0x05,0x02]
|
||||
0xf9 0x06 0x02 0x46 0x02 0x06 0x05 0x02
|
||||
|
||||
# VI: v_add_u16_sdwa v1, v2, v3 dst_sel:DWORD dst_unused:UNUSED_PAD src0_sel:WORD_1 src1_sel:BYTE_2 ; encoding: [0xf9,0x06,0x02,0x4c,0x02,0x06,0x05,0x02]
|
||||
0xf9 0x06 0x02 0x4c 0x02 0x06 0x05 0x02
|
||||
|
Loading…
x
Reference in New Issue
Block a user