mirror of
https://github.com/capstone-engine/llvm-capstone.git
synced 2025-01-24 10:07:48 +00:00
Remove VMOVDneon and VMOVQ, which are just aliases for VORR. This continues to simplify the path towards an auto-generated disassembler.
llvm-svn: 135290
This commit is contained in:
parent
e0dda9c1c8
commit
454e1c7abb
@ -637,7 +637,7 @@ void ARMBaseInstrInfo::copyPhysReg(MachineBasicBlock &MBB,
|
||||
else if (ARM::DPRRegClass.contains(DestReg, SrcReg))
|
||||
Opc = ARM::VMOVD;
|
||||
else if (ARM::QPRRegClass.contains(DestReg, SrcReg))
|
||||
Opc = ARM::VMOVQ;
|
||||
Opc = ARM::VORRq;
|
||||
else if (ARM::QQPRRegClass.contains(DestReg, SrcReg))
|
||||
Opc = ARM::VMOVQQ;
|
||||
else if (ARM::QQQQPRRegClass.contains(DestReg, SrcReg))
|
||||
@ -647,6 +647,8 @@ void ARMBaseInstrInfo::copyPhysReg(MachineBasicBlock &MBB,
|
||||
|
||||
MachineInstrBuilder MIB = BuildMI(MBB, I, DL, get(Opc), DestReg);
|
||||
MIB.addReg(SrcReg, getKillRegState(KillSrc));
|
||||
if (Opc == ARM::VORRq)
|
||||
MIB.addReg(SrcReg, getKillRegState(KillSrc));
|
||||
if (Opc != ARM::VMOVQQ && Opc != ARM::VMOVQQQQ)
|
||||
AddDefaultPred(MIB);
|
||||
}
|
||||
|
@ -964,15 +964,17 @@ bool ARMExpandPseudo::ExpandMI(MachineBasicBlock &MBB,
|
||||
unsigned OddSrc = TRI->getSubReg(SrcReg, ARM::qsub_1);
|
||||
MachineInstrBuilder Even =
|
||||
AddDefaultPred(BuildMI(MBB, MBBI, MI.getDebugLoc(),
|
||||
TII->get(ARM::VMOVQ))
|
||||
TII->get(ARM::VORRq))
|
||||
.addReg(EvenDst,
|
||||
RegState::Define | getDeadRegState(DstIsDead))
|
||||
.addReg(EvenSrc, getKillRegState(SrcIsKill))
|
||||
.addReg(EvenSrc, getKillRegState(SrcIsKill)));
|
||||
MachineInstrBuilder Odd =
|
||||
AddDefaultPred(BuildMI(MBB, MBBI, MI.getDebugLoc(),
|
||||
TII->get(ARM::VMOVQ))
|
||||
TII->get(ARM::VORRq))
|
||||
.addReg(OddDst,
|
||||
RegState::Define | getDeadRegState(DstIsDead))
|
||||
.addReg(OddSrc, getKillRegState(SrcIsKill))
|
||||
.addReg(OddSrc, getKillRegState(SrcIsKill)));
|
||||
TransferImpOps(MI, Even, Odd);
|
||||
MI.eraseFromParent();
|
||||
|
@ -4214,17 +4214,12 @@ def VSWPq : N2VX<0b11, 0b11, 0b00, 0b10, 0b00000, 1, 0,
|
||||
// Vector Move Operations.
|
||||
|
||||
// VMOV : Vector Move (Register)
|
||||
def : InstAlias<"vmov${p} $Vd, $Vm",
|
||||
(VORRd DPR:$Vd, DPR:$Vm, DPR:$Vm, pred:$p)>;
|
||||
def : InstAlias<"vmov${p} $Vd, $Vm",
|
||||
(VORRq QPR:$Vd, QPR:$Vm, QPR:$Vm, pred:$p)>;
|
||||
|
||||
let neverHasSideEffects = 1 in {
|
||||
def VMOVDneon: N3VX<0, 0, 0b10, 0b0001, 0, 1, (outs DPR:$Vd), (ins DPR:$Vm),
|
||||
N3RegFrm, IIC_VMOV, "vmov", "$Vd, $Vm", "", []> {
|
||||
let Vn{4-0} = Vm{4-0};
|
||||
}
|
||||
def VMOVQ : N3VX<0, 0, 0b10, 0b0001, 1, 1, (outs QPR:$Vd), (ins QPR:$Vm),
|
||||
N3RegFrm, IIC_VMOV, "vmov", "$Vd, $Vm", "", []> {
|
||||
let Vn{4-0} = Vm{4-0};
|
||||
}
|
||||
|
||||
// Pseudo vector move instructions for QQ and QQQQ registers. This should
|
||||
// be expanded after register allocation is completed.
|
||||
def VMOVQQ : PseudoInst<(outs QQPR:$dst), (ins QQPR:$src),
|
||||
|
@ -3093,11 +3093,6 @@ static bool DisassembleNVdVnVmOptImm(MCInst &MI, unsigned Opcode, uint32_t insn,
|
||||
: decodeNEONRm(insn))));
|
||||
++OpIdx;
|
||||
|
||||
// Special case handling for VMOVDneon and VMOVQ because they are marked as
|
||||
// N3RegFrm.
|
||||
if (Opcode == ARM::VMOVDneon || Opcode == ARM::VMOVQ)
|
||||
return true;
|
||||
|
||||
// Dm = Inst{5:3-0} => NEON Rm
|
||||
// or
|
||||
// Dm is restricted to D0-D7 if size is 16, D0-D15 otherwise
|
||||
|
@ -77,7 +77,7 @@ bool NEONMoveFixPass::InsertMoves(MachineBasicBlock &MBB) {
|
||||
}
|
||||
|
||||
if (inNEONDomain(Domain, isA8)) {
|
||||
// Convert VMOVD to VMOVDneon
|
||||
// Convert VMOVD to VORRd
|
||||
unsigned DestReg = MI->getOperand(0).getReg();
|
||||
|
||||
DEBUG({errs() << "vmov convert: "; MI->dump();});
|
||||
@ -88,7 +88,8 @@ bool NEONMoveFixPass::InsertMoves(MachineBasicBlock &MBB) {
|
||||
// - The imp-defs / imp-uses are superregs only, we don't care about
|
||||
// them.
|
||||
AddDefaultPred(BuildMI(MBB, *MI, MI->getDebugLoc(),
|
||||
TII->get(ARM::VMOVDneon), DestReg).addReg(SrcReg));
|
||||
TII->get(ARM::VORRd), DestReg)
|
||||
.addReg(SrcReg).addReg(SrcReg));
|
||||
MBB.erase(MI);
|
||||
MachineBasicBlock::iterator I = prior(NextMII);
|
||||
MI = &*I;
|
||||
|
@ -19,7 +19,7 @@ entry:
|
||||
%5 = call <2 x float> @llvm.arm.neon.vpadd.v2f32(<2 x float> %3, <2 x float> %4) nounwind ; <<2 x float>> [#uses=2]
|
||||
%6 = call <2 x float> @llvm.arm.neon.vpadd.v2f32(<2 x float> %5, <2 x float> %5) nounwind ; <<2 x float>> [#uses=2]
|
||||
%7 = shufflevector <2 x float> %6, <2 x float> %6, <4 x i32> <i32 0, i32 1, i32 2, i32 3> ; <<4 x float>> [#uses=2]
|
||||
;CHECK: vmov
|
||||
;CHECK: vorr
|
||||
%8 = call <4 x float> @llvm.arm.neon.vrsqrte.v4f32(<4 x float> %7) nounwind ; <<4 x float>> [#uses=3]
|
||||
%9 = fmul <4 x float> %8, %8 ; <<4 x float>> [#uses=1]
|
||||
%10 = call <4 x float> @llvm.arm.neon.vrsqrts.v4f32(<4 x float> %9, <4 x float> %7) nounwind ; <<4 x float>> [#uses=1]
|
||||
|
@ -124,7 +124,7 @@ return1:
|
||||
return2:
|
||||
; CHECK: %return2
|
||||
; CHECK: vadd.i32
|
||||
; CHECK: vmov {{q[0-9]+}}, {{q[0-9]+}}
|
||||
; CHECK: vorr {{q[0-9]+}}, {{q[0-9]+}}
|
||||
; CHECK-NOT: vmov
|
||||
; CHECK: vst2.32 {d{{[0-9]+}}, d{{[0-9]+}}, d{{[0-9]+}}, d{{[0-9]+}}}
|
||||
%tmp100 = extractvalue %struct.__neon_int32x4x2_t %tmp2, 0 ; <<4 x i32>> [#uses=1]
|
||||
@ -139,7 +139,7 @@ define <8 x i16> @t5(i16* %A, <8 x i16>* %B) nounwind {
|
||||
; CHECK: t5:
|
||||
; CHECK: vldmia
|
||||
; How can FileCheck match Q and D registers? We need a lisp interpreter.
|
||||
; CHECK: vmov {{q[0-9]+}}, {{q[0-9]+}}
|
||||
; CHECK: vorr {{q[0-9]+}}, {{q[0-9]+}}, {{q[0-9]+}}
|
||||
; CHECK-NOT: vmov
|
||||
; CHECK: vld2.16 {d{{[0-9]+}}[1], d{{[0-9]+}}[1]}, [r0]
|
||||
; CHECK-NOT: vmov
|
||||
@ -156,7 +156,7 @@ define <8 x i16> @t5(i16* %A, <8 x i16>* %B) nounwind {
|
||||
define <8 x i8> @t6(i8* %A, <8 x i8>* %B) nounwind {
|
||||
; CHECK: t6:
|
||||
; CHECK: vldr.64
|
||||
; CHECK: vmov d[[D0:[0-9]+]], d[[D1:[0-9]+]]
|
||||
; CHECK: vorr d[[D0:[0-9]+]], d[[D1:[0-9]+]]
|
||||
; CHECK-NEXT: vld2.8 {d[[D1]][1], d[[D0]][1]}
|
||||
%tmp1 = load <8 x i8>* %B ; <<8 x i8>> [#uses=2]
|
||||
%tmp2 = call %struct.__neon_int8x8x2_t @llvm.arm.neon.vld2lane.v8i8(i8* %A, <8 x i8> %tmp1, <8 x i8> %tmp1, i32 1, i32 1) ; <%struct.__neon_int8x8x2_t> [#uses=2]
|
||||
@ -172,7 +172,7 @@ entry:
|
||||
; CHECK: vld2.32
|
||||
; CHECK: vst2.32
|
||||
; CHECK: vld1.32 {d{{[0-9]+}}, d{{[0-9]+}}},
|
||||
; CHECK: vmov q[[Q0:[0-9]+]], q[[Q1:[0-9]+]]
|
||||
; CHECK: vorr q[[Q0:[0-9]+]], q[[Q1:[0-9]+]], q[[Q1:[0-9]+]]
|
||||
; CHECK-NOT: vmov
|
||||
; CHECK: vuzp.32 q[[Q1]], q[[Q0]]
|
||||
; CHECK: vst1.32
|
||||
@ -272,8 +272,8 @@ define arm_aapcs_vfpcc float @t9(%0* nocapture, %3* nocapture) nounwind {
|
||||
define arm_aapcs_vfpcc i32 @t10() nounwind {
|
||||
entry:
|
||||
; CHECK: t10:
|
||||
; CHECK: vmul.f32 q8, q8, d0[0]
|
||||
; CHECK: vmov.i32 q[[Q0:[0-9]+]], #0x3F000000
|
||||
; CHECK: vmul.f32 q8, q8, d0[0]
|
||||
; CHECK: vadd.f32 q8, q8, q8
|
||||
%0 = shufflevector <4 x float> zeroinitializer, <4 x float> undef, <4 x i32> zeroinitializer ; <<4 x float>> [#uses=1]
|
||||
%1 = insertelement <4 x float> %0, float undef, i32 1 ; <<4 x float>> [#uses=1]
|
||||
|
@ -27,7 +27,7 @@
|
||||
# CHECK: vld4.16 {d3[], d4[], d5[], d6[]}, [r0, :64]!
|
||||
0x7d 0x3f 0xa0 0xf4
|
||||
|
||||
# CHECK: vmov d0, d15
|
||||
# CHECK: vorr d0, d15, d15
|
||||
0x1f 0x01 0x2f 0xf2
|
||||
|
||||
# CHECK: vmov.i64 q6, #0xFF00FF00FF
|
||||
|
Loading…
x
Reference in New Issue
Block a user