mirror of
https://github.com/RPCSX/llvm.git
synced 2025-02-04 11:27:34 +00:00
Use predication instead of pseudo-opcodes when folding into MOVCC.
Now that it is possible to dynamically tie MachineInstr operands, predicated instructions are possible in SSA form: %vreg3<def> = SUBri %vreg1, -2147483647, pred:14, pred:%noreg, %opt:%noreg %vreg4<def,tied1> = MOVCCr %vreg3<tied0>, %vreg1, %pred:12, pred:%CPSR Becomes a predicated SUBri with a tied imp-use: SUBri %vreg1, -2147483647, pred:13, pred:%CPSR, opt:%noreg, %vreg1<imp-use,tied0> This means that any instruction that is safe to move can be folded into a MOVCC, and the *CC pseudo-instructions are no longer needed. The test case changes reflect that Thumb2SizeReduce recognizes the predicated instructions. It didn't understand the pseudos. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@163274 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
parent
366df7945f
commit
098c6a547f
@ -1580,16 +1580,20 @@ ARMBaseInstrInfo::commuteInstruction(MachineInstr *MI, bool NewMI) const {
|
|||||||
}
|
}
|
||||||
|
|
||||||
/// Identify instructions that can be folded into a MOVCC instruction, and
|
/// Identify instructions that can be folded into a MOVCC instruction, and
|
||||||
/// return the corresponding opcode for the predicated pseudo-instruction.
|
/// return the defining instruction.
|
||||||
static unsigned canFoldIntoMOVCC(unsigned Reg, MachineInstr *&MI,
|
static MachineInstr *canFoldIntoMOVCC(unsigned Reg,
|
||||||
const MachineRegisterInfo &MRI) {
|
const MachineRegisterInfo &MRI,
|
||||||
|
const TargetInstrInfo *TII) {
|
||||||
if (!TargetRegisterInfo::isVirtualRegister(Reg))
|
if (!TargetRegisterInfo::isVirtualRegister(Reg))
|
||||||
return 0;
|
return 0;
|
||||||
if (!MRI.hasOneNonDBGUse(Reg))
|
if (!MRI.hasOneNonDBGUse(Reg))
|
||||||
return 0;
|
return 0;
|
||||||
MI = MRI.getVRegDef(Reg);
|
MachineInstr *MI = MRI.getVRegDef(Reg);
|
||||||
if (!MI)
|
if (!MI)
|
||||||
return 0;
|
return 0;
|
||||||
|
// MI is folded into the MOVCC by predicating it.
|
||||||
|
if (!MI->isPredicable())
|
||||||
|
return 0;
|
||||||
// Check if MI has any non-dead defs or physreg uses. This also detects
|
// Check if MI has any non-dead defs or physreg uses. This also detects
|
||||||
// predicated instructions which will be reading CPSR.
|
// predicated instructions which will be reading CPSR.
|
||||||
for (unsigned i = 1, e = MI->getNumOperands(); i != e; ++i) {
|
for (unsigned i = 1, e = MI->getNumOperands(); i != e; ++i) {
|
||||||
@ -1599,55 +1603,18 @@ static unsigned canFoldIntoMOVCC(unsigned Reg, MachineInstr *&MI,
|
|||||||
return 0;
|
return 0;
|
||||||
if (!MO.isReg())
|
if (!MO.isReg())
|
||||||
continue;
|
continue;
|
||||||
|
// MI can't have any tied operands, that would conflict with predication.
|
||||||
|
if (MO.isTied())
|
||||||
|
return 0;
|
||||||
if (TargetRegisterInfo::isPhysicalRegister(MO.getReg()))
|
if (TargetRegisterInfo::isPhysicalRegister(MO.getReg()))
|
||||||
return 0;
|
return 0;
|
||||||
if (MO.isDef() && !MO.isDead())
|
if (MO.isDef() && !MO.isDead())
|
||||||
return 0;
|
return 0;
|
||||||
}
|
}
|
||||||
switch (MI->getOpcode()) {
|
bool DontMoveAcrossStores = true;
|
||||||
default: return 0;
|
if (!MI->isSafeToMove(TII, /* AliasAnalysis = */ 0, DontMoveAcrossStores))
|
||||||
case ARM::ANDri: return ARM::ANDCCri;
|
return 0;
|
||||||
case ARM::ANDrr: return ARM::ANDCCrr;
|
return MI;
|
||||||
case ARM::ANDrsi: return ARM::ANDCCrsi;
|
|
||||||
case ARM::ANDrsr: return ARM::ANDCCrsr;
|
|
||||||
case ARM::t2ANDri: return ARM::t2ANDCCri;
|
|
||||||
case ARM::t2ANDrr: return ARM::t2ANDCCrr;
|
|
||||||
case ARM::t2ANDrs: return ARM::t2ANDCCrs;
|
|
||||||
case ARM::EORri: return ARM::EORCCri;
|
|
||||||
case ARM::EORrr: return ARM::EORCCrr;
|
|
||||||
case ARM::EORrsi: return ARM::EORCCrsi;
|
|
||||||
case ARM::EORrsr: return ARM::EORCCrsr;
|
|
||||||
case ARM::t2EORri: return ARM::t2EORCCri;
|
|
||||||
case ARM::t2EORrr: return ARM::t2EORCCrr;
|
|
||||||
case ARM::t2EORrs: return ARM::t2EORCCrs;
|
|
||||||
case ARM::ORRri: return ARM::ORRCCri;
|
|
||||||
case ARM::ORRrr: return ARM::ORRCCrr;
|
|
||||||
case ARM::ORRrsi: return ARM::ORRCCrsi;
|
|
||||||
case ARM::ORRrsr: return ARM::ORRCCrsr;
|
|
||||||
case ARM::t2ORRri: return ARM::t2ORRCCri;
|
|
||||||
case ARM::t2ORRrr: return ARM::t2ORRCCrr;
|
|
||||||
case ARM::t2ORRrs: return ARM::t2ORRCCrs;
|
|
||||||
|
|
||||||
// ARM ADD/SUB
|
|
||||||
case ARM::ADDri: return ARM::ADDCCri;
|
|
||||||
case ARM::ADDrr: return ARM::ADDCCrr;
|
|
||||||
case ARM::ADDrsi: return ARM::ADDCCrsi;
|
|
||||||
case ARM::ADDrsr: return ARM::ADDCCrsr;
|
|
||||||
case ARM::SUBri: return ARM::SUBCCri;
|
|
||||||
case ARM::SUBrr: return ARM::SUBCCrr;
|
|
||||||
case ARM::SUBrsi: return ARM::SUBCCrsi;
|
|
||||||
case ARM::SUBrsr: return ARM::SUBCCrsr;
|
|
||||||
|
|
||||||
// Thumb2 ADD/SUB
|
|
||||||
case ARM::t2ADDri: return ARM::t2ADDCCri;
|
|
||||||
case ARM::t2ADDri12: return ARM::t2ADDCCri12;
|
|
||||||
case ARM::t2ADDrr: return ARM::t2ADDCCrr;
|
|
||||||
case ARM::t2ADDrs: return ARM::t2ADDCCrs;
|
|
||||||
case ARM::t2SUBri: return ARM::t2SUBCCri;
|
|
||||||
case ARM::t2SUBri12: return ARM::t2SUBCCri12;
|
|
||||||
case ARM::t2SUBrr: return ARM::t2SUBCCrr;
|
|
||||||
case ARM::t2SUBrs: return ARM::t2SUBCCrs;
|
|
||||||
}
|
|
||||||
}
|
}
|
||||||
|
|
||||||
bool ARMBaseInstrInfo::analyzeSelect(const MachineInstr *MI,
|
bool ARMBaseInstrInfo::analyzeSelect(const MachineInstr *MI,
|
||||||
@ -1676,19 +1643,18 @@ MachineInstr *ARMBaseInstrInfo::optimizeSelect(MachineInstr *MI,
|
|||||||
assert((MI->getOpcode() == ARM::MOVCCr || MI->getOpcode() == ARM::t2MOVCCr) &&
|
assert((MI->getOpcode() == ARM::MOVCCr || MI->getOpcode() == ARM::t2MOVCCr) &&
|
||||||
"Unknown select instruction");
|
"Unknown select instruction");
|
||||||
const MachineRegisterInfo &MRI = MI->getParent()->getParent()->getRegInfo();
|
const MachineRegisterInfo &MRI = MI->getParent()->getParent()->getRegInfo();
|
||||||
MachineInstr *DefMI = 0;
|
MachineInstr *DefMI = canFoldIntoMOVCC(MI->getOperand(2).getReg(), MRI, this);
|
||||||
unsigned Opc = canFoldIntoMOVCC(MI->getOperand(2).getReg(), DefMI, MRI);
|
bool Invert = !DefMI;
|
||||||
bool Invert = !Opc;
|
if (!DefMI)
|
||||||
if (!Opc)
|
DefMI = canFoldIntoMOVCC(MI->getOperand(1).getReg(), MRI, this);
|
||||||
Opc = canFoldIntoMOVCC(MI->getOperand(1).getReg(), DefMI, MRI);
|
if (!DefMI)
|
||||||
if (!Opc)
|
|
||||||
return 0;
|
return 0;
|
||||||
|
|
||||||
// Create a new predicated version of DefMI.
|
// Create a new predicated version of DefMI.
|
||||||
// Rfalse is the first use.
|
// Rfalse is the first use.
|
||||||
MachineInstrBuilder NewMI = BuildMI(*MI->getParent(), MI, MI->getDebugLoc(),
|
MachineInstrBuilder NewMI = BuildMI(*MI->getParent(), MI, MI->getDebugLoc(),
|
||||||
get(Opc), MI->getOperand(0).getReg())
|
DefMI->getDesc(),
|
||||||
.addOperand(MI->getOperand(Invert ? 2 : 1));
|
MI->getOperand(0).getReg());
|
||||||
|
|
||||||
// Copy all the DefMI operands, excluding its (null) predicate.
|
// Copy all the DefMI operands, excluding its (null) predicate.
|
||||||
const MCInstrDesc &DefDesc = DefMI->getDesc();
|
const MCInstrDesc &DefDesc = DefMI->getDesc();
|
||||||
@ -1707,6 +1673,15 @@ MachineInstr *ARMBaseInstrInfo::optimizeSelect(MachineInstr *MI,
|
|||||||
if (NewMI->hasOptionalDef())
|
if (NewMI->hasOptionalDef())
|
||||||
AddDefaultCC(NewMI);
|
AddDefaultCC(NewMI);
|
||||||
|
|
||||||
|
// The output register value when the predicate is false is an implicit
|
||||||
|
// register operand tied to the first def.
|
||||||
|
// The tie makes the register allocator ensure the FalseReg is allocated the
|
||||||
|
// same register as operand 0.
|
||||||
|
MachineOperand FalseReg = MI->getOperand(Invert ? 2 : 1);
|
||||||
|
FalseReg.setImplicit();
|
||||||
|
NewMI->addOperand(FalseReg);
|
||||||
|
NewMI->tieOperands(0, NewMI->getNumOperands() - 1);
|
||||||
|
|
||||||
// The caller will erase MI, but not DefMI.
|
// The caller will erase MI, but not DefMI.
|
||||||
DefMI->eraseFromParent();
|
DefMI->eraseFromParent();
|
||||||
return NewMI;
|
return NewMI;
|
||||||
|
@ -80,7 +80,7 @@ define double @f7(double %a, double %b) {
|
|||||||
; CHECK-NEON: adr [[R2:r[0-9]+]], LCPI7_0
|
; CHECK-NEON: adr [[R2:r[0-9]+]], LCPI7_0
|
||||||
; CHECK-NEON-NEXT: cmp r0, [[R3]]
|
; CHECK-NEON-NEXT: cmp r0, [[R3]]
|
||||||
; CHECK-NEON-NEXT: it eq
|
; CHECK-NEON-NEXT: it eq
|
||||||
; CHECK-NEON-NEXT: addeq.w {{r.*}}, [[R2]]
|
; CHECK-NEON-NEXT: addeq{{.*}} [[R2]], #4
|
||||||
; CHECK-NEON-NEXT: ldr
|
; CHECK-NEON-NEXT: ldr
|
||||||
; CHECK-NEON: bx
|
; CHECK-NEON: bx
|
||||||
|
|
||||||
|
@ -9,7 +9,7 @@ define i32 @t1(i32 %a, i32 %b, i32 %c) nounwind {
|
|||||||
|
|
||||||
; T2: t1:
|
; T2: t1:
|
||||||
; T2: mvn r0, #-2147483648
|
; T2: mvn r0, #-2147483648
|
||||||
; T2: addle.w r1, r1
|
; T2: addle r1, r0
|
||||||
; T2: mov r0, r1
|
; T2: mov r0, r1
|
||||||
%tmp1 = icmp sgt i32 %c, 10
|
%tmp1 = icmp sgt i32 %c, 10
|
||||||
%tmp2 = select i1 %tmp1, i32 0, i32 2147483647
|
%tmp2 = select i1 %tmp1, i32 0, i32 2147483647
|
||||||
@ -23,7 +23,7 @@ define i32 @t2(i32 %a, i32 %b, i32 %c, i32 %d) nounwind {
|
|||||||
; ARM: mov r0, r1
|
; ARM: mov r0, r1
|
||||||
|
|
||||||
; T2: t2:
|
; T2: t2:
|
||||||
; T2: suble.w r1, r1, #10
|
; T2: suble r1, #10
|
||||||
; T2: mov r0, r1
|
; T2: mov r0, r1
|
||||||
%tmp1 = icmp sgt i32 %c, 10
|
%tmp1 = icmp sgt i32 %c, 10
|
||||||
%tmp2 = select i1 %tmp1, i32 0, i32 10
|
%tmp2 = select i1 %tmp1, i32 0, i32 10
|
||||||
@ -37,7 +37,7 @@ define i32 @t3(i32 %a, i32 %b, i32 %x, i32 %y) nounwind {
|
|||||||
; ARM: mov r0, r3
|
; ARM: mov r0, r3
|
||||||
|
|
||||||
; T2: t3:
|
; T2: t3:
|
||||||
; T2: andge.w r3, r3, r2
|
; T2: andge r3, r2
|
||||||
; T2: mov r0, r3
|
; T2: mov r0, r3
|
||||||
%cond = icmp slt i32 %a, %b
|
%cond = icmp slt i32 %a, %b
|
||||||
%z = select i1 %cond, i32 -1, i32 %x
|
%z = select i1 %cond, i32 -1, i32 %x
|
||||||
@ -51,7 +51,7 @@ define i32 @t4(i32 %a, i32 %b, i32 %x, i32 %y) nounwind {
|
|||||||
; ARM: mov r0, r3
|
; ARM: mov r0, r3
|
||||||
|
|
||||||
; T2: t4:
|
; T2: t4:
|
||||||
; T2: orrge.w r3, r3, r2
|
; T2: orrge r3, r2
|
||||||
; T2: mov r0, r3
|
; T2: mov r0, r3
|
||||||
%cond = icmp slt i32 %a, %b
|
%cond = icmp slt i32 %a, %b
|
||||||
%z = select i1 %cond, i32 0, i32 %x
|
%z = select i1 %cond, i32 0, i32 %x
|
||||||
@ -81,7 +81,7 @@ define i32 @t6(i32 %a, i32 %b, i32 %c, i32 %d) nounwind {
|
|||||||
|
|
||||||
; T2: t6:
|
; T2: t6:
|
||||||
; T2-NOT: movge
|
; T2-NOT: movge
|
||||||
; T2: eorlt.w r3, r3, r2
|
; T2: eorlt r3, r2
|
||||||
%cond = icmp slt i32 %a, %b
|
%cond = icmp slt i32 %a, %b
|
||||||
%tmp1 = select i1 %cond, i32 %c, i32 0
|
%tmp1 = select i1 %cond, i32 %c, i32 0
|
||||||
%tmp2 = xor i32 %tmp1, %d
|
%tmp2 = xor i32 %tmp1, %d
|
||||||
@ -200,7 +200,7 @@ entry:
|
|||||||
|
|
||||||
; T2: t13
|
; T2: t13
|
||||||
; T2: cmp r1, #10
|
; T2: cmp r1, #10
|
||||||
; T2: addgt.w r0, r0, #1
|
; T2: addgt r0, #1
|
||||||
%cmp = icmp sgt i32 %a, 10
|
%cmp = icmp sgt i32 %a, 10
|
||||||
%conv = zext i1 %cmp to i32
|
%conv = zext i1 %cmp to i32
|
||||||
%add = add i32 %conv, %c
|
%add = add i32 %conv, %c
|
||||||
@ -216,7 +216,7 @@ entry:
|
|||||||
|
|
||||||
; T2: t14
|
; T2: t14
|
||||||
; T2: cmp r1, #10
|
; T2: cmp r1, #10
|
||||||
; T2: subgt.w r0, r0, #1
|
; T2: subgt r0, #1
|
||||||
%cmp = icmp sgt i32 %a, 10
|
%cmp = icmp sgt i32 %a, 10
|
||||||
%conv = sext i1 %cmp to i32
|
%conv = sext i1 %cmp to i32
|
||||||
%add = add i32 %conv, %c
|
%add = add i32 %conv, %c
|
||||||
|
@ -5,7 +5,7 @@ define i32 @t1(i32 %a, i32 %b, i32 %c) nounwind {
|
|||||||
; CHECK: mvn r0, #-2147483648
|
; CHECK: mvn r0, #-2147483648
|
||||||
; CHECK: cmp r2, #10
|
; CHECK: cmp r2, #10
|
||||||
; CHECK: it le
|
; CHECK: it le
|
||||||
; CHECK: addle.w r1, r1, r0
|
; CHECK: addle r1, r0
|
||||||
; CHECK: mov r0, r1
|
; CHECK: mov r0, r1
|
||||||
%tmp1 = icmp sgt i32 %c, 10
|
%tmp1 = icmp sgt i32 %c, 10
|
||||||
%tmp2 = select i1 %tmp1, i32 0, i32 2147483647
|
%tmp2 = select i1 %tmp1, i32 0, i32 2147483647
|
||||||
@ -30,7 +30,7 @@ define i32 @t3(i32 %a, i32 %b, i32 %c, i32 %d) nounwind {
|
|||||||
; CHECK: t3
|
; CHECK: t3
|
||||||
; CHECK: cmp r2, #10
|
; CHECK: cmp r2, #10
|
||||||
; CHECK: it le
|
; CHECK: it le
|
||||||
; CHECK: suble.w r1, r1, #10
|
; CHECK: suble r1, #10
|
||||||
; CHECK: mov r0, r1
|
; CHECK: mov r0, r1
|
||||||
%tmp1 = icmp sgt i32 %c, 10
|
%tmp1 = icmp sgt i32 %c, 10
|
||||||
%tmp2 = select i1 %tmp1, i32 0, i32 10
|
%tmp2 = select i1 %tmp1, i32 0, i32 10
|
||||||
|
Loading…
x
Reference in New Issue
Block a user