diff --git a/lib/CodeGen/MachineCSE.cpp b/lib/CodeGen/MachineCSE.cpp index 80982bca8ce..35ba7ff35e6 100644 --- a/lib/CodeGen/MachineCSE.cpp +++ b/lib/CodeGen/MachineCSE.cpp @@ -133,16 +133,26 @@ bool MachineCSE::PerformTrivialCoalescing(MachineInstr *MI, continue; if (DefMI->getOperand(0).getSubReg()) continue; - unsigned SrcSubReg = DefMI->getOperand(1).getSubReg(); + // FIXME: We should trivially coalesce subregister copies to expose CSE + // opportunities on instructions with truncated operands (see + // cse-add-with-overflow.ll). This can be done here as follows: + // if (SrcSubReg) + // RC = TRI->getMatchingSuperRegClass(MRI->getRegClass(SrcReg), RC, + // SrcSubReg); + // MO.substVirtReg(SrcReg, SrcSubReg, *TRI); + // + // The 2-addr pass has been updated to handle coalesced subregs. However, + // some machine-specific code still can't handle it. + // To handle it properly we also need a way find a constrained subregister + // class given a super-reg class and subreg index. + if (DefMI->getOperand(1).getSubReg()) + continue; const TargetRegisterClass *RC = MRI->getRegClass(Reg); - if (SrcSubReg) - RC = TRI->getMatchingSuperRegClass(MRI->getRegClass(SrcReg), RC, - SrcSubReg); if (!MRI->constrainRegClass(SrcReg, RC)) continue; DEBUG(dbgs() << "Coalescing: " << *DefMI); DEBUG(dbgs() << "*** to: " << *MI); - MO.substVirtReg(SrcReg, SrcSubReg, *TRI); + MO.setReg(SrcReg); MRI->clearKillFlags(SrcReg); DefMI->eraseFromParent(); ++NumCoalesces; diff --git a/test/CodeGen/X86/cmov.ll b/test/CodeGen/X86/cmov.ll index d7c684a730d..d38d2b430cc 100644 --- a/test/CodeGen/X86/cmov.ll +++ b/test/CodeGen/X86/cmov.ll @@ -42,7 +42,7 @@ declare void @bar(i64) nounwind define void @test3(i64 %a, i64 %b, i1 %p) nounwind { ; CHECK-LABEL: test3: ; CHECK: cmov{{n?}}el %[[R1:e..]], %[[R2:e..]] -; CHECK-NEXT: movl %[[R2]], %[[R2]] +; CHECK-NEXT: movl %[[R2]], %{{e..}} %c = trunc i64 %a to i32 %d = trunc i64 %b to i32 diff --git a/test/CodeGen/X86/cse-add-with-overflow.ll b/test/CodeGen/X86/cse-add-with-overflow.ll index ee4fbad4506..1fcc03f117d 100644 --- a/test/CodeGen/X86/cse-add-with-overflow.ll +++ b/test/CodeGen/X86/cse-add-with-overflow.ll @@ -1,4 +1,5 @@ ; RUN: llc < %s -mtriple=x86_64-darwin -mcpu=generic | FileCheck %s +; XFAIL: * ; rdar:15661073 simple example of redundant adds ; ; MachineCSE should coalesce trivial subregister copies.