mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-12-14 15:19:33 +00:00
[X86] Make sure the prologue does not clobber EFLAGS when it lives accross it.
This is a superset of the fix done in r254448. This fixes PR25607. llvm-svn: 254478
This commit is contained in:
parent
c434b24d59
commit
096b1e51ee
@ -204,10 +204,13 @@ static bool isEAXLiveIn(MachineFunction &MF) {
|
||||
return false;
|
||||
}
|
||||
|
||||
/// Check whether or not the terminators of \p MBB needs to read EFLAGS.
|
||||
static bool terminatorsNeedFlagsAsInput(const MachineBasicBlock &MBB) {
|
||||
/// Check if the flags need to be preserved before the terminators.
|
||||
/// This would be the case, if the eflags is live-in of the region
|
||||
/// composed by the terminators or live-out of that region, without
|
||||
/// being defined by a terminator.
|
||||
static bool
|
||||
flagsNeedToBePreservedBeforeTheTerminators(const MachineBasicBlock &MBB) {
|
||||
for (const MachineInstr &MI : MBB.terminators()) {
|
||||
bool BreakNext = false;
|
||||
for (const MachineOperand &MO : MI.operands()) {
|
||||
if (!MO.isReg())
|
||||
continue;
|
||||
@ -215,15 +218,22 @@ static bool terminatorsNeedFlagsAsInput(const MachineBasicBlock &MBB) {
|
||||
if (Reg != X86::EFLAGS)
|
||||
continue;
|
||||
|
||||
// This terminator needs an eflag that is not defined
|
||||
// by a previous terminator.
|
||||
// This terminator needs an eflags that is not defined
|
||||
// by a previous another terminator:
|
||||
// EFLAGS is live-in of the region composed by the terminators.
|
||||
if (!MO.isDef())
|
||||
return true;
|
||||
BreakNext = true;
|
||||
// This terminator defines the eflags, i.e., we don't need to preserve it.
|
||||
return false;
|
||||
}
|
||||
if (BreakNext)
|
||||
break;
|
||||
}
|
||||
|
||||
// None of the terminators use or define the eflags.
|
||||
// Check if they are live-out, that would imply we need to preserve them.
|
||||
for (const MachineBasicBlock *Succ : MBB.successors())
|
||||
if (Succ->isLiveIn(X86::EFLAGS))
|
||||
return true;
|
||||
|
||||
return false;
|
||||
}
|
||||
|
||||
@ -297,28 +307,6 @@ void X86FrameLowering::emitSPUpdate(MachineBasicBlock &MBB,
|
||||
}
|
||||
}
|
||||
|
||||
// Check if \p MBB defines the flags register before the first terminator.
|
||||
static bool flagsDefinedLocally(const MachineBasicBlock &MBB) {
|
||||
MachineBasicBlock::const_iterator FirstTerminator = MBB.getFirstTerminator();
|
||||
for (MachineBasicBlock::const_iterator MII : MBB) {
|
||||
if (MII == FirstTerminator)
|
||||
return false;
|
||||
|
||||
for (const MachineOperand &MO : MII->operands()) {
|
||||
if (!MO.isReg())
|
||||
continue;
|
||||
unsigned Reg = MO.getReg();
|
||||
if (Reg != X86::EFLAGS)
|
||||
continue;
|
||||
|
||||
// This instruction sets the eflag.
|
||||
if (MO.isDef())
|
||||
return true;
|
||||
}
|
||||
}
|
||||
return false;
|
||||
}
|
||||
|
||||
MachineInstrBuilder X86FrameLowering::BuildStackAdjustment(
|
||||
MachineBasicBlock &MBB, MachineBasicBlock::iterator MBBI, DebugLoc DL,
|
||||
int64_t Offset, bool InEpilogue) const {
|
||||
@ -330,14 +318,9 @@ MachineInstrBuilder X86FrameLowering::BuildStackAdjustment(
|
||||
if (!InEpilogue) {
|
||||
// Check if inserting the prologue at the beginning
|
||||
// of MBB would require to use LEA operations.
|
||||
// We need to use LEA operations if both conditions are true:
|
||||
// 1. One of the terminators need the flags.
|
||||
// 2. The flags are not defined after the insertion point of the prologue.
|
||||
// Note: Checking for the predecessors is a shortcut when obviously nothing
|
||||
// will live accross the prologue.
|
||||
UseLEA = STI.useLeaForSP() ||
|
||||
(!MBB.pred_empty() && terminatorsNeedFlagsAsInput(MBB) &&
|
||||
!flagsDefinedLocally(MBB));
|
||||
// We need to use LEA operations if EFLAGS is live in, because
|
||||
// it means an instruction will read it before it gets defined.
|
||||
UseLEA = STI.useLeaForSP() || MBB.isLiveIn(X86::EFLAGS);
|
||||
} else {
|
||||
// If we can use LEA for SP but we shouldn't, check that none
|
||||
// of the terminators uses the eflags. Otherwise we will insert
|
||||
@ -346,10 +329,10 @@ MachineInstrBuilder X86FrameLowering::BuildStackAdjustment(
|
||||
// and is an optimization anyway.
|
||||
UseLEA = canUseLEAForSPInEpilogue(*MBB.getParent());
|
||||
if (UseLEA && !STI.useLeaForSP())
|
||||
UseLEA = terminatorsNeedFlagsAsInput(MBB);
|
||||
UseLEA = flagsNeedToBePreservedBeforeTheTerminators(MBB);
|
||||
// If that assert breaks, that means we do not do the right thing
|
||||
// in canUseAsEpilogue.
|
||||
assert((UseLEA || !terminatorsNeedFlagsAsInput(MBB)) &&
|
||||
assert((UseLEA || !flagsNeedToBePreservedBeforeTheTerminators(MBB)) &&
|
||||
"We shouldn't have allowed this insertion point");
|
||||
}
|
||||
|
||||
@ -2597,10 +2580,10 @@ bool X86FrameLowering::canUseAsEpilogue(const MachineBasicBlock &MBB) const {
|
||||
return true;
|
||||
|
||||
// If we cannot use LEA to adjust SP, we may need to use ADD, which
|
||||
// clobbers the EFLAGS. Check that none of the terminators reads the
|
||||
// EFLAGS, and if one uses it, conservatively assume this is not
|
||||
// clobbers the EFLAGS. Check that we do not need to preserve it,
|
||||
// otherwise, conservatively assume this is not
|
||||
// safe to insert the epilogue here.
|
||||
return !terminatorsNeedFlagsAsInput(MBB);
|
||||
return !flagsNeedToBePreservedBeforeTheTerminators(MBB);
|
||||
}
|
||||
|
||||
MachineBasicBlock::iterator X86FrameLowering::restoreWin32EHStackPointers(
|
||||
|
113
test/CodeGen/X86/i386-shrink-wrapping.ll
Normal file
113
test/CodeGen/X86/i386-shrink-wrapping.ll
Normal file
@ -0,0 +1,113 @@
|
||||
; RUN: llc %s -o - -enable-shrink-wrap=true | FileCheck %s --check-prefix=CHECK --check-prefix=ENABLE
|
||||
; RUN: llc %s -o - -enable-shrink-wrap=false | FileCheck %s --check-prefix=CHECK --check-prefix=DISABLE
|
||||
target datalayout = "e-m:e-p:32:32-f64:32:64-f80:32-n8:16:32-S128"
|
||||
target triple = "i386-apple-macosx"
|
||||
|
||||
@a = common global i32 0, align 4
|
||||
@d = internal unnamed_addr global i1 false
|
||||
@b = common global i32 0, align 4
|
||||
@e = common global i8 0, align 1
|
||||
@f = common global i8 0, align 1
|
||||
@c = common global i32 0, align 4
|
||||
@.str = private unnamed_addr constant [4 x i8] c"%d\0A\00", align 1
|
||||
|
||||
|
||||
; Check that we are clobbering the flags when they are live-in of the
|
||||
; prologue block and the prologue needs to adjust the stack.
|
||||
; PR25607.
|
||||
;
|
||||
; CHECK-LABEL: eflagsLiveInPrologue:
|
||||
;
|
||||
; DISABLE: pushl
|
||||
; DISABLE-NEXT: pushl
|
||||
; DISABLE-NEXT: subl $20, %esp
|
||||
;
|
||||
; CHECK: movl L_a$non_lazy_ptr, [[A:%[a-z]+]]
|
||||
; CHECK-NEXT: cmpl $0, ([[A]])
|
||||
; CHECK-NEXT: je [[PREHEADER_LABEL:LBB[0-9_]+]]
|
||||
;
|
||||
; CHECK: movb $1, _d
|
||||
;
|
||||
; CHECK: [[PREHEADER_LABEL]]:
|
||||
; CHECK-NEXT: movl L_b$non_lazy_ptr, [[B:%[a-z]+]]
|
||||
; CHECK-NEXT: movl ([[B]]), [[TMP1:%[a-z]+]]
|
||||
; CHECK-NEXT: testl [[TMP1]], [[TMP1]]
|
||||
; CHECK-NEXT: je [[FOREND_LABEL:LBB[0-9_]+]]
|
||||
;
|
||||
; Skip the loop.
|
||||
; [...]
|
||||
;
|
||||
; The for.end block is split to accomadate the different selects.
|
||||
; We are interested in the one with the call, so skip until the branch.
|
||||
; CHECK: [[FOREND_LABEL]]:
|
||||
; CHECK-NEXT: movb _d, [[D:%[a-z]+]]
|
||||
; [...]
|
||||
; CHECK: jne [[CALL_LABEL:LBB[0-9_]+]]
|
||||
;
|
||||
; CHECK: movb $6, [[D]]
|
||||
;
|
||||
; CHECK: [[CALL_LABEL]]
|
||||
;
|
||||
; ENABLE-NEXT: pushl
|
||||
; ENABLE-NEXT: pushl
|
||||
; We must not use sub here otherwise we will clobber the eflags.
|
||||
; ENABLE-NEXT: leal -20(%esp), %esp
|
||||
;
|
||||
; CHECK-NEXT: L_e$non_lazy_ptr, [[E:%[a-z]+]]
|
||||
; CHECK-NEXT: movb [[D]], ([[E]])
|
||||
; CHECK-NEXT: L_f$non_lazy_ptr, [[F:%[a-z]+]]
|
||||
; CHECK-NEXT: movsbl ([[F]]), [[CONV:%[a-z]+]]
|
||||
; CHECK-NEXT: movl $6, [[CONV:%[a-z]+]]
|
||||
; The eflags is used in the next instruction.
|
||||
; If that instruction disappear, we are not exercising the bug
|
||||
; anymore.
|
||||
; CHECK-NEXT: cmovnel {{%[a-z]+}}, [[CONV]]
|
||||
;
|
||||
; Skip all the crust of vaarg lowering.
|
||||
; CHECK: calll L_varfunc$stub
|
||||
; Set the return value to 0.
|
||||
; CHECK-NEXT: xorl %eax, %eax
|
||||
; CHECK-NEXT: addl $20, %esp
|
||||
; CHECK-NEXT: popl
|
||||
; CHECK-NEXT: popl
|
||||
; CHECK-NEXT: retl
|
||||
define i32 @eflagsLiveInPrologue() #0 {
|
||||
entry:
|
||||
%tmp = load i32, i32* @a, align 4
|
||||
%tobool = icmp eq i32 %tmp, 0
|
||||
br i1 %tobool, label %for.cond.preheader, label %if.then
|
||||
|
||||
if.then: ; preds = %entry
|
||||
store i1 true, i1* @d, align 1
|
||||
br label %for.cond.preheader
|
||||
|
||||
for.cond.preheader: ; preds = %if.then, %entry
|
||||
%tmp1 = load i32, i32* @b, align 4
|
||||
%tobool14 = icmp eq i32 %tmp1, 0
|
||||
br i1 %tobool14, label %for.end, label %for.body.preheader
|
||||
|
||||
for.body.preheader: ; preds = %for.cond.preheader
|
||||
br label %for.body
|
||||
|
||||
for.body: ; preds = %for.body, %for.body.preheader
|
||||
br label %for.body
|
||||
|
||||
for.end: ; preds = %for.cond.preheader
|
||||
%.b3 = load i1, i1* @d, align 1
|
||||
%tmp2 = select i1 %.b3, i8 0, i8 6
|
||||
store i8 %tmp2, i8* @e, align 1
|
||||
%tmp3 = load i8, i8* @f, align 1
|
||||
%conv = sext i8 %tmp3 to i32
|
||||
%add = add nsw i32 %conv, 1
|
||||
%rem = srem i32 %tmp1, %add
|
||||
store i32 %rem, i32* @c, align 4
|
||||
%conv2 = select i1 %.b3, i32 0, i32 6
|
||||
%call = tail call i32 (i8*, ...) @varfunc(i8* nonnull getelementptr inbounds ([4 x i8], [4 x i8]* @.str, i32 0, i32 0), i32 %conv2) #1
|
||||
ret i32 0
|
||||
}
|
||||
|
||||
; Function Attrs: nounwind
|
||||
declare i32 @varfunc(i8* nocapture readonly, ...) #0
|
||||
|
||||
attributes #0 = { nounwind "disable-tail-calls"="false" "less-precise-fpmad"="false" "no-frame-pointer-elim"="false" "no-infs-fp-math"="false" "no-nans-fp-math"="false" "stack-protector-buffer-size"="8" "target-features"="+mmx,+sse" "unsafe-fp-math"="false" "use-soft-float"="false" }
|
||||
attributes #1 = { nounwind }
|
Loading…
Reference in New Issue
Block a user