mirror of
https://github.com/RPCS3/llvm.git
synced 2024-12-28 07:05:03 +00:00
e6c3cc8dc5
local frame causes problem. For example: void f(StructToPass s) { g(&s, sizeof(s)); } will cause problem with tail-call since part of s is passed via registers and saved in f's local frame. When g tries to access s, part of s may be corrupted since f's local frame is popped out before the tail-call. The current fix is to disable tail-call if getVarArgsRegSaveSize is not 0 for the caller. This is a conservative approach, if we can prove the address of s or part of s is not taken and passed to g, it should be okay to perform tail-call. rdar://12442472 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@165853 91177308-0d34-0410-b5e6-96231b3b80d8
91 lines
2.5 KiB
LLVM
91 lines
2.5 KiB
LLVM
; RUN: llc < %s -mtriple=armv7-apple-ios6.0 | FileCheck %s
|
|
|
|
; rdar://9877866
|
|
%struct.SmallStruct = type { i32, [8 x i32], [37 x i8] }
|
|
%struct.LargeStruct = type { i32, [1001 x i8], [300 x i32] }
|
|
|
|
define i32 @f() nounwind ssp {
|
|
entry:
|
|
; CHECK: f:
|
|
; CHECK: ldr
|
|
; CHECK: str
|
|
; CHECK-NOT:bne
|
|
%st = alloca %struct.SmallStruct, align 4
|
|
%call = call i32 @e1(%struct.SmallStruct* byval %st)
|
|
ret i32 0
|
|
}
|
|
|
|
; Generate a loop for large struct byval
|
|
define i32 @g() nounwind ssp {
|
|
entry:
|
|
; CHECK: g:
|
|
; CHECK: ldr
|
|
; CHECK: sub
|
|
; CHECK: str
|
|
; CHECK: bne
|
|
%st = alloca %struct.LargeStruct, align 4
|
|
%call = call i32 @e2(%struct.LargeStruct* byval %st)
|
|
ret i32 0
|
|
}
|
|
|
|
; Generate a loop using NEON instructions
|
|
define i32 @h() nounwind ssp {
|
|
entry:
|
|
; CHECK: h:
|
|
; CHECK: vld1
|
|
; CHECK: sub
|
|
; CHECK: vst1
|
|
; CHECK: bne
|
|
%st = alloca %struct.LargeStruct, align 16
|
|
%call = call i32 @e3(%struct.LargeStruct* byval align 16 %st)
|
|
ret i32 0
|
|
}
|
|
|
|
declare i32 @e1(%struct.SmallStruct* nocapture byval %in) nounwind
|
|
declare i32 @e2(%struct.LargeStruct* nocapture byval %in) nounwind
|
|
declare i32 @e3(%struct.LargeStruct* nocapture byval align 16 %in) nounwind
|
|
|
|
; rdar://12442472
|
|
; We can't do tail call since address of s is passed to the callee and part of
|
|
; s is in caller's local frame.
|
|
define void @f3(%struct.SmallStruct* nocapture byval %s) nounwind optsize {
|
|
; CHECK: f3
|
|
; CHECK: bl _consumestruct
|
|
entry:
|
|
%0 = bitcast %struct.SmallStruct* %s to i8*
|
|
tail call void @consumestruct(i8* %0, i32 80) optsize
|
|
ret void
|
|
}
|
|
|
|
define void @f4(%struct.SmallStruct* nocapture byval %s) nounwind optsize {
|
|
; CHECK: f4
|
|
; CHECK: bl _consumestruct
|
|
entry:
|
|
%addr = getelementptr inbounds %struct.SmallStruct* %s, i32 0, i32 0
|
|
%0 = bitcast i32* %addr to i8*
|
|
tail call void @consumestruct(i8* %0, i32 80) optsize
|
|
ret void
|
|
}
|
|
|
|
; We can do tail call here since s is in the incoming argument area.
|
|
define void @f5(i32 %a, i32 %b, i32 %c, i32 %d, %struct.SmallStruct* nocapture byval %s) nounwind optsize {
|
|
; CHECK: f5
|
|
; CHECK: b _consumestruct
|
|
entry:
|
|
%0 = bitcast %struct.SmallStruct* %s to i8*
|
|
tail call void @consumestruct(i8* %0, i32 80) optsize
|
|
ret void
|
|
}
|
|
|
|
define void @f6(i32 %a, i32 %b, i32 %c, i32 %d, %struct.SmallStruct* nocapture byval %s) nounwind optsize {
|
|
; CHECK: f6
|
|
; CHECK: b _consumestruct
|
|
entry:
|
|
%addr = getelementptr inbounds %struct.SmallStruct* %s, i32 0, i32 0
|
|
%0 = bitcast i32* %addr to i8*
|
|
tail call void @consumestruct(i8* %0, i32 80) optsize
|
|
ret void
|
|
}
|
|
|
|
declare void @consumestruct(i8* nocapture %structp, i32 %structsize) nounwind
|