mirror of
https://github.com/RPCSX/llvm.git
synced 2025-01-24 21:25:41 +00:00
f2558c2db4
Currently, in the MachineBlockPlacement pass, a loop is rotated so that the best exit becomes the last BB in the loop chain, to maximize fall-through from the loop to the code outside it. With profile data, we can determine the cost, in terms of missed fall-through opportunities, of each possible rotation of a loop chain and select the best rotation. There are three kinds of cost to consider for each rotation: 1. The possibly missed fall-through edge (if it exists) from a BB outside the loop to the loop header. 2. The possibly missed fall-through edges (if they exist) from the loop exits to BBs outside the loop. 3. The missed fall-through edge (if it exists) from the last BB to the first BB in the loop chain. The cost of a given rotation is the sum of the costs listed above, and we select the rotation with the smallest cost. This is done only in PGO mode, when we have more precise edge frequencies. Differential revision: http://reviews.llvm.org/D10717 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@250754 91177308-0d34-0410-b5e6-96231b3b80d8
123 lines
2.2 KiB
LLVM
123 lines
2.2 KiB
LLVM
; RUN: llc -mcpu=corei7 -mtriple=x86_64-linux < %s | FileCheck %s -check-prefix=CHECK
|
|
; RUN: llc -mcpu=corei7 -mtriple=x86_64-linux -precise-rotation-cost < %s | FileCheck %s -check-prefix=CHECK-PROFILE
|
|
|
|
define void @foo() {
|
|
; Test a nested loop case when profile data is not available.
; @foo has no function-level !prof attachment (contrast with @bar, which has
; !prof !1); its conditional branches on %call and %call1 still carry !prof !2.
; The directives below expect the calls to be emitted in the order
; b, c, d, e, f, g, h.
|
|
;
|
|
; CHECK-LABEL: foo:
|
|
; CHECK: callq b
|
|
; CHECK: callq c
|
|
; CHECK: callq d
|
|
; CHECK: callq e
|
|
; CHECK: callq f
|
|
; CHECK: callq g
|
|
; CHECK: callq h
|
|
|
|
entry:
|
|
br label %header
|
|
|
|
; Outer loop header: if.end branches back here.
header:
|
|
call void @b()
|
|
%call = call zeroext i1 @a()
|
|
br i1 %call, label %if.then, label %if.else, !prof !2
|
|
|
|
; Taken side of the outer branch: falls into the inner loop.
if.then:
|
|
br label %header2
|
|
|
|
; Inner loop header: if.end2 branches back here.
header2:
|
|
call void @c()
|
|
%call1 = call zeroext i1 @a()
|
|
br i1 %call1, label %if.then2, label %if.else2, !prof !2
|
|
|
|
if.then2:
|
|
call void @d()
|
|
br label %if.end2
|
|
|
|
if.else2:
|
|
call void @e()
|
|
br label %if.end2
|
|
|
|
; Inner loop latch and exit: back to header2 or out to if.end.
; This branch carries no !prof attachment.
if.end2:
|
|
call void @f()
|
|
%call2 = call zeroext i1 @a()
|
|
br i1 %call2, label %header2, label %if.end
|
|
|
|
; Not-taken side of the outer branch: bypasses the inner loop.
if.else:
|
|
call void @g()
|
|
br label %if.end
|
|
|
|
; Outer loop latch and exit: back to header or out to end.
; This branch carries no !prof attachment.
if.end:
|
|
call void @h()
|
|
%call3 = call zeroext i1 @a()
|
|
br i1 %call3, label %header, label %end
|
|
|
|
end:
|
|
ret void
|
|
}
|
|
|
|
define void @bar() !prof !1 {
|
|
; Test a nested loop case when profile data is available.
; The body is the same control-flow graph as @foo; the difference is the
; function-level !prof !1 attachment (a function_entry_count node).
; The directives below expect the calls to be emitted in the order
; e, f, c, d, h, b, g. They use the prefix selected by the llc invocation that
; passes -precise-rotation-cost (see the top of the file).
|
|
;
|
|
; CHECK-PROFILE-LABEL: bar:
|
|
; CHECK-PROFILE: callq e
|
|
; CHECK-PROFILE: callq f
|
|
; CHECK-PROFILE: callq c
|
|
; CHECK-PROFILE: callq d
|
|
; CHECK-PROFILE: callq h
|
|
; CHECK-PROFILE: callq b
|
|
; CHECK-PROFILE: callq g
|
|
|
|
entry:
|
|
br label %header
|
|
|
|
; Outer loop header: if.end branches back here.
header:
|
|
call void @b()
|
|
%call = call zeroext i1 @a()
|
|
br i1 %call, label %if.then, label %if.else, !prof !2
|
|
|
|
; Taken side of the outer branch: falls into the inner loop.
if.then:
|
|
br label %header2
|
|
|
|
; Inner loop header: if.end2 branches back here.
header2:
|
|
call void @c()
|
|
%call1 = call zeroext i1 @a()
|
|
br i1 %call1, label %if.then2, label %if.else2, !prof !2
|
|
|
|
if.then2:
|
|
call void @d()
|
|
br label %if.end2
|
|
|
|
if.else2:
|
|
call void @e()
|
|
br label %if.end2
|
|
|
|
; Inner loop latch and exit: back to header2 or out to if.end.
; This branch carries no !prof attachment.
if.end2:
|
|
call void @f()
|
|
%call2 = call zeroext i1 @a()
|
|
br i1 %call2, label %header2, label %if.end
|
|
|
|
; Not-taken side of the outer branch: bypasses the inner loop.
if.else:
|
|
call void @g()
|
|
br label %if.end
|
|
|
|
; Outer loop latch and exit: back to header or out to end.
; This branch carries no !prof attachment.
if.end:
|
|
call void @h()
|
|
%call3 = call zeroext i1 @a()
|
|
br i1 %call3, label %header, label %end
|
|
|
|
end:
|
|
ret void
|
|
}
|
|
|
|
; External functions called by @foo and @bar. @a supplies the i1 condition for
; every conditional branch; @b through @h are distinct void callees that the
; test directives match by name in the generated assembly.
declare zeroext i1 @a()
|
|
declare void @b()
|
|
declare void @c()
|
|
declare void @d()
|
|
declare void @e()
|
|
declare void @f()
|
|
declare void @g()
|
|
declare void @h()
|
|
|
|
; !1 is a function entry count of 1, attached only to @bar.
; !2 is a pair of equal branch weights (16 and 16), attached to the conditional
; branches in the header and header2 blocks of both functions.
!1 = !{!"function_entry_count", i64 1}
|
|
!2 = !{!"branch_weights", i32 16, i32 16}
|