mirror of
https://github.com/RPCSX/llvm.git
synced 2024-11-23 19:59:57 +00:00
f41c3c9239
The benchmarking summarized in http://lists.llvm.org/pipermail/llvm-dev/2017-May/113525.html showed this is beneficial for a wide range of cores. As is to be expected, quite a few small adaptations are needed to the regressions tests, as the difference in scheduling results in: - Quite a few small instruction schedule differences. - A few changes in register allocation decisions caused by different instruction schedules. - A few changes in IfConversion decisions, due to a difference in instruction schedule and/or the estimated cost of a branch mispredict. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@306514 91177308-0d34-0410-b5e6-96231b3b80d8
40 lines
1.4 KiB
LLVM
40 lines
1.4 KiB
LLVM
; REQUIRES: asserts
|
|
; RUN: llc < %s -mtriple=armv8r-eabi -mcpu=cortex-r52 -enable-misched -verify-misched -debug-only=machine-scheduler -o - 2>&1 > /dev/null | FileCheck %s --check-prefix=CHECK --check-prefix=R52_SCHED
|
|
; RUN: llc < %s -mtriple=armv8r-eabi -mcpu=generic -enable-misched -verify-misched -debug-only=machine-scheduler -o - 2>&1 > /dev/null | FileCheck %s --check-prefix=CHECK --check-prefix=GENERIC
|
|
;
|
|
; Check the latency for instructions for both generic and cortex-r52.
|
|
; Cortex-r52 machine model will cause the div to be sceduled before eor
|
|
; as div takes more cycles to compute than eor.
|
|
;
|
|
; CHECK: ********** MI Scheduling **********
|
|
; CHECK: foo:BB#0 entry
|
|
; CHECK: EORrr
|
|
; GENERIC: Latency : 1
|
|
; R52_SCHED: Latency : 3
|
|
; CHECK: MLA
|
|
; GENERIC: Latency : 2
|
|
; R52_SCHED: Latency : 4
|
|
; CHECK: SDIV
|
|
; GENERIC: Latency : 0
|
|
; R52_SCHED: Latency : 8
|
|
; CHECK: ** Final schedule for BB#0 ***
|
|
; GENERIC: EORrr
|
|
; GENERIC: SDIV
|
|
; R52_SCHED: SDIV
|
|
; R52_SCHED: EORrr
|
|
; CHECK: ********** INTERVALS **********
|
|
|
|
target datalayout = "e-m:e-p:32:32-i64:64-v128:64:128-a:0:32-n32-S64"
|
|
target triple = "armv8r-arm-none-eabi"
|
|
|
|
; Function Attrs: norecurse nounwind readnone
|
|
define hidden i32 @foo(i32 %a, i32 %b, i32 %c) local_unnamed_addr #0 {
|
|
entry:
|
|
%xor = xor i32 %c, %b
|
|
%mul = mul nsw i32 %xor, %c
|
|
%add = add nsw i32 %mul, %a
|
|
%div = sdiv i32 %a, %b
|
|
%sub = sub i32 %add, %div
|
|
ret i32 %sub
|
|
}
|