mirror of
https://github.com/RPCS3/llvm.git
synced 2025-01-23 11:04:49 +00:00
c60a59cad3
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@208316 91177308-0d34-0410-b5e6-96231b3b80d8
78 lines
2.5 KiB
LLVM
78 lines
2.5 KiB
LLVM
; Compile this file for four triples -- arm / armv7, each in little-endian
; (arm*) and big-endian (armeb*) form -- and verify each output with its own
; set of FileCheck prefixes. The option spelling is uniformly --check-prefix.
; RUN: llc -mtriple=arm-eabi %s -o - | FileCheck %s --check-prefix=CHECK --check-prefix=CHECK-LE
; RUN: llc -mtriple=armv7-eabi %s -o - | FileCheck %s --check-prefix=CHECK-V7-LE
; RUN: llc -mtriple=armeb-eabi %s -o - | FileCheck %s --check-prefix=CHECK --check-prefix=CHECK-BE
; RUN: llc -mtriple=armebv7-eabi %s -o - | FileCheck %s --check-prefix=CHECK-V7-BE
|
|
; Check generated signed and unsigned multiply accumulate long.
|
|
|
|
define i64 @MACLongTest1(i32 %a, i32 %b, i64 %c) {
; Unsigned case with a 64-bit accumulator: both i32 arguments are
; zero-extended, multiplied as i64, and the product is added to %c.
; The directives below expect an umlal in the generated code.
;CHECK-LABEL: MACLongTest1:
;CHECK: umlal
  %a.wide = zext i32 %a to i64
  %b.wide = zext i32 %b to i64
  %product = mul i64 %b.wide, %a.wide
  %sum = add i64 %product, %c
  ret i64 %sum
}
|
|
|
|
define i64 @MACLongTest2(i32 %a, i32 %b, i64 %c) {
; Signed case with a 64-bit accumulator: both i32 arguments are
; sign-extended, multiplied as i64 (nsw), and the product is added to %c.
; The directives below expect an smlal in the generated code.
;CHECK-LABEL: MACLongTest2:
;CHECK: smlal
  %a.wide = sext i32 %a to i64
  %b.wide = sext i32 %b to i64
  %product = mul nsw i64 %b.wide, %a.wide
  %sum = add nsw i64 %product, %c
  ret i64 %sum
}
|
|
|
|
define i64 @MACLongTest3(i32 %a, i32 %b, i32 %c) {
; Unsigned case with a 32-bit accumulator: %a and %b are zero-extended and
; multiplied as i64, then the zero-extended %c is added to the product.
; The directives below expect an umlal in the generated code.
;CHECK-LABEL: MACLongTest3:
;CHECK: umlal
  %b.wide = zext i32 %b to i64
  %a.wide = zext i32 %a to i64
  %product = mul i64 %b.wide, %a.wide
  %c.wide = zext i32 %c to i64
  %sum = add i64 %product, %c.wide
  ret i64 %sum
}
|
|
|
|
define i64 @MACLongTest4(i32 %a, i32 %b, i32 %c) {
; Signed case with a 32-bit accumulator: %a and %b are sign-extended and
; multiplied as i64 (nsw), then the sign-extended %c is added to the product.
; The directives below expect an smlal in the generated code.
;CHECK-LABEL: MACLongTest4:
;CHECK: smlal
  %b.wide = sext i32 %b to i64
  %a.wide = sext i32 %a to i64
  %product = mul nsw i64 %b.wide, %a.wide
  %c.wide = sext i32 %c to i64
  %sum = add nsw i64 %product, %c.wide
  ret i64 %sum
}
|
|
|
|
; Two things to check here: the @earlyclobber constraint (on <= v5) and the "$Rd = $R" ones.
|
|
; + Without @earlyclobber the v7 code is natural. With it, the first two
|
|
; registers must be distinct from the third.
|
|
; + Without "$Rd = $R", this can be satisfied without a mov before the umlal
|
|
; by trying to use 6 different registers in the MachineInstr. The natural
|
|
; evolution of this attempt currently leaves only two movs in the final
|
|
; function, both after the umlal. With it, *some* move has to happen
|
|
; before the umlal.
|
|
define i64 @MACLongTest5(i64 %c, i32 %a, i32 %b) {
; Squares the low 32 bits of %c (zero-extended to i64) and adds the full
; 64-bit %c, so the accumulator and both multiplicands come from the same
; incoming value.
;
; v7 runs: a single umlal that reuses the accumulator's low register for both
; multiplicands is expected. Only the function name uses the -LABEL form; the
; instruction itself is matched with an ordinary directive.
; CHECK-V7-LE-LABEL: MACLongTest5:
; CHECK-V7-LE: umlal r0, r1, r0, r0
; CHECK-V7-BE-LABEL: MACLongTest5:
; CHECK-V7-BE: umlal r1, r0, r1, r1

; Non-v7 runs: the low accumulator half is expected to be copied into another
; register before the umlal and copied back into the return register after it.
; CHECK-LABEL: MACLongTest5:
; CHECK-LE: mov [[RDLO:r[0-9]+]], r0
; CHECK-LE: umlal [[RDLO]], r1, r0, r0
; CHECK-LE: mov r0, [[RDLO]]
; CHECK-BE: mov [[RDLO:r[0-9]+]], r1
; CHECK-BE: umlal [[RDLO]], r0, r1, r1
; CHECK-BE: mov r1, [[RDLO]]

  %conv.trunc = trunc i64 %c to i32
  %conv = zext i32 %conv.trunc to i64
  ; %conv1 has no users in this function; the multiply below squares %conv.
  %conv1 = zext i32 %b to i64
  %mul = mul i64 %conv, %conv
  %add = add i64 %mul, %c
  ret i64 %add
}
|