mirror of
https://github.com/RPCS3/llvm.git
synced 2025-01-27 13:42:24 +00:00
7b837d8c75
This adds a second implementation of the AArch64 architecture to LLVM, accessible in parallel via the "arm64" triple. The plan over the coming weeks & months is to merge the two into a single backend, during which time thorough code review should naturally occur. Everything will be easier with the target in-tree though, hence this commit. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@205090 91177308-0d34-0410-b5e6-96231b3b80d8
93 lines
2.7 KiB
LLVM
93 lines
2.7 KiB
LLVM
; Test driver: compiles this file with llc for the arm64 target using the
; Apple NEON assembly syntax, then pipes the output to FileCheck, which
; verifies it against the directives embedded in this file.
; RUN: llc < %s -march=arm64 -arm64-neon-syntax=apple | FileCheck %s
|
|
|
|
; Reduces an <8 x i8> vector with the umaxv intrinsic, truncates the i32
; result to i8 and branches on whether that byte is zero.
; Expected code: umaxv.8b into a b register, an fmov of that register into a
; w register, then a cbz on the w register with no `and` emitted in between.
; NOTE(review): presumably the point is that the reduction result needs no
; extra masking before the zero test - confirm against the backend change.
; Returns 0 when the truncated value is zero, otherwise the result of @bar.
define i32 @vmax_u8x8(<8 x i8> %a) nounwind ssp {
; CHECK-LABEL: vmax_u8x8:
; CHECK: umaxv.8b b[[REG:[0-9]+]], v0
; CHECK: fmov [[REG2:w[0-9]+]], s[[REG]]
; CHECK-NOT: and
; CHECK: cbz [[REG2]],
entry:
  %reduced = tail call i32 @llvm.arm64.neon.umaxv.i32.v8i8(<8 x i8> %a) nounwind
  %low.byte = trunc i32 %reduced to i8
  %is.zero = icmp eq i8 %low.byte, 0
  br i1 %is.zero, label %done, label %call.bar

call.bar:
  ; Non-zero maximum: call @bar through a cast to a zero-argument signature.
  %bar.result = tail call i32 bitcast (i32 (...)* @bar to i32 ()*)() nounwind
  br label %done

done:
  %result = phi i32 [ %bar.result, %call.bar ], [ 0, %entry ]
  ret i32 %result
}
|
|
|
|
; External variadic function; the tests in this file call it through a
; bitcast to i32 () on the path where the reduced value is non-zero.
declare i32 @bar(...)
|
|
|
|
; Reduces a <4 x i16> vector with the umaxv intrinsic, truncates the i32
; result to i16 and branches on whether that halfword is zero.
; Expected code: umaxv.4h into an h register, an fmov of that register into a
; w register, then a cbz on the w register with no `and` emitted in between.
; Returns 0 when the truncated value is zero, otherwise the result of @bar.
define i32 @vmax_u4x16(<4 x i16> %a) nounwind ssp {
; CHECK-LABEL: vmax_u4x16:
; CHECK: umaxv.4h h[[REG:[0-9]+]], v0
; CHECK: fmov [[REG2:w[0-9]+]], s[[REG]]
; CHECK-NOT: and
; CHECK: cbz [[REG2]],
entry:
  %reduced = tail call i32 @llvm.arm64.neon.umaxv.i32.v4i16(<4 x i16> %a) nounwind
  %low.half = trunc i32 %reduced to i16
  %is.zero = icmp eq i16 %low.half, 0
  br i1 %is.zero, label %done, label %call.bar

call.bar:
  ; Non-zero maximum: call @bar through a cast to a zero-argument signature.
  %bar.result = tail call i32 bitcast (i32 (...)* @bar to i32 ()*)() nounwind
  br label %done

done:
  %result = phi i32 [ %bar.result, %call.bar ], [ 0, %entry ]
  ret i32 %result
}
|
|
|
|
; Reduces an <8 x i16> vector with the umaxv intrinsic, truncates the i32
; result to i16 and branches on whether that halfword is zero.
; Expected code: umaxv.8h into an h register, an fmov of that register into a
; w register, then a cbz on the w register with no `and` emitted in between.
; Returns 0 when the truncated value is zero, otherwise the result of @bar.
define i32 @vmax_u8x16(<8 x i16> %a) nounwind ssp {
; CHECK-LABEL: vmax_u8x16:
; CHECK: umaxv.8h h[[REG:[0-9]+]], v0
; CHECK: fmov [[REG2:w[0-9]+]], s[[REG]]
; CHECK-NOT: and
; CHECK: cbz [[REG2]],
entry:
  %reduced = tail call i32 @llvm.arm64.neon.umaxv.i32.v8i16(<8 x i16> %a) nounwind
  %low.half = trunc i32 %reduced to i16
  %is.zero = icmp eq i16 %low.half, 0
  br i1 %is.zero, label %done, label %call.bar

call.bar:
  ; Non-zero maximum: call @bar through a cast to a zero-argument signature.
  %bar.result = tail call i32 bitcast (i32 (...)* @bar to i32 ()*)() nounwind
  br label %done

done:
  %result = phi i32 [ %bar.result, %call.bar ], [ 0, %entry ]
  ret i32 %result
}
|
|
|
|
; Reduces a <16 x i8> vector with the umaxv intrinsic, truncates the i32
; result to i8 and branches on whether that byte is zero.
; Expected code: umaxv.16b into a b register, an fmov of that register into a
; w register, then a cbz on the w register with no `and` emitted in between.
; Returns 0 when the truncated value is zero, otherwise the result of @bar.
define i32 @vmax_u16x8(<16 x i8> %a) nounwind ssp {
; CHECK-LABEL: vmax_u16x8:
; CHECK: umaxv.16b b[[REG:[0-9]+]], v0
; CHECK: fmov [[REG2:w[0-9]+]], s[[REG]]
; CHECK-NOT: and
; CHECK: cbz [[REG2]],
entry:
  %reduced = tail call i32 @llvm.arm64.neon.umaxv.i32.v16i8(<16 x i8> %a) nounwind
  %low.byte = trunc i32 %reduced to i8
  %is.zero = icmp eq i8 %low.byte, 0
  br i1 %is.zero, label %done, label %call.bar

call.bar:
  ; Non-zero maximum: call @bar through a cast to a zero-argument signature.
  %bar.result = tail call i32 bitcast (i32 (...)* @bar to i32 ()*)() nounwind
  br label %done

done:
  %result = phi i32 [ %bar.result, %call.bar ], [ 0, %entry ]
  ret i32 %result
}
|
|
|
|
; umaxv intrinsic overload taking <16 x i8> and returning i32; called by @vmax_u16x8.
declare i32 @llvm.arm64.neon.umaxv.i32.v16i8(<16 x i8>) nounwind readnone
|
|
; umaxv intrinsic overload taking <8 x i16> and returning i32; called by @vmax_u8x16.
declare i32 @llvm.arm64.neon.umaxv.i32.v8i16(<8 x i16>) nounwind readnone
|
|
; umaxv intrinsic overload taking <4 x i16> and returning i32; called by @vmax_u4x16.
declare i32 @llvm.arm64.neon.umaxv.i32.v4i16(<4 x i16>) nounwind readnone
|
|
; umaxv intrinsic overload taking <8 x i8> and returning i32; called by @vmax_u8x8.
declare i32 @llvm.arm64.neon.umaxv.i32.v8i8(<8 x i8>) nounwind readnone
|