mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-12-05 02:07:56 +00:00
8a77617721
Summary: This patch fixes an issue so that the right alias is printed when the instruction has tied operands. It checks the number of operands in the resulting instruction as opposed to the alias, and then skips over tied operands that should not be printed in the alias. This allows to generate the preferred assembly syntax for the AArch64 'ins' instruction, which should always be displayed as 'mov' according to the ARM Architecture Reference Manual. Several unit tests have changed as a result, but only to reflect the preferred disassembly. Some other InstAlias patterns (movk/bic/orr) needed a slight adjustment to stop them becoming the default and breaking other unit tests. Please note that the patch is mostly the same as https://reviews.llvm.org/D29219 which was reverted because of an issue found when running TableGen with the Address Sanitizer. That issue has been addressed in this iteration of the patch. Reviewers: rengolin, stoklund, huntergr, SjoerdMeijer, rovka Reviewed By: rengolin, SjoerdMeijer Subscribers: fhahn, aemerson, javed.absar, kristof.beyls, llvm-commits Differential Revision: https://reviews.llvm.org/D40030 llvm-svn: 318650
165 lines
5.2 KiB
LLVM
165 lines
5.2 KiB
LLVM
; RUN: llc < %s -mtriple=arm64-eabi -aarch64-neon-syntax=apple -asm-verbose=false | FileCheck %s
|
|
|
|
; Reduce <8 x i8> %a with the umaxv intrinsic, truncate the i32 result to i8,
; and branch on whether it is zero: return 0 when it is, otherwise return the
; result of calling @bar.
; Expected code: umaxv.8b into a b register, an fmov of the matching s register
; into a w register, and a cbz on that w register, with no `and` in between
; (i.e. no explicit masking of the truncated value).
define i32 @vmax_u8x8(<8 x i8> %a) nounwind ssp {
; CHECK-LABEL: vmax_u8x8:
; CHECK: umaxv.8b b[[REG:[0-9]+]], v0
; CHECK: fmov [[REG2:w[0-9]+]], s[[REG]]
; CHECK-NOT: and
; CHECK: cbz [[REG2]],
entry:
  %vmaxv.i = tail call i32 @llvm.aarch64.neon.umaxv.i32.v8i8(<8 x i8> %a) nounwind
  %tmp = trunc i32 %vmaxv.i to i8
  %tobool = icmp eq i8 %tmp, 0
  br i1 %tobool, label %return, label %if.then

if.then:
  ; Non-zero maximum: call @bar through a bitcast to a zero-argument type.
  %call1 = tail call i32 bitcast (i32 (...)* @bar to i32 ()*)() nounwind
  br label %return

return:
  %retval.0 = phi i32 [ %call1, %if.then ], [ 0, %entry ]
  ret i32 %retval.0
}
|
|
|
|
; External variadic function. The vmax_* tests call it (through a bitcast to
; i32 ()*) on the path taken when the truncated maximum is non-zero.
declare i32 @bar(...)
|
|
|
|
; Reduce <4 x i16> %a with the umaxv intrinsic, truncate the i32 result to
; i16, and branch on whether it is zero: return 0 when it is, otherwise return
; the result of calling @bar.
; Expected code: umaxv.4h into an h register, an fmov of the matching s
; register into a w register, and a cbz on that w register, with no `and` in
; between (i.e. no explicit masking of the truncated value).
define i32 @vmax_u4x16(<4 x i16> %a) nounwind ssp {
; CHECK-LABEL: vmax_u4x16:
; CHECK: umaxv.4h h[[REG:[0-9]+]], v0
; CHECK: fmov [[REG2:w[0-9]+]], s[[REG]]
; CHECK-NOT: and
; CHECK: cbz [[REG2]],
entry:
  %vmaxv.i = tail call i32 @llvm.aarch64.neon.umaxv.i32.v4i16(<4 x i16> %a) nounwind
  %tmp = trunc i32 %vmaxv.i to i16
  %tobool = icmp eq i16 %tmp, 0
  br i1 %tobool, label %return, label %if.then

if.then:
  ; Non-zero maximum: call @bar through a bitcast to a zero-argument type.
  %call1 = tail call i32 bitcast (i32 (...)* @bar to i32 ()*)() nounwind
  br label %return

return:
  %retval.0 = phi i32 [ %call1, %if.then ], [ 0, %entry ]
  ret i32 %retval.0
}
|
|
|
|
; Reduce <8 x i16> %a with the umaxv intrinsic, truncate the i32 result to
; i16, and branch on whether it is zero: return 0 when it is, otherwise return
; the result of calling @bar.
; Expected code: umaxv.8h into an h register, an fmov of the matching s
; register into a w register, and a cbz on that w register, with no `and` in
; between (i.e. no explicit masking of the truncated value).
define i32 @vmax_u8x16(<8 x i16> %a) nounwind ssp {
; CHECK-LABEL: vmax_u8x16:
; CHECK: umaxv.8h h[[REG:[0-9]+]], v0
; CHECK: fmov [[REG2:w[0-9]+]], s[[REG]]
; CHECK-NOT: and
; CHECK: cbz [[REG2]],
entry:
  %vmaxv.i = tail call i32 @llvm.aarch64.neon.umaxv.i32.v8i16(<8 x i16> %a) nounwind
  %tmp = trunc i32 %vmaxv.i to i16
  %tobool = icmp eq i16 %tmp, 0
  br i1 %tobool, label %return, label %if.then

if.then:
  ; Non-zero maximum: call @bar through a bitcast to a zero-argument type.
  %call1 = tail call i32 bitcast (i32 (...)* @bar to i32 ()*)() nounwind
  br label %return

return:
  %retval.0 = phi i32 [ %call1, %if.then ], [ 0, %entry ]
  ret i32 %retval.0
}
|
|
|
|
; Reduce <16 x i8> %a with the umaxv intrinsic, truncate the i32 result to i8,
; and branch on whether it is zero: return 0 when it is, otherwise return the
; result of calling @bar.
; Expected code: umaxv.16b into a b register, an fmov of the matching s
; register into a w register, and a cbz on that w register, with no `and` in
; between (i.e. no explicit masking of the truncated value).
define i32 @vmax_u16x8(<16 x i8> %a) nounwind ssp {
; CHECK-LABEL: vmax_u16x8:
; CHECK: umaxv.16b b[[REG:[0-9]+]], v0
; CHECK: fmov [[REG2:w[0-9]+]], s[[REG]]
; CHECK-NOT: and
; CHECK: cbz [[REG2]],
entry:
  %vmaxv.i = tail call i32 @llvm.aarch64.neon.umaxv.i32.v16i8(<16 x i8> %a) nounwind
  %tmp = trunc i32 %vmaxv.i to i8
  %tobool = icmp eq i8 %tmp, 0
  br i1 %tobool, label %return, label %if.then

if.then:
  ; Non-zero maximum: call @bar through a bitcast to a zero-argument type.
  %call1 = tail call i32 bitcast (i32 (...)* @bar to i32 ()*)() nounwind
  br label %return

return:
  %retval.0 = phi i32 [ %call1, %if.then ], [ 0, %entry ]
  ret i32 %retval.0
}
|
|
|
|
; Take the umaxv reduction of <8 x i8> %a2, truncate it to i8, and insert it
; into lane 3 of %a1.
; Expected code is exactly three consecutive instructions: umaxv.8b of v1 into
; a b register, a lane-to-lane `mov.b` of element 0 of that register into
; v0[3], and ret. The patterns leave no room for a transfer through a
; general-purpose register.
define <8 x i8> @test_vmaxv_u8_used_by_laneop(<8 x i8> %a1, <8 x i8> %a2) {
; CHECK-LABEL: test_vmaxv_u8_used_by_laneop:
; CHECK: umaxv.8b b[[REGNUM:[0-9]+]], v1
; CHECK-NEXT: mov.b v0[3], v[[REGNUM]][0]
; CHECK-NEXT: ret
entry:
  %0 = tail call i32 @llvm.aarch64.neon.umaxv.i32.v8i8(<8 x i8> %a2)
  %1 = trunc i32 %0 to i8
  %2 = insertelement <8 x i8> %a1, i8 %1, i32 3
  ret <8 x i8> %2
}
|
|
|
|
; Take the umaxv reduction of <4 x i16> %a2, truncate it to i16, and insert it
; into lane 3 of %a1.
; Expected code is exactly three consecutive instructions: umaxv.4h of v1 into
; an h register, a lane-to-lane `mov.h` of element 0 of that register into
; v0[3], and ret. The patterns leave no room for a transfer through a
; general-purpose register.
define <4 x i16> @test_vmaxv_u16_used_by_laneop(<4 x i16> %a1, <4 x i16> %a2) {
; CHECK-LABEL: test_vmaxv_u16_used_by_laneop:
; CHECK: umaxv.4h h[[REGNUM:[0-9]+]], v1
; CHECK-NEXT: mov.h v0[3], v[[REGNUM]][0]
; CHECK-NEXT: ret
entry:
  %0 = tail call i32 @llvm.aarch64.neon.umaxv.i32.v4i16(<4 x i16> %a2)
  %1 = trunc i32 %0 to i16
  %2 = insertelement <4 x i16> %a1, i16 %1, i32 3
  ret <4 x i16> %2
}
|
|
|
|
; Take the umaxv reduction of <2 x i32> %a2 and insert the i32 result (no
; truncation needed) into lane 1 of %a1.
; For this two-element vector the expected reduction instruction is the
; pairwise form `umaxp.2s` with v1 as both sources, not umaxv. It must be
; followed immediately by a lane-to-lane `mov.s` into v0[1] and then ret.
define <2 x i32> @test_vmaxv_u32_used_by_laneop(<2 x i32> %a1, <2 x i32> %a2) {
; CHECK-LABEL: test_vmaxv_u32_used_by_laneop:
; CHECK: umaxp.2s v[[REGNUM:[0-9]+]], v1, v1
; CHECK-NEXT: mov.s v0[1], v[[REGNUM]][0]
; CHECK-NEXT: ret
entry:
  %0 = tail call i32 @llvm.aarch64.neon.umaxv.i32.v2i32(<2 x i32> %a2)
  %1 = insertelement <2 x i32> %a1, i32 %0, i32 1
  ret <2 x i32> %1
}
|
|
|
|
; Take the umaxv reduction of <16 x i8> %a2, truncate it to i8, and insert it
; into lane 3 of %a1.
; Expected code is exactly three consecutive instructions: umaxv.16b of v1
; into a b register, a lane-to-lane `mov.b` of element 0 of that register into
; v0[3], and ret. The patterns leave no room for a transfer through a
; general-purpose register.
define <16 x i8> @test_vmaxvq_u8_used_by_laneop(<16 x i8> %a1, <16 x i8> %a2) {
; CHECK-LABEL: test_vmaxvq_u8_used_by_laneop:
; CHECK: umaxv.16b b[[REGNUM:[0-9]+]], v1
; CHECK-NEXT: mov.b v0[3], v[[REGNUM]][0]
; CHECK-NEXT: ret
entry:
  %0 = tail call i32 @llvm.aarch64.neon.umaxv.i32.v16i8(<16 x i8> %a2)
  %1 = trunc i32 %0 to i8
  %2 = insertelement <16 x i8> %a1, i8 %1, i32 3
  ret <16 x i8> %2
}
|
|
|
|
; Take the umaxv reduction of <8 x i16> %a2, truncate it to i16, and insert it
; into lane 3 of %a1.
; Expected code is exactly three consecutive instructions: umaxv.8h of v1 into
; an h register, a lane-to-lane `mov.h` of element 0 of that register into
; v0[3], and ret. The patterns leave no room for a transfer through a
; general-purpose register.
define <8 x i16> @test_vmaxvq_u16_used_by_laneop(<8 x i16> %a1, <8 x i16> %a2) {
; CHECK-LABEL: test_vmaxvq_u16_used_by_laneop:
; CHECK: umaxv.8h h[[REGNUM:[0-9]+]], v1
; CHECK-NEXT: mov.h v0[3], v[[REGNUM]][0]
; CHECK-NEXT: ret
entry:
  %0 = tail call i32 @llvm.aarch64.neon.umaxv.i32.v8i16(<8 x i16> %a2)
  %1 = trunc i32 %0 to i16
  %2 = insertelement <8 x i16> %a1, i16 %1, i32 3
  ret <8 x i16> %2
}
|
|
|
|
; Take the umaxv reduction of <4 x i32> %a2 and insert the i32 result (no
; truncation needed) into lane 3 of %a1.
; Expected code is exactly three consecutive instructions: umaxv.4s of v1 into
; an s register, a lane-to-lane `mov.s` of element 0 of that register into
; v0[3], and ret. The patterns leave no room for a transfer through a
; general-purpose register.
define <4 x i32> @test_vmaxvq_u32_used_by_laneop(<4 x i32> %a1, <4 x i32> %a2) {
; CHECK-LABEL: test_vmaxvq_u32_used_by_laneop:
; CHECK: umaxv.4s s[[REGNUM:[0-9]+]], v1
; CHECK-NEXT: mov.s v0[3], v[[REGNUM]][0]
; CHECK-NEXT: ret
entry:
  %0 = tail call i32 @llvm.aarch64.neon.umaxv.i32.v4i32(<4 x i32> %a2)
  %1 = insertelement <4 x i32> %a1, i32 %0, i32 3
  ret <4 x i32> %1
}
|
|
|
|
; Declarations of the umaxv intrinsic overloads called by the tests in this
; file, one per source vector type. Every overload returns i32 and is marked
; nounwind readnone.
declare i32 @llvm.aarch64.neon.umaxv.i32.v16i8(<16 x i8>) nounwind readnone
declare i32 @llvm.aarch64.neon.umaxv.i32.v8i16(<8 x i16>) nounwind readnone
declare i32 @llvm.aarch64.neon.umaxv.i32.v4i16(<4 x i16>) nounwind readnone
declare i32 @llvm.aarch64.neon.umaxv.i32.v8i8(<8 x i8>) nounwind readnone
declare i32 @llvm.aarch64.neon.umaxv.i32.v2i32(<2 x i32>) nounwind readnone
declare i32 @llvm.aarch64.neon.umaxv.i32.v4i32(<4 x i32>) nounwind readnone
|