mirror of
https://github.com/RPCS3/llvm.git
synced 2024-12-22 20:20:03 +00:00
X86: Enable ISel of 16-bit MOVBE instructions.
When the MOVBE instructions are available, use them for 16-bit endian swapping as well as for 32 and 64 bit. The patterns were already present on the instructions, but weren't being matched because the operation was unconditionally marked to 'Expand.' Change that to be conditional on whether the MOVBE instructions are available. Use 'rolw' to implement the in-register version (32 and 64 bit have the dedicated 'bswap' instruction for that). Patch by Louis Gerbarg <lgg@apple.com>. rdar://15479984 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@203524 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
parent
2ab1641041
commit
7a37166a7a
@ -505,7 +505,9 @@ void X86TargetLowering::resetOperationActions() {
|
||||
}
|
||||
|
||||
setOperationAction(ISD::READCYCLECOUNTER , MVT::i64 , Custom);
|
||||
setOperationAction(ISD::BSWAP , MVT::i16 , Expand);
|
||||
|
||||
if (!Subtarget->hasMOVBE())
|
||||
setOperationAction(ISD::BSWAP , MVT::i16 , Expand);
|
||||
|
||||
// These should be promoted to a larger select which is supported.
|
||||
setOperationAction(ISD::SELECT , MVT::i1 , Promote);
|
||||
|
@ -1839,3 +1839,9 @@ def : Pat<(cttz_zero_undef GR64:$src), (BSF64rr GR64:$src)>;
|
||||
def : Pat<(cttz_zero_undef (loadi16 addr:$src)), (BSF16rm addr:$src)>;
|
||||
def : Pat<(cttz_zero_undef (loadi32 addr:$src)), (BSF32rm addr:$src)>;
|
||||
def : Pat<(cttz_zero_undef (loadi64 addr:$src)), (BSF64rm addr:$src)>;
|
||||
|
||||
// When HasMOVBE is enabled it is possible to get a non-legalized
|
||||
// register-register 16 bit bswap. This maps it to a ROL instruction.
|
||||
let Predicates = [HasMOVBE] in {
|
||||
def : Pat<(bswap GR16:$src), (ROL16ri GR16:$src, (i8 8))>;
|
||||
}
|
||||
|
@ -1,45 +1,66 @@
|
||||
; RUN: llc -mtriple=x86_64-linux -mcpu=atom < %s | FileCheck %s
|
||||
; RUN: llc -mtriple=x86_64-linux -mcpu=slm < %s | FileCheck %s -check-prefix=SLM
|
||||
|
||||
declare i16 @llvm.bswap.i16(i16) nounwind readnone
|
||||
declare i32 @llvm.bswap.i32(i32) nounwind readnone
|
||||
declare i64 @llvm.bswap.i64(i64) nounwind readnone
|
||||
|
||||
define void @test1(i32* nocapture %x, i32 %y) nounwind {
|
||||
define void @test1(i16* nocapture %x, i16 %y) nounwind {
|
||||
%bswap = call i16 @llvm.bswap.i16(i16 %y)
|
||||
store i16 %bswap, i16* %x, align 2
|
||||
ret void
|
||||
; CHECK-LABEL: test1:
|
||||
; CHECK: movbew %si, (%rdi)
|
||||
; SLM-LABEL: test1:
|
||||
; SLM: movbew %si, (%rdi)
|
||||
}
|
||||
|
||||
define i16 @test2(i16* %x) nounwind {
|
||||
%load = load i16* %x, align 2
|
||||
%bswap = call i16 @llvm.bswap.i16(i16 %load)
|
||||
ret i16 %bswap
|
||||
; CHECK-LABEL: test2:
|
||||
; CHECK: movbew (%rdi), %ax
|
||||
; SLM-LABEL: test2:
|
||||
; SLM: movbew (%rdi), %ax
|
||||
}
|
||||
|
||||
define void @test3(i32* nocapture %x, i32 %y) nounwind {
|
||||
%bswap = call i32 @llvm.bswap.i32(i32 %y)
|
||||
store i32 %bswap, i32* %x, align 4
|
||||
ret void
|
||||
; CHECK-LABEL: test1:
|
||||
; CHECK-LABEL: test3:
|
||||
; CHECK: movbel %esi, (%rdi)
|
||||
; SLM-LABEL: test1:
|
||||
; SLM-LABEL: test3:
|
||||
; SLM: movbel %esi, (%rdi)
|
||||
}
|
||||
|
||||
define i32 @test2(i32* %x) nounwind {
|
||||
define i32 @test4(i32* %x) nounwind {
|
||||
%load = load i32* %x, align 4
|
||||
%bswap = call i32 @llvm.bswap.i32(i32 %load)
|
||||
ret i32 %bswap
|
||||
; CHECK-LABEL: test2:
|
||||
; CHECK-LABEL: test4:
|
||||
; CHECK: movbel (%rdi), %eax
|
||||
; SLM-LABEL: test2:
|
||||
; SLM-LABEL: test4:
|
||||
; SLM: movbel (%rdi), %eax
|
||||
}
|
||||
|
||||
define void @test3(i64* %x, i64 %y) nounwind {
|
||||
define void @test5(i64* %x, i64 %y) nounwind {
|
||||
%bswap = call i64 @llvm.bswap.i64(i64 %y)
|
||||
store i64 %bswap, i64* %x, align 8
|
||||
ret void
|
||||
; CHECK-LABEL: test3:
|
||||
; CHECK-LABEL: test5:
|
||||
; CHECK: movbeq %rsi, (%rdi)
|
||||
; SLM-LABEL: test3:
|
||||
; SLM-LABEL: test5:
|
||||
; SLM: movbeq %rsi, (%rdi)
|
||||
}
|
||||
|
||||
define i64 @test4(i64* %x) nounwind {
|
||||
define i64 @test6(i64* %x) nounwind {
|
||||
%load = load i64* %x, align 8
|
||||
%bswap = call i64 @llvm.bswap.i64(i64 %load)
|
||||
ret i64 %bswap
|
||||
; CHECK-LABEL: test4:
|
||||
; CHECK-LABEL: test6:
|
||||
; CHECK: movbeq (%rdi), %rax
|
||||
; SLM-LABEL: test4:
|
||||
; SLM-LABEL: test6:
|
||||
; SLM: movbeq (%rdi), %rax
|
||||
}
|
||||
|
Loading…
Reference in New Issue
Block a user