; Mirror of https://github.com/RPCSX/llvm.git
; Synced 2024-11-23 19:59:57 +00:00
; 69edad7913
;
; Turn expensive 64-bit shift into 32-bit if the shift does not overflow int:
;   shl (ext x) => zext (shl x)
; Differential Revision: https://reviews.llvm.org/D33367
; git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@303569 91177308-0d34-0410-b5e6-96231b3b80d8
;
; 46 lines, 1.3 KiB, LLVM
; RUN: llc -march=amdgcn < %s | FileCheck %s

; Zero-extended operand, shift cannot overflow 32 bits.
; The mask 1073741823 (0x3FFFFFFF) clears bits 31 and 30 of %x, so shifting
; the masked value left by 2 never carries out of the low 32 bits.
; Expected: a 32-bit scalar shift is emitted, and no 64-bit shift follows it.
; CHECK-LABEL: {{^}}zext_shl64_to_32:
; CHECK: s_lshl_b32
; CHECK-NOT: s_lshl_b64
define amdgpu_kernel void @zext_shl64_to_32(i64 addrspace(1)* nocapture %out, i32 %x) {
  %and = and i32 %x, 1073741823
  %ext = zext i32 %and to i64
  %shl = shl i64 %ext, 2
  store i64 %shl, i64 addrspace(1)* %out, align 4
  ret void
}

; Sign-extended operand, shift cannot overflow 32 bits.
; The mask 536870911 (0x1FFFFFFF) clears bits 31..29 of %x. The masked value
; is therefore non-negative, and after the shift by 2 it is at most
; 0x7FFFFFFC, which still fits in 32 bits.
; NOTE(review): the mask is one bit tighter than in the zext test, presumably
; so that the shifted 32-bit value also keeps its sign bit clear - confirm
; against the combine being tested.
; Expected: a 32-bit scalar shift is emitted, and no 64-bit shift follows it.
; CHECK-LABEL: {{^}}sext_shl64_to_32:
; CHECK: s_lshl_b32
; CHECK-NOT: s_lshl_b64
define amdgpu_kernel void @sext_shl64_to_32(i64 addrspace(1)* nocapture %out, i32 %x) {
  %and = and i32 %x, 536870911
  %ext = sext i32 %and to i64
  %shl = shl i64 %ext, 2
  store i64 %shl, i64 addrspace(1)* %out, align 4
  ret void
}

; Negative test: zero-extended operand, shift may overflow 32 bits.
; The mask 2147483647 (0x7FFFFFFF) clears only bit 31 of %x, so bits 30 and 29
; can still be set and the shift by 2 can carry into bits 32 and 33 of the
; i64 result. The shift must not be narrowed.
; Expected: a 64-bit scalar shift is emitted, and no 32-bit shift follows it.
; CHECK-LABEL: {{^}}zext_shl64_overflow:
; CHECK: s_lshl_b64
; CHECK-NOT: s_lshl_b32
define amdgpu_kernel void @zext_shl64_overflow(i64 addrspace(1)* nocapture %out, i32 %x) {
  %and = and i32 %x, 2147483647
  %ext = zext i32 %and to i64
  %shl = shl i64 %ext, 2
  store i64 %shl, i64 addrspace(1)* %out, align 4
  ret void
}

; Negative test: sign-extended operand, shift may overflow 32 bits.
; The mask 2147483647 (0x7FFFFFFF) clears only the sign bit of %x, so the
; extended value is non-negative but bits 30 and 29 can still be set. The
; shift by 2 can then carry into bits 32 and 33 of the i64 result, so the
; shift must not be narrowed.
; Expected: a 64-bit scalar shift is emitted, and no 32-bit shift follows it.
; CHECK-LABEL: {{^}}sext_shl64_overflow:
; CHECK: s_lshl_b64
; CHECK-NOT: s_lshl_b32
define amdgpu_kernel void @sext_shl64_overflow(i64 addrspace(1)* nocapture %out, i32 %x) {
  %and = and i32 %x, 2147483647
  %ext = sext i32 %and to i64
  %shl = shl i64 %ext, 2
  store i64 %shl, i64 addrspace(1)* %out, align 4
  ret void
}