mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2024-12-11 13:37:07 +00:00
4c381d496d
InstSimplify should do all transformations that ConstProp does, but one thing that ConstProp does that InstSimplify wouldn't is inline vector instructions that are constants, e.g. into a ret. Previously vector instructions wouldn't be inlined in InstSimplify because llvm::Simplify*Instruction() would return nullptr for specific instructions, such as vector instructions that were actually constants, if it couldn't simplify them. This changes SimplifyInsertElementInst, SimplifyExtractElementInst, and SimplifyShuffleVectorInst to return a vector constant when possible. Reviewed By: efriedma Differential Revision: https://reviews.llvm.org/D85946
199 lines
7.6 KiB
LLVM
199 lines
7.6 KiB
LLVM
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
; RUN: opt < %s -instsimplify -S -verify | FileCheck %s

;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
;; Vector Operations
;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;

; insertelement

; Inserting at an undef index: the CHECK lines expect the whole result to fold
; to an undef vector.
define <vscale x 4 x i32> @insertelement_idx_undef(<vscale x 4 x i32> %a) {
; CHECK-LABEL: @insertelement_idx_undef(
; CHECK-NEXT:    ret <vscale x 4 x i32> undef
;
  %r = insertelement <vscale x 4 x i32> %a, i32 5, i64 undef
  ret <vscale x 4 x i32> %r
}

; Inserting an undef value at index 0: the CHECK lines expect the
; insertelement to be left in place.
define <vscale x 4 x i32> @insertelement_value_undef(<vscale x 4 x i32> %a) {
; CHECK-LABEL: @insertelement_value_undef(
; CHECK-NEXT:    [[R:%.*]] = insertelement <vscale x 4 x i32> [[A:%.*]], i32 undef, i64 0
; CHECK-NEXT:    ret <vscale x 4 x i32> [[R]]
;
  %r = insertelement <vscale x 4 x i32> %a, i32 undef, i64 0
  ret <vscale x 4 x i32> %r
}

; Index 4 equals the minimum element count of <vscale x 4 x i32>, so whether it
; is in bounds depends on the runtime vscale. The CHECK lines expect the
; insertelement to be left in place.
define <vscale x 4 x i32> @insertelement_idx_maybe_out_of_bound(<vscale x 4 x i32> %a) {
; CHECK-LABEL: @insertelement_idx_maybe_out_of_bound(
; CHECK-NEXT:    [[R:%.*]] = insertelement <vscale x 4 x i32> [[A:%.*]], i32 5, i64 4
; CHECK-NEXT:    ret <vscale x 4 x i32> [[R]]
;
  %r = insertelement <vscale x 4 x i32> %a, i32 5, i64 4
  ret <vscale x 4 x i32> %r
}

; Inserting at a large constant index (12345) into a scalable vector: the CHECK
; lines expect the insertelement to be left in place.
define <vscale x 4 x i32> @insertelement_idx_large_bound(<vscale x 4 x i32> %a) {
; CHECK-LABEL: @insertelement_idx_large_bound(
; CHECK-NEXT:    [[R:%.*]] = insertelement <vscale x 4 x i32> [[A:%.*]], i32 5, i64 12345
; CHECK-NEXT:    ret <vscale x 4 x i32> [[R]]
;
  %r = insertelement <vscale x 4 x i32> %a, i32 5, i64 12345
  ret <vscale x 4 x i32> %r
}

; Extracting lane 1 of %a and inserting it back into lane 1 of %a is expected
; to fold to %a itself.
define <vscale x 4 x i32> @insert_extract_element_same_vec_idx_1(<vscale x 4 x i32> %a) {
; CHECK-LABEL: @insert_extract_element_same_vec_idx_1(
; CHECK-NEXT:    ret <vscale x 4 x i32> [[A:%.*]]
;
  %v = extractelement <vscale x 4 x i32> %a, i64 1
  %r = insertelement <vscale x 4 x i32> %a, i32 %v, i64 1
  ret <vscale x 4 x i32> %r
}

; An insertelement whose operands are all constants is expected to become a
; constant expression used directly as the ret operand.
define <vscale x 4 x i32> @insertelement_inline_to_ret() {
; CHECK-LABEL: @insertelement_inline_to_ret(
; CHECK-NEXT:    ret <vscale x 4 x i32> insertelement (<vscale x 4 x i32> undef, i32 1, i32 0)
;
  %i = insertelement <vscale x 4 x i32> undef, i32 1, i32 0
  ret <vscale x 4 x i32> %i
}

; insertelement into lane 0 followed by a shufflevector with an all-zero mask
; (broadcast of lane 0), all on constant operands: expected to become one
; nested constant expression used directly as the ret operand.
define <vscale x 4 x i32> @insertelement_shufflevector_inline_to_ret() {
; CHECK-LABEL: @insertelement_shufflevector_inline_to_ret(
; CHECK-NEXT:    ret <vscale x 4 x i32> shufflevector (<vscale x 4 x i32> insertelement (<vscale x 4 x i32> undef, i32 1, i32 0), <vscale x 4 x i32> undef, <vscale x 4 x i32> zeroinitializer)
;
  %i = insertelement <vscale x 4 x i32> undef, i32 1, i32 0
  %i2 = shufflevector <vscale x 4 x i32> %i, <vscale x 4 x i32> undef, <vscale x 4 x i32> zeroinitializer
  ret <vscale x 4 x i32> %i2
}

; extractelement

; Extracting at an undef index: the CHECK lines expect the result to fold to
; undef.
define i32 @extractelement_idx_undef(<vscale x 4 x i32> %a) {
; CHECK-LABEL: @extractelement_idx_undef(
; CHECK-NEXT:    ret i32 undef
;
  %r = extractelement <vscale x 4 x i32> %a, i64 undef
  ret i32 %r
}

; Extracting from an undef vector: the CHECK lines expect the result to fold to
; undef. The %a argument is not used by the body.
define i32 @extractelement_vec_undef(<vscale x 4 x i32> %a) {
; CHECK-LABEL: @extractelement_vec_undef(
; CHECK-NEXT:    ret i32 undef
;
  %r = extractelement <vscale x 4 x i32> undef, i64 1
  ret i32 %r
}

; Index 4 equals the minimum element count of <vscale x 4 x i32>, so whether it
; is in bounds depends on the runtime vscale. The CHECK lines expect the
; extractelement to be left in place.
define i32 @extractelement_idx_maybe_out_of_bound(<vscale x 4 x i32> %a) {
; CHECK-LABEL: @extractelement_idx_maybe_out_of_bound(
; CHECK-NEXT:    [[R:%.*]] = extractelement <vscale x 4 x i32> [[A:%.*]], i64 4
; CHECK-NEXT:    ret i32 [[R]]
;
  %r = extractelement <vscale x 4 x i32> %a, i64 4
  ret i32 %r
}

; Extracting at a large constant index (12345) from a scalable vector: the
; CHECK lines expect the extractelement to be left in place.
define i32 @extractelement_idx_large_bound(<vscale x 4 x i32> %a) {
; CHECK-LABEL: @extractelement_idx_large_bound(
; CHECK-NEXT:    [[R:%.*]] = extractelement <vscale x 4 x i32> [[A:%.*]], i64 12345
; CHECK-NEXT:    ret i32 [[R]]
;
  %r = extractelement <vscale x 4 x i32> %a, i64 12345
  ret i32 %r
}

; Inserting 1 at index 4 and then extracting index 4 from the result is
; expected to fold to the inserted value 1.
define i32 @insert_extract_element_same_vec_idx_2() {
; CHECK-LABEL: @insert_extract_element_same_vec_idx_2(
; CHECK-NEXT:    ret i32 1
;
  %v = insertelement <vscale x 4 x i32> undef, i32 1, i64 4
  %r = extractelement <vscale x 4 x i32> %v, i64 4
  ret i32 %r
}

; Same insert-then-extract at index 4, but with the insertelement written as a
; constant-expression operand of the extractelement; expected to fold to 1.
define i32 @insert_extract_element_same_vec_idx_3() {
; CHECK-LABEL: @insert_extract_element_same_vec_idx_3(
; CHECK-NEXT:    ret i32 1
;
  %r = extractelement <vscale x 4 x i32> insertelement (<vscale x 4 x i32> undef, i32 1, i64 4), i64 4
  ret i32 %r
}

; Two nested constant-expression inserts: 1 at index 4 (i32 index type) and
; then 2 at index 3 (i64 index type). Extracting index 4 is expected to skip
; the outer insert and fold to the inner inserted value 1.
define i32 @insert_extract_element_same_vec_idx_4() {
; CHECK-LABEL: @insert_extract_element_same_vec_idx_4(
; CHECK-NEXT:    ret i32 1
;
  %r = extractelement <vscale x 4 x i32> insertelement (<vscale x 4 x i32> insertelement (<vscale x 4 x i32> undef, i32 1, i32 4), i32 2, i64 3), i64 4
  ret i32 %r
}

; more complicated expressions

; Every lane of %x is compared "signed <=" against 9223372036854775807 (the
; largest signed i64), which always holds. The compare is expected to fold to
; a constant vector with every lane true.
define <vscale x 2 x i1> @cmp_le_smax_always_true(<vscale x 2 x i64> %x) {
; CHECK-LABEL: @cmp_le_smax_always_true(
; CHECK-NEXT:    ret <vscale x 2 x i1> shufflevector (<vscale x 2 x i1> insertelement (<vscale x 2 x i1> undef, i1 true, i32 0), <vscale x 2 x i1> undef, <vscale x 2 x i32> zeroinitializer)
;
  %cmp = icmp sle <vscale x 2 x i64> %x, shufflevector (<vscale x 2 x i64> insertelement (<vscale x 2 x i64> undef, i64 9223372036854775807, i32 0), <vscale x 2 x i64> undef, <vscale x 2 x i32> zeroinitializer)
  ret <vscale x 2 x i1> %cmp
}

; insertelement + zero-mask shufflevector on constants, then a bitcast to
; <vscale x 4 x float>: the whole chain is expected to become one nested
; constant expression used directly as the ret operand.
define <vscale x 4 x float> @bitcast() {
; CHECK-LABEL: @bitcast(
; CHECK-NEXT:    ret <vscale x 4 x float> bitcast (<vscale x 4 x i32> shufflevector (<vscale x 4 x i32> insertelement (<vscale x 4 x i32> undef, i32 1, i32 0), <vscale x 4 x i32> undef, <vscale x 4 x i32> zeroinitializer) to <vscale x 4 x float>)
;
  %i1 = insertelement <vscale x 4 x i32> undef, i32 1, i32 0
  %i2 = shufflevector <vscale x 4 x i32> %i1, <vscale x 4 x i32> undef, <vscale x 4 x i32> zeroinitializer
  %i3 = bitcast <vscale x 4 x i32> %i2 to <vscale x 4 x float>
  ret <vscale x 4 x float> %i3
}

;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;
;; Memory Access and Addressing Operations
;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;

; getelementptr

; GEP with an all-null vector-of-pointers base and an undef index vector:
; expected to fold to zeroinitializer.
define <vscale x 4 x i32*> @getelementptr_constant_foldable_1() {
; CHECK-LABEL: @getelementptr_constant_foldable_1(
; CHECK-NEXT:    ret <vscale x 4 x i32*> zeroinitializer
;
  %ptr = getelementptr i32, <vscale x 4 x i32*> zeroinitializer, <vscale x 4 x i64> undef
  ret <vscale x 4 x i32*> %ptr
}

; GEP with a scalar null base pointer and an undef vector index, producing a
; vector of pointers: expected to fold to zeroinitializer.
define <vscale x 4 x <vscale x 4 x i32>*> @getelementptr_constant_foldable_2() {
; CHECK-LABEL: @getelementptr_constant_foldable_2(
; CHECK-NEXT:    ret <vscale x 4 x <vscale x 4 x i32>*> zeroinitializer
;
  %ptr = getelementptr <vscale x 4 x i32>, <vscale x 4 x i32>* null, <vscale x 4 x i64> undef
  ret <vscale x 4 x <vscale x 4 x i32>*> %ptr
}

; fold getelementptr P, 0 -> P.
; Here P is null, so the expected result is a plain null pointer.
define <vscale x 4 x i32>* @getelementptr_constant_foldable_3() {
; CHECK-LABEL: @getelementptr_constant_foldable_3(
; CHECK-NEXT:    ret <vscale x 4 x i32>* null
;
  %ptr = getelementptr <vscale x 4 x i32>, <vscale x 4 x i32>* null, i64 0
  ret <vscale x 4 x i32>* %ptr
}

; GEP on null with a non-constant index %x: the CHECK lines expect the
; getelementptr to be left in place.
define <vscale x 4 x i32>* @getelementptr_not_constant_foldable(i64 %x) {
; CHECK-LABEL: @getelementptr_not_constant_foldable(
; CHECK-NEXT:    [[PTR:%.*]] = getelementptr <vscale x 4 x i32>, <vscale x 4 x i32>* null, i64 [[X:%.*]]
; CHECK-NEXT:    ret <vscale x 4 x i32>* [[PTR]]
;
  %ptr = getelementptr <vscale x 4 x i32>, <vscale x 4 x i32>* null, i64 %x
  ret <vscale x 4 x i32>* %ptr
}

; Check GEP's result is known to be non-null.
; An inbounds GEP one element past %ptr is compared against null; the compare
; is expected to fold to false.
define i1 @getelementptr_check_non_null(<vscale x 16 x i8>* %ptr) {
; CHECK-LABEL: @getelementptr_check_non_null(
; CHECK-NEXT:    ret i1 false
;
  %x = getelementptr inbounds <vscale x 16 x i8>, <vscale x 16 x i8>* %ptr, i32 1
  %cmp = icmp eq <vscale x 16 x i8>* %x, null
  ret i1 %cmp
}