mirror of
https://github.com/RPCS3/llvm.git
synced 2024-11-28 14:10:55 +00:00
3e5d5c53a0
The xorps instruction is smaller than pxor, so prefer that encoding. The ExecutionDepsFix pass will switch the encoding to pxor and xorpd when appropriate. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@143996 91177308-0d34-0410-b5e6-96231b3b80d8
31 lines
906 B
LLVM
31 lines
906 B
LLVM
; RUN: llc < %s -march=x86 -mattr=+sse2 | FileCheck %s
|
|
|
|
; CHECK: foo
|
|
; CHECK: xorps
|
|
define void @foo(<4 x float>* %P) {
|
|
%T = load <4 x float>* %P ; <<4 x float>> [#uses=1]
|
|
%S = fadd <4 x float> zeroinitializer, %T ; <<4 x float>> [#uses=1]
|
|
store <4 x float> %S, <4 x float>* %P
|
|
ret void
|
|
}
|
|
|
|
; CHECK: bar
|
|
; CHECK: pxor
|
|
define void @bar(<4 x i32>* %P) {
|
|
%T = load <4 x i32>* %P ; <<4 x i32>> [#uses=1]
|
|
%S = add <4 x i32> zeroinitializer, %T ; <<4 x i32>> [#uses=1]
|
|
store <4 x i32> %S, <4 x i32>* %P
|
|
ret void
|
|
}
|
|
|
|
; Without any type hints from operations, we fall back to the smaller xorps.
|
|
; The IR type <4 x i32> is ignored.
|
|
; CHECK: untyped_zero
|
|
; CHECK: xorps
|
|
; CHECK: movaps
|
|
define void @untyped_zero(<4 x i32>* %p) {
|
|
entry:
|
|
store <4 x i32> zeroinitializer, <4 x i32>* %p, align 16
|
|
ret void
|
|
}
|