mirror of
https://github.com/RPCS3/llvm-mirror.git
synced 2025-01-29 16:12:44 +00:00
Add support for additional in-reg vbroadcast patterns
llvm-svn: 157127
This commit is contained in:
parent
386e9a3f75
commit
441318ee29
@ -5026,12 +5026,18 @@ X86TargetLowering::LowerVectorBroadcast(SDValue &Op, SelectionDAG &DAG) const {
|
||||
}
|
||||
}
|
||||
|
||||
// The scalar source must be a normal load.
|
||||
if (!ISD::isNormalLoad(Ld.getNode()))
|
||||
return SDValue();
|
||||
|
||||
bool IsLoad = ISD::isNormalLoad(Ld.getNode());
|
||||
unsigned ScalarSize = Ld.getValueType().getSizeInBits();
|
||||
|
||||
// Handle AVX2 in-register broadcasts.
|
||||
if (!IsLoad && Subtarget->hasAVX2() &&
|
||||
(ScalarSize == 32 || (Is256 && ScalarSize == 64)))
|
||||
return DAG.getNode(X86ISD::VBROADCAST, dl, VT, Ld);
|
||||
|
||||
// The scalar source must be a normal load.
|
||||
if (!IsLoad)
|
||||
return SDValue();
|
||||
|
||||
if (ScalarSize == 32 || (Is256 && ScalarSize == 64))
|
||||
return DAG.getNode(X86ISD::VBROADCAST, dl, VT, Ld);
|
||||
|
||||
|
@ -222,3 +222,40 @@ footer349VF:
|
||||
ret:
|
||||
ret void
|
||||
}
|
||||
|
||||
; CHECK: _inreg0
|
||||
; CHECK: broadcastss
|
||||
; CHECK: ret
|
||||
define <8 x i32> @_inreg0(i32 %scalar) nounwind uwtable readnone ssp {
|
||||
%in = insertelement <8 x i32> undef, i32 %scalar, i32 0
|
||||
%wide = shufflevector <8 x i32> %in, <8 x i32> undef, <8 x i32> zeroinitializer
|
||||
ret <8 x i32> %wide
|
||||
}
|
||||
|
||||
; CHECK: _inreg1
|
||||
; CHECK: broadcastss
|
||||
; CHECK: ret
|
||||
define <8 x float> @_inreg1(float %scalar) nounwind uwtable readnone ssp {
|
||||
%in = insertelement <8 x float> undef, float %scalar, i32 0
|
||||
%wide = shufflevector <8 x float> %in, <8 x float> undef, <8 x i32> zeroinitializer
|
||||
ret <8 x float> %wide
|
||||
}
|
||||
|
||||
; CHECK: _inreg2
|
||||
; CHECK: broadcastss
|
||||
; CHECK: ret
|
||||
define <4 x float> @_inreg2(float %scalar) nounwind uwtable readnone ssp {
|
||||
%in = insertelement <4 x float> undef, float %scalar, i32 0
|
||||
%wide = shufflevector <4 x float> %in, <4 x float> undef, <4 x i32> zeroinitializer
|
||||
ret <4 x float> %wide
|
||||
}
|
||||
|
||||
; CHECK: _inreg3
|
||||
; CHECK: broadcastsd
|
||||
; CHECK: ret
|
||||
define <4 x double> @_inreg3(double %scalar) nounwind uwtable readnone ssp {
|
||||
%in = insertelement <4 x double> undef, double %scalar, i32 0
|
||||
%wide = shufflevector <4 x double> %in, <4 x double> undef, <4 x i32> zeroinitializer
|
||||
ret <4 x double> %wide
|
||||
}
|
||||
|
||||
|
Loading…
x
Reference in New Issue
Block a user