mirror of
https://github.com/RPCS3/llvm.git
synced 2025-04-05 06:41:51 +00:00
Speculatively micro-optimize memory-zeroing calls on Darwin 10.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@49048 91177308-0d34-0410-b5e6-96231b3b80d8
This commit is contained in:
parent
b6d5b14390
commit
68d599df37
@ -4560,6 +4560,11 @@ SDOperand X86TargetLowering::LowerMEMSET(SDOperand Op, SelectionDAG &DAG) {
|
|||||||
// address value and run time information about the CPU.
|
// address value and run time information about the CPU.
|
||||||
if ((Align & 3) != 0 ||
|
if ((Align & 3) != 0 ||
|
||||||
(I && I->getValue() > Subtarget->getMaxInlineSizeThreshold())) {
|
(I && I->getValue() > Subtarget->getMaxInlineSizeThreshold())) {
|
||||||
|
|
||||||
|
// Check to see if there is a specialized entry-point for memory zeroing.
|
||||||
|
const char *bzeroEntry = Subtarget->getBZeroEntry();
|
||||||
|
ConstantSDNode *V = dyn_cast<ConstantSDNode>(Op.getOperand(2));
|
||||||
|
|
||||||
MVT::ValueType IntPtr = getPointerTy();
|
MVT::ValueType IntPtr = getPointerTy();
|
||||||
const Type *IntPtrTy = getTargetData()->getIntPtrType();
|
const Type *IntPtrTy = getTargetData()->getIntPtrType();
|
||||||
TargetLowering::ArgListTy Args;
|
TargetLowering::ArgListTy Args;
|
||||||
@ -4567,15 +4572,20 @@ SDOperand X86TargetLowering::LowerMEMSET(SDOperand Op, SelectionDAG &DAG) {
|
|||||||
Entry.Node = Op.getOperand(1);
|
Entry.Node = Op.getOperand(1);
|
||||||
Entry.Ty = IntPtrTy;
|
Entry.Ty = IntPtrTy;
|
||||||
Args.push_back(Entry);
|
Args.push_back(Entry);
|
||||||
|
|
||||||
|
if (!bzeroEntry) {
|
||||||
// Extend the unsigned i8 argument to be an int value for the call.
|
// Extend the unsigned i8 argument to be an int value for the call.
|
||||||
Entry.Node = DAG.getNode(ISD::ZERO_EXTEND, MVT::i32, Op.getOperand(2));
|
Entry.Node = DAG.getNode(ISD::ZERO_EXTEND, MVT::i32, Op.getOperand(2));
|
||||||
Entry.Ty = IntPtrTy;
|
Entry.Ty = IntPtrTy;
|
||||||
Args.push_back(Entry);
|
Args.push_back(Entry);
|
||||||
|
}
|
||||||
|
|
||||||
Entry.Node = Op.getOperand(3);
|
Entry.Node = Op.getOperand(3);
|
||||||
Args.push_back(Entry);
|
Args.push_back(Entry);
|
||||||
|
const char *Name = bzeroEntry ? bzeroEntry : "memset";
|
||||||
std::pair<SDOperand,SDOperand> CallResult =
|
std::pair<SDOperand,SDOperand> CallResult =
|
||||||
LowerCallTo(Chain, Type::VoidTy, false, false, false, CallingConv::C,
|
LowerCallTo(Chain, Type::VoidTy, false, false, false, CallingConv::C,
|
||||||
false, DAG.getExternalSymbol("memset", IntPtr), Args, DAG);
|
false, DAG.getExternalSymbol(Name, IntPtr), Args, DAG);
|
||||||
return CallResult.second;
|
return CallResult.second;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -53,6 +53,20 @@ bool X86Subtarget::GVRequiresExtraLoad(const GlobalValue* GV,
|
|||||||
return false;
|
return false;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/// This function returns the name of a function which has an interface
|
||||||
|
/// like the non-standard bzero function, if such a function exists on
|
||||||
|
/// the current subtarget and it is considered preferable over
|
||||||
|
/// memset with zero passed as the second argument. Otherwise it
|
||||||
|
/// returns null.
|
||||||
|
const char *X86Subtarget::getBZeroEntry() const {
|
||||||
|
|
||||||
|
// Darwin 10 has a __bzero entry point for this purpose.
|
||||||
|
if (getDarwinVers() >= 10)
|
||||||
|
return "__bzero";
|
||||||
|
|
||||||
|
return 0;
|
||||||
|
}
|
||||||
|
|
||||||
/// GetCpuIDAndInfo - Execute the specified cpuid and return the 4 values in the
|
/// GetCpuIDAndInfo - Execute the specified cpuid and return the 4 values in the
|
||||||
/// specified arguments. If we can't run cpuid on the host, return true.
|
/// specified arguments. If we can't run cpuid on the host, return true.
|
||||||
bool X86::GetCpuIDAndInfo(unsigned value, unsigned *rEAX, unsigned *rEBX,
|
bool X86::GetCpuIDAndInfo(unsigned value, unsigned *rEAX, unsigned *rEBX,
|
||||||
|
@ -171,6 +171,12 @@ public:
|
|||||||
bool GVRequiresExtraLoad(const GlobalValue* GV, const TargetMachine& TM,
|
bool GVRequiresExtraLoad(const GlobalValue* GV, const TargetMachine& TM,
|
||||||
bool isDirectCall) const;
|
bool isDirectCall) const;
|
||||||
|
|
||||||
|
/// This function returns the name of a function which has an interface
|
||||||
|
/// like the non-standard bzero function, if such a function exists on
|
||||||
|
/// the current subtarget and it is considered preferable over
|
||||||
|
/// memset with zero passed as the second argument. Otherwise it
|
||||||
|
/// returns null.
|
||||||
|
const char *getBZeroEntry() const;
|
||||||
};
|
};
|
||||||
|
|
||||||
namespace X86 {
|
namespace X86 {
|
||||||
|
8
test/CodeGen/X86/darwin-bzero.ll
Normal file
8
test/CodeGen/X86/darwin-bzero.ll
Normal file
@ -0,0 +1,8 @@
|
|||||||
|
; RUN: llvm-as < %s | llc -mtriple=i386-apple-darwin10 | grep __bzero
|
||||||
|
|
||||||
|
declare void @llvm.memset.i32(i8*, i8, i32, i32)
|
||||||
|
|
||||||
|
define void @foo(i8* %p, i32 %len) {
|
||||||
|
call void @llvm.memset.i32(i8* %p, i8 0, i32 %len, i32 1);
|
||||||
|
ret void
|
||||||
|
}
|
Loading…
x
Reference in New Issue
Block a user