mirror of
https://github.com/RPCS3/llvm.git
synced 2025-04-04 22:31:44 +00:00

Summary: SamplePGO uses binaries built with -gmlt to collect profiles. The current -gmlt debug info is limited, and we need some additional info: * start line of all subprograms * linkage name of all subprograms * standalone subprograms (functions that have neither inlined other functions nor been inlined) This patch adds this information to the -gmlt binary. The impact on speccpu2006 binary size (size increase compared with the -g0 binary, also includes data for the -g binary, which does not change with this patch): -gmlt(orig) -gmlt(patched) -g 433.milc 4.68% 5.40% 19.73% 444.namd 8.45% 8.93% 45.99% 447.dealII 97.43% 115.21% 374.89% 450.soplex 27.75% 31.88% 126.04% 453.povray 21.81% 26.16% 92.03% 470.lbm 0.60% 0.67% 1.96% 482.sphinx3 5.77% 6.47% 26.17% 400.perlbench 17.81% 19.43% 73.08% 401.bzip2 3.73% 3.92% 12.18% 403.gcc 31.75% 34.48% 122.75% 429.mcf 0.78% 0.88% 3.89% 445.gobmk 6.08% 7.92% 42.27% 456.hmmer 10.36% 11.25% 35.23% 458.sjeng 5.08% 5.42% 14.36% 462.libquantum 1.71% 1.96% 6.36% 464.h264ref 15.61% 16.56% 43.92% 471.omnetpp 11.93% 15.84% 60.09% 473.astar 3.11% 3.69% 14.18% 483.xalancbmk 56.29% 81.63% 353.22% geomean 15.60% 18.30% 57.81% Debug info size change for the -gmlt binary with this patch: 433.milc 13.46% 444.namd 5.35% 447.dealII 18.21% 450.soplex 14.68% 453.povray 19.65% 470.lbm 6.03% 482.sphinx3 11.21% 400.perlbench 8.91% 401.bzip2 4.41% 403.gcc 8.56% 429.mcf 8.24% 445.gobmk 29.47% 456.hmmer 8.19% 458.sjeng 6.05% 462.libquantum 11.23% 464.h264ref 5.93% 471.omnetpp 31.89% 473.astar 16.20% 483.xalancbmk 44.62% geomean 16.83% Reviewers: davidxl, echristo, dblaikie Reviewed By: echristo, dblaikie Subscribers: aprantl, probinson, llvm-commits, mehdi_amini Differential Revision: https://reviews.llvm.org/D25434 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@292457 91177308-0d34-0410-b5e6-96231b3b80d8
231 lines
8.5 KiB
C++
231 lines
8.5 KiB
C++
//===-- TargetMachine.cpp - General Target Information ---------------------==//
|
|
//
|
|
// The LLVM Compiler Infrastructure
|
|
//
|
|
// This file is distributed under the University of Illinois Open Source
|
|
// License. See LICENSE.TXT for details.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
// This file describes the general parts of a Target machine.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "llvm/Target/TargetMachine.h"
|
|
#include "llvm/Analysis/TargetTransformInfo.h"
|
|
#include "llvm/CodeGen/MachineFunction.h"
|
|
#include "llvm/IR/Function.h"
|
|
#include "llvm/IR/GlobalAlias.h"
|
|
#include "llvm/IR/GlobalValue.h"
|
|
#include "llvm/IR/GlobalVariable.h"
|
|
#include "llvm/IR/LegacyPassManager.h"
|
|
#include "llvm/IR/Mangler.h"
|
|
#include "llvm/MC/MCAsmInfo.h"
|
|
#include "llvm/MC/MCContext.h"
|
|
#include "llvm/MC/MCInstrInfo.h"
|
|
#include "llvm/MC/MCSectionMachO.h"
|
|
#include "llvm/MC/MCTargetOptions.h"
|
|
#include "llvm/MC/SectionKind.h"
|
|
#include "llvm/Target/TargetLowering.h"
|
|
#include "llvm/Target/TargetLoweringObjectFile.h"
|
|
#include "llvm/Target/TargetSubtargetInfo.h"
|
|
using namespace llvm;
|
|
|
|
/// Hidden -enable-ipra command-line flag, false unless given. The
/// TargetMachine constructor copies it into its TargetOptions only when the
/// flag actually occurs on the command line.
cl::opt<bool> EnableIPRA(
    "enable-ipra", cl::init(false), cl::Hidden,
    cl::desc("Enable interprocedural register allocation "
             "to reduce load/store at procedure calls."));
|
|
|
|
/// Hidden -debug-info-for-profiling command-line flag, false unless given.
/// The TargetMachine constructor copies it into its TargetOptions only when
/// the flag actually occurs on the command line.
cl::opt<bool> DebugInfoForProfiling(
    "debug-info-for-profiling", cl::init(false), cl::Hidden,
    cl::desc("Emit extra debug info to make sample profile more accurate."));
|
|
|
|
//---------------------------------------------------------------------------
|
|
// TargetMachine Class
|
|
//
|
|
|
|
/// Records the target description handed in by the caller and starts with no
/// MC-layer objects (AsmInfo, MRI, MII and STI are all null).
///
/// \p Options is stored twice: once as DefaultOptions and once as the working
/// Options. The two command-line flags defined in this file are then applied
/// to the working copy only.
TargetMachine::TargetMachine(const Target &T, StringRef DataLayoutString,
                             const Triple &TT, StringRef CPU, StringRef FS,
                             const TargetOptions &Options)
    : TheTarget(T), DL(DataLayoutString), TargetTriple(TT), TargetCPU(CPU),
      TargetFS(FS), AsmInfo(nullptr), MRI(nullptr), MII(nullptr), STI(nullptr),
      RequireStructuredCFG(false), DefaultOptions(Options), Options(Options) {
  // A flag only overrides the caller's setting when it was really passed; an
  // absent flag must not reset the value to the flag's default.
  const bool IPRAFlagGiven = EnableIPRA.getNumOccurrences() != 0;
  if (IPRAFlagGiven) {
    this->Options.EnableIPRA = EnableIPRA;
  }

  const bool ProfilingFlagGiven = DebugInfoForProfiling.getNumOccurrences() != 0;
  if (ProfilingFlagGiven) {
    this->Options.DebugInfoForProfiling = DebugInfoForProfiling;
  }
}
|
|
|
|
/// Deletes the objects held through the AsmInfo, MRI, MII and STI pointers.
/// The base constructor leaves all four null, and deleting null is a no-op.
TargetMachine::~TargetMachine() {
  delete AsmInfo;
  delete MRI;
  delete MII;
  delete STI;
}
|
|
|
|
bool TargetMachine::isPositionIndependent() const {
|
|
return getRelocationModel() == Reloc::PIC_;
|
|
}
|
|
|
|
/// \brief Reset the target options based on the function's attributes.
|
|
// FIXME: This function needs to go away for a number of reasons:
|
|
// a) global state on the TargetMachine is terrible in general,
|
|
// b) these target options should be passed only on the function
|
|
// and not on the TargetMachine (via TargetOptions) at all.
|
|
void TargetMachine::resetTargetOptions(const Function &F) const {
|
|
#define RESET_OPTION(X, Y) \
|
|
do { \
|
|
if (F.hasFnAttribute(Y)) \
|
|
Options.X = (F.getFnAttribute(Y).getValueAsString() == "true"); \
|
|
else \
|
|
Options.X = DefaultOptions.X; \
|
|
} while (0)
|
|
|
|
RESET_OPTION(LessPreciseFPMADOption, "less-precise-fpmad");
|
|
RESET_OPTION(UnsafeFPMath, "unsafe-fp-math");
|
|
RESET_OPTION(NoInfsFPMath, "no-infs-fp-math");
|
|
RESET_OPTION(NoNaNsFPMath, "no-nans-fp-math");
|
|
RESET_OPTION(NoTrappingFPMath, "no-trapping-math");
|
|
|
|
StringRef Denormal =
|
|
F.getFnAttribute("denormal-fp-math").getValueAsString();
|
|
if (Denormal == "ieee")
|
|
Options.FPDenormalMode = FPDenormal::IEEE;
|
|
else if (Denormal == "preserve-sign")
|
|
Options.FPDenormalMode = FPDenormal::PreserveSign;
|
|
else if (Denormal == "positive-zero")
|
|
Options.FPDenormalMode = FPDenormal::PositiveZero;
|
|
else
|
|
Options.FPDenormalMode = DefaultOptions.FPDenormalMode;
|
|
}
|
|
|
|
/// Returns the code generation relocation model. The choices are static, PIC,
|
|
/// and dynamic-no-pic.
|
|
Reloc::Model TargetMachine::getRelocationModel() const { return RM; }
|
|
|
|
/// Returns the code model. The choices are small, kernel, medium, large, and
|
|
/// target default.
|
|
CodeModel::Model TargetMachine::getCodeModel() const { return CMModel; }
|
|
|
|
/// Get the IR-specified TLS model for Var.
|
|
static TLSModel::Model getSelectedTLSModel(const GlobalValue *GV) {
|
|
switch (GV->getThreadLocalMode()) {
|
|
case GlobalVariable::NotThreadLocal:
|
|
llvm_unreachable("getSelectedTLSModel for non-TLS variable");
|
|
break;
|
|
case GlobalVariable::GeneralDynamicTLSModel:
|
|
return TLSModel::GeneralDynamic;
|
|
case GlobalVariable::LocalDynamicTLSModel:
|
|
return TLSModel::LocalDynamic;
|
|
case GlobalVariable::InitialExecTLSModel:
|
|
return TLSModel::InitialExec;
|
|
case GlobalVariable::LocalExecTLSModel:
|
|
return TLSModel::LocalExec;
|
|
}
|
|
llvm_unreachable("invalid TLS model");
|
|
}
|
|
|
|
bool TargetMachine::shouldAssumeDSOLocal(const Module &M,
|
|
const GlobalValue *GV) const {
|
|
Reloc::Model RM = getRelocationModel();
|
|
const Triple &TT = getTargetTriple();
|
|
|
|
// DLLImport explicitly marks the GV as external.
|
|
if (GV && GV->hasDLLImportStorageClass())
|
|
return false;
|
|
|
|
// Every other GV is local on COFF.
|
|
// Make an exception for windows OS in the triple: Some firmwares builds use
|
|
// *-win32-macho triples. This (accidentally?) produced windows relocations
|
|
// without GOT tables in older clang versions; Keep this behaviour.
|
|
if (TT.isOSBinFormatCOFF() || (TT.isOSWindows() && TT.isOSBinFormatMachO()))
|
|
return true;
|
|
|
|
if (GV && (GV->hasLocalLinkage() || !GV->hasDefaultVisibility()))
|
|
return true;
|
|
|
|
if (TT.isOSBinFormatMachO()) {
|
|
if (RM == Reloc::Static)
|
|
return true;
|
|
return GV && GV->isStrongDefinitionForLinker();
|
|
}
|
|
|
|
assert(TT.isOSBinFormatELF());
|
|
assert(RM != Reloc::DynamicNoPIC);
|
|
|
|
bool IsExecutable =
|
|
RM == Reloc::Static || M.getPIELevel() != PIELevel::Default;
|
|
if (IsExecutable) {
|
|
// If the symbol is defined, it cannot be preempted.
|
|
if (GV && !GV->isDeclarationForLinker())
|
|
return true;
|
|
|
|
bool IsTLS = GV && GV->isThreadLocal();
|
|
bool IsAccessViaCopyRelocs =
|
|
Options.MCOptions.MCPIECopyRelocations && GV && isa<GlobalVariable>(GV);
|
|
// Check if we can use copy relocations.
|
|
if (!IsTLS && (RM == Reloc::Static || IsAccessViaCopyRelocs))
|
|
return true;
|
|
}
|
|
|
|
// ELF supports preemption of other symbols.
|
|
return false;
|
|
}
|
|
|
|
/// Picks the TLS model to use for the thread-local value \p GV.
///
/// A baseline is derived from two facts: whether we are building a shared
/// library (PIC relocation model and no PIE level on GV's module) and whether
/// GV may be assumed DSO-local. The model written in the IR replaces the
/// baseline only when it compares greater.
TLSModel::Model TargetMachine::getTLSModel(const GlobalValue *GV) const {
  const Module &M = *GV->getParent();
  const bool IsPIE = M.getPIELevel() != PIELevel::Default;
  const bool IsSharedLibrary = getRelocationModel() == Reloc::PIC_ && !IsPIE;
  const bool IsLocal = shouldAssumeDSOLocal(M, GV);

  const TLSModel::Model Baseline =
      IsSharedLibrary
          ? (IsLocal ? TLSModel::LocalDynamic : TLSModel::GeneralDynamic)
          : (IsLocal ? TLSModel::LocalExec : TLSModel::InitialExec);

  // If the user specified a more specific model, use that.
  // NOTE(review): this relies on the TLSModel::Model enumerators being
  // declared in increasing order of specificity -- confirm in the enum's
  // definition.
  const TLSModel::Model Requested = getSelectedTLSModel(GV);
  return Requested > Baseline ? Requested : Baseline;
}
|
|
|
|
/// Returns the optimization level: None, Less, Default, or Aggressive.
|
|
CodeGenOpt::Level TargetMachine::getOptLevel() const { return OptLevel; }
|
|
|
|
/// Replaces the stored optimization level with \p Level.
void TargetMachine::setOptLevel(CodeGenOpt::Level Level) {
  OptLevel = Level;
}
|
|
|
|
/// Returns a TargetIRAnalysis whose callback builds a TargetTransformInfo
/// from nothing but the data layout of the module that owns the function.
TargetIRAnalysis TargetMachine::getTargetIRAnalysis() {
  // Captures nothing: the result depends only on the function passed in.
  auto MakeTTI = [](const Function &F) {
    const Module *Parent = F.getParent();
    return TargetTransformInfo(Parent->getDataLayout());
  };
  return TargetIRAnalysis(MakeTTI);
}
|
|
|
|
/// Writes the prefixed name of \p GV into \p Name.
///
/// Private-linkage values are routed through the object-file lowering unless
/// \p MayAlwaysUsePrivate is set; everything else is handled by \p Mang
/// directly.
void TargetMachine::getNameWithPrefix(SmallVectorImpl<char> &Name,
                                      const GlobalValue *GV, Mangler &Mang,
                                      bool MayAlwaysUsePrivate) const {
  const bool AskObjFileLowering =
      !MayAlwaysUsePrivate && GV->hasPrivateLinkage();
  if (AskObjFileLowering) {
    const TargetLoweringObjectFile *Lowering = getObjFileLowering();
    Lowering->getNameWithPrefix(Name, GV, *this);
    return;
  }

  // Simple case: If GV is not private, it is not important to find out if
  // private labels are legal in this case or not.
  Mang.getNameWithPrefix(Name, GV, false);
}
|
|
|
|
/// Returns the MCSymbol for \p GV: its prefixed name is computed with the
/// object-file lowering's mangler and then looked up, or created, in that
/// lowering's context.
MCSymbol *TargetMachine::getSymbol(const GlobalValue *GV) const {
  const TargetLoweringObjectFile *Lowering = getObjFileLowering();

  SmallString<128> Mangled;
  getNameWithPrefix(Mangled, GV, Lowering->getMangler());

  auto &Ctx = Lowering->getContext();
  return Ctx.getOrCreateSymbol(Mangled);
}
|