mirror of
https://github.com/capstone-engine/llvm-capstone.git
synced 2024-12-03 19:32:35 +00:00
f3dc9649ce
llvm-svn: 346431
549 lines
16 KiB
C++
549 lines
16 KiB
C++
//===- SymbolTable.cpp ----------------------------------------------------===//
|
|
//
|
|
// The LLVM Linker
|
|
//
|
|
// This file is distributed under the University of Illinois Open Source
|
|
// License. See LICENSE.TXT for details.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "SymbolTable.h"
|
|
#include "Config.h"
|
|
#include "Driver.h"
|
|
#include "LTO.h"
|
|
#include "PDB.h"
|
|
#include "Symbols.h"
|
|
#include "lld/Common/ErrorHandler.h"
|
|
#include "lld/Common/Memory.h"
|
|
#include "lld/Common/Timer.h"
|
|
#include "llvm/IR/LLVMContext.h"
|
|
#include "llvm/Support/Debug.h"
|
|
#include "llvm/Support/raw_ostream.h"
|
|
#include <utility>
|
|
|
|
using namespace llvm;
|
|
|
|
namespace lld {
|
|
namespace coff {
|
|
|
|
static Timer LTOTimer("LTO", Timer::root());
|
|
|
|
SymbolTable *Symtab;
|
|
|
|
void SymbolTable::addFile(InputFile *File) {
|
|
log("Reading " + toString(File));
|
|
File->parse();
|
|
|
|
MachineTypes MT = File->getMachineType();
|
|
if (Config->Machine == IMAGE_FILE_MACHINE_UNKNOWN) {
|
|
Config->Machine = MT;
|
|
} else if (MT != IMAGE_FILE_MACHINE_UNKNOWN && Config->Machine != MT) {
|
|
error(toString(File) + ": machine type " + machineToStr(MT) +
|
|
" conflicts with " + machineToStr(Config->Machine));
|
|
return;
|
|
}
|
|
|
|
if (auto *F = dyn_cast<ObjFile>(File)) {
|
|
ObjFile::Instances.push_back(F);
|
|
} else if (auto *F = dyn_cast<BitcodeFile>(File)) {
|
|
BitcodeFile::Instances.push_back(F);
|
|
} else if (auto *F = dyn_cast<ImportFile>(File)) {
|
|
ImportFile::Instances.push_back(F);
|
|
}
|
|
|
|
StringRef S = File->getDirectives();
|
|
if (S.empty())
|
|
return;
|
|
|
|
log("Directives: " + toString(File) + ": " + S);
|
|
Driver->parseDirectives(S);
|
|
}
|
|
|
|
static void errorOrWarn(const Twine &S) {
|
|
if (Config->ForceUnresolved)
|
|
warn(S);
|
|
else
|
|
error(S);
|
|
}
|
|
|
|
// Returns the symbol in SC whose value is <= Addr that is closest to Addr.
|
|
// This is generally the global variable or function whose definition contains
|
|
// Addr.
|
|
static Symbol *getSymbol(SectionChunk *SC, uint32_t Addr) {
|
|
DefinedRegular *Candidate = nullptr;
|
|
|
|
for (Symbol *S : SC->File->getSymbols()) {
|
|
auto *D = dyn_cast_or_null<DefinedRegular>(S);
|
|
if (!D || D->getChunk() != SC || D->getValue() > Addr ||
|
|
(Candidate && D->getValue() < Candidate->getValue()))
|
|
continue;
|
|
|
|
Candidate = D;
|
|
}
|
|
|
|
return Candidate;
|
|
}
|
|
|
|
std::string getSymbolLocations(ObjFile *File, uint32_t SymIndex) {
|
|
struct Location {
|
|
Symbol *Sym;
|
|
std::pair<StringRef, uint32_t> FileLine;
|
|
};
|
|
std::vector<Location> Locations;
|
|
|
|
for (Chunk *C : File->getChunks()) {
|
|
auto *SC = dyn_cast<SectionChunk>(C);
|
|
if (!SC)
|
|
continue;
|
|
for (const coff_relocation &R : SC->Relocs) {
|
|
if (R.SymbolTableIndex != SymIndex)
|
|
continue;
|
|
std::pair<StringRef, uint32_t> FileLine =
|
|
getFileLine(SC, R.VirtualAddress);
|
|
Symbol *Sym = getSymbol(SC, R.VirtualAddress);
|
|
if (!FileLine.first.empty() || Sym)
|
|
Locations.push_back({Sym, FileLine});
|
|
}
|
|
}
|
|
|
|
if (Locations.empty())
|
|
return "\n>>> referenced by " + toString(File);
|
|
|
|
std::string Out;
|
|
llvm::raw_string_ostream OS(Out);
|
|
for (Location Loc : Locations) {
|
|
OS << "\n>>> referenced by ";
|
|
if (!Loc.FileLine.first.empty())
|
|
OS << Loc.FileLine.first << ":" << Loc.FileLine.second
|
|
<< "\n>>> ";
|
|
OS << toString(File);
|
|
if (Loc.Sym)
|
|
OS << ":(" << toString(*Loc.Sym) << ')';
|
|
}
|
|
return OS.str();
|
|
}
|
|
|
|
void SymbolTable::loadMinGWAutomaticImports() {
|
|
for (auto &I : SymMap) {
|
|
Symbol *Sym = I.second;
|
|
auto *Undef = dyn_cast<Undefined>(Sym);
|
|
if (!Undef)
|
|
continue;
|
|
if (!Sym->IsUsedInRegularObj)
|
|
continue;
|
|
|
|
StringRef Name = Undef->getName();
|
|
|
|
if (Name.startswith("__imp_"))
|
|
continue;
|
|
// If we have an undefined symbol, but we have a Lazy representing a
|
|
// symbol we could load from file, make sure to load that.
|
|
Lazy *L = dyn_cast_or_null<Lazy>(find(("__imp_" + Name).str()));
|
|
if (!L || L->PendingArchiveLoad)
|
|
continue;
|
|
|
|
log("Loading lazy " + L->getName() + " from " + L->File->getName() +
|
|
" for automatic import");
|
|
L->PendingArchiveLoad = true;
|
|
L->File->addMember(&L->Sym);
|
|
}
|
|
}
|
|
|
|
bool SymbolTable::handleMinGWAutomaticImport(Symbol *Sym, StringRef Name) {
|
|
if (Name.startswith("__imp_"))
|
|
return false;
|
|
Defined *Imp = dyn_cast_or_null<Defined>(find(("__imp_" + Name).str()));
|
|
if (!Imp)
|
|
return false;
|
|
|
|
// Replace the reference directly to a variable with a reference
|
|
// to the import address table instead. This obviously isn't right,
|
|
// but we mark the symbol as IsRuntimePseudoReloc, and a later pass
|
|
// will add runtime pseudo relocations for every relocation against
|
|
// this Symbol. The runtime pseudo relocation framework expects the
|
|
// reference itself to point at the IAT entry.
|
|
size_t ImpSize = 0;
|
|
if (isa<DefinedImportData>(Imp)) {
|
|
log("Automatically importing " + Name + " from " +
|
|
cast<DefinedImportData>(Imp)->getDLLName());
|
|
ImpSize = sizeof(DefinedImportData);
|
|
} else if (isa<DefinedRegular>(Imp)) {
|
|
log("Automatically importing " + Name + " from " +
|
|
toString(cast<DefinedRegular>(Imp)->File));
|
|
ImpSize = sizeof(DefinedRegular);
|
|
} else {
|
|
warn("unable to automatically import " + Name + " from " + Imp->getName() +
|
|
" from " + toString(cast<DefinedRegular>(Imp)->File) +
|
|
"; unexpected symbol type");
|
|
return false;
|
|
}
|
|
Sym->replaceKeepingName(Imp, ImpSize);
|
|
Sym->IsRuntimePseudoReloc = true;
|
|
|
|
// There may exist symbols named .refptr.<name> which only consist
|
|
// of a single pointer to <name>. If it turns out <name> is
|
|
// automatically imported, we don't need to keep the .refptr.<name>
|
|
// pointer at all, but redirect all accesses to it to the IAT entry
|
|
// for __imp_<name> instead, and drop the whole .refptr.<name> chunk.
|
|
DefinedRegular *Refptr =
|
|
dyn_cast_or_null<DefinedRegular>(find((".refptr." + Name).str()));
|
|
if (Refptr && Refptr->getChunk()->getSize() == Config->Wordsize) {
|
|
SectionChunk *SC = dyn_cast_or_null<SectionChunk>(Refptr->getChunk());
|
|
if (SC && SC->Relocs.size() == 1 && *SC->symbols().begin() == Sym) {
|
|
log("Replacing .refptr." + Name + " with " + Imp->getName());
|
|
Refptr->getChunk()->Live = false;
|
|
Refptr->replaceKeepingName(Imp, ImpSize);
|
|
}
|
|
}
|
|
return true;
|
|
}
|
|
|
|
void SymbolTable::reportRemainingUndefines() {
|
|
SmallPtrSet<Symbol *, 8> Undefs;
|
|
DenseMap<Symbol *, Symbol *> LocalImports;
|
|
|
|
for (auto &I : SymMap) {
|
|
Symbol *Sym = I.second;
|
|
auto *Undef = dyn_cast<Undefined>(Sym);
|
|
if (!Undef)
|
|
continue;
|
|
if (!Sym->IsUsedInRegularObj)
|
|
continue;
|
|
|
|
StringRef Name = Undef->getName();
|
|
|
|
// A weak alias may have been resolved, so check for that.
|
|
if (Defined *D = Undef->getWeakAlias()) {
|
|
// We want to replace Sym with D. However, we can't just blindly
|
|
// copy sizeof(SymbolUnion) bytes from D to Sym because D may be an
|
|
// internal symbol, and internal symbols are stored as "unparented"
|
|
// Symbols. For that reason we need to check which type of symbol we
|
|
// are dealing with and copy the correct number of bytes.
|
|
if (isa<DefinedRegular>(D))
|
|
memcpy(Sym, D, sizeof(DefinedRegular));
|
|
else if (isa<DefinedAbsolute>(D))
|
|
memcpy(Sym, D, sizeof(DefinedAbsolute));
|
|
else
|
|
memcpy(Sym, D, sizeof(SymbolUnion));
|
|
continue;
|
|
}
|
|
|
|
// If we can resolve a symbol by removing __imp_ prefix, do that.
|
|
// This odd rule is for compatibility with MSVC linker.
|
|
if (Name.startswith("__imp_")) {
|
|
Symbol *Imp = find(Name.substr(strlen("__imp_")));
|
|
if (Imp && isa<Defined>(Imp)) {
|
|
auto *D = cast<Defined>(Imp);
|
|
replaceSymbol<DefinedLocalImport>(Sym, Name, D);
|
|
LocalImportChunks.push_back(cast<DefinedLocalImport>(Sym)->getChunk());
|
|
LocalImports[Sym] = D;
|
|
continue;
|
|
}
|
|
}
|
|
|
|
// We don't want to report missing Microsoft precompiled headers symbols.
|
|
// A proper message will be emitted instead in PDBLinker::aquirePrecompObj
|
|
if (Name.contains("_PchSym_"))
|
|
continue;
|
|
|
|
if (Config->MinGW && handleMinGWAutomaticImport(Sym, Name))
|
|
continue;
|
|
|
|
// Remaining undefined symbols are not fatal if /force is specified.
|
|
// They are replaced with dummy defined symbols.
|
|
if (Config->ForceUnresolved)
|
|
replaceSymbol<DefinedAbsolute>(Sym, Name, 0);
|
|
Undefs.insert(Sym);
|
|
}
|
|
|
|
if (Undefs.empty() && LocalImports.empty())
|
|
return;
|
|
|
|
for (Symbol *B : Config->GCRoot) {
|
|
if (Undefs.count(B))
|
|
errorOrWarn("<root>: undefined symbol: " + toString(*B));
|
|
if (Config->WarnLocallyDefinedImported)
|
|
if (Symbol *Imp = LocalImports.lookup(B))
|
|
warn("<root>: locally defined symbol imported: " + toString(*Imp) +
|
|
" (defined in " + toString(Imp->getFile()) + ") [LNK4217]");
|
|
}
|
|
|
|
for (ObjFile *File : ObjFile::Instances) {
|
|
size_t SymIndex = (size_t)-1;
|
|
for (Symbol *Sym : File->getSymbols()) {
|
|
++SymIndex;
|
|
if (!Sym)
|
|
continue;
|
|
if (Undefs.count(Sym))
|
|
errorOrWarn("undefined symbol: " + toString(*Sym) +
|
|
getSymbolLocations(File, SymIndex));
|
|
if (Config->WarnLocallyDefinedImported)
|
|
if (Symbol *Imp = LocalImports.lookup(Sym))
|
|
warn(toString(File) +
|
|
": locally defined symbol imported: " + toString(*Imp) +
|
|
" (defined in " + toString(Imp->getFile()) + ") [LNK4217]");
|
|
}
|
|
}
|
|
}
|
|
|
|
std::pair<Symbol *, bool> SymbolTable::insert(StringRef Name) {
|
|
bool Inserted = false;
|
|
Symbol *&Sym = SymMap[CachedHashStringRef(Name)];
|
|
if (!Sym) {
|
|
Sym = reinterpret_cast<Symbol *>(make<SymbolUnion>());
|
|
Sym->IsUsedInRegularObj = false;
|
|
Sym->PendingArchiveLoad = false;
|
|
Inserted = true;
|
|
}
|
|
return {Sym, Inserted};
|
|
}
|
|
|
|
std::pair<Symbol *, bool> SymbolTable::insert(StringRef Name, InputFile *File) {
|
|
std::pair<Symbol *, bool> Result = insert(Name);
|
|
if (!File || !isa<BitcodeFile>(File))
|
|
Result.first->IsUsedInRegularObj = true;
|
|
return Result;
|
|
}
|
|
|
|
Symbol *SymbolTable::addUndefined(StringRef Name, InputFile *F,
|
|
bool IsWeakAlias) {
|
|
Symbol *S;
|
|
bool WasInserted;
|
|
std::tie(S, WasInserted) = insert(Name, F);
|
|
if (WasInserted || (isa<Lazy>(S) && IsWeakAlias)) {
|
|
replaceSymbol<Undefined>(S, Name);
|
|
return S;
|
|
}
|
|
if (auto *L = dyn_cast<Lazy>(S)) {
|
|
if (!S->PendingArchiveLoad) {
|
|
S->PendingArchiveLoad = true;
|
|
L->File->addMember(&L->Sym);
|
|
}
|
|
}
|
|
return S;
|
|
}
|
|
|
|
void SymbolTable::addLazy(ArchiveFile *F, const Archive::Symbol Sym) {
|
|
StringRef Name = Sym.getName();
|
|
Symbol *S;
|
|
bool WasInserted;
|
|
std::tie(S, WasInserted) = insert(Name);
|
|
if (WasInserted) {
|
|
replaceSymbol<Lazy>(S, F, Sym);
|
|
return;
|
|
}
|
|
auto *U = dyn_cast<Undefined>(S);
|
|
if (!U || U->WeakAlias || S->PendingArchiveLoad)
|
|
return;
|
|
S->PendingArchiveLoad = true;
|
|
F->addMember(&Sym);
|
|
}
|
|
|
|
void SymbolTable::reportDuplicate(Symbol *Existing, InputFile *NewFile) {
|
|
std::string Msg = "duplicate symbol: " + toString(*Existing) + " in " +
|
|
toString(Existing->getFile()) + " and in " +
|
|
toString(NewFile);
|
|
|
|
if (Config->ForceMultiple)
|
|
warn(Msg);
|
|
else
|
|
error(Msg);
|
|
}
|
|
|
|
Symbol *SymbolTable::addAbsolute(StringRef N, COFFSymbolRef Sym) {
|
|
Symbol *S;
|
|
bool WasInserted;
|
|
std::tie(S, WasInserted) = insert(N, nullptr);
|
|
S->IsUsedInRegularObj = true;
|
|
if (WasInserted || isa<Undefined>(S) || isa<Lazy>(S))
|
|
replaceSymbol<DefinedAbsolute>(S, N, Sym);
|
|
else if (!isa<DefinedCOFF>(S))
|
|
reportDuplicate(S, nullptr);
|
|
return S;
|
|
}
|
|
|
|
Symbol *SymbolTable::addAbsolute(StringRef N, uint64_t VA) {
|
|
Symbol *S;
|
|
bool WasInserted;
|
|
std::tie(S, WasInserted) = insert(N, nullptr);
|
|
S->IsUsedInRegularObj = true;
|
|
if (WasInserted || isa<Undefined>(S) || isa<Lazy>(S))
|
|
replaceSymbol<DefinedAbsolute>(S, N, VA);
|
|
else if (!isa<DefinedCOFF>(S))
|
|
reportDuplicate(S, nullptr);
|
|
return S;
|
|
}
|
|
|
|
Symbol *SymbolTable::addSynthetic(StringRef N, Chunk *C) {
|
|
Symbol *S;
|
|
bool WasInserted;
|
|
std::tie(S, WasInserted) = insert(N, nullptr);
|
|
S->IsUsedInRegularObj = true;
|
|
if (WasInserted || isa<Undefined>(S) || isa<Lazy>(S))
|
|
replaceSymbol<DefinedSynthetic>(S, N, C);
|
|
else if (!isa<DefinedCOFF>(S))
|
|
reportDuplicate(S, nullptr);
|
|
return S;
|
|
}
|
|
|
|
Symbol *SymbolTable::addRegular(InputFile *F, StringRef N,
|
|
const coff_symbol_generic *Sym,
|
|
SectionChunk *C) {
|
|
Symbol *S;
|
|
bool WasInserted;
|
|
std::tie(S, WasInserted) = insert(N, F);
|
|
if (WasInserted || !isa<DefinedRegular>(S))
|
|
replaceSymbol<DefinedRegular>(S, F, N, /*IsCOMDAT*/ false,
|
|
/*IsExternal*/ true, Sym, C);
|
|
else
|
|
reportDuplicate(S, F);
|
|
return S;
|
|
}
|
|
|
|
std::pair<Symbol *, bool>
|
|
SymbolTable::addComdat(InputFile *F, StringRef N,
|
|
const coff_symbol_generic *Sym) {
|
|
Symbol *S;
|
|
bool WasInserted;
|
|
std::tie(S, WasInserted) = insert(N, F);
|
|
if (WasInserted || !isa<DefinedRegular>(S)) {
|
|
replaceSymbol<DefinedRegular>(S, F, N, /*IsCOMDAT*/ true,
|
|
/*IsExternal*/ true, Sym, nullptr);
|
|
return {S, true};
|
|
}
|
|
if (!cast<DefinedRegular>(S)->isCOMDAT())
|
|
reportDuplicate(S, F);
|
|
return {S, false};
|
|
}
|
|
|
|
Symbol *SymbolTable::addCommon(InputFile *F, StringRef N, uint64_t Size,
|
|
const coff_symbol_generic *Sym, CommonChunk *C) {
|
|
Symbol *S;
|
|
bool WasInserted;
|
|
std::tie(S, WasInserted) = insert(N, F);
|
|
if (WasInserted || !isa<DefinedCOFF>(S))
|
|
replaceSymbol<DefinedCommon>(S, F, N, Size, Sym, C);
|
|
else if (auto *DC = dyn_cast<DefinedCommon>(S))
|
|
if (Size > DC->getSize())
|
|
replaceSymbol<DefinedCommon>(S, F, N, Size, Sym, C);
|
|
return S;
|
|
}
|
|
|
|
Symbol *SymbolTable::addImportData(StringRef N, ImportFile *F) {
|
|
Symbol *S;
|
|
bool WasInserted;
|
|
std::tie(S, WasInserted) = insert(N, nullptr);
|
|
S->IsUsedInRegularObj = true;
|
|
if (WasInserted || isa<Undefined>(S) || isa<Lazy>(S)) {
|
|
replaceSymbol<DefinedImportData>(S, N, F);
|
|
return S;
|
|
}
|
|
|
|
reportDuplicate(S, F);
|
|
return nullptr;
|
|
}
|
|
|
|
Symbol *SymbolTable::addImportThunk(StringRef Name, DefinedImportData *ID,
|
|
uint16_t Machine) {
|
|
Symbol *S;
|
|
bool WasInserted;
|
|
std::tie(S, WasInserted) = insert(Name, nullptr);
|
|
S->IsUsedInRegularObj = true;
|
|
if (WasInserted || isa<Undefined>(S) || isa<Lazy>(S)) {
|
|
replaceSymbol<DefinedImportThunk>(S, Name, ID, Machine);
|
|
return S;
|
|
}
|
|
|
|
reportDuplicate(S, ID->File);
|
|
return nullptr;
|
|
}
|
|
|
|
std::vector<Chunk *> SymbolTable::getChunks() {
|
|
std::vector<Chunk *> Res;
|
|
for (ObjFile *File : ObjFile::Instances) {
|
|
ArrayRef<Chunk *> V = File->getChunks();
|
|
Res.insert(Res.end(), V.begin(), V.end());
|
|
}
|
|
return Res;
|
|
}
|
|
|
|
Symbol *SymbolTable::find(StringRef Name) {
|
|
return SymMap.lookup(CachedHashStringRef(Name));
|
|
}
|
|
|
|
Symbol *SymbolTable::findUnderscore(StringRef Name) {
|
|
if (Config->Machine == I386)
|
|
return find(("_" + Name).str());
|
|
return find(Name);
|
|
}
|
|
|
|
StringRef SymbolTable::findByPrefix(StringRef Prefix) {
|
|
for (auto Pair : SymMap) {
|
|
StringRef Name = Pair.first.val();
|
|
if (Name.startswith(Prefix))
|
|
return Name;
|
|
}
|
|
return "";
|
|
}
|
|
|
|
StringRef SymbolTable::findMangle(StringRef Name) {
|
|
if (Symbol *Sym = find(Name))
|
|
if (!isa<Undefined>(Sym))
|
|
return Name;
|
|
if (Config->Machine != I386)
|
|
return findByPrefix(("?" + Name + "@@Y").str());
|
|
if (!Name.startswith("_"))
|
|
return "";
|
|
// Search for x86 stdcall function.
|
|
StringRef S = findByPrefix((Name + "@").str());
|
|
if (!S.empty())
|
|
return S;
|
|
// Search for x86 fastcall function.
|
|
S = findByPrefix(("@" + Name.substr(1) + "@").str());
|
|
if (!S.empty())
|
|
return S;
|
|
// Search for x86 vectorcall function.
|
|
S = findByPrefix((Name.substr(1) + "@@").str());
|
|
if (!S.empty())
|
|
return S;
|
|
// Search for x86 C++ non-member function.
|
|
return findByPrefix(("?" + Name.substr(1) + "@@Y").str());
|
|
}
|
|
|
|
void SymbolTable::mangleMaybe(Symbol *B) {
|
|
auto *U = dyn_cast<Undefined>(B);
|
|
if (!U || U->WeakAlias)
|
|
return;
|
|
StringRef Alias = findMangle(U->getName());
|
|
if (!Alias.empty()) {
|
|
log(U->getName() + " aliased to " + Alias);
|
|
U->WeakAlias = addUndefined(Alias);
|
|
}
|
|
}
|
|
|
|
Symbol *SymbolTable::addUndefined(StringRef Name) {
|
|
return addUndefined(Name, nullptr, false);
|
|
}
|
|
|
|
std::vector<StringRef> SymbolTable::compileBitcodeFiles() {
|
|
LTO.reset(new BitcodeCompiler);
|
|
for (BitcodeFile *F : BitcodeFile::Instances)
|
|
LTO->add(*F);
|
|
return LTO->compile();
|
|
}
|
|
|
|
void SymbolTable::addCombinedLTOObjects() {
|
|
if (BitcodeFile::Instances.empty())
|
|
return;
|
|
|
|
ScopedTimer T(LTOTimer);
|
|
for (StringRef Object : compileBitcodeFiles()) {
|
|
auto *Obj = make<ObjFile>(MemoryBufferRef(Object, "lto.tmp"));
|
|
Obj->parse();
|
|
ObjFile::Instances.push_back(Obj);
|
|
}
|
|
}
|
|
|
|
} // namespace coff
|
|
} // namespace lld
|