mirror of
https://github.com/RPCS3/llvm.git
synced 2025-01-10 14:12:11 +00:00
c39f5dd0e2
Fixes PR19582.

Previously, when an asm assignment (.set or =) was created, we would look up the section immediately in MCSymbol::setVariableValue. This caused symbols to receive the wrong section if the RHS of the assignment had not been seen yet. This had a knock-on effect in the object file emitters, causing them to emit extra symbols, or to give symbols the wrong visibility or the wrong section. For example, in the following asm:

    .data
    .Llocal:

    .text
    leaq .Llocal1(%rip), %rdi
    .Llocal1 = .Llocal2
    .Llocal2 = .Llocal

the first assignment would give .Llocal1 a null section, which would never get fixed up by the second assignment. This would cause the ELF object file emitter to consider .Llocal1 to be an undefined symbol and give it external linkage, even though .Llocal1 should not have been emitted at all in the object file.

Or in the following asm:

    alias_to_local = Ltmp0
    Ltmp0:

the Mach-O object file emitter would give the alias_to_local symbol a n_type of N_SECT and a n_sect of 0. This is invalid under the Mach-O specification, which requires N_SECT symbols to receive a non-zero section number if the symbol is defined in a section in the object file. https://developer.apple.com/library/mac/documentation/DeveloperTools/Conceptual/MachORuntime/#//apple_ref/c/tag/nlist

After this change we do not look up the section when the assignment is created, but instead look it up on demand and store it in Section, which is treated as a cache if the symbol is a variable symbol.

This change also fixes a bug in MCExpr::FindAssociatedSection. Previously, if we saw a subtraction, we would return the first referenced section, even in cases where we should have been returning the absolute pseudo-section. Now we always return the absolute pseudo-section for expressions that subtract two section-derived expressions. This isn't always correct (e.g. if one of the sections ends up being laid out at an absolute address), but it's probably the best we can do without more context.
This allows us to remove code in two places where we appear to have been working around this bug, in MachObjectWriter::markAbsoluteVariableSymbols and in X86AsmPrinter::EmitStartOfAsmFile. Re-applies r233595 (aka D8586), which was reverted in r233898. Differential Revision: http://reviews.llvm.org/D8798 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@233995 91177308-0d34-0410-b5e6-96231b3b80d8
89 lines
2.5 KiB
C++
89 lines
2.5 KiB
C++
//===- lib/MC/MCSymbol.cpp - MCSymbol implementation ----------------------===//
|
|
//
|
|
// The LLVM Compiler Infrastructure
|
|
//
|
|
// This file is distributed under the University of Illinois Open Source
|
|
// License. See LICENSE.TXT for details.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "llvm/MC/MCSymbol.h"
|
|
#include "llvm/MC/MCExpr.h"
|
|
#include "llvm/Support/Debug.h"
|
|
#include "llvm/Support/raw_ostream.h"
|
|
using namespace llvm;
|
|
|
|
// Sentinel value for the absolute pseudo section.
|
|
const MCSection *MCSymbol::AbsolutePseudoSection =
|
|
reinterpret_cast<const MCSection *>(1);
|
|
|
|
/// isAcceptableChar - Return true if \p C is an ASCII letter, an ASCII digit,
/// or one of the punctuation characters '_', '$', '.' and '@'.
static bool isAcceptableChar(char C) {
  const bool IsLowerAlpha = C >= 'a' && C <= 'z';
  const bool IsUpperAlpha = C >= 'A' && C <= 'Z';
  const bool IsDecimalDigit = C >= '0' && C <= '9';
  if (IsLowerAlpha || IsUpperAlpha || IsDecimalDigit)
    return true;

  // Remaining accepted characters are a small fixed set of punctuation.
  switch (C) {
  case '_':
  case '$':
  case '.':
  case '@':
    return true;
  default:
    return false;
  }
}
|
|
|
|
/// NameNeedsQuoting - Return true if the identifier \p Str needs quotes to be
|
|
/// syntactically correct.
|
|
static bool NameNeedsQuoting(StringRef Str) {
|
|
assert(!Str.empty() && "Cannot create an empty MCSymbol");
|
|
|
|
// If any of the characters in the string is an unacceptable character, force
|
|
// quotes.
|
|
for (unsigned i = 0, e = Str.size(); i != e; ++i)
|
|
if (!isAcceptableChar(Str[i]))
|
|
return true;
|
|
return false;
|
|
}
|
|
|
|
/// Walk a chain of variable symbols whose values are plain symbol references
/// and return the symbol the chain ends at: the first symbol that either is
/// not a variable or whose value is some other kind of expression.
const MCSymbol &MCSymbol::AliasedSymbol() const {
  const MCSymbol *Current = this;
  for (;;) {
    // A non-variable symbol has no value to follow.
    if (!Current->isVariable())
      break;

    // Only a direct symbol reference counts as an alias; any other
    // expression kind ends the walk at the current symbol.
    const MCExpr *Expr = Current->getVariableValue();
    if (Expr->getKind() != MCExpr::SymbolRef)
      break;

    Current = &static_cast<const MCSymbolRefExpr *>(Expr)->getSymbol();
  }
  return *Current;
}
|
|
|
|
void MCSymbol::setVariableValue(const MCExpr *Value) {
|
|
assert(!IsUsed && "Cannot set a variable that has already been used.");
|
|
assert(Value && "Invalid variable value!");
|
|
this->Value = Value;
|
|
this->Section = nullptr;
|
|
}
|
|
|
|
/// Write this symbol's name to \p OS.
///
/// The name is emitted verbatim unless NameNeedsQuoting says it contains a
/// character that requires quoting. In that case it is wrapped in double
/// quotes, with newlines written as \n and embedded double quotes
/// backslash-escaped.
void MCSymbol::print(raw_ostream &OS) const {
  StringRef SymName = getName();

  // Fast path: nothing unusual in the name, so print it as-is.
  if (!NameNeedsQuoting(SymName)) {
    OS << SymName;
    return;
  }

  OS << '"';
  for (char Ch : SymName) {
    switch (Ch) {
    case '\n':
      OS << "\\n";
      break;
    case '"':
      OS << "\\\"";
      break;
    default:
      OS << Ch;
      break;
    }
  }
  OS << '"';
}
|
|
|
|
#if !defined(NDEBUG) || defined(LLVM_ENABLE_DUMP)
|
|
void MCSymbol::dump() const {
|
|
print(dbgs());
|
|
}
|
|
#endif
|