//===-- AsmWriter.cpp - Printing LLVM as an assembly file -----------------===// // // The LLVM Compiler Infrastructure // // This file is distributed under the University of Illinois Open Source // License. See LICENSE.TXT for details. // //===----------------------------------------------------------------------===// // // This library implements the functionality defined in llvm/Assembly/Writer.h // // Note that these routines must be extremely tolerant of various errors in the // LLVM code, because it can be used for debugging transformations. // //===----------------------------------------------------------------------===// #include "llvm/Assembly/Writer.h" #include "llvm/Assembly/PrintModulePass.h" #include "llvm/Assembly/AsmAnnotationWriter.h" #include "llvm/CallingConv.h" #include "llvm/Constants.h" #include "llvm/DerivedTypes.h" #include "llvm/InlineAsm.h" #include "llvm/Instruction.h" #include "llvm/Instructions.h" #include "llvm/Module.h" #include "llvm/ValueSymbolTable.h" #include "llvm/TypeSymbolTable.h" #include "llvm/ADT/StringExtras.h" #include "llvm/ADT/STLExtras.h" #include "llvm/Support/CFG.h" #include "llvm/Support/MathExtras.h" #include "llvm/Support/Streams.h" #include "llvm/Support/raw_ostream.h" #include #include using namespace llvm; namespace llvm { // Make virtual table appear in this compilation unit. AssemblyAnnotationWriter::~AssemblyAnnotationWriter() {} /// This class provides computation of slot numbers for LLVM Assembly writing. /// class SlotMachine { public: /// ValueMap - A mapping of Values to slot numbers typedef std::map ValueMap; private: /// TheModule - The module for which we are holding slot numbers const Module* TheModule; /// TheFunction - The function for which we are holding slot numbers const Function* TheFunction; bool FunctionProcessed; /// mMap - The TypePlanes map for the module level data ValueMap mMap; unsigned mNext; /// fMap - The TypePlanes map for the function level data ValueMap fMap; unsigned fNext; public: /// Construct from a module explicit SlotMachine(const Module *M); /// Construct from a function, starting out in incorp state. explicit SlotMachine(const Function *F); /// Return the slot number of the specified value in it's type /// plane. If something is not in the SlotMachine, return -1. int getLocalSlot(const Value *V); int getGlobalSlot(const GlobalValue *V); /// If you'd like to deal with a function instead of just a module, use /// this method to get its data into the SlotMachine. void incorporateFunction(const Function *F) { TheFunction = F; FunctionProcessed = false; } /// After calling incorporateFunction, use this method to remove the /// most recently incorporated function from the SlotMachine. This /// will reset the state of the machine back to just the module contents. void purgeFunction(); // Implementation Details private: /// This function does the actual initialization. inline void initialize(); /// CreateModuleSlot - Insert the specified GlobalValue* into the slot table. void CreateModuleSlot(const GlobalValue *V); /// CreateFunctionSlot - Insert the specified Value* into the slot table. void CreateFunctionSlot(const Value *V); /// Add all of the module level global variables (and their initializers) /// and function declarations, but not the contents of those functions. void processModule(); /// Add all of the functions arguments, basic blocks, and instructions void processFunction(); SlotMachine(const SlotMachine &); // DO NOT IMPLEMENT void operator=(const SlotMachine &); // DO NOT IMPLEMENT }; } // end namespace llvm char PrintModulePass::ID = 0; static RegisterPass X("printm", "Print module to stderr"); char PrintFunctionPass::ID = 0; static RegisterPass Y("print","Print function to stderr"); static void WriteAsOperandInternal(std::ostream &Out, const Value *V, std::map &TypeTable, SlotMachine *Machine); static const Module *getModuleFromVal(const Value *V) { if (const Argument *MA = dyn_cast(V)) return MA->getParent() ? MA->getParent()->getParent() : 0; else if (const BasicBlock *BB = dyn_cast(V)) return BB->getParent() ? BB->getParent()->getParent() : 0; else if (const Instruction *I = dyn_cast(V)) { const Function *M = I->getParent() ? I->getParent()->getParent() : 0; return M ? M->getParent() : 0; } else if (const GlobalValue *GV = dyn_cast(V)) return GV->getParent(); return 0; } static SlotMachine *createSlotMachine(const Value *V) { if (const Argument *FA = dyn_cast(V)) { return new SlotMachine(FA->getParent()); } else if (const Instruction *I = dyn_cast(V)) { return new SlotMachine(I->getParent()->getParent()); } else if (const BasicBlock *BB = dyn_cast(V)) { return new SlotMachine(BB->getParent()); } else if (const GlobalVariable *GV = dyn_cast(V)){ return new SlotMachine(GV->getParent()); } else if (const GlobalAlias *GA = dyn_cast(V)){ return new SlotMachine(GA->getParent()); } else if (const Function *Func = dyn_cast(V)) { return new SlotMachine(Func); } return 0; } /// NameNeedsQuotes - Return true if the specified llvm name should be wrapped /// with ""'s. static std::string QuoteNameIfNeeded(const std::string &Name) { std::string result; bool needsQuotes = Name[0] >= '0' && Name[0] <= '9'; // Scan the name to see if it needs quotes and to replace funky chars with // their octal equivalent. for (unsigned i = 0, e = Name.size(); i != e; ++i) { char C = Name[i]; assert(C != '"' && "Illegal character in LLVM value name!"); if (isalnum(C) || C == '-' || C == '.' || C == '_') result += C; else if (C == '\\') { needsQuotes = true; result += "\\\\"; } else if (isprint(C)) { needsQuotes = true; result += C; } else { needsQuotes = true; result += "\\"; char hex1 = (C >> 4) & 0x0F; if (hex1 < 10) result += hex1 + '0'; else result += hex1 - 10 + 'A'; char hex2 = C & 0x0F; if (hex2 < 10) result += hex2 + '0'; else result += hex2 - 10 + 'A'; } } if (needsQuotes) { result.insert(0,"\""); result += '"'; } return result; } enum PrefixType { GlobalPrefix, LabelPrefix, LocalPrefix }; /// getLLVMName - Turn the specified string into an 'LLVM name', which is either /// prefixed with % (if the string only contains simple characters) or is /// surrounded with ""'s (if it has special chars in it). static std::string getLLVMName(const std::string &Name, PrefixType Prefix) { assert(!Name.empty() && "Cannot get empty name!"); switch (Prefix) { default: assert(0 && "Bad prefix!"); case GlobalPrefix: return '@' + QuoteNameIfNeeded(Name); case LabelPrefix: return QuoteNameIfNeeded(Name); case LocalPrefix: return '%' + QuoteNameIfNeeded(Name); } } /// PrintLLVMName - Turn the specified name into an 'LLVM name', which is either /// prefixed with % (if the string only contains simple characters) or is /// surrounded with ""'s (if it has special chars in it). Print it out. static void PrintLLVMName(std::ostream &OS, const ValueName *Name, PrefixType Prefix) { assert(Name && "Cannot get empty name!"); switch (Prefix) { default: assert(0 && "Bad prefix!"); case GlobalPrefix: OS << '@'; break; case LabelPrefix: break; case LocalPrefix: OS << '%'; break; } // Scan the name to see if it needs quotes first. const char *NameStr = Name->getKeyData(); unsigned NameLen = Name->getKeyLength(); bool NeedsQuotes = NameStr[0] >= '0' && NameStr[0] <= '9'; if (!NeedsQuotes) { for (unsigned i = 0; i != NameLen; ++i) { char C = NameStr[i]; if (!isalnum(C) && C != '-' && C != '.' && C != '_') { NeedsQuotes = true; break; } } } // If we didn't need any quotes, just write out the name in one blast. if (!NeedsQuotes) { OS.write(NameStr, NameLen); return; } // Okay, we need quotes. Output the quotes and escape any scary characters as // needed. OS << '"'; for (unsigned i = 0; i != NameLen; ++i) { char C = NameStr[i]; assert(C != '"' && "Illegal character in LLVM value name!"); if (C == '\\') { OS << "\\\\"; } else if (isprint(C)) { OS << C; } else { OS << "\\"; char hex1 = (C >> 4) & 0x0F; if (hex1 < 10) OS << (hex1 + '0'); else OS << (hex1 - 10 + 'A'); char hex2 = C & 0x0F; if (hex2 < 10) OS << (hex2 + '0'); else OS << (hex2 - 10 + 'A'); } } OS << '"'; } static void PrintLLVMName(std::ostream &OS, const Value *V) { PrintLLVMName(OS, V->getValueName(), isa(V) ? GlobalPrefix : LocalPrefix); } /// fillTypeNameTable - If the module has a symbol table, take all global types /// and stuff their names into the TypeNames map. /// static void fillTypeNameTable(const Module *M, std::map &TypeNames) { if (!M) return; const TypeSymbolTable &ST = M->getTypeSymbolTable(); TypeSymbolTable::const_iterator TI = ST.begin(); for (; TI != ST.end(); ++TI) { // As a heuristic, don't insert pointer to primitive types, because // they are used too often to have a single useful name. // const Type *Ty = cast(TI->second); if (!isa(Ty) || !cast(Ty)->getElementType()->isPrimitiveType() || !cast(Ty)->getElementType()->isInteger() || isa(cast(Ty)->getElementType())) TypeNames.insert(std::make_pair(Ty, getLLVMName(TI->first, LocalPrefix))); } } static void calcTypeName(const Type *Ty, std::vector &TypeStack, std::map &TypeNames, std::string & Result){ if (Ty->isInteger() || (Ty->isPrimitiveType() && !isa(Ty))) { Result += Ty->getDescription(); // Base case return; } // Check to see if the type is named. std::map::iterator I = TypeNames.find(Ty); if (I != TypeNames.end()) { Result += I->second; return; } if (isa(Ty)) { Result += "opaque"; return; } // Check to see if the Type is already on the stack... unsigned Slot = 0, CurSize = TypeStack.size(); while (Slot < CurSize && TypeStack[Slot] != Ty) ++Slot; // Scan for type // This is another base case for the recursion. In this case, we know // that we have looped back to a type that we have previously visited. // Generate the appropriate upreference to handle this. if (Slot < CurSize) { Result += "\\" + utostr(CurSize-Slot); // Here's the upreference return; } TypeStack.push_back(Ty); // Recursive case: Add us to the stack.. switch (Ty->getTypeID()) { case Type::IntegerTyID: { unsigned BitWidth = cast(Ty)->getBitWidth(); Result += "i" + utostr(BitWidth); break; } case Type::FunctionTyID: { const FunctionType *FTy = cast(Ty); calcTypeName(FTy->getReturnType(), TypeStack, TypeNames, Result); Result += " ("; for (FunctionType::param_iterator I = FTy->param_begin(), E = FTy->param_end(); I != E; ++I) { if (I != FTy->param_begin()) Result += ", "; calcTypeName(*I, TypeStack, TypeNames, Result); } if (FTy->isVarArg()) { if (FTy->getNumParams()) Result += ", "; Result += "..."; } Result += ")"; break; } case Type::StructTyID: { const StructType *STy = cast(Ty); if (STy->isPacked()) Result += '<'; Result += "{ "; for (StructType::element_iterator I = STy->element_begin(), E = STy->element_end(); I != E; ++I) { if (I != STy->element_begin()) Result += ", "; calcTypeName(*I, TypeStack, TypeNames, Result); } Result += " }"; if (STy->isPacked()) Result += '>'; break; } case Type::PointerTyID: { const PointerType *PTy = cast(Ty); calcTypeName(PTy->getElementType(), TypeStack, TypeNames, Result); if (unsigned AddressSpace = PTy->getAddressSpace()) Result += " addrspace(" + utostr(AddressSpace) + ")"; Result += "*"; break; } case Type::ArrayTyID: { const ArrayType *ATy = cast(Ty); Result += "[" + utostr(ATy->getNumElements()) + " x "; calcTypeName(ATy->getElementType(), TypeStack, TypeNames, Result); Result += "]"; break; } case Type::VectorTyID: { const VectorType *PTy = cast(Ty); Result += "<" + utostr(PTy->getNumElements()) + " x "; calcTypeName(PTy->getElementType(), TypeStack, TypeNames, Result); Result += ">"; break; } case Type::OpaqueTyID: Result += "opaque"; break; default: Result += ""; break; } TypeStack.pop_back(); // Remove self from stack... } /// printTypeInt - The internal guts of printing out a type that has a /// potentially named portion. /// static std::ostream &printTypeInt(std::ostream &Out, const Type *Ty, std::map &TypeNames) { // Primitive types always print out their description, regardless of whether // they have been named or not. // if (Ty->isInteger() || (Ty->isPrimitiveType() && !isa(Ty))) return Out << Ty->getDescription(); // Check to see if the type is named. std::map::iterator I = TypeNames.find(Ty); if (I != TypeNames.end()) return Out << I->second; // Otherwise we have a type that has not been named but is a derived type. // Carefully recurse the type hierarchy to print out any contained symbolic // names. // std::vector TypeStack; std::string TypeName; calcTypeName(Ty, TypeStack, TypeNames, TypeName); TypeNames.insert(std::make_pair(Ty, TypeName));//Cache type name for later use return (Out << TypeName); } /// WriteTypeSymbolic - This attempts to write the specified type as a symbolic /// type, iff there is an entry in the modules symbol table for the specified /// type or one of it's component types. This is slower than a simple x << Type /// std::ostream &llvm::WriteTypeSymbolic(std::ostream &Out, const Type *Ty, const Module *M) { Out << ' '; // If they want us to print out a type, but there is no context, we can't // print it symbolically. if (!M) return Out << Ty->getDescription(); std::map TypeNames; fillTypeNameTable(M, TypeNames); return printTypeInt(Out, Ty, TypeNames); } // PrintEscapedString - Print each character of the specified string, escaping // it if it is not printable or if it is an escape char. static void PrintEscapedString(const std::string &Str, std::ostream &Out) { for (unsigned i = 0, e = Str.size(); i != e; ++i) { unsigned char C = Str[i]; if (isprint(C) && C != '"' && C != '\\') { Out << C; } else { Out << '\\' << (char) ((C/16 < 10) ? ( C/16 +'0') : ( C/16 -10+'A')) << (char)(((C&15) < 10) ? ((C&15)+'0') : ((C&15)-10+'A')); } } } static const char *getPredicateText(unsigned predicate) { const char * pred = "unknown"; switch (predicate) { case FCmpInst::FCMP_FALSE: pred = "false"; break; case FCmpInst::FCMP_OEQ: pred = "oeq"; break; case FCmpInst::FCMP_OGT: pred = "ogt"; break; case FCmpInst::FCMP_OGE: pred = "oge"; break; case FCmpInst::FCMP_OLT: pred = "olt"; break; case FCmpInst::FCMP_OLE: pred = "ole"; break; case FCmpInst::FCMP_ONE: pred = "one"; break; case FCmpInst::FCMP_ORD: pred = "ord"; break; case FCmpInst::FCMP_UNO: pred = "uno"; break; case FCmpInst::FCMP_UEQ: pred = "ueq"; break; case FCmpInst::FCMP_UGT: pred = "ugt"; break; case FCmpInst::FCMP_UGE: pred = "uge"; break; case FCmpInst::FCMP_ULT: pred = "ult"; break; case FCmpInst::FCMP_ULE: pred = "ule"; break; case FCmpInst::FCMP_UNE: pred = "une"; break; case FCmpInst::FCMP_TRUE: pred = "true"; break; case ICmpInst::ICMP_EQ: pred = "eq"; break; case ICmpInst::ICMP_NE: pred = "ne"; break; case ICmpInst::ICMP_SGT: pred = "sgt"; break; case ICmpInst::ICMP_SGE: pred = "sge"; break; case ICmpInst::ICMP_SLT: pred = "slt"; break; case ICmpInst::ICMP_SLE: pred = "sle"; break; case ICmpInst::ICMP_UGT: pred = "ugt"; break; case ICmpInst::ICMP_UGE: pred = "uge"; break; case ICmpInst::ICMP_ULT: pred = "ult"; break; case ICmpInst::ICMP_ULE: pred = "ule"; break; } return pred; } static void WriteConstantInt(std::ostream &Out, const Constant *CV, std::map &TypeTable, SlotMachine *Machine) { const int IndentSize = 4; // FIXME: WHY IS INDENT STATIC?? static std::string Indent = "\n"; if (const ConstantInt *CI = dyn_cast(CV)) { if (CI->getType() == Type::Int1Ty) { Out << (CI->getZExtValue() ? "true" : "false"); return; } Out << CI->getValue(); return; } if (const ConstantFP *CFP = dyn_cast(CV)) { if (&CFP->getValueAPF().getSemantics() == &APFloat::IEEEdouble || &CFP->getValueAPF().getSemantics() == &APFloat::IEEEsingle) { // We would like to output the FP constant value in exponential notation, // but we cannot do this if doing so will lose precision. Check here to // make sure that we only output it in exponential format if we can parse // the value back and get the same value. // bool isDouble = &CFP->getValueAPF().getSemantics()==&APFloat::IEEEdouble; double Val = isDouble ? CFP->getValueAPF().convertToDouble() : CFP->getValueAPF().convertToFloat(); std::string StrVal = ftostr(CFP->getValueAPF()); // Check to make sure that the stringized number is not some string like // "Inf" or NaN, that atof will accept, but the lexer will not. Check // that the string matches the "[-+]?[0-9]" regex. // if ((StrVal[0] >= '0' && StrVal[0] <= '9') || ((StrVal[0] == '-' || StrVal[0] == '+') && (StrVal[1] >= '0' && StrVal[1] <= '9'))) { // Reparse stringized version! if (atof(StrVal.c_str()) == Val) { Out << StrVal; return; } } // Otherwise we could not reparse it to exactly the same value, so we must // output the string in hexadecimal format! assert(sizeof(double) == sizeof(uint64_t) && "assuming that double is 64 bits!"); Out << "0x" << utohexstr(DoubleToBits(Val)); } else { // Some form of long double. These appear as a magic letter identifying // the type, then a fixed number of hex digits. Out << "0x"; if (&CFP->getValueAPF().getSemantics() == &APFloat::x87DoubleExtended) Out << 'K'; else if (&CFP->getValueAPF().getSemantics() == &APFloat::IEEEquad) Out << 'L'; else if (&CFP->getValueAPF().getSemantics() == &APFloat::PPCDoubleDouble) Out << 'M'; else assert(0 && "Unsupported floating point type"); // api needed to prevent premature destruction APInt api = CFP->getValueAPF().convertToAPInt(); const uint64_t* p = api.getRawData(); uint64_t word = *p; int shiftcount=60; int width = api.getBitWidth(); for (int j=0; j>shiftcount) & 15; if (nibble < 10) Out << (unsigned char)(nibble + '0'); else Out << (unsigned char)(nibble - 10 + 'A'); if (shiftcount == 0 && j+4 < width) { word = *(++p); shiftcount = 64; if (width-j-4 < 64) shiftcount = width-j-4; } } } } else if (isa(CV)) { Out << "zeroinitializer"; } else if (const ConstantArray *CA = dyn_cast(CV)) { // As a special case, print the array as a string if it is an array of // i8 with ConstantInt values. // const Type *ETy = CA->getType()->getElementType(); if (CA->isString()) { Out << "c\""; PrintEscapedString(CA->getAsString(), Out); Out << "\""; } else { // Cannot output in string format... Out << '['; if (CA->getNumOperands()) { Out << ' '; printTypeInt(Out, ETy, TypeTable); WriteAsOperandInternal(Out, CA->getOperand(0), TypeTable, Machine); for (unsigned i = 1, e = CA->getNumOperands(); i != e; ++i) { Out << ", "; printTypeInt(Out, ETy, TypeTable); WriteAsOperandInternal(Out, CA->getOperand(i), TypeTable, Machine); } } Out << " ]"; } } else if (const ConstantStruct *CS = dyn_cast(CV)) { if (CS->getType()->isPacked()) Out << '<'; Out << '{'; unsigned N = CS->getNumOperands(); if (N) { if (N > 2) { Indent += std::string(IndentSize, ' '); Out << Indent; } else { Out << ' '; } printTypeInt(Out, CS->getOperand(0)->getType(), TypeTable); WriteAsOperandInternal(Out, CS->getOperand(0), TypeTable, Machine); for (unsigned i = 1; i < N; i++) { Out << ", "; if (N > 2) Out << Indent; printTypeInt(Out, CS->getOperand(i)->getType(), TypeTable); WriteAsOperandInternal(Out, CS->getOperand(i), TypeTable, Machine); } if (N > 2) Indent.resize(Indent.size() - IndentSize); } Out << " }"; if (CS->getType()->isPacked()) Out << '>'; } else if (const ConstantVector *CP = dyn_cast(CV)) { const Type *ETy = CP->getType()->getElementType(); assert(CP->getNumOperands() > 0 && "Number of operands for a PackedConst must be > 0"); Out << '<'; Out << ' '; printTypeInt(Out, ETy, TypeTable); WriteAsOperandInternal(Out, CP->getOperand(0), TypeTable, Machine); for (unsigned i = 1, e = CP->getNumOperands(); i != e; ++i) { Out << ", "; printTypeInt(Out, ETy, TypeTable); WriteAsOperandInternal(Out, CP->getOperand(i), TypeTable, Machine); } Out << " >"; } else if (isa(CV)) { Out << "null"; } else if (isa(CV)) { Out << "undef"; } else if (const ConstantExpr *CE = dyn_cast(CV)) { Out << CE->getOpcodeName(); if (CE->isCompare()) Out << " " << getPredicateText(CE->getPredicate()); Out << " ("; for (User::const_op_iterator OI=CE->op_begin(); OI != CE->op_end(); ++OI) { printTypeInt(Out, (*OI)->getType(), TypeTable); WriteAsOperandInternal(Out, *OI, TypeTable, Machine); if (OI+1 != CE->op_end()) Out << ", "; } if (CE->hasIndices()) { const SmallVector &Indices = CE->getIndices(); for (unsigned i = 0, e = Indices.size(); i != e; ++i) Out << ", " << Indices[i]; } if (CE->isCast()) { Out << " to "; printTypeInt(Out, CE->getType(), TypeTable); } Out << ')'; } else { Out << ""; } } /// WriteAsOperand - Write the name of the specified value out to the specified /// ostream. This can be useful when you just want to print int %reg126, not /// the whole instruction that generated it. /// static void WriteAsOperandInternal(std::ostream &Out, const Value *V, std::map &TypeTable, SlotMachine *Machine) { Out << ' '; if (V->hasName()) { PrintLLVMName(Out, V); return; } const Constant *CV = dyn_cast(V); if (CV && !isa(CV)) { WriteConstantInt(Out, CV, TypeTable, Machine); } else if (const InlineAsm *IA = dyn_cast(V)) { Out << "asm "; if (IA->hasSideEffects()) Out << "sideeffect "; Out << '"'; PrintEscapedString(IA->getAsmString(), Out); Out << "\", \""; PrintEscapedString(IA->getConstraintString(), Out); Out << '"'; } else { char Prefix = '%'; int Slot; if (Machine) { if (const GlobalValue *GV = dyn_cast(V)) { Slot = Machine->getGlobalSlot(GV); Prefix = '@'; } else { Slot = Machine->getLocalSlot(V); } } else { Machine = createSlotMachine(V); if (Machine) { if (const GlobalValue *GV = dyn_cast(V)) { Slot = Machine->getGlobalSlot(GV); Prefix = '@'; } else { Slot = Machine->getLocalSlot(V); } } else { Slot = -1; } delete Machine; } if (Slot != -1) Out << Prefix << Slot; else Out << ""; } } /// WriteAsOperand - Write the name of the specified value out to the specified /// ostream. This can be useful when you just want to print int %reg126, not /// the whole instruction that generated it. /// std::ostream &llvm::WriteAsOperand(std::ostream &Out, const Value *V, bool PrintType, const Module *Context) { std::map TypeNames; if (Context == 0) Context = getModuleFromVal(V); if (Context) fillTypeNameTable(Context, TypeNames); if (PrintType) printTypeInt(Out, V->getType(), TypeNames); WriteAsOperandInternal(Out, V, TypeNames, 0); return Out; } namespace llvm { class AssemblyWriter { std::ostream &Out; SlotMachine &Machine; const Module *TheModule; std::map TypeNames; AssemblyAnnotationWriter *AnnotationWriter; public: inline AssemblyWriter(std::ostream &o, SlotMachine &Mac, const Module *M, AssemblyAnnotationWriter *AAW) : Out(o), Machine(Mac), TheModule(M), AnnotationWriter(AAW) { // If the module has a symbol table, take all global types and stuff their // names into the TypeNames map. // fillTypeNameTable(M, TypeNames); } inline void write(const Module *M) { printModule(M); } inline void write(const GlobalVariable *G) { printGlobal(G); } inline void write(const GlobalAlias *G) { printAlias(G); } inline void write(const Function *F) { printFunction(F); } inline void write(const BasicBlock *BB) { printBasicBlock(BB); } inline void write(const Instruction *I) { printInstruction(*I); } inline void write(const Type *Ty) { printType(Ty); } void writeOperand(const Value *Op, bool PrintType); void writeParamOperand(const Value *Operand, ParameterAttributes Attrs); const Module* getModule() { return TheModule; } private: void printModule(const Module *M); void printTypeSymbolTable(const TypeSymbolTable &ST); void printGlobal(const GlobalVariable *GV); void printAlias(const GlobalAlias *GV); void printFunction(const Function *F); void printArgument(const Argument *FA, ParameterAttributes Attrs); void printBasicBlock(const BasicBlock *BB); void printInstruction(const Instruction &I); // printType - Go to extreme measures to attempt to print out a short, // symbolic version of a type name. // std::ostream &printType(const Type *Ty) { return printTypeInt(Out, Ty, TypeNames); } // printTypeAtLeastOneLevel - Print out one level of the possibly complex type // without considering any symbolic types that we may have equal to it. // std::ostream &printTypeAtLeastOneLevel(const Type *Ty); // printInfoComment - Print a little comment after the instruction indicating // which slot it occupies. void printInfoComment(const Value &V); }; } // end of llvm namespace /// printTypeAtLeastOneLevel - Print out one level of the possibly complex type /// without considering any symbolic types that we may have equal to it. /// std::ostream &AssemblyWriter::printTypeAtLeastOneLevel(const Type *Ty) { if (const IntegerType *ITy = dyn_cast(Ty)) Out << "i" << utostr(ITy->getBitWidth()); else if (const FunctionType *FTy = dyn_cast(Ty)) { printType(FTy->getReturnType()); Out << " ("; for (FunctionType::param_iterator I = FTy->param_begin(), E = FTy->param_end(); I != E; ++I) { if (I != FTy->param_begin()) Out << ", "; printType(*I); } if (FTy->isVarArg()) { if (FTy->getNumParams()) Out << ", "; Out << "..."; } Out << ')'; } else if (const StructType *STy = dyn_cast(Ty)) { if (STy->isPacked()) Out << '<'; Out << "{ "; for (StructType::element_iterator I = STy->element_begin(), E = STy->element_end(); I != E; ++I) { if (I != STy->element_begin()) Out << ", "; printType(*I); } Out << " }"; if (STy->isPacked()) Out << '>'; } else if (const PointerType *PTy = dyn_cast(Ty)) { printType(PTy->getElementType()); if (unsigned AddressSpace = PTy->getAddressSpace()) Out << " addrspace(" << AddressSpace << ")"; Out << '*'; } else if (const ArrayType *ATy = dyn_cast(Ty)) { Out << '[' << ATy->getNumElements() << " x "; printType(ATy->getElementType()) << ']'; } else if (const VectorType *PTy = dyn_cast(Ty)) { Out << '<' << PTy->getNumElements() << " x "; printType(PTy->getElementType()) << '>'; } else if (isa(Ty)) { Out << "opaque"; } else { if (!Ty->isPrimitiveType()) Out << ""; printType(Ty); } return Out; } void AssemblyWriter::writeOperand(const Value *Operand, bool PrintType) { if (Operand == 0) { Out << ""; } else { if (PrintType) { Out << ' '; printType(Operand->getType()); } WriteAsOperandInternal(Out, Operand, TypeNames, &Machine); } } void AssemblyWriter::writeParamOperand(const Value *Operand, ParameterAttributes Attrs) { if (Operand == 0) { Out << ""; } else { Out << ' '; // Print the type printType(Operand->getType()); // Print parameter attributes list if (Attrs != ParamAttr::None) Out << ' ' << ParamAttr::getAsString(Attrs); // Print the operand WriteAsOperandInternal(Out, Operand, TypeNames, &Machine); } } void AssemblyWriter::printModule(const Module *M) { if (!M->getModuleIdentifier().empty() && // Don't print the ID if it will start a new line (which would // require a comment char before it). M->getModuleIdentifier().find('\n') == std::string::npos) Out << "; ModuleID = '" << M->getModuleIdentifier() << "'\n"; if (!M->getDataLayout().empty()) Out << "target datalayout = \"" << M->getDataLayout() << "\"\n"; if (!M->getTargetTriple().empty()) Out << "target triple = \"" << M->getTargetTriple() << "\"\n"; if (!M->getModuleInlineAsm().empty()) { // Split the string into lines, to make it easier to read the .ll file. std::string Asm = M->getModuleInlineAsm(); size_t CurPos = 0; size_t NewLine = Asm.find_first_of('\n', CurPos); while (NewLine != std::string::npos) { // We found a newline, print the portion of the asm string from the // last newline up to this newline. Out << "module asm \""; PrintEscapedString(std::string(Asm.begin()+CurPos, Asm.begin()+NewLine), Out); Out << "\"\n"; CurPos = NewLine+1; NewLine = Asm.find_first_of('\n', CurPos); } Out << "module asm \""; PrintEscapedString(std::string(Asm.begin()+CurPos, Asm.end()), Out); Out << "\"\n"; } // Loop over the dependent libraries and emit them. Module::lib_iterator LI = M->lib_begin(); Module::lib_iterator LE = M->lib_end(); if (LI != LE) { Out << "deplibs = [ "; while (LI != LE) { Out << '"' << *LI << '"'; ++LI; if (LI != LE) Out << ", "; } Out << " ]\n"; } // Loop over the symbol table, emitting all named constants. printTypeSymbolTable(M->getTypeSymbolTable()); for (Module::const_global_iterator I = M->global_begin(), E = M->global_end(); I != E; ++I) printGlobal(I); // Output all aliases. if (!M->alias_empty()) Out << "\n"; for (Module::const_alias_iterator I = M->alias_begin(), E = M->alias_end(); I != E; ++I) printAlias(I); // Output all of the functions. for (Module::const_iterator I = M->begin(), E = M->end(); I != E; ++I) printFunction(I); } void AssemblyWriter::printGlobal(const GlobalVariable *GV) { if (GV->hasName()) { PrintLLVMName(Out, GV); Out << " = "; } if (!GV->hasInitializer()) { switch (GV->getLinkage()) { case GlobalValue::DLLImportLinkage: Out << "dllimport "; break; case GlobalValue::ExternalWeakLinkage: Out << "extern_weak "; break; default: Out << "external "; break; } } else { switch (GV->getLinkage()) { case GlobalValue::InternalLinkage: Out << "internal "; break; case GlobalValue::CommonLinkage: Out << "common "; break; case GlobalValue::LinkOnceLinkage: Out << "linkonce "; break; case GlobalValue::WeakLinkage: Out << "weak "; break; case GlobalValue::AppendingLinkage: Out << "appending "; break; case GlobalValue::DLLImportLinkage: Out << "dllimport "; break; case GlobalValue::DLLExportLinkage: Out << "dllexport "; break; case GlobalValue::ExternalWeakLinkage: Out << "extern_weak "; break; case GlobalValue::ExternalLinkage: break; case GlobalValue::GhostLinkage: cerr << "GhostLinkage not allowed in AsmWriter!\n"; abort(); } switch (GV->getVisibility()) { default: assert(0 && "Invalid visibility style!"); case GlobalValue::DefaultVisibility: break; case GlobalValue::HiddenVisibility: Out << "hidden "; break; case GlobalValue::ProtectedVisibility: Out << "protected "; break; } } if (GV->isThreadLocal()) Out << "thread_local "; Out << (GV->isConstant() ? "constant " : "global "); printType(GV->getType()->getElementType()); if (GV->hasInitializer()) writeOperand(GV->getInitializer(), false); if (unsigned AddressSpace = GV->getType()->getAddressSpace()) Out << " addrspace(" << AddressSpace << ") "; if (GV->hasSection()) Out << ", section \"" << GV->getSection() << '"'; if (GV->getAlignment()) Out << ", align " << GV->getAlignment(); printInfoComment(*GV); Out << "\n"; } void AssemblyWriter::printAlias(const GlobalAlias *GA) { // Don't crash when dumping partially built GA if (!GA->hasName()) Out << "<> = "; else { PrintLLVMName(Out, GA); Out << " = "; } switch (GA->getVisibility()) { default: assert(0 && "Invalid visibility style!"); case GlobalValue::DefaultVisibility: break; case GlobalValue::HiddenVisibility: Out << "hidden "; break; case GlobalValue::ProtectedVisibility: Out << "protected "; break; } Out << "alias "; switch (GA->getLinkage()) { case GlobalValue::WeakLinkage: Out << "weak "; break; case GlobalValue::InternalLinkage: Out << "internal "; break; case GlobalValue::ExternalLinkage: break; default: assert(0 && "Invalid alias linkage"); } const Constant *Aliasee = GA->getAliasee(); if (const GlobalVariable *GV = dyn_cast(Aliasee)) { printType(GV->getType()); Out << ' '; PrintLLVMName(Out, GV); } else if (const Function *F = dyn_cast(Aliasee)) { printType(F->getFunctionType()); Out << "* "; if (F->hasName()) PrintLLVMName(Out, F); else Out << "@\"\""; } else if (const GlobalAlias *GA = dyn_cast(Aliasee)) { printType(GA->getType()); Out << " "; PrintLLVMName(Out, GA); } else { const ConstantExpr *CE = 0; if ((CE = dyn_cast(Aliasee)) && (CE->getOpcode() == Instruction::BitCast)) { writeOperand(CE, false); } else assert(0 && "Unsupported aliasee"); } printInfoComment(*GA); Out << "\n"; } void AssemblyWriter::printTypeSymbolTable(const TypeSymbolTable &ST) { // Print the types. for (TypeSymbolTable::const_iterator TI = ST.begin(), TE = ST.end(); TI != TE; ++TI) { Out << "\t" << getLLVMName(TI->first, LocalPrefix) << " = type "; // Make sure we print out at least one level of the type structure, so // that we do not get %FILE = type %FILE // printTypeAtLeastOneLevel(TI->second) << "\n"; } } /// printFunction - Print all aspects of a function. /// void AssemblyWriter::printFunction(const Function *F) { // Print out the return type and name... Out << "\n"; if (AnnotationWriter) AnnotationWriter->emitFunctionAnnot(F, Out); if (F->isDeclaration()) Out << "declare "; else Out << "define "; switch (F->getLinkage()) { case GlobalValue::InternalLinkage: Out << "internal "; break; case GlobalValue::LinkOnceLinkage: Out << "linkonce "; break; case GlobalValue::WeakLinkage: Out << "weak "; break; case GlobalValue::CommonLinkage: Out << "common "; break; case GlobalValue::AppendingLinkage: Out << "appending "; break; case GlobalValue::DLLImportLinkage: Out << "dllimport "; break; case GlobalValue::DLLExportLinkage: Out << "dllexport "; break; case GlobalValue::ExternalWeakLinkage: Out << "extern_weak "; break; case GlobalValue::ExternalLinkage: break; case GlobalValue::GhostLinkage: cerr << "GhostLinkage not allowed in AsmWriter!\n"; abort(); } switch (F->getVisibility()) { default: assert(0 && "Invalid visibility style!"); case GlobalValue::DefaultVisibility: break; case GlobalValue::HiddenVisibility: Out << "hidden "; break; case GlobalValue::ProtectedVisibility: Out << "protected "; break; } // Print the calling convention. switch (F->getCallingConv()) { case CallingConv::C: break; // default case CallingConv::Fast: Out << "fastcc "; break; case CallingConv::Cold: Out << "coldcc "; break; case CallingConv::X86_StdCall: Out << "x86_stdcallcc "; break; case CallingConv::X86_FastCall: Out << "x86_fastcallcc "; break; case CallingConv::X86_SSECall: Out << "x86_ssecallcc "; break; default: Out << "cc" << F->getCallingConv() << " "; break; } const FunctionType *FT = F->getFunctionType(); const PAListPtr &Attrs = F->getParamAttrs(); printType(F->getReturnType()) << ' '; if (!F->getName().empty()) PrintLLVMName(Out, F); else Out << "@\"\""; Out << '('; Machine.incorporateFunction(F); // Loop over the arguments, printing them... unsigned Idx = 1; if (!F->isDeclaration()) { // If this isn't a declaration, print the argument names as well. for (Function::const_arg_iterator I = F->arg_begin(), E = F->arg_end(); I != E; ++I) { // Insert commas as we go... the first arg doesn't get a comma if (I != F->arg_begin()) Out << ", "; printArgument(I, Attrs.getParamAttrs(Idx)); Idx++; } } else { // Otherwise, print the types from the function type. for (unsigned i = 0, e = FT->getNumParams(); i != e; ++i) { // Insert commas as we go... the first arg doesn't get a comma if (i) Out << ", "; // Output type... printType(FT->getParamType(i)); ParameterAttributes ArgAttrs = Attrs.getParamAttrs(i+1); if (ArgAttrs != ParamAttr::None) Out << ' ' << ParamAttr::getAsString(ArgAttrs); } } // Finish printing arguments... if (FT->isVarArg()) { if (FT->getNumParams()) Out << ", "; Out << "..."; // Output varargs portion of signature! } Out << ')'; ParameterAttributes RetAttrs = Attrs.getParamAttrs(0); if (RetAttrs != ParamAttr::None) Out << ' ' << ParamAttr::getAsString(Attrs.getParamAttrs(0)); if (F->hasSection()) Out << " section \"" << F->getSection() << '"'; if (F->getAlignment()) Out << " align " << F->getAlignment(); if (F->hasCollector()) Out << " gc \"" << F->getCollector() << '"'; if (F->isDeclaration()) { Out << "\n"; } else { Out << " {"; // Output all of its basic blocks... for the function for (Function::const_iterator I = F->begin(), E = F->end(); I != E; ++I) printBasicBlock(I); Out << "}\n"; } Machine.purgeFunction(); } /// printArgument - This member is called for every argument that is passed into /// the function. Simply print it out /// void AssemblyWriter::printArgument(const Argument *Arg, ParameterAttributes Attrs) { // Output type... printType(Arg->getType()); // Output parameter attributes list if (Attrs != ParamAttr::None) Out << ' ' << ParamAttr::getAsString(Attrs); // Output name, if available... if (Arg->hasName()) { Out << ' '; PrintLLVMName(Out, Arg); } } /// printBasicBlock - This member is called for each basic block in a method. /// void AssemblyWriter::printBasicBlock(const BasicBlock *BB) { if (BB->hasName()) { // Print out the label if it exists... Out << "\n"; PrintLLVMName(Out, BB->getValueName(), LabelPrefix); Out << ':'; } else if (!BB->use_empty()) { // Don't print block # of no uses... Out << "\n;