| //===-- llvm-objdump.cpp - Object file dumping utility for llvm -----------===// |
| // |
| // The LLVM Compiler Infrastructure |
| // |
| // This file is distributed under the University of Illinois Open Source |
| // License. See LICENSE.TXT for details. |
| // |
| //===----------------------------------------------------------------------===// |
| // |
| // This program is a utility that works like binutils "objdump", that is, it |
| // dumps out a plethora of information about an object file depending on the |
| // flags. |
| // |
| // The flags and output of this program should be near identical to those of |
| // binutils objdump. |
| // |
| //===----------------------------------------------------------------------===// |
| |
| #include "llvm-objdump.h" |
| #include "llvm/ADT/STLExtras.h" |
| #include "llvm/ADT/StringExtras.h" |
| #include "llvm/ADT/Triple.h" |
| #include "llvm/MC/MCAnalysis/MCAtom.h" |
| #include "llvm/MC/MCAnalysis/MCFunction.h" |
| #include "llvm/MC/MCAnalysis/MCModule.h" |
| #include "llvm/MC/MCAnalysis/MCModuleYAML.h" |
| #include "llvm/MC/MCAsmInfo.h" |
| #include "llvm/MC/MCContext.h" |
| #include "llvm/MC/MCDisassembler.h" |
| #include "llvm/MC/MCInst.h" |
| #include "llvm/MC/MCInstPrinter.h" |
| #include "llvm/MC/MCInstrAnalysis.h" |
| #include "llvm/MC/MCInstrInfo.h" |
| #include "llvm/MC/MCObjectDisassembler.h" |
| #include "llvm/MC/MCObjectFileInfo.h" |
| #include "llvm/MC/MCObjectSymbolizer.h" |
| #include "llvm/MC/MCRegisterInfo.h" |
| #include "llvm/MC/MCRelocationInfo.h" |
| #include "llvm/MC/MCSubtargetInfo.h" |
| #include "llvm/Object/Archive.h" |
| #include "llvm/Object/COFF.h" |
| #include "llvm/Object/MachO.h" |
| #include "llvm/Object/ObjectFile.h" |
| #include "llvm/Support/Casting.h" |
| #include "llvm/Support/CommandLine.h" |
| #include "llvm/Support/Debug.h" |
| #include "llvm/Support/FileSystem.h" |
| #include "llvm/Support/Format.h" |
| #include "llvm/Support/GraphWriter.h" |
| #include "llvm/Support/Host.h" |
| #include "llvm/Support/ManagedStatic.h" |
| #include "llvm/Support/MemoryBuffer.h" |
| #include "llvm/Support/MemoryObject.h" |
| #include "llvm/Support/PrettyStackTrace.h" |
| #include "llvm/Support/Signals.h" |
| #include "llvm/Support/SourceMgr.h" |
| #include "llvm/Support/TargetRegistry.h" |
| #include "llvm/Support/TargetSelect.h" |
| #include "llvm/Support/raw_ostream.h" |
| #include <algorithm> |
| #include <cctype> |
| #include <cstring> |
| #include <system_error> |
| |
| using namespace llvm; |
| using namespace object; |
| |
| static cl::list<std::string> |
| InputFilenames(cl::Positional, cl::desc("<input object files>"),cl::ZeroOrMore); |
| |
| static cl::opt<bool> |
| Disassemble("disassemble", |
| cl::desc("Display assembler mnemonics for the machine instructions")); |
| static cl::alias |
| Disassembled("d", cl::desc("Alias for --disassemble"), |
| cl::aliasopt(Disassemble)); |
| |
| static cl::opt<bool> |
| Relocations("r", cl::desc("Display the relocation entries in the file")); |
| |
| static cl::opt<bool> |
| SectionContents("s", cl::desc("Display the content of each section")); |
| |
| static cl::opt<bool> |
| SymbolTable("t", cl::desc("Display the symbol table")); |
| |
| static cl::opt<bool> |
| MachOOpt("macho", cl::desc("Use MachO specific object file parser")); |
| static cl::alias |
| MachOm("m", cl::desc("Alias for --macho"), cl::aliasopt(MachOOpt)); |
| |
| cl::opt<std::string> |
| llvm::TripleName("triple", cl::desc("Target triple to disassemble for, " |
| "see -version for available targets")); |
| |
| cl::opt<std::string> |
| llvm::ArchName("arch", cl::desc("Target arch to disassemble for, " |
| "see -version for available targets")); |
| |
| static cl::opt<bool> |
| SectionHeaders("section-headers", cl::desc("Display summaries of the headers " |
| "for each section.")); |
| static cl::alias |
| SectionHeadersShort("headers", cl::desc("Alias for --section-headers"), |
| cl::aliasopt(SectionHeaders)); |
| static cl::alias |
| SectionHeadersShorter("h", cl::desc("Alias for --section-headers"), |
| cl::aliasopt(SectionHeaders)); |
| |
| static cl::list<std::string> |
| MAttrs("mattr", |
| cl::CommaSeparated, |
| cl::desc("Target specific attributes"), |
| cl::value_desc("a1,+a2,-a3,...")); |
| |
| static cl::opt<bool> |
| NoShowRawInsn("no-show-raw-insn", cl::desc("When disassembling instructions, " |
| "do not print the instruction bytes.")); |
| |
| static cl::opt<bool> |
| UnwindInfo("unwind-info", cl::desc("Display unwind information")); |
| |
| static cl::alias |
| UnwindInfoShort("u", cl::desc("Alias for --unwind-info"), |
| cl::aliasopt(UnwindInfo)); |
| |
| static cl::opt<bool> |
| PrivateHeaders("private-headers", |
| cl::desc("Display format specific file headers")); |
| |
| static cl::alias |
| PrivateHeadersShort("p", cl::desc("Alias for --private-headers"), |
| cl::aliasopt(PrivateHeaders)); |
| |
| static cl::opt<bool> |
| Symbolize("symbolize", cl::desc("When disassembling instructions, " |
| "try to symbolize operands.")); |
| |
| static cl::opt<bool> |
| CFG("cfg", cl::desc("Create a CFG for every function found in the object" |
| " and write it to a graphviz file")); |
| |
| // FIXME: Does it make sense to have a dedicated tool for yaml cfg output? |
| static cl::opt<std::string> |
| YAMLCFG("yaml-cfg", |
| cl::desc("Create a CFG and write it as a YAML MCModule."), |
| cl::value_desc("yaml output file")); |
| |
| static StringRef ToolName; |
| |
| bool llvm::error(std::error_code EC) { |
| if (!EC) |
| return false; |
| |
| outs() << ToolName << ": error reading file: " << EC.message() << ".\n"; |
| outs().flush(); |
| return true; |
| } |
| |
| static const Target *getTarget(const ObjectFile *Obj = nullptr) { |
| // Figure out the target triple. |
| llvm::Triple TheTriple("unknown-unknown-unknown"); |
| if (TripleName.empty()) { |
| if (Obj) { |
| TheTriple.setArch(Triple::ArchType(Obj->getArch())); |
| // TheTriple defaults to ELF, and COFF doesn't have an environment: |
| // the best we can do here is indicate that it is mach-o. |
| if (Obj->isMachO()) |
| TheTriple.setObjectFormat(Triple::MachO); |
| |
| if (Obj->isCOFF()) { |
| const auto COFFObj = dyn_cast<COFFObjectFile>(Obj); |
| if (COFFObj->getArch() == Triple::thumb) |
| TheTriple.setTriple("thumbv7-windows"); |
| } |
| } |
| } else |
| TheTriple.setTriple(Triple::normalize(TripleName)); |
| |
| // Get the target specific parser. |
| std::string Error; |
| const Target *TheTarget = TargetRegistry::lookupTarget(ArchName, TheTriple, |
| Error); |
| if (!TheTarget) { |
| errs() << ToolName << ": " << Error; |
| return nullptr; |
| } |
| |
| // Update the triple name and return the found target. |
| TripleName = TheTriple.getTriple(); |
| return TheTarget; |
| } |
| |
| // Write a graphviz file for the CFG inside an MCFunction. |
| // FIXME: Use GraphWriter |
| static void emitDOTFile(const char *FileName, const MCFunction &f, |
| MCInstPrinter *IP) { |
| // Start a new dot file. |
| std::string Error; |
| raw_fd_ostream Out(FileName, Error, sys::fs::F_Text); |
| if (!Error.empty()) { |
| errs() << "llvm-objdump: warning: " << Error << '\n'; |
| return; |
| } |
| |
| Out << "digraph \"" << f.getName() << "\" {\n"; |
| Out << "graph [ rankdir = \"LR\" ];\n"; |
| for (MCFunction::const_iterator i = f.begin(), e = f.end(); i != e; ++i) { |
| // Only print blocks that have predecessors. |
| bool hasPreds = (*i)->pred_begin() != (*i)->pred_end(); |
| |
| if (!hasPreds && i != f.begin()) |
| continue; |
| |
| Out << '"' << (*i)->getInsts()->getBeginAddr() << "\" [ label=\"<a>"; |
| // Print instructions. |
| for (unsigned ii = 0, ie = (*i)->getInsts()->size(); ii != ie; |
| ++ii) { |
| if (ii != 0) // Not the first line, start a new row. |
| Out << '|'; |
| if (ii + 1 == ie) // Last line, add an end id. |
| Out << "<o>"; |
| |
| // Escape special chars and print the instruction in mnemonic form. |
| std::string Str; |
| raw_string_ostream OS(Str); |
| IP->printInst(&(*i)->getInsts()->at(ii).Inst, OS, ""); |
| Out << DOT::EscapeString(OS.str()); |
| } |
| Out << "\" shape=\"record\" ];\n"; |
| |
| // Add edges. |
| for (MCBasicBlock::succ_const_iterator si = (*i)->succ_begin(), |
| se = (*i)->succ_end(); si != se; ++si) |
| Out << (*i)->getInsts()->getBeginAddr() << ":o -> " |
| << (*si)->getInsts()->getBeginAddr() << ":a\n"; |
| } |
| Out << "}\n"; |
| } |
| |
| void llvm::DumpBytes(StringRef bytes) { |
| static const char hex_rep[] = "0123456789abcdef"; |
| // FIXME: The real way to do this is to figure out the longest instruction |
| // and align to that size before printing. I'll fix this when I get |
| // around to outputting relocations. |
| // 15 is the longest x86 instruction |
| // 3 is for the hex rep of a byte + a space. |
| // 1 is for the null terminator. |
| enum { OutputSize = (15 * 3) + 1 }; |
| char output[OutputSize]; |
| |
| assert(bytes.size() <= 15 |
| && "DumpBytes only supports instructions of up to 15 bytes"); |
| memset(output, ' ', sizeof(output)); |
| unsigned index = 0; |
| for (StringRef::iterator i = bytes.begin(), |
| e = bytes.end(); i != e; ++i) { |
| output[index] = hex_rep[(*i & 0xF0) >> 4]; |
| output[index + 1] = hex_rep[*i & 0xF]; |
| index += 3; |
| } |
| |
| output[sizeof(output) - 1] = 0; |
| outs() << output; |
| } |
| |
| bool llvm::RelocAddressLess(RelocationRef a, RelocationRef b) { |
| uint64_t a_addr, b_addr; |
| if (error(a.getOffset(a_addr))) return false; |
| if (error(b.getOffset(b_addr))) return false; |
| return a_addr < b_addr; |
| } |
| |
| static void DisassembleObject(const ObjectFile *Obj, bool InlineRelocs) { |
| const Target *TheTarget = getTarget(Obj); |
| // getTarget() will have already issued a diagnostic if necessary, so |
| // just bail here if it failed. |
| if (!TheTarget) |
| return; |
| |
| // Package up features to be passed to target/subtarget |
| std::string FeaturesStr; |
| if (MAttrs.size()) { |
| SubtargetFeatures Features; |
| for (unsigned i = 0; i != MAttrs.size(); ++i) |
| Features.AddFeature(MAttrs[i]); |
| FeaturesStr = Features.getString(); |
| } |
| |
| std::unique_ptr<const MCRegisterInfo> MRI( |
| TheTarget->createMCRegInfo(TripleName)); |
| if (!MRI) { |
| errs() << "error: no register info for target " << TripleName << "\n"; |
| return; |
| } |
| |
| // Set up disassembler. |
| std::unique_ptr<const MCAsmInfo> AsmInfo( |
| TheTarget->createMCAsmInfo(*MRI, TripleName)); |
| if (!AsmInfo) { |
| errs() << "error: no assembly info for target " << TripleName << "\n"; |
| return; |
| } |
| |
| std::unique_ptr<const MCSubtargetInfo> STI( |
| TheTarget->createMCSubtargetInfo(TripleName, "", FeaturesStr)); |
| if (!STI) { |
| errs() << "error: no subtarget info for target " << TripleName << "\n"; |
| return; |
| } |
| |
| std::unique_ptr<const MCInstrInfo> MII(TheTarget->createMCInstrInfo()); |
| if (!MII) { |
| errs() << "error: no instruction info for target " << TripleName << "\n"; |
| return; |
| } |
| |
| std::unique_ptr<const MCObjectFileInfo> MOFI(new MCObjectFileInfo); |
| MCContext Ctx(AsmInfo.get(), MRI.get(), MOFI.get()); |
| |
| std::unique_ptr<MCDisassembler> DisAsm( |
| TheTarget->createMCDisassembler(*STI, Ctx)); |
| |
| if (!DisAsm) { |
| errs() << "error: no disassembler for target " << TripleName << "\n"; |
| return; |
| } |
| |
| |
| if (Symbolize) { |
| std::unique_ptr<MCRelocationInfo> RelInfo( |
| TheTarget->createMCRelocationInfo(TripleName, Ctx)); |
| if (RelInfo) { |
| std::unique_ptr<MCSymbolizer> Symzer( |
| MCObjectSymbolizer::createObjectSymbolizer(Ctx, std::move(RelInfo), |
| Obj)); |
| if (Symzer) |
| DisAsm->setSymbolizer(std::move(Symzer)); |
| } |
| } |
| |
| std::unique_ptr<const MCInstrAnalysis> MIA( |
| TheTarget->createMCInstrAnalysis(MII.get())); |
| |
| int AsmPrinterVariant = AsmInfo->getAssemblerDialect(); |
| std::unique_ptr<MCInstPrinter> IP(TheTarget->createMCInstPrinter( |
| AsmPrinterVariant, *AsmInfo, *MII, *MRI, *STI)); |
| if (!IP) { |
| errs() << "error: no instruction printer for target " << TripleName |
| << '\n'; |
| return; |
| } |
| |
| if (CFG || !YAMLCFG.empty()) { |
| std::unique_ptr<MCObjectDisassembler> OD( |
| new MCObjectDisassembler(*Obj, *DisAsm, *MIA)); |
| std::unique_ptr<MCModule> Mod(OD->buildModule(/* withCFG */ true)); |
| for (MCModule::const_atom_iterator AI = Mod->atom_begin(), |
| AE = Mod->atom_end(); |
| AI != AE; ++AI) { |
| outs() << "Atom " << (*AI)->getName() << ": \n"; |
| if (const MCTextAtom *TA = dyn_cast<MCTextAtom>(*AI)) { |
| for (MCTextAtom::const_iterator II = TA->begin(), IE = TA->end(); |
| II != IE; |
| ++II) { |
| IP->printInst(&II->Inst, outs(), ""); |
| outs() << "\n"; |
| } |
| } |
| } |
| if (CFG) { |
| for (MCModule::const_func_iterator FI = Mod->func_begin(), |
| FE = Mod->func_end(); |
| FI != FE; ++FI) { |
| static int filenum = 0; |
| emitDOTFile((Twine((*FI)->getName()) + "_" + |
| utostr(filenum) + ".dot").str().c_str(), |
| **FI, IP.get()); |
| ++filenum; |
| } |
| } |
| if (!YAMLCFG.empty()) { |
| std::string Error; |
| raw_fd_ostream YAMLOut(YAMLCFG.c_str(), Error, sys::fs::F_Text); |
| if (!Error.empty()) { |
| errs() << ToolName << ": warning: " << Error << '\n'; |
| return; |
| } |
| mcmodule2yaml(YAMLOut, *Mod, *MII, *MRI); |
| } |
| } |
| |
| StringRef Fmt = Obj->getBytesInAddress() > 4 ? "\t\t%016" PRIx64 ": " : |
| "\t\t\t%08" PRIx64 ": "; |
| |
| // Create a mapping, RelocSecs = SectionRelocMap[S], where sections |
| // in RelocSecs contain the relocations for section S. |
| std::error_code EC; |
| std::map<SectionRef, SmallVector<SectionRef, 1>> SectionRelocMap; |
| for (const SectionRef &Section : Obj->sections()) { |
| section_iterator Sec2 = Section.getRelocatedSection(); |
| if (Sec2 != Obj->section_end()) |
| SectionRelocMap[*Sec2].push_back(Section); |
| } |
| |
| for (const SectionRef &Section : Obj->sections()) { |
| bool Text; |
| if (error(Section.isText(Text))) |
| break; |
| if (!Text) |
| continue; |
| |
| uint64_t SectionAddr; |
| if (error(Section.getAddress(SectionAddr))) |
| break; |
| |
| uint64_t SectSize; |
| if (error(Section.getSize(SectSize))) |
| break; |
| |
| // Make a list of all the symbols in this section. |
| std::vector<std::pair<uint64_t, StringRef>> Symbols; |
| for (const SymbolRef &Symbol : Obj->symbols()) { |
| bool contains; |
| if (!error(Section.containsSymbol(Symbol, contains)) && contains) { |
| uint64_t Address; |
| if (error(Symbol.getAddress(Address))) |
| break; |
| if (Address == UnknownAddressOrSize) |
| continue; |
| Address -= SectionAddr; |
| if (Address >= SectSize) |
| continue; |
| |
| StringRef Name; |
| if (error(Symbol.getName(Name))) |
| break; |
| Symbols.push_back(std::make_pair(Address, Name)); |
| } |
| } |
| |
| // Sort the symbols by address, just in case they didn't come in that way. |
| array_pod_sort(Symbols.begin(), Symbols.end()); |
| |
| // Make a list of all the relocations for this section. |
| std::vector<RelocationRef> Rels; |
| if (InlineRelocs) { |
| for (const SectionRef &RelocSec : SectionRelocMap[Section]) { |
| for (const RelocationRef &Reloc : RelocSec.relocations()) { |
| Rels.push_back(Reloc); |
| } |
| } |
| } |
| |
| // Sort relocations by address. |
| std::sort(Rels.begin(), Rels.end(), RelocAddressLess); |
| |
| StringRef SegmentName = ""; |
| if (const MachOObjectFile *MachO = dyn_cast<const MachOObjectFile>(Obj)) { |
| DataRefImpl DR = Section.getRawDataRefImpl(); |
| SegmentName = MachO->getSectionFinalSegmentName(DR); |
| } |
| StringRef name; |
| if (error(Section.getName(name))) |
| break; |
| outs() << "Disassembly of section "; |
| if (!SegmentName.empty()) |
| outs() << SegmentName << ","; |
| outs() << name << ':'; |
| |
| // If the section has no symbols just insert a dummy one and disassemble |
| // the whole section. |
| if (Symbols.empty()) |
| Symbols.push_back(std::make_pair(0, name)); |
| |
| |
| SmallString<40> Comments; |
| raw_svector_ostream CommentStream(Comments); |
| |
| StringRef Bytes; |
| if (error(Section.getContents(Bytes))) |
| break; |
| StringRefMemoryObject memoryObject(Bytes, SectionAddr); |
| uint64_t Size; |
| uint64_t Index; |
| |
| std::vector<RelocationRef>::const_iterator rel_cur = Rels.begin(); |
| std::vector<RelocationRef>::const_iterator rel_end = Rels.end(); |
| // Disassemble symbol by symbol. |
| for (unsigned si = 0, se = Symbols.size(); si != se; ++si) { |
| uint64_t Start = Symbols[si].first; |
| uint64_t End; |
| // The end is either the size of the section or the beginning of the next |
| // symbol. |
| if (si == se - 1) |
| End = SectSize; |
| // Make sure this symbol takes up space. |
| else if (Symbols[si + 1].first != Start) |
| End = Symbols[si + 1].first - 1; |
| else |
| // This symbol has the same address as the next symbol. Skip it. |
| continue; |
| |
| outs() << '\n' << Symbols[si].second << ":\n"; |
| |
| #ifndef NDEBUG |
| raw_ostream &DebugOut = DebugFlag ? dbgs() : nulls(); |
| #else |
| raw_ostream &DebugOut = nulls(); |
| #endif |
| |
| for (Index = Start; Index < End; Index += Size) { |
| MCInst Inst; |
| |
| if (DisAsm->getInstruction(Inst, Size, memoryObject, |
| SectionAddr + Index, |
| DebugOut, CommentStream)) { |
| outs() << format("%8" PRIx64 ":", SectionAddr + Index); |
| if (!NoShowRawInsn) { |
| outs() << "\t"; |
| DumpBytes(StringRef(Bytes.data() + Index, Size)); |
| } |
| IP->printInst(&Inst, outs(), ""); |
| outs() << CommentStream.str(); |
| Comments.clear(); |
| outs() << "\n"; |
| } else { |
| errs() << ToolName << ": warning: invalid instruction encoding\n"; |
| if (Size == 0) |
| Size = 1; // skip illegible bytes |
| } |
| |
| // Print relocation for instruction. |
| while (rel_cur != rel_end) { |
| bool hidden = false; |
| uint64_t addr; |
| SmallString<16> name; |
| SmallString<32> val; |
| |
| // If this relocation is hidden, skip it. |
| if (error(rel_cur->getHidden(hidden))) goto skip_print_rel; |
| if (hidden) goto skip_print_rel; |
| |
| if (error(rel_cur->getOffset(addr))) goto skip_print_rel; |
| // Stop when rel_cur's address is past the current instruction. |
| if (addr >= Index + Size) break; |
| if (error(rel_cur->getTypeName(name))) goto skip_print_rel; |
| if (error(rel_cur->getValueString(val))) goto skip_print_rel; |
| |
| outs() << format(Fmt.data(), SectionAddr + addr) << name |
| << "\t" << val << "\n"; |
| |
| skip_print_rel: |
| ++rel_cur; |
| } |
| } |
| } |
| } |
| } |
| |
| static void PrintRelocations(const ObjectFile *Obj) { |
| StringRef Fmt = Obj->getBytesInAddress() > 4 ? "%016" PRIx64 : |
| "%08" PRIx64; |
| for (const SectionRef &Section : Obj->sections()) { |
| if (Section.relocation_begin() == Section.relocation_end()) |
| continue; |
| StringRef secname; |
| if (error(Section.getName(secname))) |
| continue; |
| outs() << "RELOCATION RECORDS FOR [" << secname << "]:\n"; |
| for (const RelocationRef &Reloc : Section.relocations()) { |
| bool hidden; |
| uint64_t address; |
| SmallString<32> relocname; |
| SmallString<32> valuestr; |
| if (error(Reloc.getHidden(hidden))) |
| continue; |
| if (hidden) |
| continue; |
| if (error(Reloc.getTypeName(relocname))) |
| continue; |
| if (error(Reloc.getOffset(address))) |
| continue; |
| if (error(Reloc.getValueString(valuestr))) |
| continue; |
| outs() << format(Fmt.data(), address) << " " << relocname << " " |
| << valuestr << "\n"; |
| } |
| outs() << "\n"; |
| } |
| } |
| |
| static void PrintSectionHeaders(const ObjectFile *Obj) { |
| outs() << "Sections:\n" |
| "Idx Name Size Address Type\n"; |
| unsigned i = 0; |
| for (const SectionRef &Section : Obj->sections()) { |
| StringRef Name; |
| if (error(Section.getName(Name))) |
| return; |
| uint64_t Address; |
| if (error(Section.getAddress(Address))) |
| return; |
| uint64_t Size; |
| if (error(Section.getSize(Size))) |
| return; |
| bool Text, Data, BSS; |
| if (error(Section.isText(Text))) |
| return; |
| if (error(Section.isData(Data))) |
| return; |
| if (error(Section.isBSS(BSS))) |
| return; |
| std::string Type = (std::string(Text ? "TEXT " : "") + |
| (Data ? "DATA " : "") + (BSS ? "BSS" : "")); |
| outs() << format("%3d %-13s %08" PRIx64 " %016" PRIx64 " %s\n", i, |
| Name.str().c_str(), Size, Address, Type.c_str()); |
| ++i; |
| } |
| } |
| |
| static void PrintSectionContents(const ObjectFile *Obj) { |
| std::error_code EC; |
| for (const SectionRef &Section : Obj->sections()) { |
| StringRef Name; |
| StringRef Contents; |
| uint64_t BaseAddr; |
| bool BSS; |
| if (error(Section.getName(Name))) |
| continue; |
| if (error(Section.getAddress(BaseAddr))) |
| continue; |
| if (error(Section.isBSS(BSS))) |
| continue; |
| |
| outs() << "Contents of section " << Name << ":\n"; |
| if (BSS) { |
| uint64_t Size; |
| if (error(Section.getSize(Size))) |
| continue; |
| outs() << format("<skipping contents of bss section at [%04" PRIx64 |
| ", %04" PRIx64 ")>\n", |
| BaseAddr, BaseAddr + Size); |
| continue; |
| } |
| |
| if (error(Section.getContents(Contents))) |
| continue; |
| |
| // Dump out the content as hex and printable ascii characters. |
| for (std::size_t addr = 0, end = Contents.size(); addr < end; addr += 16) { |
| outs() << format(" %04" PRIx64 " ", BaseAddr + addr); |
| // Dump line of hex. |
| for (std::size_t i = 0; i < 16; ++i) { |
| if (i != 0 && i % 4 == 0) |
| outs() << ' '; |
| if (addr + i < end) |
| outs() << hexdigit((Contents[addr + i] >> 4) & 0xF, true) |
| << hexdigit(Contents[addr + i] & 0xF, true); |
| else |
| outs() << " "; |
| } |
| // Print ascii. |
| outs() << " "; |
| for (std::size_t i = 0; i < 16 && addr + i < end; ++i) { |
| if (std::isprint(static_cast<unsigned char>(Contents[addr + i]) & 0xFF)) |
| outs() << Contents[addr + i]; |
| else |
| outs() << "."; |
| } |
| outs() << "\n"; |
| } |
| } |
| } |
| |
| static void PrintCOFFSymbolTable(const COFFObjectFile *coff) { |
| const coff_file_header *header; |
| if (error(coff->getHeader(header))) |
| return; |
| |
| for (unsigned SI = 0, SE = header->NumberOfSymbols; SI != SE; ++SI) { |
| const coff_symbol *Symbol; |
| StringRef Name; |
| if (error(coff->getSymbol(SI, Symbol))) |
| return; |
| |
| if (error(coff->getSymbolName(Symbol, Name))) |
| return; |
| |
| outs() << "[" << format("%2d", SI) << "]" |
| << "(sec " << format("%2d", int(Symbol->SectionNumber)) << ")" |
| << "(fl 0x00)" // Flag bits, which COFF doesn't have. |
| << "(ty " << format("%3x", unsigned(Symbol->Type)) << ")" |
| << "(scl " << format("%3x", unsigned(Symbol->StorageClass)) << ") " |
| << "(nx " << unsigned(Symbol->NumberOfAuxSymbols) << ") " |
| << "0x" << format("%08x", unsigned(Symbol->Value)) << " " |
| << Name << "\n"; |
| |
| for (unsigned AI = 0, AE = Symbol->NumberOfAuxSymbols; AI < AE; ++AI, ++SI) { |
| if (Symbol->isSectionDefinition()) { |
| const coff_aux_section_definition *asd; |
| if (error(coff->getAuxSymbol<coff_aux_section_definition>(SI + 1, asd))) |
| return; |
| |
| outs() << "AUX " |
| << format("scnlen 0x%x nreloc %d nlnno %d checksum 0x%x " |
| , unsigned(asd->Length) |
| , unsigned(asd->NumberOfRelocations) |
| , unsigned(asd->NumberOfLinenumbers) |
| , unsigned(asd->CheckSum)) |
| << format("assoc %d comdat %d\n" |
| , unsigned(asd->Number) |
| , unsigned(asd->Selection)); |
| } else if (Symbol->isFileRecord()) { |
| const coff_aux_file *AF; |
| if (error(coff->getAuxSymbol<coff_aux_file>(SI + 1, AF))) |
| return; |
| |
| StringRef Name(AF->FileName, |
| Symbol->NumberOfAuxSymbols * COFF::SymbolSize); |
| outs() << "AUX " << Name.rtrim(StringRef("\0", 1)) << '\n'; |
| |
| SI = SI + Symbol->NumberOfAuxSymbols; |
| break; |
| } else { |
| outs() << "AUX Unknown\n"; |
| } |
| } |
| } |
| } |
| |
| static void PrintSymbolTable(const ObjectFile *o) { |
| outs() << "SYMBOL TABLE:\n"; |
| |
| if (const COFFObjectFile *coff = dyn_cast<const COFFObjectFile>(o)) { |
| PrintCOFFSymbolTable(coff); |
| return; |
| } |
| for (const SymbolRef &Symbol : o->symbols()) { |
| StringRef Name; |
| uint64_t Address; |
| SymbolRef::Type Type; |
| uint64_t Size; |
| uint32_t Flags = Symbol.getFlags(); |
| section_iterator Section = o->section_end(); |
| if (error(Symbol.getName(Name))) |
| continue; |
| if (error(Symbol.getAddress(Address))) |
| continue; |
| if (error(Symbol.getType(Type))) |
| continue; |
| if (error(Symbol.getSize(Size))) |
| continue; |
| if (error(Symbol.getSection(Section))) |
| continue; |
| |
| bool Global = Flags & SymbolRef::SF_Global; |
| bool Weak = Flags & SymbolRef::SF_Weak; |
| bool Absolute = Flags & SymbolRef::SF_Absolute; |
| |
| if (Address == UnknownAddressOrSize) |
| Address = 0; |
| if (Size == UnknownAddressOrSize) |
| Size = 0; |
| char GlobLoc = ' '; |
| if (Type != SymbolRef::ST_Unknown) |
| GlobLoc = Global ? 'g' : 'l'; |
| char Debug = (Type == SymbolRef::ST_Debug || Type == SymbolRef::ST_File) |
| ? 'd' : ' '; |
| char FileFunc = ' '; |
| if (Type == SymbolRef::ST_File) |
| FileFunc = 'f'; |
| else if (Type == SymbolRef::ST_Function) |
| FileFunc = 'F'; |
| |
| const char *Fmt = o->getBytesInAddress() > 4 ? "%016" PRIx64 : |
| "%08" PRIx64; |
| |
| outs() << format(Fmt, Address) << " " |
| << GlobLoc // Local -> 'l', Global -> 'g', Neither -> ' ' |
| << (Weak ? 'w' : ' ') // Weak? |
| << ' ' // Constructor. Not supported yet. |
| << ' ' // Warning. Not supported yet. |
| << ' ' // Indirect reference to another symbol. |
| << Debug // Debugging (d) or dynamic (D) symbol. |
| << FileFunc // Name of function (F), file (f) or object (O). |
| << ' '; |
| if (Absolute) { |
| outs() << "*ABS*"; |
| } else if (Section == o->section_end()) { |
| outs() << "*UND*"; |
| } else { |
| if (const MachOObjectFile *MachO = |
| dyn_cast<const MachOObjectFile>(o)) { |
| DataRefImpl DR = Section->getRawDataRefImpl(); |
| StringRef SegmentName = MachO->getSectionFinalSegmentName(DR); |
| outs() << SegmentName << ","; |
| } |
| StringRef SectionName; |
| if (error(Section->getName(SectionName))) |
| SectionName = ""; |
| outs() << SectionName; |
| } |
| outs() << '\t' |
| << format("%08" PRIx64 " ", Size) |
| << Name |
| << '\n'; |
| } |
| } |
| |
| static void PrintUnwindInfo(const ObjectFile *o) { |
| outs() << "Unwind info:\n\n"; |
| |
| if (const COFFObjectFile *coff = dyn_cast<COFFObjectFile>(o)) { |
| printCOFFUnwindInfo(coff); |
| } else { |
| // TODO: Extract DWARF dump tool to objdump. |
| errs() << "This operation is only currently supported " |
| "for COFF object files.\n"; |
| return; |
| } |
| } |
| |
| static void printPrivateFileHeader(const ObjectFile *o) { |
| if (o->isELF()) { |
| printELFFileHeader(o); |
| } else if (o->isCOFF()) { |
| printCOFFFileHeader(o); |
| } |
| } |
| |
| static void DumpObject(const ObjectFile *o) { |
| outs() << '\n'; |
| outs() << o->getFileName() |
| << ":\tfile format " << o->getFileFormatName() << "\n\n"; |
| |
| if (Disassemble) |
| DisassembleObject(o, Relocations); |
| if (Relocations && !Disassemble) |
| PrintRelocations(o); |
| if (SectionHeaders) |
| PrintSectionHeaders(o); |
| if (SectionContents) |
| PrintSectionContents(o); |
| if (SymbolTable) |
| PrintSymbolTable(o); |
| if (UnwindInfo) |
| PrintUnwindInfo(o); |
| if (PrivateHeaders) |
| printPrivateFileHeader(o); |
| } |
| |
| /// @brief Dump each object file in \a a; |
| static void DumpArchive(const Archive *a) { |
| for (Archive::child_iterator i = a->child_begin(), e = a->child_end(); i != e; |
| ++i) { |
| ErrorOr<std::unique_ptr<Binary>> ChildOrErr = i->getAsBinary(); |
| if (std::error_code EC = ChildOrErr.getError()) { |
| // Ignore non-object files. |
| if (EC != object_error::invalid_file_type) |
| errs() << ToolName << ": '" << a->getFileName() << "': " << EC.message() |
| << ".\n"; |
| continue; |
| } |
| if (ObjectFile *o = dyn_cast<ObjectFile>(&*ChildOrErr.get())) |
| DumpObject(o); |
| else |
| errs() << ToolName << ": '" << a->getFileName() << "': " |
| << "Unrecognized file type.\n"; |
| } |
| } |
| |
| /// @brief Open file and figure out how to dump it. |
| static void DumpInput(StringRef file) { |
| // If file isn't stdin, check that it exists. |
| if (file != "-" && !sys::fs::exists(file)) { |
| errs() << ToolName << ": '" << file << "': " << "No such file\n"; |
| return; |
| } |
| |
| if (MachOOpt && Disassemble) { |
| DisassembleInputMachO(file); |
| return; |
| } |
| |
| // Attempt to open the binary. |
| ErrorOr<Binary *> BinaryOrErr = createBinary(file); |
| if (std::error_code EC = BinaryOrErr.getError()) { |
| errs() << ToolName << ": '" << file << "': " << EC.message() << ".\n"; |
| return; |
| } |
| std::unique_ptr<Binary> binary(BinaryOrErr.get()); |
| |
| if (Archive *a = dyn_cast<Archive>(binary.get())) |
| DumpArchive(a); |
| else if (ObjectFile *o = dyn_cast<ObjectFile>(binary.get())) |
| DumpObject(o); |
| else |
| errs() << ToolName << ": '" << file << "': " << "Unrecognized file type.\n"; |
| } |
| |
| int main(int argc, char **argv) { |
| // Print a stack trace if we signal out. |
| sys::PrintStackTraceOnErrorSignal(); |
| PrettyStackTraceProgram X(argc, argv); |
| llvm_shutdown_obj Y; // Call llvm_shutdown() on exit. |
| |
| // Initialize targets and assembly printers/parsers. |
| llvm::InitializeAllTargetInfos(); |
| llvm::InitializeAllTargetMCs(); |
| llvm::InitializeAllAsmParsers(); |
| llvm::InitializeAllDisassemblers(); |
| |
| // Register the target printer for --version. |
| cl::AddExtraVersionPrinter(TargetRegistry::printRegisteredTargetsForVersion); |
| |
| cl::ParseCommandLineOptions(argc, argv, "llvm object file dumper\n"); |
| TripleName = Triple::normalize(TripleName); |
| |
| ToolName = argv[0]; |
| |
| // Defaults to a.out if no filenames specified. |
| if (InputFilenames.size() == 0) |
| InputFilenames.push_back("a.out"); |
| |
| if (!Disassemble |
| && !Relocations |
| && !SectionHeaders |
| && !SectionContents |
| && !SymbolTable |
| && !UnwindInfo |
| && !PrivateHeaders) { |
| cl::PrintHelpMessage(); |
| return 2; |
| } |
| |
| std::for_each(InputFilenames.begin(), InputFilenames.end(), |
| DumpInput); |
| |
| return 0; |
| } |