Home | History | Annotate | Download | only in llvm-objdump
      1 //===-- MachODump.cpp - Object file dumping utility for llvm --------------===//
      2 //
      3 //                     The LLVM Compiler Infrastructure
      4 //
      5 // This file is distributed under the University of Illinois Open Source
      6 // License. See LICENSE.TXT for details.
      7 //
      8 //===----------------------------------------------------------------------===//
      9 //
     10 // This file implements the MachO-specific dumper for llvm-objdump.
     11 //
     12 //===----------------------------------------------------------------------===//
     13 
     14 #include "llvm-objdump.h"
     15 #include "MCFunction.h"
     16 #include "llvm/Support/MachO.h"
     17 #include "llvm/Object/MachO.h"
     18 #include "llvm/ADT/OwningPtr.h"
     19 #include "llvm/ADT/Triple.h"
     20 #include "llvm/ADT/STLExtras.h"
     21 #include "llvm/DebugInfo/DIContext.h"
     22 #include "llvm/MC/MCAsmInfo.h"
     23 #include "llvm/MC/MCDisassembler.h"
     24 #include "llvm/MC/MCInst.h"
     25 #include "llvm/MC/MCInstPrinter.h"
     26 #include "llvm/MC/MCInstrAnalysis.h"
     27 #include "llvm/MC/MCInstrDesc.h"
     28 #include "llvm/MC/MCInstrInfo.h"
     29 #include "llvm/MC/MCRegisterInfo.h"
     30 #include "llvm/MC/MCSubtargetInfo.h"
     31 #include "llvm/Support/CommandLine.h"
     32 #include "llvm/Support/Debug.h"
     33 #include "llvm/Support/Format.h"
     34 #include "llvm/Support/GraphWriter.h"
     35 #include "llvm/Support/MemoryBuffer.h"
     36 #include "llvm/Support/TargetRegistry.h"
     37 #include "llvm/Support/TargetSelect.h"
     38 #include "llvm/Support/raw_ostream.h"
     39 #include "llvm/Support/system_error.h"
     40 #include <algorithm>
     41 #include <cstring>
     42 using namespace llvm;
     43 using namespace object;
     44 
     45 static cl::opt<bool>
     46   CFG("cfg", cl::desc("Create a CFG for every symbol in the object file and"
     47                       " write it to a graphviz file (MachO-only)"));
     48 
     49 static cl::opt<bool>
     50   UseDbg("g", cl::desc("Print line information from debug info if available"));
     51 
     52 static cl::opt<std::string>
     53   DSYMFile("dsym", cl::desc("Use .dSYM file for debug info"));
     54 
     55 static const Target *GetTarget(const MachOObject *MachOObj) {
     56   // Figure out the target triple.
     57   if (TripleName.empty()) {
     58     llvm::Triple TT("unknown-unknown-unknown");
     59     switch (MachOObj->getHeader().CPUType) {
     60     case llvm::MachO::CPUTypeI386:
     61       TT.setArch(Triple::ArchType(Triple::x86));
     62       break;
     63     case llvm::MachO::CPUTypeX86_64:
     64       TT.setArch(Triple::ArchType(Triple::x86_64));
     65       break;
     66     case llvm::MachO::CPUTypeARM:
     67       TT.setArch(Triple::ArchType(Triple::arm));
     68       break;
     69     case llvm::MachO::CPUTypePowerPC:
     70       TT.setArch(Triple::ArchType(Triple::ppc));
     71       break;
     72     case llvm::MachO::CPUTypePowerPC64:
     73       TT.setArch(Triple::ArchType(Triple::ppc64));
     74       break;
     75     }
     76     TripleName = TT.str();
     77   }
     78 
     79   // Get the target specific parser.
     80   std::string Error;
     81   const Target *TheTarget = TargetRegistry::lookupTarget(TripleName, Error);
     82   if (TheTarget)
     83     return TheTarget;
     84 
     85   errs() << "llvm-objdump: error: unable to get target for '" << TripleName
     86          << "', see --version and --triple.\n";
     87   return 0;
     88 }
     89 
     90 struct SymbolSorter {
     91   bool operator()(const SymbolRef &A, const SymbolRef &B) {
     92     SymbolRef::Type AType, BType;
     93     A.getType(AType);
     94     B.getType(BType);
     95 
     96     uint64_t AAddr, BAddr;
     97     if (AType != SymbolRef::ST_Function)
     98       AAddr = 0;
     99     else
    100       A.getAddress(AAddr);
    101     if (BType != SymbolRef::ST_Function)
    102       BAddr = 0;
    103     else
    104       B.getAddress(BAddr);
    105     return AAddr < BAddr;
    106   }
    107 };
    108 
    109 // Print additional information about an address, if available.
    110 static void DumpAddress(uint64_t Address, ArrayRef<SectionRef> Sections,
    111                         MachOObject *MachOObj, raw_ostream &OS) {
    112   for (unsigned i = 0; i != Sections.size(); ++i) {
    113     uint64_t SectAddr = 0, SectSize = 0;
    114     Sections[i].getAddress(SectAddr);
    115     Sections[i].getSize(SectSize);
    116     uint64_t addr = SectAddr;
    117     if (SectAddr <= Address &&
    118         SectAddr + SectSize > Address) {
    119       StringRef bytes, name;
    120       Sections[i].getContents(bytes);
    121       Sections[i].getName(name);
    122       // Print constant strings.
    123       if (!name.compare("__cstring"))
    124         OS << '"' << bytes.substr(addr, bytes.find('\0', addr)) << '"';
    125       // Print constant CFStrings.
    126       if (!name.compare("__cfstring"))
    127         OS << "@\"" << bytes.substr(addr, bytes.find('\0', addr)) << '"';
    128     }
    129   }
    130 }
    131 
    132 typedef std::map<uint64_t, MCFunction*> FunctionMapTy;
    133 typedef SmallVector<MCFunction, 16> FunctionListTy;
    134 static void createMCFunctionAndSaveCalls(StringRef Name,
    135                                          const MCDisassembler *DisAsm,
    136                                          MemoryObject &Object, uint64_t Start,
    137                                          uint64_t End,
    138                                          MCInstrAnalysis *InstrAnalysis,
    139                                          uint64_t Address,
    140                                          raw_ostream &DebugOut,
    141                                          FunctionMapTy &FunctionMap,
    142                                          FunctionListTy &Functions) {
    143   SmallVector<uint64_t, 16> Calls;
    144   MCFunction f =
    145     MCFunction::createFunctionFromMC(Name, DisAsm, Object, Start, End,
    146                                      InstrAnalysis, DebugOut, Calls);
    147   Functions.push_back(f);
    148   FunctionMap[Address] = &Functions.back();
    149 
    150   // Add the gathered callees to the map.
    151   for (unsigned i = 0, e = Calls.size(); i != e; ++i)
    152     FunctionMap.insert(std::make_pair(Calls[i], (MCFunction*)0));
    153 }
    154 
    155 // Write a graphviz file for the CFG inside an MCFunction.
    156 static void emitDOTFile(const char *FileName, const MCFunction &f,
    157                         MCInstPrinter *IP) {
    158   // Start a new dot file.
    159   std::string Error;
    160   raw_fd_ostream Out(FileName, Error);
    161   if (!Error.empty()) {
    162     errs() << "llvm-objdump: warning: " << Error << '\n';
    163     return;
    164   }
    165 
    166   Out << "digraph " << f.getName() << " {\n";
    167   Out << "graph [ rankdir = \"LR\" ];\n";
    168   for (MCFunction::iterator i = f.begin(), e = f.end(); i != e; ++i) {
    169     bool hasPreds = false;
    170     // Only print blocks that have predecessors.
    171     // FIXME: Slow.
    172     for (MCFunction::iterator pi = f.begin(), pe = f.end(); pi != pe;
    173         ++pi)
    174       if (pi->second.contains(i->first)) {
    175         hasPreds = true;
    176         break;
    177       }
    178 
    179     if (!hasPreds && i != f.begin())
    180       continue;
    181 
    182     Out << '"' << i->first << "\" [ label=\"<a>";
    183     // Print instructions.
    184     for (unsigned ii = 0, ie = i->second.getInsts().size(); ii != ie;
    185         ++ii) {
    186       // Escape special chars and print the instruction in mnemonic form.
    187       std::string Str;
    188       raw_string_ostream OS(Str);
    189       IP->printInst(&i->second.getInsts()[ii].Inst, OS, "");
    190       Out << DOT::EscapeString(OS.str()) << '|';
    191     }
    192     Out << "<o>\" shape=\"record\" ];\n";
    193 
    194     // Add edges.
    195     for (MCBasicBlock::succ_iterator si = i->second.succ_begin(),
    196         se = i->second.succ_end(); si != se; ++si)
    197       Out << i->first << ":o -> " << *si <<":a\n";
    198   }
    199   Out << "}\n";
    200 }
    201 
    202 static void getSectionsAndSymbols(const macho::Header &Header,
    203                                   MachOObjectFile *MachOObj,
    204                              InMemoryStruct<macho::SymtabLoadCommand> *SymtabLC,
    205                                   std::vector<SectionRef> &Sections,
    206                                   std::vector<SymbolRef> &Symbols,
    207                                   SmallVectorImpl<uint64_t> &FoundFns) {
    208   error_code ec;
    209   for (symbol_iterator SI = MachOObj->begin_symbols(),
    210        SE = MachOObj->end_symbols(); SI != SE; SI.increment(ec))
    211     Symbols.push_back(*SI);
    212 
    213   for (section_iterator SI = MachOObj->begin_sections(),
    214        SE = MachOObj->end_sections(); SI != SE; SI.increment(ec)) {
    215     SectionRef SR = *SI;
    216     StringRef SectName;
    217     SR.getName(SectName);
    218     Sections.push_back(*SI);
    219   }
    220 
    221   for (unsigned i = 0; i != Header.NumLoadCommands; ++i) {
    222     const MachOObject::LoadCommandInfo &LCI =
    223        MachOObj->getObject()->getLoadCommandInfo(i);
    224     if (LCI.Command.Type == macho::LCT_FunctionStarts) {
    225       // We found a function starts segment, parse the addresses for later
    226       // consumption.
    227       InMemoryStruct<macho::LinkeditDataLoadCommand> LLC;
    228       MachOObj->getObject()->ReadLinkeditDataLoadCommand(LCI, LLC);
    229 
    230       MachOObj->getObject()->ReadULEB128s(LLC->DataOffset, FoundFns);
    231     }
    232   }
    233 }
    234 
    235 void llvm::DisassembleInputMachO(StringRef Filename) {
    236   OwningPtr<MemoryBuffer> Buff;
    237 
    238   if (error_code ec = MemoryBuffer::getFileOrSTDIN(Filename, Buff)) {
    239     errs() << "llvm-objdump: " << Filename << ": " << ec.message() << "\n";
    240     return;
    241   }
    242 
    243   OwningPtr<MachOObjectFile> MachOOF(static_cast<MachOObjectFile*>(
    244         ObjectFile::createMachOObjectFile(Buff.take())));
    245   MachOObject *MachOObj = MachOOF->getObject();
    246 
    247   const Target *TheTarget = GetTarget(MachOObj);
    248   if (!TheTarget) {
    249     // GetTarget prints out stuff.
    250     return;
    251   }
    252   OwningPtr<const MCInstrInfo> InstrInfo(TheTarget->createMCInstrInfo());
    253   OwningPtr<MCInstrAnalysis>
    254     InstrAnalysis(TheTarget->createMCInstrAnalysis(InstrInfo.get()));
    255 
    256   // Set up disassembler.
    257   OwningPtr<const MCAsmInfo> AsmInfo(TheTarget->createMCAsmInfo(TripleName));
    258   OwningPtr<const MCSubtargetInfo>
    259     STI(TheTarget->createMCSubtargetInfo(TripleName, "", ""));
    260   OwningPtr<const MCDisassembler> DisAsm(TheTarget->createMCDisassembler(*STI));
    261   OwningPtr<const MCRegisterInfo> MRI(TheTarget->createMCRegInfo(TripleName));
    262   int AsmPrinterVariant = AsmInfo->getAssemblerDialect();
    263   OwningPtr<MCInstPrinter>
    264     IP(TheTarget->createMCInstPrinter(AsmPrinterVariant, *AsmInfo, *InstrInfo,
    265                                       *MRI, *STI));
    266 
    267   if (!InstrAnalysis || !AsmInfo || !STI || !DisAsm || !IP) {
    268     errs() << "error: couldn't initialize disassembler for target "
    269            << TripleName << '\n';
    270     return;
    271   }
    272 
    273   outs() << '\n' << Filename << ":\n\n";
    274 
    275   const macho::Header &Header = MachOObj->getHeader();
    276 
    277   const MachOObject::LoadCommandInfo *SymtabLCI = 0;
    278   // First, find the symbol table segment.
    279   for (unsigned i = 0; i != Header.NumLoadCommands; ++i) {
    280     const MachOObject::LoadCommandInfo &LCI = MachOObj->getLoadCommandInfo(i);
    281     if (LCI.Command.Type == macho::LCT_Symtab) {
    282       SymtabLCI = &LCI;
    283       break;
    284     }
    285   }
    286 
    287   // Read and register the symbol table data.
    288   InMemoryStruct<macho::SymtabLoadCommand> SymtabLC;
    289   if (SymtabLCI) {
    290     MachOObj->ReadSymtabLoadCommand(*SymtabLCI, SymtabLC);
    291     MachOObj->RegisterStringTable(*SymtabLC);
    292   }
    293 
    294   std::vector<SectionRef> Sections;
    295   std::vector<SymbolRef> Symbols;
    296   SmallVector<uint64_t, 8> FoundFns;
    297 
    298   getSectionsAndSymbols(Header, MachOOF.get(), &SymtabLC, Sections, Symbols,
    299                         FoundFns);
    300 
    301   // Make a copy of the unsorted symbol list. FIXME: duplication
    302   std::vector<SymbolRef> UnsortedSymbols(Symbols);
    303   // Sort the symbols by address, just in case they didn't come in that way.
    304   std::sort(Symbols.begin(), Symbols.end(), SymbolSorter());
    305 
    306 #ifndef NDEBUG
    307   raw_ostream &DebugOut = DebugFlag ? dbgs() : nulls();
    308 #else
    309   raw_ostream &DebugOut = nulls();
    310 #endif
    311 
    312   StringRef DebugAbbrevSection, DebugInfoSection, DebugArangesSection,
    313             DebugLineSection, DebugStrSection;
    314   OwningPtr<DIContext> diContext;
    315   OwningPtr<MachOObjectFile> DSYMObj;
    316   MachOObject *DbgInfoObj = MachOObj;
    317   // Try to find debug info and set up the DIContext for it.
    318   if (UseDbg) {
    319     ArrayRef<SectionRef> DebugSections = Sections;
    320     std::vector<SectionRef> DSYMSections;
    321 
    322     // A separate DSym file path was specified, parse it as a macho file,
    323     // get the sections and supply it to the section name parsing machinery.
    324     if (!DSYMFile.empty()) {
    325       OwningPtr<MemoryBuffer> Buf;
    326       if (error_code ec = MemoryBuffer::getFileOrSTDIN(DSYMFile.c_str(), Buf)) {
    327         errs() << "llvm-objdump: " << Filename << ": " << ec.message() << '\n';
    328         return;
    329       }
    330       DSYMObj.reset(static_cast<MachOObjectFile*>(
    331             ObjectFile::createMachOObjectFile(Buf.take())));
    332       const macho::Header &Header = DSYMObj->getObject()->getHeader();
    333 
    334       std::vector<SymbolRef> Symbols;
    335       SmallVector<uint64_t, 8> FoundFns;
    336       getSectionsAndSymbols(Header, DSYMObj.get(), 0, DSYMSections, Symbols,
    337                             FoundFns);
    338       DebugSections = DSYMSections;
    339       DbgInfoObj = DSYMObj.get()->getObject();
    340     }
    341 
    342     // Find the named debug info sections.
    343     for (unsigned SectIdx = 0; SectIdx != DebugSections.size(); SectIdx++) {
    344       StringRef SectName;
    345       if (!DebugSections[SectIdx].getName(SectName)) {
    346         if (SectName.equals("__DWARF,__debug_abbrev"))
    347           DebugSections[SectIdx].getContents(DebugAbbrevSection);
    348         else if (SectName.equals("__DWARF,__debug_info"))
    349           DebugSections[SectIdx].getContents(DebugInfoSection);
    350         else if (SectName.equals("__DWARF,__debug_aranges"))
    351           DebugSections[SectIdx].getContents(DebugArangesSection);
    352         else if (SectName.equals("__DWARF,__debug_line"))
    353           DebugSections[SectIdx].getContents(DebugLineSection);
    354         else if (SectName.equals("__DWARF,__debug_str"))
    355           DebugSections[SectIdx].getContents(DebugStrSection);
    356       }
    357     }
    358 
    359     // Setup the DIContext.
    360     diContext.reset(DIContext::getDWARFContext(DbgInfoObj->isLittleEndian(),
    361                                                DebugInfoSection,
    362                                                DebugAbbrevSection,
    363                                                DebugArangesSection,
    364                                                DebugLineSection,
    365                                                DebugStrSection));
    366   }
    367 
    368   FunctionMapTy FunctionMap;
    369   FunctionListTy Functions;
    370 
    371   for (unsigned SectIdx = 0; SectIdx != Sections.size(); SectIdx++) {
    372     StringRef SectName;
    373     if (Sections[SectIdx].getName(SectName) ||
    374         SectName.compare("__TEXT,__text"))
    375       continue; // Skip non-text sections
    376 
    377     // Insert the functions from the function starts segment into our map.
    378     uint64_t VMAddr;
    379     Sections[SectIdx].getAddress(VMAddr);
    380     for (unsigned i = 0, e = FoundFns.size(); i != e; ++i) {
    381       StringRef SectBegin;
    382       Sections[SectIdx].getContents(SectBegin);
    383       uint64_t Offset = (uint64_t)SectBegin.data();
    384       FunctionMap.insert(std::make_pair(VMAddr + FoundFns[i]-Offset,
    385                                         (MCFunction*)0));
    386     }
    387 
    388     StringRef Bytes;
    389     Sections[SectIdx].getContents(Bytes);
    390     StringRefMemoryObject memoryObject(Bytes);
    391     bool symbolTableWorked = false;
    392 
    393     // Parse relocations.
    394     std::vector<std::pair<uint64_t, SymbolRef> > Relocs;
    395     error_code ec;
    396     for (relocation_iterator RI = Sections[SectIdx].begin_relocations(),
    397          RE = Sections[SectIdx].end_relocations(); RI != RE; RI.increment(ec)) {
    398       uint64_t RelocOffset, SectionAddress;
    399       RI->getAddress(RelocOffset);
    400       Sections[SectIdx].getAddress(SectionAddress);
    401       RelocOffset -= SectionAddress;
    402 
    403       SymbolRef RelocSym;
    404       RI->getSymbol(RelocSym);
    405 
    406       Relocs.push_back(std::make_pair(RelocOffset, RelocSym));
    407     }
    408     array_pod_sort(Relocs.begin(), Relocs.end());
    409 
    410     // Disassemble symbol by symbol.
    411     for (unsigned SymIdx = 0; SymIdx != Symbols.size(); SymIdx++) {
    412       StringRef SymName;
    413       Symbols[SymIdx].getName(SymName);
    414 
    415       SymbolRef::Type ST;
    416       Symbols[SymIdx].getType(ST);
    417       if (ST != SymbolRef::ST_Function)
    418         continue;
    419 
    420       // Make sure the symbol is defined in this section.
    421       bool containsSym = false;
    422       Sections[SectIdx].containsSymbol(Symbols[SymIdx], containsSym);
    423       if (!containsSym)
    424         continue;
    425 
    426       // Start at the address of the symbol relative to the section's address.
    427       uint64_t SectionAddress = 0;
    428       uint64_t Start = 0;
    429       Sections[SectIdx].getAddress(SectionAddress);
    430       Symbols[SymIdx].getAddress(Start);
    431       Start -= SectionAddress;
    432 
    433       // Stop disassembling either at the beginning of the next symbol or at
    434       // the end of the section.
    435       bool containsNextSym = false;
    436       uint64_t NextSym = 0;
    437       uint64_t NextSymIdx = SymIdx+1;
    438       while (Symbols.size() > NextSymIdx) {
    439         SymbolRef::Type NextSymType;
    440         Symbols[NextSymIdx].getType(NextSymType);
    441         if (NextSymType == SymbolRef::ST_Function) {
    442           Sections[SectIdx].containsSymbol(Symbols[NextSymIdx],
    443                                            containsNextSym);
    444           Symbols[NextSymIdx].getAddress(NextSym);
    445           NextSym -= SectionAddress;
    446           break;
    447         }
    448         ++NextSymIdx;
    449       }
    450 
    451       uint64_t SectSize;
    452       Sections[SectIdx].getSize(SectSize);
    453       uint64_t End = containsNextSym ?  NextSym : SectSize;
    454       uint64_t Size;
    455 
    456       symbolTableWorked = true;
    457 
    458       if (!CFG) {
    459         // Normal disassembly, print addresses, bytes and mnemonic form.
    460         StringRef SymName;
    461         Symbols[SymIdx].getName(SymName);
    462 
    463         outs() << SymName << ":\n";
    464         DILineInfo lastLine;
    465         for (uint64_t Index = Start; Index < End; Index += Size) {
    466           MCInst Inst;
    467 
    468           if (DisAsm->getInstruction(Inst, Size, memoryObject, Index,
    469                                      DebugOut, nulls())) {
    470             uint64_t SectAddress = 0;
    471             Sections[SectIdx].getAddress(SectAddress);
    472             outs() << format("%8" PRIx64 ":\t", SectAddress + Index);
    473 
    474             DumpBytes(StringRef(Bytes.data() + Index, Size));
    475             IP->printInst(&Inst, outs(), "");
    476 
    477             // Print debug info.
    478             if (diContext) {
    479               DILineInfo dli =
    480                 diContext->getLineInfoForAddress(SectAddress + Index);
    481               // Print valid line info if it changed.
    482               if (dli != lastLine && dli.getLine() != 0)
    483                 outs() << "\t## " << dli.getFileName() << ':'
    484                        << dli.getLine() << ':' << dli.getColumn();
    485               lastLine = dli;
    486             }
    487             outs() << "\n";
    488           } else {
    489             errs() << "llvm-objdump: warning: invalid instruction encoding\n";
    490             if (Size == 0)
    491               Size = 1; // skip illegible bytes
    492           }
    493         }
    494       } else {
    495         // Create CFG and use it for disassembly.
    496         StringRef SymName;
    497         Symbols[SymIdx].getName(SymName);
    498         createMCFunctionAndSaveCalls(
    499             SymName, DisAsm.get(), memoryObject, Start, End,
    500             InstrAnalysis.get(), Start, DebugOut, FunctionMap, Functions);
    501       }
    502     }
    503     if (!CFG && !symbolTableWorked) {
    504       // Reading the symbol table didn't work, disassemble the whole section.
    505       uint64_t SectAddress;
    506       Sections[SectIdx].getAddress(SectAddress);
    507       uint64_t SectSize;
    508       Sections[SectIdx].getSize(SectSize);
    509       uint64_t InstSize;
    510       for (uint64_t Index = 0; Index < SectSize; Index += InstSize) {
    511         MCInst Inst;
    512 
    513         if (DisAsm->getInstruction(Inst, InstSize, memoryObject, Index,
    514                                    DebugOut, nulls())) {
    515           outs() << format("%8" PRIx64 ":\t", SectAddress + Index);
    516           DumpBytes(StringRef(Bytes.data() + Index, InstSize));
    517           IP->printInst(&Inst, outs(), "");
    518           outs() << "\n";
    519         } else {
    520           errs() << "llvm-objdump: warning: invalid instruction encoding\n";
    521           if (InstSize == 0)
    522             InstSize = 1; // skip illegible bytes
    523         }
    524       }
    525     }
    526 
    527     if (CFG) {
    528       if (!symbolTableWorked) {
    529         // Reading the symbol table didn't work, create a big __TEXT symbol.
    530         uint64_t SectSize = 0, SectAddress = 0;
    531         Sections[SectIdx].getSize(SectSize);
    532         Sections[SectIdx].getAddress(SectAddress);
    533         createMCFunctionAndSaveCalls("__TEXT", DisAsm.get(), memoryObject,
    534                                      0, SectSize,
    535                                      InstrAnalysis.get(),
    536                                      SectAddress, DebugOut,
    537                                      FunctionMap, Functions);
    538       }
    539       for (std::map<uint64_t, MCFunction*>::iterator mi = FunctionMap.begin(),
    540            me = FunctionMap.end(); mi != me; ++mi)
    541         if (mi->second == 0) {
    542           // Create functions for the remaining callees we have gathered,
    543           // but we didn't find a name for them.
    544           uint64_t SectSize = 0;
    545           Sections[SectIdx].getSize(SectSize);
    546 
    547           SmallVector<uint64_t, 16> Calls;
    548           MCFunction f =
    549             MCFunction::createFunctionFromMC("unknown", DisAsm.get(),
    550                                              memoryObject, mi->first,
    551                                              SectSize,
    552                                              InstrAnalysis.get(), DebugOut,
    553                                              Calls);
    554           Functions.push_back(f);
    555           mi->second = &Functions.back();
    556           for (unsigned i = 0, e = Calls.size(); i != e; ++i) {
    557             std::pair<uint64_t, MCFunction*> p(Calls[i], (MCFunction*)0);
    558             if (FunctionMap.insert(p).second)
    559               mi = FunctionMap.begin();
    560           }
    561         }
    562 
    563       DenseSet<uint64_t> PrintedBlocks;
    564       for (unsigned ffi = 0, ffe = Functions.size(); ffi != ffe; ++ffi) {
    565         MCFunction &f = Functions[ffi];
    566         for (MCFunction::iterator fi = f.begin(), fe = f.end(); fi != fe; ++fi){
    567           if (!PrintedBlocks.insert(fi->first).second)
    568             continue; // We already printed this block.
    569 
    570           // We assume a block has predecessors when it's the first block after
    571           // a symbol.
    572           bool hasPreds = FunctionMap.find(fi->first) != FunctionMap.end();
    573 
    574           // See if this block has predecessors.
    575           // FIXME: Slow.
    576           for (MCFunction::iterator pi = f.begin(), pe = f.end(); pi != pe;
    577               ++pi)
    578             if (pi->second.contains(fi->first)) {
    579               hasPreds = true;
    580               break;
    581             }
    582 
    583           uint64_t SectSize = 0, SectAddress;
    584           Sections[SectIdx].getSize(SectSize);
    585           Sections[SectIdx].getAddress(SectAddress);
    586 
    587           // No predecessors, this is a data block. Print as .byte directives.
    588           if (!hasPreds) {
    589             uint64_t End = llvm::next(fi) == fe ? SectSize :
    590                                                   llvm::next(fi)->first;
    591             outs() << "# " << End-fi->first << " bytes of data:\n";
    592             for (unsigned pos = fi->first; pos != End; ++pos) {
    593               outs() << format("%8x:\t", SectAddress + pos);
    594               DumpBytes(StringRef(Bytes.data() + pos, 1));
    595               outs() << format("\t.byte 0x%02x\n", (uint8_t)Bytes[pos]);
    596             }
    597             continue;
    598           }
    599 
    600           if (fi->second.contains(fi->first)) // Print a header for simple loops
    601             outs() << "# Loop begin:\n";
    602 
    603           DILineInfo lastLine;
    604           // Walk over the instructions and print them.
    605           for (unsigned ii = 0, ie = fi->second.getInsts().size(); ii != ie;
    606                ++ii) {
    607             const MCDecodedInst &Inst = fi->second.getInsts()[ii];
    608 
    609             // If there's a symbol at this address, print its name.
    610             if (FunctionMap.find(SectAddress + Inst.Address) !=
    611                 FunctionMap.end())
    612               outs() << FunctionMap[SectAddress + Inst.Address]-> getName()
    613                      << ":\n";
    614 
    615             outs() << format("%8" PRIx64 ":\t", SectAddress + Inst.Address);
    616             DumpBytes(StringRef(Bytes.data() + Inst.Address, Inst.Size));
    617 
    618             if (fi->second.contains(fi->first)) // Indent simple loops.
    619               outs() << '\t';
    620 
    621             IP->printInst(&Inst.Inst, outs(), "");
    622 
    623             // Look for relocations inside this instructions, if there is one
    624             // print its target and additional information if available.
    625             for (unsigned j = 0; j != Relocs.size(); ++j)
    626               if (Relocs[j].first >= SectAddress + Inst.Address &&
    627                   Relocs[j].first < SectAddress + Inst.Address + Inst.Size) {
    628                 StringRef SymName;
    629                 uint64_t Addr;
    630                 Relocs[j].second.getAddress(Addr);
    631                 Relocs[j].second.getName(SymName);
    632 
    633                 outs() << "\t# " << SymName << ' ';
    634                 DumpAddress(Addr, Sections, MachOObj, outs());
    635               }
    636 
    637             // If this instructions contains an address, see if we can evaluate
    638             // it and print additional information.
    639             uint64_t targ = InstrAnalysis->evaluateBranch(Inst.Inst,
    640                                                           Inst.Address,
    641                                                           Inst.Size);
    642             if (targ != -1ULL)
    643               DumpAddress(targ, Sections, MachOObj, outs());
    644 
    645             // Print debug info.
    646             if (diContext) {
    647               DILineInfo dli =
    648                 diContext->getLineInfoForAddress(SectAddress + Inst.Address);
    649               // Print valid line info if it changed.
    650               if (dli != lastLine && dli.getLine() != 0)
    651                 outs() << "\t## " << dli.getFileName() << ':'
    652                        << dli.getLine() << ':' << dli.getColumn();
    653               lastLine = dli;
    654             }
    655 
    656             outs() << '\n';
    657           }
    658         }
    659 
    660         emitDOTFile((f.getName().str() + ".dot").c_str(), f, IP.get());
    661       }
    662     }
    663   }
    664 }
    665