1 //===-- macho-dump.cpp - Mach Object Dumping Tool -------------------------===// 2 // 3 // The LLVM Compiler Infrastructure 4 // 5 // This file is distributed under the University of Illinois Open Source 6 // License. See LICENSE.TXT for details. 7 // 8 //===----------------------------------------------------------------------===// 9 // 10 // This is a testing tool for use with the MC/Mach-O LLVM components. 11 // 12 //===----------------------------------------------------------------------===// 13 14 #include "llvm/Object/MachO.h" 15 #include "llvm/ADT/StringExtras.h" 16 #include "llvm/ADT/Twine.h" 17 #include "llvm/Support/Casting.h" 18 #include "llvm/Support/CommandLine.h" 19 #include "llvm/Support/Format.h" 20 #include "llvm/Support/ManagedStatic.h" 21 #include "llvm/Support/MemoryBuffer.h" 22 #include "llvm/Support/raw_ostream.h" 23 #include <system_error> 24 using namespace llvm; 25 using namespace llvm::object; 26 27 static cl::opt<std::string> 28 InputFile(cl::Positional, cl::desc("<input file>"), cl::init("-")); 29 30 static cl::opt<bool> 31 ShowSectionData("dump-section-data", cl::desc("Dump the contents of sections"), 32 cl::init(false)); 33 34 /// 35 36 static const char *ProgramName; 37 38 static void Message(const char *Type, const Twine &Msg) { 39 errs() << ProgramName << ": " << Type << ": " << Msg << "\n"; 40 } 41 42 static int Error(const Twine &Msg) { 43 Message("error", Msg); 44 return 1; 45 } 46 47 static void Warning(const Twine &Msg) { 48 Message("warning", Msg); 49 } 50 51 /// 52 53 static void DumpSegmentCommandData(StringRef Name, 54 uint64_t VMAddr, uint64_t VMSize, 55 uint64_t FileOffset, uint64_t FileSize, 56 uint32_t MaxProt, uint32_t InitProt, 57 uint32_t NumSections, uint32_t Flags) { 58 outs() << " ('segment_name', '"; 59 outs().write_escaped(Name, /*UseHexEscapes=*/true) << "')\n"; 60 outs() << " ('vm_addr', " << VMAddr << ")\n"; 61 outs() << " ('vm_size', " << VMSize << ")\n"; 62 outs() << " ('file_offset', " << FileOffset << ")\n"; 63 outs() << " ('file_size', " << FileSize << ")\n"; 64 outs() << " ('maxprot', " << MaxProt << ")\n"; 65 outs() << " ('initprot', " << InitProt << ")\n"; 66 outs() << " ('num_sections', " << NumSections << ")\n"; 67 outs() << " ('flags', " << Flags << ")\n"; 68 } 69 70 static int DumpSectionData(const MachOObjectFile &Obj, unsigned Index, 71 StringRef Name, 72 StringRef SegmentName, uint64_t Address, 73 uint64_t Size, uint32_t Offset, 74 uint32_t Align, uint32_t RelocationTableOffset, 75 uint32_t NumRelocationTableEntries, 76 uint32_t Flags, uint32_t Reserved1, 77 uint32_t Reserved2, uint64_t Reserved3 = ~0ULL) { 78 outs() << " # Section " << Index << "\n"; 79 outs() << " (('section_name', '"; 80 outs().write_escaped(Name, /*UseHexEscapes=*/true) << "')\n"; 81 outs() << " ('segment_name', '"; 82 outs().write_escaped(SegmentName, /*UseHexEscapes=*/true) << "')\n"; 83 outs() << " ('address', " << Address << ")\n"; 84 outs() << " ('size', " << Size << ")\n"; 85 outs() << " ('offset', " << Offset << ")\n"; 86 outs() << " ('alignment', " << Align << ")\n"; 87 outs() << " ('reloc_offset', " << RelocationTableOffset << ")\n"; 88 outs() << " ('num_reloc', " << NumRelocationTableEntries << ")\n"; 89 outs() << " ('flags', " << format("0x%x", Flags) << ")\n"; 90 outs() << " ('reserved1', " << Reserved1 << ")\n"; 91 outs() << " ('reserved2', " << Reserved2 << ")\n"; 92 if (Reserved3 != ~0ULL) 93 outs() << " ('reserved3', " << Reserved3 << ")\n"; 94 outs() << " ),\n"; 95 96 // Dump the relocation entries. 97 outs() << " ('_relocations', [\n"; 98 unsigned RelNum = 0; 99 for (relocation_iterator I = Obj.section_rel_begin(Index), 100 E = Obj.section_rel_end(Index); 101 I != E; ++I, ++RelNum) { 102 MachO::any_relocation_info RE = Obj.getRelocation(I->getRawDataRefImpl()); 103 outs() << " # Relocation " << RelNum << "\n"; 104 outs() << " (('word-0', " << format("0x%x", RE.r_word0) << "),\n"; 105 outs() << " ('word-1', " << format("0x%x", RE.r_word1) << ")),\n"; 106 } 107 outs() << " ])\n"; 108 109 // Dump the section data, if requested. 110 if (ShowSectionData) { 111 outs() << " ('_section_data', '"; 112 StringRef Data = Obj.getData().substr(Offset, Size); 113 for (unsigned i = 0; i != Data.size(); ++i) { 114 if (i && (i % 4) == 0) 115 outs() << ' '; 116 outs() << hexdigit((Data[i] >> 4) & 0xF, /*LowerCase=*/true); 117 outs() << hexdigit((Data[i] >> 0) & 0xF, /*LowerCase=*/true); 118 } 119 outs() << "')\n"; 120 } 121 122 return 0; 123 } 124 125 static int DumpSegmentCommand(const MachOObjectFile &Obj, 126 const MachOObjectFile::LoadCommandInfo &LCI) { 127 MachO::segment_command SLC = Obj.getSegmentLoadCommand(LCI); 128 129 DumpSegmentCommandData(StringRef(SLC.segname, 16), SLC.vmaddr, 130 SLC.vmsize, SLC.fileoff, SLC.filesize, 131 SLC.maxprot, SLC.initprot, SLC.nsects, SLC.flags); 132 133 // Dump the sections. 134 outs() << " ('sections', [\n"; 135 for (unsigned i = 0; i != SLC.nsects; ++i) { 136 MachO::section Sect = Obj.getSection(LCI, i); 137 DumpSectionData(Obj, i, StringRef(Sect.sectname, 16), 138 StringRef(Sect.segname, 16), Sect.addr, 139 Sect.size, Sect.offset, Sect.align, 140 Sect.reloff, Sect.nreloc, Sect.flags, 141 Sect.reserved1, Sect.reserved2); 142 } 143 outs() << " ])\n"; 144 145 return 0; 146 } 147 148 static int DumpSegment64Command(const MachOObjectFile &Obj, 149 const MachOObjectFile::LoadCommandInfo &LCI) { 150 MachO::segment_command_64 SLC = Obj.getSegment64LoadCommand(LCI); 151 DumpSegmentCommandData(StringRef(SLC.segname, 16), SLC.vmaddr, 152 SLC.vmsize, SLC.fileoff, SLC.filesize, 153 SLC.maxprot, SLC.initprot, SLC.nsects, SLC.flags); 154 155 // Dump the sections. 156 outs() << " ('sections', [\n"; 157 for (unsigned i = 0; i != SLC.nsects; ++i) { 158 MachO::section_64 Sect = Obj.getSection64(LCI, i); 159 160 DumpSectionData(Obj, i, StringRef(Sect.sectname, 16), 161 StringRef(Sect.segname, 16), Sect.addr, 162 Sect.size, Sect.offset, Sect.align, 163 Sect.reloff, Sect.nreloc, Sect.flags, 164 Sect.reserved1, Sect.reserved2, 165 Sect.reserved3); 166 } 167 outs() << " ])\n"; 168 169 return 0; 170 } 171 172 static void DumpSymbolTableEntryData(const MachOObjectFile &Obj, 173 unsigned Index, uint32_t StringIndex, 174 uint8_t Type, uint8_t SectionIndex, 175 uint16_t Flags, uint64_t Value, 176 StringRef StringTable) { 177 const char *Name = &StringTable.data()[StringIndex]; 178 outs() << " # Symbol " << Index << "\n"; 179 outs() << " (('n_strx', " << StringIndex << ")\n"; 180 outs() << " ('n_type', " << format("0x%x", Type) << ")\n"; 181 outs() << " ('n_sect', " << uint32_t(SectionIndex) << ")\n"; 182 outs() << " ('n_desc', " << Flags << ")\n"; 183 outs() << " ('n_value', " << Value << ")\n"; 184 outs() << " ('_string', '" << Name << "')\n"; 185 outs() << " ),\n"; 186 } 187 188 static int DumpSymtabCommand(const MachOObjectFile &Obj) { 189 MachO::symtab_command SLC = Obj.getSymtabLoadCommand(); 190 191 outs() << " ('symoff', " << SLC.symoff << ")\n"; 192 outs() << " ('nsyms', " << SLC.nsyms << ")\n"; 193 outs() << " ('stroff', " << SLC.stroff << ")\n"; 194 outs() << " ('strsize', " << SLC.strsize << ")\n"; 195 196 // Dump the string data. 197 outs() << " ('_string_data', '"; 198 StringRef StringTable = Obj.getStringTableData(); 199 outs().write_escaped(StringTable, 200 /*UseHexEscapes=*/true) << "')\n"; 201 202 // Dump the symbol table. 203 outs() << " ('_symbols', [\n"; 204 unsigned SymNum = 0; 205 for (const SymbolRef &Symbol : Obj.symbols()) { 206 DataRefImpl DRI = Symbol.getRawDataRefImpl(); 207 if (Obj.is64Bit()) { 208 MachO::nlist_64 STE = Obj.getSymbol64TableEntry(DRI); 209 DumpSymbolTableEntryData(Obj, SymNum, STE.n_strx, STE.n_type, 210 STE.n_sect, STE.n_desc, STE.n_value, 211 StringTable); 212 } else { 213 MachO::nlist STE = Obj.getSymbolTableEntry(DRI); 214 DumpSymbolTableEntryData(Obj, SymNum, STE.n_strx, STE.n_type, 215 STE.n_sect, STE.n_desc, STE.n_value, 216 StringTable); 217 } 218 SymNum++; 219 } 220 outs() << " ])\n"; 221 222 return 0; 223 } 224 225 static int DumpDysymtabCommand(const MachOObjectFile &Obj) { 226 MachO::dysymtab_command DLC = Obj.getDysymtabLoadCommand(); 227 228 outs() << " ('ilocalsym', " << DLC.ilocalsym << ")\n"; 229 outs() << " ('nlocalsym', " << DLC.nlocalsym << ")\n"; 230 outs() << " ('iextdefsym', " << DLC.iextdefsym << ")\n"; 231 outs() << " ('nextdefsym', " << DLC.nextdefsym << ")\n"; 232 outs() << " ('iundefsym', " << DLC.iundefsym << ")\n"; 233 outs() << " ('nundefsym', " << DLC.nundefsym << ")\n"; 234 outs() << " ('tocoff', " << DLC.tocoff << ")\n"; 235 outs() << " ('ntoc', " << DLC.ntoc << ")\n"; 236 outs() << " ('modtaboff', " << DLC.modtaboff << ")\n"; 237 outs() << " ('nmodtab', " << DLC.nmodtab << ")\n"; 238 outs() << " ('extrefsymoff', " << DLC.extrefsymoff << ")\n"; 239 outs() << " ('nextrefsyms', " << DLC.nextrefsyms << ")\n"; 240 outs() << " ('indirectsymoff', " << DLC.indirectsymoff << ")\n"; 241 outs() << " ('nindirectsyms', " << DLC.nindirectsyms << ")\n"; 242 outs() << " ('extreloff', " << DLC.extreloff << ")\n"; 243 outs() << " ('nextrel', " << DLC.nextrel << ")\n"; 244 outs() << " ('locreloff', " << DLC.locreloff << ")\n"; 245 outs() << " ('nlocrel', " << DLC.nlocrel << ")\n"; 246 247 // Dump the indirect symbol table. 248 outs() << " ('_indirect_symbols', [\n"; 249 for (unsigned i = 0; i != DLC.nindirectsyms; ++i) { 250 uint32_t ISTE = Obj.getIndirectSymbolTableEntry(DLC, i); 251 outs() << " # Indirect Symbol " << i << "\n"; 252 outs() << " (('symbol_index', " << format("0x%x", ISTE) << "),),\n"; 253 } 254 outs() << " ])\n"; 255 256 return 0; 257 } 258 259 static int 260 DumpLinkeditDataCommand(const MachOObjectFile &Obj, 261 const MachOObjectFile::LoadCommandInfo &LCI) { 262 MachO::linkedit_data_command LLC = Obj.getLinkeditDataLoadCommand(LCI); 263 outs() << " ('dataoff', " << LLC.dataoff << ")\n" 264 << " ('datasize', " << LLC.datasize << ")\n" 265 << " ('_addresses', [\n"; 266 267 SmallVector<uint64_t, 8> Addresses; 268 Obj.ReadULEB128s(LLC.dataoff, Addresses); 269 for (unsigned i = 0, e = Addresses.size(); i != e; ++i) 270 outs() << " # Address " << i << '\n' 271 << " ('address', " << format("0x%x", Addresses[i]) << "),\n"; 272 273 outs() << " ])\n"; 274 275 return 0; 276 } 277 278 static int 279 DumpDataInCodeDataCommand(const MachOObjectFile &Obj, 280 const MachOObjectFile::LoadCommandInfo &LCI) { 281 MachO::linkedit_data_command LLC = Obj.getLinkeditDataLoadCommand(LCI); 282 outs() << " ('dataoff', " << LLC.dataoff << ")\n" 283 << " ('datasize', " << LLC.datasize << ")\n" 284 << " ('_data_regions', [\n"; 285 286 unsigned NumRegions = LLC.datasize / sizeof(MachO::data_in_code_entry); 287 for (unsigned i = 0; i < NumRegions; ++i) { 288 MachO::data_in_code_entry DICE= Obj.getDataInCodeTableEntry(LLC.dataoff, i); 289 outs() << " # DICE " << i << "\n" 290 << " ('offset', " << DICE.offset << ")\n" 291 << " ('length', " << DICE.length << ")\n" 292 << " ('kind', " << DICE.kind << ")\n"; 293 } 294 295 outs() <<" ])\n"; 296 297 return 0; 298 } 299 300 static int 301 DumpLinkerOptionsCommand(const MachOObjectFile &Obj, 302 const MachOObjectFile::LoadCommandInfo &LCI) { 303 MachO::linker_options_command LOLC = Obj.getLinkerOptionsLoadCommand(LCI); 304 outs() << " ('count', " << LOLC.count << ")\n" 305 << " ('_strings', [\n"; 306 307 uint64_t DataSize = LOLC.cmdsize - sizeof(MachO::linker_options_command); 308 const char *P = LCI.Ptr + sizeof(MachO::linker_options_command); 309 StringRef Data(P, DataSize); 310 for (unsigned i = 0; i != LOLC.count; ++i) { 311 std::pair<StringRef,StringRef> Split = Data.split('\0'); 312 outs() << "\t\""; 313 outs().write_escaped(Split.first); 314 outs() << "\",\n"; 315 Data = Split.second; 316 } 317 outs() <<" ])\n"; 318 319 return 0; 320 } 321 322 static int 323 DumpVersionMin(const MachOObjectFile &Obj, 324 const MachOObjectFile::LoadCommandInfo &LCI) { 325 MachO::version_min_command VMLC = Obj.getVersionMinLoadCommand(LCI); 326 outs() << " ('version, " << VMLC.version << ")\n" 327 << " ('reserved, " << VMLC.reserved << ")\n"; 328 return 0; 329 } 330 331 static int 332 DumpDylibID(const MachOObjectFile &Obj, 333 const MachOObjectFile::LoadCommandInfo &LCI) { 334 MachO::dylib_command DLLC = Obj.getDylibIDLoadCommand(LCI); 335 outs() << " ('install_name', '" << LCI.Ptr + DLLC.dylib.name << "')\n" 336 << " ('timestamp, " << DLLC.dylib.timestamp << ")\n" 337 << " ('cur_version, " << DLLC.dylib.current_version << ")\n" 338 << " ('compat_version, " << DLLC.dylib.compatibility_version << ")\n"; 339 return 0; 340 } 341 342 static int DumpLoadCommand(const MachOObjectFile &Obj, 343 MachOObjectFile::LoadCommandInfo &LCI) { 344 switch (LCI.C.cmd) { 345 case MachO::LC_SEGMENT: 346 return DumpSegmentCommand(Obj, LCI); 347 case MachO::LC_SEGMENT_64: 348 return DumpSegment64Command(Obj, LCI); 349 case MachO::LC_SYMTAB: 350 return DumpSymtabCommand(Obj); 351 case MachO::LC_DYSYMTAB: 352 return DumpDysymtabCommand(Obj); 353 case MachO::LC_CODE_SIGNATURE: 354 case MachO::LC_SEGMENT_SPLIT_INFO: 355 case MachO::LC_FUNCTION_STARTS: 356 return DumpLinkeditDataCommand(Obj, LCI); 357 case MachO::LC_DATA_IN_CODE: 358 return DumpDataInCodeDataCommand(Obj, LCI); 359 case MachO::LC_LINKER_OPTIONS: 360 return DumpLinkerOptionsCommand(Obj, LCI); 361 case MachO::LC_VERSION_MIN_IPHONEOS: 362 case MachO::LC_VERSION_MIN_MACOSX: 363 return DumpVersionMin(Obj, LCI); 364 case MachO::LC_ID_DYLIB: 365 return DumpDylibID(Obj, LCI); 366 default: 367 Warning("unknown load command: " + Twine(LCI.C.cmd)); 368 return 0; 369 } 370 } 371 372 373 static int DumpLoadCommand(const MachOObjectFile &Obj, unsigned Index, 374 MachOObjectFile::LoadCommandInfo &LCI) { 375 outs() << " # Load Command " << Index << "\n" 376 << " (('command', " << LCI.C.cmd << ")\n" 377 << " ('size', " << LCI.C.cmdsize << ")\n"; 378 int Res = DumpLoadCommand(Obj, LCI); 379 outs() << " ),\n"; 380 return Res; 381 } 382 383 static void printHeader(const MachOObjectFile *Obj, 384 const MachO::mach_header &Header) { 385 outs() << "('cputype', " << Header.cputype << ")\n"; 386 outs() << "('cpusubtype', " << Header.cpusubtype << ")\n"; 387 outs() << "('filetype', " << Header.filetype << ")\n"; 388 outs() << "('num_load_commands', " << Header.ncmds << ")\n"; 389 outs() << "('load_commands_size', " << Header.sizeofcmds << ")\n"; 390 outs() << "('flag', " << Header.flags << ")\n"; 391 392 // Print extended header if 64-bit. 393 if (Obj->is64Bit()) { 394 const MachO::mach_header_64 *Header64 = 395 reinterpret_cast<const MachO::mach_header_64 *>(&Header); 396 outs() << "('reserved', " << Header64->reserved << ")\n"; 397 } 398 } 399 400 int main(int argc, char **argv) { 401 ProgramName = argv[0]; 402 llvm_shutdown_obj Y; // Call llvm_shutdown() on exit. 403 404 cl::ParseCommandLineOptions(argc, argv, "llvm Mach-O dumping tool\n"); 405 406 ErrorOr<Binary *> BinaryOrErr = createBinary(InputFile); 407 if (std::error_code EC = BinaryOrErr.getError()) 408 return Error("unable to read input: '" + EC.message() + "'"); 409 std::unique_ptr<Binary> Binary(BinaryOrErr.get()); 410 411 const MachOObjectFile *InputObject = dyn_cast<MachOObjectFile>(Binary.get()); 412 if (!InputObject) 413 return Error("Not a MachO object"); 414 415 // Print the header 416 MachO::mach_header_64 Header64; 417 MachO::mach_header *Header = reinterpret_cast<MachO::mach_header*>(&Header64); 418 if (InputObject->is64Bit()) 419 Header64 = InputObject->getHeader64(); 420 else 421 *Header = InputObject->getHeader(); 422 printHeader(InputObject, *Header); 423 424 // Print the load commands. 425 int Res = 0; 426 MachOObjectFile::LoadCommandInfo Command = 427 InputObject->getFirstLoadCommandInfo(); 428 outs() << "('load_commands', [\n"; 429 for (unsigned i = 0; ; ++i) { 430 if (DumpLoadCommand(*InputObject, i, Command)) 431 break; 432 433 if (i == Header->ncmds - 1) 434 break; 435 Command = InputObject->getNextLoadCommandInfo(Command); 436 } 437 outs() << "])\n"; 438 439 return Res; 440 } 441