1 //===-- llvm-nm.cpp - Symbol table dumping utility for llvm ---------------===// 2 // 3 // The LLVM Compiler Infrastructure 4 // 5 // This file is distributed under the University of Illinois Open Source 6 // License. See LICENSE.TXT for details. 7 // 8 //===----------------------------------------------------------------------===// 9 // 10 // This program is a utility that works like traditional Unix "nm", that is, it 11 // prints out the names of symbols in a bitcode or object file, along with some 12 // information about each symbol. 13 // 14 // This "nm" supports many of the features of GNU "nm", including its different 15 // output formats. 16 // 17 //===----------------------------------------------------------------------===// 18 19 #include "llvm/IR/LLVMContext.h" 20 #include "llvm/Bitcode/ReaderWriter.h" 21 #include "llvm/IR/Module.h" 22 #include "llvm/Object/Archive.h" 23 #include "llvm/Object/MachOUniversal.h" 24 #include "llvm/Object/ObjectFile.h" 25 #include "llvm/Support/CommandLine.h" 26 #include "llvm/Support/FileSystem.h" 27 #include "llvm/Support/Format.h" 28 #include "llvm/Support/ManagedStatic.h" 29 #include "llvm/Support/MemoryBuffer.h" 30 #include "llvm/Support/PrettyStackTrace.h" 31 #include "llvm/Support/Program.h" 32 #include "llvm/Support/Signals.h" 33 #include "llvm/Support/raw_ostream.h" 34 #include "llvm/Support/system_error.h" 35 #include <algorithm> 36 #include <cctype> 37 #include <cerrno> 38 #include <cstring> 39 #include <vector> 40 using namespace llvm; 41 using namespace object; 42 43 namespace { 44 enum OutputFormatTy { bsd, sysv, posix }; 45 cl::opt<OutputFormatTy> 46 OutputFormat("format", 47 cl::desc("Specify output format"), 48 cl::values(clEnumVal(bsd, "BSD format"), 49 clEnumVal(sysv, "System V format"), 50 clEnumVal(posix, "POSIX.2 format"), 51 clEnumValEnd), cl::init(bsd)); 52 cl::alias OutputFormat2("f", cl::desc("Alias for --format"), 53 cl::aliasopt(OutputFormat)); 54 55 cl::list<std::string> 56 InputFilenames(cl::Positional, cl::desc("<input bitcode files>"), 57 cl::ZeroOrMore); 58 59 cl::opt<bool> UndefinedOnly("undefined-only", 60 cl::desc("Show only undefined symbols")); 61 cl::alias UndefinedOnly2("u", cl::desc("Alias for --undefined-only"), 62 cl::aliasopt(UndefinedOnly)); 63 64 cl::opt<bool> DynamicSyms("dynamic", 65 cl::desc("Display the dynamic symbols instead " 66 "of normal symbols.")); 67 cl::alias DynamicSyms2("D", cl::desc("Alias for --dynamic"), 68 cl::aliasopt(DynamicSyms)); 69 70 cl::opt<bool> DefinedOnly("defined-only", 71 cl::desc("Show only defined symbols")); 72 73 cl::opt<bool> ExternalOnly("extern-only", 74 cl::desc("Show only external symbols")); 75 cl::alias ExternalOnly2("g", cl::desc("Alias for --extern-only"), 76 cl::aliasopt(ExternalOnly)); 77 78 cl::opt<bool> BSDFormat("B", cl::desc("Alias for --format=bsd")); 79 cl::opt<bool> POSIXFormat("P", cl::desc("Alias for --format=posix")); 80 81 cl::opt<bool> PrintFileName("print-file-name", 82 cl::desc("Precede each symbol with the object file it came from")); 83 84 cl::alias PrintFileNameA("A", cl::desc("Alias for --print-file-name"), 85 cl::aliasopt(PrintFileName)); 86 cl::alias PrintFileNameo("o", cl::desc("Alias for --print-file-name"), 87 cl::aliasopt(PrintFileName)); 88 89 cl::opt<bool> DebugSyms("debug-syms", 90 cl::desc("Show all symbols, even debugger only")); 91 cl::alias DebugSymsa("a", cl::desc("Alias for --debug-syms"), 92 cl::aliasopt(DebugSyms)); 93 94 cl::opt<bool> NumericSort("numeric-sort", 95 cl::desc("Sort symbols by address")); 96 cl::alias NumericSortn("n", cl::desc("Alias for --numeric-sort"), 97 cl::aliasopt(NumericSort)); 98 cl::alias NumericSortv("v", cl::desc("Alias for --numeric-sort"), 99 cl::aliasopt(NumericSort)); 100 101 cl::opt<bool> NoSort("no-sort", 102 cl::desc("Show symbols in order encountered")); 103 cl::alias NoSortp("p", cl::desc("Alias for --no-sort"), 104 cl::aliasopt(NoSort)); 105 106 cl::opt<bool> PrintSize("print-size", 107 cl::desc("Show symbol size instead of address")); 108 cl::alias PrintSizeS("S", cl::desc("Alias for --print-size"), 109 cl::aliasopt(PrintSize)); 110 111 cl::opt<bool> SizeSort("size-sort", cl::desc("Sort symbols by size")); 112 113 cl::opt<bool> WithoutAliases("without-aliases", cl::Hidden, 114 cl::desc("Exclude aliases from output")); 115 116 cl::opt<bool> ArchiveMap("print-armap", 117 cl::desc("Print the archive map")); 118 cl::alias ArchiveMaps("s", cl::desc("Alias for --print-armap"), 119 cl::aliasopt(ArchiveMap)); 120 bool PrintAddress = true; 121 122 bool MultipleFiles = false; 123 124 bool HadError = false; 125 126 std::string ToolName; 127 } 128 129 130 static void error(Twine message, Twine path = Twine()) { 131 errs() << ToolName << ": " << path << ": " << message << ".\n"; 132 } 133 134 static bool error(error_code ec, Twine path = Twine()) { 135 if (ec) { 136 error(ec.message(), path); 137 HadError = true; 138 return true; 139 } 140 return false; 141 } 142 143 namespace { 144 struct NMSymbol { 145 uint64_t Address; 146 uint64_t Size; 147 char TypeChar; 148 StringRef Name; 149 }; 150 151 static bool CompareSymbolAddress(const NMSymbol &a, const NMSymbol &b) { 152 if (a.Address < b.Address) 153 return true; 154 else if (a.Address == b.Address && a.Name < b.Name) 155 return true; 156 else if (a.Address == b.Address && a.Name == b.Name && a.Size < b.Size) 157 return true; 158 else 159 return false; 160 161 } 162 163 static bool CompareSymbolSize(const NMSymbol &a, const NMSymbol &b) { 164 if (a.Size < b.Size) 165 return true; 166 else if (a.Size == b.Size && a.Name < b.Name) 167 return true; 168 else if (a.Size == b.Size && a.Name == b.Name && a.Address < b.Address) 169 return true; 170 else 171 return false; 172 } 173 174 static bool CompareSymbolName(const NMSymbol &a, const NMSymbol &b) { 175 if (a.Name < b.Name) 176 return true; 177 else if (a.Name == b.Name && a.Size < b.Size) 178 return true; 179 else if (a.Name == b.Name && a.Size == b.Size && a.Address < b.Address) 180 return true; 181 else 182 return false; 183 } 184 185 StringRef CurrentFilename; 186 typedef std::vector<NMSymbol> SymbolListT; 187 SymbolListT SymbolList; 188 } 189 190 static void SortAndPrintSymbolList() { 191 if (!NoSort) { 192 if (NumericSort) 193 std::sort(SymbolList.begin(), SymbolList.end(), CompareSymbolAddress); 194 else if (SizeSort) 195 std::sort(SymbolList.begin(), SymbolList.end(), CompareSymbolSize); 196 else 197 std::sort(SymbolList.begin(), SymbolList.end(), CompareSymbolName); 198 } 199 200 if (OutputFormat == posix && MultipleFiles) { 201 outs() << '\n' << CurrentFilename << ":\n"; 202 } else if (OutputFormat == bsd && MultipleFiles) { 203 outs() << "\n" << CurrentFilename << ":\n"; 204 } else if (OutputFormat == sysv) { 205 outs() << "\n\nSymbols from " << CurrentFilename << ":\n\n" 206 << "Name Value Class Type" 207 << " Size Line Section\n"; 208 } 209 210 for (SymbolListT::iterator i = SymbolList.begin(), 211 e = SymbolList.end(); i != e; ++i) { 212 if ((i->TypeChar != 'U') && UndefinedOnly) 213 continue; 214 if ((i->TypeChar == 'U') && DefinedOnly) 215 continue; 216 if (SizeSort && !PrintAddress && i->Size == UnknownAddressOrSize) 217 continue; 218 219 char SymbolAddrStr[10] = ""; 220 char SymbolSizeStr[10] = ""; 221 222 if (OutputFormat == sysv || i->Address == object::UnknownAddressOrSize) 223 strcpy(SymbolAddrStr, " "); 224 if (OutputFormat == sysv) 225 strcpy(SymbolSizeStr, " "); 226 227 if (i->Address != object::UnknownAddressOrSize) 228 format("%08" PRIx64, i->Address).print(SymbolAddrStr, 229 sizeof(SymbolAddrStr)); 230 if (i->Size != object::UnknownAddressOrSize) 231 format("%08" PRIx64, i->Size).print(SymbolSizeStr, sizeof(SymbolSizeStr)); 232 233 if (OutputFormat == posix) { 234 outs() << i->Name << " " << i->TypeChar << " " 235 << SymbolAddrStr << SymbolSizeStr << "\n"; 236 } else if (OutputFormat == bsd) { 237 if (PrintAddress) 238 outs() << SymbolAddrStr << ' '; 239 if (PrintSize) { 240 outs() << SymbolSizeStr; 241 if (i->Size != object::UnknownAddressOrSize) 242 outs() << ' '; 243 } 244 outs() << i->TypeChar << " " << i->Name << "\n"; 245 } else if (OutputFormat == sysv) { 246 std::string PaddedName (i->Name); 247 while (PaddedName.length () < 20) 248 PaddedName += " "; 249 outs() << PaddedName << "|" << SymbolAddrStr << "| " 250 << i->TypeChar 251 << " | |" << SymbolSizeStr << "| |\n"; 252 } 253 } 254 255 SymbolList.clear(); 256 } 257 258 static char TypeCharForSymbol(GlobalValue &GV) { 259 if (GV.isDeclaration()) return 'U'; 260 if (GV.hasLinkOnceLinkage()) return 'C'; 261 if (GV.hasCommonLinkage()) return 'C'; 262 if (GV.hasWeakLinkage()) return 'W'; 263 if (isa<Function>(GV) && GV.hasInternalLinkage()) return 't'; 264 if (isa<Function>(GV)) return 'T'; 265 if (isa<GlobalVariable>(GV) && GV.hasInternalLinkage()) return 'd'; 266 if (isa<GlobalVariable>(GV)) return 'D'; 267 if (const GlobalAlias *GA = dyn_cast<GlobalAlias>(&GV)) { 268 const GlobalValue *AliasedGV = GA->getAliasedGlobal(); 269 if (isa<Function>(AliasedGV)) return 'T'; 270 if (isa<GlobalVariable>(AliasedGV)) return 'D'; 271 } 272 return '?'; 273 } 274 275 static void DumpSymbolNameForGlobalValue(GlobalValue &GV) { 276 // Private linkage and available_externally linkage don't exist in symtab. 277 if (GV.hasPrivateLinkage() || 278 GV.hasLinkerPrivateLinkage() || 279 GV.hasLinkerPrivateWeakLinkage() || 280 GV.hasAvailableExternallyLinkage()) 281 return; 282 char TypeChar = TypeCharForSymbol(GV); 283 if (GV.hasLocalLinkage () && ExternalOnly) 284 return; 285 286 NMSymbol s; 287 s.Address = object::UnknownAddressOrSize; 288 s.Size = object::UnknownAddressOrSize; 289 s.TypeChar = TypeChar; 290 s.Name = GV.getName(); 291 SymbolList.push_back(s); 292 } 293 294 static void DumpSymbolNamesFromModule(Module *M) { 295 CurrentFilename = M->getModuleIdentifier(); 296 std::for_each (M->begin(), M->end(), DumpSymbolNameForGlobalValue); 297 std::for_each (M->global_begin(), M->global_end(), 298 DumpSymbolNameForGlobalValue); 299 if (!WithoutAliases) 300 std::for_each (M->alias_begin(), M->alias_end(), 301 DumpSymbolNameForGlobalValue); 302 303 SortAndPrintSymbolList(); 304 } 305 306 static void DumpSymbolNamesFromObject(ObjectFile *obj) { 307 error_code ec; 308 symbol_iterator ibegin = obj->begin_symbols(); 309 symbol_iterator iend = obj->end_symbols(); 310 if (DynamicSyms) { 311 ibegin = obj->begin_dynamic_symbols(); 312 iend = obj->end_dynamic_symbols(); 313 } 314 for (symbol_iterator i = ibegin; i != iend; i.increment(ec)) { 315 if (error(ec)) break; 316 uint32_t symflags; 317 if (error(i->getFlags(symflags))) break; 318 if (!DebugSyms && (symflags & SymbolRef::SF_FormatSpecific)) 319 continue; 320 NMSymbol s; 321 s.Size = object::UnknownAddressOrSize; 322 s.Address = object::UnknownAddressOrSize; 323 if (PrintSize || SizeSort) { 324 if (error(i->getSize(s.Size))) break; 325 } 326 if (PrintAddress) 327 if (error(i->getAddress(s.Address))) break; 328 if (error(i->getNMTypeChar(s.TypeChar))) break; 329 if (error(i->getName(s.Name))) break; 330 SymbolList.push_back(s); 331 } 332 333 CurrentFilename = obj->getFileName(); 334 SortAndPrintSymbolList(); 335 } 336 337 static void DumpSymbolNamesFromFile(std::string &Filename) { 338 if (Filename != "-" && !sys::fs::exists(Filename)) { 339 errs() << ToolName << ": '" << Filename << "': " << "No such file\n"; 340 return; 341 } 342 343 OwningPtr<MemoryBuffer> Buffer; 344 if (error(MemoryBuffer::getFileOrSTDIN(Filename, Buffer), Filename)) 345 return; 346 347 sys::fs::file_magic magic = sys::fs::identify_magic(Buffer->getBuffer()); 348 349 LLVMContext &Context = getGlobalContext(); 350 std::string ErrorMessage; 351 if (magic == sys::fs::file_magic::bitcode) { 352 Module *Result = 0; 353 Result = ParseBitcodeFile(Buffer.get(), Context, &ErrorMessage); 354 if (Result) { 355 DumpSymbolNamesFromModule(Result); 356 delete Result; 357 } else { 358 error(ErrorMessage, Filename); 359 return; 360 } 361 } else if (magic == sys::fs::file_magic::archive) { 362 OwningPtr<Binary> arch; 363 if (error(object::createBinary(Buffer.take(), arch), Filename)) 364 return; 365 366 if (object::Archive *a = dyn_cast<object::Archive>(arch.get())) { 367 if (ArchiveMap) { 368 object::Archive::symbol_iterator I = a->begin_symbols(); 369 object::Archive::symbol_iterator E = a->end_symbols(); 370 if (I !=E) { 371 outs() << "Archive map" << "\n"; 372 for (; I != E; ++I) { 373 object::Archive::child_iterator c; 374 StringRef symname; 375 StringRef filename; 376 if (error(I->getMember(c))) 377 return; 378 if (error(I->getName(symname))) 379 return; 380 if (error(c->getName(filename))) 381 return; 382 outs() << symname << " in " << filename << "\n"; 383 } 384 outs() << "\n"; 385 } 386 } 387 388 for (object::Archive::child_iterator i = a->begin_children(), 389 e = a->end_children(); i != e; ++i) { 390 OwningPtr<Binary> child; 391 if (i->getAsBinary(child)) { 392 // Try opening it as a bitcode file. 393 OwningPtr<MemoryBuffer> buff; 394 if (error(i->getMemoryBuffer(buff))) 395 return; 396 Module *Result = 0; 397 if (buff) 398 Result = ParseBitcodeFile(buff.get(), Context, &ErrorMessage); 399 400 if (Result) { 401 DumpSymbolNamesFromModule(Result); 402 delete Result; 403 } 404 continue; 405 } 406 if (object::ObjectFile *o = dyn_cast<ObjectFile>(child.get())) { 407 outs() << o->getFileName() << ":\n"; 408 DumpSymbolNamesFromObject(o); 409 } 410 } 411 } 412 } else if (magic == sys::fs::file_magic::macho_universal_binary) { 413 OwningPtr<Binary> Bin; 414 if (error(object::createBinary(Buffer.take(), Bin), Filename)) 415 return; 416 417 object::MachOUniversalBinary *UB = 418 cast<object::MachOUniversalBinary>(Bin.get()); 419 for (object::MachOUniversalBinary::object_iterator 420 I = UB->begin_objects(), 421 E = UB->end_objects(); 422 I != E; ++I) { 423 OwningPtr<ObjectFile> Obj; 424 if (!I->getAsObjectFile(Obj)) { 425 outs() << Obj->getFileName() << ":\n"; 426 DumpSymbolNamesFromObject(Obj.get()); 427 } 428 } 429 } else if (magic.is_object()) { 430 OwningPtr<Binary> obj; 431 if (error(object::createBinary(Buffer.take(), obj), Filename)) 432 return; 433 if (object::ObjectFile *o = dyn_cast<ObjectFile>(obj.get())) 434 DumpSymbolNamesFromObject(o); 435 } else { 436 errs() << ToolName << ": " << Filename << ": " 437 << "unrecognizable file type\n"; 438 HadError = true; 439 return; 440 } 441 } 442 443 int main(int argc, char **argv) { 444 // Print a stack trace if we signal out. 445 sys::PrintStackTraceOnErrorSignal(); 446 PrettyStackTraceProgram X(argc, argv); 447 448 llvm_shutdown_obj Y; // Call llvm_shutdown() on exit. 449 cl::ParseCommandLineOptions(argc, argv, "llvm symbol table dumper\n"); 450 451 // llvm-nm only reads binary files. 452 if (error(sys::ChangeStdinToBinary())) 453 return 1; 454 455 ToolName = argv[0]; 456 if (BSDFormat) OutputFormat = bsd; 457 if (POSIXFormat) OutputFormat = posix; 458 459 // The relative order of these is important. If you pass --size-sort it should 460 // only print out the size. However, if you pass -S --size-sort, it should 461 // print out both the size and address. 462 if (SizeSort && !PrintSize) PrintAddress = false; 463 if (OutputFormat == sysv || SizeSort) PrintSize = true; 464 465 switch (InputFilenames.size()) { 466 case 0: InputFilenames.push_back("-"); 467 case 1: break; 468 default: MultipleFiles = true; 469 } 470 471 std::for_each(InputFilenames.begin(), InputFilenames.end(), 472 DumpSymbolNamesFromFile); 473 474 if (HadError) 475 return 1; 476 477 return 0; 478 } 479