[llvm-nm] - Fix a bug and unbreak ASan BB.
[llvm-complete.git] / tools / llvm-nm / llvm-nm.cpp
blobee55722dc139b04b9d33117ed0e560c14b348fdd
1 //===-- llvm-nm.cpp - Symbol table dumping utility for llvm ---------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This program is a utility that works like traditional Unix "nm", that is, it
10 // prints out the names of symbols in a bitcode or object file, along with some
11 // information about each symbol.
13 // This "nm" supports many of the features of GNU "nm", including its different
14 // output formats.
16 //===----------------------------------------------------------------------===//
18 #include "llvm/ADT/StringSwitch.h"
19 #include "llvm/BinaryFormat/COFF.h"
20 #include "llvm/Demangle/Demangle.h"
21 #include "llvm/IR/Function.h"
22 #include "llvm/IR/LLVMContext.h"
23 #include "llvm/Object/Archive.h"
24 #include "llvm/Object/COFF.h"
25 #include "llvm/Object/COFFImportFile.h"
26 #include "llvm/Object/ELFObjectFile.h"
27 #include "llvm/Object/IRObjectFile.h"
28 #include "llvm/Object/MachO.h"
29 #include "llvm/Object/MachOUniversal.h"
30 #include "llvm/Object/ObjectFile.h"
31 #include "llvm/Object/Wasm.h"
32 #include "llvm/Support/CommandLine.h"
33 #include "llvm/Support/FileSystem.h"
34 #include "llvm/Support/Format.h"
35 #include "llvm/Support/InitLLVM.h"
36 #include "llvm/Support/MemoryBuffer.h"
37 #include "llvm/Support/Program.h"
38 #include "llvm/Support/Signals.h"
39 #include "llvm/Support/TargetSelect.h"
40 #include "llvm/Support/WithColor.h"
41 #include "llvm/Support/raw_ostream.h"
42 #include <vector>
44 using namespace llvm;
45 using namespace object;
47 namespace {
48 enum OutputFormatTy { bsd, sysv, posix, darwin };
50 cl::OptionCategory NMCat("llvm-nm Options");
52 cl::opt<OutputFormatTy> OutputFormat(
53 "format", cl::desc("Specify output format"),
54 cl::values(clEnumVal(bsd, "BSD format"), clEnumVal(sysv, "System V format"),
55 clEnumVal(posix, "POSIX.2 format"),
56 clEnumVal(darwin, "Darwin -m format")),
57 cl::init(bsd), cl::cat(NMCat));
58 cl::alias OutputFormat2("f", cl::desc("Alias for --format"),
59 cl::aliasopt(OutputFormat));
61 cl::list<std::string> InputFilenames(cl::Positional, cl::desc("<input files>"),
62 cl::ZeroOrMore);
64 cl::opt<bool> UndefinedOnly("undefined-only",
65 cl::desc("Show only undefined symbols"),
66 cl::cat(NMCat));
67 cl::alias UndefinedOnly2("u", cl::desc("Alias for --undefined-only"),
68 cl::aliasopt(UndefinedOnly), cl::Grouping);
70 cl::opt<bool> DynamicSyms("dynamic",
71 cl::desc("Display the dynamic symbols instead "
72 "of normal symbols."),
73 cl::cat(NMCat));
74 cl::alias DynamicSyms2("D", cl::desc("Alias for --dynamic"),
75 cl::aliasopt(DynamicSyms), cl::Grouping);
77 cl::opt<bool> DefinedOnly("defined-only", cl::desc("Show only defined symbols"),
78 cl::cat(NMCat));
79 cl::alias DefinedOnly2("U", cl::desc("Alias for --defined-only"),
80 cl::aliasopt(DefinedOnly), cl::Grouping);
82 cl::opt<bool> ExternalOnly("extern-only",
83 cl::desc("Show only external symbols"),
84 cl::ZeroOrMore, cl::cat(NMCat));
85 cl::alias ExternalOnly2("g", cl::desc("Alias for --extern-only"),
86 cl::aliasopt(ExternalOnly), cl::Grouping,
87 cl::ZeroOrMore);
89 cl::opt<bool> NoWeakSymbols("no-weak", cl::desc("Show only non-weak symbols"),
90 cl::cat(NMCat));
91 cl::alias NoWeakSymbols2("W", cl::desc("Alias for --no-weak"),
92 cl::aliasopt(NoWeakSymbols), cl::Grouping);
94 cl::opt<bool> BSDFormat("B", cl::desc("Alias for --format=bsd"), cl::Grouping,
95 cl::cat(NMCat));
96 cl::opt<bool> POSIXFormat("P", cl::desc("Alias for --format=posix"),
97 cl::Grouping, cl::cat(NMCat));
98 cl::alias Portability("portability", cl::desc("Alias for --format=posix"),
99 cl::aliasopt(POSIXFormat), cl::NotHidden);
100 cl::opt<bool> DarwinFormat("m", cl::desc("Alias for --format=darwin"),
101 cl::Grouping, cl::cat(NMCat));
103 static cl::list<std::string>
104 ArchFlags("arch", cl::desc("architecture(s) from a Mach-O file to dump"),
105 cl::ZeroOrMore, cl::cat(NMCat));
106 bool ArchAll = false;
108 cl::opt<bool> PrintFileName(
109 "print-file-name",
110 cl::desc("Precede each symbol with the object file it came from"),
111 cl::cat(NMCat));
113 cl::alias PrintFileNameA("A", cl::desc("Alias for --print-file-name"),
114 cl::aliasopt(PrintFileName), cl::Grouping);
115 cl::alias PrintFileNameo("o", cl::desc("Alias for --print-file-name"),
116 cl::aliasopt(PrintFileName), cl::Grouping);
118 cl::opt<bool> DebugSyms("debug-syms",
119 cl::desc("Show all symbols, even debugger only"),
120 cl::cat(NMCat));
121 cl::alias DebugSymsa("a", cl::desc("Alias for --debug-syms"),
122 cl::aliasopt(DebugSyms), cl::Grouping);
124 cl::opt<bool> NumericSort("numeric-sort", cl::desc("Sort symbols by address"),
125 cl::cat(NMCat));
126 cl::alias NumericSortn("n", cl::desc("Alias for --numeric-sort"),
127 cl::aliasopt(NumericSort), cl::Grouping);
128 cl::alias NumericSortv("v", cl::desc("Alias for --numeric-sort"),
129 cl::aliasopt(NumericSort), cl::Grouping);
131 cl::opt<bool> NoSort("no-sort", cl::desc("Show symbols in order encountered"),
132 cl::cat(NMCat));
133 cl::alias NoSortp("p", cl::desc("Alias for --no-sort"), cl::aliasopt(NoSort),
134 cl::Grouping);
136 cl::opt<bool> Demangle("demangle", cl::ZeroOrMore,
137 cl::desc("Demangle C++ symbol names"), cl::cat(NMCat));
138 cl::alias DemangleC("C", cl::desc("Alias for --demangle"),
139 cl::aliasopt(Demangle), cl::Grouping);
140 cl::opt<bool> NoDemangle("no-demangle", cl::init(false), cl::ZeroOrMore,
141 cl::desc("Don't demangle symbol names"),
142 cl::cat(NMCat));
144 cl::opt<bool> ReverseSort("reverse-sort", cl::desc("Sort in reverse order"),
145 cl::cat(NMCat));
146 cl::alias ReverseSortr("r", cl::desc("Alias for --reverse-sort"),
147 cl::aliasopt(ReverseSort), cl::Grouping);
149 cl::opt<bool> PrintSize("print-size",
150 cl::desc("Show symbol size as well as address"),
151 cl::cat(NMCat));
152 cl::alias PrintSizeS("S", cl::desc("Alias for --print-size"),
153 cl::aliasopt(PrintSize), cl::Grouping);
154 bool MachOPrintSizeWarning = false;
156 cl::opt<bool> SizeSort("size-sort", cl::desc("Sort symbols by size"),
157 cl::cat(NMCat));
159 cl::opt<bool> WithoutAliases("without-aliases", cl::Hidden,
160 cl::desc("Exclude aliases from output"),
161 cl::cat(NMCat));
163 cl::opt<bool> ArchiveMap("print-armap", cl::desc("Print the archive map"),
164 cl::cat(NMCat));
165 cl::alias ArchiveMaps("M", cl::desc("Alias for --print-armap"),
166 cl::aliasopt(ArchiveMap), cl::Grouping);
168 enum Radix { d, o, x };
169 cl::opt<Radix>
170 AddressRadix("radix", cl::desc("Radix (o/d/x) for printing symbol Values"),
171 cl::values(clEnumVal(d, "decimal"), clEnumVal(o, "octal"),
172 clEnumVal(x, "hexadecimal")),
173 cl::init(x), cl::cat(NMCat));
174 cl::alias RadixAlias("t", cl::desc("Alias for --radix"),
175 cl::aliasopt(AddressRadix));
177 cl::opt<bool> JustSymbolName("just-symbol-name",
178 cl::desc("Print just the symbol's name"),
179 cl::cat(NMCat));
180 cl::alias JustSymbolNames("j", cl::desc("Alias for --just-symbol-name"),
181 cl::aliasopt(JustSymbolName), cl::Grouping);
183 cl::opt<bool> SpecialSyms("special-syms",
184 cl::desc("No-op. Used for GNU compatibility only"));
186 cl::list<std::string> SegSect("s", cl::multi_val(2), cl::ZeroOrMore,
187 cl::value_desc("segment section"), cl::Hidden,
188 cl::desc("Dump only symbols from this segment "
189 "and section name, Mach-O only"),
190 cl::cat(NMCat));
192 cl::opt<bool> FormatMachOasHex("x",
193 cl::desc("Print symbol entry in hex, "
194 "Mach-O only"),
195 cl::Grouping, cl::cat(NMCat));
196 cl::opt<bool> AddDyldInfo("add-dyldinfo",
197 cl::desc("Add symbols from the dyldinfo not already "
198 "in the symbol table, Mach-O only"),
199 cl::cat(NMCat));
200 cl::opt<bool> NoDyldInfo("no-dyldinfo",
201 cl::desc("Don't add any symbols from the dyldinfo, "
202 "Mach-O only"),
203 cl::cat(NMCat));
204 cl::opt<bool> DyldInfoOnly("dyldinfo-only",
205 cl::desc("Show only symbols from the dyldinfo, "
206 "Mach-O only"),
207 cl::cat(NMCat));
209 cl::opt<bool> NoLLVMBitcode("no-llvm-bc",
210 cl::desc("Disable LLVM bitcode reader"),
211 cl::cat(NMCat));
213 cl::extrahelp HelpResponse("\nPass @FILE as argument to read options from FILE.\n");
215 bool PrintAddress = true;
217 bool MultipleFiles = false;
219 bool HadError = false;
221 std::string ToolName;
222 } // anonymous namespace
224 static void error(Twine Message, Twine Path = Twine()) {
225 HadError = true;
226 WithColor::error(errs(), ToolName) << Path << ": " << Message << ".\n";
229 static bool error(std::error_code EC, Twine Path = Twine()) {
230 if (EC) {
231 error(EC.message(), Path);
232 return true;
234 return false;
237 // This version of error() prints the archive name and member name, for example:
238 // "libx.a(foo.o)" after the ToolName before the error message. It sets
239 // HadError but returns allowing the code to move on to other archive members.
240 static void error(llvm::Error E, StringRef FileName, const Archive::Child &C,
241 StringRef ArchitectureName = StringRef()) {
242 HadError = true;
243 WithColor::error(errs(), ToolName) << FileName;
245 Expected<StringRef> NameOrErr = C.getName();
246 // TODO: if we have a error getting the name then it would be nice to print
247 // the index of which archive member this is and or its offset in the
248 // archive instead of "???" as the name.
249 if (!NameOrErr) {
250 consumeError(NameOrErr.takeError());
251 errs() << "(" << "???" << ")";
252 } else
253 errs() << "(" << NameOrErr.get() << ")";
255 if (!ArchitectureName.empty())
256 errs() << " (for architecture " << ArchitectureName << ") ";
258 std::string Buf;
259 raw_string_ostream OS(Buf);
260 logAllUnhandledErrors(std::move(E), OS);
261 OS.flush();
262 errs() << " " << Buf << "\n";
265 // This version of error() prints the file name and which architecture slice it
266 // is from, for example: "foo.o (for architecture i386)" after the ToolName
267 // before the error message. It sets HadError but returns allowing the code to
268 // move on to other architecture slices.
269 static void error(llvm::Error E, StringRef FileName,
270 StringRef ArchitectureName = StringRef()) {
271 HadError = true;
272 WithColor::error(errs(), ToolName) << FileName;
274 if (!ArchitectureName.empty())
275 errs() << " (for architecture " << ArchitectureName << ") ";
277 std::string Buf;
278 raw_string_ostream OS(Buf);
279 logAllUnhandledErrors(std::move(E), OS);
280 OS.flush();
281 errs() << " " << Buf << "\n";
284 namespace {
285 struct NMSymbol {
286 uint64_t Address;
287 uint64_t Size;
288 char TypeChar;
289 StringRef Name;
290 StringRef SectionName;
291 StringRef TypeName;
292 BasicSymbolRef Sym;
293 // The Sym field above points to the native symbol in the object file,
294 // for Mach-O when we are creating symbols from the dyld info the above
295 // pointer is null as there is no native symbol. In these cases the fields
296 // below are filled in to represent what would have been a Mach-O nlist
297 // native symbol.
298 uint32_t SymFlags;
299 SectionRef Section;
300 uint8_t NType;
301 uint8_t NSect;
302 uint16_t NDesc;
303 StringRef IndirectName;
305 } // anonymous namespace
307 static bool compareSymbolAddress(const NMSymbol &A, const NMSymbol &B) {
308 bool ADefined;
309 if (A.Sym.getRawDataRefImpl().p)
310 ADefined = !(A.Sym.getFlags() & SymbolRef::SF_Undefined);
311 else
312 ADefined = A.TypeChar != 'U';
313 bool BDefined;
314 if (B.Sym.getRawDataRefImpl().p)
315 BDefined = !(B.Sym.getFlags() & SymbolRef::SF_Undefined);
316 else
317 BDefined = B.TypeChar != 'U';
318 return std::make_tuple(ADefined, A.Address, A.Name, A.Size) <
319 std::make_tuple(BDefined, B.Address, B.Name, B.Size);
322 static bool compareSymbolSize(const NMSymbol &A, const NMSymbol &B) {
323 return std::make_tuple(A.Size, A.Name, A.Address) <
324 std::make_tuple(B.Size, B.Name, B.Address);
327 static bool compareSymbolName(const NMSymbol &A, const NMSymbol &B) {
328 return std::make_tuple(A.Name, A.Size, A.Address) <
329 std::make_tuple(B.Name, B.Size, B.Address);
332 static char isSymbolList64Bit(SymbolicFile &Obj) {
333 if (auto *IRObj = dyn_cast<IRObjectFile>(&Obj))
334 return Triple(IRObj->getTargetTriple()).isArch64Bit();
335 if (isa<COFFObjectFile>(Obj) || isa<COFFImportFile>(Obj))
336 return false;
337 if (isa<WasmObjectFile>(Obj))
338 return false;
339 if (MachOObjectFile *MachO = dyn_cast<MachOObjectFile>(&Obj))
340 return MachO->is64Bit();
341 return cast<ELFObjectFileBase>(Obj).getBytesInAddress() == 8;
344 static StringRef CurrentFilename;
345 static std::vector<NMSymbol> SymbolList;
347 static char getSymbolNMTypeChar(IRObjectFile &Obj, basic_symbol_iterator I);
349 // darwinPrintSymbol() is used to print a symbol from a Mach-O file when the
350 // the OutputFormat is darwin or we are printing Mach-O symbols in hex. For
351 // the darwin format it produces the same output as darwin's nm(1) -m output
352 // and when printing Mach-O symbols in hex it produces the same output as
353 // darwin's nm(1) -x format.
354 static void darwinPrintSymbol(SymbolicFile &Obj, const NMSymbol &S,
355 char *SymbolAddrStr, const char *printBlanks,
356 const char *printDashes,
357 const char *printFormat) {
358 MachO::mach_header H;
359 MachO::mach_header_64 H_64;
360 uint32_t Filetype = MachO::MH_OBJECT;
361 uint32_t Flags = 0;
362 uint8_t NType = 0;
363 uint8_t NSect = 0;
364 uint16_t NDesc = 0;
365 uint32_t NStrx = 0;
366 uint64_t NValue = 0;
367 MachOObjectFile *MachO = dyn_cast<MachOObjectFile>(&Obj);
368 if (Obj.isIR()) {
369 uint32_t SymFlags = S.Sym.getFlags();
370 if (SymFlags & SymbolRef::SF_Global)
371 NType |= MachO::N_EXT;
372 if (SymFlags & SymbolRef::SF_Hidden)
373 NType |= MachO::N_PEXT;
374 if (SymFlags & SymbolRef::SF_Undefined)
375 NType |= MachO::N_EXT | MachO::N_UNDF;
376 else {
377 // Here we have a symbol definition. So to fake out a section name we
378 // use 1, 2 and 3 for section numbers. See below where they are used to
379 // print out fake section names.
380 NType |= MachO::N_SECT;
381 if (SymFlags & SymbolRef::SF_Const)
382 NSect = 3;
383 else if (SymFlags & SymbolRef::SF_Executable)
384 NSect = 1;
385 else
386 NSect = 2;
388 if (SymFlags & SymbolRef::SF_Weak)
389 NDesc |= MachO::N_WEAK_DEF;
390 } else {
391 DataRefImpl SymDRI = S.Sym.getRawDataRefImpl();
392 if (MachO->is64Bit()) {
393 H_64 = MachO->MachOObjectFile::getHeader64();
394 Filetype = H_64.filetype;
395 Flags = H_64.flags;
396 if (SymDRI.p){
397 MachO::nlist_64 STE_64 = MachO->getSymbol64TableEntry(SymDRI);
398 NType = STE_64.n_type;
399 NSect = STE_64.n_sect;
400 NDesc = STE_64.n_desc;
401 NStrx = STE_64.n_strx;
402 NValue = STE_64.n_value;
403 } else {
404 NType = S.NType;
405 NSect = S.NSect;
406 NDesc = S.NDesc;
407 NStrx = 0;
408 NValue = S.Address;
410 } else {
411 H = MachO->MachOObjectFile::getHeader();
412 Filetype = H.filetype;
413 Flags = H.flags;
414 if (SymDRI.p){
415 MachO::nlist STE = MachO->getSymbolTableEntry(SymDRI);
416 NType = STE.n_type;
417 NSect = STE.n_sect;
418 NDesc = STE.n_desc;
419 NStrx = STE.n_strx;
420 NValue = STE.n_value;
421 } else {
422 NType = S.NType;
423 NSect = S.NSect;
424 NDesc = S.NDesc;
425 NStrx = 0;
426 NValue = S.Address;
431 // If we are printing Mach-O symbols in hex do that and return.
432 if (FormatMachOasHex) {
433 outs() << format(printFormat, NValue) << ' '
434 << format("%02x %02x %04x %08x", NType, NSect, NDesc, NStrx) << ' '
435 << S.Name;
436 if ((NType & MachO::N_TYPE) == MachO::N_INDR) {
437 outs() << " (indirect for ";
438 outs() << format(printFormat, NValue) << ' ';
439 StringRef IndirectName;
440 if (S.Sym.getRawDataRefImpl().p) {
441 if (MachO->getIndirectName(S.Sym.getRawDataRefImpl(), IndirectName))
442 outs() << "?)";
443 else
444 outs() << IndirectName << ")";
445 } else
446 outs() << S.IndirectName << ")";
448 outs() << "\n";
449 return;
452 if (PrintAddress) {
453 if ((NType & MachO::N_TYPE) == MachO::N_INDR)
454 strcpy(SymbolAddrStr, printBlanks);
455 if (Obj.isIR() && (NType & MachO::N_TYPE) == MachO::N_TYPE)
456 strcpy(SymbolAddrStr, printDashes);
457 outs() << SymbolAddrStr << ' ';
460 switch (NType & MachO::N_TYPE) {
461 case MachO::N_UNDF:
462 if (NValue != 0) {
463 outs() << "(common) ";
464 if (MachO::GET_COMM_ALIGN(NDesc) != 0)
465 outs() << "(alignment 2^" << (int)MachO::GET_COMM_ALIGN(NDesc) << ") ";
466 } else {
467 if ((NType & MachO::N_TYPE) == MachO::N_PBUD)
468 outs() << "(prebound ";
469 else
470 outs() << "(";
471 if ((NDesc & MachO::REFERENCE_TYPE) ==
472 MachO::REFERENCE_FLAG_UNDEFINED_LAZY)
473 outs() << "undefined [lazy bound]) ";
474 else if ((NDesc & MachO::REFERENCE_TYPE) ==
475 MachO::REFERENCE_FLAG_PRIVATE_UNDEFINED_LAZY)
476 outs() << "undefined [private lazy bound]) ";
477 else if ((NDesc & MachO::REFERENCE_TYPE) ==
478 MachO::REFERENCE_FLAG_PRIVATE_UNDEFINED_NON_LAZY)
479 outs() << "undefined [private]) ";
480 else
481 outs() << "undefined) ";
483 break;
484 case MachO::N_ABS:
485 outs() << "(absolute) ";
486 break;
487 case MachO::N_INDR:
488 outs() << "(indirect) ";
489 break;
490 case MachO::N_SECT: {
491 if (Obj.isIR()) {
492 // For llvm bitcode files print out a fake section name using the values
493 // use 1, 2 and 3 for section numbers as set above.
494 if (NSect == 1)
495 outs() << "(LTO,CODE) ";
496 else if (NSect == 2)
497 outs() << "(LTO,DATA) ";
498 else if (NSect == 3)
499 outs() << "(LTO,RODATA) ";
500 else
501 outs() << "(?,?) ";
502 break;
504 section_iterator Sec = SectionRef();
505 if (S.Sym.getRawDataRefImpl().p) {
506 Expected<section_iterator> SecOrErr =
507 MachO->getSymbolSection(S.Sym.getRawDataRefImpl());
508 if (!SecOrErr) {
509 consumeError(SecOrErr.takeError());
510 outs() << "(?,?) ";
511 break;
513 Sec = *SecOrErr;
514 if (Sec == MachO->section_end()) {
515 outs() << "(?,?) ";
516 break;
518 } else {
519 Sec = S.Section;
521 DataRefImpl Ref = Sec->getRawDataRefImpl();
522 StringRef SectionName;
523 if (Expected<StringRef> NameOrErr = MachO->getSectionName(Ref))
524 SectionName = *NameOrErr;
525 StringRef SegmentName = MachO->getSectionFinalSegmentName(Ref);
526 outs() << "(" << SegmentName << "," << SectionName << ") ";
527 break;
529 default:
530 outs() << "(?) ";
531 break;
534 if (NType & MachO::N_EXT) {
535 if (NDesc & MachO::REFERENCED_DYNAMICALLY)
536 outs() << "[referenced dynamically] ";
537 if (NType & MachO::N_PEXT) {
538 if ((NDesc & MachO::N_WEAK_DEF) == MachO::N_WEAK_DEF)
539 outs() << "weak private external ";
540 else
541 outs() << "private external ";
542 } else {
543 if ((NDesc & MachO::N_WEAK_REF) == MachO::N_WEAK_REF ||
544 (NDesc & MachO::N_WEAK_DEF) == MachO::N_WEAK_DEF) {
545 if ((NDesc & (MachO::N_WEAK_REF | MachO::N_WEAK_DEF)) ==
546 (MachO::N_WEAK_REF | MachO::N_WEAK_DEF))
547 outs() << "weak external automatically hidden ";
548 else
549 outs() << "weak external ";
550 } else
551 outs() << "external ";
553 } else {
554 if (NType & MachO::N_PEXT)
555 outs() << "non-external (was a private external) ";
556 else
557 outs() << "non-external ";
560 if (Filetype == MachO::MH_OBJECT) {
561 if (NDesc & MachO::N_NO_DEAD_STRIP)
562 outs() << "[no dead strip] ";
563 if ((NType & MachO::N_TYPE) != MachO::N_UNDF &&
564 NDesc & MachO::N_SYMBOL_RESOLVER)
565 outs() << "[symbol resolver] ";
566 if ((NType & MachO::N_TYPE) != MachO::N_UNDF && NDesc & MachO::N_ALT_ENTRY)
567 outs() << "[alt entry] ";
568 if ((NType & MachO::N_TYPE) != MachO::N_UNDF && NDesc & MachO::N_COLD_FUNC)
569 outs() << "[cold func] ";
572 if ((NDesc & MachO::N_ARM_THUMB_DEF) == MachO::N_ARM_THUMB_DEF)
573 outs() << "[Thumb] ";
575 if ((NType & MachO::N_TYPE) == MachO::N_INDR) {
576 outs() << S.Name << " (for ";
577 StringRef IndirectName;
578 if (MachO) {
579 if (S.Sym.getRawDataRefImpl().p) {
580 if (MachO->getIndirectName(S.Sym.getRawDataRefImpl(), IndirectName))
581 outs() << "?)";
582 else
583 outs() << IndirectName << ")";
584 } else
585 outs() << S.IndirectName << ")";
586 } else
587 outs() << "?)";
588 } else
589 outs() << S.Name;
591 if ((Flags & MachO::MH_TWOLEVEL) == MachO::MH_TWOLEVEL &&
592 (((NType & MachO::N_TYPE) == MachO::N_UNDF && NValue == 0) ||
593 (NType & MachO::N_TYPE) == MachO::N_PBUD)) {
594 uint32_t LibraryOrdinal = MachO::GET_LIBRARY_ORDINAL(NDesc);
595 if (LibraryOrdinal != 0) {
596 if (LibraryOrdinal == MachO::EXECUTABLE_ORDINAL)
597 outs() << " (from executable)";
598 else if (LibraryOrdinal == MachO::DYNAMIC_LOOKUP_ORDINAL)
599 outs() << " (dynamically looked up)";
600 else {
601 StringRef LibraryName;
602 if (!MachO ||
603 MachO->getLibraryShortNameByIndex(LibraryOrdinal - 1, LibraryName))
604 outs() << " (from bad library ordinal " << LibraryOrdinal << ")";
605 else
606 outs() << " (from " << LibraryName << ")";
611 outs() << "\n";
614 // Table that maps Darwin's Mach-O stab constants to strings to allow printing.
615 struct DarwinStabName {
616 uint8_t NType;
617 const char *Name;
619 static const struct DarwinStabName DarwinStabNames[] = {
620 {MachO::N_GSYM, "GSYM"},
621 {MachO::N_FNAME, "FNAME"},
622 {MachO::N_FUN, "FUN"},
623 {MachO::N_STSYM, "STSYM"},
624 {MachO::N_LCSYM, "LCSYM"},
625 {MachO::N_BNSYM, "BNSYM"},
626 {MachO::N_PC, "PC"},
627 {MachO::N_AST, "AST"},
628 {MachO::N_OPT, "OPT"},
629 {MachO::N_RSYM, "RSYM"},
630 {MachO::N_SLINE, "SLINE"},
631 {MachO::N_ENSYM, "ENSYM"},
632 {MachO::N_SSYM, "SSYM"},
633 {MachO::N_SO, "SO"},
634 {MachO::N_OSO, "OSO"},
635 {MachO::N_LSYM, "LSYM"},
636 {MachO::N_BINCL, "BINCL"},
637 {MachO::N_SOL, "SOL"},
638 {MachO::N_PARAMS, "PARAM"},
639 {MachO::N_VERSION, "VERS"},
640 {MachO::N_OLEVEL, "OLEV"},
641 {MachO::N_PSYM, "PSYM"},
642 {MachO::N_EINCL, "EINCL"},
643 {MachO::N_ENTRY, "ENTRY"},
644 {MachO::N_LBRAC, "LBRAC"},
645 {MachO::N_EXCL, "EXCL"},
646 {MachO::N_RBRAC, "RBRAC"},
647 {MachO::N_BCOMM, "BCOMM"},
648 {MachO::N_ECOMM, "ECOMM"},
649 {MachO::N_ECOML, "ECOML"},
650 {MachO::N_LENG, "LENG"},
653 static const char *getDarwinStabString(uint8_t NType) {
654 for (auto I : makeArrayRef(DarwinStabNames))
655 if (I.NType == NType)
656 return I.Name;
657 return nullptr;
660 // darwinPrintStab() prints the n_sect, n_desc along with a symbolic name of
661 // a stab n_type value in a Mach-O file.
662 static void darwinPrintStab(MachOObjectFile *MachO, const NMSymbol &S) {
663 MachO::nlist_64 STE_64;
664 MachO::nlist STE;
665 uint8_t NType;
666 uint8_t NSect;
667 uint16_t NDesc;
668 DataRefImpl SymDRI = S.Sym.getRawDataRefImpl();
669 if (MachO->is64Bit()) {
670 STE_64 = MachO->getSymbol64TableEntry(SymDRI);
671 NType = STE_64.n_type;
672 NSect = STE_64.n_sect;
673 NDesc = STE_64.n_desc;
674 } else {
675 STE = MachO->getSymbolTableEntry(SymDRI);
676 NType = STE.n_type;
677 NSect = STE.n_sect;
678 NDesc = STE.n_desc;
681 outs() << format(" %02x %04x ", NSect, NDesc);
682 if (const char *stabString = getDarwinStabString(NType))
683 outs() << format("%5.5s", stabString);
684 else
685 outs() << format(" %02x", NType);
688 static Optional<std::string> demangle(StringRef Name, bool StripUnderscore) {
689 if (StripUnderscore && !Name.empty() && Name[0] == '_')
690 Name = Name.substr(1);
692 if (!Name.startswith("_Z"))
693 return None;
695 int Status;
696 char *Undecorated =
697 itaniumDemangle(Name.str().c_str(), nullptr, nullptr, &Status);
698 if (Status != 0)
699 return None;
701 std::string S(Undecorated);
702 free(Undecorated);
703 return S;
706 static bool symbolIsDefined(const NMSymbol &Sym) {
707 return Sym.TypeChar != 'U' && Sym.TypeChar != 'w' && Sym.TypeChar != 'v';
710 static void sortAndPrintSymbolList(SymbolicFile &Obj, bool printName,
711 const std::string &ArchiveName,
712 const std::string &ArchitectureName) {
713 if (!NoSort) {
714 using Comparator = bool (*)(const NMSymbol &, const NMSymbol &);
715 Comparator Cmp;
716 if (NumericSort)
717 Cmp = &compareSymbolAddress;
718 else if (SizeSort)
719 Cmp = &compareSymbolSize;
720 else
721 Cmp = &compareSymbolName;
723 if (ReverseSort)
724 llvm::sort(SymbolList, [=](const NMSymbol &A, const NMSymbol &B) -> bool {
725 return Cmp(B, A);
727 else
728 llvm::sort(SymbolList, Cmp);
731 if (!PrintFileName) {
732 if (OutputFormat == posix && MultipleFiles && printName) {
733 outs() << '\n' << CurrentFilename << ":\n";
734 } else if (OutputFormat == bsd && MultipleFiles && printName) {
735 outs() << "\n" << CurrentFilename << ":\n";
736 } else if (OutputFormat == sysv) {
737 outs() << "\n\nSymbols from " << CurrentFilename << ":\n\n";
738 if (isSymbolList64Bit(Obj))
739 outs() << "Name Value Class Type"
740 << " Size Line Section\n";
741 else
742 outs() << "Name Value Class Type"
743 << " Size Line Section\n";
747 const char *printBlanks, *printDashes, *printFormat;
748 if (isSymbolList64Bit(Obj)) {
749 printBlanks = " ";
750 printDashes = "----------------";
751 switch (AddressRadix) {
752 case Radix::o:
753 printFormat = OutputFormat == posix ? "%" PRIo64 : "%016" PRIo64;
754 break;
755 case Radix::x:
756 printFormat = OutputFormat == posix ? "%" PRIx64 : "%016" PRIx64;
757 break;
758 default:
759 printFormat = OutputFormat == posix ? "%" PRId64 : "%016" PRId64;
761 } else {
762 printBlanks = " ";
763 printDashes = "--------";
764 switch (AddressRadix) {
765 case Radix::o:
766 printFormat = OutputFormat == posix ? "%" PRIo64 : "%08" PRIo64;
767 break;
768 case Radix::x:
769 printFormat = OutputFormat == posix ? "%" PRIx64 : "%08" PRIx64;
770 break;
771 default:
772 printFormat = OutputFormat == posix ? "%" PRId64 : "%08" PRId64;
776 auto writeFileName = [&](raw_ostream &S) {
777 if (!ArchitectureName.empty())
778 S << "(for architecture " << ArchitectureName << "):";
779 if (OutputFormat == posix && !ArchiveName.empty())
780 S << ArchiveName << "[" << CurrentFilename << "]: ";
781 else {
782 if (!ArchiveName.empty())
783 S << ArchiveName << ":";
784 S << CurrentFilename << ": ";
788 if (SymbolList.empty()) {
789 if (PrintFileName)
790 writeFileName(errs());
791 errs() << "no symbols\n";
794 for (const NMSymbol &S : SymbolList) {
795 uint32_t SymFlags;
796 std::string Name = S.Name.str();
797 MachOObjectFile *MachO = dyn_cast<MachOObjectFile>(&Obj);
798 if (Demangle) {
799 if (Optional<std::string> Opt = demangle(S.Name, MachO))
800 Name = *Opt;
802 if (S.Sym.getRawDataRefImpl().p)
803 SymFlags = S.Sym.getFlags();
804 else
805 SymFlags = S.SymFlags;
807 bool Undefined = SymFlags & SymbolRef::SF_Undefined;
808 bool Global = SymFlags & SymbolRef::SF_Global;
809 bool Weak = SymFlags & SymbolRef::SF_Weak;
810 if ((!Undefined && UndefinedOnly) || (Undefined && DefinedOnly) ||
811 (!Global && ExternalOnly) || (Weak && NoWeakSymbols))
812 continue;
813 if (PrintFileName)
814 writeFileName(outs());
815 if ((JustSymbolName ||
816 (UndefinedOnly && MachO && OutputFormat != darwin)) &&
817 OutputFormat != posix) {
818 outs() << Name << "\n";
819 continue;
822 char SymbolAddrStr[23], SymbolSizeStr[23];
824 // If the format is SysV or the symbol isn't defined, then print spaces.
825 if (OutputFormat == sysv || !symbolIsDefined(S)) {
826 if (OutputFormat == posix) {
827 format(printFormat, S.Address)
828 .print(SymbolAddrStr, sizeof(SymbolAddrStr));
829 format(printFormat, S.Size).print(SymbolSizeStr, sizeof(SymbolSizeStr));
830 } else {
831 strcpy(SymbolAddrStr, printBlanks);
832 strcpy(SymbolSizeStr, printBlanks);
836 if (symbolIsDefined(S)) {
837 // Otherwise, print the symbol address and size.
838 if (Obj.isIR())
839 strcpy(SymbolAddrStr, printDashes);
840 else if (MachO && S.TypeChar == 'I')
841 strcpy(SymbolAddrStr, printBlanks);
842 else
843 format(printFormat, S.Address)
844 .print(SymbolAddrStr, sizeof(SymbolAddrStr));
845 format(printFormat, S.Size).print(SymbolSizeStr, sizeof(SymbolSizeStr));
848 // If OutputFormat is darwin or we are printing Mach-O symbols in hex and
849 // we have a MachOObjectFile, call darwinPrintSymbol to print as darwin's
850 // nm(1) -m output or hex, else if OutputFormat is darwin or we are
851 // printing Mach-O symbols in hex and not a Mach-O object fall back to
852 // OutputFormat bsd (see below).
853 if ((OutputFormat == darwin || FormatMachOasHex) && (MachO || Obj.isIR())) {
854 darwinPrintSymbol(Obj, S, SymbolAddrStr, printBlanks, printDashes,
855 printFormat);
856 } else if (OutputFormat == posix) {
857 outs() << Name << " " << S.TypeChar << " " << SymbolAddrStr << " "
858 << (MachO ? "0" : SymbolSizeStr) << "\n";
859 } else if (OutputFormat == bsd || (OutputFormat == darwin && !MachO)) {
860 if (PrintAddress)
861 outs() << SymbolAddrStr << ' ';
862 if (PrintSize)
863 outs() << SymbolSizeStr << ' ';
864 outs() << S.TypeChar;
865 if (S.TypeChar == '-' && MachO)
866 darwinPrintStab(MachO, S);
867 outs() << " " << Name;
868 if (S.TypeChar == 'I' && MachO) {
869 outs() << " (indirect for ";
870 if (S.Sym.getRawDataRefImpl().p) {
871 StringRef IndirectName;
872 if (MachO->getIndirectName(S.Sym.getRawDataRefImpl(), IndirectName))
873 outs() << "?)";
874 else
875 outs() << IndirectName << ")";
876 } else
877 outs() << S.IndirectName << ")";
879 outs() << "\n";
880 } else if (OutputFormat == sysv) {
881 outs() << left_justify(Name, 20) << "|" << SymbolAddrStr << "| "
882 << S.TypeChar << " |" << right_justify(S.TypeName, 18) << "|"
883 << SymbolSizeStr << "| |" << S.SectionName << "\n";
887 SymbolList.clear();
890 static char getSymbolNMTypeChar(ELFObjectFileBase &Obj,
891 basic_symbol_iterator I) {
892 // OK, this is ELF
893 elf_symbol_iterator SymI(I);
895 Expected<elf_section_iterator> SecIOrErr = SymI->getSection();
896 if (!SecIOrErr) {
897 consumeError(SecIOrErr.takeError());
898 return '?';
901 uint8_t Binding = SymI->getBinding();
902 if (Binding == ELF::STB_GNU_UNIQUE)
903 return 'u';
905 assert(Binding != ELF::STB_WEAK && "STB_WEAK not tested in calling function");
906 if (Binding != ELF::STB_GLOBAL && Binding != ELF::STB_LOCAL)
907 return '?';
909 elf_section_iterator SecI = *SecIOrErr;
910 if (SecI != Obj.section_end()) {
911 uint32_t Type = SecI->getType();
912 uint64_t Flags = SecI->getFlags();
913 if (Flags & ELF::SHF_EXECINSTR)
914 return 't';
915 if (Type == ELF::SHT_NOBITS)
916 return 'b';
917 if (Flags & ELF::SHF_ALLOC)
918 return Flags & ELF::SHF_WRITE ? 'd' : 'r';
920 auto NameOrErr = SecI->getName();
921 if (!NameOrErr) {
922 consumeError(NameOrErr.takeError());
923 return '?';
925 if ((*NameOrErr).startswith(".debug"))
926 return 'N';
927 if (!(Flags & ELF::SHF_WRITE))
928 return 'n';
931 return '?';
934 static char getSymbolNMTypeChar(COFFObjectFile &Obj, symbol_iterator I) {
935 COFFSymbolRef Symb = Obj.getCOFFSymbol(*I);
936 // OK, this is COFF.
937 symbol_iterator SymI(I);
939 Expected<StringRef> Name = SymI->getName();
940 if (!Name) {
941 consumeError(Name.takeError());
942 return '?';
945 char Ret = StringSwitch<char>(*Name)
946 .StartsWith(".debug", 'N')
947 .StartsWith(".sxdata", 'N')
948 .Default('?');
950 if (Ret != '?')
951 return Ret;
953 uint32_t Characteristics = 0;
954 if (!COFF::isReservedSectionNumber(Symb.getSectionNumber())) {
955 Expected<section_iterator> SecIOrErr = SymI->getSection();
956 if (!SecIOrErr) {
957 consumeError(SecIOrErr.takeError());
958 return '?';
960 section_iterator SecI = *SecIOrErr;
961 const coff_section *Section = Obj.getCOFFSection(*SecI);
962 Characteristics = Section->Characteristics;
963 if (Expected<StringRef> NameOrErr = Obj.getSectionName(Section))
964 if (NameOrErr->startswith(".idata"))
965 return 'i';
968 switch (Symb.getSectionNumber()) {
969 case COFF::IMAGE_SYM_DEBUG:
970 return 'n';
971 default:
972 // Check section type.
973 if (Characteristics & COFF::IMAGE_SCN_CNT_CODE)
974 return 't';
975 if (Characteristics & COFF::IMAGE_SCN_CNT_INITIALIZED_DATA)
976 return Characteristics & COFF::IMAGE_SCN_MEM_WRITE ? 'd' : 'r';
977 if (Characteristics & COFF::IMAGE_SCN_CNT_UNINITIALIZED_DATA)
978 return 'b';
979 if (Characteristics & COFF::IMAGE_SCN_LNK_INFO)
980 return 'i';
981 // Check for section symbol.
982 if (Symb.isSectionDefinition())
983 return 's';
986 return '?';
989 static char getSymbolNMTypeChar(COFFImportFile &Obj) {
990 switch (Obj.getCOFFImportHeader()->getType()) {
991 case COFF::IMPORT_CODE:
992 return 't';
993 case COFF::IMPORT_DATA:
994 return 'd';
995 case COFF::IMPORT_CONST:
996 return 'r';
998 return '?';
1001 static char getSymbolNMTypeChar(MachOObjectFile &Obj, basic_symbol_iterator I) {
1002 DataRefImpl Symb = I->getRawDataRefImpl();
1003 uint8_t NType = Obj.is64Bit() ? Obj.getSymbol64TableEntry(Symb).n_type
1004 : Obj.getSymbolTableEntry(Symb).n_type;
1006 if (NType & MachO::N_STAB)
1007 return '-';
1009 switch (NType & MachO::N_TYPE) {
1010 case MachO::N_ABS:
1011 return 's';
1012 case MachO::N_INDR:
1013 return 'i';
1014 case MachO::N_SECT: {
1015 Expected<section_iterator> SecOrErr = Obj.getSymbolSection(Symb);
1016 if (!SecOrErr) {
1017 consumeError(SecOrErr.takeError());
1018 return 's';
1020 section_iterator Sec = *SecOrErr;
1021 if (Sec == Obj.section_end())
1022 return 's';
1023 DataRefImpl Ref = Sec->getRawDataRefImpl();
1024 StringRef SectionName;
1025 if (Expected<StringRef> NameOrErr = Obj.getSectionName(Ref))
1026 SectionName = *NameOrErr;
1027 StringRef SegmentName = Obj.getSectionFinalSegmentName(Ref);
1028 if (Obj.is64Bit() && Obj.getHeader64().filetype == MachO::MH_KEXT_BUNDLE &&
1029 SegmentName == "__TEXT_EXEC" && SectionName == "__text")
1030 return 't';
1031 if (SegmentName == "__TEXT" && SectionName == "__text")
1032 return 't';
1033 if (SegmentName == "__DATA" && SectionName == "__data")
1034 return 'd';
1035 if (SegmentName == "__DATA" && SectionName == "__bss")
1036 return 'b';
1037 return 's';
1041 return '?';
1044 static char getSymbolNMTypeChar(WasmObjectFile &Obj, basic_symbol_iterator I) {
1045 uint32_t Flags = I->getFlags();
1046 if (Flags & SymbolRef::SF_Executable)
1047 return 't';
1048 return 'd';
1051 static char getSymbolNMTypeChar(IRObjectFile &Obj, basic_symbol_iterator I) {
1052 uint32_t Flags = I->getFlags();
1053 // FIXME: should we print 'b'? At the IR level we cannot be sure if this
1054 // will be in bss or not, but we could approximate.
1055 if (Flags & SymbolRef::SF_Executable)
1056 return 't';
1057 else if (Triple(Obj.getTargetTriple()).isOSDarwin() &&
1058 (Flags & SymbolRef::SF_Const))
1059 return 's';
1060 else
1061 return 'd';
1064 static bool isObject(SymbolicFile &Obj, basic_symbol_iterator I) {
1065 return !dyn_cast<ELFObjectFileBase>(&Obj)
1066 ? false
1067 : elf_symbol_iterator(I)->getELFType() == ELF::STT_OBJECT;
1070 // For ELF object files, Set TypeName to the symbol typename, to be printed
1071 // in the 'Type' column of the SYSV format output.
1072 static StringRef getNMTypeName(SymbolicFile &Obj, basic_symbol_iterator I) {
1073 if (isa<ELFObjectFileBase>(&Obj)) {
1074 elf_symbol_iterator SymI(I);
1075 return SymI->getELFTypeName();
1077 return "";
1080 // Return Posix nm class type tag (single letter), but also set SecName and
1081 // section and name, to be used in format=sysv output.
1082 static char getNMSectionTagAndName(SymbolicFile &Obj, basic_symbol_iterator I,
1083 StringRef &SecName) {
1084 uint32_t Symflags = I->getFlags();
1085 if (ELFObjectFileBase *ELFObj = dyn_cast<ELFObjectFileBase>(&Obj)) {
1086 if (Symflags & object::SymbolRef::SF_Absolute)
1087 SecName = "*ABS*";
1088 else if (Symflags & object::SymbolRef::SF_Common)
1089 SecName = "*COM*";
1090 else if (Symflags & object::SymbolRef::SF_Undefined)
1091 SecName = "*UND*";
1092 else {
1093 elf_symbol_iterator SymI(I);
1094 Expected<elf_section_iterator> SecIOrErr = SymI->getSection();
1095 if (!SecIOrErr) {
1096 consumeError(SecIOrErr.takeError());
1097 return '?';
1100 if (*SecIOrErr == ELFObj->section_end())
1101 return '?';
1103 Expected<StringRef> NameOrErr = (*SecIOrErr)->getName();
1104 if (!NameOrErr) {
1105 consumeError(NameOrErr.takeError());
1106 return '?';
1108 SecName = *NameOrErr;
1112 if ((Symflags & object::SymbolRef::SF_Weak) && !isa<MachOObjectFile>(Obj)) {
1113 char Ret = isObject(Obj, I) ? 'v' : 'w';
1114 return (!(Symflags & object::SymbolRef::SF_Undefined)) ? toupper(Ret) : Ret;
1117 if (Symflags & object::SymbolRef::SF_Undefined)
1118 return 'U';
1120 if (Symflags & object::SymbolRef::SF_Common)
1121 return 'C';
1123 char Ret = '?';
1124 if (Symflags & object::SymbolRef::SF_Absolute)
1125 Ret = 'a';
1126 else if (IRObjectFile *IR = dyn_cast<IRObjectFile>(&Obj))
1127 Ret = getSymbolNMTypeChar(*IR, I);
1128 else if (COFFObjectFile *COFF = dyn_cast<COFFObjectFile>(&Obj))
1129 Ret = getSymbolNMTypeChar(*COFF, I);
1130 else if (COFFImportFile *COFFImport = dyn_cast<COFFImportFile>(&Obj))
1131 Ret = getSymbolNMTypeChar(*COFFImport);
1132 else if (MachOObjectFile *MachO = dyn_cast<MachOObjectFile>(&Obj))
1133 Ret = getSymbolNMTypeChar(*MachO, I);
1134 else if (WasmObjectFile *Wasm = dyn_cast<WasmObjectFile>(&Obj))
1135 Ret = getSymbolNMTypeChar(*Wasm, I);
1136 else
1137 Ret = getSymbolNMTypeChar(cast<ELFObjectFileBase>(Obj), I);
1139 if (!(Symflags & object::SymbolRef::SF_Global))
1140 return Ret;
1142 if (Obj.isELF() && ELFSymbolRef(*I).getBinding() == ELF::STB_GNU_UNIQUE)
1143 return Ret;
1145 return toupper(Ret);
1148 // getNsectForSegSect() is used to implement the Mach-O "-s segname sectname"
1149 // option to dump only those symbols from that section in a Mach-O file.
1150 // It is called once for each Mach-O file from dumpSymbolNamesFromObject()
1151 // to get the section number for that named section from the command line
1152 // arguments. It returns the section number for that section in the Mach-O
1153 // file or zero it is not present.
1154 static unsigned getNsectForSegSect(MachOObjectFile *Obj) {
1155 unsigned Nsect = 1;
1156 for (auto &S : Obj->sections()) {
1157 DataRefImpl Ref = S.getRawDataRefImpl();
1158 StringRef SectionName;
1159 if (Expected<StringRef> NameOrErr = Obj->getSectionName(Ref))
1160 SectionName = *NameOrErr;
1161 StringRef SegmentName = Obj->getSectionFinalSegmentName(Ref);
1162 if (SegmentName == SegSect[0] && SectionName == SegSect[1])
1163 return Nsect;
1164 Nsect++;
1166 return 0;
1169 // getNsectInMachO() is used to implement the Mach-O "-s segname sectname"
1170 // option to dump only those symbols from that section in a Mach-O file.
1171 // It is called once for each symbol in a Mach-O file from
1172 // dumpSymbolNamesFromObject() and returns the section number for that symbol
1173 // if it is in a section, else it returns 0.
1174 static unsigned getNsectInMachO(MachOObjectFile &Obj, BasicSymbolRef Sym) {
1175 DataRefImpl Symb = Sym.getRawDataRefImpl();
1176 if (Obj.is64Bit()) {
1177 MachO::nlist_64 STE = Obj.getSymbol64TableEntry(Symb);
1178 return (STE.n_type & MachO::N_TYPE) == MachO::N_SECT ? STE.n_sect : 0;
1180 MachO::nlist STE = Obj.getSymbolTableEntry(Symb);
1181 return (STE.n_type & MachO::N_TYPE) == MachO::N_SECT ? STE.n_sect : 0;
1184 static void
1185 dumpSymbolNamesFromObject(SymbolicFile &Obj, bool printName,
1186 const std::string &ArchiveName = std::string(),
1187 const std::string &ArchitectureName = std::string()) {
1188 auto Symbols = Obj.symbols();
1189 if (DynamicSyms) {
1190 const auto *E = dyn_cast<ELFObjectFileBase>(&Obj);
1191 if (!E) {
1192 error("File format has no dynamic symbol table", Obj.getFileName());
1193 return;
1195 Symbols = E->getDynamicSymbolIterators();
1197 std::string NameBuffer;
1198 raw_string_ostream OS(NameBuffer);
1199 // If a "-s segname sectname" option was specified and this is a Mach-O
1200 // file get the section number for that section in this object file.
1201 unsigned int Nsect = 0;
1202 MachOObjectFile *MachO = dyn_cast<MachOObjectFile>(&Obj);
1203 if (!SegSect.empty() && MachO) {
1204 Nsect = getNsectForSegSect(MachO);
1205 // If this section is not in the object file no symbols are printed.
1206 if (Nsect == 0)
1207 return;
1209 if (!MachO || !DyldInfoOnly) {
1210 for (BasicSymbolRef Sym : Symbols) {
1211 uint32_t SymFlags = Sym.getFlags();
1212 if (!DebugSyms && (SymFlags & SymbolRef::SF_FormatSpecific))
1213 continue;
1214 if (WithoutAliases && (SymFlags & SymbolRef::SF_Indirect))
1215 continue;
1216 // If a "-s segname sectname" option was specified and this is a Mach-O
1217 // file and this section appears in this file, Nsect will be non-zero then
1218 // see if this symbol is a symbol from that section and if not skip it.
1219 if (Nsect && Nsect != getNsectInMachO(*MachO, Sym))
1220 continue;
1221 NMSymbol S = {};
1222 S.Size = 0;
1223 S.Address = 0;
1224 if (isa<ELFObjectFileBase>(&Obj))
1225 S.Size = ELFSymbolRef(Sym).getSize();
1226 if (PrintAddress && isa<ObjectFile>(Obj)) {
1227 SymbolRef SymRef(Sym);
1228 Expected<uint64_t> AddressOrErr = SymRef.getAddress();
1229 if (!AddressOrErr) {
1230 consumeError(AddressOrErr.takeError());
1231 break;
1233 S.Address = *AddressOrErr;
1235 S.TypeName = getNMTypeName(Obj, Sym);
1236 S.TypeChar = getNMSectionTagAndName(Obj, Sym, S.SectionName);
1237 if (Error E = Sym.printName(OS)) {
1238 if (MachO) {
1239 OS << "bad string index";
1240 consumeError(std::move(E));
1241 } else
1242 error(std::move(E), Obj.getFileName());
1244 OS << '\0';
1245 S.Sym = Sym;
1246 SymbolList.push_back(S);
1250 OS.flush();
1251 const char *P = NameBuffer.c_str();
1252 unsigned I;
1253 for (I = 0; I < SymbolList.size(); ++I) {
1254 SymbolList[I].Name = P;
1255 P += strlen(P) + 1;
1258 // If this is a Mach-O file where the nlist symbol table is out of sync
1259 // with the dyld export trie then look through exports and fake up symbols
1260 // for the ones that are missing (also done with the -add-dyldinfo flag).
1261 // This is needed if strip(1) -T is run on a binary containing swift
1262 // language symbols for example. The option -only-dyldinfo will fake up
1263 // all symbols from the dyld export trie as well as the bind info.
1264 std::string ExportsNameBuffer;
1265 raw_string_ostream EOS(ExportsNameBuffer);
1266 std::string BindsNameBuffer;
1267 raw_string_ostream BOS(BindsNameBuffer);
1268 std::string LazysNameBuffer;
1269 raw_string_ostream LOS(LazysNameBuffer);
1270 std::string WeaksNameBuffer;
1271 raw_string_ostream WOS(WeaksNameBuffer);
1272 std::string FunctionStartsNameBuffer;
1273 raw_string_ostream FOS(FunctionStartsNameBuffer);
1274 if (MachO && !NoDyldInfo) {
1275 MachO::mach_header H;
1276 MachO::mach_header_64 H_64;
1277 uint32_t HFlags = 0;
1278 if (MachO->is64Bit()) {
1279 H_64 = MachO->MachOObjectFile::getHeader64();
1280 HFlags = H_64.flags;
1281 } else {
1282 H = MachO->MachOObjectFile::getHeader();
1283 HFlags = H.flags;
1285 uint64_t BaseSegmentAddress = 0;
1286 for (const auto &Command : MachO->load_commands()) {
1287 if (Command.C.cmd == MachO::LC_SEGMENT) {
1288 MachO::segment_command Seg = MachO->getSegmentLoadCommand(Command);
1289 if (Seg.fileoff == 0 && Seg.filesize != 0) {
1290 BaseSegmentAddress = Seg.vmaddr;
1291 break;
1293 } else if (Command.C.cmd == MachO::LC_SEGMENT_64) {
1294 MachO::segment_command_64 Seg = MachO->getSegment64LoadCommand(Command);
1295 if (Seg.fileoff == 0 && Seg.filesize != 0) {
1296 BaseSegmentAddress = Seg.vmaddr;
1297 break;
1301 if (DyldInfoOnly || AddDyldInfo ||
1302 HFlags & MachO::MH_NLIST_OUTOFSYNC_WITH_DYLDINFO) {
1303 unsigned ExportsAdded = 0;
1304 Error Err = Error::success();
1305 for (const llvm::object::ExportEntry &Entry : MachO->exports(Err)) {
1306 bool found = false;
1307 bool ReExport = false;
1308 if (!DyldInfoOnly) {
1309 for (const NMSymbol &S : SymbolList)
1310 if (S.Address == Entry.address() + BaseSegmentAddress &&
1311 S.Name == Entry.name()) {
1312 found = true;
1313 break;
1316 if (!found) {
1317 NMSymbol S = {};
1318 S.Address = Entry.address() + BaseSegmentAddress;
1319 S.Size = 0;
1320 S.TypeChar = '\0';
1321 S.Name = Entry.name();
1322 // There is no symbol in the nlist symbol table for this so we set
1323 // Sym effectivly to null and the rest of code in here must test for
1324 // it and not do things like Sym.getFlags() for it.
1325 S.Sym = BasicSymbolRef();
1326 S.SymFlags = SymbolRef::SF_Global;
1327 S.Section = SectionRef();
1328 S.NType = 0;
1329 S.NSect = 0;
1330 S.NDesc = 0;
1331 S.IndirectName = StringRef();
1333 uint64_t EFlags = Entry.flags();
1334 bool Abs = ((EFlags & MachO::EXPORT_SYMBOL_FLAGS_KIND_MASK) ==
1335 MachO::EXPORT_SYMBOL_FLAGS_KIND_ABSOLUTE);
1336 bool Resolver = (EFlags &
1337 MachO::EXPORT_SYMBOL_FLAGS_STUB_AND_RESOLVER);
1338 ReExport = (EFlags & MachO::EXPORT_SYMBOL_FLAGS_REEXPORT);
1339 bool WeakDef = (EFlags & MachO::EXPORT_SYMBOL_FLAGS_WEAK_DEFINITION);
1340 if (WeakDef)
1341 S.NDesc |= MachO::N_WEAK_DEF;
1342 if (Abs) {
1343 S.NType = MachO::N_EXT | MachO::N_ABS;
1344 S.TypeChar = 'A';
1345 } else if (ReExport) {
1346 S.NType = MachO::N_EXT | MachO::N_INDR;
1347 S.TypeChar = 'I';
1348 } else {
1349 S.NType = MachO::N_EXT | MachO::N_SECT;
1350 if (Resolver) {
1351 S.Address = Entry.other() + BaseSegmentAddress;
1352 if ((S.Address & 1) != 0 &&
1353 !MachO->is64Bit() && H.cputype == MachO::CPU_TYPE_ARM){
1354 S.Address &= ~1LL;
1355 S.NDesc |= MachO::N_ARM_THUMB_DEF;
1357 } else {
1358 S.Address = Entry.address() + BaseSegmentAddress;
1360 StringRef SegmentName = StringRef();
1361 StringRef SectionName = StringRef();
1362 for (const SectionRef &Section : MachO->sections()) {
1363 S.NSect++;
1365 if (Expected<StringRef> NameOrErr = Section.getName())
1366 SectionName = *NameOrErr;
1367 else
1368 consumeError(NameOrErr.takeError());
1370 SegmentName = MachO->getSectionFinalSegmentName(
1371 Section.getRawDataRefImpl());
1372 if (S.Address >= Section.getAddress() &&
1373 S.Address < Section.getAddress() + Section.getSize()) {
1374 S.Section = Section;
1375 break;
1376 } else if (Entry.name() == "__mh_execute_header" &&
1377 SegmentName == "__TEXT" && SectionName == "__text") {
1378 S.Section = Section;
1379 S.NDesc |= MachO::REFERENCED_DYNAMICALLY;
1380 break;
1383 if (SegmentName == "__TEXT" && SectionName == "__text")
1384 S.TypeChar = 'T';
1385 else if (SegmentName == "__DATA" && SectionName == "__data")
1386 S.TypeChar = 'D';
1387 else if (SegmentName == "__DATA" && SectionName == "__bss")
1388 S.TypeChar = 'B';
1389 else
1390 S.TypeChar = 'S';
1392 SymbolList.push_back(S);
1394 EOS << Entry.name();
1395 EOS << '\0';
1396 ExportsAdded++;
1398 // For ReExports there are a two more things to do, first add the
1399 // indirect name and second create the undefined symbol using the
1400 // referened dynamic library.
1401 if (ReExport) {
1403 // Add the indirect name.
1404 if (Entry.otherName().empty())
1405 EOS << Entry.name();
1406 else
1407 EOS << Entry.otherName();
1408 EOS << '\0';
1410 // Now create the undefined symbol using the referened dynamic
1411 // library.
1412 NMSymbol U = {};
1413 U.Address = 0;
1414 U.Size = 0;
1415 U.TypeChar = 'U';
1416 if (Entry.otherName().empty())
1417 U.Name = Entry.name();
1418 else
1419 U.Name = Entry.otherName();
1420 // Again there is no symbol in the nlist symbol table for this so
1421 // we set Sym effectivly to null and the rest of code in here must
1422 // test for it and not do things like Sym.getFlags() for it.
1423 U.Sym = BasicSymbolRef();
1424 U.SymFlags = SymbolRef::SF_Global | SymbolRef::SF_Undefined;
1425 U.Section = SectionRef();
1426 U.NType = MachO::N_EXT | MachO::N_UNDF;
1427 U.NSect = 0;
1428 U.NDesc = 0;
1429 // The library ordinal for this undefined symbol is in the export
1430 // trie Entry.other().
1431 MachO::SET_LIBRARY_ORDINAL(U.NDesc, Entry.other());
1432 U.IndirectName = StringRef();
1433 SymbolList.push_back(U);
1435 // Finally add the undefined symbol's name.
1436 if (Entry.otherName().empty())
1437 EOS << Entry.name();
1438 else
1439 EOS << Entry.otherName();
1440 EOS << '\0';
1441 ExportsAdded++;
1445 if (Err)
1446 error(std::move(Err), MachO->getFileName());
1447 // Set the symbol names and indirect names for the added symbols.
1448 if (ExportsAdded) {
1449 EOS.flush();
1450 const char *Q = ExportsNameBuffer.c_str();
1451 for (unsigned K = 0; K < ExportsAdded; K++) {
1452 SymbolList[I].Name = Q;
1453 Q += strlen(Q) + 1;
1454 if (SymbolList[I].TypeChar == 'I') {
1455 SymbolList[I].IndirectName = Q;
1456 Q += strlen(Q) + 1;
1458 I++;
1462 // Add the undefined symbols from the bind entries.
1463 unsigned BindsAdded = 0;
1464 Error BErr = Error::success();
1465 StringRef LastSymbolName = StringRef();
1466 for (const llvm::object::MachOBindEntry &Entry : MachO->bindTable(BErr)) {
1467 bool found = false;
1468 if (LastSymbolName == Entry.symbolName())
1469 found = true;
1470 else if(!DyldInfoOnly) {
1471 for (unsigned J = 0; J < SymbolList.size() && !found; ++J) {
1472 if (SymbolList[J].Name == Entry.symbolName())
1473 found = true;
1476 if (!found) {
1477 LastSymbolName = Entry.symbolName();
1478 NMSymbol B = {};
1479 B.Address = 0;
1480 B.Size = 0;
1481 B.TypeChar = 'U';
1482 // There is no symbol in the nlist symbol table for this so we set
1483 // Sym effectivly to null and the rest of code in here must test for
1484 // it and not do things like Sym.getFlags() for it.
1485 B.Sym = BasicSymbolRef();
1486 B.SymFlags = SymbolRef::SF_Global | SymbolRef::SF_Undefined;
1487 B.NType = MachO::N_EXT | MachO::N_UNDF;
1488 B.NSect = 0;
1489 B.NDesc = 0;
1490 MachO::SET_LIBRARY_ORDINAL(B.NDesc, Entry.ordinal());
1491 B.IndirectName = StringRef();
1492 B.Name = Entry.symbolName();
1493 SymbolList.push_back(B);
1494 BOS << Entry.symbolName();
1495 BOS << '\0';
1496 BindsAdded++;
1499 if (BErr)
1500 error(std::move(BErr), MachO->getFileName());
1501 // Set the symbol names and indirect names for the added symbols.
1502 if (BindsAdded) {
1503 BOS.flush();
1504 const char *Q = BindsNameBuffer.c_str();
1505 for (unsigned K = 0; K < BindsAdded; K++) {
1506 SymbolList[I].Name = Q;
1507 Q += strlen(Q) + 1;
1508 if (SymbolList[I].TypeChar == 'I') {
1509 SymbolList[I].IndirectName = Q;
1510 Q += strlen(Q) + 1;
1512 I++;
1516 // Add the undefined symbols from the lazy bind entries.
1517 unsigned LazysAdded = 0;
1518 Error LErr = Error::success();
1519 LastSymbolName = StringRef();
1520 for (const llvm::object::MachOBindEntry &Entry :
1521 MachO->lazyBindTable(LErr)) {
1522 bool found = false;
1523 if (LastSymbolName == Entry.symbolName())
1524 found = true;
1525 else {
1526 // Here we must check to see it this symbol is already in the
1527 // SymbolList as it might have already have been added above via a
1528 // non-lazy (bind) entry.
1529 for (unsigned J = 0; J < SymbolList.size() && !found; ++J) {
1530 if (SymbolList[J].Name == Entry.symbolName())
1531 found = true;
1534 if (!found) {
1535 LastSymbolName = Entry.symbolName();
1536 NMSymbol L = {};
1537 L.Name = Entry.symbolName();
1538 L.Address = 0;
1539 L.Size = 0;
1540 L.TypeChar = 'U';
1541 // There is no symbol in the nlist symbol table for this so we set
1542 // Sym effectivly to null and the rest of code in here must test for
1543 // it and not do things like Sym.getFlags() for it.
1544 L.Sym = BasicSymbolRef();
1545 L.SymFlags = SymbolRef::SF_Global | SymbolRef::SF_Undefined;
1546 L.NType = MachO::N_EXT | MachO::N_UNDF;
1547 L.NSect = 0;
1548 // The REFERENCE_FLAG_UNDEFINED_LAZY is no longer used but here it
1549 // makes sence since we are creating this from a lazy bind entry.
1550 L.NDesc = MachO::REFERENCE_FLAG_UNDEFINED_LAZY;
1551 MachO::SET_LIBRARY_ORDINAL(L.NDesc, Entry.ordinal());
1552 L.IndirectName = StringRef();
1553 SymbolList.push_back(L);
1554 LOS << Entry.symbolName();
1555 LOS << '\0';
1556 LazysAdded++;
1559 if (LErr)
1560 error(std::move(LErr), MachO->getFileName());
1561 // Set the symbol names and indirect names for the added symbols.
1562 if (LazysAdded) {
1563 LOS.flush();
1564 const char *Q = LazysNameBuffer.c_str();
1565 for (unsigned K = 0; K < LazysAdded; K++) {
1566 SymbolList[I].Name = Q;
1567 Q += strlen(Q) + 1;
1568 if (SymbolList[I].TypeChar == 'I') {
1569 SymbolList[I].IndirectName = Q;
1570 Q += strlen(Q) + 1;
1572 I++;
1576 // Add the undefineds symbol from the weak bind entries which are not
1577 // strong symbols.
1578 unsigned WeaksAdded = 0;
1579 Error WErr = Error::success();
1580 LastSymbolName = StringRef();
1581 for (const llvm::object::MachOBindEntry &Entry :
1582 MachO->weakBindTable(WErr)) {
1583 bool found = false;
1584 unsigned J = 0;
1585 if (LastSymbolName == Entry.symbolName() ||
1586 Entry.flags() & MachO::BIND_SYMBOL_FLAGS_NON_WEAK_DEFINITION) {
1587 found = true;
1588 } else {
1589 for (J = 0; J < SymbolList.size() && !found; ++J) {
1590 if (SymbolList[J].Name == Entry.symbolName()) {
1591 found = true;
1592 break;
1596 if (!found) {
1597 LastSymbolName = Entry.symbolName();
1598 NMSymbol W;
1599 memset(&W, '\0', sizeof(NMSymbol));
1600 W.Name = Entry.symbolName();
1601 W.Address = 0;
1602 W.Size = 0;
1603 W.TypeChar = 'U';
1604 // There is no symbol in the nlist symbol table for this so we set
1605 // Sym effectivly to null and the rest of code in here must test for
1606 // it and not do things like Sym.getFlags() for it.
1607 W.Sym = BasicSymbolRef();
1608 W.SymFlags = SymbolRef::SF_Global | SymbolRef::SF_Undefined;
1609 W.NType = MachO::N_EXT | MachO::N_UNDF;
1610 W.NSect = 0;
1611 // Odd that we are using N_WEAK_DEF on an undefined symbol but that is
1612 // what is created in this case by the linker when there are real
1613 // symbols in the nlist structs.
1614 W.NDesc = MachO::N_WEAK_DEF;
1615 W.IndirectName = StringRef();
1616 SymbolList.push_back(W);
1617 WOS << Entry.symbolName();
1618 WOS << '\0';
1619 WeaksAdded++;
1620 } else {
1621 // This is the case the symbol was previously been found and it could
1622 // have been added from a bind or lazy bind symbol. If so and not
1623 // a definition also mark it as weak.
1624 if (SymbolList[J].TypeChar == 'U')
1625 // See comment above about N_WEAK_DEF.
1626 SymbolList[J].NDesc |= MachO::N_WEAK_DEF;
1629 if (WErr)
1630 error(std::move(WErr), MachO->getFileName());
1631 // Set the symbol names and indirect names for the added symbols.
1632 if (WeaksAdded) {
1633 WOS.flush();
1634 const char *Q = WeaksNameBuffer.c_str();
1635 for (unsigned K = 0; K < WeaksAdded; K++) {
1636 SymbolList[I].Name = Q;
1637 Q += strlen(Q) + 1;
1638 if (SymbolList[I].TypeChar == 'I') {
1639 SymbolList[I].IndirectName = Q;
1640 Q += strlen(Q) + 1;
1642 I++;
1646 // Trying adding symbol from the function starts table and LC_MAIN entry
1647 // point.
1648 SmallVector<uint64_t, 8> FoundFns;
1649 uint64_t lc_main_offset = UINT64_MAX;
1650 for (const auto &Command : MachO->load_commands()) {
1651 if (Command.C.cmd == MachO::LC_FUNCTION_STARTS) {
1652 // We found a function starts segment, parse the addresses for
1653 // consumption.
1654 MachO::linkedit_data_command LLC =
1655 MachO->getLinkeditDataLoadCommand(Command);
1657 MachO->ReadULEB128s(LLC.dataoff, FoundFns);
1658 } else if (Command.C.cmd == MachO::LC_MAIN) {
1659 MachO::entry_point_command LCmain =
1660 MachO->getEntryPointCommand(Command);
1661 lc_main_offset = LCmain.entryoff;
1664 // See if these addresses are already in the symbol table.
1665 unsigned FunctionStartsAdded = 0;
1666 for (uint64_t f = 0; f < FoundFns.size(); f++) {
1667 bool found = false;
1668 for (unsigned J = 0; J < SymbolList.size() && !found; ++J) {
1669 if (SymbolList[J].Address == FoundFns[f] + BaseSegmentAddress)
1670 found = true;
1672 // See this address is not already in the symbol table fake up an
1673 // nlist for it.
1674 if (!found) {
1675 NMSymbol F = {};
1676 F.Name = "<redacted function X>";
1677 F.Address = FoundFns[f] + BaseSegmentAddress;
1678 F.Size = 0;
1679 // There is no symbol in the nlist symbol table for this so we set
1680 // Sym effectivly to null and the rest of code in here must test for
1681 // it and not do things like Sym.getFlags() for it.
1682 F.Sym = BasicSymbolRef();
1683 F.SymFlags = 0;
1684 F.NType = MachO::N_SECT;
1685 F.NSect = 0;
1686 StringRef SegmentName = StringRef();
1687 StringRef SectionName = StringRef();
1688 for (const SectionRef &Section : MachO->sections()) {
1689 if (Expected<StringRef> NameOrErr = Section.getName())
1690 SectionName = *NameOrErr;
1691 else
1692 consumeError(NameOrErr.takeError());
1694 SegmentName = MachO->getSectionFinalSegmentName(
1695 Section.getRawDataRefImpl());
1696 F.NSect++;
1697 if (F.Address >= Section.getAddress() &&
1698 F.Address < Section.getAddress() + Section.getSize()) {
1699 F.Section = Section;
1700 break;
1703 if (SegmentName == "__TEXT" && SectionName == "__text")
1704 F.TypeChar = 't';
1705 else if (SegmentName == "__DATA" && SectionName == "__data")
1706 F.TypeChar = 'd';
1707 else if (SegmentName == "__DATA" && SectionName == "__bss")
1708 F.TypeChar = 'b';
1709 else
1710 F.TypeChar = 's';
1711 F.NDesc = 0;
1712 F.IndirectName = StringRef();
1713 SymbolList.push_back(F);
1714 if (FoundFns[f] == lc_main_offset)
1715 FOS << "<redacted LC_MAIN>";
1716 else
1717 FOS << "<redacted function " << f << ">";
1718 FOS << '\0';
1719 FunctionStartsAdded++;
1722 if (FunctionStartsAdded) {
1723 FOS.flush();
1724 const char *Q = FunctionStartsNameBuffer.c_str();
1725 for (unsigned K = 0; K < FunctionStartsAdded; K++) {
1726 SymbolList[I].Name = Q;
1727 Q += strlen(Q) + 1;
1728 if (SymbolList[I].TypeChar == 'I') {
1729 SymbolList[I].IndirectName = Q;
1730 Q += strlen(Q) + 1;
1732 I++;
1738 CurrentFilename = Obj.getFileName();
1739 sortAndPrintSymbolList(Obj, printName, ArchiveName, ArchitectureName);
1742 // checkMachOAndArchFlags() checks to see if the SymbolicFile is a Mach-O file
1743 // and if it is and there is a list of architecture flags is specified then
1744 // check to make sure this Mach-O file is one of those architectures or all
1745 // architectures was specificed. If not then an error is generated and this
1746 // routine returns false. Else it returns true.
1747 static bool checkMachOAndArchFlags(SymbolicFile *O, std::string &Filename) {
1748 auto *MachO = dyn_cast<MachOObjectFile>(O);
1750 if (!MachO || ArchAll || ArchFlags.empty())
1751 return true;
1753 MachO::mach_header H;
1754 MachO::mach_header_64 H_64;
1755 Triple T;
1756 const char *McpuDefault, *ArchFlag;
1757 if (MachO->is64Bit()) {
1758 H_64 = MachO->MachOObjectFile::getHeader64();
1759 T = MachOObjectFile::getArchTriple(H_64.cputype, H_64.cpusubtype,
1760 &McpuDefault, &ArchFlag);
1761 } else {
1762 H = MachO->MachOObjectFile::getHeader();
1763 T = MachOObjectFile::getArchTriple(H.cputype, H.cpusubtype,
1764 &McpuDefault, &ArchFlag);
1766 const std::string ArchFlagName(ArchFlag);
1767 if (none_of(ArchFlags, [&](const std::string &Name) {
1768 return Name == ArchFlagName;
1769 })) {
1770 error("No architecture specified", Filename);
1771 return false;
1773 return true;
1776 static void dumpSymbolNamesFromFile(std::string &Filename) {
1777 ErrorOr<std::unique_ptr<MemoryBuffer>> BufferOrErr =
1778 MemoryBuffer::getFileOrSTDIN(Filename);
1779 if (error(BufferOrErr.getError(), Filename))
1780 return;
1782 LLVMContext Context;
1783 LLVMContext *ContextPtr = NoLLVMBitcode ? nullptr : &Context;
1784 Expected<std::unique_ptr<Binary>> BinaryOrErr =
1785 createBinary(BufferOrErr.get()->getMemBufferRef(), ContextPtr);
1786 if (!BinaryOrErr) {
1787 error(BinaryOrErr.takeError(), Filename);
1788 return;
1790 Binary &Bin = *BinaryOrErr.get();
1792 if (Archive *A = dyn_cast<Archive>(&Bin)) {
1793 if (ArchiveMap) {
1794 Archive::symbol_iterator I = A->symbol_begin();
1795 Archive::symbol_iterator E = A->symbol_end();
1796 if (I != E) {
1797 outs() << "Archive map\n";
1798 for (; I != E; ++I) {
1799 Expected<Archive::Child> C = I->getMember();
1800 if (!C) {
1801 error(C.takeError(), Filename);
1802 break;
1804 Expected<StringRef> FileNameOrErr = C->getName();
1805 if (!FileNameOrErr) {
1806 error(FileNameOrErr.takeError(), Filename);
1807 break;
1809 StringRef SymName = I->getName();
1810 outs() << SymName << " in " << FileNameOrErr.get() << "\n";
1812 outs() << "\n";
1817 Error Err = Error::success();
1818 for (auto &C : A->children(Err)) {
1819 Expected<std::unique_ptr<Binary>> ChildOrErr =
1820 C.getAsBinary(ContextPtr);
1821 if (!ChildOrErr) {
1822 if (auto E = isNotObjectErrorInvalidFileType(ChildOrErr.takeError()))
1823 error(std::move(E), Filename, C);
1824 continue;
1826 if (SymbolicFile *O = dyn_cast<SymbolicFile>(&*ChildOrErr.get())) {
1827 if (!MachOPrintSizeWarning && PrintSize && isa<MachOObjectFile>(O)) {
1828 WithColor::warning(errs(), ToolName)
1829 << "sizes with -print-size for Mach-O files are always zero.\n";
1830 MachOPrintSizeWarning = true;
1832 if (!checkMachOAndArchFlags(O, Filename))
1833 return;
1834 if (!PrintFileName) {
1835 outs() << "\n";
1836 if (isa<MachOObjectFile>(O)) {
1837 outs() << Filename << "(" << O->getFileName() << ")";
1838 } else
1839 outs() << O->getFileName();
1840 outs() << ":\n";
1842 dumpSymbolNamesFromObject(*O, false, Filename);
1845 if (Err)
1846 error(std::move(Err), A->getFileName());
1848 return;
1850 if (MachOUniversalBinary *UB = dyn_cast<MachOUniversalBinary>(&Bin)) {
1851 // If we have a list of architecture flags specified dump only those.
1852 if (!ArchAll && !ArchFlags.empty()) {
1853 // Look for a slice in the universal binary that matches each ArchFlag.
1854 bool ArchFound;
1855 for (unsigned i = 0; i < ArchFlags.size(); ++i) {
1856 ArchFound = false;
1857 for (MachOUniversalBinary::object_iterator I = UB->begin_objects(),
1858 E = UB->end_objects();
1859 I != E; ++I) {
1860 if (ArchFlags[i] == I->getArchFlagName()) {
1861 ArchFound = true;
1862 Expected<std::unique_ptr<ObjectFile>> ObjOrErr =
1863 I->getAsObjectFile();
1864 std::string ArchiveName;
1865 std::string ArchitectureName;
1866 ArchiveName.clear();
1867 ArchitectureName.clear();
1868 if (ObjOrErr) {
1869 ObjectFile &Obj = *ObjOrErr.get();
1870 if (ArchFlags.size() > 1) {
1871 if (PrintFileName)
1872 ArchitectureName = I->getArchFlagName();
1873 else
1874 outs() << "\n" << Obj.getFileName() << " (for architecture "
1875 << I->getArchFlagName() << ")"
1876 << ":\n";
1878 dumpSymbolNamesFromObject(Obj, false, ArchiveName,
1879 ArchitectureName);
1880 } else if (auto E = isNotObjectErrorInvalidFileType(
1881 ObjOrErr.takeError())) {
1882 error(std::move(E), Filename, ArchFlags.size() > 1 ?
1883 StringRef(I->getArchFlagName()) : StringRef());
1884 continue;
1885 } else if (Expected<std::unique_ptr<Archive>> AOrErr =
1886 I->getAsArchive()) {
1887 std::unique_ptr<Archive> &A = *AOrErr;
1888 Error Err = Error::success();
1889 for (auto &C : A->children(Err)) {
1890 Expected<std::unique_ptr<Binary>> ChildOrErr =
1891 C.getAsBinary(ContextPtr);
1892 if (!ChildOrErr) {
1893 if (auto E = isNotObjectErrorInvalidFileType(
1894 ChildOrErr.takeError())) {
1895 error(std::move(E), Filename, C, ArchFlags.size() > 1 ?
1896 StringRef(I->getArchFlagName()) : StringRef());
1898 continue;
1900 if (SymbolicFile *O =
1901 dyn_cast<SymbolicFile>(&*ChildOrErr.get())) {
1902 if (PrintFileName) {
1903 ArchiveName = A->getFileName();
1904 if (ArchFlags.size() > 1)
1905 ArchitectureName = I->getArchFlagName();
1906 } else {
1907 outs() << "\n" << A->getFileName();
1908 outs() << "(" << O->getFileName() << ")";
1909 if (ArchFlags.size() > 1) {
1910 outs() << " (for architecture " << I->getArchFlagName()
1911 << ")";
1913 outs() << ":\n";
1915 dumpSymbolNamesFromObject(*O, false, ArchiveName,
1916 ArchitectureName);
1919 if (Err)
1920 error(std::move(Err), A->getFileName());
1921 } else {
1922 consumeError(AOrErr.takeError());
1923 error(Filename + " for architecture " +
1924 StringRef(I->getArchFlagName()) +
1925 " is not a Mach-O file or an archive file",
1926 "Mach-O universal file");
1930 if (!ArchFound) {
1931 error(ArchFlags[i],
1932 "file: " + Filename + " does not contain architecture");
1933 return;
1936 return;
1938 // No architecture flags were specified so if this contains a slice that
1939 // matches the host architecture dump only that.
1940 if (!ArchAll) {
1941 Triple HostTriple = MachOObjectFile::getHostArch();
1942 StringRef HostArchName = HostTriple.getArchName();
1943 for (MachOUniversalBinary::object_iterator I = UB->begin_objects(),
1944 E = UB->end_objects();
1945 I != E; ++I) {
1946 if (HostArchName == I->getArchFlagName()) {
1947 Expected<std::unique_ptr<ObjectFile>> ObjOrErr = I->getAsObjectFile();
1948 std::string ArchiveName;
1949 if (ObjOrErr) {
1950 ObjectFile &Obj = *ObjOrErr.get();
1951 dumpSymbolNamesFromObject(Obj, false);
1952 } else if (auto E = isNotObjectErrorInvalidFileType(
1953 ObjOrErr.takeError())) {
1954 error(std::move(E), Filename);
1955 return;
1956 } else if (Expected<std::unique_ptr<Archive>> AOrErr =
1957 I->getAsArchive()) {
1958 std::unique_ptr<Archive> &A = *AOrErr;
1959 Error Err = Error::success();
1960 for (auto &C : A->children(Err)) {
1961 Expected<std::unique_ptr<Binary>> ChildOrErr =
1962 C.getAsBinary(ContextPtr);
1963 if (!ChildOrErr) {
1964 if (auto E = isNotObjectErrorInvalidFileType(
1965 ChildOrErr.takeError()))
1966 error(std::move(E), Filename, C);
1967 continue;
1969 if (SymbolicFile *O =
1970 dyn_cast<SymbolicFile>(&*ChildOrErr.get())) {
1971 if (PrintFileName)
1972 ArchiveName = A->getFileName();
1973 else
1974 outs() << "\n" << A->getFileName() << "(" << O->getFileName()
1975 << ")"
1976 << ":\n";
1977 dumpSymbolNamesFromObject(*O, false, ArchiveName);
1980 if (Err)
1981 error(std::move(Err), A->getFileName());
1982 } else {
1983 consumeError(AOrErr.takeError());
1984 error(Filename + " for architecture " +
1985 StringRef(I->getArchFlagName()) +
1986 " is not a Mach-O file or an archive file",
1987 "Mach-O universal file");
1989 return;
1993 // Either all architectures have been specified or none have been specified
1994 // and this does not contain the host architecture so dump all the slices.
1995 bool moreThanOneArch = UB->getNumberOfObjects() > 1;
1996 for (const MachOUniversalBinary::ObjectForArch &O : UB->objects()) {
1997 Expected<std::unique_ptr<ObjectFile>> ObjOrErr = O.getAsObjectFile();
1998 std::string ArchiveName;
1999 std::string ArchitectureName;
2000 ArchiveName.clear();
2001 ArchitectureName.clear();
2002 if (ObjOrErr) {
2003 ObjectFile &Obj = *ObjOrErr.get();
2004 if (PrintFileName) {
2005 if (isa<MachOObjectFile>(Obj) && moreThanOneArch)
2006 ArchitectureName = O.getArchFlagName();
2007 } else {
2008 if (moreThanOneArch)
2009 outs() << "\n";
2010 outs() << Obj.getFileName();
2011 if (isa<MachOObjectFile>(Obj) && moreThanOneArch)
2012 outs() << " (for architecture " << O.getArchFlagName() << ")";
2013 outs() << ":\n";
2015 dumpSymbolNamesFromObject(Obj, false, ArchiveName, ArchitectureName);
2016 } else if (auto E = isNotObjectErrorInvalidFileType(
2017 ObjOrErr.takeError())) {
2018 error(std::move(E), Filename, moreThanOneArch ?
2019 StringRef(O.getArchFlagName()) : StringRef());
2020 continue;
2021 } else if (Expected<std::unique_ptr<Archive>> AOrErr =
2022 O.getAsArchive()) {
2023 std::unique_ptr<Archive> &A = *AOrErr;
2024 Error Err = Error::success();
2025 for (auto &C : A->children(Err)) {
2026 Expected<std::unique_ptr<Binary>> ChildOrErr =
2027 C.getAsBinary(ContextPtr);
2028 if (!ChildOrErr) {
2029 if (auto E = isNotObjectErrorInvalidFileType(
2030 ChildOrErr.takeError()))
2031 error(std::move(E), Filename, C, moreThanOneArch ?
2032 StringRef(ArchitectureName) : StringRef());
2033 continue;
2035 if (SymbolicFile *F = dyn_cast<SymbolicFile>(&*ChildOrErr.get())) {
2036 if (PrintFileName) {
2037 ArchiveName = A->getFileName();
2038 if (isa<MachOObjectFile>(F) && moreThanOneArch)
2039 ArchitectureName = O.getArchFlagName();
2040 } else {
2041 outs() << "\n" << A->getFileName();
2042 if (isa<MachOObjectFile>(F)) {
2043 outs() << "(" << F->getFileName() << ")";
2044 if (moreThanOneArch)
2045 outs() << " (for architecture " << O.getArchFlagName()
2046 << ")";
2047 } else
2048 outs() << ":" << F->getFileName();
2049 outs() << ":\n";
2051 dumpSymbolNamesFromObject(*F, false, ArchiveName, ArchitectureName);
2054 if (Err)
2055 error(std::move(Err), A->getFileName());
2056 } else {
2057 consumeError(AOrErr.takeError());
2058 error(Filename + " for architecture " +
2059 StringRef(O.getArchFlagName()) +
2060 " is not a Mach-O file or an archive file",
2061 "Mach-O universal file");
2064 return;
2066 if (SymbolicFile *O = dyn_cast<SymbolicFile>(&Bin)) {
2067 if (!MachOPrintSizeWarning && PrintSize && isa<MachOObjectFile>(O)) {
2068 WithColor::warning(errs(), ToolName)
2069 << "sizes with --print-size for Mach-O files are always zero.\n";
2070 MachOPrintSizeWarning = true;
2072 if (!checkMachOAndArchFlags(O, Filename))
2073 return;
2074 dumpSymbolNamesFromObject(*O, true);
2078 int main(int argc, char **argv) {
2079 InitLLVM X(argc, argv);
2080 cl::HideUnrelatedOptions(NMCat);
2081 cl::ParseCommandLineOptions(argc, argv, "llvm symbol table dumper\n");
2083 // llvm-nm only reads binary files.
2084 if (error(sys::ChangeStdinToBinary()))
2085 return 1;
2087 // These calls are needed so that we can read bitcode correctly.
2088 llvm::InitializeAllTargetInfos();
2089 llvm::InitializeAllTargetMCs();
2090 llvm::InitializeAllAsmParsers();
2092 ToolName = argv[0];
2093 if (BSDFormat)
2094 OutputFormat = bsd;
2095 if (POSIXFormat)
2096 OutputFormat = posix;
2097 if (DarwinFormat)
2098 OutputFormat = darwin;
2100 // The relative order of these is important. If you pass --size-sort it should
2101 // only print out the size. However, if you pass -S --size-sort, it should
2102 // print out both the size and address.
2103 if (SizeSort && !PrintSize)
2104 PrintAddress = false;
2105 if (OutputFormat == sysv || SizeSort)
2106 PrintSize = true;
2107 if (InputFilenames.empty())
2108 InputFilenames.push_back("a.out");
2109 if (InputFilenames.size() > 1)
2110 MultipleFiles = true;
2112 // If both --demangle and --no-demangle are specified then pick the last one.
2113 if (NoDemangle.getPosition() > Demangle.getPosition())
2114 Demangle = !NoDemangle;
2116 for (unsigned i = 0; i < ArchFlags.size(); ++i) {
2117 if (ArchFlags[i] == "all") {
2118 ArchAll = true;
2119 } else {
2120 if (!MachOObjectFile::isValidArch(ArchFlags[i]))
2121 error("Unknown architecture named '" + ArchFlags[i] + "'",
2122 "for the --arch option");
2126 if (!SegSect.empty() && SegSect.size() != 2)
2127 error("bad number of arguments (must be two arguments)",
2128 "for the -s option");
2130 if (NoDyldInfo && (AddDyldInfo || DyldInfoOnly))
2131 error("--no-dyldinfo can't be used with --add-dyldinfo or --dyldinfo-only");
2133 llvm::for_each(InputFilenames, dumpSymbolNamesFromFile);
2135 if (HadError)
2136 return 1;