forked from OSchip/llvm-project
2092 lines
74 KiB
C++
2092 lines
74 KiB
C++
//===-- llvm-nm.cpp - Symbol table dumping utility for llvm ---------------===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
// This program is a utility that works like traditional Unix "nm", that is, it
|
|
// prints out the names of symbols in a bitcode or object file, along with some
|
|
// information about each symbol.
|
|
//
|
|
// This "nm" supports many of the features of GNU "nm", including its different
|
|
// output formats.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "llvm/ADT/StringSwitch.h"
|
|
#include "llvm/BinaryFormat/COFF.h"
|
|
#include "llvm/Demangle/Demangle.h"
|
|
#include "llvm/IR/Function.h"
|
|
#include "llvm/IR/LLVMContext.h"
|
|
#include "llvm/Object/Archive.h"
|
|
#include "llvm/Object/COFF.h"
|
|
#include "llvm/Object/COFFImportFile.h"
|
|
#include "llvm/Object/ELFObjectFile.h"
|
|
#include "llvm/Object/IRObjectFile.h"
|
|
#include "llvm/Object/MachO.h"
|
|
#include "llvm/Object/MachOUniversal.h"
|
|
#include "llvm/Object/ObjectFile.h"
|
|
#include "llvm/Object/Wasm.h"
|
|
#include "llvm/Support/CommandLine.h"
|
|
#include "llvm/Support/FileSystem.h"
|
|
#include "llvm/Support/Format.h"
|
|
#include "llvm/Support/InitLLVM.h"
|
|
#include "llvm/Support/MemoryBuffer.h"
|
|
#include "llvm/Support/Program.h"
|
|
#include "llvm/Support/Signals.h"
|
|
#include "llvm/Support/TargetSelect.h"
|
|
#include "llvm/Support/WithColor.h"
|
|
#include "llvm/Support/raw_ostream.h"
|
|
#include <vector>
|
|
|
|
using namespace llvm;
|
|
using namespace object;
|
|
|
|
namespace {
|
|
enum OutputFormatTy { bsd, sysv, posix, darwin };
|
|
cl::opt<OutputFormatTy> OutputFormat(
|
|
"format", cl::desc("Specify output format"),
|
|
cl::values(clEnumVal(bsd, "BSD format"), clEnumVal(sysv, "System V format"),
|
|
clEnumVal(posix, "POSIX.2 format"),
|
|
clEnumVal(darwin, "Darwin -m format")),
|
|
cl::init(bsd));
|
|
cl::alias OutputFormat2("f", cl::desc("Alias for --format"),
|
|
cl::aliasopt(OutputFormat));
|
|
|
|
cl::list<std::string> InputFilenames(cl::Positional, cl::desc("<input files>"),
|
|
cl::ZeroOrMore);
|
|
|
|
cl::opt<bool> UndefinedOnly("undefined-only",
|
|
cl::desc("Show only undefined symbols"));
|
|
cl::alias UndefinedOnly2("u", cl::desc("Alias for --undefined-only"),
|
|
cl::aliasopt(UndefinedOnly), cl::Grouping);
|
|
|
|
cl::opt<bool> DynamicSyms("dynamic",
|
|
cl::desc("Display the dynamic symbols instead "
|
|
"of normal symbols."));
|
|
cl::alias DynamicSyms2("D", cl::desc("Alias for --dynamic"),
|
|
cl::aliasopt(DynamicSyms), cl::Grouping);
|
|
|
|
cl::opt<bool> DefinedOnly("defined-only",
|
|
cl::desc("Show only defined symbols"));
|
|
cl::alias DefinedOnly2("U", cl::desc("Alias for --defined-only"),
|
|
cl::aliasopt(DefinedOnly), cl::Grouping);
|
|
|
|
cl::opt<bool> ExternalOnly("extern-only",
|
|
cl::desc("Show only external symbols"),
|
|
cl::ZeroOrMore);
|
|
cl::alias ExternalOnly2("g", cl::desc("Alias for --extern-only"),
|
|
cl::aliasopt(ExternalOnly), cl::Grouping,
|
|
cl::ZeroOrMore);
|
|
|
|
cl::opt<bool> NoWeakSymbols("no-weak",
|
|
cl::desc("Show only non-weak symbols"));
|
|
cl::alias NoWeakSymbols2("W", cl::desc("Alias for --no-weak"),
|
|
cl::aliasopt(NoWeakSymbols), cl::Grouping);
|
|
|
|
cl::opt<bool> BSDFormat("B", cl::desc("Alias for --format=bsd"),
|
|
cl::Grouping);
|
|
cl::opt<bool> POSIXFormat("P", cl::desc("Alias for --format=posix"),
|
|
cl::Grouping);
|
|
cl::alias Portability("portability", cl::desc("Alias for --format=posix"),
|
|
cl::aliasopt(POSIXFormat), cl::NotHidden);
|
|
cl::opt<bool> DarwinFormat("m", cl::desc("Alias for --format=darwin"),
|
|
cl::Grouping);
|
|
|
|
static cl::list<std::string>
|
|
ArchFlags("arch", cl::desc("architecture(s) from a Mach-O file to dump"),
|
|
cl::ZeroOrMore);
|
|
bool ArchAll = false;
|
|
|
|
cl::opt<bool> PrintFileName(
|
|
"print-file-name",
|
|
cl::desc("Precede each symbol with the object file it came from"));
|
|
|
|
cl::alias PrintFileNameA("A", cl::desc("Alias for --print-file-name"),
|
|
cl::aliasopt(PrintFileName), cl::Grouping);
|
|
cl::alias PrintFileNameo("o", cl::desc("Alias for --print-file-name"),
|
|
cl::aliasopt(PrintFileName), cl::Grouping);
|
|
|
|
cl::opt<bool> DebugSyms("debug-syms",
|
|
cl::desc("Show all symbols, even debugger only"));
|
|
cl::alias DebugSymsa("a", cl::desc("Alias for --debug-syms"),
|
|
cl::aliasopt(DebugSyms), cl::Grouping);
|
|
|
|
cl::opt<bool> NumericSort("numeric-sort", cl::desc("Sort symbols by address"));
|
|
cl::alias NumericSortn("n", cl::desc("Alias for --numeric-sort"),
|
|
cl::aliasopt(NumericSort), cl::Grouping);
|
|
cl::alias NumericSortv("v", cl::desc("Alias for --numeric-sort"),
|
|
cl::aliasopt(NumericSort), cl::Grouping);
|
|
|
|
cl::opt<bool> NoSort("no-sort", cl::desc("Show symbols in order encountered"));
|
|
cl::alias NoSortp("p", cl::desc("Alias for --no-sort"), cl::aliasopt(NoSort),
|
|
cl::Grouping);
|
|
|
|
cl::opt<bool> Demangle("demangle", cl::desc("Demangle C++ symbol names"));
|
|
cl::alias DemangleC("C", cl::desc("Alias for --demangle"), cl::aliasopt(Demangle),
|
|
cl::Grouping);
|
|
|
|
cl::opt<bool> ReverseSort("reverse-sort", cl::desc("Sort in reverse order"));
|
|
cl::alias ReverseSortr("r", cl::desc("Alias for --reverse-sort"),
|
|
cl::aliasopt(ReverseSort), cl::Grouping);
|
|
|
|
cl::opt<bool> PrintSize("print-size",
|
|
cl::desc("Show symbol size instead of address"));
|
|
cl::alias PrintSizeS("S", cl::desc("Alias for --print-size"),
|
|
cl::aliasopt(PrintSize), cl::Grouping);
|
|
bool MachOPrintSizeWarning = false;
|
|
|
|
cl::opt<bool> SizeSort("size-sort", cl::desc("Sort symbols by size"));
|
|
|
|
cl::opt<bool> WithoutAliases("without-aliases", cl::Hidden,
|
|
cl::desc("Exclude aliases from output"));
|
|
|
|
cl::opt<bool> ArchiveMap("print-armap", cl::desc("Print the archive map"));
|
|
cl::alias ArchiveMaps("M", cl::desc("Alias for --print-armap"),
|
|
cl::aliasopt(ArchiveMap), cl::Grouping);
|
|
|
|
enum Radix { d, o, x };
|
|
cl::opt<Radix>
|
|
AddressRadix("radix", cl::desc("Radix (o/d/x) for printing symbol Values"),
|
|
cl::values(clEnumVal(d, "decimal"), clEnumVal(o, "octal"),
|
|
clEnumVal(x, "hexadecimal")),
|
|
cl::init(x));
|
|
cl::alias RadixAlias("t", cl::desc("Alias for --radix"),
|
|
cl::aliasopt(AddressRadix));
|
|
|
|
cl::opt<bool> JustSymbolName("just-symbol-name",
|
|
cl::desc("Print just the symbol's name"));
|
|
cl::alias JustSymbolNames("j", cl::desc("Alias for --just-symbol-name"),
|
|
cl::aliasopt(JustSymbolName), cl::Grouping);
|
|
|
|
// FIXME: This option takes exactly two strings and should be allowed anywhere
|
|
// on the command line. Such that "llvm-nm -s __TEXT __text foo.o" would work.
|
|
// But that does not as the CommandLine Library does not have a way to make
|
|
// this work. For now the "-s __TEXT __text" has to be last on the command
|
|
// line.
|
|
cl::list<std::string> SegSect("s", cl::Positional, cl::ZeroOrMore,
|
|
cl::desc("Dump only symbols from this segment "
|
|
"and section name, Mach-O only"));
|
|
|
|
cl::opt<bool> FormatMachOasHex("x", cl::desc("Print symbol entry in hex, "
|
|
"Mach-O only"), cl::Grouping);
|
|
cl::opt<bool> AddDyldInfo("add-dyldinfo",
|
|
cl::desc("Add symbols from the dyldinfo not already "
|
|
"in the symbol table, Mach-O only"));
|
|
cl::opt<bool> NoDyldInfo("no-dyldinfo",
|
|
cl::desc("Don't add any symbols from the dyldinfo, "
|
|
"Mach-O only"));
|
|
cl::opt<bool> DyldInfoOnly("dyldinfo-only",
|
|
cl::desc("Show only symbols from the dyldinfo, "
|
|
"Mach-O only"));
|
|
|
|
cl::opt<bool> NoLLVMBitcode("no-llvm-bc",
|
|
cl::desc("Disable LLVM bitcode reader"));
|
|
|
|
cl::extrahelp HelpResponse("\nPass @FILE as argument to read options from FILE.\n");
|
|
|
|
bool PrintAddress = true;
|
|
|
|
bool MultipleFiles = false;
|
|
|
|
bool HadError = false;
|
|
|
|
std::string ToolName;
|
|
} // anonymous namespace
|
|
|
|
static void error(Twine Message, Twine Path = Twine()) {
|
|
HadError = true;
|
|
WithColor::error(errs(), ToolName) << Path << ": " << Message << ".\n";
|
|
}
|
|
|
|
static bool error(std::error_code EC, Twine Path = Twine()) {
|
|
if (EC) {
|
|
error(EC.message(), Path);
|
|
return true;
|
|
}
|
|
return false;
|
|
}
|
|
|
|
// This version of error() prints the archive name and member name, for example:
|
|
// "libx.a(foo.o)" after the ToolName before the error message. It sets
|
|
// HadError but returns allowing the code to move on to other archive members.
|
|
static void error(llvm::Error E, StringRef FileName, const Archive::Child &C,
|
|
StringRef ArchitectureName = StringRef()) {
|
|
HadError = true;
|
|
WithColor::error(errs(), ToolName) << FileName;
|
|
|
|
Expected<StringRef> NameOrErr = C.getName();
|
|
// TODO: if we have a error getting the name then it would be nice to print
|
|
// the index of which archive member this is and or its offset in the
|
|
// archive instead of "???" as the name.
|
|
if (!NameOrErr) {
|
|
consumeError(NameOrErr.takeError());
|
|
errs() << "(" << "???" << ")";
|
|
} else
|
|
errs() << "(" << NameOrErr.get() << ")";
|
|
|
|
if (!ArchitectureName.empty())
|
|
errs() << " (for architecture " << ArchitectureName << ") ";
|
|
|
|
std::string Buf;
|
|
raw_string_ostream OS(Buf);
|
|
logAllUnhandledErrors(std::move(E), OS);
|
|
OS.flush();
|
|
errs() << " " << Buf << "\n";
|
|
}
|
|
|
|
// This version of error() prints the file name and which architecture slice it
|
|
// is from, for example: "foo.o (for architecture i386)" after the ToolName
|
|
// before the error message. It sets HadError but returns allowing the code to
|
|
// move on to other architecture slices.
|
|
static void error(llvm::Error E, StringRef FileName,
|
|
StringRef ArchitectureName = StringRef()) {
|
|
HadError = true;
|
|
WithColor::error(errs(), ToolName) << FileName;
|
|
|
|
if (!ArchitectureName.empty())
|
|
errs() << " (for architecture " << ArchitectureName << ") ";
|
|
|
|
std::string Buf;
|
|
raw_string_ostream OS(Buf);
|
|
logAllUnhandledErrors(std::move(E), OS);
|
|
OS.flush();
|
|
errs() << " " << Buf << "\n";
|
|
}
|
|
|
|
namespace {
|
|
struct NMSymbol {
|
|
uint64_t Address;
|
|
uint64_t Size;
|
|
char TypeChar;
|
|
StringRef Name;
|
|
BasicSymbolRef Sym;
|
|
// The Sym field above points to the native symbol in the object file,
|
|
// for Mach-O when we are creating symbols from the dyld info the above
|
|
// pointer is null as there is no native symbol. In these cases the fields
|
|
// below are filled in to represent what would have been a Mach-O nlist
|
|
// native symbol.
|
|
uint32_t SymFlags;
|
|
SectionRef Section;
|
|
uint8_t NType;
|
|
uint8_t NSect;
|
|
uint16_t NDesc;
|
|
StringRef IndirectName;
|
|
};
|
|
} // anonymous namespace
|
|
|
|
static bool compareSymbolAddress(const NMSymbol &A, const NMSymbol &B) {
|
|
bool ADefined;
|
|
if (A.Sym.getRawDataRefImpl().p)
|
|
ADefined = !(A.Sym.getFlags() & SymbolRef::SF_Undefined);
|
|
else
|
|
ADefined = A.TypeChar != 'U';
|
|
bool BDefined;
|
|
if (B.Sym.getRawDataRefImpl().p)
|
|
BDefined = !(B.Sym.getFlags() & SymbolRef::SF_Undefined);
|
|
else
|
|
BDefined = B.TypeChar != 'U';
|
|
return std::make_tuple(ADefined, A.Address, A.Name, A.Size) <
|
|
std::make_tuple(BDefined, B.Address, B.Name, B.Size);
|
|
}
|
|
|
|
static bool compareSymbolSize(const NMSymbol &A, const NMSymbol &B) {
|
|
return std::make_tuple(A.Size, A.Name, A.Address) <
|
|
std::make_tuple(B.Size, B.Name, B.Address);
|
|
}
|
|
|
|
static bool compareSymbolName(const NMSymbol &A, const NMSymbol &B) {
|
|
return std::make_tuple(A.Name, A.Size, A.Address) <
|
|
std::make_tuple(B.Name, B.Size, B.Address);
|
|
}
|
|
|
|
static char isSymbolList64Bit(SymbolicFile &Obj) {
|
|
if (auto *IRObj = dyn_cast<IRObjectFile>(&Obj))
|
|
return Triple(IRObj->getTargetTriple()).isArch64Bit();
|
|
if (isa<COFFObjectFile>(Obj) || isa<COFFImportFile>(Obj))
|
|
return false;
|
|
if (isa<WasmObjectFile>(Obj))
|
|
return false;
|
|
if (MachOObjectFile *MachO = dyn_cast<MachOObjectFile>(&Obj))
|
|
return MachO->is64Bit();
|
|
return cast<ELFObjectFileBase>(Obj).getBytesInAddress() == 8;
|
|
}
|
|
|
|
static StringRef CurrentFilename;
|
|
typedef std::vector<NMSymbol> SymbolListT;
|
|
static SymbolListT SymbolList;
|
|
|
|
static char getSymbolNMTypeChar(IRObjectFile &Obj, basic_symbol_iterator I);
|
|
|
|
// darwinPrintSymbol() is used to print a symbol from a Mach-O file when the
|
|
// the OutputFormat is darwin or we are printing Mach-O symbols in hex. For
|
|
// the darwin format it produces the same output as darwin's nm(1) -m output
|
|
// and when printing Mach-O symbols in hex it produces the same output as
|
|
// darwin's nm(1) -x format.
|
|
static void darwinPrintSymbol(SymbolicFile &Obj, SymbolListT::iterator I,
|
|
char *SymbolAddrStr, const char *printBlanks,
|
|
const char *printDashes, const char *printFormat) {
|
|
MachO::mach_header H;
|
|
MachO::mach_header_64 H_64;
|
|
uint32_t Filetype = MachO::MH_OBJECT;
|
|
uint32_t Flags = 0;
|
|
uint8_t NType = 0;
|
|
uint8_t NSect = 0;
|
|
uint16_t NDesc = 0;
|
|
uint32_t NStrx = 0;
|
|
uint64_t NValue = 0;
|
|
MachOObjectFile *MachO = dyn_cast<MachOObjectFile>(&Obj);
|
|
if (Obj.isIR()) {
|
|
uint32_t SymFlags = I->Sym.getFlags();
|
|
if (SymFlags & SymbolRef::SF_Global)
|
|
NType |= MachO::N_EXT;
|
|
if (SymFlags & SymbolRef::SF_Hidden)
|
|
NType |= MachO::N_PEXT;
|
|
if (SymFlags & SymbolRef::SF_Undefined)
|
|
NType |= MachO::N_EXT | MachO::N_UNDF;
|
|
else {
|
|
// Here we have a symbol definition. So to fake out a section name we
|
|
// use 1, 2 and 3 for section numbers. See below where they are used to
|
|
// print out fake section names.
|
|
NType |= MachO::N_SECT;
|
|
if (SymFlags & SymbolRef::SF_Const)
|
|
NSect = 3;
|
|
else if (SymFlags & SymbolRef::SF_Executable)
|
|
NSect = 1;
|
|
else
|
|
NSect = 2;
|
|
}
|
|
if (SymFlags & SymbolRef::SF_Weak)
|
|
NDesc |= MachO::N_WEAK_DEF;
|
|
} else {
|
|
DataRefImpl SymDRI = I->Sym.getRawDataRefImpl();
|
|
if (MachO->is64Bit()) {
|
|
H_64 = MachO->MachOObjectFile::getHeader64();
|
|
Filetype = H_64.filetype;
|
|
Flags = H_64.flags;
|
|
if (SymDRI.p){
|
|
MachO::nlist_64 STE_64 = MachO->getSymbol64TableEntry(SymDRI);
|
|
NType = STE_64.n_type;
|
|
NSect = STE_64.n_sect;
|
|
NDesc = STE_64.n_desc;
|
|
NStrx = STE_64.n_strx;
|
|
NValue = STE_64.n_value;
|
|
} else {
|
|
NType = I->NType;
|
|
NSect = I->NSect;
|
|
NDesc = I->NDesc;
|
|
NStrx = 0;
|
|
NValue = I->Address;
|
|
}
|
|
} else {
|
|
H = MachO->MachOObjectFile::getHeader();
|
|
Filetype = H.filetype;
|
|
Flags = H.flags;
|
|
if (SymDRI.p){
|
|
MachO::nlist STE = MachO->getSymbolTableEntry(SymDRI);
|
|
NType = STE.n_type;
|
|
NSect = STE.n_sect;
|
|
NDesc = STE.n_desc;
|
|
NStrx = STE.n_strx;
|
|
NValue = STE.n_value;
|
|
} else {
|
|
NType = I->NType;
|
|
NSect = I->NSect;
|
|
NDesc = I->NDesc;
|
|
NStrx = 0;
|
|
NValue = I->Address;
|
|
}
|
|
}
|
|
}
|
|
|
|
// If we are printing Mach-O symbols in hex do that and return.
|
|
if (FormatMachOasHex) {
|
|
char Str[18] = "";
|
|
format(printFormat, NValue).print(Str, sizeof(Str));
|
|
outs() << Str << ' ';
|
|
format("%02x", NType).print(Str, sizeof(Str));
|
|
outs() << Str << ' ';
|
|
format("%02x", NSect).print(Str, sizeof(Str));
|
|
outs() << Str << ' ';
|
|
format("%04x", NDesc).print(Str, sizeof(Str));
|
|
outs() << Str << ' ';
|
|
format("%08x", NStrx).print(Str, sizeof(Str));
|
|
outs() << Str << ' ';
|
|
outs() << I->Name;
|
|
if ((NType & MachO::N_TYPE) == MachO::N_INDR) {
|
|
outs() << " (indirect for ";
|
|
format(printFormat, NValue).print(Str, sizeof(Str));
|
|
outs() << Str << ' ';
|
|
StringRef IndirectName;
|
|
if (I->Sym.getRawDataRefImpl().p) {
|
|
if (MachO->getIndirectName(I->Sym.getRawDataRefImpl(), IndirectName))
|
|
outs() << "?)";
|
|
else
|
|
outs() << IndirectName << ")";
|
|
}
|
|
else
|
|
outs() << I->IndirectName << ")";
|
|
}
|
|
outs() << "\n";
|
|
return;
|
|
}
|
|
|
|
if (PrintAddress) {
|
|
if ((NType & MachO::N_TYPE) == MachO::N_INDR)
|
|
strcpy(SymbolAddrStr, printBlanks);
|
|
if (Obj.isIR() && (NType & MachO::N_TYPE) == MachO::N_TYPE)
|
|
strcpy(SymbolAddrStr, printDashes);
|
|
outs() << SymbolAddrStr << ' ';
|
|
}
|
|
|
|
switch (NType & MachO::N_TYPE) {
|
|
case MachO::N_UNDF:
|
|
if (NValue != 0) {
|
|
outs() << "(common) ";
|
|
if (MachO::GET_COMM_ALIGN(NDesc) != 0)
|
|
outs() << "(alignment 2^" << (int)MachO::GET_COMM_ALIGN(NDesc) << ") ";
|
|
} else {
|
|
if ((NType & MachO::N_TYPE) == MachO::N_PBUD)
|
|
outs() << "(prebound ";
|
|
else
|
|
outs() << "(";
|
|
if ((NDesc & MachO::REFERENCE_TYPE) ==
|
|
MachO::REFERENCE_FLAG_UNDEFINED_LAZY)
|
|
outs() << "undefined [lazy bound]) ";
|
|
else if ((NDesc & MachO::REFERENCE_TYPE) ==
|
|
MachO::REFERENCE_FLAG_PRIVATE_UNDEFINED_LAZY)
|
|
outs() << "undefined [private lazy bound]) ";
|
|
else if ((NDesc & MachO::REFERENCE_TYPE) ==
|
|
MachO::REFERENCE_FLAG_PRIVATE_UNDEFINED_NON_LAZY)
|
|
outs() << "undefined [private]) ";
|
|
else
|
|
outs() << "undefined) ";
|
|
}
|
|
break;
|
|
case MachO::N_ABS:
|
|
outs() << "(absolute) ";
|
|
break;
|
|
case MachO::N_INDR:
|
|
outs() << "(indirect) ";
|
|
break;
|
|
case MachO::N_SECT: {
|
|
if (Obj.isIR()) {
|
|
// For llvm bitcode files print out a fake section name using the values
|
|
// use 1, 2 and 3 for section numbers as set above.
|
|
if (NSect == 1)
|
|
outs() << "(LTO,CODE) ";
|
|
else if (NSect == 2)
|
|
outs() << "(LTO,DATA) ";
|
|
else if (NSect == 3)
|
|
outs() << "(LTO,RODATA) ";
|
|
else
|
|
outs() << "(?,?) ";
|
|
break;
|
|
}
|
|
section_iterator Sec = SectionRef();
|
|
if (I->Sym.getRawDataRefImpl().p) {
|
|
Expected<section_iterator> SecOrErr =
|
|
MachO->getSymbolSection(I->Sym.getRawDataRefImpl());
|
|
if (!SecOrErr) {
|
|
consumeError(SecOrErr.takeError());
|
|
outs() << "(?,?) ";
|
|
break;
|
|
}
|
|
Sec = *SecOrErr;
|
|
if (Sec == MachO->section_end()) {
|
|
outs() << "(?,?) ";
|
|
break;
|
|
}
|
|
} else {
|
|
Sec = I->Section;
|
|
}
|
|
DataRefImpl Ref = Sec->getRawDataRefImpl();
|
|
StringRef SectionName;
|
|
MachO->getSectionName(Ref, SectionName);
|
|
StringRef SegmentName = MachO->getSectionFinalSegmentName(Ref);
|
|
outs() << "(" << SegmentName << "," << SectionName << ") ";
|
|
break;
|
|
}
|
|
default:
|
|
outs() << "(?) ";
|
|
break;
|
|
}
|
|
|
|
if (NType & MachO::N_EXT) {
|
|
if (NDesc & MachO::REFERENCED_DYNAMICALLY)
|
|
outs() << "[referenced dynamically] ";
|
|
if (NType & MachO::N_PEXT) {
|
|
if ((NDesc & MachO::N_WEAK_DEF) == MachO::N_WEAK_DEF)
|
|
outs() << "weak private external ";
|
|
else
|
|
outs() << "private external ";
|
|
} else {
|
|
if ((NDesc & MachO::N_WEAK_REF) == MachO::N_WEAK_REF ||
|
|
(NDesc & MachO::N_WEAK_DEF) == MachO::N_WEAK_DEF) {
|
|
if ((NDesc & (MachO::N_WEAK_REF | MachO::N_WEAK_DEF)) ==
|
|
(MachO::N_WEAK_REF | MachO::N_WEAK_DEF))
|
|
outs() << "weak external automatically hidden ";
|
|
else
|
|
outs() << "weak external ";
|
|
} else
|
|
outs() << "external ";
|
|
}
|
|
} else {
|
|
if (NType & MachO::N_PEXT)
|
|
outs() << "non-external (was a private external) ";
|
|
else
|
|
outs() << "non-external ";
|
|
}
|
|
|
|
if (Filetype == MachO::MH_OBJECT &&
|
|
(NDesc & MachO::N_NO_DEAD_STRIP) == MachO::N_NO_DEAD_STRIP)
|
|
outs() << "[no dead strip] ";
|
|
|
|
if (Filetype == MachO::MH_OBJECT &&
|
|
((NType & MachO::N_TYPE) != MachO::N_UNDF) &&
|
|
(NDesc & MachO::N_SYMBOL_RESOLVER) == MachO::N_SYMBOL_RESOLVER)
|
|
outs() << "[symbol resolver] ";
|
|
|
|
if (Filetype == MachO::MH_OBJECT &&
|
|
((NType & MachO::N_TYPE) != MachO::N_UNDF) &&
|
|
(NDesc & MachO::N_ALT_ENTRY) == MachO::N_ALT_ENTRY)
|
|
outs() << "[alt entry] ";
|
|
|
|
if (Filetype == MachO::MH_OBJECT &&
|
|
((NType & MachO::N_TYPE) != MachO::N_UNDF) &&
|
|
(NDesc & MachO::N_COLD_FUNC) == MachO::N_COLD_FUNC)
|
|
outs() << "[cold func] ";
|
|
|
|
if ((NDesc & MachO::N_ARM_THUMB_DEF) == MachO::N_ARM_THUMB_DEF)
|
|
outs() << "[Thumb] ";
|
|
|
|
if ((NType & MachO::N_TYPE) == MachO::N_INDR) {
|
|
outs() << I->Name << " (for ";
|
|
StringRef IndirectName;
|
|
if (MachO) {
|
|
if (I->Sym.getRawDataRefImpl().p) {
|
|
if (MachO->getIndirectName(I->Sym.getRawDataRefImpl(), IndirectName))
|
|
outs() << "?)";
|
|
else
|
|
outs() << IndirectName << ")";
|
|
}
|
|
else
|
|
outs() << I->IndirectName << ")";
|
|
} else
|
|
outs() << "?)";
|
|
} else
|
|
outs() << I->Name;
|
|
|
|
if ((Flags & MachO::MH_TWOLEVEL) == MachO::MH_TWOLEVEL &&
|
|
(((NType & MachO::N_TYPE) == MachO::N_UNDF && NValue == 0) ||
|
|
(NType & MachO::N_TYPE) == MachO::N_PBUD)) {
|
|
uint32_t LibraryOrdinal = MachO::GET_LIBRARY_ORDINAL(NDesc);
|
|
if (LibraryOrdinal != 0) {
|
|
if (LibraryOrdinal == MachO::EXECUTABLE_ORDINAL)
|
|
outs() << " (from executable)";
|
|
else if (LibraryOrdinal == MachO::DYNAMIC_LOOKUP_ORDINAL)
|
|
outs() << " (dynamically looked up)";
|
|
else {
|
|
StringRef LibraryName;
|
|
if (!MachO ||
|
|
MachO->getLibraryShortNameByIndex(LibraryOrdinal - 1, LibraryName))
|
|
outs() << " (from bad library ordinal " << LibraryOrdinal << ")";
|
|
else
|
|
outs() << " (from " << LibraryName << ")";
|
|
}
|
|
}
|
|
}
|
|
|
|
outs() << "\n";
|
|
}
|
|
|
|
// Table that maps Darwin's Mach-O stab constants to strings to allow printing.
|
|
struct DarwinStabName {
|
|
uint8_t NType;
|
|
const char *Name;
|
|
};
|
|
static const struct DarwinStabName DarwinStabNames[] = {
|
|
{MachO::N_GSYM, "GSYM"},
|
|
{MachO::N_FNAME, "FNAME"},
|
|
{MachO::N_FUN, "FUN"},
|
|
{MachO::N_STSYM, "STSYM"},
|
|
{MachO::N_LCSYM, "LCSYM"},
|
|
{MachO::N_BNSYM, "BNSYM"},
|
|
{MachO::N_PC, "PC"},
|
|
{MachO::N_AST, "AST"},
|
|
{MachO::N_OPT, "OPT"},
|
|
{MachO::N_RSYM, "RSYM"},
|
|
{MachO::N_SLINE, "SLINE"},
|
|
{MachO::N_ENSYM, "ENSYM"},
|
|
{MachO::N_SSYM, "SSYM"},
|
|
{MachO::N_SO, "SO"},
|
|
{MachO::N_OSO, "OSO"},
|
|
{MachO::N_LSYM, "LSYM"},
|
|
{MachO::N_BINCL, "BINCL"},
|
|
{MachO::N_SOL, "SOL"},
|
|
{MachO::N_PARAMS, "PARAM"},
|
|
{MachO::N_VERSION, "VERS"},
|
|
{MachO::N_OLEVEL, "OLEV"},
|
|
{MachO::N_PSYM, "PSYM"},
|
|
{MachO::N_EINCL, "EINCL"},
|
|
{MachO::N_ENTRY, "ENTRY"},
|
|
{MachO::N_LBRAC, "LBRAC"},
|
|
{MachO::N_EXCL, "EXCL"},
|
|
{MachO::N_RBRAC, "RBRAC"},
|
|
{MachO::N_BCOMM, "BCOMM"},
|
|
{MachO::N_ECOMM, "ECOMM"},
|
|
{MachO::N_ECOML, "ECOML"},
|
|
{MachO::N_LENG, "LENG"},
|
|
{0, nullptr}};
|
|
|
|
static const char *getDarwinStabString(uint8_t NType) {
|
|
for (unsigned i = 0; DarwinStabNames[i].Name; i++) {
|
|
if (DarwinStabNames[i].NType == NType)
|
|
return DarwinStabNames[i].Name;
|
|
}
|
|
return nullptr;
|
|
}
|
|
|
|
// darwinPrintStab() prints the n_sect, n_desc along with a symbolic name of
|
|
// a stab n_type value in a Mach-O file.
|
|
static void darwinPrintStab(MachOObjectFile *MachO, SymbolListT::iterator I) {
|
|
MachO::nlist_64 STE_64;
|
|
MachO::nlist STE;
|
|
uint8_t NType;
|
|
uint8_t NSect;
|
|
uint16_t NDesc;
|
|
DataRefImpl SymDRI = I->Sym.getRawDataRefImpl();
|
|
if (MachO->is64Bit()) {
|
|
STE_64 = MachO->getSymbol64TableEntry(SymDRI);
|
|
NType = STE_64.n_type;
|
|
NSect = STE_64.n_sect;
|
|
NDesc = STE_64.n_desc;
|
|
} else {
|
|
STE = MachO->getSymbolTableEntry(SymDRI);
|
|
NType = STE.n_type;
|
|
NSect = STE.n_sect;
|
|
NDesc = STE.n_desc;
|
|
}
|
|
|
|
char Str[18] = "";
|
|
format("%02x", NSect).print(Str, sizeof(Str));
|
|
outs() << ' ' << Str << ' ';
|
|
format("%04x", NDesc).print(Str, sizeof(Str));
|
|
outs() << Str << ' ';
|
|
if (const char *stabString = getDarwinStabString(NType))
|
|
format("%5.5s", stabString).print(Str, sizeof(Str));
|
|
else
|
|
format(" %02x", NType).print(Str, sizeof(Str));
|
|
outs() << Str;
|
|
}
|
|
|
|
static Optional<std::string> demangle(StringRef Name, bool StripUnderscore) {
|
|
if (StripUnderscore && !Name.empty() && Name[0] == '_')
|
|
Name = Name.substr(1);
|
|
|
|
if (!Name.startswith("_Z"))
|
|
return None;
|
|
|
|
int Status;
|
|
char *Undecorated =
|
|
itaniumDemangle(Name.str().c_str(), nullptr, nullptr, &Status);
|
|
if (Status != 0)
|
|
return None;
|
|
|
|
std::string S(Undecorated);
|
|
free(Undecorated);
|
|
return S;
|
|
}
|
|
|
|
static bool symbolIsDefined(const NMSymbol &Sym) {
|
|
return Sym.TypeChar != 'U' && Sym.TypeChar != 'w' && Sym.TypeChar != 'v';
|
|
}
|
|
|
|
static void sortAndPrintSymbolList(SymbolicFile &Obj, bool printName,
|
|
const std::string &ArchiveName,
|
|
const std::string &ArchitectureName) {
|
|
if (!NoSort) {
|
|
std::function<bool(const NMSymbol &, const NMSymbol &)> Cmp;
|
|
if (NumericSort)
|
|
Cmp = compareSymbolAddress;
|
|
else if (SizeSort)
|
|
Cmp = compareSymbolSize;
|
|
else
|
|
Cmp = compareSymbolName;
|
|
|
|
if (ReverseSort)
|
|
Cmp = [=](const NMSymbol &A, const NMSymbol &B) { return Cmp(B, A); };
|
|
llvm::sort(SymbolList, Cmp);
|
|
}
|
|
|
|
if (!PrintFileName) {
|
|
if (OutputFormat == posix && MultipleFiles && printName) {
|
|
outs() << '\n' << CurrentFilename << ":\n";
|
|
} else if (OutputFormat == bsd && MultipleFiles && printName) {
|
|
outs() << "\n" << CurrentFilename << ":\n";
|
|
} else if (OutputFormat == sysv) {
|
|
outs() << "\n\nSymbols from " << CurrentFilename << ":\n\n";
|
|
if (isSymbolList64Bit(Obj))
|
|
outs() << "Name Value Class Type"
|
|
<< " Size Line Section\n";
|
|
else
|
|
outs() << "Name Value Class Type"
|
|
<< " Size Line Section\n";
|
|
}
|
|
}
|
|
|
|
const char *printBlanks, *printDashes, *printFormat;
|
|
if (isSymbolList64Bit(Obj)) {
|
|
printBlanks = " ";
|
|
printDashes = "----------------";
|
|
switch (AddressRadix) {
|
|
case Radix::o:
|
|
printFormat = OutputFormat == posix ? "%" PRIo64 : "%016" PRIo64;
|
|
break;
|
|
case Radix::x:
|
|
printFormat = OutputFormat == posix ? "%" PRIx64 : "%016" PRIx64;
|
|
break;
|
|
default:
|
|
printFormat = OutputFormat == posix ? "%" PRId64 : "%016" PRId64;
|
|
}
|
|
} else {
|
|
printBlanks = " ";
|
|
printDashes = "--------";
|
|
switch (AddressRadix) {
|
|
case Radix::o:
|
|
printFormat = OutputFormat == posix ? "%" PRIo64 : "%08" PRIo64;
|
|
break;
|
|
case Radix::x:
|
|
printFormat = OutputFormat == posix ? "%" PRIx64 : "%08" PRIx64;
|
|
break;
|
|
default:
|
|
printFormat = OutputFormat == posix ? "%" PRId64 : "%08" PRId64;
|
|
}
|
|
}
|
|
|
|
auto writeFileName = [&](raw_ostream &S) {
|
|
if (!ArchitectureName.empty())
|
|
S << "(for architecture " << ArchitectureName << "):";
|
|
if (OutputFormat == posix && !ArchiveName.empty())
|
|
S << ArchiveName << "[" << CurrentFilename << "]: ";
|
|
else {
|
|
if (!ArchiveName.empty())
|
|
S << ArchiveName << ":";
|
|
S << CurrentFilename << ": ";
|
|
}
|
|
};
|
|
|
|
if (SymbolList.empty()) {
|
|
if (PrintFileName)
|
|
writeFileName(errs());
|
|
errs() << "no symbols\n";
|
|
}
|
|
|
|
for (SymbolListT::iterator I = SymbolList.begin(), E = SymbolList.end();
|
|
I != E; ++I) {
|
|
uint32_t SymFlags;
|
|
std::string Name = I->Name.str();
|
|
MachOObjectFile *MachO = dyn_cast<MachOObjectFile>(&Obj);
|
|
if (Demangle) {
|
|
if (Optional<std::string> Opt = demangle(I->Name, MachO))
|
|
Name = *Opt;
|
|
}
|
|
if (I->Sym.getRawDataRefImpl().p)
|
|
SymFlags = I->Sym.getFlags();
|
|
else
|
|
SymFlags = I->SymFlags;
|
|
|
|
bool Undefined = SymFlags & SymbolRef::SF_Undefined;
|
|
bool Global = SymFlags & SymbolRef::SF_Global;
|
|
bool Weak = SymFlags & SymbolRef::SF_Weak;
|
|
if ((!Undefined && UndefinedOnly) || (Undefined && DefinedOnly) ||
|
|
(!Global && ExternalOnly) || (Weak && NoWeakSymbols))
|
|
continue;
|
|
if (PrintFileName)
|
|
writeFileName(outs());
|
|
if ((JustSymbolName ||
|
|
(UndefinedOnly && MachO && OutputFormat != darwin)) &&
|
|
OutputFormat != posix) {
|
|
outs() << Name << "\n";
|
|
continue;
|
|
}
|
|
|
|
char SymbolAddrStr[18] = "";
|
|
char SymbolSizeStr[18] = "";
|
|
|
|
// If the format is SysV or the symbol isn't defined, then print spaces.
|
|
if (OutputFormat == sysv || !symbolIsDefined(*I)) {
|
|
if (OutputFormat == posix) {
|
|
format(printFormat, I->Address)
|
|
.print(SymbolAddrStr, sizeof(SymbolAddrStr));
|
|
format(printFormat, I->Size)
|
|
.print(SymbolSizeStr, sizeof(SymbolSizeStr));
|
|
} else {
|
|
strcpy(SymbolAddrStr, printBlanks);
|
|
strcpy(SymbolSizeStr, printBlanks);
|
|
}
|
|
}
|
|
|
|
// Otherwise, print the symbol address and size.
|
|
if (symbolIsDefined(*I)) {
|
|
if (Obj.isIR())
|
|
strcpy(SymbolAddrStr, printDashes);
|
|
else if(MachO && I->TypeChar == 'I')
|
|
strcpy(SymbolAddrStr, printBlanks);
|
|
else
|
|
format(printFormat, I->Address)
|
|
.print(SymbolAddrStr, sizeof(SymbolAddrStr));
|
|
format(printFormat, I->Size).print(SymbolSizeStr, sizeof(SymbolSizeStr));
|
|
}
|
|
|
|
// If OutputFormat is darwin or we are printing Mach-O symbols in hex and
|
|
// we have a MachOObjectFile, call darwinPrintSymbol to print as darwin's
|
|
// nm(1) -m output or hex, else if OutputFormat is darwin or we are
|
|
// printing Mach-O symbols in hex and not a Mach-O object fall back to
|
|
// OutputFormat bsd (see below).
|
|
if ((OutputFormat == darwin || FormatMachOasHex) && (MachO || Obj.isIR())) {
|
|
darwinPrintSymbol(Obj, I, SymbolAddrStr, printBlanks, printDashes,
|
|
printFormat);
|
|
} else if (OutputFormat == posix) {
|
|
outs() << Name << " " << I->TypeChar << " ";
|
|
if (MachO)
|
|
outs() << SymbolAddrStr << " " << "0" /* SymbolSizeStr */ << "\n";
|
|
else
|
|
outs() << SymbolAddrStr << " " << SymbolSizeStr << "\n";
|
|
} else if (OutputFormat == bsd || (OutputFormat == darwin && !MachO)) {
|
|
if (PrintAddress)
|
|
outs() << SymbolAddrStr << ' ';
|
|
if (PrintSize) {
|
|
outs() << SymbolSizeStr;
|
|
outs() << ' ';
|
|
}
|
|
outs() << I->TypeChar;
|
|
if (I->TypeChar == '-' && MachO)
|
|
darwinPrintStab(MachO, I);
|
|
outs() << " " << Name;
|
|
if (I->TypeChar == 'I' && MachO) {
|
|
outs() << " (indirect for ";
|
|
if (I->Sym.getRawDataRefImpl().p) {
|
|
StringRef IndirectName;
|
|
if (MachO->getIndirectName(I->Sym.getRawDataRefImpl(), IndirectName))
|
|
outs() << "?)";
|
|
else
|
|
outs() << IndirectName << ")";
|
|
} else
|
|
outs() << I->IndirectName << ")";
|
|
}
|
|
outs() << "\n";
|
|
} else if (OutputFormat == sysv) {
|
|
std::string PaddedName(Name);
|
|
while (PaddedName.length() < 20)
|
|
PaddedName += " ";
|
|
outs() << PaddedName << "|" << SymbolAddrStr << "| " << I->TypeChar
|
|
<< " | |" << SymbolSizeStr << "| |\n";
|
|
}
|
|
}
|
|
|
|
SymbolList.clear();
|
|
}
|
|
|
|
static char getSymbolNMTypeChar(ELFObjectFileBase &Obj,
|
|
basic_symbol_iterator I) {
|
|
// OK, this is ELF
|
|
elf_symbol_iterator SymI(I);
|
|
|
|
Expected<elf_section_iterator> SecIOrErr = SymI->getSection();
|
|
if (!SecIOrErr) {
|
|
consumeError(SecIOrErr.takeError());
|
|
return '?';
|
|
}
|
|
|
|
elf_section_iterator SecI = *SecIOrErr;
|
|
if (SecI != Obj.section_end()) {
|
|
switch (SecI->getType()) {
|
|
case ELF::SHT_PROGBITS:
|
|
case ELF::SHT_DYNAMIC:
|
|
switch (SecI->getFlags()) {
|
|
case (ELF::SHF_ALLOC | ELF::SHF_EXECINSTR):
|
|
return 't';
|
|
case (ELF::SHF_TLS | ELF::SHF_ALLOC | ELF::SHF_WRITE):
|
|
case (ELF::SHF_ALLOC | ELF::SHF_WRITE):
|
|
return 'd';
|
|
case ELF::SHF_ALLOC:
|
|
case (ELF::SHF_ALLOC | ELF::SHF_MERGE):
|
|
case (ELF::SHF_ALLOC | ELF::SHF_MERGE | ELF::SHF_STRINGS):
|
|
return 'r';
|
|
}
|
|
break;
|
|
case ELF::SHT_NOBITS:
|
|
return 'b';
|
|
case ELF::SHT_INIT_ARRAY:
|
|
case ELF::SHT_FINI_ARRAY:
|
|
return 't';
|
|
}
|
|
}
|
|
|
|
if (SymI->getELFType() == ELF::STT_SECTION) {
|
|
Expected<StringRef> Name = SymI->getName();
|
|
if (!Name) {
|
|
consumeError(Name.takeError());
|
|
return '?';
|
|
}
|
|
return StringSwitch<char>(*Name)
|
|
.StartsWith(".debug", 'N')
|
|
.StartsWith(".note", 'n')
|
|
.StartsWith(".comment", 'n')
|
|
.Default('?');
|
|
}
|
|
|
|
return 'n';
|
|
}
|
|
|
|
static char getSymbolNMTypeChar(COFFObjectFile &Obj, symbol_iterator I) {
|
|
COFFSymbolRef Symb = Obj.getCOFFSymbol(*I);
|
|
// OK, this is COFF.
|
|
symbol_iterator SymI(I);
|
|
|
|
Expected<StringRef> Name = SymI->getName();
|
|
if (!Name) {
|
|
consumeError(Name.takeError());
|
|
return '?';
|
|
}
|
|
|
|
char Ret = StringSwitch<char>(*Name)
|
|
.StartsWith(".debug", 'N')
|
|
.StartsWith(".sxdata", 'N')
|
|
.Default('?');
|
|
|
|
if (Ret != '?')
|
|
return Ret;
|
|
|
|
uint32_t Characteristics = 0;
|
|
if (!COFF::isReservedSectionNumber(Symb.getSectionNumber())) {
|
|
Expected<section_iterator> SecIOrErr = SymI->getSection();
|
|
if (!SecIOrErr) {
|
|
consumeError(SecIOrErr.takeError());
|
|
return '?';
|
|
}
|
|
section_iterator SecI = *SecIOrErr;
|
|
const coff_section *Section = Obj.getCOFFSection(*SecI);
|
|
Characteristics = Section->Characteristics;
|
|
StringRef SectionName;
|
|
Obj.getSectionName(Section, SectionName);
|
|
if (SectionName.startswith(".idata"))
|
|
return 'i';
|
|
}
|
|
|
|
switch (Symb.getSectionNumber()) {
|
|
case COFF::IMAGE_SYM_DEBUG:
|
|
return 'n';
|
|
default:
|
|
// Check section type.
|
|
if (Characteristics & COFF::IMAGE_SCN_CNT_CODE)
|
|
return 't';
|
|
if (Characteristics & COFF::IMAGE_SCN_CNT_INITIALIZED_DATA)
|
|
return Characteristics & COFF::IMAGE_SCN_MEM_WRITE ? 'd' : 'r';
|
|
if (Characteristics & COFF::IMAGE_SCN_CNT_UNINITIALIZED_DATA)
|
|
return 'b';
|
|
if (Characteristics & COFF::IMAGE_SCN_LNK_INFO)
|
|
return 'i';
|
|
// Check for section symbol.
|
|
if (Symb.isSectionDefinition())
|
|
return 's';
|
|
}
|
|
|
|
return '?';
|
|
}
|
|
|
|
static char getSymbolNMTypeChar(COFFImportFile &Obj) {
|
|
switch (Obj.getCOFFImportHeader()->getType()) {
|
|
case COFF::IMPORT_CODE:
|
|
return 't';
|
|
case COFF::IMPORT_DATA:
|
|
return 'd';
|
|
case COFF::IMPORT_CONST:
|
|
return 'r';
|
|
}
|
|
return '?';
|
|
}
|
|
|
|
static char getSymbolNMTypeChar(MachOObjectFile &Obj, basic_symbol_iterator I) {
|
|
DataRefImpl Symb = I->getRawDataRefImpl();
|
|
uint8_t NType = Obj.is64Bit() ? Obj.getSymbol64TableEntry(Symb).n_type
|
|
: Obj.getSymbolTableEntry(Symb).n_type;
|
|
|
|
if (NType & MachO::N_STAB)
|
|
return '-';
|
|
|
|
switch (NType & MachO::N_TYPE) {
|
|
case MachO::N_ABS:
|
|
return 's';
|
|
case MachO::N_INDR:
|
|
return 'i';
|
|
case MachO::N_SECT: {
|
|
Expected<section_iterator> SecOrErr = Obj.getSymbolSection(Symb);
|
|
if (!SecOrErr) {
|
|
consumeError(SecOrErr.takeError());
|
|
return 's';
|
|
}
|
|
section_iterator Sec = *SecOrErr;
|
|
if (Sec == Obj.section_end())
|
|
return 's';
|
|
DataRefImpl Ref = Sec->getRawDataRefImpl();
|
|
StringRef SectionName;
|
|
Obj.getSectionName(Ref, SectionName);
|
|
StringRef SegmentName = Obj.getSectionFinalSegmentName(Ref);
|
|
if (Obj.is64Bit() && Obj.getHeader64().filetype == MachO::MH_KEXT_BUNDLE &&
|
|
SegmentName == "__TEXT_EXEC" && SectionName == "__text")
|
|
return 't';
|
|
if (SegmentName == "__TEXT" && SectionName == "__text")
|
|
return 't';
|
|
if (SegmentName == "__DATA" && SectionName == "__data")
|
|
return 'd';
|
|
if (SegmentName == "__DATA" && SectionName == "__bss")
|
|
return 'b';
|
|
return 's';
|
|
}
|
|
}
|
|
|
|
return '?';
|
|
}
|
|
|
|
static char getSymbolNMTypeChar(WasmObjectFile &Obj, basic_symbol_iterator I) {
|
|
uint32_t Flags = I->getFlags();
|
|
if (Flags & SymbolRef::SF_Executable)
|
|
return 't';
|
|
return 'd';
|
|
}
|
|
|
|
static char getSymbolNMTypeChar(IRObjectFile &Obj, basic_symbol_iterator I) {
|
|
uint32_t Flags = I->getFlags();
|
|
// FIXME: should we print 'b'? At the IR level we cannot be sure if this
|
|
// will be in bss or not, but we could approximate.
|
|
if (Flags & SymbolRef::SF_Executable)
|
|
return 't';
|
|
else if (Triple(Obj.getTargetTriple()).isOSDarwin() &&
|
|
(Flags & SymbolRef::SF_Const))
|
|
return 's';
|
|
else
|
|
return 'd';
|
|
}
|
|
|
|
static bool isObject(SymbolicFile &Obj, basic_symbol_iterator I) {
|
|
return !dyn_cast<ELFObjectFileBase>(&Obj)
|
|
? false
|
|
: elf_symbol_iterator(I)->getELFType() == ELF::STT_OBJECT;
|
|
}
|
|
|
|
static char getNMTypeChar(SymbolicFile &Obj, basic_symbol_iterator I) {
|
|
uint32_t Symflags = I->getFlags();
|
|
if ((Symflags & object::SymbolRef::SF_Weak) && !isa<MachOObjectFile>(Obj)) {
|
|
char Ret = isObject(Obj, I) ? 'v' : 'w';
|
|
return (!(Symflags & object::SymbolRef::SF_Undefined)) ? toupper(Ret) : Ret;
|
|
}
|
|
|
|
if (Symflags & object::SymbolRef::SF_Undefined)
|
|
return 'U';
|
|
|
|
if (Symflags & object::SymbolRef::SF_Common)
|
|
return 'C';
|
|
|
|
char Ret = '?';
|
|
if (Symflags & object::SymbolRef::SF_Absolute)
|
|
Ret = 'a';
|
|
else if (IRObjectFile *IR = dyn_cast<IRObjectFile>(&Obj))
|
|
Ret = getSymbolNMTypeChar(*IR, I);
|
|
else if (COFFObjectFile *COFF = dyn_cast<COFFObjectFile>(&Obj))
|
|
Ret = getSymbolNMTypeChar(*COFF, I);
|
|
else if (COFFImportFile *COFFImport = dyn_cast<COFFImportFile>(&Obj))
|
|
Ret = getSymbolNMTypeChar(*COFFImport);
|
|
else if (MachOObjectFile *MachO = dyn_cast<MachOObjectFile>(&Obj))
|
|
Ret = getSymbolNMTypeChar(*MachO, I);
|
|
else if (WasmObjectFile *Wasm = dyn_cast<WasmObjectFile>(&Obj))
|
|
Ret = getSymbolNMTypeChar(*Wasm, I);
|
|
else
|
|
Ret = getSymbolNMTypeChar(cast<ELFObjectFileBase>(Obj), I);
|
|
|
|
if (Symflags & object::SymbolRef::SF_Global)
|
|
Ret = toupper(Ret);
|
|
|
|
return Ret;
|
|
}
|
|
|
|
// getNsectForSegSect() is used to implement the Mach-O "-s segname sectname"
|
|
// option to dump only those symbols from that section in a Mach-O file.
|
|
// It is called once for each Mach-O file from dumpSymbolNamesFromObject()
|
|
// to get the section number for that named section from the command line
|
|
// arguments. It returns the section number for that section in the Mach-O
|
|
// file or zero it is not present.
|
|
static unsigned getNsectForSegSect(MachOObjectFile *Obj) {
|
|
unsigned Nsect = 1;
|
|
for (auto &S : Obj->sections()) {
|
|
DataRefImpl Ref = S.getRawDataRefImpl();
|
|
StringRef SectionName;
|
|
Obj->getSectionName(Ref, SectionName);
|
|
StringRef SegmentName = Obj->getSectionFinalSegmentName(Ref);
|
|
if (SegmentName == SegSect[0] && SectionName == SegSect[1])
|
|
return Nsect;
|
|
Nsect++;
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
// getNsectInMachO() is used to implement the Mach-O "-s segname sectname"
|
|
// option to dump only those symbols from that section in a Mach-O file.
|
|
// It is called once for each symbol in a Mach-O file from
|
|
// dumpSymbolNamesFromObject() and returns the section number for that symbol
|
|
// if it is in a section, else it returns 0.
|
|
static unsigned getNsectInMachO(MachOObjectFile &Obj, BasicSymbolRef Sym) {
|
|
DataRefImpl Symb = Sym.getRawDataRefImpl();
|
|
if (Obj.is64Bit()) {
|
|
MachO::nlist_64 STE = Obj.getSymbol64TableEntry(Symb);
|
|
return (STE.n_type & MachO::N_TYPE) == MachO::N_SECT ? STE.n_sect : 0;
|
|
}
|
|
MachO::nlist STE = Obj.getSymbolTableEntry(Symb);
|
|
return (STE.n_type & MachO::N_TYPE) == MachO::N_SECT ? STE.n_sect : 0;
|
|
}
|
|
|
|
static void
|
|
dumpSymbolNamesFromObject(SymbolicFile &Obj, bool printName,
|
|
const std::string &ArchiveName = std::string(),
|
|
const std::string &ArchitectureName = std::string()) {
|
|
auto Symbols = Obj.symbols();
|
|
if (DynamicSyms) {
|
|
const auto *E = dyn_cast<ELFObjectFileBase>(&Obj);
|
|
if (!E) {
|
|
error("File format has no dynamic symbol table", Obj.getFileName());
|
|
return;
|
|
}
|
|
auto DynSymbols = E->getDynamicSymbolIterators();
|
|
Symbols =
|
|
make_range<basic_symbol_iterator>(DynSymbols.begin(), DynSymbols.end());
|
|
}
|
|
std::string NameBuffer;
|
|
raw_string_ostream OS(NameBuffer);
|
|
// If a "-s segname sectname" option was specified and this is a Mach-O
|
|
// file get the section number for that section in this object file.
|
|
unsigned int Nsect = 0;
|
|
MachOObjectFile *MachO = dyn_cast<MachOObjectFile>(&Obj);
|
|
if (!SegSect.empty() && MachO) {
|
|
Nsect = getNsectForSegSect(MachO);
|
|
// If this section is not in the object file no symbols are printed.
|
|
if (Nsect == 0)
|
|
return;
|
|
}
|
|
if (!MachO || !DyldInfoOnly) {
|
|
for (BasicSymbolRef Sym : Symbols) {
|
|
uint32_t SymFlags = Sym.getFlags();
|
|
if (!DebugSyms && (SymFlags & SymbolRef::SF_FormatSpecific))
|
|
continue;
|
|
if (WithoutAliases && (SymFlags & SymbolRef::SF_Indirect))
|
|
continue;
|
|
// If a "-s segname sectname" option was specified and this is a Mach-O
|
|
// file and this section appears in this file, Nsect will be non-zero then
|
|
// see if this symbol is a symbol from that section and if not skip it.
|
|
if (Nsect && Nsect != getNsectInMachO(*MachO, Sym))
|
|
continue;
|
|
NMSymbol S = {};
|
|
S.Size = 0;
|
|
S.Address = 0;
|
|
if (isa<ELFObjectFileBase>(&Obj))
|
|
S.Size = ELFSymbolRef(Sym).getSize();
|
|
if (PrintAddress && isa<ObjectFile>(Obj)) {
|
|
SymbolRef SymRef(Sym);
|
|
Expected<uint64_t> AddressOrErr = SymRef.getAddress();
|
|
if (!AddressOrErr) {
|
|
consumeError(AddressOrErr.takeError());
|
|
break;
|
|
}
|
|
S.Address = *AddressOrErr;
|
|
}
|
|
S.TypeChar = getNMTypeChar(Obj, Sym);
|
|
std::error_code EC = Sym.printName(OS);
|
|
if (EC && MachO)
|
|
OS << "bad string index";
|
|
else
|
|
error(EC);
|
|
OS << '\0';
|
|
S.Sym = Sym;
|
|
SymbolList.push_back(S);
|
|
}
|
|
}
|
|
|
|
OS.flush();
|
|
const char *P = NameBuffer.c_str();
|
|
unsigned I;
|
|
for (I = 0; I < SymbolList.size(); ++I) {
|
|
SymbolList[I].Name = P;
|
|
P += strlen(P) + 1;
|
|
}
|
|
|
|
// If this is a Mach-O file where the nlist symbol table is out of sync
|
|
// with the dyld export trie then look through exports and fake up symbols
|
|
// for the ones that are missing (also done with the -add-dyldinfo flag).
|
|
// This is needed if strip(1) -T is run on a binary containing swift
|
|
// language symbols for example. The option -only-dyldinfo will fake up
|
|
// all symbols from the dyld export trie as well as the bind info.
|
|
std::string ExportsNameBuffer;
|
|
raw_string_ostream EOS(ExportsNameBuffer);
|
|
std::string BindsNameBuffer;
|
|
raw_string_ostream BOS(BindsNameBuffer);
|
|
std::string LazysNameBuffer;
|
|
raw_string_ostream LOS(LazysNameBuffer);
|
|
std::string WeaksNameBuffer;
|
|
raw_string_ostream WOS(WeaksNameBuffer);
|
|
std::string FunctionStartsNameBuffer;
|
|
raw_string_ostream FOS(FunctionStartsNameBuffer);
|
|
if (MachO && !NoDyldInfo) {
|
|
MachO::mach_header H;
|
|
MachO::mach_header_64 H_64;
|
|
uint32_t HFlags = 0;
|
|
if (MachO->is64Bit()) {
|
|
H_64 = MachO->MachOObjectFile::getHeader64();
|
|
HFlags = H_64.flags;
|
|
} else {
|
|
H = MachO->MachOObjectFile::getHeader();
|
|
HFlags = H.flags;
|
|
}
|
|
uint64_t BaseSegmentAddress = 0;
|
|
for (const auto &Command : MachO->load_commands()) {
|
|
if (Command.C.cmd == MachO::LC_SEGMENT) {
|
|
MachO::segment_command Seg = MachO->getSegmentLoadCommand(Command);
|
|
if (Seg.fileoff == 0 && Seg.filesize != 0) {
|
|
BaseSegmentAddress = Seg.vmaddr;
|
|
break;
|
|
}
|
|
} else if (Command.C.cmd == MachO::LC_SEGMENT_64) {
|
|
MachO::segment_command_64 Seg = MachO->getSegment64LoadCommand(Command);
|
|
if (Seg.fileoff == 0 && Seg.filesize != 0) {
|
|
BaseSegmentAddress = Seg.vmaddr;
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
if (DyldInfoOnly || AddDyldInfo ||
|
|
HFlags & MachO::MH_NLIST_OUTOFSYNC_WITH_DYLDINFO) {
|
|
unsigned ExportsAdded = 0;
|
|
Error Err = Error::success();
|
|
for (const llvm::object::ExportEntry &Entry : MachO->exports(Err)) {
|
|
bool found = false;
|
|
bool ReExport = false;
|
|
if (!DyldInfoOnly) {
|
|
for (unsigned J = 0; J < SymbolList.size() && !found; ++J) {
|
|
if (SymbolList[J].Address == Entry.address() + BaseSegmentAddress &&
|
|
SymbolList[J].Name == Entry.name())
|
|
found = true;
|
|
}
|
|
}
|
|
if (!found) {
|
|
NMSymbol S = {};
|
|
S.Address = Entry.address() + BaseSegmentAddress;
|
|
S.Size = 0;
|
|
S.TypeChar = '\0';
|
|
S.Name = Entry.name();
|
|
// There is no symbol in the nlist symbol table for this so we set
|
|
// Sym effectivly to null and the rest of code in here must test for
|
|
// it and not do things like Sym.getFlags() for it.
|
|
S.Sym = BasicSymbolRef();
|
|
S.SymFlags = SymbolRef::SF_Global;
|
|
S.Section = SectionRef();
|
|
S.NType = 0;
|
|
S.NSect = 0;
|
|
S.NDesc = 0;
|
|
S.IndirectName = StringRef();
|
|
|
|
uint64_t EFlags = Entry.flags();
|
|
bool Abs = ((EFlags & MachO::EXPORT_SYMBOL_FLAGS_KIND_MASK) ==
|
|
MachO::EXPORT_SYMBOL_FLAGS_KIND_ABSOLUTE);
|
|
bool Resolver = (EFlags &
|
|
MachO::EXPORT_SYMBOL_FLAGS_STUB_AND_RESOLVER);
|
|
ReExport = (EFlags & MachO::EXPORT_SYMBOL_FLAGS_REEXPORT);
|
|
bool WeakDef = (EFlags & MachO::EXPORT_SYMBOL_FLAGS_WEAK_DEFINITION);
|
|
if (WeakDef)
|
|
S.NDesc |= MachO::N_WEAK_DEF;
|
|
if (Abs) {
|
|
S.NType = MachO::N_EXT | MachO::N_ABS;
|
|
S.TypeChar = 'A';
|
|
} else if (ReExport) {
|
|
S.NType = MachO::N_EXT | MachO::N_INDR;
|
|
S.TypeChar = 'I';
|
|
} else {
|
|
S.NType = MachO::N_EXT | MachO::N_SECT;
|
|
if (Resolver) {
|
|
S.Address = Entry.other() + BaseSegmentAddress;
|
|
if ((S.Address & 1) != 0 &&
|
|
!MachO->is64Bit() && H.cputype == MachO::CPU_TYPE_ARM){
|
|
S.Address &= ~1LL;
|
|
S.NDesc |= MachO::N_ARM_THUMB_DEF;
|
|
}
|
|
} else {
|
|
S.Address = Entry.address() + BaseSegmentAddress;
|
|
}
|
|
StringRef SegmentName = StringRef();
|
|
StringRef SectionName = StringRef();
|
|
for (const SectionRef &Section : MachO->sections()) {
|
|
S.NSect++;
|
|
Section.getName(SectionName);
|
|
SegmentName = MachO->getSectionFinalSegmentName(
|
|
Section.getRawDataRefImpl());
|
|
if (S.Address >= Section.getAddress() &&
|
|
S.Address < Section.getAddress() + Section.getSize()) {
|
|
S.Section = Section;
|
|
break;
|
|
} else if (Entry.name() == "__mh_execute_header" &&
|
|
SegmentName == "__TEXT" && SectionName == "__text") {
|
|
S.Section = Section;
|
|
S.NDesc |= MachO::REFERENCED_DYNAMICALLY;
|
|
break;
|
|
}
|
|
}
|
|
if (SegmentName == "__TEXT" && SectionName == "__text")
|
|
S.TypeChar = 'T';
|
|
else if (SegmentName == "__DATA" && SectionName == "__data")
|
|
S.TypeChar = 'D';
|
|
else if (SegmentName == "__DATA" && SectionName == "__bss")
|
|
S.TypeChar = 'B';
|
|
else
|
|
S.TypeChar = 'S';
|
|
}
|
|
SymbolList.push_back(S);
|
|
|
|
EOS << Entry.name();
|
|
EOS << '\0';
|
|
ExportsAdded++;
|
|
|
|
// For ReExports there are a two more things to do, first add the
|
|
// indirect name and second create the undefined symbol using the
|
|
// referened dynamic library.
|
|
if (ReExport) {
|
|
|
|
// Add the indirect name.
|
|
if (Entry.otherName().empty())
|
|
EOS << Entry.name();
|
|
else
|
|
EOS << Entry.otherName();
|
|
EOS << '\0';
|
|
|
|
// Now create the undefined symbol using the referened dynamic
|
|
// library.
|
|
NMSymbol U = {};
|
|
U.Address = 0;
|
|
U.Size = 0;
|
|
U.TypeChar = 'U';
|
|
if (Entry.otherName().empty())
|
|
U.Name = Entry.name();
|
|
else
|
|
U.Name = Entry.otherName();
|
|
// Again there is no symbol in the nlist symbol table for this so
|
|
// we set Sym effectivly to null and the rest of code in here must
|
|
// test for it and not do things like Sym.getFlags() for it.
|
|
U.Sym = BasicSymbolRef();
|
|
U.SymFlags = SymbolRef::SF_Global | SymbolRef::SF_Undefined;
|
|
U.Section = SectionRef();
|
|
U.NType = MachO::N_EXT | MachO::N_UNDF;
|
|
U.NSect = 0;
|
|
U.NDesc = 0;
|
|
// The library ordinal for this undefined symbol is in the export
|
|
// trie Entry.other().
|
|
MachO::SET_LIBRARY_ORDINAL(U.NDesc, Entry.other());
|
|
U.IndirectName = StringRef();
|
|
SymbolList.push_back(U);
|
|
|
|
// Finally add the undefined symbol's name.
|
|
if (Entry.otherName().empty())
|
|
EOS << Entry.name();
|
|
else
|
|
EOS << Entry.otherName();
|
|
EOS << '\0';
|
|
ExportsAdded++;
|
|
}
|
|
}
|
|
}
|
|
if (Err)
|
|
error(std::move(Err), MachO->getFileName());
|
|
// Set the symbol names and indirect names for the added symbols.
|
|
if (ExportsAdded) {
|
|
EOS.flush();
|
|
const char *Q = ExportsNameBuffer.c_str();
|
|
for (unsigned K = 0; K < ExportsAdded; K++) {
|
|
SymbolList[I].Name = Q;
|
|
Q += strlen(Q) + 1;
|
|
if (SymbolList[I].TypeChar == 'I') {
|
|
SymbolList[I].IndirectName = Q;
|
|
Q += strlen(Q) + 1;
|
|
}
|
|
I++;
|
|
}
|
|
}
|
|
|
|
// Add the undefined symbols from the bind entries.
|
|
unsigned BindsAdded = 0;
|
|
Error BErr = Error::success();
|
|
StringRef LastSymbolName = StringRef();
|
|
for (const llvm::object::MachOBindEntry &Entry : MachO->bindTable(BErr)) {
|
|
bool found = false;
|
|
if (LastSymbolName == Entry.symbolName())
|
|
found = true;
|
|
else if(!DyldInfoOnly) {
|
|
for (unsigned J = 0; J < SymbolList.size() && !found; ++J) {
|
|
if (SymbolList[J].Name == Entry.symbolName())
|
|
found = true;
|
|
}
|
|
}
|
|
if (!found) {
|
|
LastSymbolName = Entry.symbolName();
|
|
NMSymbol B = {};
|
|
B.Address = 0;
|
|
B.Size = 0;
|
|
B.TypeChar = 'U';
|
|
// There is no symbol in the nlist symbol table for this so we set
|
|
// Sym effectivly to null and the rest of code in here must test for
|
|
// it and not do things like Sym.getFlags() for it.
|
|
B.Sym = BasicSymbolRef();
|
|
B.SymFlags = SymbolRef::SF_Global | SymbolRef::SF_Undefined;
|
|
B.NType = MachO::N_EXT | MachO::N_UNDF;
|
|
B.NSect = 0;
|
|
B.NDesc = 0;
|
|
B.NDesc = 0;
|
|
MachO::SET_LIBRARY_ORDINAL(B.NDesc, Entry.ordinal());
|
|
B.IndirectName = StringRef();
|
|
B.Name = Entry.symbolName();
|
|
SymbolList.push_back(B);
|
|
BOS << Entry.symbolName();
|
|
BOS << '\0';
|
|
BindsAdded++;
|
|
}
|
|
}
|
|
if (BErr)
|
|
error(std::move(BErr), MachO->getFileName());
|
|
// Set the symbol names and indirect names for the added symbols.
|
|
if (BindsAdded) {
|
|
BOS.flush();
|
|
const char *Q = BindsNameBuffer.c_str();
|
|
for (unsigned K = 0; K < BindsAdded; K++) {
|
|
SymbolList[I].Name = Q;
|
|
Q += strlen(Q) + 1;
|
|
if (SymbolList[I].TypeChar == 'I') {
|
|
SymbolList[I].IndirectName = Q;
|
|
Q += strlen(Q) + 1;
|
|
}
|
|
I++;
|
|
}
|
|
}
|
|
|
|
// Add the undefined symbols from the lazy bind entries.
|
|
unsigned LazysAdded = 0;
|
|
Error LErr = Error::success();
|
|
LastSymbolName = StringRef();
|
|
for (const llvm::object::MachOBindEntry &Entry :
|
|
MachO->lazyBindTable(LErr)) {
|
|
bool found = false;
|
|
if (LastSymbolName == Entry.symbolName())
|
|
found = true;
|
|
else {
|
|
// Here we must check to see it this symbol is already in the
|
|
// SymbolList as it might have already have been added above via a
|
|
// non-lazy (bind) entry.
|
|
for (unsigned J = 0; J < SymbolList.size() && !found; ++J) {
|
|
if (SymbolList[J].Name == Entry.symbolName())
|
|
found = true;
|
|
}
|
|
}
|
|
if (!found) {
|
|
LastSymbolName = Entry.symbolName();
|
|
NMSymbol L = {};
|
|
L.Name = Entry.symbolName();
|
|
L.Address = 0;
|
|
L.Size = 0;
|
|
L.TypeChar = 'U';
|
|
// There is no symbol in the nlist symbol table for this so we set
|
|
// Sym effectivly to null and the rest of code in here must test for
|
|
// it and not do things like Sym.getFlags() for it.
|
|
L.Sym = BasicSymbolRef();
|
|
L.SymFlags = SymbolRef::SF_Global | SymbolRef::SF_Undefined;
|
|
L.NType = MachO::N_EXT | MachO::N_UNDF;
|
|
L.NSect = 0;
|
|
// The REFERENCE_FLAG_UNDEFINED_LAZY is no longer used but here it
|
|
// makes sence since we are creating this from a lazy bind entry.
|
|
L.NDesc = MachO::REFERENCE_FLAG_UNDEFINED_LAZY;
|
|
MachO::SET_LIBRARY_ORDINAL(L.NDesc, Entry.ordinal());
|
|
L.IndirectName = StringRef();
|
|
SymbolList.push_back(L);
|
|
LOS << Entry.symbolName();
|
|
LOS << '\0';
|
|
LazysAdded++;
|
|
}
|
|
}
|
|
if (LErr)
|
|
error(std::move(LErr), MachO->getFileName());
|
|
// Set the symbol names and indirect names for the added symbols.
|
|
if (LazysAdded) {
|
|
LOS.flush();
|
|
const char *Q = LazysNameBuffer.c_str();
|
|
for (unsigned K = 0; K < LazysAdded; K++) {
|
|
SymbolList[I].Name = Q;
|
|
Q += strlen(Q) + 1;
|
|
if (SymbolList[I].TypeChar == 'I') {
|
|
SymbolList[I].IndirectName = Q;
|
|
Q += strlen(Q) + 1;
|
|
}
|
|
I++;
|
|
}
|
|
}
|
|
|
|
// Add the undefineds symbol from the weak bind entries which are not
|
|
// strong symbols.
|
|
unsigned WeaksAdded = 0;
|
|
Error WErr = Error::success();
|
|
LastSymbolName = StringRef();
|
|
for (const llvm::object::MachOBindEntry &Entry :
|
|
MachO->weakBindTable(WErr)) {
|
|
bool found = false;
|
|
unsigned J = 0;
|
|
if (LastSymbolName == Entry.symbolName() ||
|
|
Entry.flags() & MachO::BIND_SYMBOL_FLAGS_NON_WEAK_DEFINITION) {
|
|
found = true;
|
|
} else {
|
|
for (J = 0; J < SymbolList.size() && !found; ++J) {
|
|
if (SymbolList[J].Name == Entry.symbolName()) {
|
|
found = true;
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
if (!found) {
|
|
LastSymbolName = Entry.symbolName();
|
|
NMSymbol W;
|
|
memset(&W, '\0', sizeof(NMSymbol));
|
|
W.Name = Entry.symbolName();
|
|
W.Address = 0;
|
|
W.Size = 0;
|
|
W.TypeChar = 'U';
|
|
// There is no symbol in the nlist symbol table for this so we set
|
|
// Sym effectivly to null and the rest of code in here must test for
|
|
// it and not do things like Sym.getFlags() for it.
|
|
W.Sym = BasicSymbolRef();
|
|
W.SymFlags = SymbolRef::SF_Global | SymbolRef::SF_Undefined;
|
|
W.NType = MachO::N_EXT | MachO::N_UNDF;
|
|
W.NSect = 0;
|
|
// Odd that we are using N_WEAK_DEF on an undefined symbol but that is
|
|
// what is created in this case by the linker when there are real
|
|
// symbols in the nlist structs.
|
|
W.NDesc = MachO::N_WEAK_DEF;
|
|
W.IndirectName = StringRef();
|
|
SymbolList.push_back(W);
|
|
WOS << Entry.symbolName();
|
|
WOS << '\0';
|
|
WeaksAdded++;
|
|
} else {
|
|
// This is the case the symbol was previously been found and it could
|
|
// have been added from a bind or lazy bind symbol. If so and not
|
|
// a definition also mark it as weak.
|
|
if (SymbolList[J].TypeChar == 'U')
|
|
// See comment above about N_WEAK_DEF.
|
|
SymbolList[J].NDesc |= MachO::N_WEAK_DEF;
|
|
}
|
|
}
|
|
if (WErr)
|
|
error(std::move(WErr), MachO->getFileName());
|
|
// Set the symbol names and indirect names for the added symbols.
|
|
if (WeaksAdded) {
|
|
WOS.flush();
|
|
const char *Q = WeaksNameBuffer.c_str();
|
|
for (unsigned K = 0; K < WeaksAdded; K++) {
|
|
SymbolList[I].Name = Q;
|
|
Q += strlen(Q) + 1;
|
|
if (SymbolList[I].TypeChar == 'I') {
|
|
SymbolList[I].IndirectName = Q;
|
|
Q += strlen(Q) + 1;
|
|
}
|
|
I++;
|
|
}
|
|
}
|
|
|
|
// Trying adding symbol from the function starts table and LC_MAIN entry
|
|
// point.
|
|
SmallVector<uint64_t, 8> FoundFns;
|
|
uint64_t lc_main_offset = UINT64_MAX;
|
|
for (const auto &Command : MachO->load_commands()) {
|
|
if (Command.C.cmd == MachO::LC_FUNCTION_STARTS) {
|
|
// We found a function starts segment, parse the addresses for
|
|
// consumption.
|
|
MachO::linkedit_data_command LLC =
|
|
MachO->getLinkeditDataLoadCommand(Command);
|
|
|
|
MachO->ReadULEB128s(LLC.dataoff, FoundFns);
|
|
} else if (Command.C.cmd == MachO::LC_MAIN) {
|
|
MachO::entry_point_command LCmain =
|
|
MachO->getEntryPointCommand(Command);
|
|
lc_main_offset = LCmain.entryoff;
|
|
}
|
|
}
|
|
// See if these addresses are already in the symbol table.
|
|
unsigned FunctionStartsAdded = 0;
|
|
for (uint64_t f = 0; f < FoundFns.size(); f++) {
|
|
bool found = false;
|
|
for (unsigned J = 0; J < SymbolList.size() && !found; ++J) {
|
|
if (SymbolList[J].Address == FoundFns[f] + BaseSegmentAddress)
|
|
found = true;
|
|
}
|
|
// See this address is not already in the symbol table fake up an
|
|
// nlist for it.
|
|
if (!found) {
|
|
NMSymbol F = {};
|
|
F.Name = "<redacted function X>";
|
|
F.Address = FoundFns[f] + BaseSegmentAddress;
|
|
F.Size = 0;
|
|
// There is no symbol in the nlist symbol table for this so we set
|
|
// Sym effectivly to null and the rest of code in here must test for
|
|
// it and not do things like Sym.getFlags() for it.
|
|
F.Sym = BasicSymbolRef();
|
|
F.SymFlags = 0;
|
|
F.NType = MachO::N_SECT;
|
|
F.NSect = 0;
|
|
StringRef SegmentName = StringRef();
|
|
StringRef SectionName = StringRef();
|
|
for (const SectionRef &Section : MachO->sections()) {
|
|
Section.getName(SectionName);
|
|
SegmentName = MachO->getSectionFinalSegmentName(
|
|
Section.getRawDataRefImpl());
|
|
F.NSect++;
|
|
if (F.Address >= Section.getAddress() &&
|
|
F.Address < Section.getAddress() + Section.getSize()) {
|
|
F.Section = Section;
|
|
break;
|
|
}
|
|
}
|
|
if (SegmentName == "__TEXT" && SectionName == "__text")
|
|
F.TypeChar = 't';
|
|
else if (SegmentName == "__DATA" && SectionName == "__data")
|
|
F.TypeChar = 'd';
|
|
else if (SegmentName == "__DATA" && SectionName == "__bss")
|
|
F.TypeChar = 'b';
|
|
else
|
|
F.TypeChar = 's';
|
|
F.NDesc = 0;
|
|
F.IndirectName = StringRef();
|
|
SymbolList.push_back(F);
|
|
if (FoundFns[f] == lc_main_offset)
|
|
FOS << "<redacted LC_MAIN>";
|
|
else
|
|
FOS << "<redacted function " << f << ">";
|
|
FOS << '\0';
|
|
FunctionStartsAdded++;
|
|
}
|
|
}
|
|
if (FunctionStartsAdded) {
|
|
FOS.flush();
|
|
const char *Q = FunctionStartsNameBuffer.c_str();
|
|
for (unsigned K = 0; K < FunctionStartsAdded; K++) {
|
|
SymbolList[I].Name = Q;
|
|
Q += strlen(Q) + 1;
|
|
if (SymbolList[I].TypeChar == 'I') {
|
|
SymbolList[I].IndirectName = Q;
|
|
Q += strlen(Q) + 1;
|
|
}
|
|
I++;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
CurrentFilename = Obj.getFileName();
|
|
sortAndPrintSymbolList(Obj, printName, ArchiveName, ArchitectureName);
|
|
}
|
|
|
|
// checkMachOAndArchFlags() checks to see if the SymbolicFile is a Mach-O file
|
|
// and if it is and there is a list of architecture flags is specified then
|
|
// check to make sure this Mach-O file is one of those architectures or all
|
|
// architectures was specificed. If not then an error is generated and this
|
|
// routine returns false. Else it returns true.
|
|
static bool checkMachOAndArchFlags(SymbolicFile *O, std::string &Filename) {
|
|
auto *MachO = dyn_cast<MachOObjectFile>(O);
|
|
|
|
if (!MachO || ArchAll || ArchFlags.empty())
|
|
return true;
|
|
|
|
MachO::mach_header H;
|
|
MachO::mach_header_64 H_64;
|
|
Triple T;
|
|
const char *McpuDefault, *ArchFlag;
|
|
if (MachO->is64Bit()) {
|
|
H_64 = MachO->MachOObjectFile::getHeader64();
|
|
T = MachOObjectFile::getArchTriple(H_64.cputype, H_64.cpusubtype,
|
|
&McpuDefault, &ArchFlag);
|
|
} else {
|
|
H = MachO->MachOObjectFile::getHeader();
|
|
T = MachOObjectFile::getArchTriple(H.cputype, H.cpusubtype,
|
|
&McpuDefault, &ArchFlag);
|
|
}
|
|
const std::string ArchFlagName(ArchFlag);
|
|
if (none_of(ArchFlags, [&](const std::string &Name) {
|
|
return Name == ArchFlagName;
|
|
})) {
|
|
error("No architecture specified", Filename);
|
|
return false;
|
|
}
|
|
return true;
|
|
}
|
|
|
|
static void dumpSymbolNamesFromFile(std::string &Filename) {
|
|
ErrorOr<std::unique_ptr<MemoryBuffer>> BufferOrErr =
|
|
MemoryBuffer::getFileOrSTDIN(Filename);
|
|
if (error(BufferOrErr.getError(), Filename))
|
|
return;
|
|
|
|
LLVMContext Context;
|
|
LLVMContext *ContextPtr = NoLLVMBitcode ? nullptr : &Context;
|
|
Expected<std::unique_ptr<Binary>> BinaryOrErr =
|
|
createBinary(BufferOrErr.get()->getMemBufferRef(), ContextPtr);
|
|
if (!BinaryOrErr) {
|
|
error(BinaryOrErr.takeError(), Filename);
|
|
return;
|
|
}
|
|
Binary &Bin = *BinaryOrErr.get();
|
|
|
|
if (Archive *A = dyn_cast<Archive>(&Bin)) {
|
|
if (ArchiveMap) {
|
|
Archive::symbol_iterator I = A->symbol_begin();
|
|
Archive::symbol_iterator E = A->symbol_end();
|
|
if (I != E) {
|
|
outs() << "Archive map\n";
|
|
for (; I != E; ++I) {
|
|
Expected<Archive::Child> C = I->getMember();
|
|
if (!C) {
|
|
error(C.takeError(), Filename);
|
|
break;
|
|
}
|
|
Expected<StringRef> FileNameOrErr = C->getName();
|
|
if (!FileNameOrErr) {
|
|
error(FileNameOrErr.takeError(), Filename);
|
|
break;
|
|
}
|
|
StringRef SymName = I->getName();
|
|
outs() << SymName << " in " << FileNameOrErr.get() << "\n";
|
|
}
|
|
outs() << "\n";
|
|
}
|
|
}
|
|
|
|
{
|
|
Error Err = Error::success();
|
|
for (auto &C : A->children(Err)) {
|
|
Expected<std::unique_ptr<Binary>> ChildOrErr =
|
|
C.getAsBinary(ContextPtr);
|
|
if (!ChildOrErr) {
|
|
if (auto E = isNotObjectErrorInvalidFileType(ChildOrErr.takeError()))
|
|
error(std::move(E), Filename, C);
|
|
continue;
|
|
}
|
|
if (SymbolicFile *O = dyn_cast<SymbolicFile>(&*ChildOrErr.get())) {
|
|
if (!MachOPrintSizeWarning && PrintSize && isa<MachOObjectFile>(O)) {
|
|
WithColor::warning(errs(), ToolName)
|
|
<< "sizes with -print-size for Mach-O files are always zero.\n";
|
|
MachOPrintSizeWarning = true;
|
|
}
|
|
if (!checkMachOAndArchFlags(O, Filename))
|
|
return;
|
|
if (!PrintFileName) {
|
|
outs() << "\n";
|
|
if (isa<MachOObjectFile>(O)) {
|
|
outs() << Filename << "(" << O->getFileName() << ")";
|
|
} else
|
|
outs() << O->getFileName();
|
|
outs() << ":\n";
|
|
}
|
|
dumpSymbolNamesFromObject(*O, false, Filename);
|
|
}
|
|
}
|
|
if (Err)
|
|
error(std::move(Err), A->getFileName());
|
|
}
|
|
return;
|
|
}
|
|
if (MachOUniversalBinary *UB = dyn_cast<MachOUniversalBinary>(&Bin)) {
|
|
// If we have a list of architecture flags specified dump only those.
|
|
if (!ArchAll && !ArchFlags.empty()) {
|
|
// Look for a slice in the universal binary that matches each ArchFlag.
|
|
bool ArchFound;
|
|
for (unsigned i = 0; i < ArchFlags.size(); ++i) {
|
|
ArchFound = false;
|
|
for (MachOUniversalBinary::object_iterator I = UB->begin_objects(),
|
|
E = UB->end_objects();
|
|
I != E; ++I) {
|
|
if (ArchFlags[i] == I->getArchFlagName()) {
|
|
ArchFound = true;
|
|
Expected<std::unique_ptr<ObjectFile>> ObjOrErr =
|
|
I->getAsObjectFile();
|
|
std::string ArchiveName;
|
|
std::string ArchitectureName;
|
|
ArchiveName.clear();
|
|
ArchitectureName.clear();
|
|
if (ObjOrErr) {
|
|
ObjectFile &Obj = *ObjOrErr.get();
|
|
if (ArchFlags.size() > 1) {
|
|
if (PrintFileName)
|
|
ArchitectureName = I->getArchFlagName();
|
|
else
|
|
outs() << "\n" << Obj.getFileName() << " (for architecture "
|
|
<< I->getArchFlagName() << ")"
|
|
<< ":\n";
|
|
}
|
|
dumpSymbolNamesFromObject(Obj, false, ArchiveName,
|
|
ArchitectureName);
|
|
} else if (auto E = isNotObjectErrorInvalidFileType(
|
|
ObjOrErr.takeError())) {
|
|
error(std::move(E), Filename, ArchFlags.size() > 1 ?
|
|
StringRef(I->getArchFlagName()) : StringRef());
|
|
continue;
|
|
} else if (Expected<std::unique_ptr<Archive>> AOrErr =
|
|
I->getAsArchive()) {
|
|
std::unique_ptr<Archive> &A = *AOrErr;
|
|
Error Err = Error::success();
|
|
for (auto &C : A->children(Err)) {
|
|
Expected<std::unique_ptr<Binary>> ChildOrErr =
|
|
C.getAsBinary(ContextPtr);
|
|
if (!ChildOrErr) {
|
|
if (auto E = isNotObjectErrorInvalidFileType(
|
|
ChildOrErr.takeError())) {
|
|
error(std::move(E), Filename, C, ArchFlags.size() > 1 ?
|
|
StringRef(I->getArchFlagName()) : StringRef());
|
|
}
|
|
continue;
|
|
}
|
|
if (SymbolicFile *O =
|
|
dyn_cast<SymbolicFile>(&*ChildOrErr.get())) {
|
|
if (PrintFileName) {
|
|
ArchiveName = A->getFileName();
|
|
if (ArchFlags.size() > 1)
|
|
ArchitectureName = I->getArchFlagName();
|
|
} else {
|
|
outs() << "\n" << A->getFileName();
|
|
outs() << "(" << O->getFileName() << ")";
|
|
if (ArchFlags.size() > 1) {
|
|
outs() << " (for architecture " << I->getArchFlagName()
|
|
<< ")";
|
|
}
|
|
outs() << ":\n";
|
|
}
|
|
dumpSymbolNamesFromObject(*O, false, ArchiveName,
|
|
ArchitectureName);
|
|
}
|
|
}
|
|
if (Err)
|
|
error(std::move(Err), A->getFileName());
|
|
} else {
|
|
consumeError(AOrErr.takeError());
|
|
error(Filename + " for architecture " +
|
|
StringRef(I->getArchFlagName()) +
|
|
" is not a Mach-O file or an archive file",
|
|
"Mach-O universal file");
|
|
}
|
|
}
|
|
}
|
|
if (!ArchFound) {
|
|
error(ArchFlags[i],
|
|
"file: " + Filename + " does not contain architecture");
|
|
return;
|
|
}
|
|
}
|
|
return;
|
|
}
|
|
// No architecture flags were specified so if this contains a slice that
|
|
// matches the host architecture dump only that.
|
|
if (!ArchAll) {
|
|
Triple HostTriple = MachOObjectFile::getHostArch();
|
|
StringRef HostArchName = HostTriple.getArchName();
|
|
for (MachOUniversalBinary::object_iterator I = UB->begin_objects(),
|
|
E = UB->end_objects();
|
|
I != E; ++I) {
|
|
if (HostArchName == I->getArchFlagName()) {
|
|
Expected<std::unique_ptr<ObjectFile>> ObjOrErr = I->getAsObjectFile();
|
|
std::string ArchiveName;
|
|
if (ObjOrErr) {
|
|
ObjectFile &Obj = *ObjOrErr.get();
|
|
dumpSymbolNamesFromObject(Obj, false);
|
|
} else if (auto E = isNotObjectErrorInvalidFileType(
|
|
ObjOrErr.takeError())) {
|
|
error(std::move(E), Filename);
|
|
return;
|
|
} else if (Expected<std::unique_ptr<Archive>> AOrErr =
|
|
I->getAsArchive()) {
|
|
std::unique_ptr<Archive> &A = *AOrErr;
|
|
Error Err = Error::success();
|
|
for (auto &C : A->children(Err)) {
|
|
Expected<std::unique_ptr<Binary>> ChildOrErr =
|
|
C.getAsBinary(ContextPtr);
|
|
if (!ChildOrErr) {
|
|
if (auto E = isNotObjectErrorInvalidFileType(
|
|
ChildOrErr.takeError()))
|
|
error(std::move(E), Filename, C);
|
|
continue;
|
|
}
|
|
if (SymbolicFile *O =
|
|
dyn_cast<SymbolicFile>(&*ChildOrErr.get())) {
|
|
if (PrintFileName)
|
|
ArchiveName = A->getFileName();
|
|
else
|
|
outs() << "\n" << A->getFileName() << "(" << O->getFileName()
|
|
<< ")"
|
|
<< ":\n";
|
|
dumpSymbolNamesFromObject(*O, false, ArchiveName);
|
|
}
|
|
}
|
|
if (Err)
|
|
error(std::move(Err), A->getFileName());
|
|
} else {
|
|
consumeError(AOrErr.takeError());
|
|
error(Filename + " for architecture " +
|
|
StringRef(I->getArchFlagName()) +
|
|
" is not a Mach-O file or an archive file",
|
|
"Mach-O universal file");
|
|
}
|
|
return;
|
|
}
|
|
}
|
|
}
|
|
// Either all architectures have been specified or none have been specified
|
|
// and this does not contain the host architecture so dump all the slices.
|
|
bool moreThanOneArch = UB->getNumberOfObjects() > 1;
|
|
for (MachOUniversalBinary::object_iterator I = UB->begin_objects(),
|
|
E = UB->end_objects();
|
|
I != E; ++I) {
|
|
Expected<std::unique_ptr<ObjectFile>> ObjOrErr = I->getAsObjectFile();
|
|
std::string ArchiveName;
|
|
std::string ArchitectureName;
|
|
ArchiveName.clear();
|
|
ArchitectureName.clear();
|
|
if (ObjOrErr) {
|
|
ObjectFile &Obj = *ObjOrErr.get();
|
|
if (PrintFileName) {
|
|
if (isa<MachOObjectFile>(Obj) && moreThanOneArch)
|
|
ArchitectureName = I->getArchFlagName();
|
|
} else {
|
|
if (moreThanOneArch)
|
|
outs() << "\n";
|
|
outs() << Obj.getFileName();
|
|
if (isa<MachOObjectFile>(Obj) && moreThanOneArch)
|
|
outs() << " (for architecture " << I->getArchFlagName() << ")";
|
|
outs() << ":\n";
|
|
}
|
|
dumpSymbolNamesFromObject(Obj, false, ArchiveName, ArchitectureName);
|
|
} else if (auto E = isNotObjectErrorInvalidFileType(
|
|
ObjOrErr.takeError())) {
|
|
error(std::move(E), Filename, moreThanOneArch ?
|
|
StringRef(I->getArchFlagName()) : StringRef());
|
|
continue;
|
|
} else if (Expected<std::unique_ptr<Archive>> AOrErr =
|
|
I->getAsArchive()) {
|
|
std::unique_ptr<Archive> &A = *AOrErr;
|
|
Error Err = Error::success();
|
|
for (auto &C : A->children(Err)) {
|
|
Expected<std::unique_ptr<Binary>> ChildOrErr =
|
|
C.getAsBinary(ContextPtr);
|
|
if (!ChildOrErr) {
|
|
if (auto E = isNotObjectErrorInvalidFileType(
|
|
ChildOrErr.takeError()))
|
|
error(std::move(E), Filename, C, moreThanOneArch ?
|
|
StringRef(ArchitectureName) : StringRef());
|
|
continue;
|
|
}
|
|
if (SymbolicFile *O = dyn_cast<SymbolicFile>(&*ChildOrErr.get())) {
|
|
if (PrintFileName) {
|
|
ArchiveName = A->getFileName();
|
|
if (isa<MachOObjectFile>(O) && moreThanOneArch)
|
|
ArchitectureName = I->getArchFlagName();
|
|
} else {
|
|
outs() << "\n" << A->getFileName();
|
|
if (isa<MachOObjectFile>(O)) {
|
|
outs() << "(" << O->getFileName() << ")";
|
|
if (moreThanOneArch)
|
|
outs() << " (for architecture " << I->getArchFlagName()
|
|
<< ")";
|
|
} else
|
|
outs() << ":" << O->getFileName();
|
|
outs() << ":\n";
|
|
}
|
|
dumpSymbolNamesFromObject(*O, false, ArchiveName, ArchitectureName);
|
|
}
|
|
}
|
|
if (Err)
|
|
error(std::move(Err), A->getFileName());
|
|
} else {
|
|
consumeError(AOrErr.takeError());
|
|
error(Filename + " for architecture " +
|
|
StringRef(I->getArchFlagName()) +
|
|
" is not a Mach-O file or an archive file",
|
|
"Mach-O universal file");
|
|
}
|
|
}
|
|
return;
|
|
}
|
|
if (SymbolicFile *O = dyn_cast<SymbolicFile>(&Bin)) {
|
|
if (!MachOPrintSizeWarning && PrintSize && isa<MachOObjectFile>(O)) {
|
|
WithColor::warning(errs(), ToolName)
|
|
<< "sizes with -print-size for Mach-O files are always zero.\n";
|
|
MachOPrintSizeWarning = true;
|
|
}
|
|
if (!checkMachOAndArchFlags(O, Filename))
|
|
return;
|
|
dumpSymbolNamesFromObject(*O, true);
|
|
}
|
|
}
|
|
|
|
int main(int argc, char **argv) {
|
|
InitLLVM X(argc, argv);
|
|
cl::ParseCommandLineOptions(argc, argv, "llvm symbol table dumper\n");
|
|
|
|
// llvm-nm only reads binary files.
|
|
if (error(sys::ChangeStdinToBinary()))
|
|
return 1;
|
|
|
|
// These calls are needed so that we can read bitcode correctly.
|
|
llvm::InitializeAllTargetInfos();
|
|
llvm::InitializeAllTargetMCs();
|
|
llvm::InitializeAllAsmParsers();
|
|
|
|
ToolName = argv[0];
|
|
if (BSDFormat)
|
|
OutputFormat = bsd;
|
|
if (POSIXFormat)
|
|
OutputFormat = posix;
|
|
if (DarwinFormat)
|
|
OutputFormat = darwin;
|
|
|
|
// The relative order of these is important. If you pass --size-sort it should
|
|
// only print out the size. However, if you pass -S --size-sort, it should
|
|
// print out both the size and address.
|
|
if (SizeSort && !PrintSize)
|
|
PrintAddress = false;
|
|
if (OutputFormat == sysv || SizeSort)
|
|
PrintSize = true;
|
|
if (InputFilenames.empty())
|
|
InputFilenames.push_back("a.out");
|
|
if (InputFilenames.size() > 1)
|
|
MultipleFiles = true;
|
|
|
|
for (unsigned i = 0; i < ArchFlags.size(); ++i) {
|
|
if (ArchFlags[i] == "all") {
|
|
ArchAll = true;
|
|
} else {
|
|
if (!MachOObjectFile::isValidArch(ArchFlags[i]))
|
|
error("Unknown architecture named '" + ArchFlags[i] + "'",
|
|
"for the -arch option");
|
|
}
|
|
}
|
|
|
|
if (!SegSect.empty() && SegSect.size() != 2)
|
|
error("bad number of arguments (must be two arguments)",
|
|
"for the -s option");
|
|
|
|
if (NoDyldInfo && (AddDyldInfo || DyldInfoOnly))
|
|
error("-no-dyldinfo can't be used with -add-dyldinfo or -dyldinfo-only");
|
|
|
|
llvm::for_each(InputFilenames, dumpSymbolNamesFromFile);
|
|
|
|
if (HadError)
|
|
return 1;
|
|
}
|