forked from OSchip/llvm-project
[llvm-objdump] Use the COFF export table for additional symbols
Most linked executables do not have a symbol table in COFF. However, it is pretty typical to have some export entries. Use those entries to inform the disassembler about potential function definitions and call targets. llvm-svn: 253429
This commit is contained in:
parent
67361cc2e1
commit
fbb1c3a70b
|
@ -15,8 +15,8 @@ define hidden i32 @bah(i8* %start) #0 align 2 {
|
||||||
; ARM: $t
|
; ARM: $t
|
||||||
; ARM-NEXT: 48 1c
|
; ARM-NEXT: 48 1c
|
||||||
|
|
||||||
; THUMB: $a
|
; THUMB: $a{{.*}}:
|
||||||
; THUMB-NEXT: 04 70
|
; THUMB-NEXT: 04 70
|
||||||
; THUMB-NEXT: 2d e5
|
; THUMB-NEXT: 2d e5
|
||||||
; THUMB: $t
|
; THUMB: $t{{.*}}:
|
||||||
; THUMB-NEXT: 48 1c adds r0, r1, #1
|
; THUMB-NEXT: 48 1c adds r0, r1, #1
|
||||||
|
|
Binary file not shown.
|
@ -0,0 +1,8 @@
|
||||||
|
// RUN: llvm-objdump -d %p/Inputs/disassemble.dll.coff-i386 | \
|
||||||
|
// RUN: FileCheck %s
|
||||||
|
|
||||||
|
// CHECK-LABEL: g:
|
||||||
|
// CHECK: calll 8 <f>
|
||||||
|
|
||||||
|
// CHECK-LABEL: f:
|
||||||
|
// CHECK: calll -24 <g>
|
|
@ -886,27 +886,66 @@ static void DisassembleObject(const ObjectFile *Obj, bool InlineRelocs) {
|
||||||
}
|
}
|
||||||
|
|
||||||
// Create a mapping from virtual address to symbol name. This is used to
|
// Create a mapping from virtual address to symbol name. This is used to
|
||||||
// pretty print the target of a call.
|
// pretty print the symbols while disassembling.
|
||||||
std::vector<std::pair<uint64_t, StringRef>> AllSymbols;
|
typedef std::vector<std::pair<uint64_t, StringRef>> SectionSymbolsTy;
|
||||||
if (MIA) {
|
std::map<SectionRef, SectionSymbolsTy> AllSymbols;
|
||||||
for (const SymbolRef &Symbol : Obj->symbols()) {
|
for (const SymbolRef &Symbol : Obj->symbols()) {
|
||||||
if (Symbol.getType() != SymbolRef::ST_Function)
|
ErrorOr<uint64_t> AddressOrErr = Symbol.getAddress();
|
||||||
continue;
|
error(AddressOrErr.getError());
|
||||||
|
uint64_t Address = *AddressOrErr;
|
||||||
|
|
||||||
ErrorOr<uint64_t> AddressOrErr = Symbol.getAddress();
|
ErrorOr<StringRef> Name = Symbol.getName();
|
||||||
error(AddressOrErr.getError());
|
error(Name.getError());
|
||||||
uint64_t Address = *AddressOrErr;
|
if (Name->empty())
|
||||||
|
continue;
|
||||||
|
|
||||||
ErrorOr<StringRef> Name = Symbol.getName();
|
ErrorOr<section_iterator> SectionOrErr = Symbol.getSection();
|
||||||
error(Name.getError());
|
error(SectionOrErr.getError());
|
||||||
if (Name->empty())
|
section_iterator SecI = *SectionOrErr;
|
||||||
continue;
|
if (SecI == Obj->section_end())
|
||||||
AllSymbols.push_back(std::make_pair(Address, *Name));
|
continue;
|
||||||
}
|
|
||||||
|
|
||||||
array_pod_sort(AllSymbols.begin(), AllSymbols.end());
|
AllSymbols[*SecI].emplace_back(Address, *Name);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// Create a mapping from virtual address to section.
|
||||||
|
std::vector<std::pair<uint64_t, SectionRef>> SectionAddresses;
|
||||||
|
for (SectionRef Sec : Obj->sections())
|
||||||
|
SectionAddresses.emplace_back(Sec.getAddress(), Sec);
|
||||||
|
array_pod_sort(SectionAddresses.begin(), SectionAddresses.end());
|
||||||
|
|
||||||
|
// Linked executables (.exe and .dll files) typically don't include a real
|
||||||
|
// symbol table but they might contain an export table.
|
||||||
|
if (const auto *COFFObj = dyn_cast<COFFObjectFile>(Obj)) {
|
||||||
|
for (const auto &ExportEntry : COFFObj->export_directories()) {
|
||||||
|
StringRef Name;
|
||||||
|
error(ExportEntry.getSymbolName(Name));
|
||||||
|
if (Name.empty())
|
||||||
|
continue;
|
||||||
|
uint32_t RVA;
|
||||||
|
error(ExportEntry.getExportRVA(RVA));
|
||||||
|
|
||||||
|
uint64_t VA = COFFObj->getImageBase() + RVA;
|
||||||
|
auto Sec = std::upper_bound(
|
||||||
|
SectionAddresses.begin(), SectionAddresses.end(), VA,
|
||||||
|
[](uint64_t LHS, const std::pair<uint64_t, SectionRef> &RHS) {
|
||||||
|
return LHS < RHS.first;
|
||||||
|
});
|
||||||
|
if (Sec != SectionAddresses.begin())
|
||||||
|
--Sec;
|
||||||
|
else
|
||||||
|
Sec = SectionAddresses.end();
|
||||||
|
|
||||||
|
if (Sec != SectionAddresses.end())
|
||||||
|
AllSymbols[Sec->second].emplace_back(VA, Name);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
// Sort all the symbols, this allows us to use a simple binary search to find
|
||||||
|
// a symbol near an address.
|
||||||
|
for (std::pair<const SectionRef, SectionSymbolsTy> &SecSyms : AllSymbols)
|
||||||
|
array_pod_sort(SecSyms.second.begin(), SecSyms.second.end());
|
||||||
|
|
||||||
for (const SectionRef &Section : ToolSectionFilter(*Obj)) {
|
for (const SectionRef &Section : ToolSectionFilter(*Obj)) {
|
||||||
if (!DisassembleAll && (!Section.isText() || Section.isVirtual()))
|
if (!DisassembleAll && (!Section.isText() || Section.isVirtual()))
|
||||||
continue;
|
continue;
|
||||||
|
@ -916,33 +955,21 @@ static void DisassembleObject(const ObjectFile *Obj, bool InlineRelocs) {
|
||||||
if (!SectSize)
|
if (!SectSize)
|
||||||
continue;
|
continue;
|
||||||
|
|
||||||
// Make a list of all the symbols in this section.
|
// Get the list of all the symbols in this section.
|
||||||
std::vector<std::pair<uint64_t, StringRef>> Symbols;
|
SectionSymbolsTy &Symbols = AllSymbols[Section];
|
||||||
std::vector<uint64_t> DataMappingSymsAddr;
|
std::vector<uint64_t> DataMappingSymsAddr;
|
||||||
std::vector<uint64_t> TextMappingSymsAddr;
|
std::vector<uint64_t> TextMappingSymsAddr;
|
||||||
for (const SymbolRef &Symbol : Obj->symbols()) {
|
if (Obj->isELF() && Obj->getArch() == Triple::aarch64) {
|
||||||
if (Section.containsSymbol(Symbol)) {
|
for (const auto &Symb : Symbols) {
|
||||||
ErrorOr<uint64_t> AddressOrErr = Symbol.getAddress();
|
uint64_t Address = Symb.first;
|
||||||
error(AddressOrErr.getError());
|
StringRef Name = Symb.second;
|
||||||
uint64_t Address = *AddressOrErr;
|
if (Name.startswith("$d"))
|
||||||
Address -= SectionAddr;
|
DataMappingSymsAddr.push_back(Address);
|
||||||
if (Address >= SectSize)
|
if (Name.startswith("$x"))
|
||||||
continue;
|
TextMappingSymsAddr.push_back(Address);
|
||||||
|
|
||||||
ErrorOr<StringRef> Name = Symbol.getName();
|
|
||||||
error(Name.getError());
|
|
||||||
Symbols.push_back(std::make_pair(Address, *Name));
|
|
||||||
if (Obj->isELF() && Obj->getArch() == Triple::aarch64) {
|
|
||||||
if (Name->startswith("$d"))
|
|
||||||
DataMappingSymsAddr.push_back(Address);
|
|
||||||
if (Name->startswith("$x"))
|
|
||||||
TextMappingSymsAddr.push_back(Address);
|
|
||||||
}
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
// Sort the symbols by address, just in case they didn't come in that way.
|
|
||||||
array_pod_sort(Symbols.begin(), Symbols.end());
|
|
||||||
std::sort(DataMappingSymsAddr.begin(), DataMappingSymsAddr.end());
|
std::sort(DataMappingSymsAddr.begin(), DataMappingSymsAddr.end());
|
||||||
std::sort(TextMappingSymsAddr.begin(), TextMappingSymsAddr.end());
|
std::sort(TextMappingSymsAddr.begin(), TextMappingSymsAddr.end());
|
||||||
|
|
||||||
|
@ -991,11 +1018,16 @@ static void DisassembleObject(const ObjectFile *Obj, bool InlineRelocs) {
|
||||||
// Disassemble symbol by symbol.
|
// Disassemble symbol by symbol.
|
||||||
for (unsigned si = 0, se = Symbols.size(); si != se; ++si) {
|
for (unsigned si = 0, se = Symbols.size(); si != se; ++si) {
|
||||||
|
|
||||||
uint64_t Start = Symbols[si].first;
|
uint64_t Start = Symbols[si].first - SectionAddr;
|
||||||
// The end is either the section end or the beginning of the next symbol.
|
// The end is either the section end or the beginning of the next
|
||||||
uint64_t End = (si == se - 1) ? SectSize : Symbols[si + 1].first;
|
// symbol.
|
||||||
|
uint64_t End =
|
||||||
|
(si == se - 1) ? SectSize : Symbols[si + 1].first - SectionAddr;
|
||||||
|
// Don't try to disassemble beyond the end of section contents.
|
||||||
|
if (End > SectSize)
|
||||||
|
End = SectSize;
|
||||||
// If this symbol has the same address as the next symbol, then skip it.
|
// If this symbol has the same address as the next symbol, then skip it.
|
||||||
if (Start == End)
|
if (Start >= End)
|
||||||
continue;
|
continue;
|
||||||
|
|
||||||
outs() << '\n' << Symbols[si].second << ":\n";
|
outs() << '\n' << Symbols[si].second << ":\n";
|
||||||
|
@ -1056,26 +1088,55 @@ static void DisassembleObject(const ObjectFile *Obj, bool InlineRelocs) {
|
||||||
SectionAddr + Index, outs(), "", *STI);
|
SectionAddr + Index, outs(), "", *STI);
|
||||||
outs() << CommentStream.str();
|
outs() << CommentStream.str();
|
||||||
Comments.clear();
|
Comments.clear();
|
||||||
|
|
||||||
|
// Try to resolve the target of a call, tail call, etc. to a specific
|
||||||
|
// symbol.
|
||||||
if (MIA && (MIA->isCall(Inst) || MIA->isUnconditionalBranch(Inst) ||
|
if (MIA && (MIA->isCall(Inst) || MIA->isUnconditionalBranch(Inst) ||
|
||||||
MIA->isConditionalBranch(Inst))) {
|
MIA->isConditionalBranch(Inst))) {
|
||||||
uint64_t Target;
|
uint64_t Target;
|
||||||
if (MIA->evaluateBranch(Inst, SectionAddr + Index, Size, Target)) {
|
if (MIA->evaluateBranch(Inst, SectionAddr + Index, Size, Target)) {
|
||||||
auto TargetSym = std::upper_bound(
|
// In a relocatable object, the target's section must reside in
|
||||||
AllSymbols.begin(), AllSymbols.end(), Target,
|
// the same section as the call instruction or it is accessed
|
||||||
[](uint64_t LHS, const std::pair<uint64_t, StringRef> &RHS) {
|
// through a relocation.
|
||||||
return LHS < RHS.first;
|
//
|
||||||
});
|
// In a non-relocatable object, the target may be in any section.
|
||||||
if (TargetSym != AllSymbols.begin())
|
//
|
||||||
--TargetSym;
|
// N.B. We don't walk the relocations in the relocatable case yet.
|
||||||
else
|
auto *TargetSectionSymbols = &Symbols;
|
||||||
TargetSym = AllSymbols.end();
|
if (!Obj->isRelocatableObject()) {
|
||||||
|
auto SectionAddress = std::upper_bound(
|
||||||
|
SectionAddresses.begin(), SectionAddresses.end(), Target,
|
||||||
|
[](uint64_t LHS,
|
||||||
|
const std::pair<uint64_t, SectionRef> &RHS) {
|
||||||
|
return LHS < RHS.first;
|
||||||
|
});
|
||||||
|
if (SectionAddress != SectionAddresses.begin()) {
|
||||||
|
--SectionAddress;
|
||||||
|
TargetSectionSymbols = &AllSymbols[SectionAddress->second];
|
||||||
|
} else {
|
||||||
|
TargetSectionSymbols = nullptr;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
if (TargetSym != AllSymbols.end()) {
|
// Find the first symbol in the section whose offset is less than
|
||||||
outs() << " <" << TargetSym->second;
|
// or equal to the target.
|
||||||
uint64_t Disp = Target - TargetSym->first;
|
if (TargetSectionSymbols) {
|
||||||
if (Disp)
|
auto TargetSym = std::upper_bound(
|
||||||
outs() << '+' << utohexstr(Disp);
|
TargetSectionSymbols->begin(), TargetSectionSymbols->end(),
|
||||||
outs() << '>';
|
Target, [](uint64_t LHS,
|
||||||
|
const std::pair<uint64_t, StringRef> &RHS) {
|
||||||
|
return LHS < RHS.first;
|
||||||
|
});
|
||||||
|
if (TargetSym != Symbols.begin()) {
|
||||||
|
--TargetSym;
|
||||||
|
uint64_t TargetAddress = std::get<0>(*TargetSym);
|
||||||
|
StringRef TargetName = std::get<1>(*TargetSym);
|
||||||
|
outs() << " <" << TargetName;
|
||||||
|
uint64_t Disp = Target - TargetAddress;
|
||||||
|
if (Disp)
|
||||||
|
outs() << '+' << utohexstr(Disp);
|
||||||
|
outs() << '>';
|
||||||
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
Loading…
Reference in New Issue