forked from OSchip/llvm-project
Properly size the string table, and emit symbol table and string table
entries in the correct order, fixing several fixmes. llvm-svn: 29902
This commit is contained in:
parent
34b70eea5c
commit
7851db75d9
|
@ -204,8 +204,6 @@ namespace llvm {
|
||||||
/// the file, and then emit during finalization.
|
/// the file, and then emit during finalization.
|
||||||
MachOHeader Header;
|
MachOHeader Header;
|
||||||
|
|
||||||
private:
|
|
||||||
|
|
||||||
/// MachOSegment - This struct contains the necessary information to
|
/// MachOSegment - This struct contains the necessary information to
|
||||||
/// emit the load commands for each section in the file.
|
/// emit the load commands for each section in the file.
|
||||||
struct MachOSegment {
|
struct MachOSegment {
|
||||||
|
@ -353,6 +351,8 @@ namespace llvm {
|
||||||
reserved3(0) { }
|
reserved3(0) { }
|
||||||
};
|
};
|
||||||
|
|
||||||
|
private:
|
||||||
|
|
||||||
/// SectionList - This is the list of sections that we have emitted to the
|
/// SectionList - This is the list of sections that we have emitted to the
|
||||||
/// file. Once the file has been completely built, the segment load command
|
/// file. Once the file has been completely built, the segment load command
|
||||||
/// SectionCommands are constructed from this info.
|
/// SectionCommands are constructed from this info.
|
||||||
|
@ -472,6 +472,7 @@ namespace llvm {
|
||||||
/// turned into a real symbol table in the file.
|
/// turned into a real symbol table in the file.
|
||||||
struct MachOSym {
|
struct MachOSym {
|
||||||
const GlobalValue *GV; // The global value this corresponds to.
|
const GlobalValue *GV; // The global value this corresponds to.
|
||||||
|
std::string GVName; // The mangled name of the global value.
|
||||||
uint32_t n_strx; // index into the string table
|
uint32_t n_strx; // index into the string table
|
||||||
uint8_t n_type; // type flag
|
uint8_t n_type; // type flag
|
||||||
uint8_t n_sect; // section number or NO_SECT
|
uint8_t n_sect; // section number or NO_SECT
|
||||||
|
@ -510,20 +511,40 @@ namespace llvm {
|
||||||
N_WEAK_DEF = 0x0080 // coalesced symbol is a weak definition
|
N_WEAK_DEF = 0x0080 // coalesced symbol is a weak definition
|
||||||
};
|
};
|
||||||
|
|
||||||
/// entrySize - This routine returns the size of a symbol table entry as
|
MachOSym(const GlobalValue *gv, std::string name, uint8_t sect) : GV(gv),
|
||||||
/// written to disk.
|
GVName(name), n_strx(0), n_type(sect == NO_SECT ? N_UNDF : N_SECT),
|
||||||
static unsigned entrySize() { return 12; }
|
n_sect(sect), n_desc(0), n_value(0) {
|
||||||
|
// FIXME: names aren't getting the proper global/local prefix
|
||||||
MachOSym(const GlobalValue *gv, uint8_t sect) : GV(gv), n_strx(0),
|
}
|
||||||
n_type(sect == NO_SECT ? N_UNDF : N_SECT), n_sect(sect), n_desc(0),
|
|
||||||
n_value(0) {}
|
|
||||||
};
|
};
|
||||||
|
|
||||||
|
struct MachOSymCmp {
|
||||||
|
bool operator()(const MachOSym &LHS, const MachOSym &RHS) {
|
||||||
|
return LHS.GVName < RHS.GVName;
|
||||||
|
}
|
||||||
|
};
|
||||||
|
|
||||||
|
/// PartitionByLocal - Simple boolean predicate that returns true if Sym is
|
||||||
|
/// a local symbol rather than an external symbol.
|
||||||
|
static bool PartitionByLocal(const MachOSym &Sym);
|
||||||
|
|
||||||
|
/// PartitionByDefined - Simple boolean predicate that returns true if Sym
|
||||||
|
/// is defined in this module.
|
||||||
|
static bool PartitionByDefined(const MachOWriter::MachOSym &Sym);
|
||||||
|
|
||||||
/// SymbolTable - This is the list of symbols we have emitted to the file.
|
/// SymbolTable - This is the list of symbols we have emitted to the file.
|
||||||
/// This actually gets rearranged before emission to the file (to put the
|
/// This actually gets rearranged before emission to the file (to put the
|
||||||
/// local symbols first in the list).
|
/// local symbols first in the list).
|
||||||
std::vector<MachOSym> SymbolTable;
|
std::vector<MachOSym> SymbolTable;
|
||||||
|
|
||||||
|
/// SymT - A buffer to hold the symbol table before we write it out at the
|
||||||
|
/// appropriate location in the file.
|
||||||
|
DataBuffer SymT;
|
||||||
|
|
||||||
|
/// StrT - A buffer to hold the string table before we write it out at the
|
||||||
|
/// appropriate location in the file.
|
||||||
|
DataBuffer StrT;
|
||||||
|
|
||||||
/// PendingSyms - This is a list of externally defined symbols that we have
|
/// PendingSyms - This is a list of externally defined symbols that we have
|
||||||
/// been asked to emit, but have not seen a reference to. When a reference
|
/// been asked to emit, but have not seen a reference to. When a reference
|
||||||
/// is seen, the symbol will move from this list to the SymbolTable.
|
/// is seen, the symbol will move from this list to the SymbolTable.
|
||||||
|
@ -533,9 +554,6 @@ namespace llvm {
|
||||||
/// SymbolTable to aid in emitting the DYSYMTAB load command.
|
/// SymbolTable to aid in emitting the DYSYMTAB load command.
|
||||||
std::vector<unsigned> DynamicSymbolTable;
|
std::vector<unsigned> DynamicSymbolTable;
|
||||||
|
|
||||||
/// StringTable - The table of strings referenced by SymbolTable entries
|
|
||||||
std::vector<std::string> StringTable;
|
|
||||||
|
|
||||||
// align - Emit padding into the file until the current output position is
|
// align - Emit padding into the file until the current output position is
|
||||||
// aligned to the specified power of two boundary.
|
// aligned to the specified power of two boundary.
|
||||||
static void align(DataBuffer &Output, unsigned Boundary) {
|
static void align(DataBuffer &Output, unsigned Boundary) {
|
||||||
|
@ -624,8 +642,7 @@ namespace llvm {
|
||||||
void EmitHeaderAndLoadCommands();
|
void EmitHeaderAndLoadCommands();
|
||||||
void EmitSections();
|
void EmitSections();
|
||||||
void EmitRelocations();
|
void EmitRelocations();
|
||||||
void EmitSymbolTable();
|
void BufferSymbolAndStringTable();
|
||||||
void EmitStringTable();
|
|
||||||
};
|
};
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -30,6 +30,7 @@
|
||||||
#include "llvm/Target/TargetJITInfo.h"
|
#include "llvm/Target/TargetJITInfo.h"
|
||||||
#include "llvm/Support/Mangler.h"
|
#include "llvm/Support/Mangler.h"
|
||||||
#include "llvm/Support/MathExtras.h"
|
#include "llvm/Support/MathExtras.h"
|
||||||
|
#include <algorithm>
|
||||||
#include <iostream>
|
#include <iostream>
|
||||||
using namespace llvm;
|
using namespace llvm;
|
||||||
|
|
||||||
|
@ -128,10 +129,11 @@ bool MachOCodeEmitter::finishFunction(MachineFunction &F) {
|
||||||
MOS->size += CurBufferPtr - BufferBegin;
|
MOS->size += CurBufferPtr - BufferBegin;
|
||||||
|
|
||||||
// Get a symbol for the function to add to the symbol table
|
// Get a symbol for the function to add to the symbol table
|
||||||
MachOWriter::MachOSym FnSym(F.getFunction(), MOS->Index);
|
const GlobalValue *FuncV = F.getFunction();
|
||||||
|
MachOWriter::MachOSym FnSym(FuncV, MOW.Mang->getValueName(FuncV), MOS->Index);
|
||||||
|
|
||||||
// Figure out the binding (linkage) of the symbol.
|
// Figure out the binding (linkage) of the symbol.
|
||||||
switch (F.getFunction()->getLinkage()) {
|
switch (FuncV->getLinkage()) {
|
||||||
default:
|
default:
|
||||||
// appending linkage is illegal for functions.
|
// appending linkage is illegal for functions.
|
||||||
assert(0 && "Unknown linkage type!");
|
assert(0 && "Unknown linkage type!");
|
||||||
|
@ -159,7 +161,6 @@ bool MachOCodeEmitter::finishFunction(MachineFunction &F) {
|
||||||
// until the sections are all layed out, but we still need to
|
// until the sections are all layed out, but we still need to
|
||||||
// record them. Maybe emit TargetRelocations and then resolve
|
// record them. Maybe emit TargetRelocations and then resolve
|
||||||
// those at file writing time?
|
// those at file writing time?
|
||||||
std::cerr << "whee!\n";
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
Relocations.clear();
|
Relocations.clear();
|
||||||
|
@ -191,7 +192,7 @@ void MachOWriter::AddSymbolToSection(MachOSection &Sec, GlobalVariable *GV) {
|
||||||
unsigned Size = TM.getTargetData()->getTypeSize(Ty);
|
unsigned Size = TM.getTargetData()->getTypeSize(Ty);
|
||||||
unsigned Align = Log2_32(TM.getTargetData()->getTypeAlignment(Ty));
|
unsigned Align = Log2_32(TM.getTargetData()->getTypeAlignment(Ty));
|
||||||
|
|
||||||
MachOSym Sym(GV, Sec.Index);
|
MachOSym Sym(GV, Mang->getValueName(GV), Sec.Index);
|
||||||
// Reserve space in the .bss section for this symbol while maintaining the
|
// Reserve space in the .bss section for this symbol while maintaining the
|
||||||
// desired section alignment, which must be at least as much as required by
|
// desired section alignment, which must be at least as much as required by
|
||||||
// this symbol.
|
// this symbol.
|
||||||
|
@ -227,7 +228,8 @@ void MachOWriter::EmitGlobal(GlobalVariable *GV) {
|
||||||
// part of the common block if they are zero initialized and allowed to be
|
// part of the common block if they are zero initialized and allowed to be
|
||||||
// merged with other symbols.
|
// merged with other symbols.
|
||||||
if (NoInit || GV->hasLinkOnceLinkage() || GV->hasWeakLinkage()) {
|
if (NoInit || GV->hasLinkOnceLinkage() || GV->hasWeakLinkage()) {
|
||||||
MachOWriter::MachOSym ExtOrCommonSym(GV, MachOSym::NO_SECT);
|
MachOWriter::MachOSym ExtOrCommonSym(GV, Mang->getValueName(GV),
|
||||||
|
MachOSym::NO_SECT);
|
||||||
ExtOrCommonSym.n_type |= MachOSym::N_EXT;
|
ExtOrCommonSym.n_type |= MachOSym::N_EXT;
|
||||||
// For undefined (N_UNDF) external (N_EXT) types, n_value is the size in
|
// For undefined (N_UNDF) external (N_EXT) types, n_value is the size in
|
||||||
// bytes of the symbol.
|
// bytes of the symbol.
|
||||||
|
@ -279,12 +281,18 @@ bool MachOWriter::doInitialization(Module &M) {
|
||||||
/// doFinalization - Now that the module has been completely processed, emit
|
/// doFinalization - Now that the module has been completely processed, emit
|
||||||
/// the Mach-O file to 'O'.
|
/// the Mach-O file to 'O'.
|
||||||
bool MachOWriter::doFinalization(Module &M) {
|
bool MachOWriter::doFinalization(Module &M) {
|
||||||
|
// FIXME: we don't handle debug info yet, we should probably do that.
|
||||||
|
|
||||||
// Okay, the.text section has been completed, build the .data, .bss, and
|
// Okay, the.text section has been completed, build the .data, .bss, and
|
||||||
// "common" sections next.
|
// "common" sections next.
|
||||||
for (Module::global_iterator I = M.global_begin(), E = M.global_end();
|
for (Module::global_iterator I = M.global_begin(), E = M.global_end();
|
||||||
I != E; ++I)
|
I != E; ++I)
|
||||||
EmitGlobal(I);
|
EmitGlobal(I);
|
||||||
|
|
||||||
|
// Emit the symbol table to temporary buffers, so that we know the size of
|
||||||
|
// the string table when we write the load commands in the next phase.
|
||||||
|
BufferSymbolAndStringTable();
|
||||||
|
|
||||||
// Emit the header and load commands.
|
// Emit the header and load commands.
|
||||||
EmitHeaderAndLoadCommands();
|
EmitHeaderAndLoadCommands();
|
||||||
|
|
||||||
|
@ -296,12 +304,9 @@ bool MachOWriter::doFinalization(Module &M) {
|
||||||
// have different relocation types.
|
// have different relocation types.
|
||||||
EmitRelocations();
|
EmitRelocations();
|
||||||
|
|
||||||
// Emit the symbol table.
|
// Write the symbol table and the string table to the end of the file.
|
||||||
// FIXME: we don't handle debug info yet, we should probably do that.
|
O.write((char*)&SymT[0], SymT.size());
|
||||||
EmitSymbolTable();
|
O.write((char*)&StrT[0], StrT.size());
|
||||||
|
|
||||||
// Emit the string table for the sections we have.
|
|
||||||
EmitStringTable();
|
|
||||||
|
|
||||||
// We are done with the abstract symbols.
|
// We are done with the abstract symbols.
|
||||||
SectionList.clear();
|
SectionList.clear();
|
||||||
|
@ -383,16 +388,11 @@ void MachOWriter::EmitHeaderAndLoadCommands() {
|
||||||
}
|
}
|
||||||
|
|
||||||
// Step #6: Emit LC_SYMTAB/LC_DYSYMTAB load commands
|
// Step #6: Emit LC_SYMTAB/LC_DYSYMTAB load commands
|
||||||
// FIXME: We'll need to scan over the symbol table and possibly do the sort
|
|
||||||
// here so that we can set the proper indices in the dysymtab load command for
|
|
||||||
// the index and number of external symbols defined in this module.
|
|
||||||
// FIXME: We'll also need to scan over all the symbols so that we can
|
|
||||||
// calculate the size of the string table.
|
|
||||||
// FIXME: add size of relocs
|
// FIXME: add size of relocs
|
||||||
SymTab.symoff = SEG.fileoff + SEG.filesize;
|
SymTab.symoff = SEG.fileoff + SEG.filesize;
|
||||||
SymTab.nsyms = SymbolTable.size();
|
SymTab.nsyms = SymbolTable.size();
|
||||||
SymTab.stroff = SymTab.symoff + SymTab.nsyms * MachOSym::entrySize();
|
SymTab.stroff = SymTab.symoff + SymT.size();
|
||||||
SymTab.strsize = 10;
|
SymTab.strsize = StrT.size();
|
||||||
outword(FH, SymTab.cmd);
|
outword(FH, SymTab.cmd);
|
||||||
outword(FH, SymTab.cmdsize);
|
outword(FH, SymTab.cmdsize);
|
||||||
outword(FH, SymTab.symoff);
|
outword(FH, SymTab.symoff);
|
||||||
|
@ -401,6 +401,8 @@ void MachOWriter::EmitHeaderAndLoadCommands() {
|
||||||
outword(FH, SymTab.strsize);
|
outword(FH, SymTab.strsize);
|
||||||
|
|
||||||
// FIXME: set DySymTab fields appropriately
|
// FIXME: set DySymTab fields appropriately
|
||||||
|
// We should probably just update these in BufferSymbolAndStringTable since
|
||||||
|
// thats where we're partitioning up the different kinds of symbols.
|
||||||
outword(FH, DySymTab.cmd);
|
outword(FH, DySymTab.cmd);
|
||||||
outword(FH, DySymTab.cmdsize);
|
outword(FH, DySymTab.cmdsize);
|
||||||
outword(FH, DySymTab.ilocalsym);
|
outword(FH, DySymTab.ilocalsym);
|
||||||
|
@ -440,54 +442,74 @@ void MachOWriter::EmitRelocations() {
|
||||||
// specific.
|
// specific.
|
||||||
}
|
}
|
||||||
|
|
||||||
/// EmitSymbolTable - Sort the symbols we encountered and assign them each a
|
/// PartitionByLocal - Simple boolean predicate that returns true if Sym is
|
||||||
/// string table index so that they appear in the correct order in the output
|
/// a local symbol rather than an external symbol.
|
||||||
/// file.
|
bool MachOWriter::PartitionByLocal(const MachOSym &Sym) {
|
||||||
void MachOWriter::EmitSymbolTable() {
|
// FIXME: Not totally sure if private extern counts as external
|
||||||
// The order of the symbol table is:
|
return (Sym.n_type & (MachOSym::N_EXT | MachOSym::N_PEXT)) == 0;
|
||||||
// local symbols
|
}
|
||||||
// defined external symbols (sorted by name)
|
|
||||||
// undefined external symbols (sorted by name)
|
|
||||||
DataBuffer ST;
|
|
||||||
|
|
||||||
// FIXME: enforce the above ordering, presumably by sorting by name,
|
/// PartitionByDefined - Simple boolean predicate that returns true if Sym is
|
||||||
// then partitioning twice.
|
/// defined in this module.
|
||||||
unsigned stringIndex;
|
bool MachOWriter::PartitionByDefined(const MachOSym &Sym) {
|
||||||
|
// FIXME: Do N_ABS or N_INDR count as defined?
|
||||||
|
return (Sym.n_type & MachOSym::N_SECT) == MachOSym::N_SECT;
|
||||||
|
}
|
||||||
|
|
||||||
|
/// BufferSymbolAndStringTable - Sort the symbols we encountered and assign them
|
||||||
|
/// each a string table index so that they appear in the correct order in the
|
||||||
|
/// output file.
|
||||||
|
void MachOWriter::BufferSymbolAndStringTable() {
|
||||||
|
// The order of the symbol table is:
|
||||||
|
// 1. local symbols
|
||||||
|
// 2. defined external symbols (sorted by name)
|
||||||
|
// 3. undefined external symbols (sorted by name)
|
||||||
|
|
||||||
|
// Sort the symbols by name, so that when we partition the symbols by scope
|
||||||
|
// of definition, we won't have to sort by name within each partition.
|
||||||
|
std::sort(SymbolTable.begin(), SymbolTable.end(), MachOSymCmp());
|
||||||
|
|
||||||
|
// Parition the symbol table entries so that all local symbols come before
|
||||||
|
// all symbols with external linkage. { 1 | 2 3 }
|
||||||
|
std::partition(SymbolTable.begin(), SymbolTable.end(), PartitionByLocal);
|
||||||
|
|
||||||
|
// Advance iterator to beginning of external symbols and partition so that
|
||||||
|
// all external symbols defined in this module come before all external
|
||||||
|
// symbols defined elsewhere. { 1 | 2 | 3 }
|
||||||
for (std::vector<MachOSym>::iterator I = SymbolTable.begin(),
|
for (std::vector<MachOSym>::iterator I = SymbolTable.begin(),
|
||||||
E = SymbolTable.end(); I != E; ++I) {
|
E = SymbolTable.end(); I != E; ++I) {
|
||||||
// FIXME: remove when we actually calculate these correctly
|
if (!PartitionByLocal(*I)) {
|
||||||
I->n_strx = 1;
|
std::partition(I, E, PartitionByDefined);
|
||||||
StringTable.push_back(Mang->getValueName(I->GV));
|
break;
|
||||||
// Emit nlist to buffer
|
|
||||||
outword(ST, I->n_strx);
|
|
||||||
outbyte(ST, I->n_type);
|
|
||||||
outbyte(ST, I->n_sect);
|
|
||||||
outhalf(ST, I->n_desc);
|
|
||||||
outaddr(ST, I->n_value);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
O.write((char*)&ST[0], ST.size());
|
|
||||||
}
|
}
|
||||||
|
|
||||||
/// EmitStringTable - This method adds and emits a section for the Mach-O
|
|
||||||
/// string table.
|
|
||||||
void MachOWriter::EmitStringTable() {
|
|
||||||
// The order of the string table is:
|
|
||||||
// strings for external symbols
|
|
||||||
// strings for local symbols
|
|
||||||
// This is the symbol table, but backwards. This allows us to avoid a sorting
|
|
||||||
// the symbol table again; all we have to do is use a reverse iterator.
|
|
||||||
DataBuffer ST;
|
|
||||||
|
|
||||||
// Write out a leading zero byte when emitting string table, for n_strx == 0
|
// Write out a leading zero byte when emitting string table, for n_strx == 0
|
||||||
// which means an empty string.
|
// which means an empty string.
|
||||||
outbyte(ST, 0);
|
outbyte(StrT, 0);
|
||||||
|
|
||||||
for (std::vector<std::string>::iterator I = StringTable.begin(),
|
// The order of the string table is:
|
||||||
E = StringTable.end(); I != E; ++I) {
|
// 1. strings for external symbols
|
||||||
// FIXME: do not arbitrarily cap symbols to 16 characters
|
// 2. strings for local symbols
|
||||||
// FIXME: do something more efficient than outstring
|
// Since this is the opposite order from the symbol table, which we have just
|
||||||
outstring(ST, *I, 16);
|
// sorted, we can walk the symbol table backwards to output the string table.
|
||||||
|
for (std::vector<MachOSym>::reverse_iterator I = SymbolTable.rbegin(),
|
||||||
|
E = SymbolTable.rend(); I != E; ++I) {
|
||||||
|
if (I->GVName == "") {
|
||||||
|
I->n_strx = 0;
|
||||||
|
} else {
|
||||||
|
I->n_strx = StrT.size();
|
||||||
|
outstring(StrT, I->GVName, I->GVName.length()+1);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
for (std::vector<MachOSym>::iterator I = SymbolTable.begin(),
|
||||||
|
E = SymbolTable.end(); I != E; ++I) {
|
||||||
|
// Emit nlist to buffer
|
||||||
|
outword(SymT, I->n_strx);
|
||||||
|
outbyte(SymT, I->n_type);
|
||||||
|
outbyte(SymT, I->n_sect);
|
||||||
|
outhalf(SymT, I->n_desc);
|
||||||
|
outaddr(SymT, I->n_value);
|
||||||
}
|
}
|
||||||
O.write((char*)&ST[0], ST.size());
|
|
||||||
}
|
}
|
||||||
|
|
Loading…
Reference in New Issue