2020-04-03 02:54:05 +08:00
|
|
|
//===- Writer.cpp ---------------------------------------------------------===//
|
|
|
|
//
|
|
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
#include "Writer.h"
|
|
|
|
#include "Config.h"
|
|
|
|
#include "InputFiles.h"
|
|
|
|
#include "InputSection.h"
|
|
|
|
#include "OutputSegment.h"
|
|
|
|
#include "SymbolTable.h"
|
|
|
|
#include "Symbols.h"
|
2020-04-22 04:37:57 +08:00
|
|
|
#include "SyntheticSections.h"
|
2020-04-03 02:54:05 +08:00
|
|
|
#include "Target.h"
|
|
|
|
|
|
|
|
#include "lld/Common/ErrorHandler.h"
|
|
|
|
#include "lld/Common/Memory.h"
|
|
|
|
#include "llvm/BinaryFormat/MachO.h"
|
2020-04-22 04:37:57 +08:00
|
|
|
#include "llvm/Support/EndianStream.h"
|
2020-04-03 02:54:05 +08:00
|
|
|
#include "llvm/Support/LEB128.h"
|
|
|
|
#include "llvm/Support/MathExtras.h"
|
|
|
|
|
|
|
|
using namespace llvm;
|
|
|
|
using namespace llvm::MachO;
|
|
|
|
using namespace llvm::support;
|
|
|
|
using namespace lld;
|
|
|
|
using namespace lld::macho;
|
|
|
|
|
|
|
|
namespace {
|
|
|
|
class LCLinkEdit;
|
|
|
|
class LCDyldInfo;
|
|
|
|
class LCSymtab;
|
|
|
|
|
|
|
|
// Abstract interface shared by every Mach-O load command that the writer
// emits. Concrete commands report how many bytes they need and serialize
// themselves into a caller-provided buffer.
class LoadCommand {
public:
  virtual ~LoadCommand() = default;

  // Number of bytes this command occupies once serialized.
  virtual uint32_t getSize() const = 0;

  // Serializes the command starting at `buf`.
  virtual void writeTo(uint8_t *buf) const = 0;
};
|
|
|
|
|
|
|
|
class Writer {
|
|
|
|
public:
|
|
|
|
Writer() : buffer(errorHandler().outputBuffer) {}
|
|
|
|
|
|
|
|
void createLoadCommands();
|
2020-04-22 04:37:57 +08:00
|
|
|
void scanRelocations();
|
2020-04-03 02:54:05 +08:00
|
|
|
void assignAddresses();
|
|
|
|
|
2020-04-22 04:37:57 +08:00
|
|
|
void createDyldInfoContents();
|
|
|
|
|
2020-04-03 02:54:05 +08:00
|
|
|
void openFile();
|
|
|
|
void writeHeader();
|
|
|
|
void writeSections();
|
|
|
|
|
|
|
|
void run();
|
|
|
|
|
|
|
|
std::vector<LoadCommand *> loadCommands;
|
|
|
|
std::unique_ptr<FileOutputBuffer> &buffer;
|
|
|
|
uint64_t fileSize = 0;
|
|
|
|
uint64_t sizeofCmds = 0;
|
|
|
|
LCLinkEdit *linkEditSeg = nullptr;
|
|
|
|
LCDyldInfo *dyldInfoSeg = nullptr;
|
|
|
|
LCSymtab *symtabSeg = nullptr;
|
|
|
|
};
|
|
|
|
|
|
|
|
class LCPagezero : public LoadCommand {
|
|
|
|
public:
|
|
|
|
uint32_t getSize() const override { return sizeof(segment_command_64); }
|
|
|
|
|
|
|
|
void writeTo(uint8_t *buf) const override {
|
|
|
|
auto *c = reinterpret_cast<segment_command_64 *>(buf);
|
|
|
|
c->cmd = LC_SEGMENT_64;
|
|
|
|
c->cmdsize = getSize();
|
|
|
|
strcpy(c->segname, "__PAGEZERO");
|
|
|
|
c->vmsize = PageSize;
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
class LCLinkEdit : public LoadCommand {
|
|
|
|
public:
|
|
|
|
uint32_t getSize() const override { return sizeof(segment_command_64); }
|
|
|
|
|
|
|
|
void writeTo(uint8_t *buf) const override {
|
|
|
|
auto *c = reinterpret_cast<segment_command_64 *>(buf);
|
|
|
|
c->cmd = LC_SEGMENT_64;
|
|
|
|
c->cmdsize = getSize();
|
|
|
|
strcpy(c->segname, "__LINKEDIT");
|
2020-04-22 04:37:57 +08:00
|
|
|
c->vmaddr = addr;
|
2020-04-03 02:54:05 +08:00
|
|
|
c->fileoff = fileOff;
|
2020-04-22 04:37:57 +08:00
|
|
|
c->filesize = c->vmsize = contents.size();
|
2020-04-03 02:54:05 +08:00
|
|
|
c->maxprot = VM_PROT_READ | VM_PROT_WRITE;
|
|
|
|
c->initprot = VM_PROT_READ;
|
|
|
|
}
|
|
|
|
|
|
|
|
uint64_t getOffset() const { return fileOff + contents.size(); }
|
|
|
|
|
|
|
|
uint64_t fileOff = 0;
|
2020-04-22 04:37:57 +08:00
|
|
|
uint64_t addr = 0;
|
2020-04-03 02:54:05 +08:00
|
|
|
SmallVector<char, 128> contents;
|
|
|
|
};
|
|
|
|
|
|
|
|
class LCDyldInfo : public LoadCommand {
|
|
|
|
public:
|
|
|
|
uint32_t getSize() const override { return sizeof(dyld_info_command); }
|
|
|
|
|
|
|
|
void writeTo(uint8_t *buf) const override {
|
|
|
|
auto *c = reinterpret_cast<dyld_info_command *>(buf);
|
|
|
|
c->cmd = LC_DYLD_INFO_ONLY;
|
|
|
|
c->cmdsize = getSize();
|
2020-04-22 04:37:57 +08:00
|
|
|
c->bind_off = bindOff;
|
|
|
|
c->bind_size = bindSize;
|
2020-04-03 02:54:05 +08:00
|
|
|
c->export_off = exportOff;
|
|
|
|
c->export_size = exportSize;
|
|
|
|
}
|
|
|
|
|
2020-04-22 04:37:57 +08:00
|
|
|
uint64_t bindOff = 0;
|
|
|
|
uint64_t bindSize = 0;
|
2020-04-03 02:54:05 +08:00
|
|
|
uint64_t exportOff = 0;
|
|
|
|
uint64_t exportSize = 0;
|
|
|
|
};
|
|
|
|
|
|
|
|
class LCDysymtab : public LoadCommand {
|
|
|
|
public:
|
|
|
|
uint32_t getSize() const override { return sizeof(dysymtab_command); }
|
|
|
|
|
|
|
|
void writeTo(uint8_t *buf) const override {
|
|
|
|
auto *c = reinterpret_cast<dysymtab_command *>(buf);
|
|
|
|
c->cmd = LC_DYSYMTAB;
|
|
|
|
c->cmdsize = getSize();
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
class LCSegment : public LoadCommand {
|
|
|
|
public:
|
|
|
|
LCSegment(StringRef name, OutputSegment *seg) : name(name), seg(seg) {}
|
|
|
|
|
|
|
|
uint32_t getSize() const override {
|
|
|
|
return sizeof(segment_command_64) +
|
|
|
|
seg->sections.size() * sizeof(section_64);
|
|
|
|
}
|
|
|
|
|
|
|
|
void writeTo(uint8_t *buf) const override {
|
|
|
|
auto *c = reinterpret_cast<segment_command_64 *>(buf);
|
|
|
|
buf += sizeof(segment_command_64);
|
|
|
|
|
|
|
|
c->cmd = LC_SEGMENT_64;
|
|
|
|
c->cmdsize = getSize();
|
|
|
|
memcpy(c->segname, name.data(), name.size());
|
|
|
|
|
|
|
|
// dyld3's MachOLoaded::getSlide() assumes that the __TEXT segment starts
|
|
|
|
// from the beginning of the file (i.e. the header).
|
|
|
|
// TODO: replace this logic by creating a synthetic __TEXT,__mach_header
|
|
|
|
// section instead.
|
2020-04-22 04:37:57 +08:00
|
|
|
c->fileoff = name == "__TEXT" ? 0 : seg->firstSection()->addr - ImageBase;
|
2020-04-03 02:54:05 +08:00
|
|
|
c->vmaddr = c->fileoff + ImageBase;
|
2020-04-22 04:37:57 +08:00
|
|
|
c->vmsize = c->filesize =
|
|
|
|
seg->lastSection()->addr + seg->lastSection()->getSize() - c->vmaddr;
|
2020-04-03 02:54:05 +08:00
|
|
|
c->maxprot = VM_PROT_READ | VM_PROT_WRITE | VM_PROT_EXECUTE;
|
|
|
|
c->initprot = seg->perms;
|
|
|
|
c->nsects = seg->sections.size();
|
|
|
|
|
|
|
|
for (auto &p : seg->sections) {
|
|
|
|
StringRef s = p.first;
|
|
|
|
std::vector<InputSection *> §ions = p.second;
|
|
|
|
|
|
|
|
auto *sectHdr = reinterpret_cast<section_64 *>(buf);
|
|
|
|
buf += sizeof(section_64);
|
|
|
|
|
|
|
|
memcpy(sectHdr->sectname, s.data(), s.size());
|
|
|
|
memcpy(sectHdr->segname, name.data(), name.size());
|
|
|
|
|
|
|
|
sectHdr->addr = sections[0]->addr;
|
|
|
|
sectHdr->offset = sections[0]->addr - ImageBase;
|
|
|
|
sectHdr->align = sections[0]->align;
|
|
|
|
uint32_t maxAlign = 0;
|
|
|
|
for (const InputSection *section : sections)
|
|
|
|
maxAlign = std::max(maxAlign, section->align);
|
|
|
|
sectHdr->align = Log2_32(maxAlign);
|
|
|
|
sectHdr->flags = sections[0]->flags;
|
2020-04-22 04:37:57 +08:00
|
|
|
sectHdr->size = sections.back()->addr + sections.back()->getSize() -
|
2020-04-03 02:54:05 +08:00
|
|
|
sections[0]->addr;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
private:
|
|
|
|
StringRef name;
|
|
|
|
OutputSegment *seg;
|
|
|
|
};
|
|
|
|
|
|
|
|
class LCMain : public LoadCommand {
|
|
|
|
uint32_t getSize() const override { return sizeof(entry_point_command); }
|
|
|
|
|
|
|
|
void writeTo(uint8_t *buf) const override {
|
|
|
|
auto *c = reinterpret_cast<entry_point_command *>(buf);
|
|
|
|
c->cmd = LC_MAIN;
|
|
|
|
c->cmdsize = getSize();
|
|
|
|
c->entryoff = config->entry->getVA();
|
|
|
|
c->stacksize = 0;
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
class LCSymtab : public LoadCommand {
|
|
|
|
public:
|
|
|
|
uint32_t getSize() const override { return sizeof(symtab_command); }
|
|
|
|
|
|
|
|
void writeTo(uint8_t *buf) const override {
|
|
|
|
auto *c = reinterpret_cast<symtab_command *>(buf);
|
|
|
|
c->cmd = LC_SYMTAB;
|
|
|
|
c->cmdsize = getSize();
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
class LCLoadDylib : public LoadCommand {
|
|
|
|
public:
|
|
|
|
LCLoadDylib(StringRef path) : path(path) {}
|
|
|
|
|
|
|
|
uint32_t getSize() const override {
|
|
|
|
return alignTo(sizeof(dylib_command) + path.size() + 1, 8);
|
|
|
|
}
|
|
|
|
|
|
|
|
void writeTo(uint8_t *buf) const override {
|
|
|
|
auto *c = reinterpret_cast<dylib_command *>(buf);
|
|
|
|
buf += sizeof(dylib_command);
|
|
|
|
|
|
|
|
c->cmd = LC_LOAD_DYLIB;
|
|
|
|
c->cmdsize = getSize();
|
|
|
|
c->dylib.name = sizeof(dylib_command);
|
|
|
|
|
|
|
|
memcpy(buf, path.data(), path.size());
|
|
|
|
buf[path.size()] = '\0';
|
|
|
|
}
|
|
|
|
|
|
|
|
private:
|
|
|
|
StringRef path;
|
|
|
|
};
|
|
|
|
|
|
|
|
class LCLoadDylinker : public LoadCommand {
|
|
|
|
public:
|
|
|
|
uint32_t getSize() const override {
|
|
|
|
return alignTo(sizeof(dylinker_command) + path.size() + 1, 8);
|
|
|
|
}
|
|
|
|
|
|
|
|
void writeTo(uint8_t *buf) const override {
|
|
|
|
auto *c = reinterpret_cast<dylinker_command *>(buf);
|
|
|
|
buf += sizeof(dylinker_command);
|
|
|
|
|
|
|
|
c->cmd = LC_LOAD_DYLINKER;
|
|
|
|
c->cmdsize = getSize();
|
|
|
|
c->name = sizeof(dylinker_command);
|
|
|
|
|
|
|
|
memcpy(buf, path.data(), path.size());
|
|
|
|
buf[path.size()] = '\0';
|
|
|
|
}
|
|
|
|
|
|
|
|
private:
|
|
|
|
// Recent versions of Darwin won't run any binary that has dyld at a
|
|
|
|
// different location.
|
|
|
|
const StringRef path = "/usr/lib/dyld";
|
|
|
|
};
|
|
|
|
} // namespace
|
|
|
|
|
|
|
|
void Writer::createLoadCommands() {
|
|
|
|
linkEditSeg = make<LCLinkEdit>();
|
|
|
|
dyldInfoSeg = make<LCDyldInfo>();
|
|
|
|
symtabSeg = make<LCSymtab>();
|
|
|
|
|
|
|
|
loadCommands.push_back(linkEditSeg);
|
|
|
|
loadCommands.push_back(dyldInfoSeg);
|
|
|
|
loadCommands.push_back(symtabSeg);
|
|
|
|
loadCommands.push_back(make<LCPagezero>());
|
|
|
|
loadCommands.push_back(make<LCLoadDylinker>());
|
|
|
|
loadCommands.push_back(make<LCDysymtab>());
|
|
|
|
loadCommands.push_back(make<LCMain>());
|
2020-04-22 04:37:57 +08:00
|
|
|
|
|
|
|
uint8_t segIndex = 1; // LCPagezero is a segment load command
|
|
|
|
for (OutputSegment *seg : outputSegments) {
|
|
|
|
if (!seg->sections.empty()) {
|
|
|
|
loadCommands.push_back(make<LCSegment>(seg->name, seg));
|
|
|
|
seg->index = segIndex++;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
uint64_t dylibOrdinal = 1;
|
|
|
|
for (InputFile *file : inputFiles) {
|
|
|
|
if (auto *dylibFile = dyn_cast<DylibFile>(file)) {
|
|
|
|
loadCommands.push_back(make<LCLoadDylib>(dylibFile->dylibName));
|
|
|
|
dylibFile->ordinal = dylibOrdinal++;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-04-03 02:54:05 +08:00
|
|
|
// TODO: dyld requires libSystem to be loaded. libSystem is a universal
|
|
|
|
// binary and we don't have support for that yet, so mock it out here.
|
|
|
|
loadCommands.push_back(make<LCLoadDylib>("/usr/lib/libSystem.B.dylib"));
|
2020-04-22 04:37:57 +08:00
|
|
|
}
|
2020-04-03 02:54:05 +08:00
|
|
|
|
2020-04-22 04:37:57 +08:00
|
|
|
void Writer::scanRelocations() {
|
|
|
|
for (InputSection *sect : inputSections)
|
|
|
|
for (Reloc &r : sect->relocs)
|
|
|
|
if (auto *s = r.target.dyn_cast<Symbol *>())
|
|
|
|
if (auto *dylibSymbol = dyn_cast<DylibSymbol>(s))
|
|
|
|
in.got->addEntry(*dylibSymbol);
|
2020-04-03 02:54:05 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
void Writer::assignAddresses() {
|
|
|
|
uint64_t addr = ImageBase + sizeof(mach_header_64);
|
|
|
|
|
|
|
|
uint64_t size = 0;
|
|
|
|
for (LoadCommand *lc : loadCommands)
|
|
|
|
size += lc->getSize();
|
|
|
|
sizeofCmds = size;
|
|
|
|
addr += size;
|
|
|
|
|
|
|
|
for (OutputSegment *seg : outputSegments) {
|
|
|
|
addr = alignTo(addr, PageSize);
|
|
|
|
|
|
|
|
for (auto &p : seg->sections) {
|
|
|
|
ArrayRef<InputSection *> sections = p.second;
|
|
|
|
for (InputSection *isec : sections) {
|
|
|
|
addr = alignTo(addr, isec->align);
|
|
|
|
isec->addr = addr;
|
2020-04-22 04:37:57 +08:00
|
|
|
addr += isec->getSize();
|
2020-04-03 02:54:05 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-04-22 04:37:57 +08:00
|
|
|
addr = alignTo(addr, PageSize);
|
|
|
|
linkEditSeg->addr = addr;
|
2020-04-03 02:54:05 +08:00
|
|
|
linkEditSeg->fileOff = addr - ImageBase;
|
|
|
|
}
|
|
|
|
|
2020-04-22 04:37:57 +08:00
|
|
|
// LC_DYLD_INFO_ONLY contains symbol import/export information. Imported
|
|
|
|
// symbols are described by a sequence of bind opcodes, which allow for a
|
|
|
|
// compact encoding. Exported symbols are described using a trie.
|
|
|
|
void Writer::createDyldInfoContents() {
|
|
|
|
uint64_t sectionStart = linkEditSeg->getOffset();
|
|
|
|
raw_svector_ostream os{linkEditSeg->contents};
|
|
|
|
|
|
|
|
if (in.got->getSize() != 0) {
|
|
|
|
// Emit bind opcodes, which tell dyld which dylib symbols to load.
|
|
|
|
|
|
|
|
// Tell dyld to write to the section containing the GOT.
|
|
|
|
os << static_cast<uint8_t>(BIND_OPCODE_SET_SEGMENT_AND_OFFSET_ULEB |
|
|
|
|
in.got->parent->index);
|
|
|
|
encodeULEB128(in.got->addr - in.got->parent->firstSection()->addr, os);
|
|
|
|
for (const DylibSymbol *sym : in.got->getEntries()) {
|
|
|
|
// TODO: Implement compact encoding -- we only need to encode the
|
|
|
|
// differences between consecutive symbol entries.
|
|
|
|
if (sym->file->ordinal <= BIND_IMMEDIATE_MASK) {
|
|
|
|
os << static_cast<uint8_t>(BIND_OPCODE_SET_DYLIB_ORDINAL_IMM |
|
|
|
|
sym->file->ordinal);
|
|
|
|
} else {
|
|
|
|
error("TODO: Support larger dylib symbol ordinals");
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
os << static_cast<uint8_t>(BIND_OPCODE_SET_SYMBOL_TRAILING_FLAGS_IMM)
|
|
|
|
<< sym->getName() << '\0'
|
|
|
|
<< static_cast<uint8_t>(BIND_OPCODE_SET_TYPE_IMM | BIND_TYPE_POINTER)
|
|
|
|
<< static_cast<uint8_t>(BIND_OPCODE_DO_BIND);
|
|
|
|
}
|
|
|
|
|
|
|
|
os << static_cast<uint8_t>(BIND_OPCODE_DONE);
|
|
|
|
|
|
|
|
dyldInfoSeg->bindOff = sectionStart;
|
|
|
|
dyldInfoSeg->bindSize = linkEditSeg->getOffset() - sectionStart;
|
|
|
|
}
|
|
|
|
|
|
|
|
// TODO: emit bind opcodes for lazy symbols.
|
|
|
|
// TODO: Implement symbol export trie.
|
|
|
|
}
|
|
|
|
|
2020-04-03 02:54:05 +08:00
|
|
|
void Writer::openFile() {
|
|
|
|
Expected<std::unique_ptr<FileOutputBuffer>> bufferOrErr =
|
|
|
|
FileOutputBuffer::create(config->outputFile, fileSize,
|
|
|
|
FileOutputBuffer::F_executable);
|
|
|
|
|
|
|
|
if (!bufferOrErr)
|
|
|
|
error("failed to open " + config->outputFile + ": " +
|
|
|
|
llvm::toString(bufferOrErr.takeError()));
|
|
|
|
else
|
|
|
|
buffer = std::move(*bufferOrErr);
|
|
|
|
}
|
|
|
|
|
|
|
|
void Writer::writeHeader() {
|
|
|
|
auto *hdr = reinterpret_cast<mach_header_64 *>(buffer->getBufferStart());
|
|
|
|
hdr->magic = MH_MAGIC_64;
|
|
|
|
hdr->cputype = CPU_TYPE_X86_64;
|
|
|
|
hdr->cpusubtype = CPU_SUBTYPE_X86_64_ALL | CPU_SUBTYPE_LIB64;
|
|
|
|
hdr->filetype = MH_EXECUTE;
|
|
|
|
hdr->ncmds = loadCommands.size();
|
|
|
|
hdr->sizeofcmds = sizeofCmds;
|
|
|
|
hdr->flags = MH_NOUNDEFS | MH_DYLDLINK | MH_TWOLEVEL;
|
|
|
|
|
|
|
|
uint8_t *p = reinterpret_cast<uint8_t *>(hdr + 1);
|
|
|
|
for (LoadCommand *lc : loadCommands) {
|
|
|
|
lc->writeTo(p);
|
|
|
|
p += lc->getSize();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
void Writer::writeSections() {
|
|
|
|
uint8_t *buf = buffer->getBufferStart();
|
|
|
|
|
|
|
|
for (OutputSegment *seg : outputSegments)
|
|
|
|
for (auto § : seg->sections)
|
|
|
|
for (InputSection *isec : sect.second)
|
|
|
|
isec->writeTo(buf + isec->addr - ImageBase);
|
|
|
|
|
|
|
|
memcpy(buf + linkEditSeg->fileOff, linkEditSeg->contents.data(),
|
|
|
|
linkEditSeg->contents.size());
|
|
|
|
}
|
|
|
|
|
|
|
|
void Writer::run() {
|
|
|
|
createLoadCommands();
|
2020-04-22 04:37:57 +08:00
|
|
|
scanRelocations();
|
2020-04-03 02:54:05 +08:00
|
|
|
assignAddresses();
|
2020-04-22 04:37:57 +08:00
|
|
|
|
|
|
|
// Fill __LINKEDIT contents
|
|
|
|
createDyldInfoContents();
|
2020-04-03 02:54:05 +08:00
|
|
|
fileSize = linkEditSeg->fileOff + linkEditSeg->contents.size();
|
|
|
|
|
|
|
|
openFile();
|
|
|
|
if (errorCount())
|
|
|
|
return;
|
|
|
|
|
|
|
|
writeHeader();
|
|
|
|
writeSections();
|
|
|
|
|
|
|
|
if (auto e = buffer->commit())
|
|
|
|
error("failed to write to the output file: " + toString(std::move(e)));
|
|
|
|
}
|
|
|
|
|
|
|
|
void macho::writeResult() { Writer().run(); }
|
2020-04-22 04:37:57 +08:00
|
|
|
|
|
|
|
// Creates the linker-synthesized GOT section and registers it alongside the
// regular input sections.
void macho::createSyntheticSections() {
  auto *got = make<GotSection>();
  in.got = got;
  inputSections.push_back(got);
}
|