2020-04-03 02:54:05 +08:00
|
|
|
//===- InputFiles.h ---------------------------------------------*- C++ -*-===//
|
|
|
|
//
|
|
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
#ifndef LLD_MACHO_INPUT_FILES_H
|
|
|
|
#define LLD_MACHO_INPUT_FILES_H
|
|
|
|
|
2020-05-22 06:26:35 +08:00
|
|
|
#include "MachOStructs.h"
|
|
|
|
|
2020-04-03 02:54:05 +08:00
|
|
|
#include "lld/Common/LLVM.h"
|
2020-08-19 06:46:21 +08:00
|
|
|
#include "lld/Common/Memory.h"
|
2020-04-03 02:54:05 +08:00
|
|
|
#include "llvm/ADT/DenseSet.h"
|
|
|
|
#include "llvm/BinaryFormat/MachO.h"
|
|
|
|
#include "llvm/Object/Archive.h"
|
|
|
|
#include "llvm/Support/MemoryBuffer.h"
|
2020-06-06 02:18:33 +08:00
|
|
|
#include "llvm/TextAPI/MachO/InterfaceFile.h"
|
|
|
|
#include "llvm/TextAPI/MachO/TextAPIReader.h"
|
[lld-macho][re-land] Support .subsections_via_symbols
Summary:
This diff restores and builds upon @pcc and @ruiu's initial work on
subsections.
The .subsections_via_symbols directive indicates we can split each
section along symbol boundaries, unless those symbols have been marked
with `.alt_entry`.
We exercise this functionality in our tests by using order files that
rearrange those symbols.
Depends on D79668.
Reviewers: ruiu, pcc, MaskRay, smeenai, alexshap, gkm, Ktwu, christylee
Reviewed By: smeenai
Subscribers: thakis, llvm-commits, pcc, ruiu
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D79926
2020-05-19 23:46:07 +08:00
|
|
|
|
|
|
|
#include <map>
|
2020-04-03 02:54:05 +08:00
|
|
|
#include <vector>
|
|
|
|
|
|
|
|
namespace lld {
|
|
|
|
namespace macho {
|
|
|
|
|
|
|
|
class InputSection;
|
|
|
|
class Symbol;
|
|
|
|
struct Reloc;
|
|
|
|
|
[lld-macho][re-land] Support .subsections_via_symbols
Summary:
This diff restores and builds upon @pcc and @ruiu's initial work on
subsections.
The .subsections_via_symbols directive indicates we can split each
section along symbol boundaries, unless those symbols have been marked
with `.alt_entry`.
We exercise this functionality in our tests by using order files that
rearrange those symbols.
Depends on D79668.
Reviewers: ruiu, pcc, MaskRay, smeenai, alexshap, gkm, Ktwu, christylee
Reviewed By: smeenai
Subscribers: thakis, llvm-commits, pcc, ruiu
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D79926
2020-05-19 23:46:07 +08:00
|
|
|
// If .subsections_via_symbols is set, each InputSection will be split along
|
|
|
|
// symbol boundaries. The keys of a SubsectionMap represent the offsets of
|
|
|
|
// each subsection from the start of the original pre-split InputSection.
|
|
|
|
using SubsectionMap = std::map<uint32_t, InputSection *>;
|
|
|
|
|
2020-04-03 02:54:05 +08:00
|
|
|
class InputFile {
|
|
|
|
public:
|
|
|
|
enum Kind {
|
|
|
|
ObjKind,
|
2020-04-22 04:37:57 +08:00
|
|
|
DylibKind,
|
2020-05-15 03:43:51 +08:00
|
|
|
ArchiveKind,
|
2020-08-11 09:47:13 +08:00
|
|
|
OpaqueKind,
|
2020-04-03 02:54:05 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
virtual ~InputFile() = default;
|
|
|
|
Kind kind() const { return fileKind; }
|
2020-08-19 06:46:21 +08:00
|
|
|
StringRef getName() const { return name; }
|
2020-04-03 02:54:05 +08:00
|
|
|
|
|
|
|
MemoryBufferRef mb;
|
|
|
|
std::vector<Symbol *> symbols;
|
[lld-macho][re-land] Support .subsections_via_symbols
Summary:
This diff restores and builds upon @pcc and @ruiu's initial work on
subsections.
The .subsections_via_symbols directive indicates we can split each
section along symbol boundaries, unless those symbols have been marked
with `.alt_entry`.
We exercise this functionality in our tests by using order files that
rearrange those symbols.
Depends on D79668.
Reviewers: ruiu, pcc, MaskRay, smeenai, alexshap, gkm, Ktwu, christylee
Reviewed By: smeenai
Subscribers: thakis, llvm-commits, pcc, ruiu
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D79926
2020-05-19 23:46:07 +08:00
|
|
|
ArrayRef<llvm::MachO::section_64> sectionHeaders;
|
|
|
|
std::vector<SubsectionMap> subsections;
|
2020-04-03 02:54:05 +08:00
|
|
|
|
|
|
|
protected:
|
2020-08-19 06:46:21 +08:00
|
|
|
InputFile(Kind kind, MemoryBufferRef mb)
|
|
|
|
: mb(mb), fileKind(kind), name(mb.getBufferIdentifier()) {}
|
|
|
|
|
|
|
|
InputFile(Kind kind, const llvm::MachO::InterfaceFile &interface)
|
|
|
|
: fileKind(kind), name(saver.save(interface.getPath())) {}
|
2020-04-03 02:54:05 +08:00
|
|
|
|
[lld-macho][re-land] Support .subsections_via_symbols
Summary:
This diff restores and builds upon @pcc and @ruiu's initial work on
subsections.
The .subsections_via_symbols directive indicates we can split each
section along symbol boundaries, unless those symbols have been marked
with `.alt_entry`.
We exercise this functionality in our tests by using order files that
rearrange those symbols.
Depends on D79668.
Reviewers: ruiu, pcc, MaskRay, smeenai, alexshap, gkm, Ktwu, christylee
Reviewed By: smeenai
Subscribers: thakis, llvm-commits, pcc, ruiu
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D79926
2020-05-19 23:46:07 +08:00
|
|
|
void parseSections(ArrayRef<llvm::MachO::section_64>);
|
|
|
|
|
2020-05-22 06:26:35 +08:00
|
|
|
void parseSymbols(ArrayRef<lld::structs::nlist_64> nList, const char *strtab,
|
[lld-macho][re-land] Support .subsections_via_symbols
Summary:
This diff restores and builds upon @pcc and @ruiu's initial work on
subsections.
The .subsections_via_symbols directive indicates we can split each
section along symbol boundaries, unless those symbols have been marked
with `.alt_entry`.
We exercise this functionality in our tests by using order files that
rearrange those symbols.
Depends on D79668.
Reviewers: ruiu, pcc, MaskRay, smeenai, alexshap, gkm, Ktwu, christylee
Reviewed By: smeenai
Subscribers: thakis, llvm-commits, pcc, ruiu
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D79926
2020-05-19 23:46:07 +08:00
|
|
|
bool subsectionsViaSymbols);
|
2020-04-03 02:54:05 +08:00
|
|
|
|
[lld-macho][re-land] Support .subsections_via_symbols
Summary:
This diff restores and builds upon @pcc and @ruiu's initial work on
subsections.
The .subsections_via_symbols directive indicates we can split each
section along symbol boundaries, unless those symbols have been marked
with `.alt_entry`.
We exercise this functionality in our tests by using order files that
rearrange those symbols.
Depends on D79668.
Reviewers: ruiu, pcc, MaskRay, smeenai, alexshap, gkm, Ktwu, christylee
Reviewed By: smeenai
Subscribers: thakis, llvm-commits, pcc, ruiu
Tags: #llvm
Differential Revision: https://reviews.llvm.org/D79926
2020-05-19 23:46:07 +08:00
|
|
|
void parseRelocations(const llvm::MachO::section_64 &, SubsectionMap &);
|
2020-04-03 02:54:05 +08:00
|
|
|
|
|
|
|
private:
|
|
|
|
const Kind fileKind;
|
2020-08-19 06:46:21 +08:00
|
|
|
const StringRef name;
|
2020-04-03 02:54:05 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
// .o file
|
|
|
|
class ObjFile : public InputFile {
|
|
|
|
public:
|
|
|
|
explicit ObjFile(MemoryBufferRef mb);
|
|
|
|
static bool classof(const InputFile *f) { return f->kind() == ObjKind; }
|
|
|
|
};
|
|
|
|
|
2020-08-11 09:47:13 +08:00
|
|
|
// command-line -sectcreate file
|
|
|
|
class OpaqueFile : public InputFile {
|
|
|
|
public:
|
|
|
|
explicit OpaqueFile(MemoryBufferRef mb, StringRef segName,
|
|
|
|
StringRef sectName);
|
|
|
|
static bool classof(const InputFile *f) { return f->kind() == OpaqueKind; }
|
|
|
|
};
|
|
|
|
|
2020-04-22 04:37:57 +08:00
|
|
|
// .dylib file
|
|
|
|
class DylibFile : public InputFile {
|
|
|
|
public:
|
2020-04-24 11:16:49 +08:00
|
|
|
// Mach-O dylibs can re-export other dylibs as sub-libraries, meaning that the
|
|
|
|
// symbols in those sub-libraries will be available under the umbrella
|
|
|
|
// library's namespace. Those sub-libraries can also have their own
|
|
|
|
// re-exports. When loading a re-exported dylib, `umbrella` should be set to
|
|
|
|
// the root dylib to ensure symbols in the child library are correctly bound
|
|
|
|
// to the root. On the other hand, if a dylib is being directly loaded
|
|
|
|
// (through an -lfoo flag), then `umbrella` should be a nullptr.
|
|
|
|
explicit DylibFile(MemoryBufferRef mb, DylibFile *umbrella = nullptr);
|
2020-06-06 02:18:33 +08:00
|
|
|
|
2020-08-19 06:46:21 +08:00
|
|
|
explicit DylibFile(const llvm::MachO::InterfaceFile &interface,
|
|
|
|
DylibFile *umbrella = nullptr);
|
|
|
|
|
2020-04-22 04:37:57 +08:00
|
|
|
static bool classof(const InputFile *f) { return f->kind() == DylibKind; }
|
|
|
|
|
|
|
|
StringRef dylibName;
|
|
|
|
uint64_t ordinal = 0; // Ordinal numbering starts from 1, so 0 is a sentinel
|
2020-04-24 11:16:49 +08:00
|
|
|
bool reexport = false;
|
|
|
|
std::vector<DylibFile *> reexported;
|
2020-04-22 04:37:57 +08:00
|
|
|
};
|
|
|
|
|
2020-05-15 03:43:51 +08:00
|
|
|
// .a file
|
|
|
|
class ArchiveFile : public InputFile {
|
|
|
|
public:
|
|
|
|
explicit ArchiveFile(std::unique_ptr<llvm::object::Archive> &&file);
|
|
|
|
static bool classof(const InputFile *f) { return f->kind() == ArchiveKind; }
|
|
|
|
void fetch(const llvm::object::Archive::Symbol &sym);
|
|
|
|
|
|
|
|
private:
|
|
|
|
std::unique_ptr<llvm::object::Archive> file;
|
|
|
|
// Keep track of children fetched from the archive by tracking
|
|
|
|
// which address offsets have been fetched already.
|
|
|
|
llvm::DenseSet<uint64_t> seen;
|
|
|
|
};
|
|
|
|
|
2020-04-03 02:54:05 +08:00
|
|
|
extern std::vector<InputFile *> inputFiles;
|
|
|
|
|
|
|
|
llvm::Optional<MemoryBufferRef> readFile(StringRef path);
|
|
|
|
|
2020-08-19 05:37:04 +08:00
|
|
|
const llvm::MachO::load_command *
|
|
|
|
findCommand(const llvm::MachO::mach_header_64 *, uint32_t type);
|
|
|
|
|
2020-04-03 02:54:05 +08:00
|
|
|
} // namespace macho
|
|
|
|
|
|
|
|
std::string toString(const macho::InputFile *file);
|
|
|
|
} // namespace lld
|
|
|
|
|
|
|
|
#endif
|