2015-10-01 01:23:26 +08:00
|
|
|
//===- LinkerScript.cpp ---------------------------------------------------===//
|
|
|
|
//
|
|
|
|
// The LLVM Linker
|
|
|
|
//
|
|
|
|
// This file is distributed under the University of Illinois Open Source
|
|
|
|
// License. See LICENSE.TXT for details.
|
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
//
|
|
|
|
// This file contains the parser/evaluator of the linker script.
|
2016-07-22 03:45:22 +08:00
|
|
|
// It parses a linker script and write the result to Config or ScriptConfig
|
|
|
|
// objects.
|
|
|
|
//
|
|
|
|
// If SECTIONS command is used, a ScriptConfig contains an AST
|
|
|
|
// of the command which will later be consumed by createSections() and
|
|
|
|
// assignAddresses().
|
2015-10-01 01:23:26 +08:00
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
2016-02-12 05:17:59 +08:00
|
|
|
#include "LinkerScript.h"
|
2015-10-01 01:23:26 +08:00
|
|
|
#include "Config.h"
|
|
|
|
#include "Driver.h"
|
2016-02-13 05:47:28 +08:00
|
|
|
#include "InputSection.h"
|
2016-04-16 18:10:32 +08:00
|
|
|
#include "OutputSections.h"
|
2016-04-07 04:59:11 +08:00
|
|
|
#include "ScriptParser.h"
|
2016-06-29 16:01:32 +08:00
|
|
|
#include "Strings.h"
|
2016-07-12 14:39:48 +08:00
|
|
|
#include "Symbols.h"
|
2015-10-01 01:23:26 +08:00
|
|
|
#include "SymbolTable.h"
|
2016-07-01 18:27:36 +08:00
|
|
|
#include "Target.h"
|
2016-07-19 17:25:43 +08:00
|
|
|
#include "Writer.h"
|
2016-04-20 02:58:11 +08:00
|
|
|
#include "llvm/ADT/StringSwitch.h"
|
2016-04-16 18:10:32 +08:00
|
|
|
#include "llvm/Support/ELF.h"
|
2015-10-01 01:23:26 +08:00
|
|
|
#include "llvm/Support/FileSystem.h"
|
|
|
|
#include "llvm/Support/MemoryBuffer.h"
|
2015-10-13 08:09:21 +08:00
|
|
|
#include "llvm/Support/Path.h"
|
2015-10-11 09:53:04 +08:00
|
|
|
#include "llvm/Support/StringSaver.h"
|
2015-10-01 01:23:26 +08:00
|
|
|
|
|
|
|
using namespace llvm;
|
2016-04-16 18:10:32 +08:00
|
|
|
using namespace llvm::ELF;
|
2016-02-13 05:47:28 +08:00
|
|
|
using namespace llvm::object;
|
2015-10-01 01:23:26 +08:00
|
|
|
using namespace lld;
|
2016-02-28 08:25:54 +08:00
|
|
|
using namespace lld::elf;
|
2015-10-01 01:23:26 +08:00
|
|
|
|
2016-09-08 16:19:13 +08:00
|
|
|
LinkerScriptBase *elf::ScriptBase;
|
2016-04-21 04:13:41 +08:00
|
|
|
ScriptConfiguration *elf::ScriptConfig;
|
2016-02-12 05:17:59 +08:00
|
|
|
|
2016-09-08 16:20:30 +08:00
|
|
|
template <class ELFT> static void addRegular(SymbolAssignment *Cmd) {
|
2016-08-12 07:22:52 +08:00
|
|
|
Symbol *Sym = Symtab<ELFT>::X->addRegular(Cmd->Name, STB_GLOBAL, STV_DEFAULT);
|
|
|
|
Sym->Visibility = Cmd->Hidden ? STV_HIDDEN : STV_DEFAULT;
|
|
|
|
Cmd->Sym = Sym->body();
|
2016-09-16 23:30:47 +08:00
|
|
|
|
|
|
|
// If we have no SECTIONS then we don't have '.' and don't call
|
|
|
|
// assignAddresses(). We calculate symbol value immediately in this case.
|
|
|
|
if (!ScriptConfig->HasSections)
|
|
|
|
cast<DefinedRegular<ELFT>>(Cmd->Sym)->Value = Cmd->Expression(0);
|
2016-08-11 15:56:43 +08:00
|
|
|
}
|
|
|
|
|
2016-08-12 11:31:09 +08:00
|
|
|
template <class ELFT> static void addSynthetic(SymbolAssignment *Cmd) {
|
2016-08-19 23:36:32 +08:00
|
|
|
Symbol *Sym = Symtab<ELFT>::X->addSynthetic(
|
|
|
|
Cmd->Name, nullptr, 0, Cmd->Hidden ? STV_HIDDEN : STV_DEFAULT);
|
2016-08-12 07:22:52 +08:00
|
|
|
Cmd->Sym = Sym->body();
|
2016-08-11 15:56:43 +08:00
|
|
|
}
|
|
|
|
|
2016-09-07 15:08:43 +08:00
|
|
|
template <class ELFT> static void addSymbol(SymbolAssignment *Cmd) {
|
|
|
|
if (Cmd->IsAbsolute)
|
|
|
|
addRegular<ELFT>(Cmd);
|
|
|
|
else
|
|
|
|
addSynthetic<ELFT>(Cmd);
|
|
|
|
}
|
2016-08-12 07:22:52 +08:00
|
|
|
// If a symbol was in PROVIDE(), we need to define it only when
|
|
|
|
// it is an undefined symbol.
|
|
|
|
template <class ELFT> static bool shouldDefine(SymbolAssignment *Cmd) {
|
|
|
|
if (Cmd->Name == ".")
|
2016-08-11 15:56:43 +08:00
|
|
|
return false;
|
2016-08-12 07:22:52 +08:00
|
|
|
if (!Cmd->Provide)
|
|
|
|
return true;
|
|
|
|
SymbolBody *B = Symtab<ELFT>::X->find(Cmd->Name);
|
|
|
|
return B && B->isUndefined();
|
2016-08-11 15:56:43 +08:00
|
|
|
}
|
|
|
|
|
2016-07-21 14:43:01 +08:00
|
|
|
bool SymbolAssignment::classof(const BaseCommand *C) {
|
|
|
|
return C->Kind == AssignmentKind;
|
|
|
|
}
|
|
|
|
|
|
|
|
bool OutputSectionCommand::classof(const BaseCommand *C) {
|
|
|
|
return C->Kind == OutputSectionKind;
|
|
|
|
}
|
|
|
|
|
2016-07-21 22:26:59 +08:00
|
|
|
bool InputSectionDescription::classof(const BaseCommand *C) {
|
|
|
|
return C->Kind == InputSectionKind;
|
|
|
|
}
|
|
|
|
|
2016-08-04 17:29:31 +08:00
|
|
|
bool AssertCommand::classof(const BaseCommand *C) {
|
|
|
|
return C->Kind == AssertKind;
|
|
|
|
}
|
|
|
|
|
2016-07-23 22:09:58 +08:00
|
|
|
template <class ELFT> static bool isDiscarded(InputSectionBase<ELFT> *S) {
|
2016-07-21 22:26:59 +08:00
|
|
|
return !S || !S->Live;
|
2016-02-12 05:17:59 +08:00
|
|
|
}
|
|
|
|
|
2016-08-12 09:24:53 +08:00
|
|
|
template <class ELFT> LinkerScript<ELFT>::LinkerScript() {}
|
|
|
|
template <class ELFT> LinkerScript<ELFT>::~LinkerScript() {}
|
|
|
|
|
2016-04-21 04:13:41 +08:00
|
|
|
template <class ELFT>
|
|
|
|
bool LinkerScript<ELFT>::shouldKeep(InputSectionBase<ELFT> *S) {
|
2016-09-03 05:17:20 +08:00
|
|
|
for (Regex *Re : Opt.KeptSections)
|
2016-09-08 22:06:08 +08:00
|
|
|
if (Re->match(S->Name))
|
2016-07-21 22:26:59 +08:00
|
|
|
return true;
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2016-09-17 10:10:15 +08:00
|
|
|
static bool fileMatches(const Regex &FileRe, const Regex &ExcludedFileRe,
|
|
|
|
StringRef Filename) {
|
2016-09-17 01:42:10 +08:00
|
|
|
return const_cast<Regex &>(FileRe).match(Filename) &&
|
|
|
|
!const_cast<Regex &>(ExcludedFileRe).match(Filename);
|
2016-07-29 05:51:30 +08:00
|
|
|
}
|
|
|
|
|
2016-09-16 03:15:12 +08:00
|
|
|
static bool comparePriority(InputSectionData *A, InputSectionData *B) {
|
|
|
|
return getPriority(A->Name) < getPriority(B->Name);
|
|
|
|
}
|
|
|
|
|
2016-09-09 04:47:52 +08:00
|
|
|
static bool compareName(InputSectionData *A, InputSectionData *B) {
|
2016-09-08 22:06:08 +08:00
|
|
|
return A->Name < B->Name;
|
2016-08-05 06:27:00 +08:00
|
|
|
}
|
|
|
|
|
2016-09-09 04:47:52 +08:00
|
|
|
static bool compareAlignment(InputSectionData *A, InputSectionData *B) {
|
2016-08-05 06:27:00 +08:00
|
|
|
// ">" is not a mistake. Larger alignments are placed before smaller
|
|
|
|
// alignments in order to reduce the amount of padding necessary.
|
|
|
|
// This is compatible with GNU.
|
|
|
|
return A->Alignment > B->Alignment;
|
|
|
|
}
|
|
|
|
|
2016-09-09 04:47:52 +08:00
|
|
|
static std::function<bool(InputSectionData *, InputSectionData *)>
|
2016-09-17 04:21:55 +08:00
|
|
|
getComparator(SortSectionPolicy K) {
|
|
|
|
switch (K) {
|
|
|
|
case SortSectionPolicy::Alignment:
|
|
|
|
return compareAlignment;
|
|
|
|
case SortSectionPolicy::Name:
|
2016-09-09 04:47:52 +08:00
|
|
|
return compareName;
|
2016-09-17 04:21:55 +08:00
|
|
|
case SortSectionPolicy::Priority:
|
|
|
|
return comparePriority;
|
|
|
|
default:
|
|
|
|
llvm_unreachable("unknown sort policy");
|
|
|
|
}
|
2016-08-05 06:27:00 +08:00
|
|
|
}
|
2016-07-29 23:32:46 +08:00
|
|
|
|
2016-08-13 04:38:20 +08:00
|
|
|
static bool checkConstraint(uint64_t Flags, ConstraintKind Kind) {
|
|
|
|
bool RO = (Kind == ConstraintKind::ReadOnly);
|
|
|
|
bool RW = (Kind == ConstraintKind::ReadWrite);
|
|
|
|
bool Writable = Flags & SHF_WRITE;
|
2016-09-07 06:50:48 +08:00
|
|
|
return !(RO && Writable) && !(RW && !Writable);
|
2016-08-13 04:38:20 +08:00
|
|
|
}
|
|
|
|
|
2016-08-12 17:07:57 +08:00
|
|
|
template <class ELFT>
|
2016-09-17 04:34:02 +08:00
|
|
|
static bool matchConstraints(ArrayRef<InputSectionBase<ELFT> *> Sections,
|
2016-08-12 17:07:57 +08:00
|
|
|
ConstraintKind Kind) {
|
2016-08-13 04:38:20 +08:00
|
|
|
if (Kind == ConstraintKind::NoConstraint)
|
|
|
|
return true;
|
2016-09-16 23:10:23 +08:00
|
|
|
return llvm::all_of(Sections, [=](InputSectionData *Sec2) {
|
|
|
|
auto *Sec = static_cast<InputSectionBase<ELFT> *>(Sec2);
|
2016-08-13 04:38:20 +08:00
|
|
|
return checkConstraint(Sec->getSectionHdr()->sh_flags, Kind);
|
2016-08-12 17:07:57 +08:00
|
|
|
});
|
|
|
|
}
|
|
|
|
|
2016-09-16 23:10:23 +08:00
|
|
|
// Compute and remember which sections the InputSectionDescription matches.
|
2016-09-14 22:32:08 +08:00
|
|
|
template <class ELFT>
|
2016-09-17 04:34:02 +08:00
|
|
|
void LinkerScript<ELFT>::computeInputSections(InputSectionDescription *I) {
|
2016-09-17 10:10:15 +08:00
|
|
|
for (const std::pair<Regex, Regex> &V : I->SectionsVec) {
|
2016-09-17 01:42:10 +08:00
|
|
|
for (ObjectFile<ELFT> *F : Symtab<ELFT>::X->getObjectFiles()) {
|
|
|
|
if (fileMatches(I->FileRe, V.first, sys::path::filename(F->getName()))) {
|
|
|
|
Regex &Re = const_cast<Regex &>(V.second);
|
|
|
|
for (InputSectionBase<ELFT> *S : F->getSections())
|
|
|
|
if (!isDiscarded(S) && !S->OutSec && Re.match(S->Name))
|
|
|
|
I->Sections.push_back(S);
|
|
|
|
|
|
|
|
if (Re.match("COMMON"))
|
|
|
|
I->Sections.push_back(CommonInputSection<ELFT>::X);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2016-09-16 23:10:23 +08:00
|
|
|
|
2016-09-17 05:14:55 +08:00
|
|
|
if (I->SortInner != SortSectionPolicy::Default)
|
2016-09-16 23:10:23 +08:00
|
|
|
std::stable_sort(I->Sections.begin(), I->Sections.end(),
|
|
|
|
getComparator(I->SortInner));
|
2016-09-17 05:14:55 +08:00
|
|
|
if (I->SortOuter != SortSectionPolicy::Default)
|
2016-09-16 23:10:23 +08:00
|
|
|
std::stable_sort(I->Sections.begin(), I->Sections.end(),
|
|
|
|
getComparator(I->SortOuter));
|
|
|
|
|
|
|
|
// We do not add duplicate input sections, so mark them with a dummy output
|
|
|
|
// section for now.
|
|
|
|
for (InputSectionData *S : I->Sections) {
|
|
|
|
auto *S2 = static_cast<InputSectionBase<ELFT> *>(S);
|
|
|
|
S2->OutSec = (OutputSectionBase<ELFT> *)-1;
|
|
|
|
}
|
2016-09-14 22:32:08 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
template <class ELFT>
|
|
|
|
void LinkerScript<ELFT>::discard(ArrayRef<InputSectionBase<ELFT> *> V) {
|
|
|
|
for (InputSectionBase<ELFT> *S : V) {
|
|
|
|
S->Live = false;
|
|
|
|
reportDiscarded(S);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-08-12 08:27:23 +08:00
|
|
|
template <class ELFT>
|
2016-08-12 11:16:56 +08:00
|
|
|
std::vector<InputSectionBase<ELFT> *>
|
2016-08-12 17:07:57 +08:00
|
|
|
LinkerScript<ELFT>::createInputSectionList(OutputSectionCommand &OutCmd) {
|
2016-08-12 11:16:56 +08:00
|
|
|
std::vector<InputSectionBase<ELFT> *> Ret;
|
|
|
|
|
2016-08-12 17:07:57 +08:00
|
|
|
for (const std::unique_ptr<BaseCommand> &Base : OutCmd.Commands) {
|
2016-09-17 05:05:36 +08:00
|
|
|
auto *Cmd = dyn_cast<InputSectionDescription>(Base.get());
|
|
|
|
if (!Cmd)
|
2016-08-12 11:16:56 +08:00
|
|
|
continue;
|
2016-09-17 04:34:02 +08:00
|
|
|
computeInputSections(Cmd);
|
2016-09-16 23:10:23 +08:00
|
|
|
for (InputSectionData *S : Cmd->Sections)
|
|
|
|
Ret.push_back(static_cast<InputSectionBase<ELFT> *>(S));
|
2016-08-12 11:16:56 +08:00
|
|
|
}
|
2016-09-17 04:34:02 +08:00
|
|
|
|
2016-08-12 11:16:56 +08:00
|
|
|
return Ret;
|
|
|
|
}
|
2016-08-12 08:27:23 +08:00
|
|
|
|
2016-09-13 22:23:14 +08:00
|
|
|
template <class ELFT>
|
|
|
|
static SectionKey<ELFT::Is64Bits> createKey(InputSectionBase<ELFT> *C,
|
|
|
|
StringRef OutsecName) {
|
|
|
|
// When using linker script the merge rules are different.
|
|
|
|
// Unfortunately, linker scripts are name based. This means that expressions
|
|
|
|
// like *(.foo*) can refer to multiple input sections that would normally be
|
|
|
|
// placed in different output sections. We cannot put them in different
|
|
|
|
// output sections or we would produce wrong results for
|
|
|
|
// start = .; *(.foo.*) end = .; *(.bar)
|
|
|
|
// and a mapping of .foo1 and .bar1 to one section and .foo2 and .bar2 to
|
|
|
|
// another. The problem is that there is no way to layout those output
|
|
|
|
// sections such that the .foo sections are the only thing between the
|
|
|
|
// start and end symbols.
|
|
|
|
|
|
|
|
// An extra annoyance is that we cannot simply disable merging of the contents
|
|
|
|
// of SHF_MERGE sections, but our implementation requires one output section
|
|
|
|
// per "kind" (string or not, which size/aligment).
|
|
|
|
// Fortunately, creating symbols in the middle of a merge section is not
|
|
|
|
// supported by bfd or gold, so we can just create multiple section in that
|
|
|
|
// case.
|
|
|
|
const typename ELFT::Shdr *H = C->getSectionHdr();
|
|
|
|
typedef typename ELFT::uint uintX_t;
|
|
|
|
uintX_t Flags = H->sh_flags & (SHF_MERGE | SHF_STRINGS);
|
|
|
|
|
|
|
|
uintX_t Alignment = 0;
|
|
|
|
if (isa<MergeInputSection<ELFT>>(C))
|
|
|
|
Alignment = std::max(H->sh_addralign, H->sh_entsize);
|
|
|
|
|
|
|
|
return SectionKey<ELFT::Is64Bits>{OutsecName, /*Type*/ 0, Flags, Alignment};
|
|
|
|
}
|
|
|
|
|
2016-08-12 11:16:56 +08:00
|
|
|
template <class ELFT>
|
2016-09-16 23:30:47 +08:00
|
|
|
void LinkerScript<ELFT>::addSection(OutputSectionFactory<ELFT> &Factory,
|
|
|
|
InputSectionBase<ELFT> *Sec,
|
|
|
|
StringRef Name) {
|
|
|
|
OutputSectionBase<ELFT> *OutSec;
|
|
|
|
bool IsNew;
|
|
|
|
std::tie(OutSec, IsNew) = Factory.create(createKey(Sec, Name), Sec);
|
|
|
|
if (IsNew)
|
|
|
|
OutputSections->push_back(OutSec);
|
|
|
|
OutSec->addSection(Sec);
|
|
|
|
}
|
|
|
|
|
|
|
|
template <class ELFT>
|
|
|
|
void LinkerScript<ELFT>::processCommands(OutputSectionFactory<ELFT> &Factory) {
|
2016-09-13 21:00:06 +08:00
|
|
|
|
2016-09-17 05:05:36 +08:00
|
|
|
for (unsigned I = 0; I < Opt.Commands.size(); ++I) {
|
|
|
|
auto Iter = Opt.Commands.begin() + I;
|
|
|
|
const std::unique_ptr<BaseCommand> &Base1 = *Iter;
|
2016-08-12 11:33:04 +08:00
|
|
|
if (auto *Cmd = dyn_cast<SymbolAssignment>(Base1.get())) {
|
|
|
|
if (shouldDefine<ELFT>(Cmd))
|
|
|
|
addRegular<ELFT>(Cmd);
|
|
|
|
continue;
|
|
|
|
}
|
2016-09-16 23:30:47 +08:00
|
|
|
if (auto *Cmd = dyn_cast<AssertCommand>(Base1.get())) {
|
|
|
|
// If we don't have SECTIONS then output sections have already been
|
|
|
|
// created by Writer<EFLT>. The LinkerScript<ELFT>::assignAddresses
|
|
|
|
// will not be called, so ASSERT should be evaluated now.
|
|
|
|
if (!Opt.HasSections)
|
|
|
|
Cmd->Expression(0);
|
|
|
|
continue;
|
|
|
|
}
|
2016-08-12 11:33:04 +08:00
|
|
|
|
2016-08-11 15:56:43 +08:00
|
|
|
if (auto *Cmd = dyn_cast<OutputSectionCommand>(Base1.get())) {
|
2016-09-13 00:05:16 +08:00
|
|
|
std::vector<InputSectionBase<ELFT> *> V = createInputSectionList(*Cmd);
|
|
|
|
|
2016-08-12 08:27:23 +08:00
|
|
|
if (Cmd->Name == "/DISCARD/") {
|
2016-09-13 00:05:16 +08:00
|
|
|
discard(V);
|
2016-08-12 08:27:23 +08:00
|
|
|
continue;
|
|
|
|
}
|
2016-08-12 11:16:56 +08:00
|
|
|
|
2016-09-17 05:05:36 +08:00
|
|
|
if (!matchConstraints<ELFT>(V, Cmd->Constraint)) {
|
|
|
|
for (InputSectionBase<ELFT> *S : V)
|
|
|
|
S->OutSec = nullptr;
|
|
|
|
Opt.Commands.erase(Iter);
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
for (const std::unique_ptr<BaseCommand> &Base : Cmd->Commands)
|
|
|
|
if (auto *OutCmd = dyn_cast<SymbolAssignment>(Base.get()))
|
|
|
|
if (shouldDefine<ELFT>(OutCmd))
|
|
|
|
addSymbol<ELFT>(OutCmd);
|
|
|
|
|
2016-09-01 17:55:57 +08:00
|
|
|
if (V.empty())
|
2016-08-12 11:16:56 +08:00
|
|
|
continue;
|
|
|
|
|
2016-08-19 23:18:23 +08:00
|
|
|
for (InputSectionBase<ELFT> *Sec : V) {
|
2016-09-16 23:30:47 +08:00
|
|
|
addSection(Factory, Sec, Cmd->Name);
|
|
|
|
if (uint32_t Subalign = Cmd->SubalignExpr ? Cmd->SubalignExpr(0) : 0)
|
2016-08-19 23:18:23 +08:00
|
|
|
Sec->Alignment = Subalign;
|
|
|
|
}
|
2016-08-11 15:56:43 +08:00
|
|
|
}
|
2016-08-12 08:27:23 +08:00
|
|
|
}
|
2016-09-16 23:30:47 +08:00
|
|
|
}
|
2016-07-20 22:43:20 +08:00
|
|
|
|
2016-09-16 23:30:47 +08:00
|
|
|
template <class ELFT>
|
|
|
|
void LinkerScript<ELFT>::createSections(OutputSectionFactory<ELFT> &Factory) {
|
|
|
|
processCommands(Factory);
|
2016-08-12 11:16:56 +08:00
|
|
|
// Add orphan sections.
|
2016-09-16 23:30:47 +08:00
|
|
|
for (ObjectFile<ELFT> *F : Symtab<ELFT>::X->getObjectFiles())
|
|
|
|
for (InputSectionBase<ELFT> *S : F->getSections())
|
|
|
|
if (!isDiscarded(S) && !S->OutSec)
|
|
|
|
addSection(Factory, S, getOutputSectionName(S));
|
2016-07-20 22:43:20 +08:00
|
|
|
}
|
|
|
|
|
2016-09-07 15:08:43 +08:00
|
|
|
// Sets value of a section-defined symbol. Two kinds of
|
|
|
|
// symbols are processed: synthetic symbols, whose value
|
|
|
|
// is an offset from beginning of section and regular
|
|
|
|
// symbols whose value is absolute.
|
|
|
|
template <class ELFT>
|
|
|
|
static void assignSectionSymbol(SymbolAssignment *Cmd,
|
|
|
|
OutputSectionBase<ELFT> *Sec,
|
|
|
|
typename ELFT::uint Off) {
|
|
|
|
if (!Cmd->Sym)
|
|
|
|
return;
|
|
|
|
|
|
|
|
if (auto *Body = dyn_cast<DefinedSynthetic<ELFT>>(Cmd->Sym)) {
|
|
|
|
Body->Section = Sec;
|
|
|
|
Body->Value = Cmd->Expression(Sec->getVA() + Off) - Sec->getVA();
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
auto *Body = cast<DefinedRegular<ELFT>>(Cmd->Sym);
|
|
|
|
Body->Value = Cmd->Expression(Sec->getVA() + Off);
|
|
|
|
}
|
|
|
|
|
2016-09-16 23:10:23 +08:00
|
|
|
template <class ELFT> void LinkerScript<ELFT>::output(InputSection<ELFT> *S) {
|
|
|
|
if (!AlreadyOutputIS.insert(S).second)
|
|
|
|
return;
|
|
|
|
bool IsTbss =
|
|
|
|
(CurOutSec->getFlags() & SHF_TLS) && CurOutSec->getType() == SHT_NOBITS;
|
|
|
|
|
|
|
|
uintX_t Pos = IsTbss ? Dot + ThreadBssOffset : Dot;
|
|
|
|
Pos = alignTo(Pos, S->Alignment);
|
|
|
|
S->OutSecOff = Pos - CurOutSec->getVA();
|
|
|
|
Pos += S->getSize();
|
|
|
|
|
|
|
|
// Update output section size after adding each section. This is so that
|
|
|
|
// SIZEOF works correctly in the case below:
|
|
|
|
// .foo { *(.aaa) a = SIZEOF(.foo); *(.bbb) }
|
|
|
|
CurOutSec->setSize(Pos - CurOutSec->getVA());
|
|
|
|
|
|
|
|
if (!IsTbss)
|
|
|
|
Dot = Pos;
|
|
|
|
}
|
|
|
|
|
|
|
|
template <class ELFT> void LinkerScript<ELFT>::flush() {
|
|
|
|
if (auto *OutSec = dyn_cast_or_null<OutputSection<ELFT>>(CurOutSec)) {
|
|
|
|
for (InputSection<ELFT> *I : OutSec->Sections)
|
|
|
|
output(I);
|
|
|
|
AlreadyOutputOS.insert(CurOutSec);
|
2016-08-31 16:13:33 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
template <class ELFT>
|
2016-09-16 23:10:23 +08:00
|
|
|
void LinkerScript<ELFT>::switchTo(OutputSectionBase<ELFT> *Sec) {
|
|
|
|
if (CurOutSec == Sec)
|
|
|
|
return;
|
|
|
|
if (AlreadyOutputOS.count(Sec))
|
2016-08-11 15:56:43 +08:00
|
|
|
return;
|
|
|
|
|
2016-09-16 23:10:23 +08:00
|
|
|
flush();
|
|
|
|
CurOutSec = Sec;
|
|
|
|
|
|
|
|
Dot = alignTo(Dot, CurOutSec->getAlignment());
|
|
|
|
CurOutSec->setVA(Dot);
|
|
|
|
}
|
2016-09-01 17:55:57 +08:00
|
|
|
|
2016-09-16 23:10:23 +08:00
|
|
|
template <class ELFT> void LinkerScript<ELFT>::process(BaseCommand &Base) {
|
|
|
|
if (auto *AssignCmd = dyn_cast<SymbolAssignment>(&Base)) {
|
|
|
|
if (AssignCmd->Name == ".") {
|
|
|
|
// Update to location counter means update to section size.
|
|
|
|
Dot = AssignCmd->Expression(Dot);
|
|
|
|
CurOutSec->setSize(Dot - CurOutSec->getVA());
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
assignSectionSymbol<ELFT>(AssignCmd, CurOutSec, Dot - CurOutSec->getVA());
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
auto &ICmd = cast<InputSectionDescription>(Base);
|
|
|
|
for (InputSectionData *ID : ICmd.Sections) {
|
|
|
|
auto *IB = static_cast<InputSectionBase<ELFT> *>(ID);
|
|
|
|
switchTo(IB->OutSec);
|
|
|
|
if (auto *I = dyn_cast<InputSection<ELFT>>(IB))
|
|
|
|
output(I);
|
|
|
|
else if (AlreadyOutputOS.insert(CurOutSec).second)
|
|
|
|
Dot += CurOutSec->getSize();
|
2016-08-11 15:56:43 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-08-13 04:38:20 +08:00
|
|
|
template <class ELFT>
|
2016-09-07 18:46:07 +08:00
|
|
|
static std::vector<OutputSectionBase<ELFT> *>
|
|
|
|
findSections(OutputSectionCommand &Cmd,
|
2016-09-16 23:10:23 +08:00
|
|
|
const std::vector<OutputSectionBase<ELFT> *> &Sections) {
|
2016-09-07 18:46:07 +08:00
|
|
|
std::vector<OutputSectionBase<ELFT> *> Ret;
|
|
|
|
for (OutputSectionBase<ELFT> *Sec : Sections)
|
2016-09-17 05:05:36 +08:00
|
|
|
if (Sec->getName() == Cmd.Name)
|
2016-09-07 18:46:07 +08:00
|
|
|
Ret.push_back(Sec);
|
|
|
|
return Ret;
|
2016-08-13 04:38:20 +08:00
|
|
|
}
|
|
|
|
|
2016-09-16 23:10:23 +08:00
|
|
|
template <class ELFT>
|
|
|
|
void LinkerScript<ELFT>::assignOffsets(OutputSectionCommand *Cmd) {
|
|
|
|
std::vector<OutputSectionBase<ELFT> *> Sections =
|
|
|
|
findSections(*Cmd, *OutputSections);
|
|
|
|
if (Sections.empty())
|
|
|
|
return;
|
|
|
|
switchTo(Sections[0]);
|
|
|
|
|
|
|
|
// Find the last section output location. We will output orphan sections
|
|
|
|
// there so that end symbols point to the correct location.
|
|
|
|
auto E = std::find_if(Cmd->Commands.rbegin(), Cmd->Commands.rend(),
|
|
|
|
[](const std::unique_ptr<BaseCommand> &Cmd) {
|
|
|
|
return !isa<SymbolAssignment>(*Cmd);
|
|
|
|
})
|
|
|
|
.base();
|
|
|
|
for (auto I = Cmd->Commands.begin(); I != E; ++I)
|
|
|
|
process(**I);
|
|
|
|
flush();
|
|
|
|
for (OutputSectionBase<ELFT> *Base : Sections) {
|
|
|
|
if (!AlreadyOutputOS.insert(Base).second)
|
|
|
|
continue;
|
|
|
|
switchTo(Base);
|
|
|
|
Dot += CurOutSec->getSize();
|
|
|
|
}
|
|
|
|
for (auto I = E, E = Cmd->Commands.end(); I != E; ++I)
|
|
|
|
process(**I);
|
|
|
|
}
|
|
|
|
|
2016-08-04 20:13:05 +08:00
|
|
|
template <class ELFT> void LinkerScript<ELFT>::assignAddresses() {
|
2016-04-16 18:10:32 +08:00
|
|
|
// Orphan sections are sections present in the input files which
|
2016-04-19 05:00:40 +08:00
|
|
|
// are not explicitly placed into the output file by the linker script.
|
|
|
|
// We place orphan sections at end of file.
|
|
|
|
// Other linkers places them using some heuristics as described in
|
2016-04-16 18:10:32 +08:00
|
|
|
// https://sourceware.org/binutils/docs/ld/Orphan-Sections.html#Orphan-Sections.
|
2016-09-17 05:29:07 +08:00
|
|
|
|
|
|
|
// The OutputSections are already in the correct order.
|
|
|
|
// This loops creates or moves commands as needed so that they are in the
|
|
|
|
// correct order.
|
|
|
|
int CmdIndex = 0;
|
2016-08-12 08:36:56 +08:00
|
|
|
for (OutputSectionBase<ELFT> *Sec : *OutputSections) {
|
2016-04-16 18:10:32 +08:00
|
|
|
StringRef Name = Sec->getName();
|
2016-09-17 05:29:07 +08:00
|
|
|
|
|
|
|
// Find the last spot where we can insert a command and still get the
|
|
|
|
// correct order.
|
|
|
|
auto CmdIter = Opt.Commands.begin() + CmdIndex;
|
|
|
|
auto E = Opt.Commands.end();
|
|
|
|
while (CmdIter != E && !isa<OutputSectionCommand>(**CmdIter)) {
|
|
|
|
++CmdIter;
|
|
|
|
++CmdIndex;
|
|
|
|
}
|
|
|
|
|
|
|
|
auto Pos =
|
|
|
|
std::find_if(CmdIter, E, [&](const std::unique_ptr<BaseCommand> &Base) {
|
|
|
|
auto *Cmd = dyn_cast<OutputSectionCommand>(Base.get());
|
|
|
|
return Cmd && Cmd->Name == Name;
|
|
|
|
});
|
|
|
|
if (Pos == E) {
|
|
|
|
Opt.Commands.insert(CmdIter,
|
|
|
|
llvm::make_unique<OutputSectionCommand>(Name));
|
|
|
|
} else {
|
|
|
|
// If linker script lists alloc/non-alloc sections is the wrong order,
|
|
|
|
// this does a right rotate to bring the desired command in place.
|
2016-09-17 06:47:34 +08:00
|
|
|
auto RPos = llvm::make_reverse_iterator(Pos + 1);
|
|
|
|
std::rotate(RPos, RPos + 1, llvm::make_reverse_iterator(CmdIter));
|
2016-09-17 05:29:07 +08:00
|
|
|
}
|
|
|
|
++CmdIndex;
|
2016-04-16 18:10:32 +08:00
|
|
|
}
|
|
|
|
|
2016-04-19 05:00:40 +08:00
|
|
|
// Assign addresses as instructed by linker script SECTIONS sub-commands.
|
2016-08-12 12:00:22 +08:00
|
|
|
Dot = getHeaderSize();
|
2016-04-16 18:10:32 +08:00
|
|
|
|
2016-07-21 14:43:01 +08:00
|
|
|
for (const std::unique_ptr<BaseCommand> &Base : Opt.Commands) {
|
|
|
|
if (auto *Cmd = dyn_cast<SymbolAssignment>(Base.get())) {
|
2016-07-29 13:48:39 +08:00
|
|
|
if (Cmd->Name == ".") {
|
|
|
|
Dot = Cmd->Expression(Dot);
|
|
|
|
} else if (Cmd->Sym) {
|
|
|
|
cast<DefinedRegular<ELFT>>(Cmd->Sym)->Value = Cmd->Expression(Dot);
|
|
|
|
}
|
2016-07-12 14:39:48 +08:00
|
|
|
continue;
|
|
|
|
}
|
2016-04-16 18:10:32 +08:00
|
|
|
|
2016-08-04 17:29:31 +08:00
|
|
|
if (auto *Cmd = dyn_cast<AssertCommand>(Base.get())) {
|
|
|
|
Cmd->Expression(Dot);
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
2016-07-21 14:43:01 +08:00
|
|
|
auto *Cmd = cast<OutputSectionCommand>(Base.get());
|
2016-04-16 18:10:32 +08:00
|
|
|
|
2016-09-16 23:10:23 +08:00
|
|
|
if (Cmd->AddrExpr)
|
|
|
|
Dot = Cmd->AddrExpr(Dot);
|
2016-09-07 18:46:07 +08:00
|
|
|
|
2016-09-16 23:10:23 +08:00
|
|
|
assignOffsets(Cmd);
|
2016-04-16 18:10:32 +08:00
|
|
|
}
|
2016-07-01 18:42:25 +08:00
|
|
|
|
2016-09-17 05:29:07 +08:00
|
|
|
uintX_t MinVA = std::numeric_limits<uintX_t>::max();
|
|
|
|
for (OutputSectionBase<ELFT> *Sec : *OutputSections) {
|
|
|
|
if (Sec->getFlags() & SHF_ALLOC)
|
|
|
|
MinVA = std::min(MinVA, Sec->getVA());
|
|
|
|
else
|
2016-09-16 23:10:23 +08:00
|
|
|
Sec->setVA(0);
|
2016-09-17 05:29:07 +08:00
|
|
|
}
|
|
|
|
|
2016-09-16 05:22:11 +08:00
|
|
|
uintX_t HeaderSize =
|
|
|
|
Out<ELFT>::ElfHeader->getSize() + Out<ELFT>::ProgramHeaders->getSize();
|
|
|
|
if (HeaderSize > MinVA)
|
|
|
|
fatal("Not enough space for ELF and program headers");
|
|
|
|
|
2016-07-07 22:28:47 +08:00
|
|
|
// ELF and Program headers need to be right before the first section in
|
2016-07-19 15:42:07 +08:00
|
|
|
// memory. Set their addresses accordingly.
|
2016-09-16 05:22:11 +08:00
|
|
|
MinVA = alignDown(MinVA - HeaderSize, Target->PageSize);
|
2016-07-01 18:27:36 +08:00
|
|
|
Out<ELFT>::ElfHeader->setVA(MinVA);
|
|
|
|
Out<ELFT>::ProgramHeaders->setVA(Out<ELFT>::ElfHeader->getSize() + MinVA);
|
2016-04-16 18:10:32 +08:00
|
|
|
}
|
|
|
|
|
2016-08-22 12:55:20 +08:00
|
|
|
// Creates program headers as instructed by PHDRS linker script command.
|
2016-07-19 17:25:43 +08:00
|
|
|
template <class ELFT>
|
2016-08-04 20:13:05 +08:00
|
|
|
std::vector<PhdrEntry<ELFT>> LinkerScript<ELFT>::createPhdrs() {
|
2016-07-25 07:47:31 +08:00
|
|
|
std::vector<PhdrEntry<ELFT>> Ret;
|
2016-07-19 17:25:43 +08:00
|
|
|
|
2016-08-22 12:55:20 +08:00
|
|
|
// Process PHDRS and FILEHDR keywords because they are not
|
|
|
|
// real output sections and cannot be added in the following loop.
|
2016-07-19 17:25:43 +08:00
|
|
|
for (const PhdrsCommand &Cmd : Opt.PhdrsCommands) {
|
2016-07-25 07:47:31 +08:00
|
|
|
Ret.emplace_back(Cmd.Type, Cmd.Flags == UINT_MAX ? PF_R : Cmd.Flags);
|
|
|
|
PhdrEntry<ELFT> &Phdr = Ret.back();
|
2016-07-19 17:25:43 +08:00
|
|
|
|
|
|
|
if (Cmd.HasFilehdr)
|
2016-07-23 22:18:48 +08:00
|
|
|
Phdr.add(Out<ELFT>::ElfHeader);
|
2016-07-19 17:25:43 +08:00
|
|
|
if (Cmd.HasPhdrs)
|
2016-07-23 22:18:48 +08:00
|
|
|
Phdr.add(Out<ELFT>::ProgramHeaders);
|
2016-09-09 17:46:16 +08:00
|
|
|
|
|
|
|
if (Cmd.LMAExpr) {
|
|
|
|
Phdr.H.p_paddr = Cmd.LMAExpr(0);
|
|
|
|
Phdr.HasLMA = true;
|
|
|
|
}
|
2016-07-19 17:25:43 +08:00
|
|
|
}
|
|
|
|
|
2016-08-22 12:55:20 +08:00
|
|
|
// Add output sections to program headers.
|
2016-07-25 07:47:31 +08:00
|
|
|
PhdrEntry<ELFT> *Load = nullptr;
|
|
|
|
uintX_t Flags = PF_R;
|
2016-08-22 12:55:20 +08:00
|
|
|
for (OutputSectionBase<ELFT> *Sec : *OutputSections) {
|
2016-07-19 17:25:43 +08:00
|
|
|
if (!(Sec->getFlags() & SHF_ALLOC))
|
|
|
|
break;
|
|
|
|
|
2016-07-25 07:47:31 +08:00
|
|
|
std::vector<size_t> PhdrIds = getPhdrIndices(Sec->getName());
|
2016-07-19 17:25:43 +08:00
|
|
|
if (!PhdrIds.empty()) {
|
|
|
|
// Assign headers specified by linker script
|
|
|
|
for (size_t Id : PhdrIds) {
|
2016-07-25 07:47:31 +08:00
|
|
|
Ret[Id].add(Sec);
|
2016-07-21 18:43:25 +08:00
|
|
|
if (Opt.PhdrsCommands[Id].Flags == UINT_MAX)
|
2016-07-27 22:10:56 +08:00
|
|
|
Ret[Id].H.p_flags |= Sec->getPhdrFlags();
|
2016-07-19 17:25:43 +08:00
|
|
|
}
|
|
|
|
} else {
|
|
|
|
// If we have no load segment or flags've changed then we want new load
|
|
|
|
// segment.
|
2016-07-27 22:10:56 +08:00
|
|
|
uintX_t NewFlags = Sec->getPhdrFlags();
|
2016-07-19 17:25:43 +08:00
|
|
|
if (Load == nullptr || Flags != NewFlags) {
|
2016-07-25 07:47:31 +08:00
|
|
|
Load = &*Ret.emplace(Ret.end(), PT_LOAD, NewFlags);
|
2016-07-19 17:25:43 +08:00
|
|
|
Flags = NewFlags;
|
|
|
|
}
|
2016-07-21 03:36:41 +08:00
|
|
|
Load->add(Sec);
|
2016-07-19 17:25:43 +08:00
|
|
|
}
|
|
|
|
}
|
2016-07-25 07:47:31 +08:00
|
|
|
return Ret;
|
2016-07-19 17:25:43 +08:00
|
|
|
}
|
|
|
|
|
2016-08-16 14:40:58 +08:00
|
|
|
template <class ELFT> bool LinkerScript<ELFT>::ignoreInterpSection() {
|
|
|
|
// Ignore .interp section in case we have PHDRS specification
|
|
|
|
// and PT_INTERP isn't listed.
|
|
|
|
return !Opt.PhdrsCommands.empty() &&
|
|
|
|
llvm::find_if(Opt.PhdrsCommands, [](const PhdrsCommand &Cmd) {
|
|
|
|
return Cmd.Type == PT_INTERP;
|
|
|
|
}) == Opt.PhdrsCommands.end();
|
|
|
|
}
|
|
|
|
|
2016-04-21 04:13:41 +08:00
|
|
|
template <class ELFT>
|
|
|
|
ArrayRef<uint8_t> LinkerScript<ELFT>::getFiller(StringRef Name) {
|
2016-07-21 15:48:54 +08:00
|
|
|
for (const std::unique_ptr<BaseCommand> &Base : Opt.Commands)
|
|
|
|
if (auto *Cmd = dyn_cast<OutputSectionCommand>(Base.get()))
|
|
|
|
if (Cmd->Name == Name)
|
|
|
|
return Cmd->Filler;
|
|
|
|
return {};
|
2016-02-26 22:48:31 +08:00
|
|
|
}
|
|
|
|
|
2016-08-17 16:16:57 +08:00
|
|
|
template <class ELFT> Expr LinkerScript<ELFT>::getLma(StringRef Name) {
|
2016-08-17 15:44:19 +08:00
|
|
|
for (const std::unique_ptr<BaseCommand> &Base : Opt.Commands)
|
|
|
|
if (auto *Cmd = dyn_cast<OutputSectionCommand>(Base.get()))
|
|
|
|
if (Cmd->LmaExpr && Cmd->Name == Name)
|
|
|
|
return Cmd->LmaExpr;
|
|
|
|
return {};
|
|
|
|
}
|
|
|
|
|
2016-04-22 04:30:00 +08:00
|
|
|
// Returns the index of the given section name in linker script
|
|
|
|
// SECTIONS commands. Sections are laid out as the same order as they
|
|
|
|
// were in the script. If a given name did not appear in the script,
|
|
|
|
// it returns INT_MAX, so that it will be laid out at end of file.
|
2016-07-21 14:43:01 +08:00
|
|
|
template <class ELFT> int LinkerScript<ELFT>::getSectionIndex(StringRef Name) {
|
2016-07-26 08:21:15 +08:00
|
|
|
int I = 0;
|
|
|
|
for (std::unique_ptr<BaseCommand> &Base : Opt.Commands) {
|
|
|
|
if (auto *Cmd = dyn_cast<OutputSectionCommand>(Base.get()))
|
|
|
|
if (Cmd->Name == Name)
|
|
|
|
return I;
|
|
|
|
++I;
|
|
|
|
}
|
|
|
|
return INT_MAX;
|
2016-04-21 18:22:02 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
// A compartor to sort output sections. Returns -1 or 1 if
|
|
|
|
// A or B are mentioned in linker script. Otherwise, returns 0.
|
2016-04-21 04:13:41 +08:00
|
|
|
template <class ELFT>
|
|
|
|
int LinkerScript<ELFT>::compareSections(StringRef A, StringRef B) {
|
2016-04-22 04:30:00 +08:00
|
|
|
int I = getSectionIndex(A);
|
|
|
|
int J = getSectionIndex(B);
|
|
|
|
if (I == INT_MAX && J == INT_MAX)
|
2016-02-12 05:17:59 +08:00
|
|
|
return 0;
|
|
|
|
return I < J ? -1 : 1;
|
|
|
|
}
|
|
|
|
|
2016-07-19 17:25:43 +08:00
|
|
|
template <class ELFT> bool LinkerScript<ELFT>::hasPhdrsCommands() {
|
|
|
|
return !Opt.PhdrsCommands.empty();
|
|
|
|
}
|
|
|
|
|
2016-08-30 17:54:01 +08:00
|
|
|
template <class ELFT>
|
2016-09-08 16:19:13 +08:00
|
|
|
uint64_t LinkerScript<ELFT>::getOutputSectionAddress(StringRef Name) {
|
2016-08-30 17:54:01 +08:00
|
|
|
for (OutputSectionBase<ELFT> *Sec : *OutputSections)
|
|
|
|
if (Sec->getName() == Name)
|
|
|
|
return Sec->getVA();
|
|
|
|
error("undefined section " + Name);
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2016-07-30 00:18:47 +08:00
|
|
|
template <class ELFT>
|
2016-09-08 16:19:13 +08:00
|
|
|
uint64_t LinkerScript<ELFT>::getOutputSectionSize(StringRef Name) {
|
2016-07-30 00:18:47 +08:00
|
|
|
for (OutputSectionBase<ELFT> *Sec : *OutputSections)
|
|
|
|
if (Sec->getName() == Name)
|
|
|
|
return Sec->getSize();
|
|
|
|
error("undefined section " + Name);
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2016-09-08 17:08:30 +08:00
|
|
|
template <class ELFT>
|
|
|
|
uint64_t LinkerScript<ELFT>::getOutputSectionAlign(StringRef Name) {
|
|
|
|
for (OutputSectionBase<ELFT> *Sec : *OutputSections)
|
|
|
|
if (Sec->getName() == Name)
|
|
|
|
return Sec->getAlignment();
|
|
|
|
error("undefined section " + Name);
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2016-09-08 16:19:13 +08:00
|
|
|
template <class ELFT> uint64_t LinkerScript<ELFT>::getHeaderSize() {
|
2016-08-10 15:59:34 +08:00
|
|
|
return Out<ELFT>::ElfHeader->getSize() + Out<ELFT>::ProgramHeaders->getSize();
|
|
|
|
}
|
|
|
|
|
2016-09-08 16:19:13 +08:00
|
|
|
template <class ELFT> uint64_t LinkerScript<ELFT>::getSymbolValue(StringRef S) {
|
|
|
|
if (SymbolBody *B = Symtab<ELFT>::X->find(S))
|
|
|
|
return B->getVA<ELFT>();
|
|
|
|
error("symbol not found: " + S);
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2016-07-19 17:25:43 +08:00
|
|
|
// Returns indices of ELF headers containing specific section, identified
|
|
|
|
// by Name. Each index is a zero based number of ELF header listed within
|
|
|
|
// PHDRS {} script block.
|
|
|
|
template <class ELFT>
|
2016-07-25 07:47:31 +08:00
|
|
|
std::vector<size_t> LinkerScript<ELFT>::getPhdrIndices(StringRef SectionName) {
|
2016-07-21 14:43:01 +08:00
|
|
|
for (const std::unique_ptr<BaseCommand> &Base : Opt.Commands) {
|
|
|
|
auto *Cmd = dyn_cast<OutputSectionCommand>(Base.get());
|
2016-07-25 07:47:31 +08:00
|
|
|
if (!Cmd || Cmd->Name != SectionName)
|
2016-07-21 00:43:03 +08:00
|
|
|
continue;
|
|
|
|
|
2016-07-26 08:27:36 +08:00
|
|
|
std::vector<size_t> Ret;
|
|
|
|
for (StringRef PhdrName : Cmd->Phdrs)
|
|
|
|
Ret.push_back(getPhdrIndex(PhdrName));
|
|
|
|
return Ret;
|
2016-07-19 17:25:43 +08:00
|
|
|
}
|
2016-07-21 00:43:03 +08:00
|
|
|
return {};
|
2016-07-19 17:25:43 +08:00
|
|
|
}
|
|
|
|
|
2016-07-26 08:27:36 +08:00
|
|
|
template <class ELFT>
|
|
|
|
size_t LinkerScript<ELFT>::getPhdrIndex(StringRef PhdrName) {
|
|
|
|
size_t I = 0;
|
|
|
|
for (PhdrsCommand &Cmd : Opt.PhdrsCommands) {
|
|
|
|
if (Cmd.Name == PhdrName)
|
|
|
|
return I;
|
|
|
|
++I;
|
|
|
|
}
|
|
|
|
error("section header '" + PhdrName + "' is not listed in PHDRS");
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2016-04-21 04:13:41 +08:00
|
|
|
class elf::ScriptParser : public ScriptParserBase {
|
2016-02-24 17:21:47 +08:00
|
|
|
typedef void (ScriptParser::*Handler)();
|
|
|
|
|
2015-10-01 01:23:26 +08:00
|
|
|
public:
|
2016-04-21 04:13:41 +08:00
|
|
|
ScriptParser(StringRef S, bool B) : ScriptParserBase(S), IsUnderSysroot(B) {}
|
2016-02-19 18:45:45 +08:00
|
|
|
|
2016-08-31 17:08:26 +08:00
|
|
|
void readLinkerScript();
|
|
|
|
void readVersionScript();
|
2015-10-01 01:23:26 +08:00
|
|
|
|
|
|
|
private:
|
2015-10-11 11:28:42 +08:00
|
|
|
void addFile(StringRef Path);
|
|
|
|
|
2015-10-01 01:23:26 +08:00
|
|
|
void readAsNeeded();
|
2015-10-08 14:48:38 +08:00
|
|
|
void readEntry();
|
2015-10-20 01:35:12 +08:00
|
|
|
void readExtern();
|
2015-10-01 01:23:26 +08:00
|
|
|
void readGroup();
|
2015-10-11 09:31:55 +08:00
|
|
|
void readInclude();
|
2015-10-07 08:25:09 +08:00
|
|
|
void readOutput();
|
2015-10-13 05:50:08 +08:00
|
|
|
void readOutputArch();
|
2015-10-01 01:23:26 +08:00
|
|
|
void readOutputFormat();
|
2016-07-19 17:25:43 +08:00
|
|
|
void readPhdrs();
|
2015-10-09 01:51:41 +08:00
|
|
|
void readSearchDir();
|
2015-11-12 17:52:08 +08:00
|
|
|
void readSections();
|
2016-09-01 04:03:54 +08:00
|
|
|
void readVersion();
|
|
|
|
void readVersionScriptCommand();
|
2015-11-12 17:52:08 +08:00
|
|
|
|
2016-07-25 07:05:57 +08:00
|
|
|
SymbolAssignment *readAssignment(StringRef Name);
|
2016-09-06 21:51:57 +08:00
|
|
|
std::vector<uint8_t> readFill();
|
2016-08-04 10:03:27 +08:00
|
|
|
OutputSectionCommand *readOutputSectionDescription(StringRef OutSec);
|
2016-09-06 21:51:57 +08:00
|
|
|
std::vector<uint8_t> readOutputSectionFiller(StringRef Tok);
|
2016-07-19 17:25:43 +08:00
|
|
|
std::vector<StringRef> readOutputSectionPhdrs();
|
2016-08-30 17:46:59 +08:00
|
|
|
InputSectionDescription *readInputSectionDescription(StringRef Tok);
|
2016-09-03 05:17:20 +08:00
|
|
|
Regex readFilePatterns();
|
2016-09-17 01:42:10 +08:00
|
|
|
void readSectionExcludes(InputSectionDescription *Cmd);
|
2016-08-30 17:46:59 +08:00
|
|
|
InputSectionDescription *readInputSectionRules(StringRef FilePattern);
|
2016-07-19 17:25:43 +08:00
|
|
|
unsigned readPhdrType();
|
2016-09-17 04:21:55 +08:00
|
|
|
SortSectionPolicy readSortKind();
|
2016-08-16 09:11:16 +08:00
|
|
|
SymbolAssignment *readProvideHidden(bool Provide, bool Hidden);
|
2016-09-07 15:08:43 +08:00
|
|
|
SymbolAssignment *readProvideOrAssignment(StringRef Tok, bool MakeAbsolute);
|
2016-07-28 15:18:23 +08:00
|
|
|
void readSort();
|
2016-08-04 17:29:31 +08:00
|
|
|
Expr readAssert();
|
Make readExpr return an Expr object instead of a vector of tokens.
Previously, we handled an expression as a vector of tokens. In other
words, an expression was a vector of uncooked raw StringRefs.
When we need a value of an expression, we used ExprParser to run
the expression.
The separation was needed essentially because parse time is too
early to evaluate an expression. In order to evaluate an expression,
we need to finalize section sizes. Because linker script parsing
is done at very early stage of the linking process, we can't
evaluate expressions while parsing.
The above mechanism worked fairly well, but there were a few
drawbacks.
One thing is that we sometimes have to parse the same expression
more than once in order to find the end of the expression.
In some contexts, linker script expressions have no clear end marker.
So, we needed to recognize balanced expressions and ternary operators.
The other is poor error reporting. Since expressions are parsed
basically twice, and some information that is available at the first
stage is lost in the second stage, it was hard to print out
apprpriate error messages.
This patch fixes the issues with a new approach.
Now the expression parsing is integrated into ScriptParser.
ExprParser class is removed. Expressions are represented as lambdas
instead of vectors of tokens. Lambdas captures information they
need to run themselves when they are created.
In this way, ends of expressions are naturally detected, and
errors are handled in the usual way. This patch also reduces
the amount of code.
Differential Revision: https://reviews.llvm.org/D22728
llvm-svn: 276574
2016-07-25 02:19:40 +08:00
|
|
|
|
|
|
|
Expr readExpr();
|
|
|
|
Expr readExpr1(Expr Lhs, int MinPrec);
|
|
|
|
Expr readPrimary();
|
|
|
|
Expr readTernary(Expr Cond);
|
2016-08-18 02:59:16 +08:00
|
|
|
Expr readParenExpr();
|
2015-10-01 01:23:26 +08:00
|
|
|
|
2016-08-31 17:08:26 +08:00
|
|
|
// For parsing version script.
|
|
|
|
void readExtern(std::vector<SymbolVersion> *Globals);
|
2016-09-01 04:03:54 +08:00
|
|
|
void readVersionDeclaration(StringRef VerStr);
|
2016-08-31 17:08:26 +08:00
|
|
|
void readGlobal(StringRef VerStr);
|
|
|
|
void readLocal();
|
|
|
|
|
2016-04-21 04:13:41 +08:00
|
|
|
ScriptConfiguration &Opt = *ScriptConfig;
|
|
|
|
StringSaver Saver = {ScriptConfig->Alloc};
|
2015-11-26 13:53:00 +08:00
|
|
|
bool IsUnderSysroot;
|
2015-10-01 01:23:26 +08:00
|
|
|
};
|
|
|
|
|
2016-08-31 17:08:26 +08:00
|
|
|
void ScriptParser::readVersionScript() {
|
2016-09-01 04:03:54 +08:00
|
|
|
readVersionScriptCommand();
|
|
|
|
if (!atEOF())
|
|
|
|
setError("EOF expected, but got " + next());
|
|
|
|
}
|
|
|
|
|
|
|
|
void ScriptParser::readVersionScriptCommand() {
|
2016-08-31 17:08:26 +08:00
|
|
|
if (skip("{")) {
|
2016-09-01 04:03:54 +08:00
|
|
|
readVersionDeclaration("");
|
2016-08-31 17:08:26 +08:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2016-09-01 04:03:54 +08:00
|
|
|
while (!atEOF() && !Error && peek() != "}") {
|
2016-08-31 17:08:26 +08:00
|
|
|
StringRef VerStr = next();
|
|
|
|
if (VerStr == "{") {
|
2016-09-01 04:03:54 +08:00
|
|
|
setError("anonymous version definition is used in "
|
|
|
|
"combination with other version definitions");
|
2016-08-31 17:08:26 +08:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
expect("{");
|
2016-09-01 04:03:54 +08:00
|
|
|
readVersionDeclaration(VerStr);
|
2016-08-31 17:08:26 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-09-01 04:03:54 +08:00
|
|
|
void ScriptParser::readVersion() {
|
|
|
|
expect("{");
|
|
|
|
readVersionScriptCommand();
|
|
|
|
expect("}");
|
|
|
|
}
|
|
|
|
|
2016-08-31 17:08:26 +08:00
|
|
|
void ScriptParser::readLinkerScript() {
|
2015-10-01 01:23:26 +08:00
|
|
|
while (!atEOF()) {
|
|
|
|
StringRef Tok = next();
|
2016-09-03 02:52:41 +08:00
|
|
|
if (Tok == ";")
|
|
|
|
continue;
|
|
|
|
|
2016-09-16 23:30:47 +08:00
|
|
|
if (Tok == "ASSERT") {
|
|
|
|
Opt.Commands.emplace_back(new AssertCommand(readAssert()));
|
|
|
|
} else if (Tok == "ENTRY") {
|
2016-09-03 02:52:41 +08:00
|
|
|
readEntry();
|
|
|
|
} else if (Tok == "EXTERN") {
|
|
|
|
readExtern();
|
|
|
|
} else if (Tok == "GROUP" || Tok == "INPUT") {
|
|
|
|
readGroup();
|
|
|
|
} else if (Tok == "INCLUDE") {
|
|
|
|
readInclude();
|
|
|
|
} else if (Tok == "OUTPUT") {
|
|
|
|
readOutput();
|
|
|
|
} else if (Tok == "OUTPUT_ARCH") {
|
|
|
|
readOutputArch();
|
|
|
|
} else if (Tok == "OUTPUT_FORMAT") {
|
|
|
|
readOutputFormat();
|
|
|
|
} else if (Tok == "PHDRS") {
|
|
|
|
readPhdrs();
|
|
|
|
} else if (Tok == "SEARCH_DIR") {
|
|
|
|
readSearchDir();
|
|
|
|
} else if (Tok == "SECTIONS") {
|
|
|
|
readSections();
|
|
|
|
} else if (Tok == "VERSION") {
|
|
|
|
readVersion();
|
2016-09-07 15:08:43 +08:00
|
|
|
} else if (SymbolAssignment *Cmd = readProvideOrAssignment(Tok, true)) {
|
2016-09-16 23:30:47 +08:00
|
|
|
Opt.Commands.emplace_back(Cmd);
|
2016-08-31 23:31:17 +08:00
|
|
|
} else {
|
2016-03-11 22:43:02 +08:00
|
|
|
setError("unknown directive: " + Tok);
|
2016-08-31 23:31:17 +08:00
|
|
|
}
|
2015-10-01 01:23:26 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-02-12 05:17:59 +08:00
|
|
|
void ScriptParser::addFile(StringRef S) {
|
2015-11-26 13:53:00 +08:00
|
|
|
if (IsUnderSysroot && S.startswith("/")) {
|
|
|
|
SmallString<128> Path;
|
|
|
|
(Config->Sysroot + S).toStringRef(Path);
|
|
|
|
if (sys::fs::exists(Path)) {
|
|
|
|
Driver->addFile(Saver.save(Path.str()));
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2015-10-13 08:09:21 +08:00
|
|
|
if (sys::path::is_absolute(S)) {
|
2015-10-11 11:28:42 +08:00
|
|
|
Driver->addFile(S);
|
|
|
|
} else if (S.startswith("=")) {
|
|
|
|
if (Config->Sysroot.empty())
|
|
|
|
Driver->addFile(S.substr(1));
|
|
|
|
else
|
|
|
|
Driver->addFile(Saver.save(Config->Sysroot + "/" + S.substr(1)));
|
|
|
|
} else if (S.startswith("-l")) {
|
2016-02-03 05:13:09 +08:00
|
|
|
Driver->addLibrary(S.substr(2));
|
2015-11-27 04:23:46 +08:00
|
|
|
} else if (sys::fs::exists(S)) {
|
|
|
|
Driver->addFile(S);
|
2015-10-11 11:28:42 +08:00
|
|
|
} else {
|
|
|
|
std::string Path = findFromSearchPaths(S);
|
|
|
|
if (Path.empty())
|
2016-03-12 16:31:34 +08:00
|
|
|
setError("unable to find " + S);
|
2016-02-03 04:27:59 +08:00
|
|
|
else
|
|
|
|
Driver->addFile(Saver.save(Path));
|
2015-10-11 11:28:42 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-02-12 05:17:59 +08:00
|
|
|
void ScriptParser::readAsNeeded() {
|
2015-10-01 01:23:26 +08:00
|
|
|
expect("(");
|
2015-10-12 04:59:12 +08:00
|
|
|
bool Orig = Config->AsNeeded;
|
|
|
|
Config->AsNeeded = true;
|
2016-08-05 09:25:45 +08:00
|
|
|
while (!Error && !skip(")"))
|
2016-09-09 22:35:36 +08:00
|
|
|
addFile(unquote(next()));
|
2015-10-12 04:59:12 +08:00
|
|
|
Config->AsNeeded = Orig;
|
2015-10-01 01:23:26 +08:00
|
|
|
}
|
|
|
|
|
2016-02-12 05:17:59 +08:00
|
|
|
void ScriptParser::readEntry() {
|
2015-10-08 14:48:38 +08:00
|
|
|
// -e <symbol> takes predecence over ENTRY(<symbol>).
|
|
|
|
expect("(");
|
|
|
|
StringRef Tok = next();
|
|
|
|
if (Config->Entry.empty())
|
|
|
|
Config->Entry = Tok;
|
|
|
|
expect(")");
|
|
|
|
}
|
|
|
|
|
2016-02-12 05:17:59 +08:00
|
|
|
void ScriptParser::readExtern() {
|
2015-10-20 01:35:12 +08:00
|
|
|
expect("(");
|
2016-08-05 09:25:45 +08:00
|
|
|
while (!Error && !skip(")"))
|
|
|
|
Config->Undefined.push_back(next());
|
2015-10-20 01:35:12 +08:00
|
|
|
}
|
|
|
|
|
2016-02-12 05:17:59 +08:00
|
|
|
void ScriptParser::readGroup() {
|
2015-10-01 01:23:26 +08:00
|
|
|
expect("(");
|
2016-08-05 09:25:45 +08:00
|
|
|
while (!Error && !skip(")")) {
|
2015-10-01 01:23:26 +08:00
|
|
|
StringRef Tok = next();
|
2016-08-05 09:25:45 +08:00
|
|
|
if (Tok == "AS_NEEDED")
|
2015-10-01 01:23:26 +08:00
|
|
|
readAsNeeded();
|
2016-08-05 09:25:45 +08:00
|
|
|
else
|
2016-09-09 22:35:36 +08:00
|
|
|
addFile(unquote(Tok));
|
2015-10-01 01:23:26 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-02-12 05:17:59 +08:00
|
|
|
void ScriptParser::readInclude() {
|
2015-10-11 09:31:55 +08:00
|
|
|
StringRef Tok = next();
|
2016-09-09 22:35:36 +08:00
|
|
|
auto MBOrErr = MemoryBuffer::getFile(unquote(Tok));
|
2016-02-03 04:27:59 +08:00
|
|
|
if (!MBOrErr) {
|
2016-03-11 22:43:02 +08:00
|
|
|
setError("cannot open " + Tok);
|
2016-02-03 04:27:59 +08:00
|
|
|
return;
|
|
|
|
}
|
2015-10-11 09:31:55 +08:00
|
|
|
std::unique_ptr<MemoryBuffer> &MB = *MBOrErr;
|
2015-10-11 09:53:04 +08:00
|
|
|
StringRef S = Saver.save(MB->getMemBufferRef().getBuffer());
|
|
|
|
std::vector<StringRef> V = tokenize(S);
|
2015-10-11 09:31:55 +08:00
|
|
|
Tokens.insert(Tokens.begin() + Pos, V.begin(), V.end());
|
|
|
|
}
|
|
|
|
|
2016-02-12 05:17:59 +08:00
|
|
|
void ScriptParser::readOutput() {
|
2015-10-07 08:25:09 +08:00
|
|
|
// -o <file> takes predecence over OUTPUT(<file>).
|
|
|
|
expect("(");
|
|
|
|
StringRef Tok = next();
|
|
|
|
if (Config->OutputFile.empty())
|
2016-09-09 22:35:36 +08:00
|
|
|
Config->OutputFile = unquote(Tok);
|
2015-10-07 08:25:09 +08:00
|
|
|
expect(")");
|
|
|
|
}
|
|
|
|
|
2016-02-12 05:17:59 +08:00
|
|
|
void ScriptParser::readOutputArch() {
|
2015-10-13 05:50:08 +08:00
|
|
|
// Error checking only for now.
|
|
|
|
expect("(");
|
|
|
|
next();
|
|
|
|
expect(")");
|
|
|
|
}
|
|
|
|
|
2016-02-12 05:17:59 +08:00
|
|
|
void ScriptParser::readOutputFormat() {
|
2015-10-01 01:23:26 +08:00
|
|
|
// Error checking only for now.
|
|
|
|
expect("(");
|
|
|
|
next();
|
2015-10-13 05:08:41 +08:00
|
|
|
StringRef Tok = next();
|
|
|
|
if (Tok == ")")
|
2016-09-08 16:20:30 +08:00
|
|
|
return;
|
2016-02-03 04:27:59 +08:00
|
|
|
if (Tok != ",") {
|
2016-03-11 22:43:02 +08:00
|
|
|
setError("unexpected token: " + Tok);
|
2016-02-03 04:27:59 +08:00
|
|
|
return;
|
|
|
|
}
|
2015-10-13 05:08:41 +08:00
|
|
|
next();
|
|
|
|
expect(",");
|
|
|
|
next();
|
2015-10-01 01:23:26 +08:00
|
|
|
expect(")");
|
|
|
|
}
|
|
|
|
|
2016-07-19 17:25:43 +08:00
|
|
|
void ScriptParser::readPhdrs() {
|
|
|
|
expect("{");
|
|
|
|
while (!Error && !skip("}")) {
|
|
|
|
StringRef Tok = next();
|
2016-09-09 17:46:16 +08:00
|
|
|
Opt.PhdrsCommands.push_back(
|
|
|
|
{Tok, PT_NULL, false, false, UINT_MAX, nullptr});
|
2016-07-19 17:25:43 +08:00
|
|
|
PhdrsCommand &PhdrCmd = Opt.PhdrsCommands.back();
|
|
|
|
|
|
|
|
PhdrCmd.Type = readPhdrType();
|
|
|
|
do {
|
|
|
|
Tok = next();
|
|
|
|
if (Tok == ";")
|
|
|
|
break;
|
|
|
|
if (Tok == "FILEHDR")
|
|
|
|
PhdrCmd.HasFilehdr = true;
|
|
|
|
else if (Tok == "PHDRS")
|
|
|
|
PhdrCmd.HasPhdrs = true;
|
2016-09-09 17:46:16 +08:00
|
|
|
else if (Tok == "AT")
|
|
|
|
PhdrCmd.LMAExpr = readParenExpr();
|
2016-07-21 18:43:25 +08:00
|
|
|
else if (Tok == "FLAGS") {
|
|
|
|
expect("(");
|
2016-08-03 06:14:57 +08:00
|
|
|
// Passing 0 for the value of dot is a bit of a hack. It means that
|
|
|
|
// we accept expressions like ".|1".
|
|
|
|
PhdrCmd.Flags = readExpr()(0);
|
2016-07-21 18:43:25 +08:00
|
|
|
expect(")");
|
|
|
|
} else
|
2016-07-19 17:25:43 +08:00
|
|
|
setError("unexpected header attribute: " + Tok);
|
|
|
|
} while (!Error);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-02-12 05:17:59 +08:00
|
|
|
void ScriptParser::readSearchDir() {
|
2015-10-09 01:51:41 +08:00
|
|
|
expect("(");
|
2016-09-09 07:26:54 +08:00
|
|
|
StringRef Tok = next();
|
2016-09-03 03:20:33 +08:00
|
|
|
if (!Config->Nostdlib)
|
2016-09-09 22:35:36 +08:00
|
|
|
Config->SearchPaths.push_back(unquote(Tok));
|
2015-10-09 01:51:41 +08:00
|
|
|
expect(")");
|
|
|
|
}
|
|
|
|
|
2016-02-12 05:17:59 +08:00
|
|
|
void ScriptParser::readSections() {
|
2016-09-14 16:32:36 +08:00
|
|
|
Opt.HasSections = true;
|
2015-11-12 17:52:08 +08:00
|
|
|
expect("{");
|
2016-04-16 18:10:32 +08:00
|
|
|
while (!Error && !skip("}")) {
|
2016-07-25 07:05:57 +08:00
|
|
|
StringRef Tok = next();
|
2016-09-07 15:08:43 +08:00
|
|
|
BaseCommand *Cmd = readProvideOrAssignment(Tok, true);
|
2016-08-11 15:56:43 +08:00
|
|
|
if (!Cmd) {
|
|
|
|
if (Tok == "ASSERT")
|
|
|
|
Cmd = new AssertCommand(readAssert());
|
|
|
|
else
|
|
|
|
Cmd = readOutputSectionDescription(Tok);
|
Make readExpr return an Expr object instead of a vector of tokens.
Previously, we handled an expression as a vector of tokens. In other
words, an expression was a vector of uncooked raw StringRefs.
When we need a value of an expression, we used ExprParser to run
the expression.
The separation was needed essentially because parse time is too
early to evaluate an expression. In order to evaluate an expression,
we need to finalize section sizes. Because linker script parsing
is done at very early stage of the linking process, we can't
evaluate expressions while parsing.
The above mechanism worked fairly well, but there were a few
drawbacks.
One thing is that we sometimes have to parse the same expression
more than once in order to find the end of the expression.
In some contexts, linker script expressions have no clear end marker.
So, we needed to recognize balanced expressions and ternary operators.
The other is poor error reporting. Since expressions are parsed
basically twice, and some information that is available at the first
stage is lost in the second stage, it was hard to print out
apprpriate error messages.
This patch fixes the issues with a new approach.
Now the expression parsing is integrated into ScriptParser.
ExprParser class is removed. Expressions are represented as lambdas
instead of vectors of tokens. Lambdas captures information they
need to run themselves when they are created.
In this way, ends of expressions are naturally detected, and
errors are handled in the usual way. This patch also reduces
the amount of code.
Differential Revision: https://reviews.llvm.org/D22728
llvm-svn: 276574
2016-07-25 02:19:40 +08:00
|
|
|
}
|
2016-08-04 10:03:27 +08:00
|
|
|
Opt.Commands.emplace_back(Cmd);
|
2016-04-16 18:10:32 +08:00
|
|
|
}
|
2015-11-12 17:52:08 +08:00
|
|
|
}
|
|
|
|
|
Make readExpr return an Expr object instead of a vector of tokens.
Previously, we handled an expression as a vector of tokens. In other
words, an expression was a vector of uncooked raw StringRefs.
When we need a value of an expression, we used ExprParser to run
the expression.
The separation was needed essentially because parse time is too
early to evaluate an expression. In order to evaluate an expression,
we need to finalize section sizes. Because linker script parsing
is done at very early stage of the linking process, we can't
evaluate expressions while parsing.
The above mechanism worked fairly well, but there were a few
drawbacks.
One thing is that we sometimes have to parse the same expression
more than once in order to find the end of the expression.
In some contexts, linker script expressions have no clear end marker.
So, we needed to recognize balanced expressions and ternary operators.
The other is poor error reporting. Since expressions are parsed
basically twice, and some information that is available at the first
stage is lost in the second stage, it was hard to print out
apprpriate error messages.
This patch fixes the issues with a new approach.
Now the expression parsing is integrated into ScriptParser.
ExprParser class is removed. Expressions are represented as lambdas
instead of vectors of tokens. Lambdas captures information they
need to run themselves when they are created.
In this way, ends of expressions are naturally detected, and
errors are handled in the usual way. This patch also reduces
the amount of code.
Differential Revision: https://reviews.llvm.org/D22728
llvm-svn: 276574
2016-07-25 02:19:40 +08:00
|
|
|
static int precedence(StringRef Op) {
|
|
|
|
return StringSwitch<int>(Op)
|
|
|
|
.Case("*", 4)
|
|
|
|
.Case("/", 4)
|
|
|
|
.Case("+", 3)
|
|
|
|
.Case("-", 3)
|
|
|
|
.Case("<", 2)
|
|
|
|
.Case(">", 2)
|
|
|
|
.Case(">=", 2)
|
|
|
|
.Case("<=", 2)
|
|
|
|
.Case("==", 2)
|
|
|
|
.Case("!=", 2)
|
|
|
|
.Case("&", 1)
|
2016-08-23 05:33:35 +08:00
|
|
|
.Case("|", 1)
|
Make readExpr return an Expr object instead of a vector of tokens.
Previously, we handled an expression as a vector of tokens. In other
words, an expression was a vector of uncooked raw StringRefs.
When we need a value of an expression, we used ExprParser to run
the expression.
The separation was needed essentially because parse time is too
early to evaluate an expression. In order to evaluate an expression,
we need to finalize section sizes. Because linker script parsing
is done at very early stage of the linking process, we can't
evaluate expressions while parsing.
The above mechanism worked fairly well, but there were a few
drawbacks.
One thing is that we sometimes have to parse the same expression
more than once in order to find the end of the expression.
In some contexts, linker script expressions have no clear end marker.
So, we needed to recognize balanced expressions and ternary operators.
The other is poor error reporting. Since expressions are parsed
basically twice, and some information that is available at the first
stage is lost in the second stage, it was hard to print out
apprpriate error messages.
This patch fixes the issues with a new approach.
Now the expression parsing is integrated into ScriptParser.
ExprParser class is removed. Expressions are represented as lambdas
instead of vectors of tokens. Lambdas captures information they
need to run themselves when they are created.
In this way, ends of expressions are naturally detected, and
errors are handled in the usual way. This patch also reduces
the amount of code.
Differential Revision: https://reviews.llvm.org/D22728
llvm-svn: 276574
2016-07-25 02:19:40 +08:00
|
|
|
.Default(-1);
|
|
|
|
}
|
|
|
|
|
2016-09-03 05:17:20 +08:00
|
|
|
Regex ScriptParser::readFilePatterns() {
|
2016-08-04 10:03:27 +08:00
|
|
|
std::vector<StringRef> V;
|
|
|
|
while (!Error && !skip(")"))
|
|
|
|
V.push_back(next());
|
2016-09-03 05:17:20 +08:00
|
|
|
return compileGlobPatterns(V);
|
2016-07-29 23:32:46 +08:00
|
|
|
}
|
|
|
|
|
2016-09-17 04:21:55 +08:00
|
|
|
SortSectionPolicy ScriptParser::readSortKind() {
|
2016-08-05 06:27:00 +08:00
|
|
|
if (skip("SORT") || skip("SORT_BY_NAME"))
|
2016-09-17 04:21:55 +08:00
|
|
|
return SortSectionPolicy::Name;
|
2016-08-05 06:27:00 +08:00
|
|
|
if (skip("SORT_BY_ALIGNMENT"))
|
2016-09-17 04:21:55 +08:00
|
|
|
return SortSectionPolicy::Alignment;
|
2016-09-16 03:15:12 +08:00
|
|
|
if (skip("SORT_BY_INIT_PRIORITY"))
|
2016-09-17 04:21:55 +08:00
|
|
|
return SortSectionPolicy::Priority;
|
|
|
|
if (skip("SORT_NONE"))
|
2016-09-17 05:14:55 +08:00
|
|
|
return SortSectionPolicy::None;
|
|
|
|
return SortSectionPolicy::Default;
|
2016-09-17 04:21:55 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static void selectSortKind(InputSectionDescription *Cmd) {
|
2016-09-17 05:14:55 +08:00
|
|
|
if (Cmd->SortOuter == SortSectionPolicy::None) {
|
|
|
|
Cmd->SortOuter = SortSectionPolicy::Default;
|
2016-09-17 04:21:55 +08:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2016-09-17 05:14:55 +08:00
|
|
|
if (Cmd->SortOuter != SortSectionPolicy::Default) {
|
2016-09-17 04:21:55 +08:00
|
|
|
// If the section sorting command in linker script is nested, the command
|
|
|
|
// line option will be ignored.
|
2016-09-17 05:14:55 +08:00
|
|
|
if (Cmd->SortInner != SortSectionPolicy::Default)
|
2016-09-17 04:21:55 +08:00
|
|
|
return;
|
|
|
|
// If the section sorting command in linker script isn't nested, the
|
|
|
|
// command line option will make the section sorting command to be treated
|
|
|
|
// as nested sorting command.
|
|
|
|
Cmd->SortInner = Config->SortSection;
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
// If sorting rule not specified, use command line option.
|
|
|
|
Cmd->SortOuter = Config->SortSection;
|
2016-08-05 06:27:00 +08:00
|
|
|
}
|
|
|
|
|
2016-09-17 01:42:10 +08:00
|
|
|
// Method reads a list of sequence of excluded files and section globs given in
|
|
|
|
// a following form: ((EXCLUDE_FILE(file_pattern+))? section_pattern+)+
|
|
|
|
// Example: *(.foo.1 EXCLUDE_FILE (*a.o) .foo.2 EXCLUDE_FILE (*b.o) .foo.3)
|
|
|
|
void ScriptParser::readSectionExcludes(InputSectionDescription *Cmd) {
|
2016-09-17 10:10:15 +08:00
|
|
|
Regex ExcludeFileRe;
|
2016-09-17 01:42:10 +08:00
|
|
|
std::vector<StringRef> V;
|
|
|
|
|
|
|
|
while (!Error) {
|
|
|
|
if (skip(")")) {
|
|
|
|
Cmd->SectionsVec.push_back(
|
|
|
|
{std::move(ExcludeFileRe), compileGlobPatterns(V)});
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (skip("EXCLUDE_FILE")) {
|
|
|
|
if (!V.empty()) {
|
|
|
|
Cmd->SectionsVec.push_back(
|
|
|
|
{std::move(ExcludeFileRe), compileGlobPatterns(V)});
|
|
|
|
V.clear();
|
|
|
|
}
|
|
|
|
|
|
|
|
expect("(");
|
|
|
|
ExcludeFileRe = readFilePatterns();
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
V.push_back(next());
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-08-30 17:46:59 +08:00
|
|
|
InputSectionDescription *
|
|
|
|
ScriptParser::readInputSectionRules(StringRef FilePattern) {
|
2016-09-03 05:17:20 +08:00
|
|
|
auto *Cmd = new InputSectionDescription(FilePattern);
|
2016-07-26 05:47:13 +08:00
|
|
|
expect("(");
|
2016-07-27 09:44:01 +08:00
|
|
|
|
2016-08-05 06:27:00 +08:00
|
|
|
// Read SORT().
|
2016-09-17 04:21:55 +08:00
|
|
|
SortSectionPolicy K1 = readSortKind();
|
2016-09-17 05:14:55 +08:00
|
|
|
if (K1 != SortSectionPolicy::Default) {
|
2016-08-05 06:27:00 +08:00
|
|
|
Cmd->SortOuter = K1;
|
2016-07-29 23:32:46 +08:00
|
|
|
expect("(");
|
2016-09-17 04:21:55 +08:00
|
|
|
SortSectionPolicy K2 = readSortKind();
|
2016-09-17 05:14:55 +08:00
|
|
|
if (K2 != SortSectionPolicy::Default) {
|
2016-08-05 06:27:00 +08:00
|
|
|
Cmd->SortInner = K2;
|
2016-08-03 16:35:59 +08:00
|
|
|
expect("(");
|
2016-09-17 10:10:15 +08:00
|
|
|
Cmd->SectionsVec.push_back({Regex(), readFilePatterns()});
|
2016-08-03 16:35:59 +08:00
|
|
|
expect(")");
|
|
|
|
} else {
|
2016-09-17 10:10:15 +08:00
|
|
|
Cmd->SectionsVec.push_back({Regex(), readFilePatterns()});
|
2016-08-03 16:35:59 +08:00
|
|
|
}
|
2016-07-29 23:32:46 +08:00
|
|
|
expect(")");
|
2016-09-17 04:21:55 +08:00
|
|
|
selectSortKind(Cmd);
|
2016-08-04 10:03:27 +08:00
|
|
|
return Cmd;
|
2016-07-29 05:51:30 +08:00
|
|
|
}
|
2016-07-29 23:32:46 +08:00
|
|
|
|
2016-09-17 04:21:55 +08:00
|
|
|
selectSortKind(Cmd);
|
2016-09-17 01:42:10 +08:00
|
|
|
readSectionExcludes(Cmd);
|
2016-08-04 10:03:27 +08:00
|
|
|
return Cmd;
|
2016-07-29 05:51:30 +08:00
|
|
|
}
|
|
|
|
|
2016-08-30 17:46:59 +08:00
|
|
|
InputSectionDescription *
|
|
|
|
ScriptParser::readInputSectionDescription(StringRef Tok) {
|
2016-07-29 05:51:30 +08:00
|
|
|
// Input section wildcard can be surrounded by KEEP.
|
|
|
|
// https://sourceware.org/binutils/docs/ld/Input-Section-Keep.html#Input-Section-Keep
|
2016-08-30 17:46:59 +08:00
|
|
|
if (Tok == "KEEP") {
|
2016-07-29 05:51:30 +08:00
|
|
|
expect("(");
|
2016-08-30 17:46:59 +08:00
|
|
|
StringRef FilePattern = next();
|
|
|
|
InputSectionDescription *Cmd = readInputSectionRules(FilePattern);
|
2016-07-27 09:44:01 +08:00
|
|
|
expect(")");
|
2016-09-17 10:10:15 +08:00
|
|
|
for (std::pair<Regex, Regex> &Regex : Cmd->SectionsVec)
|
2016-09-17 01:42:10 +08:00
|
|
|
Opt.KeptSections.push_back(&Regex.second);
|
2016-08-04 10:03:27 +08:00
|
|
|
return Cmd;
|
2016-07-26 05:47:13 +08:00
|
|
|
}
|
2016-08-30 17:46:59 +08:00
|
|
|
return readInputSectionRules(Tok);
|
2016-07-26 05:47:13 +08:00
|
|
|
}
|
|
|
|
|
2016-07-28 15:18:23 +08:00
|
|
|
void ScriptParser::readSort() {
|
|
|
|
expect("(");
|
|
|
|
expect("CONSTRUCTORS");
|
|
|
|
expect(")");
|
|
|
|
}
|
|
|
|
|
2016-08-04 17:29:31 +08:00
|
|
|
Expr ScriptParser::readAssert() {
|
|
|
|
expect("(");
|
|
|
|
Expr E = readExpr();
|
|
|
|
expect(",");
|
2016-09-09 22:35:36 +08:00
|
|
|
StringRef Msg = unquote(next());
|
2016-08-04 17:29:31 +08:00
|
|
|
expect(")");
|
|
|
|
return [=](uint64_t Dot) {
|
|
|
|
uint64_t V = E(Dot);
|
|
|
|
if (!V)
|
|
|
|
error(Msg);
|
|
|
|
return V;
|
|
|
|
};
|
|
|
|
}
|
|
|
|
|
2016-09-07 01:46:43 +08:00
|
|
|
// Reads a FILL(expr) command. We handle the FILL command as an
|
|
|
|
// alias for =fillexp section attribute, which is different from
|
|
|
|
// what GNU linkers do.
|
|
|
|
// https://sourceware.org/binutils/docs/ld/Output-Section-Data.html
|
2016-09-06 21:51:57 +08:00
|
|
|
std::vector<uint8_t> ScriptParser::readFill() {
|
|
|
|
expect("(");
|
|
|
|
std::vector<uint8_t> V = readOutputSectionFiller(next());
|
|
|
|
expect(")");
|
|
|
|
expect(";");
|
|
|
|
return V;
|
|
|
|
}
|
|
|
|
|
2016-08-04 10:03:27 +08:00
|
|
|
OutputSectionCommand *
|
|
|
|
ScriptParser::readOutputSectionDescription(StringRef OutSec) {
|
2016-07-21 14:43:01 +08:00
|
|
|
OutputSectionCommand *Cmd = new OutputSectionCommand(OutSec);
|
2016-07-25 16:29:46 +08:00
|
|
|
|
|
|
|
// Read an address expression.
|
|
|
|
// https://sourceware.org/binutils/docs/ld/Output-Section-Address.html#Output-Section-Address
|
|
|
|
if (peek() != ":")
|
|
|
|
Cmd->AddrExpr = readExpr();
|
|
|
|
|
2015-11-12 17:52:08 +08:00
|
|
|
expect(":");
|
2016-07-22 11:36:24 +08:00
|
|
|
|
2016-08-17 15:44:19 +08:00
|
|
|
if (skip("AT"))
|
2016-08-18 02:59:16 +08:00
|
|
|
Cmd->LmaExpr = readParenExpr();
|
2016-07-27 02:06:29 +08:00
|
|
|
if (skip("ALIGN"))
|
2016-08-18 02:59:16 +08:00
|
|
|
Cmd->AlignExpr = readParenExpr();
|
2016-08-19 23:18:23 +08:00
|
|
|
if (skip("SUBALIGN"))
|
|
|
|
Cmd->SubalignExpr = readParenExpr();
|
2016-07-27 02:06:29 +08:00
|
|
|
|
2016-07-22 11:36:24 +08:00
|
|
|
// Parse constraints.
|
|
|
|
if (skip("ONLY_IF_RO"))
|
2016-07-26 06:00:10 +08:00
|
|
|
Cmd->Constraint = ConstraintKind::ReadOnly;
|
2016-07-22 11:36:24 +08:00
|
|
|
if (skip("ONLY_IF_RW"))
|
2016-07-26 06:00:10 +08:00
|
|
|
Cmd->Constraint = ConstraintKind::ReadWrite;
|
2015-11-12 17:52:08 +08:00
|
|
|
expect("{");
|
2016-04-22 06:00:51 +08:00
|
|
|
|
2016-02-03 04:27:59 +08:00
|
|
|
while (!Error && !skip("}")) {
|
2016-08-11 15:56:43 +08:00
|
|
|
StringRef Tok = next();
|
2016-09-07 15:08:43 +08:00
|
|
|
if (SymbolAssignment *Assignment = readProvideOrAssignment(Tok, false))
|
2016-08-11 15:56:43 +08:00
|
|
|
Cmd->Commands.emplace_back(Assignment);
|
2016-09-06 21:51:57 +08:00
|
|
|
else if (Tok == "FILL")
|
|
|
|
Cmd->Filler = readFill();
|
2016-08-11 15:56:43 +08:00
|
|
|
else if (Tok == "SORT")
|
2016-07-28 15:18:23 +08:00
|
|
|
readSort();
|
2016-08-30 17:46:59 +08:00
|
|
|
else if (peek() == "(")
|
|
|
|
Cmd->Commands.emplace_back(readInputSectionDescription(Tok));
|
2016-08-11 15:56:43 +08:00
|
|
|
else
|
|
|
|
setError("unknown command " + Tok);
|
2015-11-12 17:52:08 +08:00
|
|
|
}
|
2016-07-21 14:43:01 +08:00
|
|
|
Cmd->Phdrs = readOutputSectionPhdrs();
|
2016-09-06 21:51:57 +08:00
|
|
|
if (peek().startswith("="))
|
|
|
|
Cmd->Filler = readOutputSectionFiller(next().drop_front());
|
2016-08-04 10:03:27 +08:00
|
|
|
return Cmd;
|
2016-07-29 14:14:07 +08:00
|
|
|
}
|
2016-04-22 06:00:51 +08:00
|
|
|
|
2016-08-30 06:01:21 +08:00
|
|
|
// Read "=<number>" where <number> is an octal/decimal/hexadecimal number.
|
|
|
|
// https://sourceware.org/binutils/docs/ld/Output-Section-Fill.html
|
|
|
|
//
|
|
|
|
// ld.gold is not fully compatible with ld.bfd. ld.bfd handles
|
|
|
|
// hexstrings as blobs of arbitrary sizes, while ld.gold handles them
|
|
|
|
// as 32-bit big-endian values. We will do the same as ld.gold does
|
|
|
|
// because it's simpler than what ld.bfd does.
|
2016-09-06 21:51:57 +08:00
|
|
|
std::vector<uint8_t> ScriptParser::readOutputSectionFiller(StringRef Tok) {
|
2016-08-04 07:25:15 +08:00
|
|
|
uint32_t V;
|
2016-09-06 21:51:57 +08:00
|
|
|
if (Tok.getAsInteger(0, V)) {
|
2016-08-04 07:25:15 +08:00
|
|
|
setError("invalid filler expression: " + Tok);
|
2016-07-29 14:14:07 +08:00
|
|
|
return {};
|
2016-02-26 22:48:31 +08:00
|
|
|
}
|
2016-08-30 06:01:21 +08:00
|
|
|
return {uint8_t(V >> 24), uint8_t(V >> 16), uint8_t(V >> 8), uint8_t(V)};
|
2015-11-12 17:52:08 +08:00
|
|
|
}
|
|
|
|
|
2016-08-16 09:11:16 +08:00
|
|
|
SymbolAssignment *ScriptParser::readProvideHidden(bool Provide, bool Hidden) {
|
2016-07-22 15:38:40 +08:00
|
|
|
expect("(");
|
2016-07-29 08:29:25 +08:00
|
|
|
SymbolAssignment *Cmd = readAssignment(next());
|
2016-08-16 09:11:16 +08:00
|
|
|
Cmd->Provide = Provide;
|
2016-07-29 08:29:25 +08:00
|
|
|
Cmd->Hidden = Hidden;
|
2016-07-22 15:38:40 +08:00
|
|
|
expect(")");
|
|
|
|
expect(";");
|
2016-08-04 10:03:27 +08:00
|
|
|
return Cmd;
|
2016-07-22 15:38:40 +08:00
|
|
|
}
|
|
|
|
|
2016-09-07 15:08:43 +08:00
|
|
|
SymbolAssignment *ScriptParser::readProvideOrAssignment(StringRef Tok,
|
|
|
|
bool MakeAbsolute) {
|
2016-08-11 15:56:43 +08:00
|
|
|
SymbolAssignment *Cmd = nullptr;
|
|
|
|
if (peek() == "=" || peek() == "+=") {
|
|
|
|
Cmd = readAssignment(Tok);
|
|
|
|
expect(";");
|
|
|
|
} else if (Tok == "PROVIDE") {
|
2016-08-16 09:11:16 +08:00
|
|
|
Cmd = readProvideHidden(true, false);
|
|
|
|
} else if (Tok == "HIDDEN") {
|
|
|
|
Cmd = readProvideHidden(false, true);
|
2016-08-11 15:56:43 +08:00
|
|
|
} else if (Tok == "PROVIDE_HIDDEN") {
|
2016-08-16 09:11:16 +08:00
|
|
|
Cmd = readProvideHidden(true, true);
|
2016-08-11 15:56:43 +08:00
|
|
|
}
|
2016-09-07 15:08:43 +08:00
|
|
|
if (Cmd && MakeAbsolute)
|
|
|
|
Cmd->IsAbsolute = true;
|
2016-08-11 15:56:43 +08:00
|
|
|
return Cmd;
|
|
|
|
}
|
|
|
|
|
2016-07-29 05:08:56 +08:00
|
|
|
static uint64_t getSymbolValue(StringRef S, uint64_t Dot) {
|
|
|
|
if (S == ".")
|
|
|
|
return Dot;
|
2016-09-08 16:19:13 +08:00
|
|
|
return ScriptBase->getSymbolValue(S);
|
2016-08-10 15:59:34 +08:00
|
|
|
}
|
|
|
|
|
2016-07-29 05:08:56 +08:00
|
|
|
SymbolAssignment *ScriptParser::readAssignment(StringRef Name) {
|
|
|
|
StringRef Op = next();
|
2016-09-07 15:08:43 +08:00
|
|
|
bool IsAbsolute = false;
|
|
|
|
Expr E;
|
2016-07-29 05:08:56 +08:00
|
|
|
assert(Op == "=" || Op == "+=");
|
2016-09-07 15:08:43 +08:00
|
|
|
if (skip("ABSOLUTE")) {
|
|
|
|
E = readParenExpr();
|
|
|
|
IsAbsolute = true;
|
|
|
|
} else {
|
|
|
|
E = readExpr();
|
|
|
|
}
|
2016-07-29 05:08:56 +08:00
|
|
|
if (Op == "+=")
|
|
|
|
E = [=](uint64_t Dot) { return getSymbolValue(Name, Dot) + E(Dot); };
|
2016-09-07 15:08:43 +08:00
|
|
|
return new SymbolAssignment(Name, E, IsAbsolute);
|
2016-07-29 05:08:56 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
// This is an operator-precedence parser to parse a linker
|
|
|
|
// script expression.
|
|
|
|
Expr ScriptParser::readExpr() { return readExpr1(readPrimary(), 0); }
|
|
|
|
|
2016-08-05 09:04:59 +08:00
|
|
|
static Expr combine(StringRef Op, Expr L, Expr R) {
|
|
|
|
if (Op == "*")
|
|
|
|
return [=](uint64_t Dot) { return L(Dot) * R(Dot); };
|
|
|
|
if (Op == "/") {
|
|
|
|
return [=](uint64_t Dot) -> uint64_t {
|
|
|
|
uint64_t RHS = R(Dot);
|
|
|
|
if (RHS == 0) {
|
|
|
|
error("division by zero");
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
return L(Dot) / RHS;
|
|
|
|
};
|
|
|
|
}
|
|
|
|
if (Op == "+")
|
|
|
|
return [=](uint64_t Dot) { return L(Dot) + R(Dot); };
|
|
|
|
if (Op == "-")
|
|
|
|
return [=](uint64_t Dot) { return L(Dot) - R(Dot); };
|
|
|
|
if (Op == "<")
|
|
|
|
return [=](uint64_t Dot) { return L(Dot) < R(Dot); };
|
|
|
|
if (Op == ">")
|
|
|
|
return [=](uint64_t Dot) { return L(Dot) > R(Dot); };
|
|
|
|
if (Op == ">=")
|
|
|
|
return [=](uint64_t Dot) { return L(Dot) >= R(Dot); };
|
|
|
|
if (Op == "<=")
|
|
|
|
return [=](uint64_t Dot) { return L(Dot) <= R(Dot); };
|
|
|
|
if (Op == "==")
|
|
|
|
return [=](uint64_t Dot) { return L(Dot) == R(Dot); };
|
|
|
|
if (Op == "!=")
|
|
|
|
return [=](uint64_t Dot) { return L(Dot) != R(Dot); };
|
|
|
|
if (Op == "&")
|
|
|
|
return [=](uint64_t Dot) { return L(Dot) & R(Dot); };
|
2016-08-23 05:33:35 +08:00
|
|
|
if (Op == "|")
|
|
|
|
return [=](uint64_t Dot) { return L(Dot) | R(Dot); };
|
2016-08-05 09:04:59 +08:00
|
|
|
llvm_unreachable("invalid operator");
|
|
|
|
}
|
|
|
|
|
Make readExpr return an Expr object instead of a vector of tokens.
Previously, we handled an expression as a vector of tokens. In other
words, an expression was a vector of uncooked raw StringRefs.
When we need a value of an expression, we used ExprParser to run
the expression.
The separation was needed essentially because parse time is too
early to evaluate an expression. In order to evaluate an expression,
we need to finalize section sizes. Because linker script parsing
is done at very early stage of the linking process, we can't
evaluate expressions while parsing.
The above mechanism worked fairly well, but there were a few
drawbacks.
One thing is that we sometimes have to parse the same expression
more than once in order to find the end of the expression.
In some contexts, linker script expressions have no clear end marker.
So, we needed to recognize balanced expressions and ternary operators.
The other is poor error reporting. Since expressions are parsed
basically twice, and some information that is available at the first
stage is lost in the second stage, it was hard to print out
apprpriate error messages.
This patch fixes the issues with a new approach.
Now the expression parsing is integrated into ScriptParser.
ExprParser class is removed. Expressions are represented as lambdas
instead of vectors of tokens. Lambdas captures information they
need to run themselves when they are created.
In this way, ends of expressions are naturally detected, and
errors are handled in the usual way. This patch also reduces
the amount of code.
Differential Revision: https://reviews.llvm.org/D22728
llvm-svn: 276574
2016-07-25 02:19:40 +08:00
|
|
|
// This is a part of the operator-precedence parser. This function
|
|
|
|
// assumes that the remaining token stream starts with an operator.
|
|
|
|
Expr ScriptParser::readExpr1(Expr Lhs, int MinPrec) {
|
|
|
|
while (!atEOF() && !Error) {
|
|
|
|
// Read an operator and an expression.
|
|
|
|
StringRef Op1 = peek();
|
|
|
|
if (Op1 == "?")
|
|
|
|
return readTernary(Lhs);
|
|
|
|
if (precedence(Op1) < MinPrec)
|
|
|
|
break;
|
|
|
|
next();
|
|
|
|
Expr Rhs = readPrimary();
|
|
|
|
|
|
|
|
// Evaluate the remaining part of the expression first if the
|
|
|
|
// next operator has greater precedence than the previous one.
|
|
|
|
// For example, if we have read "+" and "3", and if the next
|
|
|
|
// operator is "*", then we'll evaluate 3 * ... part first.
|
|
|
|
while (!atEOF()) {
|
|
|
|
StringRef Op2 = peek();
|
|
|
|
if (precedence(Op2) <= precedence(Op1))
|
2016-07-22 15:38:40 +08:00
|
|
|
break;
|
Make readExpr return an Expr object instead of a vector of tokens.
Previously, we handled an expression as a vector of tokens. In other
words, an expression was a vector of uncooked raw StringRefs.
When we need a value of an expression, we used ExprParser to run
the expression.
The separation was needed essentially because parse time is too
early to evaluate an expression. In order to evaluate an expression,
we need to finalize section sizes. Because linker script parsing
is done at very early stage of the linking process, we can't
evaluate expressions while parsing.
The above mechanism worked fairly well, but there were a few
drawbacks.
One thing is that we sometimes have to parse the same expression
more than once in order to find the end of the expression.
In some contexts, linker script expressions have no clear end marker.
So, we needed to recognize balanced expressions and ternary operators.
The other is poor error reporting. Since expressions are parsed
basically twice, and some information that is available at the first
stage is lost in the second stage, it was hard to print out
apprpriate error messages.
This patch fixes the issues with a new approach.
Now the expression parsing is integrated into ScriptParser.
ExprParser class is removed. Expressions are represented as lambdas
instead of vectors of tokens. Lambdas captures information they
need to run themselves when they are created.
In this way, ends of expressions are naturally detected, and
errors are handled in the usual way. This patch also reduces
the amount of code.
Differential Revision: https://reviews.llvm.org/D22728
llvm-svn: 276574
2016-07-25 02:19:40 +08:00
|
|
|
Rhs = readExpr1(Rhs, precedence(Op2));
|
|
|
|
}
|
2016-07-22 15:38:40 +08:00
|
|
|
|
Make readExpr return an Expr object instead of a vector of tokens.
Previously, we handled an expression as a vector of tokens. In other
words, an expression was a vector of uncooked raw StringRefs.
When we need a value of an expression, we used ExprParser to run
the expression.
The separation was needed essentially because parse time is too
early to evaluate an expression. In order to evaluate an expression,
we need to finalize section sizes. Because linker script parsing
is done at very early stage of the linking process, we can't
evaluate expressions while parsing.
The above mechanism worked fairly well, but there were a few
drawbacks.
One thing is that we sometimes have to parse the same expression
more than once in order to find the end of the expression.
In some contexts, linker script expressions have no clear end marker.
So, we needed to recognize balanced expressions and ternary operators.
The other is poor error reporting. Since expressions are parsed
basically twice, and some information that is available at the first
stage is lost in the second stage, it was hard to print out
apprpriate error messages.
This patch fixes the issues with a new approach.
Now the expression parsing is integrated into ScriptParser.
ExprParser class is removed. Expressions are represented as lambdas
instead of vectors of tokens. Lambdas captures information they
need to run themselves when they are created.
In this way, ends of expressions are naturally detected, and
errors are handled in the usual way. This patch also reduces
the amount of code.
Differential Revision: https://reviews.llvm.org/D22728
llvm-svn: 276574
2016-07-25 02:19:40 +08:00
|
|
|
Lhs = combine(Op1, Lhs, Rhs);
|
2016-07-12 14:39:48 +08:00
|
|
|
}
|
Make readExpr return an Expr object instead of a vector of tokens.
Previously, we handled an expression as a vector of tokens. In other
words, an expression was a vector of uncooked raw StringRefs.
When we need a value of an expression, we used ExprParser to run
the expression.
The separation was needed essentially because parse time is too
early to evaluate an expression. In order to evaluate an expression,
we need to finalize section sizes. Because linker script parsing
is done at very early stage of the linking process, we can't
evaluate expressions while parsing.
The above mechanism worked fairly well, but there were a few
drawbacks.
One thing is that we sometimes have to parse the same expression
more than once in order to find the end of the expression.
In some contexts, linker script expressions have no clear end marker.
So, we needed to recognize balanced expressions and ternary operators.
The other is poor error reporting. Since expressions are parsed
basically twice, and some information that is available at the first
stage is lost in the second stage, it was hard to print out
apprpriate error messages.
This patch fixes the issues with a new approach.
Now the expression parsing is integrated into ScriptParser.
ExprParser class is removed. Expressions are represented as lambdas
instead of vectors of tokens. Lambdas captures information they
need to run themselves when they are created.
In this way, ends of expressions are naturally detected, and
errors are handled in the usual way. This patch also reduces
the amount of code.
Differential Revision: https://reviews.llvm.org/D22728
llvm-svn: 276574
2016-07-25 02:19:40 +08:00
|
|
|
return Lhs;
|
|
|
|
}
|
|
|
|
|
|
|
|
uint64_t static getConstant(StringRef S) {
|
2016-08-17 10:10:51 +08:00
|
|
|
if (S == "COMMONPAGESIZE")
|
Make readExpr return an Expr object instead of a vector of tokens.
Previously, we handled an expression as a vector of tokens. In other
words, an expression was a vector of uncooked raw StringRefs.
When we need a value of an expression, we used ExprParser to run
the expression.
The separation was needed essentially because parse time is too
early to evaluate an expression. In order to evaluate an expression,
we need to finalize section sizes. Because linker script parsing
is done at very early stage of the linking process, we can't
evaluate expressions while parsing.
The above mechanism worked fairly well, but there were a few
drawbacks.
One thing is that we sometimes have to parse the same expression
more than once in order to find the end of the expression.
In some contexts, linker script expressions have no clear end marker.
So, we needed to recognize balanced expressions and ternary operators.
The other is poor error reporting. Since expressions are parsed
basically twice, and some information that is available at the first
stage is lost in the second stage, it was hard to print out
apprpriate error messages.
This patch fixes the issues with a new approach.
Now the expression parsing is integrated into ScriptParser.
ExprParser class is removed. Expressions are represented as lambdas
instead of vectors of tokens. Lambdas captures information they
need to run themselves when they are created.
In this way, ends of expressions are naturally detected, and
errors are handled in the usual way. This patch also reduces
the amount of code.
Differential Revision: https://reviews.llvm.org/D22728
llvm-svn: 276574
2016-07-25 02:19:40 +08:00
|
|
|
return Target->PageSize;
|
2016-08-17 10:10:51 +08:00
|
|
|
if (S == "MAXPAGESIZE")
|
|
|
|
return Target->MaxPageSize;
|
Make readExpr return an Expr object instead of a vector of tokens.
Previously, we handled an expression as a vector of tokens. In other
words, an expression was a vector of uncooked raw StringRefs.
When we need a value of an expression, we used ExprParser to run
the expression.
The separation was needed essentially because parse time is too
early to evaluate an expression. In order to evaluate an expression,
we need to finalize section sizes. Because linker script parsing
is done at very early stage of the linking process, we can't
evaluate expressions while parsing.
The above mechanism worked fairly well, but there were a few
drawbacks.
One thing is that we sometimes have to parse the same expression
more than once in order to find the end of the expression.
In some contexts, linker script expressions have no clear end marker.
So, we needed to recognize balanced expressions and ternary operators.
The other is poor error reporting. Since expressions are parsed
basically twice, and some information that is available at the first
stage is lost in the second stage, it was hard to print out
apprpriate error messages.
This patch fixes the issues with a new approach.
Now the expression parsing is integrated into ScriptParser.
ExprParser class is removed. Expressions are represented as lambdas
instead of vectors of tokens. Lambdas captures information they
need to run themselves when they are created.
In this way, ends of expressions are naturally detected, and
errors are handled in the usual way. This patch also reduces
the amount of code.
Differential Revision: https://reviews.llvm.org/D22728
llvm-svn: 276574
2016-07-25 02:19:40 +08:00
|
|
|
error("unknown constant: " + S);
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2016-09-03 02:19:00 +08:00
|
|
|
// Parses Tok as an integer. Returns true if successful.
|
|
|
|
// It recognizes hexadecimal (prefixed with "0x" or suffixed with "H")
|
|
|
|
// and decimal numbers. Decimal numbers may have "K" (kilo) or
|
|
|
|
// "M" (mega) prefixes.
|
2016-09-03 00:01:42 +08:00
|
|
|
static bool readInteger(StringRef Tok, uint64_t &Result) {
|
2016-09-03 05:54:35 +08:00
|
|
|
if (Tok.startswith("-")) {
|
|
|
|
if (!readInteger(Tok.substr(1), Result))
|
|
|
|
return false;
|
|
|
|
Result = -Result;
|
|
|
|
return true;
|
|
|
|
}
|
2016-09-03 00:01:42 +08:00
|
|
|
if (Tok.startswith_lower("0x"))
|
|
|
|
return !Tok.substr(2).getAsInteger(16, Result);
|
|
|
|
if (Tok.endswith_lower("H"))
|
|
|
|
return !Tok.drop_back().getAsInteger(16, Result);
|
|
|
|
|
|
|
|
int Suffix = 1;
|
|
|
|
if (Tok.endswith_lower("K")) {
|
|
|
|
Suffix = 1024;
|
|
|
|
Tok = Tok.drop_back();
|
|
|
|
} else if (Tok.endswith_lower("M")) {
|
|
|
|
Suffix = 1024 * 1024;
|
|
|
|
Tok = Tok.drop_back();
|
|
|
|
}
|
|
|
|
if (Tok.getAsInteger(10, Result))
|
|
|
|
return false;
|
|
|
|
Result *= Suffix;
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
Make readExpr return an Expr object instead of a vector of tokens.
Previously, we handled an expression as a vector of tokens. In other
words, an expression was a vector of uncooked raw StringRefs.
When we need a value of an expression, we used ExprParser to run
the expression.
The separation was needed essentially because parse time is too
early to evaluate an expression. In order to evaluate an expression,
we need to finalize section sizes. Because linker script parsing
is done at very early stage of the linking process, we can't
evaluate expressions while parsing.
The above mechanism worked fairly well, but there were a few
drawbacks.
One thing is that we sometimes have to parse the same expression
more than once in order to find the end of the expression.
In some contexts, linker script expressions have no clear end marker.
So, we needed to recognize balanced expressions and ternary operators.
The other is poor error reporting. Since expressions are parsed
basically twice, and some information that is available at the first
stage is lost in the second stage, it was hard to print out
apprpriate error messages.
This patch fixes the issues with a new approach.
Now the expression parsing is integrated into ScriptParser.
ExprParser class is removed. Expressions are represented as lambdas
instead of vectors of tokens. Lambdas captures information they
need to run themselves when they are created.
In this way, ends of expressions are naturally detected, and
errors are handled in the usual way. This patch also reduces
the amount of code.
Differential Revision: https://reviews.llvm.org/D22728
llvm-svn: 276574
2016-07-25 02:19:40 +08:00
|
|
|
Expr ScriptParser::readPrimary() {
|
2016-08-18 02:59:16 +08:00
|
|
|
if (peek() == "(")
|
|
|
|
return readParenExpr();
|
Make readExpr return an Expr object instead of a vector of tokens.
Previously, we handled an expression as a vector of tokens. In other
words, an expression was a vector of uncooked raw StringRefs.
When we need a value of an expression, we used ExprParser to run
the expression.
The separation was needed essentially because parse time is too
early to evaluate an expression. In order to evaluate an expression,
we need to finalize section sizes. Because linker script parsing
is done at very early stage of the linking process, we can't
evaluate expressions while parsing.
The above mechanism worked fairly well, but there were a few
drawbacks.
One thing is that we sometimes have to parse the same expression
more than once in order to find the end of the expression.
In some contexts, linker script expressions have no clear end marker.
So, we needed to recognize balanced expressions and ternary operators.
The other is poor error reporting. Since expressions are parsed
basically twice, and some information that is available at the first
stage is lost in the second stage, it was hard to print out
apprpriate error messages.
This patch fixes the issues with a new approach.
Now the expression parsing is integrated into ScriptParser.
ExprParser class is removed. Expressions are represented as lambdas
instead of vectors of tokens. Lambdas captures information they
need to run themselves when they are created.
In this way, ends of expressions are naturally detected, and
errors are handled in the usual way. This patch also reduces
the amount of code.
Differential Revision: https://reviews.llvm.org/D22728
llvm-svn: 276574
2016-07-25 02:19:40 +08:00
|
|
|
|
2016-08-18 02:59:16 +08:00
|
|
|
StringRef Tok = next();
|
Make readExpr return an Expr object instead of a vector of tokens.
Previously, we handled an expression as a vector of tokens. In other
words, an expression was a vector of uncooked raw StringRefs.
When we need a value of an expression, we used ExprParser to run
the expression.
The separation was needed essentially because parse time is too
early to evaluate an expression. In order to evaluate an expression,
we need to finalize section sizes. Because linker script parsing
is done at very early stage of the linking process, we can't
evaluate expressions while parsing.
The above mechanism worked fairly well, but there were a few
drawbacks.
One thing is that we sometimes have to parse the same expression
more than once in order to find the end of the expression.
In some contexts, linker script expressions have no clear end marker.
So, we needed to recognize balanced expressions and ternary operators.
The other is poor error reporting. Since expressions are parsed
basically twice, and some information that is available at the first
stage is lost in the second stage, it was hard to print out
apprpriate error messages.
This patch fixes the issues with a new approach.
Now the expression parsing is integrated into ScriptParser.
ExprParser class is removed. Expressions are represented as lambdas
instead of vectors of tokens. Lambdas captures information they
need to run themselves when they are created.
In this way, ends of expressions are naturally detected, and
errors are handled in the usual way. This patch also reduces
the amount of code.
Differential Revision: https://reviews.llvm.org/D22728
llvm-svn: 276574
2016-07-25 02:19:40 +08:00
|
|
|
|
2016-09-03 05:54:35 +08:00
|
|
|
if (Tok == "~") {
|
|
|
|
Expr E = readPrimary();
|
|
|
|
return [=](uint64_t Dot) { return ~E(Dot); };
|
|
|
|
}
|
|
|
|
if (Tok == "-") {
|
|
|
|
Expr E = readPrimary();
|
|
|
|
return [=](uint64_t Dot) { return -E(Dot); };
|
|
|
|
}
|
|
|
|
|
Make readExpr return an Expr object instead of a vector of tokens.
Previously, we handled an expression as a vector of tokens. In other
words, an expression was a vector of uncooked raw StringRefs.
When we need a value of an expression, we used ExprParser to run
the expression.
The separation was needed essentially because parse time is too
early to evaluate an expression. In order to evaluate an expression,
we need to finalize section sizes. Because linker script parsing
is done at very early stage of the linking process, we can't
evaluate expressions while parsing.
The above mechanism worked fairly well, but there were a few
drawbacks.
One thing is that we sometimes have to parse the same expression
more than once in order to find the end of the expression.
In some contexts, linker script expressions have no clear end marker.
So, we needed to recognize balanced expressions and ternary operators.
The other is poor error reporting. Since expressions are parsed
basically twice, and some information that is available at the first
stage is lost in the second stage, it was hard to print out
apprpriate error messages.
This patch fixes the issues with a new approach.
Now the expression parsing is integrated into ScriptParser.
ExprParser class is removed. Expressions are represented as lambdas
instead of vectors of tokens. Lambdas captures information they
need to run themselves when they are created.
In this way, ends of expressions are naturally detected, and
errors are handled in the usual way. This patch also reduces
the amount of code.
Differential Revision: https://reviews.llvm.org/D22728
llvm-svn: 276574
2016-07-25 02:19:40 +08:00
|
|
|
// Built-in functions are parsed here.
|
|
|
|
// https://sourceware.org/binutils/docs/ld/Builtin-Functions.html.
|
2016-08-30 17:54:01 +08:00
|
|
|
if (Tok == "ADDR") {
|
|
|
|
expect("(");
|
|
|
|
StringRef Name = next();
|
|
|
|
expect(")");
|
2016-09-08 16:19:13 +08:00
|
|
|
return
|
|
|
|
[=](uint64_t Dot) { return ScriptBase->getOutputSectionAddress(Name); };
|
2016-08-30 17:54:01 +08:00
|
|
|
}
|
2016-08-04 17:29:31 +08:00
|
|
|
if (Tok == "ASSERT")
|
|
|
|
return readAssert();
|
Make readExpr return an Expr object instead of a vector of tokens.
Previously, we handled an expression as a vector of tokens. In other
words, an expression was a vector of uncooked raw StringRefs.
When we need a value of an expression, we used ExprParser to run
the expression.
The separation was needed essentially because parse time is too
early to evaluate an expression. In order to evaluate an expression,
we need to finalize section sizes. Because linker script parsing
is done at very early stage of the linking process, we can't
evaluate expressions while parsing.
The above mechanism worked fairly well, but there were a few
drawbacks.
One thing is that we sometimes have to parse the same expression
more than once in order to find the end of the expression.
In some contexts, linker script expressions have no clear end marker.
So, we needed to recognize balanced expressions and ternary operators.
The other is poor error reporting. Since expressions are parsed
basically twice, and some information that is available at the first
stage is lost in the second stage, it was hard to print out
apprpriate error messages.
This patch fixes the issues with a new approach.
Now the expression parsing is integrated into ScriptParser.
ExprParser class is removed. Expressions are represented as lambdas
instead of vectors of tokens. Lambdas captures information they
need to run themselves when they are created.
In this way, ends of expressions are naturally detected, and
errors are handled in the usual way. This patch also reduces
the amount of code.
Differential Revision: https://reviews.llvm.org/D22728
llvm-svn: 276574
2016-07-25 02:19:40 +08:00
|
|
|
if (Tok == "ALIGN") {
|
2016-08-18 02:59:16 +08:00
|
|
|
Expr E = readParenExpr();
|
Make readExpr return an Expr object instead of a vector of tokens.
Previously, we handled an expression as a vector of tokens. In other
words, an expression was a vector of uncooked raw StringRefs.
When we need a value of an expression, we used ExprParser to run
the expression.
The separation was needed essentially because parse time is too
early to evaluate an expression. In order to evaluate an expression,
we need to finalize section sizes. Because linker script parsing
is done at very early stage of the linking process, we can't
evaluate expressions while parsing.
The above mechanism worked fairly well, but there were a few
drawbacks.
One thing is that we sometimes have to parse the same expression
more than once in order to find the end of the expression.
In some contexts, linker script expressions have no clear end marker.
So, we needed to recognize balanced expressions and ternary operators.
The other is poor error reporting. Since expressions are parsed
basically twice, and some information that is available at the first
stage is lost in the second stage, it was hard to print out
apprpriate error messages.
This patch fixes the issues with a new approach.
Now the expression parsing is integrated into ScriptParser.
ExprParser class is removed. Expressions are represented as lambdas
instead of vectors of tokens. Lambdas captures information they
need to run themselves when they are created.
In this way, ends of expressions are naturally detected, and
errors are handled in the usual way. This patch also reduces
the amount of code.
Differential Revision: https://reviews.llvm.org/D22728
llvm-svn: 276574
2016-07-25 02:19:40 +08:00
|
|
|
return [=](uint64_t Dot) { return alignTo(Dot, E(Dot)); };
|
|
|
|
}
|
|
|
|
if (Tok == "CONSTANT") {
|
|
|
|
expect("(");
|
|
|
|
StringRef Tok = next();
|
|
|
|
expect(")");
|
|
|
|
return [=](uint64_t Dot) { return getConstant(Tok); };
|
|
|
|
}
|
2016-07-29 02:16:24 +08:00
|
|
|
if (Tok == "SEGMENT_START") {
|
|
|
|
expect("(");
|
|
|
|
next();
|
|
|
|
expect(",");
|
|
|
|
uint64_t Val;
|
2016-09-15 21:36:44 +08:00
|
|
|
if (next().getAsInteger(0, Val))
|
|
|
|
setError("integer expected");
|
2016-07-29 02:16:24 +08:00
|
|
|
expect(")");
|
|
|
|
return [=](uint64_t Dot) { return Val; };
|
|
|
|
}
|
Make readExpr return an Expr object instead of a vector of tokens.
Previously, we handled an expression as a vector of tokens. In other
words, an expression was a vector of uncooked raw StringRefs.
When we need a value of an expression, we used ExprParser to run
the expression.
The separation was needed essentially because parse time is too
early to evaluate an expression. In order to evaluate an expression,
we need to finalize section sizes. Because linker script parsing
is done at very early stage of the linking process, we can't
evaluate expressions while parsing.
The above mechanism worked fairly well, but there were a few
drawbacks.
One thing is that we sometimes have to parse the same expression
more than once in order to find the end of the expression.
In some contexts, linker script expressions have no clear end marker.
So, we needed to recognize balanced expressions and ternary operators.
The other is poor error reporting. Since expressions are parsed
basically twice, and some information that is available at the first
stage is lost in the second stage, it was hard to print out
apprpriate error messages.
This patch fixes the issues with a new approach.
Now the expression parsing is integrated into ScriptParser.
ExprParser class is removed. Expressions are represented as lambdas
instead of vectors of tokens. Lambdas captures information they
need to run themselves when they are created.
In this way, ends of expressions are naturally detected, and
errors are handled in the usual way. This patch also reduces
the amount of code.
Differential Revision: https://reviews.llvm.org/D22728
llvm-svn: 276574
2016-07-25 02:19:40 +08:00
|
|
|
if (Tok == "DATA_SEGMENT_ALIGN") {
|
|
|
|
expect("(");
|
|
|
|
Expr E = readExpr();
|
|
|
|
expect(",");
|
|
|
|
readExpr();
|
|
|
|
expect(")");
|
2016-07-27 03:34:10 +08:00
|
|
|
return [=](uint64_t Dot) { return alignTo(Dot, E(Dot)); };
|
Make readExpr return an Expr object instead of a vector of tokens.
Previously, we handled an expression as a vector of tokens. In other
words, an expression was a vector of uncooked raw StringRefs.
When we need a value of an expression, we used ExprParser to run
the expression.
The separation was needed essentially because parse time is too
early to evaluate an expression. In order to evaluate an expression,
we need to finalize section sizes. Because linker script parsing
is done at very early stage of the linking process, we can't
evaluate expressions while parsing.
The above mechanism worked fairly well, but there were a few
drawbacks.
One thing is that we sometimes have to parse the same expression
more than once in order to find the end of the expression.
In some contexts, linker script expressions have no clear end marker.
So, we needed to recognize balanced expressions and ternary operators.
The other is poor error reporting. Since expressions are parsed
basically twice, and some information that is available at the first
stage is lost in the second stage, it was hard to print out
apprpriate error messages.
This patch fixes the issues with a new approach.
Now the expression parsing is integrated into ScriptParser.
ExprParser class is removed. Expressions are represented as lambdas
instead of vectors of tokens. Lambdas captures information they
need to run themselves when they are created.
In this way, ends of expressions are naturally detected, and
errors are handled in the usual way. This patch also reduces
the amount of code.
Differential Revision: https://reviews.llvm.org/D22728
llvm-svn: 276574
2016-07-25 02:19:40 +08:00
|
|
|
}
|
|
|
|
if (Tok == "DATA_SEGMENT_END") {
|
|
|
|
expect("(");
|
|
|
|
expect(".");
|
|
|
|
expect(")");
|
|
|
|
return [](uint64_t Dot) { return Dot; };
|
|
|
|
}
|
2016-07-27 01:58:44 +08:00
|
|
|
// GNU linkers implements more complicated logic to handle
|
|
|
|
// DATA_SEGMENT_RELRO_END. We instead ignore the arguments and just align to
|
|
|
|
// the next page boundary for simplicity.
|
|
|
|
if (Tok == "DATA_SEGMENT_RELRO_END") {
|
|
|
|
expect("(");
|
2016-09-15 03:14:01 +08:00
|
|
|
readExpr();
|
2016-07-27 01:58:44 +08:00
|
|
|
expect(",");
|
|
|
|
readExpr();
|
|
|
|
expect(")");
|
|
|
|
return [](uint64_t Dot) { return alignTo(Dot, Target->PageSize); };
|
|
|
|
}
|
2016-07-30 00:18:47 +08:00
|
|
|
if (Tok == "SIZEOF") {
|
|
|
|
expect("(");
|
|
|
|
StringRef Name = next();
|
|
|
|
expect(")");
|
2016-09-08 16:19:13 +08:00
|
|
|
return [=](uint64_t Dot) { return ScriptBase->getOutputSectionSize(Name); };
|
2016-07-30 00:18:47 +08:00
|
|
|
}
|
2016-09-08 17:08:30 +08:00
|
|
|
if (Tok == "ALIGNOF") {
|
|
|
|
expect("(");
|
|
|
|
StringRef Name = next();
|
|
|
|
expect(")");
|
|
|
|
return
|
|
|
|
[=](uint64_t Dot) { return ScriptBase->getOutputSectionAlign(Name); };
|
|
|
|
}
|
2016-08-10 15:59:34 +08:00
|
|
|
if (Tok == "SIZEOF_HEADERS")
|
2016-09-08 16:19:13 +08:00
|
|
|
return [=](uint64_t Dot) { return ScriptBase->getHeaderSize(); };
|
Make readExpr return an Expr object instead of a vector of tokens.
Previously, we handled an expression as a vector of tokens. In other
words, an expression was a vector of uncooked raw StringRefs.
When we need a value of an expression, we used ExprParser to run
the expression.
The separation was needed essentially because parse time is too
early to evaluate an expression. In order to evaluate an expression,
we need to finalize section sizes. Because linker script parsing
is done at very early stage of the linking process, we can't
evaluate expressions while parsing.
The above mechanism worked fairly well, but there were a few
drawbacks.
One thing is that we sometimes have to parse the same expression
more than once in order to find the end of the expression.
In some contexts, linker script expressions have no clear end marker.
So, we needed to recognize balanced expressions and ternary operators.
The other is poor error reporting. Since expressions are parsed
basically twice, and some information that is available at the first
stage is lost in the second stage, it was hard to print out
apprpriate error messages.
This patch fixes the issues with a new approach.
Now the expression parsing is integrated into ScriptParser.
ExprParser class is removed. Expressions are represented as lambdas
instead of vectors of tokens. Lambdas captures information they
need to run themselves when they are created.
In this way, ends of expressions are naturally detected, and
errors are handled in the usual way. This patch also reduces
the amount of code.
Differential Revision: https://reviews.llvm.org/D22728
llvm-svn: 276574
2016-07-25 02:19:40 +08:00
|
|
|
|
2016-09-03 00:01:42 +08:00
|
|
|
// Tok is a literal number.
|
|
|
|
uint64_t V;
|
|
|
|
if (readInteger(Tok, V))
|
|
|
|
return [=](uint64_t Dot) { return V; };
|
|
|
|
|
|
|
|
// Tok is a symbol name.
|
|
|
|
if (Tok != "." && !isValidCIdentifier(Tok))
|
|
|
|
setError("malformed number: " + Tok);
|
|
|
|
return [=](uint64_t Dot) { return getSymbolValue(Tok, Dot); };
|
Make readExpr return an Expr object instead of a vector of tokens.
Previously, we handled an expression as a vector of tokens. In other
words, an expression was a vector of uncooked raw StringRefs.
When we need a value of an expression, we used ExprParser to run
the expression.
The separation was needed essentially because parse time is too
early to evaluate an expression. In order to evaluate an expression,
we need to finalize section sizes. Because linker script parsing
is done at very early stage of the linking process, we can't
evaluate expressions while parsing.
The above mechanism worked fairly well, but there were a few
drawbacks.
One thing is that we sometimes have to parse the same expression
more than once in order to find the end of the expression.
In some contexts, linker script expressions have no clear end marker.
So, we needed to recognize balanced expressions and ternary operators.
The other is poor error reporting. Since expressions are parsed
basically twice, and some information that is available at the first
stage is lost in the second stage, it was hard to print out
apprpriate error messages.
This patch fixes the issues with a new approach.
Now the expression parsing is integrated into ScriptParser.
ExprParser class is removed. Expressions are represented as lambdas
instead of vectors of tokens. Lambdas captures information they
need to run themselves when they are created.
In this way, ends of expressions are naturally detected, and
errors are handled in the usual way. This patch also reduces
the amount of code.
Differential Revision: https://reviews.llvm.org/D22728
llvm-svn: 276574
2016-07-25 02:19:40 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
Expr ScriptParser::readTernary(Expr Cond) {
|
|
|
|
next();
|
|
|
|
Expr L = readExpr();
|
|
|
|
expect(":");
|
|
|
|
Expr R = readExpr();
|
|
|
|
return [=](uint64_t Dot) { return Cond(Dot) ? L(Dot) : R(Dot); };
|
|
|
|
}
|
|
|
|
|
2016-08-18 02:59:16 +08:00
|
|
|
Expr ScriptParser::readParenExpr() {
|
|
|
|
expect("(");
|
|
|
|
Expr E = readExpr();
|
|
|
|
expect(")");
|
|
|
|
return E;
|
|
|
|
}
|
|
|
|
|
2016-07-19 17:25:43 +08:00
|
|
|
std::vector<StringRef> ScriptParser::readOutputSectionPhdrs() {
|
|
|
|
std::vector<StringRef> Phdrs;
|
|
|
|
while (!Error && peek().startswith(":")) {
|
|
|
|
StringRef Tok = next();
|
|
|
|
Tok = (Tok.size() == 1) ? next() : Tok.substr(1);
|
|
|
|
if (Tok.empty()) {
|
|
|
|
setError("section header name is empty");
|
|
|
|
break;
|
|
|
|
}
|
2016-07-21 03:36:36 +08:00
|
|
|
Phdrs.push_back(Tok);
|
2016-07-19 17:25:43 +08:00
|
|
|
}
|
|
|
|
return Phdrs;
|
|
|
|
}
|
|
|
|
|
|
|
|
unsigned ScriptParser::readPhdrType() {
|
|
|
|
StringRef Tok = next();
|
2016-07-21 03:36:38 +08:00
|
|
|
unsigned Ret = StringSwitch<unsigned>(Tok)
|
2016-09-08 16:20:30 +08:00
|
|
|
.Case("PT_NULL", PT_NULL)
|
|
|
|
.Case("PT_LOAD", PT_LOAD)
|
|
|
|
.Case("PT_DYNAMIC", PT_DYNAMIC)
|
|
|
|
.Case("PT_INTERP", PT_INTERP)
|
|
|
|
.Case("PT_NOTE", PT_NOTE)
|
|
|
|
.Case("PT_SHLIB", PT_SHLIB)
|
|
|
|
.Case("PT_PHDR", PT_PHDR)
|
|
|
|
.Case("PT_TLS", PT_TLS)
|
|
|
|
.Case("PT_GNU_EH_FRAME", PT_GNU_EH_FRAME)
|
|
|
|
.Case("PT_GNU_STACK", PT_GNU_STACK)
|
|
|
|
.Case("PT_GNU_RELRO", PT_GNU_RELRO)
|
|
|
|
.Default(-1);
|
2016-07-19 17:25:43 +08:00
|
|
|
|
2016-07-21 03:36:38 +08:00
|
|
|
if (Ret == (unsigned)-1) {
|
|
|
|
setError("invalid program header type: " + Tok);
|
|
|
|
return PT_NULL;
|
|
|
|
}
|
|
|
|
return Ret;
|
2016-07-19 17:25:43 +08:00
|
|
|
}
|
|
|
|
|
2016-09-01 04:03:54 +08:00
|
|
|
void ScriptParser::readVersionDeclaration(StringRef VerStr) {
|
2016-08-31 17:08:26 +08:00
|
|
|
// Identifiers start at 2 because 0 and 1 are reserved
|
|
|
|
// for VER_NDX_LOCAL and VER_NDX_GLOBAL constants.
|
|
|
|
size_t VersionId = Config->VersionDefinitions.size() + 2;
|
|
|
|
Config->VersionDefinitions.push_back({VerStr, VersionId});
|
|
|
|
|
|
|
|
if (skip("global:") || peek() != "local:")
|
|
|
|
readGlobal(VerStr);
|
|
|
|
if (skip("local:"))
|
|
|
|
readLocal();
|
|
|
|
expect("}");
|
|
|
|
|
|
|
|
// Each version may have a parent version. For example, "Ver2" defined as
|
|
|
|
// "Ver2 { global: foo; local: *; } Ver1;" has "Ver1" as a parent. This
|
|
|
|
// version hierarchy is, probably against your instinct, purely for human; the
|
|
|
|
// runtime doesn't care about them at all. In LLD, we simply skip the token.
|
|
|
|
if (!VerStr.empty() && peek() != ";")
|
|
|
|
next();
|
|
|
|
expect(";");
|
|
|
|
}
|
|
|
|
|
|
|
|
void ScriptParser::readLocal() {
|
|
|
|
Config->DefaultSymbolVersion = VER_NDX_LOCAL;
|
|
|
|
expect("*");
|
|
|
|
expect(";");
|
|
|
|
}
|
|
|
|
|
|
|
|
void ScriptParser::readExtern(std::vector<SymbolVersion> *Globals) {
|
2016-09-09 22:35:36 +08:00
|
|
|
expect("\"C++\"");
|
2016-08-31 17:08:26 +08:00
|
|
|
expect("{");
|
|
|
|
|
|
|
|
for (;;) {
|
|
|
|
if (peek() == "}" || Error)
|
|
|
|
break;
|
2016-09-09 22:35:36 +08:00
|
|
|
bool HasWildcard = !peek().startswith("\"") && hasWildcard(peek());
|
|
|
|
Globals->push_back({unquote(next()), true, HasWildcard});
|
2016-08-31 17:08:26 +08:00
|
|
|
expect(";");
|
|
|
|
}
|
|
|
|
|
|
|
|
expect("}");
|
|
|
|
expect(";");
|
|
|
|
}
|
|
|
|
|
|
|
|
void ScriptParser::readGlobal(StringRef VerStr) {
|
|
|
|
std::vector<SymbolVersion> *Globals;
|
|
|
|
if (VerStr.empty())
|
|
|
|
Globals = &Config->VersionScriptGlobals;
|
|
|
|
else
|
|
|
|
Globals = &Config->VersionDefinitions.back().Globals;
|
|
|
|
|
|
|
|
for (;;) {
|
|
|
|
if (skip("extern"))
|
|
|
|
readExtern(Globals);
|
|
|
|
|
|
|
|
StringRef Cur = peek();
|
|
|
|
if (Cur == "}" || Cur == "local:" || Error)
|
|
|
|
return;
|
|
|
|
next();
|
2016-09-09 22:35:36 +08:00
|
|
|
Globals->push_back({unquote(Cur), false, hasWildcard(Cur)});
|
2016-08-31 17:08:26 +08:00
|
|
|
expect(";");
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2015-11-26 13:53:00 +08:00
|
|
|
static bool isUnderSysroot(StringRef Path) {
|
|
|
|
if (Config->Sysroot == "")
|
|
|
|
return false;
|
|
|
|
for (; !Path.empty(); Path = sys::path::parent_path(Path))
|
|
|
|
if (sys::fs::equivalent(Config->Sysroot, Path))
|
|
|
|
return true;
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2016-04-21 04:13:41 +08:00
|
|
|
void elf::readLinkerScript(MemoryBufferRef MB) {
|
2015-11-26 13:53:00 +08:00
|
|
|
StringRef Path = MB.getBufferIdentifier();
|
2016-08-31 17:08:26 +08:00
|
|
|
ScriptParser(MB.getBuffer(), isUnderSysroot(Path)).readLinkerScript();
|
|
|
|
}
|
|
|
|
|
|
|
|
void elf::readVersionScript(MemoryBufferRef MB) {
|
|
|
|
ScriptParser(MB.getBuffer(), false).readVersionScript();
|
2016-04-21 04:13:41 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
template class elf::LinkerScript<ELF32LE>;
|
|
|
|
template class elf::LinkerScript<ELF32BE>;
|
|
|
|
template class elf::LinkerScript<ELF64LE>;
|
|
|
|
template class elf::LinkerScript<ELF64BE>;
|