2015-07-25 05:03:07 +08:00
|
|
|
//===- SymbolTable.cpp ----------------------------------------------------===//
|
|
|
|
//
|
|
|
|
// The LLVM Linker
|
|
|
|
//
|
|
|
|
// This file is distributed under the University of Illinois Open Source
|
|
|
|
// License. See LICENSE.TXT for details.
|
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
2015-10-14 03:51:57 +08:00
|
|
|
//
|
|
|
|
// Symbol table is a bag of all known symbols. We put all symbols of
|
2016-01-06 04:47:37 +08:00
|
|
|
// all input files to the symbol table. The symbol table is basically
|
2015-10-14 03:51:57 +08:00
|
|
|
// a hash table with the logic to resolve symbol name conflicts using
|
|
|
|
// the symbol types.
|
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
2015-07-25 05:03:07 +08:00
|
|
|
|
|
|
|
#include "SymbolTable.h"
|
2015-09-12 06:42:45 +08:00
|
|
|
#include "Config.h"
|
2015-08-06 23:08:23 +08:00
|
|
|
#include "Error.h"
|
2015-07-25 05:03:07 +08:00
|
|
|
#include "Symbols.h"
|
2016-02-13 04:54:57 +08:00
|
|
|
#include "llvm/Bitcode/ReaderWriter.h"
|
2016-01-08 01:20:07 +08:00
|
|
|
#include "llvm/Support/StringSaver.h"
|
2015-07-25 05:03:07 +08:00
|
|
|
|
|
|
|
using namespace llvm;
|
2015-08-31 09:16:19 +08:00
|
|
|
using namespace llvm::object;
|
2015-09-23 02:19:46 +08:00
|
|
|
using namespace llvm::ELF;
|
2015-07-25 05:03:07 +08:00
|
|
|
|
|
|
|
using namespace lld;
|
2016-02-28 08:25:54 +08:00
|
|
|
using namespace lld::elf;
|
2015-07-25 05:03:07 +08:00
|
|
|
|
2016-01-06 04:47:37 +08:00
|
|
|
// All input object files must be for the same architecture
|
|
|
|
// (e.g. it does not make sense to link x86 object files with
|
|
|
|
// MIPS object files.) This function checks for that error.
|
2016-01-30 03:41:13 +08:00
|
|
|
template <class ELFT> static bool isCompatible(InputFile *FileP) {
|
2015-12-17 07:31:22 +08:00
|
|
|
auto *F = dyn_cast<ELFFileBase<ELFT>>(FileP);
|
|
|
|
if (!F)
|
2016-01-30 03:41:13 +08:00
|
|
|
return true;
|
2015-12-17 07:31:22 +08:00
|
|
|
if (F->getELFKind() == Config->EKind && F->getEMachine() == Config->EMachine)
|
2016-01-30 03:41:13 +08:00
|
|
|
return true;
|
2015-12-17 07:31:22 +08:00
|
|
|
StringRef A = F->getName();
|
|
|
|
StringRef B = Config->Emulation;
|
|
|
|
if (B.empty())
|
|
|
|
B = Config->FirstElf->getName();
|
2016-01-30 03:41:13 +08:00
|
|
|
error(A + " is incompatible with " + B);
|
|
|
|
return false;
|
2015-12-17 07:31:22 +08:00
|
|
|
}
|
|
|
|
|
2016-04-14 02:07:57 +08:00
|
|
|
// Returns "(internal)", "foo.a(bar.o)" or "baz.o".
|
|
|
|
static std::string getFilename(InputFile *F) {
|
|
|
|
if (!F)
|
|
|
|
return "(internal)";
|
|
|
|
if (!F->ArchiveName.empty())
|
|
|
|
return (F->ArchiveName + "(" + F->getName() + ")").str();
|
|
|
|
return F->getName();
|
|
|
|
}
|
|
|
|
|
2016-01-06 04:47:37 +08:00
|
|
|
// Add symbols in File to the symbol table.
|
2015-10-10 05:07:25 +08:00
|
|
|
template <class ELFT>
|
|
|
|
void SymbolTable<ELFT>::addFile(std::unique_ptr<InputFile> File) {
|
2015-12-23 22:35:51 +08:00
|
|
|
InputFile *FileP = File.get();
|
2016-01-30 03:41:13 +08:00
|
|
|
if (!isCompatible<ELFT>(FileP))
|
|
|
|
return;
|
2015-10-11 11:36:49 +08:00
|
|
|
|
2015-12-17 06:59:13 +08:00
|
|
|
// .a file
|
|
|
|
if (auto *F = dyn_cast<ArchiveFile>(FileP)) {
|
2015-12-23 22:35:51 +08:00
|
|
|
ArchiveFiles.emplace_back(cast<ArchiveFile>(File.release()));
|
ELF: New symbol table design.
This patch implements a new design for the symbol table that stores
SymbolBodies within a memory region of the Symbol object. Symbols are mutated
by constructing SymbolBodies in place over existing SymbolBodies, rather
than by mutating pointers. As mentioned in the initial proposal [1], this
memory layout helps reduce the cache miss rate by improving memory locality.
Performance numbers:
old(s) new(s)
Without debug info:
chrome 7.178 6.432 (-11.5%)
LLVMgold.so 0.505 0.502 (-0.5%)
clang 0.954 0.827 (-15.4%)
llvm-as 0.052 0.045 (-15.5%)
With debug info:
scylla 5.695 5.613 (-1.5%)
clang 14.396 14.143 (-1.8%)
Performance counter results show that the fewer required indirections is
indeed the cause of the improved performance. For example, when linking
chrome, stalled cycles decreases from 14,556,444,002 to 12,959,238,310, and
instructions per cycle increases from 0.78 to 0.83. We are also executing
many fewer instructions (15,516,401,933 down to 15,002,434,310), probably
because we spend less time allocating SymbolBodies.
The new mechanism by which symbols are added to the symbol table is by calling
add* functions on the SymbolTable.
In this patch, I handle local symbols by storing them inside "unparented"
SymbolBodies. This is suboptimal, but if we do want to try to avoid allocating
these SymbolBodies, we can probably do that separately.
I also removed a few members from the SymbolBody class that were only being
used to pass information from the input file to the symbol table.
This patch implements the new design for the ELF linker only. I intend to
prepare a similar patch for the COFF linker.
[1] http://lists.llvm.org/pipermail/llvm-dev/2016-April/098832.html
Differential Revision: http://reviews.llvm.org/D19752
llvm-svn: 268178
2016-05-01 12:55:03 +08:00
|
|
|
F->parse<ELFT>();
|
2015-09-05 06:28:10 +08:00
|
|
|
return;
|
|
|
|
}
|
2015-10-13 02:03:21 +08:00
|
|
|
|
2016-04-14 02:07:57 +08:00
|
|
|
// Lazy object file
|
|
|
|
if (auto *F = dyn_cast<LazyObjectFile>(FileP)) {
|
|
|
|
LazyObjectFiles.emplace_back(cast<LazyObjectFile>(File.release()));
|
ELF: New symbol table design.
This patch implements a new design for the symbol table that stores
SymbolBodies within a memory region of the Symbol object. Symbols are mutated
by constructing SymbolBodies in place over existing SymbolBodies, rather
than by mutating pointers. As mentioned in the initial proposal [1], this
memory layout helps reduce the cache miss rate by improving memory locality.
Performance numbers:
old(s) new(s)
Without debug info:
chrome 7.178 6.432 (-11.5%)
LLVMgold.so 0.505 0.502 (-0.5%)
clang 0.954 0.827 (-15.4%)
llvm-as 0.052 0.045 (-15.5%)
With debug info:
scylla 5.695 5.613 (-1.5%)
clang 14.396 14.143 (-1.8%)
Performance counter results show that the fewer required indirections is
indeed the cause of the improved performance. For example, when linking
chrome, stalled cycles decreases from 14,556,444,002 to 12,959,238,310, and
instructions per cycle increases from 0.78 to 0.83. We are also executing
many fewer instructions (15,516,401,933 down to 15,002,434,310), probably
because we spend less time allocating SymbolBodies.
The new mechanism by which symbols are added to the symbol table is by calling
add* functions on the SymbolTable.
In this patch, I handle local symbols by storing them inside "unparented"
SymbolBodies. This is suboptimal, but if we do want to try to avoid allocating
these SymbolBodies, we can probably do that separately.
I also removed a few members from the SymbolBody class that were only being
used to pass information from the input file to the symbol table.
This patch implements the new design for the ELF linker only. I intend to
prepare a similar patch for the COFF linker.
[1] http://lists.llvm.org/pipermail/llvm-dev/2016-April/098832.html
Differential Revision: http://reviews.llvm.org/D19752
llvm-svn: 268178
2016-05-01 12:55:03 +08:00
|
|
|
F->parse<ELFT>();
|
2016-04-14 02:07:57 +08:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (Config->Trace)
|
|
|
|
llvm::outs() << getFilename(FileP) << "\n";
|
|
|
|
|
2015-12-17 06:59:13 +08:00
|
|
|
// .so file
|
|
|
|
if (auto *F = dyn_cast<SharedFile<ELFT>>(FileP)) {
|
|
|
|
// DSOs are uniquified not by filename but by soname.
|
|
|
|
F->parseSoName();
|
2016-01-09 06:17:42 +08:00
|
|
|
if (!SoNames.insert(F->getSoName()).second)
|
2015-10-02 03:52:48 +08:00
|
|
|
return;
|
2015-12-17 06:59:13 +08:00
|
|
|
|
2015-12-23 22:35:51 +08:00
|
|
|
SharedFiles.emplace_back(cast<SharedFile<ELFT>>(File.release()));
|
2016-01-06 09:56:36 +08:00
|
|
|
F->parseRest();
|
2015-12-17 06:59:13 +08:00
|
|
|
return;
|
2015-10-02 03:52:48 +08:00
|
|
|
}
|
2015-12-17 06:59:13 +08:00
|
|
|
|
2016-04-08 03:24:51 +08:00
|
|
|
// LLVM bitcode file
|
2016-02-13 04:54:57 +08:00
|
|
|
if (auto *F = dyn_cast<BitcodeFile>(FileP)) {
|
|
|
|
BitcodeFiles.emplace_back(cast<BitcodeFile>(File.release()));
|
ELF: New symbol table design.
This patch implements a new design for the symbol table that stores
SymbolBodies within a memory region of the Symbol object. Symbols are mutated
by constructing SymbolBodies in place over existing SymbolBodies, rather
than by mutating pointers. As mentioned in the initial proposal [1], this
memory layout helps reduce the cache miss rate by improving memory locality.
Performance numbers:
old(s) new(s)
Without debug info:
chrome 7.178 6.432 (-11.5%)
LLVMgold.so 0.505 0.502 (-0.5%)
clang 0.954 0.827 (-15.4%)
llvm-as 0.052 0.045 (-15.5%)
With debug info:
scylla 5.695 5.613 (-1.5%)
clang 14.396 14.143 (-1.8%)
Performance counter results show that the fewer required indirections is
indeed the cause of the improved performance. For example, when linking
chrome, stalled cycles decreases from 14,556,444,002 to 12,959,238,310, and
instructions per cycle increases from 0.78 to 0.83. We are also executing
many fewer instructions (15,516,401,933 down to 15,002,434,310), probably
because we spend less time allocating SymbolBodies.
The new mechanism by which symbols are added to the symbol table is by calling
add* functions on the SymbolTable.
In this patch, I handle local symbols by storing them inside "unparented"
SymbolBodies. This is suboptimal, but if we do want to try to avoid allocating
these SymbolBodies, we can probably do that separately.
I also removed a few members from the SymbolBody class that were only being
used to pass information from the input file to the symbol table.
This patch implements the new design for the ELF linker only. I intend to
prepare a similar patch for the COFF linker.
[1] http://lists.llvm.org/pipermail/llvm-dev/2016-April/098832.html
Differential Revision: http://reviews.llvm.org/D19752
llvm-svn: 268178
2016-05-01 12:55:03 +08:00
|
|
|
F->parse<ELFT>(ComdatGroups);
|
2016-02-13 04:54:57 +08:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2016-04-08 03:24:51 +08:00
|
|
|
// Regular object file
|
2015-12-17 06:59:13 +08:00
|
|
|
auto *F = cast<ObjectFile<ELFT>>(FileP);
|
2015-12-23 22:35:51 +08:00
|
|
|
ObjectFiles.emplace_back(cast<ObjectFile<ELFT>>(File.release()));
|
2016-01-06 10:06:33 +08:00
|
|
|
F->parse(ComdatGroups);
|
2015-07-25 05:03:07 +08:00
|
|
|
}
|
|
|
|
|
2016-04-23 08:26:32 +08:00
|
|
|
// This function is where all the optimizations of link-time
|
|
|
|
// optimization happens. When LTO is in use, some input files are
|
|
|
|
// not in native object file format but in the LLVM bitcode format.
|
|
|
|
// This function compiles bitcode files into a few big native files
|
|
|
|
// using LLVM functions and replaces bitcode symbols with the results.
|
|
|
|
// Because all bitcode files that consist of a program are passed
|
|
|
|
// to the compiler at once, it can do whole-program optimization.
|
2016-02-13 04:54:57 +08:00
|
|
|
template <class ELFT> void SymbolTable<ELFT>::addCombinedLtoObject() {
|
|
|
|
if (BitcodeFiles.empty())
|
|
|
|
return;
|
2016-03-23 04:52:10 +08:00
|
|
|
|
|
|
|
// Compile bitcode files.
|
|
|
|
Lto.reset(new BitcodeCompiler);
|
|
|
|
for (const std::unique_ptr<BitcodeFile> &F : BitcodeFiles)
|
|
|
|
Lto->add(*F);
|
2016-04-16 06:38:10 +08:00
|
|
|
std::vector<std::unique_ptr<InputFile>> IFs = Lto->compile();
|
2016-03-23 04:52:10 +08:00
|
|
|
|
|
|
|
// Replace bitcode symbols.
|
2016-04-16 06:38:10 +08:00
|
|
|
for (auto &IF : IFs) {
|
|
|
|
ObjectFile<ELFT> *Obj = cast<ObjectFile<ELFT>>(IF.release());
|
|
|
|
|
|
|
|
llvm::DenseSet<StringRef> DummyGroups;
|
|
|
|
Obj->parse(DummyGroups);
|
|
|
|
ObjectFiles.emplace_back(Obj);
|
2016-02-13 04:54:57 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2015-11-06 15:43:03 +08:00
|
|
|
template <class ELFT>
|
2016-04-04 22:04:16 +08:00
|
|
|
DefinedRegular<ELFT> *SymbolTable<ELFT>::addAbsolute(StringRef Name,
|
|
|
|
uint8_t Visibility) {
|
ELF: New symbol table design.
This patch implements a new design for the symbol table that stores
SymbolBodies within a memory region of the Symbol object. Symbols are mutated
by constructing SymbolBodies in place over existing SymbolBodies, rather
than by mutating pointers. As mentioned in the initial proposal [1], this
memory layout helps reduce the cache miss rate by improving memory locality.
Performance numbers:
old(s) new(s)
Without debug info:
chrome 7.178 6.432 (-11.5%)
LLVMgold.so 0.505 0.502 (-0.5%)
clang 0.954 0.827 (-15.4%)
llvm-as 0.052 0.045 (-15.5%)
With debug info:
scylla 5.695 5.613 (-1.5%)
clang 14.396 14.143 (-1.8%)
Performance counter results show that the fewer required indirections is
indeed the cause of the improved performance. For example, when linking
chrome, stalled cycles decreases from 14,556,444,002 to 12,959,238,310, and
instructions per cycle increases from 0.78 to 0.83. We are also executing
many fewer instructions (15,516,401,933 down to 15,002,434,310), probably
because we spend less time allocating SymbolBodies.
The new mechanism by which symbols are added to the symbol table is by calling
add* functions on the SymbolTable.
In this patch, I handle local symbols by storing them inside "unparented"
SymbolBodies. This is suboptimal, but if we do want to try to avoid allocating
these SymbolBodies, we can probably do that separately.
I also removed a few members from the SymbolBody class that were only being
used to pass information from the input file to the symbol table.
This patch implements the new design for the ELF linker only. I intend to
prepare a similar patch for the COFF linker.
[1] http://lists.llvm.org/pipermail/llvm-dev/2016-April/098832.html
Differential Revision: http://reviews.llvm.org/D19752
llvm-svn: 268178
2016-05-01 12:55:03 +08:00
|
|
|
return cast<DefinedRegular<ELFT>>(
|
|
|
|
addRegular(Name, STB_GLOBAL, Visibility)->body());
|
2015-09-26 02:56:53 +08:00
|
|
|
}
|
|
|
|
|
2016-01-06 04:47:37 +08:00
|
|
|
// Add Name as an "ignored" symbol. An ignored symbol is a regular
|
2016-04-04 22:04:16 +08:00
|
|
|
// linker-synthesized defined symbol, but is only defined if needed.
|
2015-12-16 22:45:09 +08:00
|
|
|
template <class ELFT>
|
2016-04-04 22:04:16 +08:00
|
|
|
DefinedRegular<ELFT> *SymbolTable<ELFT>::addIgnored(StringRef Name,
|
|
|
|
uint8_t Visibility) {
|
|
|
|
if (!find(Name))
|
|
|
|
return nullptr;
|
|
|
|
return addAbsolute(Name, Visibility);
|
2015-10-02 05:22:26 +08:00
|
|
|
}
|
|
|
|
|
2016-01-08 01:20:07 +08:00
|
|
|
// Rename SYM as __wrap_SYM. The original symbol is preserved as __real_SYM.
|
|
|
|
// Used to implement --wrap.
|
|
|
|
template <class ELFT> void SymbolTable<ELFT>::wrap(StringRef Name) {
|
2016-04-28 08:03:38 +08:00
|
|
|
SymbolBody *B = find(Name);
|
|
|
|
if (!B)
|
2016-01-08 01:20:07 +08:00
|
|
|
return;
|
|
|
|
StringSaver Saver(Alloc);
|
ELF: New symbol table design.
This patch implements a new design for the symbol table that stores
SymbolBodies within a memory region of the Symbol object. Symbols are mutated
by constructing SymbolBodies in place over existing SymbolBodies, rather
than by mutating pointers. As mentioned in the initial proposal [1], this
memory layout helps reduce the cache miss rate by improving memory locality.
Performance numbers:
old(s) new(s)
Without debug info:
chrome 7.178 6.432 (-11.5%)
LLVMgold.so 0.505 0.502 (-0.5%)
clang 0.954 0.827 (-15.4%)
llvm-as 0.052 0.045 (-15.5%)
With debug info:
scylla 5.695 5.613 (-1.5%)
clang 14.396 14.143 (-1.8%)
Performance counter results show that the fewer required indirections is
indeed the cause of the improved performance. For example, when linking
chrome, stalled cycles decreases from 14,556,444,002 to 12,959,238,310, and
instructions per cycle increases from 0.78 to 0.83. We are also executing
many fewer instructions (15,516,401,933 down to 15,002,434,310), probably
because we spend less time allocating SymbolBodies.
The new mechanism by which symbols are added to the symbol table is by calling
add* functions on the SymbolTable.
In this patch, I handle local symbols by storing them inside "unparented"
SymbolBodies. This is suboptimal, but if we do want to try to avoid allocating
these SymbolBodies, we can probably do that separately.
I also removed a few members from the SymbolBody class that were only being
used to pass information from the input file to the symbol table.
This patch implements the new design for the ELF linker only. I intend to
prepare a similar patch for the COFF linker.
[1] http://lists.llvm.org/pipermail/llvm-dev/2016-April/098832.html
Differential Revision: http://reviews.llvm.org/D19752
llvm-svn: 268178
2016-05-01 12:55:03 +08:00
|
|
|
Symbol *Sym = B->symbol();
|
|
|
|
Symbol *Real = addUndefined(Saver.save("__real_" + Name));
|
|
|
|
Symbol *Wrap = addUndefined(Saver.save("__wrap_" + Name));
|
|
|
|
// We rename symbols by replacing the old symbol's SymbolBody with the new
|
|
|
|
// symbol's SymbolBody. This causes all SymbolBody pointers referring to the
|
|
|
|
// old symbol to instead refer to the new symbol.
|
|
|
|
memcpy(Real->Body.buffer, Sym->Body.buffer, sizeof(Sym->Body));
|
|
|
|
memcpy(Sym->Body.buffer, Wrap->Body.buffer, sizeof(Wrap->Body));
|
2016-01-08 01:20:07 +08:00
|
|
|
}
|
|
|
|
|
2015-12-17 06:26:48 +08:00
|
|
|
// Returns a file from which symbol B was created.
|
2016-01-06 04:01:29 +08:00
|
|
|
// If B does not belong to any file, returns a nullptr.
|
2016-02-27 05:49:38 +08:00
|
|
|
template <class ELFT> InputFile *SymbolTable<ELFT>::findFile(SymbolBody *B) {
|
ELF: New symbol table design.
This patch implements a new design for the symbol table that stores
SymbolBodies within a memory region of the Symbol object. Symbols are mutated
by constructing SymbolBodies in place over existing SymbolBodies, rather
than by mutating pointers. As mentioned in the initial proposal [1], this
memory layout helps reduce the cache miss rate by improving memory locality.
Performance numbers:
old(s) new(s)
Without debug info:
chrome 7.178 6.432 (-11.5%)
LLVMgold.so 0.505 0.502 (-0.5%)
clang 0.954 0.827 (-15.4%)
llvm-as 0.052 0.045 (-15.5%)
With debug info:
scylla 5.695 5.613 (-1.5%)
clang 14.396 14.143 (-1.8%)
Performance counter results show that the fewer required indirections is
indeed the cause of the improved performance. For example, when linking
chrome, stalled cycles decreases from 14,556,444,002 to 12,959,238,310, and
instructions per cycle increases from 0.78 to 0.83. We are also executing
many fewer instructions (15,516,401,933 down to 15,002,434,310), probably
because we spend less time allocating SymbolBodies.
The new mechanism by which symbols are added to the symbol table is by calling
add* functions on the SymbolTable.
In this patch, I handle local symbols by storing them inside "unparented"
SymbolBodies. This is suboptimal, but if we do want to try to avoid allocating
these SymbolBodies, we can probably do that separately.
I also removed a few members from the SymbolBody class that were only being
used to pass information from the input file to the symbol table.
This patch implements the new design for the ELF linker only. I intend to
prepare a similar patch for the COFF linker.
[1] http://lists.llvm.org/pipermail/llvm-dev/2016-April/098832.html
Differential Revision: http://reviews.llvm.org/D19752
llvm-svn: 268178
2016-05-01 12:55:03 +08:00
|
|
|
// If this symbol has a definition, follow pointers in the symbol to its
|
|
|
|
// defining file.
|
|
|
|
if (auto *R = dyn_cast<DefinedRegular<ELFT>>(B))
|
|
|
|
if (auto *S = R->Section)
|
|
|
|
return S->getFile();
|
|
|
|
if (auto *SS = dyn_cast<SharedSymbol<ELFT>>(B))
|
|
|
|
return SS->File;
|
|
|
|
if (auto *BC = dyn_cast<DefinedBitcode>(B))
|
|
|
|
return BC->File;
|
2016-05-03 05:30:42 +08:00
|
|
|
if (auto *U = dyn_cast<Undefined>(B))
|
|
|
|
return U->File;
|
2015-12-17 06:26:48 +08:00
|
|
|
return nullptr;
|
|
|
|
}
|
|
|
|
|
2016-04-23 02:42:48 +08:00
|
|
|
static uint8_t getMinVisibility(uint8_t VA, uint8_t VB) {
|
|
|
|
if (VA == STV_DEFAULT)
|
|
|
|
return VB;
|
|
|
|
if (VB == STV_DEFAULT)
|
|
|
|
return VA;
|
|
|
|
return std::min(VA, VB);
|
|
|
|
}
|
|
|
|
|
2016-01-09 06:01:33 +08:00
|
|
|
// Find an existing symbol or create and insert a new one.
|
ELF: New symbol table design.
This patch implements a new design for the symbol table that stores
SymbolBodies within a memory region of the Symbol object. Symbols are mutated
by constructing SymbolBodies in place over existing SymbolBodies, rather
than by mutating pointers. As mentioned in the initial proposal [1], this
memory layout helps reduce the cache miss rate by improving memory locality.
Performance numbers:
old(s) new(s)
Without debug info:
chrome 7.178 6.432 (-11.5%)
LLVMgold.so 0.505 0.502 (-0.5%)
clang 0.954 0.827 (-15.4%)
llvm-as 0.052 0.045 (-15.5%)
With debug info:
scylla 5.695 5.613 (-1.5%)
clang 14.396 14.143 (-1.8%)
Performance counter results show that the fewer required indirections is
indeed the cause of the improved performance. For example, when linking
chrome, stalled cycles decreases from 14,556,444,002 to 12,959,238,310, and
instructions per cycle increases from 0.78 to 0.83. We are also executing
many fewer instructions (15,516,401,933 down to 15,002,434,310), probably
because we spend less time allocating SymbolBodies.
The new mechanism by which symbols are added to the symbol table is by calling
add* functions on the SymbolTable.
In this patch, I handle local symbols by storing them inside "unparented"
SymbolBodies. This is suboptimal, but if we do want to try to avoid allocating
these SymbolBodies, we can probably do that separately.
I also removed a few members from the SymbolBody class that were only being
used to pass information from the input file to the symbol table.
This patch implements the new design for the ELF linker only. I intend to
prepare a similar patch for the COFF linker.
[1] http://lists.llvm.org/pipermail/llvm-dev/2016-April/098832.html
Differential Revision: http://reviews.llvm.org/D19752
llvm-svn: 268178
2016-05-01 12:55:03 +08:00
|
|
|
template <class ELFT>
|
|
|
|
std::pair<Symbol *, bool> SymbolTable<ELFT>::insert(StringRef Name) {
|
2016-04-15 04:42:43 +08:00
|
|
|
unsigned NumSyms = SymVector.size();
|
|
|
|
auto P = Symtab.insert(std::make_pair(Name, NumSyms));
|
|
|
|
Symbol *Sym;
|
|
|
|
if (P.second) {
|
2016-04-23 04:21:26 +08:00
|
|
|
Sym = new (Alloc) Symbol;
|
ELF: New symbol table design.
This patch implements a new design for the symbol table that stores
SymbolBodies within a memory region of the Symbol object. Symbols are mutated
by constructing SymbolBodies in place over existing SymbolBodies, rather
than by mutating pointers. As mentioned in the initial proposal [1], this
memory layout helps reduce the cache miss rate by improving memory locality.
Performance numbers:
old(s) new(s)
Without debug info:
chrome 7.178 6.432 (-11.5%)
LLVMgold.so 0.505 0.502 (-0.5%)
clang 0.954 0.827 (-15.4%)
llvm-as 0.052 0.045 (-15.5%)
With debug info:
scylla 5.695 5.613 (-1.5%)
clang 14.396 14.143 (-1.8%)
Performance counter results show that the fewer required indirections is
indeed the cause of the improved performance. For example, when linking
chrome, stalled cycles decreases from 14,556,444,002 to 12,959,238,310, and
instructions per cycle increases from 0.78 to 0.83. We are also executing
many fewer instructions (15,516,401,933 down to 15,002,434,310), probably
because we spend less time allocating SymbolBodies.
The new mechanism by which symbols are added to the symbol table is by calling
add* functions on the SymbolTable.
In this patch, I handle local symbols by storing them inside "unparented"
SymbolBodies. This is suboptimal, but if we do want to try to avoid allocating
these SymbolBodies, we can probably do that separately.
I also removed a few members from the SymbolBody class that were only being
used to pass information from the input file to the symbol table.
This patch implements the new design for the ELF linker only. I intend to
prepare a similar patch for the COFF linker.
[1] http://lists.llvm.org/pipermail/llvm-dev/2016-April/098832.html
Differential Revision: http://reviews.llvm.org/D19752
llvm-svn: 268178
2016-05-01 12:55:03 +08:00
|
|
|
Sym->Binding = STB_WEAK;
|
2016-04-23 04:21:26 +08:00
|
|
|
Sym->Visibility = STV_DEFAULT;
|
|
|
|
Sym->IsUsedInRegularObj = false;
|
|
|
|
Sym->ExportDynamic = false;
|
|
|
|
Sym->VersionScriptGlobal = !Config->VersionScript;
|
2016-04-15 04:42:43 +08:00
|
|
|
SymVector.push_back(Sym);
|
|
|
|
} else {
|
|
|
|
Sym = SymVector[P.first->second];
|
|
|
|
}
|
ELF: New symbol table design.
This patch implements a new design for the symbol table that stores
SymbolBodies within a memory region of the Symbol object. Symbols are mutated
by constructing SymbolBodies in place over existing SymbolBodies, rather
than by mutating pointers. As mentioned in the initial proposal [1], this
memory layout helps reduce the cache miss rate by improving memory locality.
Performance numbers:
old(s) new(s)
Without debug info:
chrome 7.178 6.432 (-11.5%)
LLVMgold.so 0.505 0.502 (-0.5%)
clang 0.954 0.827 (-15.4%)
llvm-as 0.052 0.045 (-15.5%)
With debug info:
scylla 5.695 5.613 (-1.5%)
clang 14.396 14.143 (-1.8%)
Performance counter results show that the fewer required indirections is
indeed the cause of the improved performance. For example, when linking
chrome, stalled cycles decreases from 14,556,444,002 to 12,959,238,310, and
instructions per cycle increases from 0.78 to 0.83. We are also executing
many fewer instructions (15,516,401,933 down to 15,002,434,310), probably
because we spend less time allocating SymbolBodies.
The new mechanism by which symbols are added to the symbol table is by calling
add* functions on the SymbolTable.
In this patch, I handle local symbols by storing them inside "unparented"
SymbolBodies. This is suboptimal, but if we do want to try to avoid allocating
these SymbolBodies, we can probably do that separately.
I also removed a few members from the SymbolBody class that were only being
used to pass information from the input file to the symbol table.
This patch implements the new design for the ELF linker only. I intend to
prepare a similar patch for the COFF linker.
[1] http://lists.llvm.org/pipermail/llvm-dev/2016-April/098832.html
Differential Revision: http://reviews.llvm.org/D19752
llvm-svn: 268178
2016-05-01 12:55:03 +08:00
|
|
|
return {Sym, P.second};
|
|
|
|
}
|
|
|
|
|
|
|
|
// Find an existing symbol or create and insert a new one, then apply the given
|
|
|
|
// attributes.
|
|
|
|
template <class ELFT>
|
|
|
|
std::pair<Symbol *, bool>
|
|
|
|
SymbolTable<ELFT>::insert(StringRef Name, uint8_t Type, uint8_t Visibility,
|
|
|
|
bool CanOmitFromDynSym, bool IsUsedInRegularObj,
|
|
|
|
InputFile *File) {
|
|
|
|
Symbol *S;
|
|
|
|
bool WasInserted;
|
|
|
|
std::tie(S, WasInserted) = insert(Name);
|
|
|
|
|
|
|
|
// Merge in the new symbol's visibility.
|
|
|
|
S->Visibility = getMinVisibility(S->Visibility, Visibility);
|
|
|
|
if (!CanOmitFromDynSym && (Config->Shared || Config->ExportDynamic))
|
|
|
|
S->ExportDynamic = true;
|
|
|
|
if (IsUsedInRegularObj)
|
|
|
|
S->IsUsedInRegularObj = true;
|
|
|
|
if (!WasInserted && ((Type == STT_TLS) != S->body()->isTls()))
|
|
|
|
error("TLS attribute mismatch for symbol: " +
|
|
|
|
conflictMsg(S->body(), File));
|
|
|
|
|
|
|
|
return {S, WasInserted};
|
|
|
|
}
|
|
|
|
|
|
|
|
// Construct a string in the form of "Sym in File1 and File2".
|
|
|
|
// Used to construct an error message.
|
|
|
|
template <typename ELFT>
|
|
|
|
std::string SymbolTable<ELFT>::conflictMsg(SymbolBody *Existing,
|
|
|
|
InputFile *NewFile) {
|
|
|
|
StringRef Sym = Existing->getName();
|
2016-05-03 05:30:42 +08:00
|
|
|
return demangle(Sym) + " in " + getFilename(Existing->getSourceFile<ELFT>()) +
|
|
|
|
" and " + getFilename(NewFile);
|
ELF: New symbol table design.
This patch implements a new design for the symbol table that stores
SymbolBodies within a memory region of the Symbol object. Symbols are mutated
by constructing SymbolBodies in place over existing SymbolBodies, rather
than by mutating pointers. As mentioned in the initial proposal [1], this
memory layout helps reduce the cache miss rate by improving memory locality.
Performance numbers:
old(s) new(s)
Without debug info:
chrome 7.178 6.432 (-11.5%)
LLVMgold.so 0.505 0.502 (-0.5%)
clang 0.954 0.827 (-15.4%)
llvm-as 0.052 0.045 (-15.5%)
With debug info:
scylla 5.695 5.613 (-1.5%)
clang 14.396 14.143 (-1.8%)
Performance counter results show that the fewer required indirections is
indeed the cause of the improved performance. For example, when linking
chrome, stalled cycles decreases from 14,556,444,002 to 12,959,238,310, and
instructions per cycle increases from 0.78 to 0.83. We are also executing
many fewer instructions (15,516,401,933 down to 15,002,434,310), probably
because we spend less time allocating SymbolBodies.
The new mechanism by which symbols are added to the symbol table is by calling
add* functions on the SymbolTable.
In this patch, I handle local symbols by storing them inside "unparented"
SymbolBodies. This is suboptimal, but if we do want to try to avoid allocating
these SymbolBodies, we can probably do that separately.
I also removed a few members from the SymbolBody class that were only being
used to pass information from the input file to the symbol table.
This patch implements the new design for the ELF linker only. I intend to
prepare a similar patch for the COFF linker.
[1] http://lists.llvm.org/pipermail/llvm-dev/2016-April/098832.html
Differential Revision: http://reviews.llvm.org/D19752
llvm-svn: 268178
2016-05-01 12:55:03 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
// Convenience overload: adds Name as an undefined symbol with STB_GLOBAL
// binding, STV_DEFAULT visibility, type 0 and no originating file.
template <class ELFT> Symbol *SymbolTable<ELFT>::addUndefined(StringRef Name) {
  const uint8_t NoType = 0;
  InputFile *const NoFile = nullptr;
  return addUndefined(Name, STB_GLOBAL, STV_DEFAULT, NoType, NoFile);
}
|
|
|
|
|
|
|
|
template <class ELFT>
|
|
|
|
Symbol *SymbolTable<ELFT>::addUndefined(StringRef Name, uint8_t Binding,
|
|
|
|
uint8_t StOther, uint8_t Type,
|
|
|
|
InputFile *File) {
|
|
|
|
Symbol *S;
|
|
|
|
bool WasInserted;
|
|
|
|
std::tie(S, WasInserted) =
|
|
|
|
insert(Name, Type, StOther & 3, /*CanOmitFromDynSym*/ false,
|
|
|
|
/*IsUsedInRegularObj*/ !File || !isa<BitcodeFile>(File), File);
|
|
|
|
if (WasInserted) {
|
|
|
|
S->Binding = Binding;
|
|
|
|
replaceBody<Undefined>(S, Name, StOther, Type);
|
2016-05-03 05:30:42 +08:00
|
|
|
cast<Undefined>(S->body())->File = File;
|
ELF: New symbol table design.
This patch implements a new design for the symbol table that stores
SymbolBodies within a memory region of the Symbol object. Symbols are mutated
by constructing SymbolBodies in place over existing SymbolBodies, rather
than by mutating pointers. As mentioned in the initial proposal [1], this
memory layout helps reduce the cache miss rate by improving memory locality.
Performance numbers:
old(s) new(s)
Without debug info:
chrome 7.178 6.432 (-11.5%)
LLVMgold.so 0.505 0.502 (-0.5%)
clang 0.954 0.827 (-15.4%)
llvm-as 0.052 0.045 (-15.5%)
With debug info:
scylla 5.695 5.613 (-1.5%)
clang 14.396 14.143 (-1.8%)
Performance counter results show that the fewer required indirections is
indeed the cause of the improved performance. For example, when linking
chrome, stalled cycles decreases from 14,556,444,002 to 12,959,238,310, and
instructions per cycle increases from 0.78 to 0.83. We are also executing
many fewer instructions (15,516,401,933 down to 15,002,434,310), probably
because we spend less time allocating SymbolBodies.
The new mechanism by which symbols are added to the symbol table is by calling
add* functions on the SymbolTable.
In this patch, I handle local symbols by storing them inside "unparented"
SymbolBodies. This is suboptimal, but if we do want to try to avoid allocating
these SymbolBodies, we can probably do that separately.
I also removed a few members from the SymbolBody class that were only being
used to pass information from the input file to the symbol table.
This patch implements the new design for the ELF linker only. I intend to
prepare a similar patch for the COFF linker.
[1] http://lists.llvm.org/pipermail/llvm-dev/2016-April/098832.html
Differential Revision: http://reviews.llvm.org/D19752
llvm-svn: 268178
2016-05-01 12:55:03 +08:00
|
|
|
return S;
|
|
|
|
}
|
|
|
|
if (Binding != STB_WEAK &&
|
|
|
|
(S->body()->isShared() || S->body()->isLazy()))
|
|
|
|
S->Binding = Binding;
|
|
|
|
if (auto *L = dyn_cast<Lazy>(S->body())) {
|
|
|
|
// An undefined weak will not fetch archive members, but we have to remember
|
|
|
|
// its type. See also comment in addLazyArchive.
|
|
|
|
if (S->isWeak())
|
|
|
|
L->Type = Type;
|
|
|
|
else if (auto F = L->getFile())
|
|
|
|
addFile(std::move(F));
|
|
|
|
}
|
|
|
|
return S;
|
|
|
|
}
|
|
|
|
|
|
|
|
// We have a new defined symbol with the specified binding. Return 1 if the new
|
|
|
|
// symbol should win, -1 if the new symbol should lose, or 0 if both symbols are
|
|
|
|
// strong defined symbols.
|
|
|
|
static int compareDefined(Symbol *S, bool WasInserted, uint8_t Binding) {
|
|
|
|
if (WasInserted)
|
|
|
|
return 1;
|
|
|
|
SymbolBody *Body = S->body();
|
|
|
|
if (Body->isLazy() || Body->isUndefined() || Body->isShared())
|
|
|
|
return 1;
|
|
|
|
if (Binding == STB_WEAK)
|
|
|
|
return -1;
|
|
|
|
if (S->isWeak())
|
|
|
|
return 1;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
// We have a new non-common defined symbol with the specified binding. Return 1
|
|
|
|
// if the new symbol should win, -1 if the new symbol should lose, or 0 if there
|
|
|
|
// is a conflict. If the new symbol wins, also update the binding.
|
|
|
|
static int compareDefinedNonCommon(Symbol *S, bool WasInserted, uint8_t Binding) {
|
|
|
|
if (int Cmp = compareDefined(S, WasInserted, Binding)) {
|
|
|
|
if (Cmp > 0)
|
|
|
|
S->Binding = Binding;
|
|
|
|
return Cmp;
|
|
|
|
}
|
|
|
|
if (isa<DefinedCommon>(S->body())) {
|
|
|
|
// Non-common symbols take precedence over common symbols.
|
|
|
|
if (Config->WarnCommon)
|
|
|
|
warning("common " + S->body()->getName() + " is overridden");
|
|
|
|
return 1;
|
|
|
|
}
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
template <class ELFT>
|
|
|
|
Symbol *SymbolTable<ELFT>::addCommon(StringRef N, uint64_t Size,
|
|
|
|
uint64_t Alignment, uint8_t Binding,
|
|
|
|
uint8_t StOther, uint8_t Type,
|
|
|
|
InputFile *File) {
|
|
|
|
Symbol *S;
|
|
|
|
bool WasInserted;
|
|
|
|
std::tie(S, WasInserted) =
|
|
|
|
insert(N, Type, StOther & 3, /*CanOmitFromDynSym*/ false,
|
|
|
|
/*IsUsedInRegularObj*/ true, File);
|
|
|
|
int Cmp = compareDefined(S, WasInserted, Binding);
|
|
|
|
if (Cmp > 0) {
|
|
|
|
S->Binding = Binding;
|
|
|
|
replaceBody<DefinedCommon>(S, N, Size, Alignment, StOther, Type);
|
|
|
|
} else if (Cmp == 0) {
|
|
|
|
auto *C = dyn_cast<DefinedCommon>(S->body());
|
|
|
|
if (!C) {
|
|
|
|
// Non-common symbols take precedence over common symbols.
|
|
|
|
if (Config->WarnCommon)
|
|
|
|
warning("common " + S->body()->getName() + " is overridden");
|
|
|
|
return S;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (Config->WarnCommon)
|
|
|
|
warning("multiple common of " + S->body()->getName());
|
|
|
|
|
|
|
|
C->Size = std::max(C->Size, Size);
|
|
|
|
C->Alignment = std::max(C->Alignment, Alignment);
|
|
|
|
}
|
|
|
|
return S;
|
|
|
|
}
|
|
|
|
|
|
|
|
template <class ELFT>
|
|
|
|
void SymbolTable<ELFT>::reportDuplicate(SymbolBody *Existing,
|
|
|
|
InputFile *NewFile) {
|
|
|
|
std::string Msg = "duplicate symbol: " + conflictMsg(Existing, NewFile);
|
|
|
|
if (Config->AllowMultipleDefinition)
|
|
|
|
warning(Msg);
|
|
|
|
else
|
|
|
|
error(Msg);
|
|
|
|
}
|
|
|
|
|
|
|
|
template <typename ELFT>
|
|
|
|
Symbol *SymbolTable<ELFT>::addRegular(StringRef Name, const Elf_Sym &Sym,
|
|
|
|
InputSectionBase<ELFT> *Section) {
|
|
|
|
Symbol *S;
|
|
|
|
bool WasInserted;
|
|
|
|
std::tie(S, WasInserted) =
|
|
|
|
insert(Name, Sym.getType(), Sym.getVisibility(),
|
|
|
|
/*CanOmitFromDynSym*/ false, /*IsUsedInRegularObj*/ true,
|
|
|
|
Section ? Section->getFile() : nullptr);
|
|
|
|
int Cmp = compareDefinedNonCommon(S, WasInserted, Sym.getBinding());
|
|
|
|
if (Cmp > 0)
|
|
|
|
replaceBody<DefinedRegular<ELFT>>(S, Name, Sym, Section);
|
|
|
|
else if (Cmp == 0)
|
|
|
|
reportDuplicate(S->body(), Section->getFile());
|
|
|
|
return S;
|
|
|
|
}
|
|
|
|
|
|
|
|
template <typename ELFT>
|
|
|
|
Symbol *SymbolTable<ELFT>::addRegular(StringRef Name, uint8_t Binding,
|
|
|
|
uint8_t StOther) {
|
|
|
|
Symbol *S;
|
|
|
|
bool WasInserted;
|
|
|
|
std::tie(S, WasInserted) =
|
|
|
|
insert(Name, STT_NOTYPE, StOther & 3, /*CanOmitFromDynSym*/ false,
|
|
|
|
/*IsUsedInRegularObj*/ true, nullptr);
|
|
|
|
int Cmp = compareDefinedNonCommon(S, WasInserted, Binding);
|
|
|
|
if (Cmp > 0)
|
|
|
|
replaceBody<DefinedRegular<ELFT>>(S, Name, StOther);
|
|
|
|
else if (Cmp == 0)
|
|
|
|
reportDuplicate(S->body(), nullptr);
|
|
|
|
return S;
|
|
|
|
}
|
|
|
|
|
|
|
|
template <typename ELFT>
|
|
|
|
Symbol *SymbolTable<ELFT>::addSynthetic(StringRef N,
|
|
|
|
OutputSectionBase<ELFT> &Section,
|
|
|
|
uintX_t Value) {
|
|
|
|
Symbol *S;
|
|
|
|
bool WasInserted;
|
|
|
|
std::tie(S, WasInserted) =
|
|
|
|
insert(N, STT_NOTYPE, STV_HIDDEN, /*CanOmitFromDynSym*/ false,
|
|
|
|
/*IsUsedInRegularObj*/ true, nullptr);
|
|
|
|
int Cmp = compareDefinedNonCommon(S, WasInserted, STB_GLOBAL);
|
|
|
|
if (Cmp > 0)
|
|
|
|
replaceBody<DefinedSynthetic<ELFT>>(S, N, Value, Section);
|
|
|
|
else if (Cmp == 0)
|
|
|
|
reportDuplicate(S->body(), nullptr);
|
|
|
|
return S;
|
|
|
|
}
|
|
|
|
|
|
|
|
template <typename ELFT>
|
|
|
|
void SymbolTable<ELFT>::addShared(SharedFile<ELFT> *F, StringRef Name,
|
|
|
|
const Elf_Sym &Sym,
|
|
|
|
const typename ELFT::Verdef *Verdef) {
|
|
|
|
// DSO symbols do not affect visibility in the output, so we pass STV_DEFAULT
|
|
|
|
// as the visibility, which will leave the visibility in the symbol table
|
|
|
|
// unchanged.
|
|
|
|
Symbol *S;
|
|
|
|
bool WasInserted;
|
|
|
|
std::tie(S, WasInserted) =
|
|
|
|
insert(Name, Sym.getType(), STV_DEFAULT, /*CanOmitFromDynSym*/ true,
|
|
|
|
/*IsUsedInRegularObj*/ false, F);
|
|
|
|
// Make sure we preempt DSO symbols with default visibility.
|
|
|
|
if (Sym.getVisibility() == STV_DEFAULT)
|
|
|
|
S->ExportDynamic = true;
|
|
|
|
if (WasInserted || isa<Undefined>(S->body()))
|
|
|
|
replaceBody<SharedSymbol<ELFT>>(S, F, Name, Sym, Verdef);
|
|
|
|
}
|
|
|
|
|
|
|
|
template <class ELFT>
|
|
|
|
Symbol *SymbolTable<ELFT>::addBitcode(StringRef Name, bool IsWeak,
|
|
|
|
uint8_t StOther, uint8_t Type,
|
|
|
|
bool CanOmitFromDynSym, BitcodeFile *F) {
|
|
|
|
Symbol *S;
|
|
|
|
bool WasInserted;
|
|
|
|
std::tie(S, WasInserted) = insert(Name, Type, StOther & 3, CanOmitFromDynSym,
|
|
|
|
/*IsUsedInRegularObj*/ false, F);
|
|
|
|
int Cmp =
|
|
|
|
compareDefinedNonCommon(S, WasInserted, IsWeak ? STB_WEAK : STB_GLOBAL);
|
|
|
|
if (Cmp > 0)
|
|
|
|
replaceBody<DefinedBitcode>(S, Name, StOther, Type, F);
|
|
|
|
else if (Cmp == 0)
|
|
|
|
reportDuplicate(S->body(), F);
|
|
|
|
return S;
|
2015-09-05 06:28:10 +08:00
|
|
|
}
|
2015-07-25 05:03:07 +08:00
|
|
|
|
2015-10-14 00:34:14 +08:00
|
|
|
// Looks Name up in the symbol table. Returns the body of the matching symbol,
// or nullptr if no symbol with that name has been recorded.
template <class ELFT> SymbolBody *SymbolTable<ELFT>::find(StringRef Name) {
  auto Pos = Symtab.find(Name);
  // Symtab maps a name to an index into SymVector.
  return Pos != Symtab.end() ? SymVector[Pos->second]->body() : nullptr;
}
|
|
|
|
|
ELF: New symbol table design.
This patch implements a new design for the symbol table that stores
SymbolBodies within a memory region of the Symbol object. Symbols are mutated
by constructing SymbolBodies in place over existing SymbolBodies, rather
than by mutating pointers. As mentioned in the initial proposal [1], this
memory layout helps reduce the cache miss rate by improving memory locality.
Performance numbers:
old(s) new(s)
Without debug info:
chrome 7.178 6.432 (-11.5%)
LLVMgold.so 0.505 0.502 (-0.5%)
clang 0.954 0.827 (-15.4%)
llvm-as 0.052 0.045 (-15.5%)
With debug info:
scylla 5.695 5.613 (-1.5%)
clang 14.396 14.143 (-1.8%)
Performance counter results show that the reduction in required indirections is
indeed the cause of the improved performance. For example, when linking
chrome, stalled cycles decrease from 14,556,444,002 to 12,959,238,310, and
instructions per cycle increase from 0.78 to 0.83. We are also executing
many fewer instructions (15,516,401,933 down to 15,002,434,310), probably
because we spend less time allocating SymbolBodies.
The new mechanism by which symbols are added to the symbol table is by calling
add* functions on the SymbolTable.
In this patch, I handle local symbols by storing them inside "unparented"
SymbolBodies. This is suboptimal, but if we do want to try to avoid allocating
these SymbolBodies, we can probably do that separately.
I also removed a few members from the SymbolBody class that were only being
used to pass information from the input file to the symbol table.
This patch implements the new design for the ELF linker only. I intend to
prepare a similar patch for the COFF linker.
[1] http://lists.llvm.org/pipermail/llvm-dev/2016-April/098832.html
Differential Revision: http://reviews.llvm.org/D19752
llvm-svn: 268178
2016-05-01 12:55:03 +08:00
|
|
|
template <class ELFT>
|
|
|
|
void SymbolTable<ELFT>::addLazyArchive(
|
|
|
|
ArchiveFile *F, const llvm::object::Archive::Symbol Sym) {
|
|
|
|
Symbol *S;
|
|
|
|
bool WasInserted;
|
|
|
|
std::tie(S, WasInserted) = insert(Sym.getName());
|
|
|
|
if (WasInserted) {
|
|
|
|
replaceBody<LazyArchive>(S, F, Sym, STT_NOTYPE);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
if (!S->body()->isUndefined())
|
|
|
|
return;
|
|
|
|
|
|
|
|
// Weak undefined symbols should not fetch members from archives. If we were
|
|
|
|
// to keep old symbol we would not know that an archive member was available
|
|
|
|
// if a strong undefined symbol shows up afterwards in the link. If a strong
|
|
|
|
// undefined symbol never shows up, this lazy symbol will get to the end of
|
|
|
|
// the link and must be treated as the weak undefined one. We already marked
|
|
|
|
// this symbol as used when we added it to the symbol table, but we also need
|
|
|
|
// to preserve its type. FIXME: Move the Type field to Symbol.
|
|
|
|
if (S->isWeak()) {
|
|
|
|
replaceBody<LazyArchive>(S, F, Sym, S->body()->Type);
|
2015-10-06 22:33:58 +08:00
|
|
|
return;
|
|
|
|
}
|
ELF: New symbol table design.
This patch implements a new design for the symbol table that stores
SymbolBodies within a memory region of the Symbol object. Symbols are mutated
by constructing SymbolBodies in place over existing SymbolBodies, rather
than by mutating pointers. As mentioned in the initial proposal [1], this
memory layout helps reduce the cache miss rate by improving memory locality.
Performance numbers:
old(s) new(s)
Without debug info:
chrome 7.178 6.432 (-11.5%)
LLVMgold.so 0.505 0.502 (-0.5%)
clang 0.954 0.827 (-15.4%)
llvm-as 0.052 0.045 (-15.5%)
With debug info:
scylla 5.695 5.613 (-1.5%)
clang 14.396 14.143 (-1.8%)
Performance counter results show that the fewer required indirections is
indeed the cause of the improved performance. For example, when linking
chrome, stalled cycles decreases from 14,556,444,002 to 12,959,238,310, and
instructions per cycle increases from 0.78 to 0.83. We are also executing
many fewer instructions (15,516,401,933 down to 15,002,434,310), probably
because we spend less time allocating SymbolBodies.
The new mechanism by which symbols are added to the symbol table is by calling
add* functions on the SymbolTable.
In this patch, I handle local symbols by storing them inside "unparented"
SymbolBodies. This is suboptimal, but if we do want to try to avoid allocating
these SymbolBodies, we can probably do that separately.
I also removed a few members from the SymbolBody class that were only being
used to pass information from the input file to the symbol table.
This patch implements the new design for the ELF linker only. I intend to
prepare a similar patch for the COFF linker.
[1] http://lists.llvm.org/pipermail/llvm-dev/2016-April/098832.html
Differential Revision: http://reviews.llvm.org/D19752
llvm-svn: 268178
2016-05-01 12:55:03 +08:00
|
|
|
MemoryBufferRef MBRef = F->getMember(&Sym);
|
|
|
|
if (!MBRef.getBuffer().empty())
|
|
|
|
addFile(createObjectFile(MBRef, F->getName()));
|
2015-09-05 06:28:10 +08:00
|
|
|
}
|
|
|
|
|
2015-12-17 07:23:14 +08:00
|
|
|
template <class ELFT>
|
ELF: New symbol table design.
This patch implements a new design for the symbol table that stores
SymbolBodies within a memory region of the Symbol object. Symbols are mutated
by constructing SymbolBodies in place over existing SymbolBodies, rather
than by mutating pointers. As mentioned in the initial proposal [1], this
memory layout helps reduce the cache miss rate by improving memory locality.
Performance numbers:
old(s) new(s)
Without debug info:
chrome 7.178 6.432 (-11.5%)
LLVMgold.so 0.505 0.502 (-0.5%)
clang 0.954 0.827 (-15.4%)
llvm-as 0.052 0.045 (-15.5%)
With debug info:
scylla 5.695 5.613 (-1.5%)
clang 14.396 14.143 (-1.8%)
Performance counter results show that the fewer required indirections is
indeed the cause of the improved performance. For example, when linking
chrome, stalled cycles decreases from 14,556,444,002 to 12,959,238,310, and
instructions per cycle increases from 0.78 to 0.83. We are also executing
many fewer instructions (15,516,401,933 down to 15,002,434,310), probably
because we spend less time allocating SymbolBodies.
The new mechanism by which symbols are added to the symbol table is by calling
add* functions on the SymbolTable.
In this patch, I handle local symbols by storing them inside "unparented"
SymbolBodies. This is suboptimal, but if we do want to try to avoid allocating
these SymbolBodies, we can probably do that separately.
I also removed a few members from the SymbolBody class that were only being
used to pass information from the input file to the symbol table.
This patch implements the new design for the ELF linker only. I intend to
prepare a similar patch for the COFF linker.
[1] http://lists.llvm.org/pipermail/llvm-dev/2016-April/098832.html
Differential Revision: http://reviews.llvm.org/D19752
llvm-svn: 268178
2016-05-01 12:55:03 +08:00
|
|
|
void SymbolTable<ELFT>::addLazyObject(StringRef Name, MemoryBufferRef MBRef) {
|
|
|
|
Symbol *S;
|
|
|
|
bool WasInserted;
|
|
|
|
std::tie(S, WasInserted) = insert(Name);
|
|
|
|
if (WasInserted) {
|
|
|
|
replaceBody<LazyObject>(S, Name, MBRef, STT_NOTYPE);
|
2015-12-17 07:23:14 +08:00
|
|
|
return;
|
|
|
|
}
|
ELF: New symbol table design.
This patch implements a new design for the symbol table that stores
SymbolBodies within a memory region of the Symbol object. Symbols are mutated
by constructing SymbolBodies in place over existing SymbolBodies, rather
than by mutating pointers. As mentioned in the initial proposal [1], this
memory layout helps reduce the cache miss rate by improving memory locality.
Performance numbers:
old(s) new(s)
Without debug info:
chrome 7.178 6.432 (-11.5%)
LLVMgold.so 0.505 0.502 (-0.5%)
clang 0.954 0.827 (-15.4%)
llvm-as 0.052 0.045 (-15.5%)
With debug info:
scylla 5.695 5.613 (-1.5%)
clang 14.396 14.143 (-1.8%)
Performance counter results show that the fewer required indirections is
indeed the cause of the improved performance. For example, when linking
chrome, stalled cycles decreases from 14,556,444,002 to 12,959,238,310, and
instructions per cycle increases from 0.78 to 0.83. We are also executing
many fewer instructions (15,516,401,933 down to 15,002,434,310), probably
because we spend less time allocating SymbolBodies.
The new mechanism by which symbols are added to the symbol table is by calling
add* functions on the SymbolTable.
In this patch, I handle local symbols by storing them inside "unparented"
SymbolBodies. This is suboptimal, but if we do want to try to avoid allocating
these SymbolBodies, we can probably do that separately.
I also removed a few members from the SymbolBody class that were only being
used to pass information from the input file to the symbol table.
This patch implements the new design for the ELF linker only. I intend to
prepare a similar patch for the COFF linker.
[1] http://lists.llvm.org/pipermail/llvm-dev/2016-April/098832.html
Differential Revision: http://reviews.llvm.org/D19752
llvm-svn: 268178
2016-05-01 12:55:03 +08:00
|
|
|
if (!S->body()->isUndefined())
|
|
|
|
return;
|
2015-12-17 07:23:14 +08:00
|
|
|
|
ELF: New symbol table design.
This patch implements a new design for the symbol table that stores
SymbolBodies within a memory region of the Symbol object. Symbols are mutated
by constructing SymbolBodies in place over existing SymbolBodies, rather
than by mutating pointers. As mentioned in the initial proposal [1], this
memory layout helps reduce the cache miss rate by improving memory locality.
Performance numbers:
old(s) new(s)
Without debug info:
chrome 7.178 6.432 (-11.5%)
LLVMgold.so 0.505 0.502 (-0.5%)
clang 0.954 0.827 (-15.4%)
llvm-as 0.052 0.045 (-15.5%)
With debug info:
scylla 5.695 5.613 (-1.5%)
clang 14.396 14.143 (-1.8%)
Performance counter results show that the fewer required indirections is
indeed the cause of the improved performance. For example, when linking
chrome, stalled cycles decreases from 14,556,444,002 to 12,959,238,310, and
instructions per cycle increases from 0.78 to 0.83. We are also executing
many fewer instructions (15,516,401,933 down to 15,002,434,310), probably
because we spend less time allocating SymbolBodies.
The new mechanism by which symbols are added to the symbol table is by calling
add* functions on the SymbolTable.
In this patch, I handle local symbols by storing them inside "unparented"
SymbolBodies. This is suboptimal, but if we do want to try to avoid allocating
these SymbolBodies, we can probably do that separately.
I also removed a few members from the SymbolBody class that were only being
used to pass information from the input file to the symbol table.
This patch implements the new design for the ELF linker only. I intend to
prepare a similar patch for the COFF linker.
[1] http://lists.llvm.org/pipermail/llvm-dev/2016-April/098832.html
Differential Revision: http://reviews.llvm.org/D19752
llvm-svn: 268178
2016-05-01 12:55:03 +08:00
|
|
|
// See comment for addLazyArchive above.
|
|
|
|
if (S->isWeak())
|
|
|
|
replaceBody<LazyObject>(S, Name, MBRef, S->body()->Type);
|
|
|
|
else
|
|
|
|
addFile(createObjectFile(MBRef));
|
2015-07-25 05:03:07 +08:00
|
|
|
}
|
2015-09-26 02:56:53 +08:00
|
|
|
|
2016-04-27 08:05:03 +08:00
|
|
|
// Process undefined (-u) flags by loading lazy symbols named by those flags.
|
ELF: New symbol table design.
This patch implements a new design for the symbol table that stores
SymbolBodies within a memory region of the Symbol object. Symbols are mutated
by constructing SymbolBodies in place over existing SymbolBodies, rather
than by mutating pointers. As mentioned in the initial proposal [1], this
memory layout helps reduce the cache miss rate by improving memory locality.
Performance numbers:
old(s) new(s)
Without debug info:
chrome 7.178 6.432 (-11.5%)
LLVMgold.so 0.505 0.502 (-0.5%)
clang 0.954 0.827 (-15.4%)
llvm-as 0.052 0.045 (-15.5%)
With debug info:
scylla 5.695 5.613 (-1.5%)
clang 14.396 14.143 (-1.8%)
Performance counter results show that the fewer required indirections is
indeed the cause of the improved performance. For example, when linking
chrome, stalled cycles decreases from 14,556,444,002 to 12,959,238,310, and
instructions per cycle increases from 0.78 to 0.83. We are also executing
many fewer instructions (15,516,401,933 down to 15,002,434,310), probably
because we spend less time allocating SymbolBodies.
The new mechanism by which symbols are added to the symbol table is by calling
add* functions on the SymbolTable.
In this patch, I handle local symbols by storing them inside "unparented"
SymbolBodies. This is suboptimal, but if we do want to try to avoid allocating
these SymbolBodies, we can probably do that separately.
I also removed a few members from the SymbolBody class that were only being
used to pass information from the input file to the symbol table.
This patch implements the new design for the ELF linker only. I intend to
prepare a similar patch for the COFF linker.
[1] http://lists.llvm.org/pipermail/llvm-dev/2016-April/098832.html
Differential Revision: http://reviews.llvm.org/D19752
llvm-svn: 268178
2016-05-01 12:55:03 +08:00
|
|
|
template <class ELFT> void SymbolTable<ELFT>::scanUndefinedFlags() {
|
2016-04-27 08:05:03 +08:00
|
|
|
for (StringRef S : Config->Undefined)
|
ELF: New symbol table design.
This patch implements a new design for the symbol table that stores
SymbolBodies within a memory region of the Symbol object. Symbols are mutated
by constructing SymbolBodies in place over existing SymbolBodies, rather
than by mutating pointers. As mentioned in the initial proposal [1], this
memory layout helps reduce the cache miss rate by improving memory locality.
Performance numbers:
old(s) new(s)
Without debug info:
chrome 7.178 6.432 (-11.5%)
LLVMgold.so 0.505 0.502 (-0.5%)
clang 0.954 0.827 (-15.4%)
llvm-as 0.052 0.045 (-15.5%)
With debug info:
scylla 5.695 5.613 (-1.5%)
clang 14.396 14.143 (-1.8%)
Performance counter results show that the fewer required indirections is
indeed the cause of the improved performance. For example, when linking
chrome, stalled cycles decreases from 14,556,444,002 to 12,959,238,310, and
instructions per cycle increases from 0.78 to 0.83. We are also executing
many fewer instructions (15,516,401,933 down to 15,002,434,310), probably
because we spend less time allocating SymbolBodies.
The new mechanism by which symbols are added to the symbol table is by calling
add* functions on the SymbolTable.
In this patch, I handle local symbols by storing them inside "unparented"
SymbolBodies. This is suboptimal, but if we do want to try to avoid allocating
these SymbolBodies, we can probably do that separately.
I also removed a few members from the SymbolBody class that were only being
used to pass information from the input file to the symbol table.
This patch implements the new design for the ELF linker only. I intend to
prepare a similar patch for the COFF linker.
[1] http://lists.llvm.org/pipermail/llvm-dev/2016-April/098832.html
Differential Revision: http://reviews.llvm.org/D19752
llvm-svn: 268178
2016-05-01 12:55:03 +08:00
|
|
|
if (auto *L = dyn_cast_or_null<Lazy>(find(S)))
|
|
|
|
if (std::unique_ptr<InputFile> File = L->getFile())
|
|
|
|
addFile(std::move(File));
|
2016-04-27 08:05:03 +08:00
|
|
|
}
|
|
|
|
|
2015-10-14 02:10:33 +08:00
|
|
|
// This function takes care of the case in which shared libraries depend on
|
|
|
|
// the user program (not the other way, which is usual). Shared libraries
|
|
|
|
// may have undefined symbols, expecting that the user program provides
|
|
|
|
// the definitions for them. An example is BSD's __progname symbol.
|
|
|
|
// We need to put such symbols to the main program's .dynsym so that
|
|
|
|
// shared libraries can find them.
|
|
|
|
// Except this, we ignore undefined symbols in DSOs.
|
|
|
|
template <class ELFT> void SymbolTable<ELFT>::scanShlibUndefined() {
|
2015-10-14 00:34:14 +08:00
|
|
|
for (std::unique_ptr<SharedFile<ELFT>> &File : SharedFiles)
|
|
|
|
for (StringRef U : File->getUndefinedSymbols())
|
|
|
|
if (SymbolBody *Sym = find(U))
|
|
|
|
if (Sym->isDefined())
|
ELF: New symbol table design.
This patch implements a new design for the symbol table that stores
SymbolBodies within a memory region of the Symbol object. Symbols are mutated
by constructing SymbolBodies in place over existing SymbolBodies, rather
than by mutating pointers. As mentioned in the initial proposal [1], this
memory layout helps reduce the cache miss rate by improving memory locality.
Performance numbers:
old(s) new(s)
Without debug info:
chrome 7.178 6.432 (-11.5%)
LLVMgold.so 0.505 0.502 (-0.5%)
clang 0.954 0.827 (-15.4%)
llvm-as 0.052 0.045 (-15.5%)
With debug info:
scylla 5.695 5.613 (-1.5%)
clang 14.396 14.143 (-1.8%)
Performance counter results show that the fewer required indirections is
indeed the cause of the improved performance. For example, when linking
chrome, stalled cycles decreases from 14,556,444,002 to 12,959,238,310, and
instructions per cycle increases from 0.78 to 0.83. We are also executing
many fewer instructions (15,516,401,933 down to 15,002,434,310), probably
because we spend less time allocating SymbolBodies.
The new mechanism by which symbols are added to the symbol table is by calling
add* functions on the SymbolTable.
In this patch, I handle local symbols by storing them inside "unparented"
SymbolBodies. This is suboptimal, but if we do want to try to avoid allocating
these SymbolBodies, we can probably do that separately.
I also removed a few members from the SymbolBody class that were only being
used to pass information from the input file to the symbol table.
This patch implements the new design for the ELF linker only. I intend to
prepare a similar patch for the COFF linker.
[1] http://lists.llvm.org/pipermail/llvm-dev/2016-April/098832.html
Differential Revision: http://reviews.llvm.org/D19752
llvm-svn: 268178
2016-05-01 12:55:03 +08:00
|
|
|
Sym->symbol()->ExportDynamic = true;
|
2015-10-14 00:34:14 +08:00
|
|
|
}
|
|
|
|
|
2016-04-14 02:51:11 +08:00
|
|
|
// This function process the dynamic list option by marking all the symbols
|
|
|
|
// to be exported in the dynamic table.
|
|
|
|
template <class ELFT> void SymbolTable<ELFT>::scanDynamicList() {
|
|
|
|
for (StringRef S : Config->DynamicList)
|
|
|
|
if (SymbolBody *B = find(S))
|
ELF: New symbol table design.
This patch implements a new design for the symbol table that stores
SymbolBodies within a memory region of the Symbol object. Symbols are mutated
by constructing SymbolBodies in place over existing SymbolBodies, rather
than by mutating pointers. As mentioned in the initial proposal [1], this
memory layout helps reduce the cache miss rate by improving memory locality.
Performance numbers:
old(s) new(s)
Without debug info:
chrome 7.178 6.432 (-11.5%)
LLVMgold.so 0.505 0.502 (-0.5%)
clang 0.954 0.827 (-15.4%)
llvm-as 0.052 0.045 (-15.5%)
With debug info:
scylla 5.695 5.613 (-1.5%)
clang 14.396 14.143 (-1.8%)
Performance counter results show that the fewer required indirections is
indeed the cause of the improved performance. For example, when linking
chrome, stalled cycles decreases from 14,556,444,002 to 12,959,238,310, and
instructions per cycle increases from 0.78 to 0.83. We are also executing
many fewer instructions (15,516,401,933 down to 15,002,434,310), probably
because we spend less time allocating SymbolBodies.
The new mechanism by which symbols are added to the symbol table is by calling
add* functions on the SymbolTable.
In this patch, I handle local symbols by storing them inside "unparented"
SymbolBodies. This is suboptimal, but if we do want to try to avoid allocating
these SymbolBodies, we can probably do that separately.
I also removed a few members from the SymbolBody class that were only being
used to pass information from the input file to the symbol table.
This patch implements the new design for the ELF linker only. I intend to
prepare a similar patch for the COFF linker.
[1] http://lists.llvm.org/pipermail/llvm-dev/2016-April/098832.html
Differential Revision: http://reviews.llvm.org/D19752
llvm-svn: 268178
2016-05-01 12:55:03 +08:00
|
|
|
B->symbol()->ExportDynamic = true;
|
2016-04-14 02:51:11 +08:00
|
|
|
}
|
|
|
|
|
2016-04-23 04:21:26 +08:00
|
|
|
// This function processes the --version-script option by marking all global
|
|
|
|
// symbols with the VersionScriptGlobal flag, which acts as a filter on the
|
|
|
|
// dynamic symbol table.
|
|
|
|
template <class ELFT> void SymbolTable<ELFT>::scanVersionScript() {
|
|
|
|
for (StringRef S : Config->VersionScriptGlobals)
|
|
|
|
if (SymbolBody *B = find(S))
|
ELF: New symbol table design.
This patch implements a new design for the symbol table that stores
SymbolBodies within a memory region of the Symbol object. Symbols are mutated
by constructing SymbolBodies in place over existing SymbolBodies, rather
than by mutating pointers. As mentioned in the initial proposal [1], this
memory layout helps reduce the cache miss rate by improving memory locality.
Performance numbers:
old(s) new(s)
Without debug info:
chrome 7.178 6.432 (-11.5%)
LLVMgold.so 0.505 0.502 (-0.5%)
clang 0.954 0.827 (-15.4%)
llvm-as 0.052 0.045 (-15.5%)
With debug info:
scylla 5.695 5.613 (-1.5%)
clang 14.396 14.143 (-1.8%)
Performance counter results show that the fewer required indirections is
indeed the cause of the improved performance. For example, when linking
chrome, stalled cycles decreases from 14,556,444,002 to 12,959,238,310, and
instructions per cycle increases from 0.78 to 0.83. We are also executing
many fewer instructions (15,516,401,933 down to 15,002,434,310), probably
because we spend less time allocating SymbolBodies.
The new mechanism by which symbols are added to the symbol table is by calling
add* functions on the SymbolTable.
In this patch, I handle local symbols by storing them inside "unparented"
SymbolBodies. This is suboptimal, but if we do want to try to avoid allocating
these SymbolBodies, we can probably do that separately.
I also removed a few members from the SymbolBody class that were only being
used to pass information from the input file to the symbol table.
This patch implements the new design for the ELF linker only. I intend to
prepare a similar patch for the COFF linker.
[1] http://lists.llvm.org/pipermail/llvm-dev/2016-April/098832.html
Differential Revision: http://reviews.llvm.org/D19752
llvm-svn: 268178
2016-05-01 12:55:03 +08:00
|
|
|
B->symbol()->VersionScriptGlobal = true;
|
2016-04-23 04:21:26 +08:00
|
|
|
}
|
|
|
|
|
2016-02-28 08:25:54 +08:00
|
|
|
// Explicit instantiations of SymbolTable for each ELF flavour, grouped by
// endianness: little-endian first, then big-endian.
template class elf::SymbolTable<ELF32LE>;
template class elf::SymbolTable<ELF64LE>;
template class elf::SymbolTable<ELF32BE>;
template class elf::SymbolTable<ELF64BE>;
|