[WebAssembly] LTO: Honor comdat groups when loading bitcode files

But don't apply comdat groups when loading the LTO object files.
This is basically the same logic used by the ELF linker.

Differential Revision: https://reviews.llvm.org/D61924

llvm-svn: 360782
This commit is contained in:
Sam Clegg 2019-05-15 16:03:28 +00:00
parent 5c15dbafb9
commit 697f2149f1
5 changed files with 49 additions and 19 deletions

View File

@ -0,0 +1,15 @@
; Verify that comdat symbols can be defined in LTO objects. We had a
; regression where the comdat handling code was causing symbol in the lto object
; to be ignored.
; RUN: llvm-as %s -o %t.o
; RUN: wasm-ld %t.o %t.o -o %t.wasm
target datalayout = "e-m:e-p:32:32-i64:64-n32:64-S128"
target triple = "wasm32-unknown-unknown"
$foo = comdat any
define linkonce_odr void @_start() comdat($foo) {
entry:
ret void
}

View File

@ -60,7 +60,7 @@ InputFile *lld::wasm::createObjectFile(MemoryBufferRef MB,
} }
void ObjFile::dumpInfo() const { void ObjFile::dumpInfo() const {
log("info for: " + getName() + log("info for: " + toString(this) +
"\n Symbols : " + Twine(Symbols.size()) + "\n Symbols : " + Twine(Symbols.size()) +
"\n Function Imports : " + Twine(WasmObj->getNumImportedFunctions()) + "\n Function Imports : " + Twine(WasmObj->getNumImportedFunctions()) +
"\n Global Imports : " + Twine(WasmObj->getNumImportedGlobals()) + "\n Global Imports : " + Twine(WasmObj->getNumImportedGlobals()) +
@ -232,7 +232,7 @@ static void setRelocs(const std::vector<T *> &Chunks,
} }
} }
void ObjFile::parse() { void ObjFile::parse(bool IgnoreComdats) {
// Parse a memory buffer as a wasm file. // Parse a memory buffer as a wasm file.
LLVM_DEBUG(dbgs() << "Parsing object: " << toString(this) << "\n"); LLVM_DEBUG(dbgs() << "Parsing object: " << toString(this) << "\n");
std::unique_ptr<Binary> Bin = CHECK(createBinary(MB), toString(this)); std::unique_ptr<Binary> Bin = CHECK(createBinary(MB), toString(this));
@ -283,9 +283,11 @@ void ObjFile::parse() {
TypeIsUsed.resize(getWasmObj()->types().size(), false); TypeIsUsed.resize(getWasmObj()->types().size(), false);
ArrayRef<StringRef> Comdats = WasmObj->linkingData().Comdats; ArrayRef<StringRef> Comdats = WasmObj->linkingData().Comdats;
UsedComdats.resize(Comdats.size());
for (unsigned I = 0; I < Comdats.size(); ++I) for (unsigned I = 0; I < Comdats.size(); ++I)
UsedComdats[I] = Symtab->addComdat(Comdats[I]); if (IgnoreComdats)
KeptComdats.push_back(true);
else
KeptComdats.push_back(Symtab->addComdat(Comdats[I]));
// Populate `Segments`. // Populate `Segments`.
for (const WasmSegment &S : WasmObj->dataSegments()) for (const WasmSegment &S : WasmObj->dataSegments())
@ -326,7 +328,7 @@ bool ObjFile::isExcludedByComdat(InputChunk *Chunk) const {
uint32_t C = Chunk->getComdat(); uint32_t C = Chunk->getComdat();
if (C == UINT32_MAX) if (C == UINT32_MAX)
return false; return false;
return !UsedComdats[C]; return !KeptComdats[C];
} }
FunctionSymbol *ObjFile::getFunctionSymbol(uint32_t Index) const { FunctionSymbol *ObjFile::getFunctionSymbol(uint32_t Index) const {
@ -427,7 +429,7 @@ Symbol *ObjFile::createUndefined(const WasmSymbol &Sym) {
llvm_unreachable("unknown symbol kind"); llvm_unreachable("unknown symbol kind");
} }
void ArchiveFile::parse() { void ArchiveFile::parse(bool IgnoreComdats) {
// Parse a MemoryBufferRef as an archive file. // Parse a MemoryBufferRef as an archive file.
LLVM_DEBUG(dbgs() << "Parsing library: " << toString(this) << "\n"); LLVM_DEBUG(dbgs() << "Parsing library: " << toString(this) << "\n");
File = CHECK(Archive::create(MB), toString(this)); File = CHECK(Archive::create(MB), toString(this));
@ -474,14 +476,18 @@ static uint8_t mapVisibility(GlobalValue::VisibilityTypes GvVisibility) {
llvm_unreachable("unknown visibility"); llvm_unreachable("unknown visibility");
} }
static Symbol *createBitcodeSymbol(const lto::InputFile::Symbol &ObjSym, static Symbol *createBitcodeSymbol(const std::vector<bool> &KeptComdats,
const lto::InputFile::Symbol &ObjSym,
BitcodeFile &F) { BitcodeFile &F) {
StringRef Name = Saver.save(ObjSym.getName()); StringRef Name = Saver.save(ObjSym.getName());
uint32_t Flags = ObjSym.isWeak() ? WASM_SYMBOL_BINDING_WEAK : 0; uint32_t Flags = ObjSym.isWeak() ? WASM_SYMBOL_BINDING_WEAK : 0;
Flags |= mapVisibility(ObjSym.getVisibility()); Flags |= mapVisibility(ObjSym.getVisibility());
if (ObjSym.isUndefined()) { int C = ObjSym.getComdatIndex();
bool ExcludedByComdat = C != -1 && !KeptComdats[C];
if (ObjSym.isUndefined() || ExcludedByComdat) {
if (ObjSym.isExecutable()) if (ObjSym.isExecutable())
return Symtab->addUndefinedFunction(Name, Name, DefaultModule, Flags, &F, return Symtab->addUndefinedFunction(Name, Name, DefaultModule, Flags, &F,
nullptr); nullptr);
@ -493,7 +499,7 @@ static Symbol *createBitcodeSymbol(const lto::InputFile::Symbol &ObjSym,
return Symtab->addDefinedData(Name, Flags, &F, nullptr, 0, 0); return Symtab->addDefinedData(Name, Flags, &F, nullptr, 0, 0);
} }
void BitcodeFile::parse() { void BitcodeFile::parse(bool IgnoreComdats) {
Obj = check(lto::InputFile::create(MemoryBufferRef( Obj = check(lto::InputFile::create(MemoryBufferRef(
MB.getBuffer(), Saver.save(ArchiveName + MB.getBufferIdentifier())))); MB.getBuffer(), Saver.save(ArchiveName + MB.getBufferIdentifier()))));
Triple T(Obj->getTargetTriple()); Triple T(Obj->getTargetTriple());
@ -501,9 +507,15 @@ void BitcodeFile::parse() {
error(toString(MB.getBufferIdentifier()) + ": machine type must be wasm32"); error(toString(MB.getBufferIdentifier()) + ": machine type must be wasm32");
return; return;
} }
std::vector<bool> KeptComdats;
for (StringRef S : Obj->getComdatTable())
if (IgnoreComdats)
KeptComdats.push_back(true);
else
KeptComdats.push_back(Symtab->addComdat(S));
for (const lto::InputFile::Symbol &ObjSym : Obj->symbols()) for (const lto::InputFile::Symbol &ObjSym : Obj->symbols())
Symbols.push_back(createBitcodeSymbol(ObjSym, *this)); Symbols.push_back(createBitcodeSymbol(KeptComdats, ObjSym, *this));
} }
// Returns a string in the format of "foo.o" or "foo.a(bar.o)". // Returns a string in the format of "foo.o" or "foo.a(bar.o)".

View File

@ -44,7 +44,7 @@ public:
StringRef getName() const { return MB.getBufferIdentifier(); } StringRef getName() const { return MB.getBufferIdentifier(); }
// Reads a file (the constructor doesn't do that). // Reads a file (the constructor doesn't do that).
virtual void parse() = 0; virtual void parse(bool IgnoreComdats = false) = 0;
Kind kind() const { return FileKind; } Kind kind() const { return FileKind; }
@ -72,7 +72,7 @@ public:
void addMember(const llvm::object::Archive::Symbol *Sym); void addMember(const llvm::object::Archive::Symbol *Sym);
void parse() override; void parse(bool IgnoreComdats) override;
private: private:
std::unique_ptr<llvm::object::Archive> File; std::unique_ptr<llvm::object::Archive> File;
@ -88,7 +88,7 @@ public:
} }
static bool classof(const InputFile *F) { return F->kind() == ObjectKind; } static bool classof(const InputFile *F) { return F->kind() == ObjectKind; }
void parse() override; void parse(bool IgnoreComdats) override;
// Returns the underlying wasm file. // Returns the underlying wasm file.
const WasmObjectFile *getWasmObj() const { return WasmObj.get(); } const WasmObjectFile *getWasmObj() const { return WasmObj.get(); }
@ -111,7 +111,7 @@ public:
std::vector<bool> TypeIsUsed; std::vector<bool> TypeIsUsed;
// Maps function indices to table indices // Maps function indices to table indices
std::vector<uint32_t> TableEntries; std::vector<uint32_t> TableEntries;
std::vector<bool> UsedComdats; std::vector<bool> KeptComdats;
std::vector<InputSegment *> Segments; std::vector<InputSegment *> Segments;
std::vector<InputFunction *> Functions; std::vector<InputFunction *> Functions;
std::vector<InputGlobal *> Globals; std::vector<InputGlobal *> Globals;
@ -141,7 +141,7 @@ public:
explicit SharedFile(MemoryBufferRef M) : InputFile(SharedKind, M) {} explicit SharedFile(MemoryBufferRef M) : InputFile(SharedKind, M) {}
static bool classof(const InputFile *F) { return F->kind() == SharedKind; } static bool classof(const InputFile *F) { return F->kind() == SharedKind; }
void parse() override {} void parse(bool IgnoreComdats) override {}
}; };
// .bc file // .bc file
@ -153,7 +153,7 @@ public:
} }
static bool classof(const InputFile *F) { return F->kind() == BitcodeKind; } static bool classof(const InputFile *F) { return F->kind() == BitcodeKind; }
void parse() override; void parse(bool IgnoreComdats) override;
std::unique_ptr<llvm::lto::InputFile> Obj; std::unique_ptr<llvm::lto::InputFile> Obj;
}; };

View File

@ -59,7 +59,7 @@ void SymbolTable::addCombinedLTOObject() {
for (StringRef Filename : LTO->compile()) { for (StringRef Filename : LTO->compile()) {
auto *Obj = make<ObjFile>(MemoryBufferRef(Filename, "lto.tmp"), ""); auto *Obj = make<ObjFile>(MemoryBufferRef(Filename, "lto.tmp"), "");
Obj->parse(); Obj->parse(true);
ObjectFiles.push_back(Obj); ObjectFiles.push_back(Obj);
} }
} }
@ -476,7 +476,7 @@ void SymbolTable::addLazy(ArchiveFile *File, const Archive::Symbol *Sym) {
} }
bool SymbolTable::addComdat(StringRef Name) { bool SymbolTable::addComdat(StringRef Name) {
return Comdats.insert(CachedHashStringRef(Name)).second; return ComdatGroups.insert(CachedHashStringRef(Name)).second;
} }
// The new signature doesn't match. Create a variant to the symbol with the // The new signature doesn't match. Create a variant to the symbol with the

View File

@ -104,7 +104,10 @@ private:
// variants of the same symbol with different signatures. // variants of the same symbol with different signatures.
llvm::DenseMap<llvm::CachedHashStringRef, std::vector<Symbol *>> SymVariants; llvm::DenseMap<llvm::CachedHashStringRef, std::vector<Symbol *>> SymVariants;
llvm::DenseSet<llvm::CachedHashStringRef> Comdats; // Comdat groups define "link once" sections. If two comdat groups have the
// same name, only one of them is linked, and the other is ignored. This set
// is used to uniquify them.
llvm::DenseSet<llvm::CachedHashStringRef> ComdatGroups;
// For LTO. // For LTO.
std::unique_ptr<BitcodeCompiler> LTO; std::unique_ptr<BitcodeCompiler> LTO;