2017-04-25 07:21:38 +08:00
|
|
|
//===- ModuleSymbolTable.cpp - symbol table for in-memory IR --------------===//
|
2016-12-01 14:51:47 +08:00
|
|
|
//
|
2019-01-19 16:50:56 +08:00
|
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
2016-12-01 14:51:47 +08:00
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
//
|
|
|
|
// This class represents a symbol table built from in-memory IR. It provides
|
|
|
|
// access to GlobalValues and should only be used if such access is required
|
|
|
|
// (e.g. in the LTO implementation).
|
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
2017-06-06 19:49:48 +08:00
|
|
|
#include "llvm/Object/ModuleSymbolTable.h"
|
2016-12-01 14:51:47 +08:00
|
|
|
#include "RecordStreamer.h"
|
|
|
|
#include "llvm/ADT/STLExtras.h"
|
2017-06-06 19:49:48 +08:00
|
|
|
#include "llvm/ADT/SmallString.h"
|
2017-04-25 07:21:38 +08:00
|
|
|
#include "llvm/ADT/StringMap.h"
|
|
|
|
#include "llvm/ADT/StringRef.h"
|
|
|
|
#include "llvm/ADT/Triple.h"
|
|
|
|
#include "llvm/IR/Function.h"
|
|
|
|
#include "llvm/IR/GlobalAlias.h"
|
|
|
|
#include "llvm/IR/GlobalValue.h"
|
|
|
|
#include "llvm/IR/GlobalVariable.h"
|
2020-06-30 18:48:10 +08:00
|
|
|
#include "llvm/IR/InlineAsm.h"
|
2016-12-01 14:51:47 +08:00
|
|
|
#include "llvm/IR/Module.h"
|
|
|
|
#include "llvm/MC/MCAsmInfo.h"
|
|
|
|
#include "llvm/MC/MCContext.h"
|
2017-04-25 07:21:38 +08:00
|
|
|
#include "llvm/MC/MCDirectives.h"
|
2016-12-01 14:51:47 +08:00
|
|
|
#include "llvm/MC/MCInstrInfo.h"
|
|
|
|
#include "llvm/MC/MCObjectFileInfo.h"
|
|
|
|
#include "llvm/MC/MCParser/MCAsmParser.h"
|
|
|
|
#include "llvm/MC/MCParser/MCTargetAsmParser.h"
|
|
|
|
#include "llvm/MC/MCRegisterInfo.h"
|
|
|
|
#include "llvm/MC/MCSubtargetInfo.h"
|
2017-04-25 07:21:38 +08:00
|
|
|
#include "llvm/MC/MCSymbol.h"
|
|
|
|
#include "llvm/MC/MCTargetOptions.h"
|
|
|
|
#include "llvm/Object/SymbolicFile.h"
|
|
|
|
#include "llvm/Support/Casting.h"
|
|
|
|
#include "llvm/Support/CodeGen.h"
|
|
|
|
#include "llvm/Support/ErrorHandling.h"
|
2016-12-01 14:51:47 +08:00
|
|
|
#include "llvm/Support/MemoryBuffer.h"
|
2017-04-25 07:21:38 +08:00
|
|
|
#include "llvm/Support/SMLoc.h"
|
2016-12-01 14:51:47 +08:00
|
|
|
#include "llvm/Support/SourceMgr.h"
|
|
|
|
#include "llvm/Support/TargetRegistry.h"
|
2017-06-06 19:49:48 +08:00
|
|
|
#include "llvm/Support/raw_ostream.h"
|
2017-04-25 07:21:38 +08:00
|
|
|
#include <algorithm>
|
|
|
|
#include <cassert>
|
|
|
|
#include <cstdint>
|
|
|
|
#include <memory>
|
|
|
|
#include <string>
|
|
|
|
|
2016-12-01 14:51:47 +08:00
|
|
|
using namespace llvm;
|
|
|
|
using namespace object;
|
|
|
|
|
|
|
|
void ModuleSymbolTable::addModule(Module *M) {
|
|
|
|
if (FirstMod)
|
|
|
|
assert(FirstMod->getTargetTriple() == M->getTargetTriple());
|
|
|
|
else
|
|
|
|
FirstMod = M;
|
|
|
|
|
2017-03-30 03:26:26 +08:00
|
|
|
for (GlobalValue &GV : M->global_values())
|
2016-12-01 14:51:47 +08:00
|
|
|
SymTab.push_back(&GV);
|
|
|
|
|
Perform symbol binding for .symver versioned symbols
Summary:
In a .symver assembler directive like:
.symver name, name2@@nodename
"name2@@nodename" should get the same symbol binding as "name".
While the ELF object writer is updating the symbol binding for .symver
aliases before emitting the object file, not doing so when the module
inline assembly is handled by the RecordStreamer is causing the wrong
behavior in *LTO mode.
E.g. when "name" is global, "name2@@nodename" must also be marked as
global. Otherwise, the symbol is skipped when iterating over the LTO
InputFile symbols (InputFile::Symbol::shouldSkip). So, for example,
when performing any *LTO via the gold-plugin, the versioned symbol
definition is not recorded by the plugin and passed back to the
linker. If the object was in an archive, and there were no other symbols
needed from that object, the object would not be included in the final
link and references to the versioned symbol are undefined.
The llvm-lto2 tests added will give an error about an unused symbol
resolution without the fix.
Reviewers: rafael, pcc
Reviewed By: pcc
Subscribers: mehdi_amini, llvm-commits
Differential Revision: https://reviews.llvm.org/D30485
llvm-svn: 297332
2017-03-09 08:19:49 +08:00
|
|
|
CollectAsmSymbols(*M, [this](StringRef Name, BasicSymbolRef::Flags Flags) {
|
2020-01-29 09:09:24 +08:00
|
|
|
SymTab.push_back(new (AsmSymbols.Allocate())
|
|
|
|
AsmSymbol(std::string(Name), Flags));
|
Perform symbol binding for .symver versioned symbols
Summary:
In a .symver assembler directive like:
.symver name, name2@@nodename
"name2@@nodename" should get the same symbol binding as "name".
While the ELF object writer is updating the symbol binding for .symver
aliases before emitting the object file, not doing so when the module
inline assembly is handled by the RecordStreamer is causing the wrong
behavior in *LTO mode.
E.g. when "name" is global, "name2@@nodename" must also be marked as
global. Otherwise, the symbol is skipped when iterating over the LTO
InputFile symbols (InputFile::Symbol::shouldSkip). So, for example,
when performing any *LTO via the gold-plugin, the versioned symbol
definition is not recorded by the plugin and passed back to the
linker. If the object was in an archive, and there were no other symbols
needed from that object, the object would not be included in the final
link and references to the versioned symbol are undefined.
The llvm-lto2 tests added will give an error about an unused symbol
resolution without the fix.
Reviewers: rafael, pcc
Reviewed By: pcc
Subscribers: mehdi_amini, llvm-commits
Differential Revision: https://reviews.llvm.org/D30485
llvm-svn: 297332
2017-03-09 08:19:49 +08:00
|
|
|
});
|
|
|
|
}
|
|
|
|
|
2018-04-20 09:36:48 +08:00
|
|
|
static void
|
|
|
|
initializeRecordStreamer(const Module &M,
|
|
|
|
function_ref<void(RecordStreamer &)> Init) {
|
Perform symbol binding for .symver versioned symbols
Summary:
In a .symver assembler directive like:
.symver name, name2@@nodename
"name2@@nodename" should get the same symbol binding as "name".
While the ELF object writer is updating the symbol binding for .symver
aliases before emitting the object file, not doing so when the module
inline assembly is handled by the RecordStreamer is causing the wrong
behavior in *LTO mode.
E.g. when "name" is global, "name2@@nodename" must also be marked as
global. Otherwise, the symbol is skipped when iterating over the LTO
InputFile symbols (InputFile::Symbol::shouldSkip). So, for example,
when performing any *LTO via the gold-plugin, the versioned symbol
definition is not recorded by the plugin and passed back to the
linker. If the object was in an archive, and there were no other symbols
needed from that object, the object would not be included in the final
link and references to the versioned symbol are undefined.
The llvm-lto2 tests added will give an error about an unused symbol
resolution without the fix.
Reviewers: rafael, pcc
Reviewed By: pcc
Subscribers: mehdi_amini, llvm-commits
Differential Revision: https://reviews.llvm.org/D30485
llvm-svn: 297332
2017-03-09 08:19:49 +08:00
|
|
|
StringRef InlineAsm = M.getModuleInlineAsm();
|
2016-12-01 14:51:47 +08:00
|
|
|
if (InlineAsm.empty())
|
|
|
|
return;
|
|
|
|
|
|
|
|
std::string Err;
|
Perform symbol binding for .symver versioned symbols
Summary:
In a .symver assembler directive like:
.symver name, name2@@nodename
"name2@@nodename" should get the same symbol binding as "name".
While the ELF object writer is updating the symbol binding for .symver
aliases before emitting the object file, not doing so when the module
inline assembly is handled by the RecordStreamer is causing the wrong
behavior in *LTO mode.
E.g. when "name" is global, "name2@@nodename" must also be marked as
global. Otherwise, the symbol is skipped when iterating over the LTO
InputFile symbols (InputFile::Symbol::shouldSkip). So, for example,
when performing any *LTO via the gold-plugin, the versioned symbol
definition is not recorded by the plugin and passed back to the
linker. If the object was in an archive, and there were no other symbols
needed from that object, the object would not be included in the final
link and references to the versioned symbol are undefined.
The llvm-lto2 tests added will give an error about an unused symbol
resolution without the fix.
Reviewers: rafael, pcc
Reviewed By: pcc
Subscribers: mehdi_amini, llvm-commits
Differential Revision: https://reviews.llvm.org/D30485
llvm-svn: 297332
2017-03-09 08:19:49 +08:00
|
|
|
const Triple TT(M.getTargetTriple());
|
2016-12-01 14:51:47 +08:00
|
|
|
const Target *T = TargetRegistry::lookupTarget(TT.str(), Err);
|
|
|
|
assert(T && T->hasMCAsmParser());
|
|
|
|
|
|
|
|
std::unique_ptr<MCRegisterInfo> MRI(T->createMCRegInfo(TT.str()));
|
|
|
|
if (!MRI)
|
|
|
|
return;
|
|
|
|
|
2019-10-23 18:24:35 +08:00
|
|
|
MCTargetOptions MCOptions;
|
|
|
|
std::unique_ptr<MCAsmInfo> MAI(T->createMCAsmInfo(*MRI, TT.str(), MCOptions));
|
2016-12-01 14:51:47 +08:00
|
|
|
if (!MAI)
|
|
|
|
return;
|
|
|
|
|
|
|
|
std::unique_ptr<MCSubtargetInfo> STI(
|
|
|
|
T->createMCSubtargetInfo(TT.str(), "", ""));
|
|
|
|
if (!STI)
|
|
|
|
return;
|
|
|
|
|
|
|
|
std::unique_ptr<MCInstrInfo> MCII(T->createMCInstrInfo());
|
|
|
|
if (!MCII)
|
|
|
|
return;
|
|
|
|
|
|
|
|
MCObjectFileInfo MOFI;
|
|
|
|
MCContext MCCtx(MAI.get(), MRI.get(), &MOFI);
|
2017-08-03 04:32:26 +08:00
|
|
|
MOFI.InitMCObjectFileInfo(TT, /*PIC*/ false, MCCtx);
|
2018-12-14 09:14:10 +08:00
|
|
|
MOFI.setSDKVersion(M.getSDKVersion());
|
2018-03-20 08:38:33 +08:00
|
|
|
RecordStreamer Streamer(MCCtx, M);
|
2016-12-01 14:51:47 +08:00
|
|
|
T->createNullTargetStreamer(Streamer);
|
|
|
|
|
|
|
|
std::unique_ptr<MemoryBuffer> Buffer(MemoryBuffer::getMemBuffer(InlineAsm));
|
|
|
|
SourceMgr SrcMgr;
|
|
|
|
SrcMgr.AddNewSourceBuffer(std::move(Buffer), SMLoc());
|
|
|
|
std::unique_ptr<MCAsmParser> Parser(
|
|
|
|
createMCAsmParser(SrcMgr, MCCtx, Streamer, *MAI));
|
|
|
|
|
|
|
|
std::unique_ptr<MCTargetAsmParser> TAP(
|
|
|
|
T->createMCAsmParser(*STI, *Parser, *MCII, MCOptions));
|
|
|
|
if (!TAP)
|
|
|
|
return;
|
|
|
|
|
2020-06-30 18:48:10 +08:00
|
|
|
// Module-level inline asm is assumed to use At&t syntax (see
|
|
|
|
// AsmPrinter::doInitialization()).
|
|
|
|
Parser->setAssemblerDialect(InlineAsm::AD_ATT);
|
|
|
|
|
2016-12-01 14:51:47 +08:00
|
|
|
Parser->setTargetParser(*TAP);
|
|
|
|
if (Parser->Run(false))
|
|
|
|
return;
|
|
|
|
|
2018-04-20 09:36:48 +08:00
|
|
|
Init(Streamer);
|
|
|
|
}
|
|
|
|
|
|
|
|
void ModuleSymbolTable::CollectAsmSymbols(
|
|
|
|
const Module &M,
|
|
|
|
function_ref<void(StringRef, BasicSymbolRef::Flags)> AsmSymbol) {
|
|
|
|
initializeRecordStreamer(M, [&](RecordStreamer &Streamer) {
|
|
|
|
Streamer.flushSymverDirectives();
|
|
|
|
|
|
|
|
for (auto &KV : Streamer) {
|
|
|
|
StringRef Key = KV.first();
|
|
|
|
RecordStreamer::State Value = KV.second;
|
|
|
|
// FIXME: For now we just assume that all asm symbols are executable.
|
|
|
|
uint32_t Res = BasicSymbolRef::SF_Executable;
|
|
|
|
switch (Value) {
|
|
|
|
case RecordStreamer::NeverSeen:
|
|
|
|
llvm_unreachable("NeverSeen should have been replaced earlier");
|
|
|
|
case RecordStreamer::DefinedGlobal:
|
|
|
|
Res |= BasicSymbolRef::SF_Global;
|
|
|
|
break;
|
|
|
|
case RecordStreamer::Defined:
|
|
|
|
break;
|
|
|
|
case RecordStreamer::Global:
|
|
|
|
case RecordStreamer::Used:
|
|
|
|
Res |= BasicSymbolRef::SF_Undefined;
|
|
|
|
Res |= BasicSymbolRef::SF_Global;
|
|
|
|
break;
|
|
|
|
case RecordStreamer::DefinedWeak:
|
|
|
|
Res |= BasicSymbolRef::SF_Weak;
|
|
|
|
Res |= BasicSymbolRef::SF_Global;
|
|
|
|
break;
|
|
|
|
case RecordStreamer::UndefinedWeak:
|
|
|
|
Res |= BasicSymbolRef::SF_Weak;
|
|
|
|
Res |= BasicSymbolRef::SF_Undefined;
|
|
|
|
}
|
|
|
|
AsmSymbol(Key, BasicSymbolRef::Flags(Res));
|
2016-12-01 14:51:47 +08:00
|
|
|
}
|
2018-04-20 09:36:48 +08:00
|
|
|
});
|
|
|
|
}
|
|
|
|
|
|
|
|
void ModuleSymbolTable::CollectAsmSymvers(
|
|
|
|
const Module &M, function_ref<void(StringRef, StringRef)> AsmSymver) {
|
|
|
|
initializeRecordStreamer(M, [&](RecordStreamer &Streamer) {
|
|
|
|
for (auto &KV : Streamer.symverAliases())
|
|
|
|
for (auto &Alias : KV.second)
|
|
|
|
AsmSymver(KV.first->getName(), Alias);
|
|
|
|
});
|
2016-12-01 14:51:47 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
void ModuleSymbolTable::printSymbolName(raw_ostream &OS, Symbol S) const {
|
|
|
|
if (S.is<AsmSymbol *>()) {
|
|
|
|
OS << S.get<AsmSymbol *>()->first;
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
auto *GV = S.get<GlobalValue *>();
|
|
|
|
if (GV->hasDLLImportStorageClass())
|
|
|
|
OS << "__imp_";
|
|
|
|
|
|
|
|
Mang.getNameWithPrefix(OS, GV, false);
|
|
|
|
}
|
|
|
|
|
|
|
|
uint32_t ModuleSymbolTable::getSymbolFlags(Symbol S) const {
|
|
|
|
if (S.is<AsmSymbol *>())
|
|
|
|
return S.get<AsmSymbol *>()->second;
|
|
|
|
|
|
|
|
auto *GV = S.get<GlobalValue *>();
|
|
|
|
|
|
|
|
uint32_t Res = BasicSymbolRef::SF_None;
|
|
|
|
if (GV->isDeclarationForLinker())
|
|
|
|
Res |= BasicSymbolRef::SF_Undefined;
|
|
|
|
else if (GV->hasHiddenVisibility() && !GV->hasLocalLinkage())
|
|
|
|
Res |= BasicSymbolRef::SF_Hidden;
|
|
|
|
if (const GlobalVariable *GVar = dyn_cast<GlobalVariable>(GV)) {
|
|
|
|
if (GVar->isConstant())
|
|
|
|
Res |= BasicSymbolRef::SF_Const;
|
|
|
|
}
|
2016-12-01 14:53:47 +08:00
|
|
|
if (dyn_cast_or_null<Function>(GV->getBaseObject()))
|
|
|
|
Res |= BasicSymbolRef::SF_Executable;
|
2016-12-01 15:00:35 +08:00
|
|
|
if (isa<GlobalAlias>(GV))
|
|
|
|
Res |= BasicSymbolRef::SF_Indirect;
|
2016-12-01 14:51:47 +08:00
|
|
|
if (GV->hasPrivateLinkage())
|
|
|
|
Res |= BasicSymbolRef::SF_FormatSpecific;
|
|
|
|
if (!GV->hasLocalLinkage())
|
|
|
|
Res |= BasicSymbolRef::SF_Global;
|
|
|
|
if (GV->hasCommonLinkage())
|
|
|
|
Res |= BasicSymbolRef::SF_Common;
|
|
|
|
if (GV->hasLinkOnceLinkage() || GV->hasWeakLinkage() ||
|
|
|
|
GV->hasExternalWeakLinkage())
|
|
|
|
Res |= BasicSymbolRef::SF_Weak;
|
|
|
|
|
|
|
|
if (GV->getName().startswith("llvm."))
|
|
|
|
Res |= BasicSymbolRef::SF_FormatSpecific;
|
|
|
|
else if (auto *Var = dyn_cast<GlobalVariable>(GV)) {
|
|
|
|
if (Var->getSection() == "llvm.metadata")
|
|
|
|
Res |= BasicSymbolRef::SF_FormatSpecific;
|
|
|
|
}
|
|
|
|
|
|
|
|
return Res;
|
|
|
|
}
|