forked from OSchip/llvm-project
534 lines
17 KiB
C++
534 lines
17 KiB
C++
//===-- sancov.cc --------------------------------------------===//
|
|
//
|
|
// The LLVM Compiler Infrastructure
|
|
//
|
|
// This file is distributed under the University of Illinois Open Source
|
|
// License. See LICENSE.TXT for details.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
// This file is a command-line tool for reading and analyzing sanitizer
|
|
// coverage.
|
|
//===----------------------------------------------------------------------===//
|
|
#include "llvm/ADT/STLExtras.h"
|
|
#include "llvm/DebugInfo/Symbolize/Symbolize.h"
|
|
#include "llvm/MC/MCAsmInfo.h"
|
|
#include "llvm/MC/MCContext.h"
|
|
#include "llvm/MC/MCDisassembler.h"
|
|
#include "llvm/MC/MCInst.h"
|
|
#include "llvm/MC/MCInstPrinter.h"
|
|
#include "llvm/MC/MCInstrAnalysis.h"
|
|
#include "llvm/MC/MCInstrInfo.h"
|
|
#include "llvm/MC/MCObjectFileInfo.h"
|
|
#include "llvm/MC/MCRegisterInfo.h"
|
|
#include "llvm/MC/MCSubtargetInfo.h"
|
|
#include "llvm/Object/Archive.h"
|
|
#include "llvm/Object/Binary.h"
|
|
#include "llvm/Object/ObjectFile.h"
|
|
#include "llvm/Support/CommandLine.h"
|
|
#include "llvm/Support/Errc.h"
|
|
#include "llvm/Support/ErrorOr.h"
|
|
#include "llvm/Support/FileSystem.h"
|
|
#include "llvm/Support/LineIterator.h"
|
|
#include "llvm/Support/ManagedStatic.h"
|
|
#include "llvm/Support/MemoryBuffer.h"
|
|
#include "llvm/Support/Path.h"
|
|
#include "llvm/Support/PrettyStackTrace.h"
|
|
#include "llvm/Support/Signals.h"
|
|
#include "llvm/Support/SpecialCaseList.h"
|
|
#include "llvm/Support/TargetRegistry.h"
|
|
#include "llvm/Support/TargetSelect.h"
|
|
#include "llvm/Support/ToolOutputFile.h"
|
|
#include "llvm/Support/raw_ostream.h"
|
|
|
|
#include <set>
|
|
#include <stdio.h>
|
|
#include <string>
|
|
#include <vector>
|
|
|
|
using namespace llvm;
|
|
|
|
namespace {
|
|
|
|
// --------- COMMAND LINE FLAGS ---------
|
|
|
|
enum ActionType {
|
|
PrintAction,
|
|
CoveredFunctionsAction,
|
|
NotCoveredFunctionsAction
|
|
};
|
|
|
|
cl::opt<ActionType> Action(
|
|
cl::desc("Action (required)"), cl::Required,
|
|
cl::values(clEnumValN(PrintAction, "print", "Print coverage addresses"),
|
|
clEnumValN(CoveredFunctionsAction, "covered-functions",
|
|
"Print all covered funcions."),
|
|
clEnumValN(NotCoveredFunctionsAction, "not-covered-functions",
|
|
"Print all not covered funcions."),
|
|
clEnumValEnd));
|
|
|
|
static cl::list<std::string> ClInputFiles(cl::Positional, cl::OneOrMore,
|
|
cl::desc("<filenames...>"));
|
|
|
|
static cl::opt<std::string>
|
|
ClBinaryName("obj", cl::Required,
|
|
cl::desc("Path to object file to be symbolized"));
|
|
|
|
static cl::opt<bool>
|
|
ClDemangle("demangle", cl::init(true),
|
|
cl::desc("Print demangled function name."));
|
|
|
|
static cl::opt<std::string> ClStripPathPrefix(
|
|
"strip_path_prefix", cl::init(""),
|
|
cl::desc("Strip this prefix from file paths in reports."));
|
|
|
|
static cl::opt<std::string>
|
|
ClBlacklist("blacklist", cl::init(""),
|
|
cl::desc("Blacklist file (sanitizer blacklist format)."));
|
|
|
|
static cl::opt<bool> ClUseDefaultBlacklist(
|
|
"use_default_blacklist", cl::init(true), cl::Hidden,
|
|
cl::desc("Controls if default blacklist should be used."));
|
|
|
|
static const char *const DefaultBlacklist = "fun:__sanitizer_*";
|
|
|
|
// --------- FORMAT SPECIFICATION ---------
|
|
|
|
struct FileHeader {
|
|
uint32_t Bitness;
|
|
uint32_t Magic;
|
|
};
|
|
|
|
static const uint32_t BinCoverageMagic = 0xC0BFFFFF;
|
|
static const uint32_t Bitness32 = 0xFFFFFF32;
|
|
static const uint32_t Bitness64 = 0xFFFFFF64;
|
|
|
|
// ---------
|
|
|
|
static void FailIfError(std::error_code Error) {
|
|
if (!Error)
|
|
return;
|
|
errs() << "Error: " << Error.message() << "(" << Error.value() << ")\n";
|
|
exit(1);
|
|
}
|
|
|
|
template <typename T> static void FailIfError(const ErrorOr<T> &E) {
|
|
FailIfError(E.getError());
|
|
}
|
|
|
|
static void FailIfNotEmpty(const std::string &E) {
|
|
if (E.empty())
|
|
return;
|
|
errs() << "Error: " << E << "\n";
|
|
exit(1);
|
|
}
|
|
|
|
template <typename T>
|
|
static void FailIfEmpty(const std::unique_ptr<T> &Ptr,
|
|
const std::string &Message) {
|
|
if (Ptr.get())
|
|
return;
|
|
errs() << "Error: " << Message << "\n";
|
|
exit(1);
|
|
}
|
|
|
|
template <typename T>
|
|
static void readInts(const char *Start, const char *End,
|
|
std::set<uint64_t> *Ints) {
|
|
const T *S = reinterpret_cast<const T *>(Start);
|
|
const T *E = reinterpret_cast<const T *>(End);
|
|
std::copy(S, E, std::inserter(*Ints, Ints->end()));
|
|
}
|
|
|
|
struct FileLoc {
|
|
bool operator<(const FileLoc &RHS) const {
|
|
return std::tie(FileName, Line) < std::tie(RHS.FileName, RHS.Line);
|
|
}
|
|
|
|
std::string FileName;
|
|
uint32_t Line;
|
|
};
|
|
|
|
struct FunctionLoc {
|
|
bool operator<(const FunctionLoc &RHS) const {
|
|
return std::tie(Loc, FunctionName) < std::tie(RHS.Loc, RHS.FunctionName);
|
|
}
|
|
|
|
FileLoc Loc;
|
|
std::string FunctionName;
|
|
};
|
|
|
|
std::string stripPathPrefix(std::string Path) {
|
|
if (ClStripPathPrefix.empty())
|
|
return Path;
|
|
size_t Pos = Path.find(ClStripPathPrefix);
|
|
if (Pos == std::string::npos)
|
|
return Path;
|
|
return Path.substr(Pos + ClStripPathPrefix.size());
|
|
}
|
|
|
|
// Compute [FileLoc -> FunctionName] map for given addresses.
|
|
static std::map<FileLoc, std::string>
|
|
computeFunctionsMap(const std::set<uint64_t> &Addrs) {
|
|
std::map<FileLoc, std::string> Fns;
|
|
|
|
symbolize::LLVMSymbolizer::Options SymbolizerOptions;
|
|
SymbolizerOptions.Demangle = ClDemangle;
|
|
SymbolizerOptions.UseSymbolTable = true;
|
|
symbolize::LLVMSymbolizer Symbolizer(SymbolizerOptions);
|
|
|
|
// Fill in Fns map.
|
|
for (auto Addr : Addrs) {
|
|
auto InliningInfo = Symbolizer.symbolizeInlinedCode(ClBinaryName, Addr);
|
|
FailIfError(InliningInfo);
|
|
for (uint32_t I = 0; I < InliningInfo->getNumberOfFrames(); ++I) {
|
|
auto FrameInfo = InliningInfo->getFrame(I);
|
|
SmallString<256> FileName(FrameInfo.FileName);
|
|
sys::path::remove_dots(FileName, /* remove_dot_dot */ true);
|
|
FileLoc Loc = {FileName.str(), FrameInfo.Line};
|
|
Fns[Loc] = FrameInfo.FunctionName;
|
|
}
|
|
}
|
|
|
|
return Fns;
|
|
}
|
|
|
|
// Compute functions for given addresses. It keeps only the first
|
|
// occurence of a function within a file.
|
|
std::set<FunctionLoc> computeFunctionLocs(const std::set<uint64_t> &Addrs) {
|
|
std::map<FileLoc, std::string> Fns = computeFunctionsMap(Addrs);
|
|
|
|
std::set<FunctionLoc> Result;
|
|
std::string LastFileName;
|
|
std::set<std::string> ProcessedFunctions;
|
|
|
|
for (const auto &P : Fns) {
|
|
std::string FileName = P.first.FileName;
|
|
std::string FunctionName = P.second;
|
|
|
|
if (LastFileName != FileName)
|
|
ProcessedFunctions.clear();
|
|
LastFileName = FileName;
|
|
|
|
if (!ProcessedFunctions.insert(FunctionName).second)
|
|
continue;
|
|
|
|
Result.insert(FunctionLoc{P.first, P.second});
|
|
}
|
|
|
|
return Result;
|
|
}
|
|
|
|
// Locate __sanitizer_cov* function addresses that are used for coverage
|
|
// reporting.
|
|
static std::set<uint64_t>
|
|
findSanitizerCovFunctions(const object::ObjectFile &O) {
|
|
std::set<uint64_t> Result;
|
|
|
|
for (const object::SymbolRef &Symbol : O.symbols()) {
|
|
ErrorOr<uint64_t> AddressOrErr = Symbol.getAddress();
|
|
FailIfError(AddressOrErr);
|
|
|
|
ErrorOr<StringRef> NameOrErr = Symbol.getName();
|
|
FailIfError(NameOrErr);
|
|
StringRef Name = NameOrErr.get();
|
|
|
|
if (Name == "__sanitizer_cov" || Name == "__sanitizer_cov_with_check" ||
|
|
Name == "__sanitizer_cov_trace_func_enter") {
|
|
Result.insert(AddressOrErr.get());
|
|
}
|
|
}
|
|
|
|
if (Result.empty())
|
|
FailIfNotEmpty("__sanitizer_cov* functions not found");
|
|
|
|
return Result;
|
|
}
|
|
|
|
// Locate addresses of all coverage points in a file. Coverage point
|
|
// is defined as the 'address of instruction following __sanitizer_cov
|
|
// call - 1'.
|
|
static void getObjectCoveragePoints(const object::ObjectFile &O,
|
|
std::set<uint64_t> *Addrs) {
|
|
Triple TheTriple("unknown-unknown-unknown");
|
|
TheTriple.setArch(Triple::ArchType(O.getArch()));
|
|
auto TripleName = TheTriple.getTriple();
|
|
|
|
std::string Error;
|
|
const Target *TheTarget = TargetRegistry::lookupTarget(TripleName, Error);
|
|
FailIfNotEmpty(Error);
|
|
|
|
std::unique_ptr<const MCSubtargetInfo> STI(
|
|
TheTarget->createMCSubtargetInfo(TripleName, "", ""));
|
|
FailIfEmpty(STI, "no subtarget info for target " + TripleName);
|
|
|
|
std::unique_ptr<const MCRegisterInfo> MRI(
|
|
TheTarget->createMCRegInfo(TripleName));
|
|
FailIfEmpty(MRI, "no register info for target " + TripleName);
|
|
|
|
std::unique_ptr<const MCAsmInfo> AsmInfo(
|
|
TheTarget->createMCAsmInfo(*MRI, TripleName));
|
|
FailIfEmpty(AsmInfo, "no asm info for target " + TripleName);
|
|
|
|
std::unique_ptr<const MCObjectFileInfo> MOFI(new MCObjectFileInfo);
|
|
MCContext Ctx(AsmInfo.get(), MRI.get(), MOFI.get());
|
|
std::unique_ptr<MCDisassembler> DisAsm(
|
|
TheTarget->createMCDisassembler(*STI, Ctx));
|
|
FailIfEmpty(DisAsm, "no disassembler info for target " + TripleName);
|
|
|
|
std::unique_ptr<const MCInstrInfo> MII(TheTarget->createMCInstrInfo());
|
|
FailIfEmpty(MII, "no instruction info for target " + TripleName);
|
|
|
|
std::unique_ptr<const MCInstrAnalysis> MIA(
|
|
TheTarget->createMCInstrAnalysis(MII.get()));
|
|
FailIfEmpty(MIA, "no instruction analysis info for target " + TripleName);
|
|
|
|
auto SanCovAddrs = findSanitizerCovFunctions(O);
|
|
|
|
for (const auto Section : O.sections()) {
|
|
if (Section.isVirtual() || !Section.isText()) // llvm-objdump does the same.
|
|
continue;
|
|
uint64_t SectionAddr = Section.getAddress();
|
|
uint64_t SectSize = Section.getSize();
|
|
if (!SectSize)
|
|
continue;
|
|
|
|
StringRef SectionName;
|
|
FailIfError(Section.getName(SectionName));
|
|
|
|
StringRef BytesStr;
|
|
FailIfError(Section.getContents(BytesStr));
|
|
ArrayRef<uint8_t> Bytes(reinterpret_cast<const uint8_t *>(BytesStr.data()),
|
|
BytesStr.size());
|
|
|
|
for (uint64_t Index = 0, Size = 0; Index < Section.getSize();
|
|
Index += Size) {
|
|
MCInst Inst;
|
|
if (!DisAsm->getInstruction(Inst, Size, Bytes.slice(Index),
|
|
SectionAddr + Index, nulls(), nulls())) {
|
|
if (Size == 0)
|
|
Size = 1;
|
|
continue;
|
|
}
|
|
uint64_t Target;
|
|
if (MIA->isCall(Inst) &&
|
|
MIA->evaluateBranch(Inst, SectionAddr + Index, Size, Target)) {
|
|
if (SanCovAddrs.find(Target) != SanCovAddrs.end()) {
|
|
// Sanitizer coverage uses the address of the next instruction - 1.
|
|
Addrs->insert(Index + SectionAddr + Size - 1);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
static void getArchiveCoveragePoints(const object::Archive &A,
|
|
std::set<uint64_t> *Addrs) {
|
|
for (auto &ErrorOrChild : A.children()) {
|
|
FailIfError(ErrorOrChild);
|
|
const object::Archive::Child &C = *ErrorOrChild;
|
|
ErrorOr<std::unique_ptr<object::Binary>> ChildOrErr = C.getAsBinary();
|
|
FailIfError(ChildOrErr);
|
|
if (object::ObjectFile *O =
|
|
dyn_cast<object::ObjectFile>(&*ChildOrErr.get()))
|
|
getObjectCoveragePoints(*O, Addrs);
|
|
else
|
|
FailIfError(object::object_error::invalid_file_type);
|
|
}
|
|
}
|
|
|
|
// Locate addresses of all coverage points in a file. Coverage point
|
|
// is defined as the 'address of instruction following __sanitizer_cov
|
|
// call - 1'.
|
|
std::set<uint64_t> getCoveragePoints(std::string FileName) {
|
|
std::set<uint64_t> Result;
|
|
|
|
ErrorOr<object::OwningBinary<object::Binary>> BinaryOrErr =
|
|
object::createBinary(FileName);
|
|
FailIfError(BinaryOrErr);
|
|
|
|
object::Binary &Binary = *BinaryOrErr.get().getBinary();
|
|
if (object::Archive *A = dyn_cast<object::Archive>(&Binary))
|
|
getArchiveCoveragePoints(*A, &Result);
|
|
else if (object::ObjectFile *O = dyn_cast<object::ObjectFile>(&Binary))
|
|
getObjectCoveragePoints(*O, &Result);
|
|
else
|
|
FailIfError(object::object_error::invalid_file_type);
|
|
|
|
return Result;
|
|
}
|
|
|
|
static std::unique_ptr<SpecialCaseList> createDefaultBlacklist() {
|
|
if (!ClUseDefaultBlacklist)
|
|
return std::unique_ptr<SpecialCaseList>();
|
|
std::unique_ptr<MemoryBuffer> MB =
|
|
MemoryBuffer::getMemBuffer(DefaultBlacklist);
|
|
std::string Error;
|
|
auto Blacklist = SpecialCaseList::create(MB.get(), Error);
|
|
FailIfNotEmpty(Error);
|
|
return Blacklist;
|
|
}
|
|
|
|
static std::unique_ptr<SpecialCaseList> createUserBlacklist() {
|
|
if (ClBlacklist.empty())
|
|
return std::unique_ptr<SpecialCaseList>();
|
|
|
|
return SpecialCaseList::createOrDie({{ClBlacklist}});
|
|
}
|
|
|
|
static void printFunctionLocs(const std::set<FunctionLoc> &FnLocs,
|
|
raw_ostream &OS) {
|
|
std::unique_ptr<SpecialCaseList> DefaultBlacklist = createDefaultBlacklist();
|
|
std::unique_ptr<SpecialCaseList> UserBlacklist = createUserBlacklist();
|
|
|
|
for (const FunctionLoc &FnLoc : FnLocs) {
|
|
if (DefaultBlacklist &&
|
|
DefaultBlacklist->inSection("fun", FnLoc.FunctionName))
|
|
continue;
|
|
if (DefaultBlacklist &&
|
|
DefaultBlacklist->inSection("src", FnLoc.Loc.FileName))
|
|
continue;
|
|
if (UserBlacklist && UserBlacklist->inSection("fun", FnLoc.FunctionName))
|
|
continue;
|
|
if (UserBlacklist && UserBlacklist->inSection("src", FnLoc.Loc.FileName))
|
|
continue;
|
|
|
|
OS << stripPathPrefix(FnLoc.Loc.FileName) << ":" << FnLoc.Loc.Line << " "
|
|
<< FnLoc.FunctionName << "\n";
|
|
}
|
|
}
|
|
|
|
class CoverageData {
|
|
public:
|
|
// Read single file coverage data.
|
|
static ErrorOr<std::unique_ptr<CoverageData>> read(std::string FileName) {
|
|
ErrorOr<std::unique_ptr<MemoryBuffer>> BufOrErr =
|
|
MemoryBuffer::getFile(FileName);
|
|
if (!BufOrErr)
|
|
return BufOrErr.getError();
|
|
std::unique_ptr<MemoryBuffer> Buf = std::move(BufOrErr.get());
|
|
if (Buf->getBufferSize() < 8) {
|
|
errs() << "File too small (<8): " << Buf->getBufferSize();
|
|
return make_error_code(errc::illegal_byte_sequence);
|
|
}
|
|
const FileHeader *Header =
|
|
reinterpret_cast<const FileHeader *>(Buf->getBufferStart());
|
|
|
|
if (Header->Magic != BinCoverageMagic) {
|
|
errs() << "Wrong magic: " << Header->Magic;
|
|
return make_error_code(errc::illegal_byte_sequence);
|
|
}
|
|
|
|
auto Addrs = llvm::make_unique<std::set<uint64_t>>();
|
|
|
|
switch (Header->Bitness) {
|
|
case Bitness64:
|
|
readInts<uint64_t>(Buf->getBufferStart() + 8, Buf->getBufferEnd(),
|
|
Addrs.get());
|
|
break;
|
|
case Bitness32:
|
|
readInts<uint32_t>(Buf->getBufferStart() + 8, Buf->getBufferEnd(),
|
|
Addrs.get());
|
|
break;
|
|
default:
|
|
errs() << "Unsupported bitness: " << Header->Bitness;
|
|
return make_error_code(errc::illegal_byte_sequence);
|
|
}
|
|
|
|
return std::unique_ptr<CoverageData>(new CoverageData(std::move(Addrs)));
|
|
}
|
|
|
|
// Merge multiple coverage data together.
|
|
static std::unique_ptr<CoverageData>
|
|
merge(const std::vector<std::unique_ptr<CoverageData>> &Covs) {
|
|
auto Addrs = llvm::make_unique<std::set<uint64_t>>();
|
|
|
|
for (const auto &Cov : Covs)
|
|
Addrs->insert(Cov->Addrs->begin(), Cov->Addrs->end());
|
|
|
|
return std::unique_ptr<CoverageData>(new CoverageData(std::move(Addrs)));
|
|
}
|
|
|
|
// Read list of files and merges their coverage info.
|
|
static ErrorOr<std::unique_ptr<CoverageData>>
|
|
readAndMerge(const std::vector<std::string> &FileNames) {
|
|
std::vector<std::unique_ptr<CoverageData>> Covs;
|
|
for (const auto &FileName : FileNames) {
|
|
auto Cov = read(FileName);
|
|
if (!Cov)
|
|
return Cov.getError();
|
|
Covs.push_back(std::move(Cov.get()));
|
|
}
|
|
return merge(Covs);
|
|
}
|
|
|
|
// Print coverage addresses.
|
|
void printAddrs(raw_ostream &OS) {
|
|
for (auto Addr : *Addrs) {
|
|
OS << "0x";
|
|
OS.write_hex(Addr);
|
|
OS << "\n";
|
|
}
|
|
}
|
|
|
|
// Print list of covered functions.
|
|
// Line format: <file_name>:<line> <function_name>
|
|
void printCoveredFunctions(raw_ostream &OS) {
|
|
printFunctionLocs(computeFunctionLocs(*Addrs), OS);
|
|
}
|
|
|
|
// Print list of not covered functions.
|
|
// Line format: <file_name>:<line> <function_name>
|
|
void printNotCoveredFunctions(raw_ostream &OS) {
|
|
std::set<FunctionLoc> AllFns =
|
|
computeFunctionLocs(getCoveragePoints(ClBinaryName));
|
|
std::set<FunctionLoc> CoveredFns = computeFunctionLocs(*Addrs);
|
|
|
|
std::set<FunctionLoc> NotCoveredFns;
|
|
std::set_difference(AllFns.begin(), AllFns.end(), CoveredFns.begin(),
|
|
CoveredFns.end(),
|
|
std::inserter(NotCoveredFns, NotCoveredFns.end()));
|
|
printFunctionLocs(NotCoveredFns, OS);
|
|
}
|
|
|
|
private:
|
|
explicit CoverageData(std::unique_ptr<std::set<uint64_t>> Addrs)
|
|
: Addrs(std::move(Addrs)) {}
|
|
|
|
std::unique_ptr<std::set<uint64_t>> Addrs;
|
|
};
|
|
} // namespace
|
|
|
|
int main(int argc, char **argv) {
|
|
// Print stack trace if we signal out.
|
|
sys::PrintStackTraceOnErrorSignal();
|
|
PrettyStackTraceProgram X(argc, argv);
|
|
llvm_shutdown_obj Y; // Call llvm_shutdown() on exit.
|
|
|
|
llvm::InitializeAllTargetInfos();
|
|
llvm::InitializeAllTargetMCs();
|
|
llvm::InitializeAllDisassemblers();
|
|
|
|
cl::ParseCommandLineOptions(argc, argv, "Sanitizer Coverage Processing Tool");
|
|
|
|
auto CovData = CoverageData::readAndMerge(ClInputFiles);
|
|
FailIfError(CovData);
|
|
|
|
switch (Action) {
|
|
case PrintAction: {
|
|
CovData.get()->printAddrs(outs());
|
|
return 0;
|
|
}
|
|
case CoveredFunctionsAction: {
|
|
CovData.get()->printCoveredFunctions(outs());
|
|
return 0;
|
|
}
|
|
case NotCoveredFunctionsAction: {
|
|
CovData.get()->printNotCoveredFunctions(outs());
|
|
return 0;
|
|
}
|
|
}
|
|
|
|
llvm_unreachable("unsupported action");
|
|
}
|