2016-05-03 08:28:21 +08:00
|
|
|
//===- TpiStream.cpp - PDB Type Info (TPI) Stream 2 Access ----------------===//
|
|
|
|
//
|
|
|
|
// The LLVM Compiler Infrastructure
|
|
|
|
//
|
|
|
|
// This file is distributed under the University of Illinois Open Source
|
|
|
|
// License. See LICENSE.TXT for details.
|
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
#include "llvm/DebugInfo/PDB/Raw/TpiStream.h"
|
|
|
|
|
2016-06-16 21:14:42 +08:00
|
|
|
#include "llvm/DebugInfo/CodeView/CVTypeVisitor.h"
|
2016-05-03 08:28:21 +08:00
|
|
|
#include "llvm/DebugInfo/CodeView/CodeView.h"
|
2016-05-26 04:37:03 +08:00
|
|
|
#include "llvm/DebugInfo/CodeView/StreamReader.h"
|
2016-06-04 04:48:51 +08:00
|
|
|
#include "llvm/DebugInfo/CodeView/TypeIndex.h"
|
2016-05-03 08:28:21 +08:00
|
|
|
#include "llvm/DebugInfo/CodeView/TypeRecord.h"
|
2016-06-09 08:10:19 +08:00
|
|
|
#include "llvm/DebugInfo/PDB/Raw/Hash.h"
|
[pdb] Use MappedBlockStream to parse the PDB directory.
In order to efficiently write PDBs, we need to be able to make a
StreamWriter class similar to a StreamReader, which can transparently deal
with writing to discontiguous streams, and we need to use this for all
writing, similar to how we use StreamReader for all reading.
Most discontiguous streams are the typical numbered streams that appear in
a PDB file and are described by the directory, but the exception to this,
that until now has been parsed by hand, is the directory itself.
MappedBlockStream works by querying the directory to find out which blocks
a stream occupies and various other things, so naturally the same logic
could not possibly work to describe the blocks that the directory itself
resided on.
To solve this, I've introduced an abstraction IPDBStreamData, which allows
the client to query for the list of blocks occupied by the stream, as well
as the stream length. I provide two implementations of this: one which
queries the directory (for indexed streams), and one which queries the
super block (for the directory stream).
This has the side benefit of vastly simplifying the code to parse the
directory. Whereas before a mini state machine was rolled by hand, now we
simply use FixedStreamArray to read out the stream sizes, then build a
vector of FixedStreamArrays for the stream map, all in just a few lines of
code.
Reviewed By: ruiu
Differential Revision: http://reviews.llvm.org/D21046
llvm-svn: 271982
2016-06-07 13:28:55 +08:00
|
|
|
#include "llvm/DebugInfo/PDB/Raw/IndexedStreamData.h"
|
2016-05-03 08:28:21 +08:00
|
|
|
#include "llvm/DebugInfo/PDB/Raw/MappedBlockStream.h"
|
2016-06-01 06:41:52 +08:00
|
|
|
#include "llvm/DebugInfo/PDB/Raw/PDBFile.h"
|
2016-05-03 08:28:21 +08:00
|
|
|
#include "llvm/DebugInfo/PDB/Raw/RawConstants.h"
|
2016-05-07 04:51:57 +08:00
|
|
|
#include "llvm/DebugInfo/PDB/Raw/RawError.h"
|
2016-06-04 04:48:51 +08:00
|
|
|
#include "llvm/DebugInfo/PDB/Raw/RawTypes.h"
|
2016-05-03 08:28:21 +08:00
|
|
|
|
|
|
|
#include "llvm/Support/Endian.h"
|
|
|
|
|
|
|
|
using namespace llvm;
|
2016-06-16 21:14:42 +08:00
|
|
|
using namespace llvm::codeview;
|
2016-05-03 08:28:21 +08:00
|
|
|
using namespace llvm::support;
|
|
|
|
using namespace llvm::pdb;
|
|
|
|
|
|
|
|
namespace {
// Inclusive bounds that reload() enforces on the header's NumHashBuckets
// field. Both limits are powers of two.
const uint32_t MinHashBuckets = 1u << 12; // 0x1000
const uint32_t MaxHashBuckets = 1u << 18; // 0x40000
} // end anonymous namespace
|
|
|
|
|
2016-06-03 05:13:47 +08:00
|
|
|
// This corresponds to `HDR` in PDB/dbi/tpi.h.
|
2016-05-03 08:28:21 +08:00
|
|
|
struct TpiStream::HeaderInfo {
|
|
|
|
struct EmbeddedBuf {
|
|
|
|
little32_t Off;
|
|
|
|
ulittle32_t Length;
|
|
|
|
};
|
|
|
|
|
|
|
|
ulittle32_t Version;
|
|
|
|
ulittle32_t HeaderSize;
|
|
|
|
ulittle32_t TypeIndexBegin;
|
|
|
|
ulittle32_t TypeIndexEnd;
|
|
|
|
ulittle32_t TypeRecordBytes;
|
|
|
|
|
2016-06-03 05:13:47 +08:00
|
|
|
// The following members correspond to `TpiHash` in PDB/dbi/tpi.h.
|
2016-05-03 08:28:21 +08:00
|
|
|
ulittle16_t HashStreamIndex;
|
|
|
|
ulittle16_t HashAuxStreamIndex;
|
|
|
|
ulittle32_t HashKeySize;
|
|
|
|
ulittle32_t NumHashBuckets;
|
|
|
|
|
|
|
|
EmbeddedBuf HashValueBuffer;
|
|
|
|
EmbeddedBuf IndexOffsetBuffer;
|
|
|
|
EmbeddedBuf HashAdjBuffer;
|
|
|
|
};
|
|
|
|
|
2016-06-09 01:26:39 +08:00
|
|
|
// Binds the stream to its owning PDB file and takes ownership of the mapped
// block stream. Nothing is parsed here; that is done by reload().
TpiStream::TpiStream(const PDBFile &File,
                     std::unique_ptr<MappedBlockStream> Stream)
    : Pdb(File),
      Stream(std::move(Stream)) {
}
|
2016-05-03 08:28:21 +08:00
|
|
|
|
|
|
|
// Defined out of line in this translation unit; members clean up after
// themselves.
TpiStream::~TpiStream() = default;
|
|
|
|
|
2016-06-20 15:31:29 +08:00
|
|
|
// Corresponds to `fUDTAnon`.
|
|
|
|
template <typename T> static bool isAnonymous(T &Rec) {
|
|
|
|
StringRef Name = Rec.getUniqueName();
|
|
|
|
return Name == "<unnamed-tag>" || Name == "__unnamed" ||
|
|
|
|
Name.endswith("::<unnamed-tag>") || Name.endswith("::__unnamed");
|
|
|
|
}
|
|
|
|
|
2016-06-16 02:26:59 +08:00
|
|
|
// Computes a hash for a given TPI record.
|
2016-06-17 02:39:17 +08:00
|
|
|
template <typename T>
|
|
|
|
static uint32_t getTpiHash(T &Rec, const CVRecord<TypeLeafKind> &RawRec) {
|
2016-06-16 21:14:42 +08:00
|
|
|
auto Opts = static_cast<uint16_t>(Rec.getOptions());
|
|
|
|
|
2016-06-17 02:39:17 +08:00
|
|
|
bool ForwardRef =
|
|
|
|
Opts & static_cast<uint16_t>(ClassOptions::ForwardReference);
|
|
|
|
bool Scoped = Opts & static_cast<uint16_t>(ClassOptions::Scoped);
|
|
|
|
bool UniqueName = Opts & static_cast<uint16_t>(ClassOptions::HasUniqueName);
|
2016-06-20 15:31:29 +08:00
|
|
|
bool IsAnon = UniqueName && isAnonymous(Rec);
|
2016-06-16 21:14:42 +08:00
|
|
|
|
2016-06-20 15:31:29 +08:00
|
|
|
if (!ForwardRef && !Scoped && !IsAnon)
|
2016-06-16 21:14:42 +08:00
|
|
|
return hashStringV1(Rec.getName());
|
2016-06-20 15:31:29 +08:00
|
|
|
if (!ForwardRef && UniqueName && !IsAnon)
|
2016-06-16 21:14:42 +08:00
|
|
|
return hashStringV1(Rec.getUniqueName());
|
2016-06-17 02:39:17 +08:00
|
|
|
return hashBufferV8(RawRec.RawData);
|
2016-06-16 21:14:42 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
namespace {
|
2016-06-17 02:22:27 +08:00
|
|
|
class TpiHashVerifier : public TypeVisitorCallbacks {
|
2016-06-16 21:14:42 +08:00
|
|
|
public:
|
|
|
|
TpiHashVerifier(FixedStreamArray<support::ulittle32_t> &HashValues,
|
|
|
|
uint32_t NumHashBuckets)
|
|
|
|
: HashValues(HashValues), NumHashBuckets(NumHashBuckets) {}
|
|
|
|
|
2016-06-17 02:22:27 +08:00
|
|
|
Error visitUdtSourceLine(UdtSourceLineRecord &Rec) override {
|
|
|
|
return verifySourceLine(Rec);
|
|
|
|
}
|
2016-06-16 02:26:59 +08:00
|
|
|
|
2016-06-17 02:22:27 +08:00
|
|
|
Error visitUdtModSourceLine(UdtModSourceLineRecord &Rec) override {
|
|
|
|
return verifySourceLine(Rec);
|
2016-06-16 02:26:59 +08:00
|
|
|
}
|
|
|
|
|
2016-06-17 02:22:27 +08:00
|
|
|
Error visitClass(ClassRecord &Rec) override { return verify(Rec); }
|
|
|
|
Error visitEnum(EnumRecord &Rec) override { return verify(Rec); }
|
|
|
|
Error visitUnion(UnionRecord &Rec) override { return verify(Rec); }
|
2016-06-16 21:14:42 +08:00
|
|
|
|
2016-06-17 02:39:17 +08:00
|
|
|
Error visitTypeBegin(const CVRecord<TypeLeafKind> &Rec) override {
|
2016-06-17 02:22:27 +08:00
|
|
|
++Index;
|
2016-06-17 02:39:17 +08:00
|
|
|
RawRecord = &Rec;
|
2016-06-17 02:22:27 +08:00
|
|
|
return Error::success();
|
|
|
|
}
|
2016-06-16 02:26:59 +08:00
|
|
|
|
2016-06-16 21:14:42 +08:00
|
|
|
private:
|
2016-06-17 02:22:27 +08:00
|
|
|
template <typename T> Error verify(T &Rec) {
|
2016-06-17 02:39:17 +08:00
|
|
|
uint32_t Hash = getTpiHash(Rec, *RawRecord);
|
|
|
|
if (Hash % NumHashBuckets != HashValues[Index])
|
2016-06-17 02:22:27 +08:00
|
|
|
return make_error<RawError>(raw_error_code::invalid_tpi_hash);
|
|
|
|
return Error::success();
|
2016-06-16 21:14:42 +08:00
|
|
|
}
|
|
|
|
|
2016-06-17 02:22:27 +08:00
|
|
|
template <typename T> Error verifySourceLine(T &Rec) {
|
2016-06-16 21:14:42 +08:00
|
|
|
char Buf[4];
|
|
|
|
support::endian::write32le(Buf, Rec.getUDT().getIndex());
|
|
|
|
uint32_t Hash = hashStringV1(StringRef(Buf, 4));
|
|
|
|
if (Hash % NumHashBuckets != HashValues[Index])
|
2016-06-17 02:22:27 +08:00
|
|
|
return make_error<RawError>(raw_error_code::invalid_tpi_hash);
|
|
|
|
return Error::success();
|
2016-06-16 21:14:42 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
FixedStreamArray<support::ulittle32_t> HashValues;
|
2016-06-17 02:39:17 +08:00
|
|
|
const CVRecord<TypeLeafKind> *RawRecord;
|
2016-06-16 21:14:42 +08:00
|
|
|
uint32_t NumHashBuckets;
|
2016-06-17 02:39:17 +08:00
|
|
|
uint32_t Index = -1;
|
2016-06-16 21:14:42 +08:00
|
|
|
};
|
2016-06-16 02:26:59 +08:00
|
|
|
}
|
|
|
|
|
2016-06-09 08:10:19 +08:00
|
|
|
// Verifies that a given type record matches with a given hash value.
|
|
|
|
// Currently we only verify SRC_LINE records.
|
2016-06-16 21:14:42 +08:00
|
|
|
Error TpiStream::verifyHashValues() {
|
|
|
|
TpiHashVerifier Verifier(HashValues, Header->NumHashBuckets);
|
2016-06-17 02:22:27 +08:00
|
|
|
CVTypeVisitor Visitor(Verifier);
|
|
|
|
return Visitor.visitTypeStream(TypeRecords);
|
2016-06-09 08:10:19 +08:00
|
|
|
}
|
|
|
|
|
2016-05-07 04:51:57 +08:00
|
|
|
// Parses the TPI stream: validates the header, reads the type records, opens
// the hash stream named by the header, reads the hash value / index offset /
// hash adjustment arrays from it, and finally verifies the hash values
// against the type records.
//
// Returns Error::success() on success. Header validation failures are
// reported as raw_error_code::corrupt_file; errors from the stream readers,
// from opening the hash stream and from hash verification are propagated
// unchanged.
Error TpiStream::reload() {
  StreamReader Reader(*Stream);

  if (Reader.bytesRemaining() < sizeof(HeaderInfo))
    return make_error<RawError>(raw_error_code::corrupt_file,
                                "TPI Stream does not contain a header.");

  // A failure-state Error must be handled before it is destroyed, so consume
  // the reader's error explicitly before substituting our own diagnostic.
  if (auto EC = Reader.readObject(Header)) {
    consumeError(std::move(EC));
    return make_error<RawError>(raw_error_code::corrupt_file,
                                "TPI Stream does not contain a header.");
  }

  if (Header->Version != PdbTpiV80)
    return make_error<RawError>(raw_error_code::corrupt_file,
                                "Unsupported TPI Version.");

  if (Header->HeaderSize != sizeof(HeaderInfo))
    return make_error<RawError>(raw_error_code::corrupt_file,
                                "Corrupt TPI Header size.");

  if (Header->HashKeySize != sizeof(ulittle32_t))
    return make_error<RawError>(raw_error_code::corrupt_file,
                                "TPI Stream expected 4 byte hash key size.");

  if (Header->NumHashBuckets < MinHashBuckets ||
      Header->NumHashBuckets > MaxHashBuckets)
    return make_error<RawError>(raw_error_code::corrupt_file,
                                "TPI Stream Invalid number of hash buckets.");

  // The actual type records themselves come from this stream.
  if (auto EC = Reader.readArray(TypeRecords, Header->TypeRecordBytes))
    return EC;

  // Hash indices, hash values, etc come from the hash stream.
  if (Header->HashStreamIndex >= Pdb.getNumStreams())
    return make_error<RawError>(raw_error_code::corrupt_file,
                                "Invalid TPI hash stream index.");

  auto HS =
      MappedBlockStream::createIndexedStream(Header->HashStreamIndex, Pdb);
  if (!HS)
    return HS.takeError();
  StreamReader HSR(**HS);

  // There must be exactly one hash value per type record.
  uint32_t NumHashValues = Header->HashValueBuffer.Length / sizeof(ulittle32_t);
  if (NumHashValues != NumTypeRecords())
    return make_error<RawError>(
        raw_error_code::corrupt_file,
        "TPI hash count does not match with the number of type records.");
  HSR.setOffset(Header->HashValueBuffer.Off);
  if (auto EC = HSR.readArray(HashValues, NumHashValues))
    return EC;

  HSR.setOffset(Header->IndexOffsetBuffer.Off);
  uint32_t NumTypeIndexOffsets =
      Header->IndexOffsetBuffer.Length / sizeof(TypeIndexOffset);
  if (auto EC = HSR.readArray(TypeIndexOffsets, NumTypeIndexOffsets))
    return EC;

  HSR.setOffset(Header->HashAdjBuffer.Off);
  uint32_t NumHashAdjustments =
      Header->HashAdjBuffer.Length / sizeof(TypeIndexOffset);
  if (auto EC = HSR.readArray(HashAdjustments, NumHashAdjustments))
    return EC;

  // Keep the hash stream alive: the arrays read above were read from it.
  HashStream = std::move(*HS);

  // TPI hash table is a parallel array for the type records.
  // Verify that the hash values match with type records.
  return verifyHashValues();
}
|
|
|
|
|
|
|
|
// Returns the header's version field converted to PdbRaw_TpiVer.
PdbRaw_TpiVer TpiStream::getTpiVersion() const {
  // Go through a plain integer first: the header field is an endian-aware
  // wrapper, not a raw integer.
  return static_cast<PdbRaw_TpiVer>(static_cast<uint32_t>(Header->Version));
}
|
|
|
|
|
|
|
|
// Returns the TypeIndexBegin field of the stream header.
uint32_t TpiStream::TypeIndexBegin() const {
  return Header->TypeIndexBegin;
}
|
|
|
|
|
|
|
|
// Returns the TypeIndexEnd field of the stream header.
uint32_t TpiStream::TypeIndexEnd() const {
  return Header->TypeIndexEnd;
}
|
|
|
|
|
|
|
|
uint32_t TpiStream::NumTypeRecords() const {
|
|
|
|
return TypeIndexEnd() - TypeIndexBegin();
|
|
|
|
}
|
|
|
|
|
2016-05-25 11:43:17 +08:00
|
|
|
uint16_t TpiStream::getTypeHashStreamIndex() const {
|
|
|
|
return Header->HashStreamIndex;
|
|
|
|
}
|
|
|
|
|
|
|
|
uint16_t TpiStream::getTypeHashStreamAuxIndex() const {
|
|
|
|
return Header->HashAuxStreamIndex;
|
|
|
|
}
|
|
|
|
|
2016-06-08 07:53:43 +08:00
|
|
|
// Returns the NumHashBuckets field of the stream header.
uint32_t TpiStream::NumHashBuckets() const {
  return Header->NumHashBuckets;
}
|
2016-06-08 07:44:27 +08:00
|
|
|
// Returns the HashKeySize field of the stream header.
uint32_t TpiStream::getHashKeySize() const {
  return Header->HashKeySize;
}
|
|
|
|
|
2016-06-16 21:17:59 +08:00
|
|
|
// Returns a copy of the hash value array populated by reload().
FixedStreamArray<support::ulittle32_t> TpiStream::getHashValues() const {
  return HashValues;
}
|
|
|
|
|
2016-06-16 21:17:59 +08:00
|
|
|
// Returns a copy of the type index offset array populated by reload().
FixedStreamArray<TypeIndexOffset> TpiStream::getTypeIndexOffsets() const {
  return TypeIndexOffsets;
}
|
|
|
|
|
2016-06-16 21:17:59 +08:00
|
|
|
// Returns a copy of the hash adjustment array populated by reload().
FixedStreamArray<TypeIndexOffset> TpiStream::getHashAdjustments() const {
  return HashAdjustments;
}
|
|
|
|
|
2016-06-16 21:17:59 +08:00
|
|
|
// Returns an iterable range over the type records. HadError is forwarded to
// the begin iterator of the underlying record array.
iterator_range<CVTypeArray::Iterator> TpiStream::types(bool *HadError) const {
  auto First = TypeRecords.begin(HadError);
  auto Last = TypeRecords.end();
  return llvm::make_range(First, Last);
}
|