llvm-project/lldb/source/Core/DataFileCache.cpp

308 lines
11 KiB
C++

//===-- DataFileCache.cpp -------------------------------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
#include "lldb/Core/DataFileCache.h"
#include "lldb/Core/Module.h"
#include "lldb/Core/ModuleList.h"
#include "lldb/Host/FileSystem.h"
#include "lldb/Symbol/ObjectFile.h"
#include "lldb/Utility/DataEncoder.h"
#include "lldb/Utility/LLDBLog.h"
#include "lldb/Utility/Log.h"
#include "llvm/Support/CachePruning.h"
#include "llvm/Support/MemoryBuffer.h"
using namespace llvm;
using namespace lldb_private;
DataFileCache::DataFileCache(StringRef path) {
m_cache_dir.SetPath(path);
// Prune the cache based off of the LLDB settings each time we create a cache
// object.
ModuleListProperties &properties =
ModuleList::GetGlobalModuleListProperties();
CachePruningPolicy policy;
// Only scan once an hour. If we have lots of debug sessions we don't want
// to scan this directory too often. A timestamp file is written to the
// directory to ensure different processes don't scan the directory too often.
// This setting doesn't mean that a thread will continually scan the cache
// directory within this process.
policy.Interval = std::chrono::hours(1);
// Get the user settings for pruning.
policy.MaxSizeBytes = properties.GetLLDBIndexCacheMaxByteSize();
policy.MaxSizePercentageOfAvailableSpace =
properties.GetLLDBIndexCacheMaxPercent();
policy.Expiration =
std::chrono::hours(properties.GetLLDBIndexCacheExpirationDays() * 24);
pruneCache(path, policy);
// This lambda will get called when the data is gotten from the cache and
// also after the data was set for a given key. We only need to take
// ownership of the data if we are geting the data, so we use the
// m_take_ownership member variable to indicate if we need to take
// ownership.
auto add_buffer = [this](unsigned task, std::unique_ptr<llvm::MemoryBuffer> m) {
if (m_take_ownership)
m_mem_buff_up = std::move(m);
};
Expected<FileCache> cache_or_err =
llvm::localCache("LLDBModuleCache", "lldb-module", path, add_buffer);
if (cache_or_err)
m_cache_callback = std::move(*cache_or_err);
else {
Log *log = GetLog(LLDBLog::Modules);
LLDB_LOG_ERROR(log, cache_or_err.takeError(),
"failed to create lldb index cache directory: {0}");
}
}
std::unique_ptr<llvm::MemoryBuffer>
DataFileCache::GetCachedData(StringRef key) {
std::lock_guard<std::mutex> guard(m_mutex);
const unsigned task = 1;
m_take_ownership = true;
// If we call the "m_cache_callback" function and the data is cached, it will
// call the "add_buffer" lambda function from the constructor which will in
// turn take ownership of the member buffer that is passed to the callback and
// put it into a member variable.
Expected<AddStreamFn> add_stream_or_err = m_cache_callback(task, key);
m_take_ownership = false;
// At this point we either already called the "add_buffer" lambda with
// the data or we haven't. We can tell if we got the cached data by checking
// the add_stream function pointer value below.
if (add_stream_or_err) {
AddStreamFn &add_stream = *add_stream_or_err;
// If the "add_stream" is nullptr, then the data was cached and we already
// called the "add_buffer" lambda. If it is valid, then if we were to call
// the add_stream function it would cause a cache file to get generated
// and we would be expected to fill in the data. In this function we only
// want to check if the data was cached, so we don't want to call
// "add_stream" in this function.
if (!add_stream)
return std::move(m_mem_buff_up);
} else {
Log *log = GetLog(LLDBLog::Modules);
LLDB_LOG_ERROR(log, add_stream_or_err.takeError(),
"failed to get the cache add stream callback for key: {0}");
}
// Data was not cached.
return std::unique_ptr<llvm::MemoryBuffer>();
}
bool DataFileCache::SetCachedData(StringRef key, llvm::ArrayRef<uint8_t> data) {
std::lock_guard<std::mutex> guard(m_mutex);
const unsigned task = 2;
// If we call this function and the data is cached, it will call the
// add_buffer lambda function from the constructor which will ignore the
// data.
Expected<AddStreamFn> add_stream_or_err = m_cache_callback(task, key);
// If we reach this code then we either already called the callback with
// the data or we haven't. We can tell if we had the cached data by checking
// the CacheAddStream function pointer value below.
if (add_stream_or_err) {
AddStreamFn &add_stream = *add_stream_or_err;
// If the "add_stream" is nullptr, then the data was cached. If it is
// valid, then if we call the add_stream function with a task it will
// cause the file to get generated, but we only want to check if the data
// is cached here, so we don't want to call it here. Note that the
// add_buffer will also get called in this case after the data has been
// provided, but we won't take ownership of the memory buffer as we just
// want to write the data.
if (add_stream) {
Expected<std::unique_ptr<CachedFileStream>> file_or_err =
add_stream(task);
if (file_or_err) {
CachedFileStream *cfs = file_or_err->get();
cfs->OS->write((const char *)data.data(), data.size());
return true;
} else {
Log *log = GetLog(LLDBLog::Modules);
LLDB_LOG_ERROR(log, file_or_err.takeError(),
"failed to get the cache file stream for key: {0}");
}
}
} else {
Log *log = GetLog(LLDBLog::Modules);
LLDB_LOG_ERROR(log, add_stream_or_err.takeError(),
"failed to get the cache add stream callback for key: {0}");
}
return false;
}
FileSpec DataFileCache::GetCacheFilePath(llvm::StringRef key) {
FileSpec cache_file(m_cache_dir);
std::string filename("llvmcache-");
filename += key.str();
cache_file.AppendPathComponent(filename);
return cache_file;
}
Status DataFileCache::RemoveCacheFile(llvm::StringRef key) {
FileSpec cache_file = GetCacheFilePath(key);
FileSystem &fs = FileSystem::Instance();
if (!fs.Exists(cache_file))
return Status();
return fs.RemoveFile(cache_file);
}
CacheSignature::CacheSignature(lldb_private::Module *module) {
Clear();
UUID uuid = module->GetUUID();
if (uuid.IsValid())
m_uuid = uuid;
std::time_t mod_time = 0;
mod_time = llvm::sys::toTimeT(module->GetModificationTime());
if (mod_time != 0)
m_mod_time = mod_time;
mod_time = llvm::sys::toTimeT(module->GetObjectModificationTime());
if (mod_time != 0)
m_obj_mod_time = mod_time;
}
CacheSignature::CacheSignature(lldb_private::ObjectFile *objfile) {
Clear();
UUID uuid = objfile->GetUUID();
if (uuid.IsValid())
m_uuid = uuid;
std::time_t mod_time = 0;
// Grab the modification time of the object file's file. It isn't always the
// same as the module's file when you have a executable file as the main
// executable, and you have a object file for a symbol file.
FileSystem &fs = FileSystem::Instance();
mod_time = llvm::sys::toTimeT(fs.GetModificationTime(objfile->GetFileSpec()));
if (mod_time != 0)
m_mod_time = mod_time;
mod_time =
llvm::sys::toTimeT(objfile->GetModule()->GetObjectModificationTime());
if (mod_time != 0)
m_obj_mod_time = mod_time;
}
enum SignatureEncoding {
eSignatureUUID = 1u,
eSignatureModTime = 2u,
eSignatureObjectModTime = 3u,
eSignatureEnd = 255u,
};
bool CacheSignature::Encode(DataEncoder &encoder) {
if (!IsValid())
return false; // Invalid signature, return false!
if (m_uuid.hasValue()) {
llvm::ArrayRef<uint8_t> uuid_bytes = m_uuid->GetBytes();
encoder.AppendU8(eSignatureUUID);
encoder.AppendU8(uuid_bytes.size());
encoder.AppendData(uuid_bytes);
}
if (m_mod_time.hasValue()) {
encoder.AppendU8(eSignatureModTime);
encoder.AppendU32(*m_mod_time);
}
if (m_obj_mod_time.hasValue()) {
encoder.AppendU8(eSignatureObjectModTime);
encoder.AppendU32(*m_obj_mod_time);
}
encoder.AppendU8(eSignatureEnd);
return true;
}
bool CacheSignature::Decode(const DataExtractor &data,
lldb::offset_t *offset_ptr) {
Clear();
while (uint8_t sig_encoding = data.GetU8(offset_ptr)) {
switch (sig_encoding) {
case eSignatureUUID: {
const uint8_t length = data.GetU8(offset_ptr);
const uint8_t *bytes = (const uint8_t *)data.GetData(offset_ptr, length);
if (bytes != nullptr && length > 0)
m_uuid = UUID::fromData(llvm::ArrayRef<uint8_t>(bytes, length));
} break;
case eSignatureModTime: {
uint32_t mod_time = data.GetU32(offset_ptr);
if (mod_time > 0)
m_mod_time = mod_time;
} break;
case eSignatureObjectModTime: {
uint32_t mod_time = data.GetU32(offset_ptr);
if (mod_time > 0)
m_mod_time = mod_time;
} break;
case eSignatureEnd:
return true;
default:
break;
}
}
return false;
}
uint32_t ConstStringTable::Add(ConstString s) {
auto pos = m_string_to_offset.find(s);
if (pos != m_string_to_offset.end())
return pos->second;
const uint32_t offset = m_next_offset;
m_strings.push_back(s);
m_string_to_offset[s] = offset;
m_next_offset += s.GetLength() + 1;
return offset;
}
static const llvm::StringRef kStringTableIdentifier("STAB");
bool ConstStringTable::Encode(DataEncoder &encoder) {
// Write an 4 character code into the stream. This will help us when decoding
// to make sure we find this identifier when decoding the string table to make
// sure we have the rigth data. It also helps to identify the string table
// when dumping the hex bytes in a cache file.
encoder.AppendData(kStringTableIdentifier);
size_t length_offset = encoder.GetByteSize();
encoder.AppendU32(0); // Total length of all strings which will be fixed up.
size_t strtab_offset = encoder.GetByteSize();
encoder.AppendU8(0); // Start the string table with with an empty string.
for (auto s: m_strings) {
// Make sure all of the offsets match up with what we handed out!
assert(m_string_to_offset.find(s)->second ==
encoder.GetByteSize() - strtab_offset);
// Append the C string into the encoder
encoder.AppendCString(s.GetStringRef());
}
// Fixup the string table length.
encoder.PutU32(length_offset, encoder.GetByteSize() - strtab_offset);
return true;
}
bool StringTableReader::Decode(const DataExtractor &data,
lldb::offset_t *offset_ptr) {
llvm::StringRef identifier((const char *)data.GetData(offset_ptr, 4), 4);
if (identifier != kStringTableIdentifier)
return false;
const uint32_t length = data.GetU32(offset_ptr);
// We always have at least one byte for the empty string at offset zero.
if (length == 0)
return false;
const char *bytes = (const char *)data.GetData(offset_ptr, length);
if (bytes == nullptr)
return false;
m_data = StringRef(bytes, length);
return true;
}
StringRef StringTableReader::Get(uint32_t offset) const {
if (offset >= m_data.size())
return StringRef();
return StringRef(m_data.data() + offset);
}