298 lines
9.2 KiB
C++
298 lines
9.2 KiB
C++
/*
|
|
* AsyncFileCached.actor.cpp
|
|
*
|
|
* This source file is part of the FoundationDB open source project
|
|
*
|
|
* Copyright 2013-2018 Apple Inc. and the FoundationDB project authors
|
|
*
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
* you may not use this file except in compliance with the License.
|
|
* You may obtain a copy of the License at
|
|
*
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
* See the License for the specific language governing permissions and
|
|
* limitations under the License.
|
|
*/
|
|
|
|
#include "fdbrpc/AsyncFileCached.actor.h"
|
|
|
|
// Page caches used in non-simulated environments
|
|
Optional<Reference<EvictablePageCache>> pc4k, pc64k;
|
|
|
|
// The simulator needs to store separate page caches for each machine
|
|
static std::map<NetworkAddress, std::pair<Reference<EvictablePageCache>, Reference<EvictablePageCache>>>
|
|
simulatorPageCaches;
|
|
|
|
EvictablePage::~EvictablePage() {
|
|
if (data) {
|
|
if (pageCache->pageSize == 4096)
|
|
FastAllocator<4096>::release(data);
|
|
else
|
|
aligned_free(data);
|
|
}
|
|
if (EvictablePageCache::RANDOM == pageCache->cacheEvictionType) {
|
|
if (index > -1) {
|
|
pageCache->pages[index] = pageCache->pages.back();
|
|
pageCache->pages[index]->index = index;
|
|
pageCache->pages.pop_back();
|
|
}
|
|
} else {
|
|
// remove it from the LRU
|
|
pageCache->lruPages.erase(EvictablePageCache::List::s_iterator_to(*this));
|
|
}
|
|
}
|
|
|
|
std::map<std::string, OpenFileInfo> AsyncFileCached::openFiles;
|
|
|
|
void AsyncFileCached::remove_page(AFCPage* page) {
|
|
pages.erase(page->pageOffset);
|
|
}
|
|
|
|
Future<Reference<IAsyncFile>> AsyncFileCached::open_impl(std::string filename, int flags, int mode) {
|
|
Reference<EvictablePageCache> pageCache;
|
|
|
|
// In a simulated environment, each machine needs its own caches
|
|
if (g_network->isSimulated()) {
|
|
auto cacheItr = simulatorPageCaches.find(g_network->getLocalAddress());
|
|
if (cacheItr == simulatorPageCaches.end()) {
|
|
int64_t pageCacheSize4k = (BUGGIFY) ? FLOW_KNOBS->BUGGIFY_SIM_PAGE_CACHE_4K : FLOW_KNOBS->SIM_PAGE_CACHE_4K;
|
|
int64_t pageCacheSize64k =
|
|
(BUGGIFY) ? FLOW_KNOBS->BUGGIFY_SIM_PAGE_CACHE_64K : FLOW_KNOBS->SIM_PAGE_CACHE_64K;
|
|
auto caches = std::make_pair(makeReference<EvictablePageCache>(4096, pageCacheSize4k),
|
|
makeReference<EvictablePageCache>(65536, pageCacheSize64k));
|
|
simulatorPageCaches[g_network->getLocalAddress()] = caches;
|
|
pageCache = (flags & IAsyncFile::OPEN_LARGE_PAGES) ? caches.second : caches.first;
|
|
} else
|
|
pageCache = (flags & IAsyncFile::OPEN_LARGE_PAGES) ? cacheItr->second.second : cacheItr->second.first;
|
|
} else {
|
|
if (flags & IAsyncFile::OPEN_LARGE_PAGES) {
|
|
if (!pc64k.present())
|
|
pc64k = makeReference<EvictablePageCache>(65536, FLOW_KNOBS->PAGE_CACHE_64K);
|
|
pageCache = pc64k.get();
|
|
} else {
|
|
if (!pc4k.present())
|
|
pc4k = makeReference<EvictablePageCache>(4096, FLOW_KNOBS->PAGE_CACHE_4K);
|
|
pageCache = pc4k.get();
|
|
}
|
|
}
|
|
|
|
return open_impl(filename, flags, mode, pageCache);
|
|
}
|
|
|
|
template <bool writing>
|
|
Future<Void> AsyncFileCached::read_write_impl(AsyncFileCached* self,
|
|
typename std::conditional_t<writing, const uint8_t*, uint8_t*> data,
|
|
int length,
|
|
int64_t offset) {
|
|
if constexpr (writing) {
|
|
if (offset + length > self->length)
|
|
self->length = offset + length;
|
|
}
|
|
|
|
std::vector<Future<Void>> actors;
|
|
|
|
int offsetInPage = offset % self->pageCache->pageSize;
|
|
int64_t pageOffset = offset - offsetInPage;
|
|
|
|
int remaining = length;
|
|
|
|
while (remaining) {
|
|
++self->countFileCacheFinds;
|
|
++self->countCacheFinds;
|
|
auto p = self->pages.find(pageOffset);
|
|
if (p == self->pages.end()) {
|
|
AFCPage* page = new AFCPage(self, pageOffset);
|
|
p = self->pages.insert(std::make_pair(pageOffset, page)).first;
|
|
} else {
|
|
self->pageCache->updateHit(p->second);
|
|
}
|
|
|
|
int bytesInPage = std::min(self->pageCache->pageSize - offsetInPage, remaining);
|
|
|
|
Future<Void> w;
|
|
if constexpr (writing) {
|
|
w = p->second->write(data, bytesInPage, offsetInPage);
|
|
} else {
|
|
w = p->second->read(data, bytesInPage, offsetInPage);
|
|
}
|
|
if (!w.isReady() || w.isError())
|
|
actors.push_back(w);
|
|
|
|
data += bytesInPage;
|
|
pageOffset += self->pageCache->pageSize;
|
|
offsetInPage = 0;
|
|
|
|
remaining -= bytesInPage;
|
|
}
|
|
|
|
// This is susceptible to the introduction of waits on the read/write path: no wait can occur prior to
|
|
// AFCPage::readThrough or prevLength will be set prematurely
|
|
self->prevLength = self->length;
|
|
|
|
return waitForAll(actors);
|
|
}
|
|
|
|
Future<Void> AsyncFileCached::readZeroCopy(void** data, int* length, int64_t offset) {
|
|
++countFileCacheReads;
|
|
++countCacheReads;
|
|
|
|
// Only aligned page reads are zero-copy
|
|
if (*length != pageCache->pageSize || (offset & (pageCache->pageSize - 1)) || offset + *length > this->length)
|
|
return io_error();
|
|
|
|
auto p = pages.find(offset);
|
|
if (p == pages.end()) {
|
|
AFCPage* page = new AFCPage(this, offset);
|
|
p = pages.insert(std::make_pair(offset, page)).first;
|
|
} else {
|
|
p->second->pageCache->updateHit(p->second);
|
|
}
|
|
|
|
*data = p->second->data;
|
|
|
|
return p->second->readZeroCopy();
|
|
}
|
|
void AsyncFileCached::releaseZeroCopy(void* data, int length, int64_t offset) {
|
|
ASSERT(length == pageCache->pageSize && !(offset & (pageCache->pageSize - 1)) && offset + length <= this->length);
|
|
auto p = pages.find(offset);
|
|
// If the page is in the cache and the data pointer matches then release the page
|
|
if (p != pages.end() && p->second->data == data) {
|
|
p->second->releaseZeroCopy();
|
|
} else {
|
|
// Otherwise, the data pointer might exist in the orphaned pages map
|
|
auto o = orphanedPages.find(data);
|
|
if (o != orphanedPages.end()) {
|
|
if (o->second == 1) {
|
|
if (data) {
|
|
if (length == 4096)
|
|
FastAllocator<4096>::release(data);
|
|
else
|
|
aligned_free(data);
|
|
}
|
|
} else {
|
|
--o->second;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
Future<Void> AsyncFileCached::changeFileSize(int64_t size) {
|
|
++countFileCacheWrites;
|
|
++countCacheWrites;
|
|
|
|
std::vector<Future<Void>> actors;
|
|
int64_t oldLength = length;
|
|
|
|
int offsetInPage = size % pageCache->pageSize;
|
|
int64_t pageOffset = size - offsetInPage;
|
|
|
|
if (offsetInPage == 0 && size == length) {
|
|
return Void();
|
|
}
|
|
|
|
length = size;
|
|
prevLength = size;
|
|
|
|
if (offsetInPage) {
|
|
TEST(true); // Truncating to the middle of a page
|
|
auto p = pages.find(pageOffset);
|
|
if (p != pages.end()) {
|
|
auto f = p->second->flush();
|
|
if (!f.isReady() || f.isError())
|
|
actors.push_back(f);
|
|
} else {
|
|
TEST(true); // Truncating to the middle of a page that isn't in cache
|
|
}
|
|
|
|
pageOffset += pageCache->pageSize;
|
|
}
|
|
|
|
// if this call to truncate results in a larger file, there is no
|
|
// need to erase any pages
|
|
if (oldLength > pageOffset) {
|
|
// Iterating through all pages results in better cache locality than
|
|
// looking up pages one by one in the hash table. However, if we only need
|
|
// to truncate a small portion of data, looking up pages one by one should
|
|
// be faster. So for now we do single key lookup for each page if it results
|
|
// in less than a fixed percentage of the unordered map being accessed.
|
|
int64_t numLookups = (oldLength + (pageCache->pageSize - 1) - pageOffset) / pageCache->pageSize;
|
|
if (numLookups < pages.size() * FLOW_KNOBS->PAGE_CACHE_TRUNCATE_LOOKUP_FRACTION) {
|
|
for (int64_t offset = pageOffset; offset < oldLength; offset += pageCache->pageSize) {
|
|
auto iter = pages.find(offset);
|
|
if (iter != pages.end()) {
|
|
auto f = iter->second->truncate();
|
|
if (!f.isReady() || f.isError()) {
|
|
actors.push_back(f);
|
|
}
|
|
pages.erase(iter);
|
|
}
|
|
}
|
|
} else {
|
|
for (auto p = pages.begin(); p != pages.end();) {
|
|
if (p->first >= pageOffset) {
|
|
auto f = p->second->truncate();
|
|
if (!f.isReady() || f.isError()) {
|
|
actors.push_back(f);
|
|
}
|
|
auto last = p;
|
|
++p;
|
|
pages.erase(last);
|
|
} else {
|
|
++p;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
// Wait for the page truncations to finish, then truncate the underlying file
|
|
// Template types are being provided explicitly because they can't be automatically deduced for some reason.
|
|
return mapAsync<Void, std::function<Future<Void>(Void)>, Void>(
|
|
waitForAll(actors), [=](Void _) -> Future<Void> { return uncached->truncate(size); });
|
|
}
|
|
|
|
Future<Void> AsyncFileCached::flush() {
|
|
++countFileCacheWrites;
|
|
++countCacheWrites;
|
|
|
|
std::vector<Future<Void>> unflushed;
|
|
|
|
int debug_count = flushable.size();
|
|
for (int i = 0; i < flushable.size();) {
|
|
auto p = flushable[i];
|
|
auto f = p->flush();
|
|
if (!f.isReady() || f.isError())
|
|
unflushed.push_back(f);
|
|
ASSERT((i < flushable.size() && flushable[i] == p) != f.isReady());
|
|
if (!f.isReady())
|
|
i++;
|
|
}
|
|
ASSERT(flushable.size() <= debug_count);
|
|
|
|
return waitForAll(unflushed);
|
|
}
|
|
|
|
Future<Void> AsyncFileCached::quiesce() {
|
|
std::vector<Future<Void>> unquiescent;
|
|
|
|
for (auto i = pages.begin(); i != pages.end(); ++i) {
|
|
auto f = i->second->quiesce();
|
|
if (!f.isReady())
|
|
unquiescent.push_back(f);
|
|
}
|
|
|
|
// Errors are absorbed because we need everything to finish
|
|
return waitForAllReady(unquiescent);
|
|
}
|
|
|
|
AsyncFileCached::~AsyncFileCached() {
|
|
while (!pages.empty()) {
|
|
auto ok = pages.begin()->second->evict();
|
|
ASSERT_ABORT(ok);
|
|
}
|
|
openFiles.erase(filename);
|
|
}
|