2017-05-26 04:48:44 +08:00
|
|
|
/*
|
|
|
|
* AsyncFileCached.actor.h
|
|
|
|
*
|
|
|
|
* This source file is part of the FoundationDB open source project
|
|
|
|
*
|
2022-03-22 04:36:23 +08:00
|
|
|
* Copyright 2013-2022 Apple Inc. and the FoundationDB project authors
|
2018-02-22 02:25:11 +08:00
|
|
|
*
|
2017-05-26 04:48:44 +08:00
|
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
* you may not use this file except in compliance with the License.
|
|
|
|
* You may obtain a copy of the License at
|
2018-02-22 02:25:11 +08:00
|
|
|
*
|
2017-05-26 04:48:44 +08:00
|
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
2018-02-22 02:25:11 +08:00
|
|
|
*
|
2017-05-26 04:48:44 +08:00
|
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
* See the License for the specific language governing permissions and
|
|
|
|
* limitations under the License.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#pragma once
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
// When actually compiled (NO_INTELLISENSE), include the generated version of this file. In intellisense use the source
|
|
|
|
// version.
|
2017-05-26 04:48:44 +08:00
|
|
|
#if defined(NO_INTELLISENSE) && !defined(FLOW_ASYNCFILECACHED_ACTOR_G_H)
|
2021-03-11 02:06:03 +08:00
|
|
|
#define FLOW_ASYNCFILECACHED_ACTOR_G_H
|
|
|
|
#include "fdbrpc/AsyncFileCached.actor.g.h"
|
2017-05-26 04:48:44 +08:00
|
|
|
#elif !defined(FLOW_ASYNCFILECACHED_ACTOR_H)
|
2021-03-11 02:06:03 +08:00
|
|
|
#define FLOW_ASYNCFILECACHED_ACTOR_H
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2019-04-30 17:33:12 +08:00
|
|
|
#include <boost/intrusive/list.hpp>
|
2020-05-23 00:25:32 +08:00
|
|
|
#include <type_traits>
|
2019-04-30 17:33:12 +08:00
|
|
|
|
2017-05-26 04:48:44 +08:00
|
|
|
#include "flow/flow.h"
|
2018-10-20 01:30:13 +08:00
|
|
|
#include "fdbrpc/IAsyncFile.h"
|
2017-05-26 04:48:44 +08:00
|
|
|
#include "flow/Knobs.h"
|
|
|
|
#include "flow/TDMetric.actor.h"
|
|
|
|
#include "flow/network.h"
|
2021-03-11 02:06:03 +08:00
|
|
|
#include "flow/actorcompiler.h" // This must be the last #include.
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2019-04-30 17:33:12 +08:00
|
|
|
namespace bi = boost::intrusive;
|
2017-05-26 04:48:44 +08:00
|
|
|
struct EvictablePage {
|
|
|
|
void* data;
|
|
|
|
int index;
|
|
|
|
class Reference<struct EvictablePageCache> pageCache;
|
2019-04-30 17:33:12 +08:00
|
|
|
bi::list_member_hook<> member_hook;
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
virtual bool evict() = 0; // true if page was evicted, false if it isn't immediately evictable (but will be evicted
|
|
|
|
// regardless if possible)
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
EvictablePage(Reference<EvictablePageCache> pageCache) : data(0), index(-1), pageCache(pageCache) {}
|
|
|
|
virtual ~EvictablePage();
|
|
|
|
};
|
|
|
|
|
|
|
|
// Tracks the EvictablePages that share one page budget and evicts pages when the budget is reached.
// Under RANDOM eviction pages live in the `pages` vector; under LRU eviction they live in the intrusive
// `lruPages` list, ordered from least recently used (head) to most recently used (tail).
struct EvictablePageCache : ReferenceCounted<EvictablePageCache> {
	using List =
	    bi::list<EvictablePage, bi::member_hook<EvictablePage, bi::list_member_hook<>, &EvictablePage::member_hook>>;
	enum CacheEvictionType { RANDOM = 0, LRU = 1 };

	// Converts a policy name to its enum value. Matching is case-insensitive; the accepted names are
	// "random" and "lru". Any other string throws invalid_cache_eviction_policy.
	static CacheEvictionType evictionPolicyStringToEnum(const std::string& policy) {
		std::string cep = policy;
		// tolower() has undefined behavior when given a negative value other than EOF, which is what a plain
		// (signed) char holding a non-ASCII byte converts to. Going through unsigned char avoids that.
		std::transform(
		    cep.begin(), cep.end(), cep.begin(), [](unsigned char c) { return static_cast<char>(::tolower(c)); });

		if (cep == "random")
			return RANDOM;
		if (cep == "lru")
			return LRU;
		throw invalid_cache_eviction_policy();
	}

	// Creates an empty cache with no page budget, using RANDOM eviction.
	EvictablePageCache() : pageSize(0), maxPages(0), cacheEvictionType(RANDOM) {}

	// pageSize: size of each page buffer handed out by allocate().
	// maxSize:  total budget; the page limit is maxSize / pageSize.
	// The eviction policy is read from the CACHE_EVICTION_POLICY flow knob.
	explicit EvictablePageCache(int pageSize, int64_t maxSize)
	  : pageSize(pageSize), maxPages(maxSize / pageSize),
	    cacheEvictionType(evictionPolicyStringToEnum(FLOW_KNOBS->CACHE_EVICTION_POLICY)) {
		cacheEvictions.init(LiteralStringRef("EvictablePageCache.CacheEvictions"));
	}

	// Gives `page` a freshly allocated buffer and starts tracking it.
	void allocate(EvictablePage* page) {
		// Each try_evict() call evicts at most one page, so up to two pages can be dropped before this one is
		// added.
		try_evict();
		try_evict();

		page->data = allocateFast4kAligned(pageSize);

		if (RANDOM == cacheEvictionType) {
			page->index = pages.size();
			pages.push_back(page);
		} else {
			lruPages.push_back(*page); // new page is considered the most recently used (placed at LRU tail)
		}
	}

	// Records a cache hit on `page`. Does nothing under RANDOM eviction.
	void updateHit(EvictablePage* page) {
		if (RANDOM != cacheEvictionType) {
			// on a hit, update page's location in the LRU so that it's most recent (tail)
			lruPages.erase(List::s_iterator_to(*page));
			lruPages.push_back(*page);
		}
	}

	// If the cache is at or over its page limit, tries to evict a single page, giving up after
	// MAX_EVICT_ATTEMPTS candidates. If we don't manage to evict anything, the caller just goes ahead and
	// exceeds the cache limit.
	void try_evict() {
		if (RANDOM == cacheEvictionType) {
			if (pages.size() < (uint64_t)maxPages || pages.empty())
				return;

			for (int attempt = 0; attempt < FLOW_KNOBS->MAX_EVICT_ATTEMPTS; attempt++) {
				int toEvict = deterministicRandom()->randomInt(0, pages.size());
				if (pages[toEvict]->evict()) {
					++cacheEvictions;
					break;
				}
			}
		} else {
			// For now, LRU is the only other CACHE_EVICTION option
			if (lruPages.size() < (uint64_t)maxPages)
				return;

			// try the least recently used pages first (starting at head of the LRU list)
			int attempt = 0;
			for (List::iterator it = lruPages.begin();
			     it != lruPages.end() && attempt < FLOW_KNOBS->MAX_EVICT_ATTEMPTS;
			     ++it, ++attempt) {
				if (it->evict()) {
					++cacheEvictions;
					// Stop immediately: `it` is not advanced again after a successful eviction.
					break;
				}
			}
		}
	}

	std::vector<EvictablePage*> pages; // pages tracked under RANDOM eviction
	List lruPages; // pages tracked under LRU eviction, least recently used first
	int pageSize; // size passed to allocateFast4kAligned() for each page buffer
	int64_t maxPages; // page count at which try_evict() starts evicting
	Int64MetricHandle cacheEvictions; // incremented once per successful eviction
	const CacheEvictionType cacheEvictionType;
};
|
|
|
|
|
|
|
|
struct AFCPage;
|
|
|
|
|
2020-11-28 02:10:41 +08:00
|
|
|
class AsyncFileCached final : public IAsyncFile, public ReferenceCounted<AsyncFileCached> {
|
2017-05-26 04:48:44 +08:00
|
|
|
friend struct AFCPage;
|
|
|
|
|
|
|
|
public:
|
2021-05-27 04:38:24 +08:00
|
|
|
// Opens a file that uses the FDB in-memory page cache
|
2021-03-11 02:06:03 +08:00
|
|
|
static Future<Reference<IAsyncFile>> open(std::string filename, int flags, int mode) {
|
2017-05-26 04:48:44 +08:00
|
|
|
//TraceEvent("AsyncFileCachedOpen").detail("Filename", filename);
|
2021-06-04 04:30:28 +08:00
|
|
|
auto itr = openFiles.find(filename);
|
|
|
|
if (itr == openFiles.end()) {
|
2021-03-11 02:06:03 +08:00
|
|
|
auto f = open_impl(filename, flags, mode);
|
|
|
|
if (f.isReady() && f.isError())
|
2017-05-26 04:48:44 +08:00
|
|
|
return f;
|
2021-06-04 04:30:28 +08:00
|
|
|
|
2021-06-04 04:51:47 +08:00
|
|
|
auto result = openFiles.try_emplace(filename, f);
|
|
|
|
|
|
|
|
// This should be inserting a new entry
|
|
|
|
ASSERT(result.second);
|
|
|
|
itr = result.first;
|
2021-06-04 04:30:28 +08:00
|
|
|
|
|
|
|
// We return here instead of falling through to the outer scope so that we don't delete all references to
|
|
|
|
// the underlying file before returning
|
|
|
|
return itr->second.get();
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
2021-06-04 04:30:28 +08:00
|
|
|
return itr->second.get();
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
|
|
|
|
2020-08-20 09:17:05 +08:00
|
|
|
Future<int> read(void* data, int length, int64_t offset) override {
|
2017-05-26 04:48:44 +08:00
|
|
|
++countFileCacheReads;
|
|
|
|
++countCacheReads;
|
|
|
|
if (offset + length > this->length) {
|
|
|
|
length = int(this->length - offset);
|
|
|
|
ASSERT(length >= 0);
|
|
|
|
}
|
2020-05-23 00:25:32 +08:00
|
|
|
auto f = read_write_impl<false>(this, static_cast<uint8_t*>(data), length, offset);
|
2021-03-11 02:06:03 +08:00
|
|
|
if (f.isReady() && !f.isError())
|
|
|
|
return length;
|
2017-05-26 04:48:44 +08:00
|
|
|
++countFileCacheReadsBlocked;
|
|
|
|
++countCacheReadsBlocked;
|
2021-03-11 02:06:03 +08:00
|
|
|
return tag(f, length);
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
ACTOR static Future<Void> write_impl(AsyncFileCached* self, void const* data, int length, int64_t offset) {
|
|
|
|
// If there is a truncate in progress before the the write position then we must
|
2017-09-21 08:58:56 +08:00
|
|
|
// wait for it to complete.
|
2021-03-11 02:06:03 +08:00
|
|
|
if (length + offset > self->currentTruncateSize)
|
2018-09-20 18:39:55 +08:00
|
|
|
wait(self->currentTruncate);
|
2017-09-21 08:58:56 +08:00
|
|
|
++self->countFileCacheWrites;
|
|
|
|
++self->countCacheWrites;
|
2020-05-23 00:25:32 +08:00
|
|
|
Future<Void> f = read_write_impl<true>(self, static_cast<const uint8_t*>(data), length, offset);
|
2017-05-26 04:48:44 +08:00
|
|
|
if (!f.isReady()) {
|
2017-09-21 08:58:56 +08:00
|
|
|
++self->countFileCacheWritesBlocked;
|
|
|
|
++self->countCacheWritesBlocked;
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
2018-09-20 18:39:55 +08:00
|
|
|
wait(f);
|
|
|
|
return Void();
|
2017-09-21 08:58:56 +08:00
|
|
|
}
|
|
|
|
|
2020-08-20 09:17:05 +08:00
|
|
|
Future<Void> write(void const* data, int length, int64_t offset) override {
|
2017-09-21 08:58:56 +08:00
|
|
|
return write_impl(this, data, length, offset);
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
|
|
|
|
2020-08-20 09:17:05 +08:00
|
|
|
Future<Void> readZeroCopy(void** data, int* length, int64_t offset) override;
|
|
|
|
void releaseZeroCopy(void* data, int length, int64_t offset) override;
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2018-09-20 18:39:55 +08:00
|
|
|
// This waits for previously started truncates to finish and then truncates
|
2020-08-20 09:17:05 +08:00
|
|
|
Future<Void> truncate(int64_t size) override { return truncate_impl(this, size); }
|
2017-09-21 08:58:56 +08:00
|
|
|
|
2018-09-20 18:39:55 +08:00
|
|
|
// This is the 'real' truncate that does the actual removal of cache blocks and then shortens the file
|
2021-03-11 02:06:03 +08:00
|
|
|
Future<Void> changeFileSize(int64_t size);
|
2017-09-21 08:58:56 +08:00
|
|
|
|
2018-09-20 18:39:55 +08:00
|
|
|
// This wrapper for the actual truncation operation enforces ordering of truncates.
|
|
|
|
// It maintains currentTruncate and currentTruncateSize so writers can wait behind truncates that would affect them.
|
2021-03-11 02:06:03 +08:00
|
|
|
ACTOR static Future<Void> truncate_impl(AsyncFileCached* self, int64_t size) {
|
2018-09-20 18:39:55 +08:00
|
|
|
wait(self->currentTruncate);
|
|
|
|
self->currentTruncateSize = size;
|
|
|
|
self->currentTruncate = self->changeFileSize(size);
|
|
|
|
wait(self->currentTruncate);
|
2017-05-26 04:48:44 +08:00
|
|
|
return Void();
|
|
|
|
}
|
|
|
|
|
2020-08-20 09:17:05 +08:00
|
|
|
Future<Void> sync() override { return waitAndSync(this, flush()); }
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2020-08-20 08:32:11 +08:00
|
|
|
Future<int64_t> size() const override { return length; }
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2020-08-20 08:32:11 +08:00
|
|
|
int64_t debugFD() const override { return uncached->debugFD(); }
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2020-08-20 08:32:11 +08:00
|
|
|
std::string getFilename() const override { return filename; }
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2020-12-10 04:03:32 +08:00
|
|
|
void setRateControl(Reference<IRateControl> const& rc) override { rateControl = rc; }
|
|
|
|
|
2021-01-24 17:50:09 +08:00
|
|
|
Reference<IRateControl> const& getRateControl() override { return rateControl; }
|
2020-12-10 04:03:32 +08:00
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
void addref() override {
|
|
|
|
ReferenceCounted<AsyncFileCached>::addref();
|
2017-05-26 04:48:44 +08:00
|
|
|
//TraceEvent("AsyncFileCachedAddRef").detail("Filename", filename).detail("Refcount", debugGetReferenceCount()).backtrace();
|
|
|
|
}
|
2020-11-28 02:10:41 +08:00
|
|
|
void delref() override {
|
2017-05-26 04:48:44 +08:00
|
|
|
if (delref_no_destroy()) {
|
|
|
|
// If this is ever ThreadSafeReferenceCounted...
|
|
|
|
// setrefCountUnsafe(0);
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
if (rateControl) {
|
|
|
|
TraceEvent(SevDebug, "AsyncFileCachedKillWaiters").detail("Filename", filename);
|
2021-01-24 17:50:09 +08:00
|
|
|
rateControl->killWaiters(io_error());
|
|
|
|
}
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
auto f = quiesce();
|
2021-03-11 02:06:03 +08:00
|
|
|
TraceEvent("AsyncFileCachedDel")
|
|
|
|
.detail("Filename", filename)
|
|
|
|
.detail("Refcount", debugGetReferenceCount())
|
2021-06-14 13:31:04 +08:00
|
|
|
.detail("CanDie", f.isReady());
|
2021-08-28 08:07:47 +08:00
|
|
|
// .backtrace();
|
2017-05-26 04:48:44 +08:00
|
|
|
if (f.isReady())
|
|
|
|
delete this;
|
|
|
|
else
|
2021-03-11 02:06:03 +08:00
|
|
|
uncancellable(holdWhile(Reference<AsyncFileCached>::addRef(this), f));
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-01-26 09:55:43 +08:00
|
|
|
~AsyncFileCached() override;
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
private:
|
2021-05-27 04:38:24 +08:00
|
|
|
// A map of filename to the file handle for all opened cached files
|
2021-05-29 05:34:20 +08:00
|
|
|
static std::map<std::string, UnsafeWeakFutureReference<IAsyncFile>> openFiles;
|
2021-05-27 04:38:24 +08:00
|
|
|
|
2017-05-26 04:48:44 +08:00
|
|
|
std::string filename;
|
|
|
|
Reference<IAsyncFile> uncached;
|
|
|
|
int64_t length;
|
|
|
|
int64_t prevLength;
|
|
|
|
std::unordered_map<int64_t, AFCPage*> pages;
|
|
|
|
std::vector<AFCPage*> flushable;
|
|
|
|
Reference<EvictablePageCache> pageCache;
|
2017-09-21 08:58:56 +08:00
|
|
|
Future<Void> currentTruncate;
|
|
|
|
int64_t currentTruncateSize;
|
2020-12-10 04:03:32 +08:00
|
|
|
Reference<IRateControl> rateControl;
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2018-07-05 17:59:13 +08:00
|
|
|
// Map of pointers which hold page buffers for pages which have been overwritten
|
|
|
|
// but at the time of write there were still readZeroCopy holders.
|
2021-03-11 02:06:03 +08:00
|
|
|
std::unordered_map<void*, int> orphanedPages;
|
2018-07-05 17:59:13 +08:00
|
|
|
|
2017-05-26 04:48:44 +08:00
|
|
|
Int64MetricHandle countFileCacheFinds;
|
|
|
|
Int64MetricHandle countFileCacheReads;
|
|
|
|
Int64MetricHandle countFileCacheWrites;
|
|
|
|
Int64MetricHandle countFileCacheReadsBlocked;
|
|
|
|
Int64MetricHandle countFileCacheWritesBlocked;
|
2019-07-11 05:43:20 +08:00
|
|
|
Int64MetricHandle countFileCachePageReadsHit;
|
|
|
|
Int64MetricHandle countFileCachePageReadsMissed;
|
2017-05-26 04:48:44 +08:00
|
|
|
Int64MetricHandle countFileCachePageReadsMerged;
|
|
|
|
Int64MetricHandle countFileCacheReadBytes;
|
|
|
|
|
|
|
|
Int64MetricHandle countCacheFinds;
|
|
|
|
Int64MetricHandle countCacheReads;
|
|
|
|
Int64MetricHandle countCacheWrites;
|
|
|
|
Int64MetricHandle countCacheReadsBlocked;
|
|
|
|
Int64MetricHandle countCacheWritesBlocked;
|
2019-07-11 05:43:20 +08:00
|
|
|
Int64MetricHandle countCachePageReadsHit;
|
|
|
|
Int64MetricHandle countCachePageReadsMissed;
|
2017-05-26 04:48:44 +08:00
|
|
|
Int64MetricHandle countCachePageReadsMerged;
|
|
|
|
Int64MetricHandle countCacheReadBytes;
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
AsyncFileCached(Reference<IAsyncFile> uncached,
|
|
|
|
const std::string& filename,
|
|
|
|
int64_t length,
|
2020-12-10 04:03:32 +08:00
|
|
|
Reference<EvictablePageCache> pageCache)
|
2021-07-23 13:48:27 +08:00
|
|
|
: filename(filename), uncached(uncached), length(length), prevLength(length), pageCache(pageCache),
|
2020-12-10 04:03:32 +08:00
|
|
|
currentTruncate(Void()), currentTruncateSize(0), rateControl(nullptr) {
|
2021-03-11 02:06:03 +08:00
|
|
|
if (!g_network->isSimulated()) {
|
2019-07-11 05:43:20 +08:00
|
|
|
countFileCacheWrites.init(LiteralStringRef("AsyncFile.CountFileCacheWrites"), filename);
|
|
|
|
countFileCacheReads.init(LiteralStringRef("AsyncFile.CountFileCacheReads"), filename);
|
|
|
|
countFileCacheWritesBlocked.init(LiteralStringRef("AsyncFile.CountFileCacheWritesBlocked"), filename);
|
|
|
|
countFileCacheReadsBlocked.init(LiteralStringRef("AsyncFile.CountFileCacheReadsBlocked"), filename);
|
|
|
|
countFileCachePageReadsHit.init(LiteralStringRef("AsyncFile.CountFileCachePageReadsHit"), filename);
|
|
|
|
countFileCachePageReadsMissed.init(LiteralStringRef("AsyncFile.CountFileCachePageReadsMissed"), filename);
|
2017-05-26 04:48:44 +08:00
|
|
|
countFileCachePageReadsMerged.init(LiteralStringRef("AsyncFile.CountFileCachePageReadsMerged"), filename);
|
2019-07-11 05:43:20 +08:00
|
|
|
countFileCacheFinds.init(LiteralStringRef("AsyncFile.CountFileCacheFinds"), filename);
|
|
|
|
countFileCacheReadBytes.init(LiteralStringRef("AsyncFile.CountFileCacheReadBytes"), filename);
|
|
|
|
|
|
|
|
countCacheWrites.init(LiteralStringRef("AsyncFile.CountCacheWrites"));
|
|
|
|
countCacheReads.init(LiteralStringRef("AsyncFile.CountCacheReads"));
|
|
|
|
countCacheWritesBlocked.init(LiteralStringRef("AsyncFile.CountCacheWritesBlocked"));
|
|
|
|
countCacheReadsBlocked.init(LiteralStringRef("AsyncFile.CountCacheReadsBlocked"));
|
|
|
|
countCachePageReadsHit.init(LiteralStringRef("AsyncFile.CountCachePageReadsHit"));
|
|
|
|
countCachePageReadsMissed.init(LiteralStringRef("AsyncFile.CountCachePageReadsMissed"));
|
2017-05-26 04:48:44 +08:00
|
|
|
countCachePageReadsMerged.init(LiteralStringRef("AsyncFile.CountCachePageReadsMerged"));
|
2019-07-11 05:43:20 +08:00
|
|
|
countCacheFinds.init(LiteralStringRef("AsyncFile.CountCacheFinds"));
|
|
|
|
countCacheReadBytes.init(LiteralStringRef("AsyncFile.CountCacheReadBytes"));
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
static Future<Reference<IAsyncFile>> open_impl(std::string filename, int flags, int mode);
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2021-05-27 04:38:24 +08:00
|
|
|
// Opens a file that uses the FDB in-memory page cache
|
2021-03-11 02:06:03 +08:00
|
|
|
ACTOR static Future<Reference<IAsyncFile>> open_impl(std::string filename,
|
|
|
|
int flags,
|
|
|
|
int mode,
|
|
|
|
Reference<EvictablePageCache> pageCache) {
|
2017-05-26 04:48:44 +08:00
|
|
|
try {
|
2018-06-09 02:11:08 +08:00
|
|
|
TraceEvent("AFCUnderlyingOpenBegin").detail("Filename", filename);
|
2021-03-11 02:06:03 +08:00
|
|
|
if (flags & IAsyncFile::OPEN_CACHED_READ_ONLY)
|
2019-01-03 02:15:59 +08:00
|
|
|
flags = (flags & ~IAsyncFile::OPEN_READWRITE) | IAsyncFile::OPEN_READONLY;
|
2017-05-26 04:48:44 +08:00
|
|
|
else
|
2019-01-03 02:15:59 +08:00
|
|
|
flags = (flags & ~IAsyncFile::OPEN_READONLY) | IAsyncFile::OPEN_READWRITE;
|
2021-03-11 02:06:03 +08:00
|
|
|
state Reference<IAsyncFile> f = wait(IAsyncFileSystem::filesystem()->open(
|
|
|
|
filename, flags | IAsyncFile::OPEN_UNCACHED | IAsyncFile::OPEN_UNBUFFERED, mode));
|
2018-06-09 02:11:08 +08:00
|
|
|
TraceEvent("AFCUnderlyingOpenEnd").detail("Filename", filename);
|
2021-03-11 02:06:03 +08:00
|
|
|
int64_t l = wait(f->size());
|
2018-06-09 02:11:08 +08:00
|
|
|
TraceEvent("AFCUnderlyingSize").detail("Filename", filename).detail("Size", l);
|
2021-05-27 04:38:24 +08:00
|
|
|
return new AsyncFileCached(f, filename, l, pageCache);
|
2017-05-26 04:48:44 +08:00
|
|
|
} catch (Error& e) {
|
2021-03-11 02:06:03 +08:00
|
|
|
if (e.code() != error_code_actor_cancelled)
|
|
|
|
openFiles.erase(filename);
|
2017-05-26 04:48:44 +08:00
|
|
|
throw e;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-08-20 09:17:05 +08:00
|
|
|
Future<Void> flush() override;
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
Future<Void> quiesce();
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
ACTOR static Future<Void> waitAndSync(AsyncFileCached* self, Future<Void> flush) {
|
|
|
|
wait(flush);
|
|
|
|
wait(self->uncached->sync());
|
2017-05-26 04:48:44 +08:00
|
|
|
return Void();
|
|
|
|
}
|
|
|
|
|
2020-05-23 00:25:32 +08:00
|
|
|
template <bool writing>
|
|
|
|
static Future<Void> read_write_impl(AsyncFileCached* self,
|
|
|
|
typename std::conditional_t<writing, const uint8_t*, uint8_t*> data,
|
2021-03-11 02:06:03 +08:00
|
|
|
int length,
|
|
|
|
int64_t offset);
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
void remove_page(AFCPage* page);
|
2017-05-26 04:48:44 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
struct AFCPage : public EvictablePage, public FastAllocated<AFCPage> {
|
2020-08-20 09:17:05 +08:00
|
|
|
bool evict() override {
|
2021-03-11 02:06:03 +08:00
|
|
|
if (notReading.isReady() && notFlushing.isReady() && !dirty && !zeroCopyRefCount && !truncated) {
|
|
|
|
owner->remove_page(this);
|
2017-05-26 04:48:44 +08:00
|
|
|
delete this;
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (dirty)
|
|
|
|
flush();
|
|
|
|
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
2018-07-05 17:59:13 +08:00
|
|
|
// Move this page's data into the orphanedPages set of the owner
|
|
|
|
void orphan() {
|
|
|
|
owner->orphanedPages[data] = zeroCopyRefCount;
|
|
|
|
zeroCopyRefCount = 0;
|
2018-11-07 11:31:16 +08:00
|
|
|
notReading = Void();
|
2022-03-22 07:57:38 +08:00
|
|
|
data = allocateFast4kAligned(pageCache->pageSize);
|
2018-07-05 17:59:13 +08:00
|
|
|
}
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
Future<Void> write(void const* data, int length, int offset) {
|
2018-07-05 17:59:13 +08:00
|
|
|
// If zero-copy reads are in progress, allow whole page writes to a new page buffer so the effects
|
|
|
|
// are not seen by the prior readers who still hold zeroCopyRead pointers
|
|
|
|
bool fullPage = offset == 0 && length == pageCache->pageSize;
|
2018-10-31 17:14:55 +08:00
|
|
|
ASSERT(zeroCopyRefCount == 0 || fullPage);
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
if (zeroCopyRefCount != 0) {
|
2018-11-07 11:31:16 +08:00
|
|
|
ASSERT(fullPage);
|
|
|
|
orphan();
|
|
|
|
}
|
|
|
|
|
2017-05-26 04:48:44 +08:00
|
|
|
setDirty();
|
|
|
|
|
2018-11-07 11:31:16 +08:00
|
|
|
// If there are no active readers then if data is valid or we're replacing all of it we can write directly
|
|
|
|
if (valid || fullPage) {
|
2021-03-11 02:06:03 +08:00
|
|
|
if (!fullPage) {
|
2019-07-11 05:43:20 +08:00
|
|
|
++owner->countFileCachePageReadsHit;
|
|
|
|
++owner->countCachePageReadsHit;
|
|
|
|
}
|
2017-05-26 04:48:44 +08:00
|
|
|
valid = true;
|
2021-03-11 02:06:03 +08:00
|
|
|
memcpy(static_cast<uint8_t*>(this->data) + offset, data, length);
|
2017-05-26 04:48:44 +08:00
|
|
|
return yield();
|
|
|
|
}
|
|
|
|
|
2019-07-11 05:43:20 +08:00
|
|
|
++owner->countFileCachePageReadsMissed;
|
|
|
|
++owner->countCachePageReadsMissed;
|
|
|
|
|
2018-11-07 11:31:16 +08:00
|
|
|
// If data is not valid but no read is in progress, start reading
|
2017-05-26 04:48:44 +08:00
|
|
|
if (notReading.isReady()) {
|
2021-03-11 02:06:03 +08:00
|
|
|
notReading = readThrough(this);
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
notReading = waitAndWrite(this, data, length, offset);
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
return notReading;
|
|
|
|
}
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
ACTOR static Future<Void> waitAndWrite(AFCPage* self, void const* data, int length, int offset) {
|
|
|
|
wait(self->notReading);
|
|
|
|
memcpy(static_cast<uint8_t*>(self->data) + offset, data, length);
|
2017-05-26 04:48:44 +08:00
|
|
|
return Void();
|
|
|
|
}
|
|
|
|
|
|
|
|
Future<Void> readZeroCopy() {
|
|
|
|
++zeroCopyRefCount;
|
2019-07-11 05:43:20 +08:00
|
|
|
if (valid) {
|
|
|
|
++owner->countFileCachePageReadsHit;
|
|
|
|
++owner->countCachePageReadsHit;
|
|
|
|
return yield();
|
|
|
|
}
|
|
|
|
|
|
|
|
++owner->countFileCachePageReadsMissed;
|
|
|
|
++owner->countCachePageReadsMissed;
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
if (notReading.isReady()) {
|
2021-03-11 02:06:03 +08:00
|
|
|
notReading = readThrough(this);
|
2017-05-26 04:48:44 +08:00
|
|
|
} else {
|
|
|
|
++owner->countFileCachePageReadsMerged;
|
|
|
|
++owner->countCachePageReadsMerged;
|
|
|
|
}
|
|
|
|
|
|
|
|
return notReading;
|
|
|
|
}
|
|
|
|
void releaseZeroCopy() {
|
|
|
|
--zeroCopyRefCount;
|
2021-03-11 02:06:03 +08:00
|
|
|
ASSERT(zeroCopyRefCount >= 0);
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
Future<Void> read(void* data, int length, int offset) {
|
2017-05-26 04:48:44 +08:00
|
|
|
if (valid) {
|
2019-07-11 05:43:20 +08:00
|
|
|
++owner->countFileCachePageReadsHit;
|
|
|
|
++owner->countCachePageReadsHit;
|
2017-05-26 04:48:44 +08:00
|
|
|
owner->countFileCacheReadBytes += length;
|
|
|
|
owner->countCacheReadBytes += length;
|
2021-03-11 02:06:03 +08:00
|
|
|
memcpy(data, static_cast<uint8_t const*>(this->data) + offset, length);
|
2017-05-26 04:48:44 +08:00
|
|
|
return yield();
|
|
|
|
}
|
|
|
|
|
2019-07-11 05:43:20 +08:00
|
|
|
++owner->countFileCachePageReadsMissed;
|
|
|
|
++owner->countCachePageReadsMissed;
|
|
|
|
|
2017-05-26 04:48:44 +08:00
|
|
|
if (notReading.isReady()) {
|
2021-03-11 02:06:03 +08:00
|
|
|
notReading = readThrough(this);
|
2017-05-26 04:48:44 +08:00
|
|
|
} else {
|
|
|
|
++owner->countFileCachePageReadsMerged;
|
|
|
|
++owner->countCachePageReadsMerged;
|
|
|
|
}
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
notReading = waitAndRead(this, data, length, offset);
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
return notReading;
|
|
|
|
}
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
ACTOR static Future<Void> waitAndRead(AFCPage* self, void* data, int length, int offset) {
|
|
|
|
wait(self->notReading);
|
|
|
|
memcpy(data, static_cast<uint8_t const*>(self->data) + offset, length);
|
2017-05-26 04:48:44 +08:00
|
|
|
return Void();
|
|
|
|
}
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
ACTOR static Future<Void> readThrough(AFCPage* self) {
|
2017-05-26 04:48:44 +08:00
|
|
|
ASSERT(!self->valid);
|
2021-03-11 02:06:03 +08:00
|
|
|
state void* dst = self->data;
|
|
|
|
if (self->pageOffset < self->owner->prevLength) {
|
2017-05-26 04:48:44 +08:00
|
|
|
try {
|
2021-03-11 02:06:03 +08:00
|
|
|
int _ = wait(self->owner->uncached->read(dst, self->pageCache->pageSize, self->pageOffset));
|
2017-05-26 04:48:44 +08:00
|
|
|
if (_ != self->pageCache->pageSize)
|
2021-03-11 02:06:03 +08:00
|
|
|
TraceEvent("ReadThroughShortRead")
|
|
|
|
.detail("ReadAmount", _)
|
|
|
|
.detail("PageSize", self->pageCache->pageSize)
|
|
|
|
.detail("PageOffset", self->pageOffset);
|
2017-05-26 04:48:44 +08:00
|
|
|
} catch (Error& e) {
|
|
|
|
self->zeroCopyRefCount = 0;
|
|
|
|
TraceEvent("ReadThroughFailed").error(e);
|
|
|
|
throw;
|
|
|
|
}
|
|
|
|
}
|
2018-11-07 11:31:16 +08:00
|
|
|
// If the memory we read into wasn't orphaned while we were waiting on the read then set valid to true
|
2021-03-11 02:06:03 +08:00
|
|
|
if (dst == self->data)
|
2018-11-07 11:31:16 +08:00
|
|
|
self->valid = true;
|
2017-05-26 04:48:44 +08:00
|
|
|
return Void();
|
|
|
|
}
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
ACTOR static Future<Void> writeThrough(AFCPage* self, Promise<Void> writing) {
|
|
|
|
// writeThrough can be called on a page that is not dirty, just to wait for a previous writeThrough to finish.
|
|
|
|
// In that case we don't want to do any disk I/O
|
2017-05-26 04:48:44 +08:00
|
|
|
try {
|
|
|
|
state bool dirty = self->dirty;
|
|
|
|
++self->writeThroughCount;
|
|
|
|
self->updateFlushableIndex();
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
wait(self->notReading && self->notFlushing);
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
if (dirty) {
|
2020-12-12 02:33:50 +08:00
|
|
|
// Wait for rate control if it is set
|
2021-02-03 04:39:05 +08:00
|
|
|
if (self->owner->getRateControl()) {
|
|
|
|
int allowance = 1;
|
|
|
|
// If I/O size is defined, wait for the calculated I/O quota
|
|
|
|
if (FLOW_KNOBS->FLOW_CACHEDFILE_WRITE_IO_SIZE > 0) {
|
|
|
|
allowance = (self->pageCache->pageSize + FLOW_KNOBS->FLOW_CACHEDFILE_WRITE_IO_SIZE - 1) /
|
|
|
|
FLOW_KNOBS->FLOW_CACHEDFILE_WRITE_IO_SIZE; // round up
|
|
|
|
ASSERT(allowance > 0);
|
|
|
|
}
|
|
|
|
wait(self->owner->getRateControl()->getAllowance(allowance));
|
|
|
|
}
|
2020-12-12 02:33:50 +08:00
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
if (self->pageOffset + self->pageCache->pageSize > self->owner->length) {
|
2017-05-26 04:48:44 +08:00
|
|
|
ASSERT(self->pageOffset < self->owner->length);
|
2021-03-11 02:06:03 +08:00
|
|
|
memset(static_cast<uint8_t*>(self->data) + self->owner->length - self->pageOffset,
|
|
|
|
0,
|
|
|
|
self->pageCache->pageSize - (self->owner->length - self->pageOffset));
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
auto f = self->owner->uncached->write(self->data, self->pageCache->pageSize, self->pageOffset);
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
wait(f);
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
2021-03-11 02:06:03 +08:00
|
|
|
} catch (Error& e) {
|
2017-05-26 04:48:44 +08:00
|
|
|
--self->writeThroughCount;
|
|
|
|
self->setDirty();
|
|
|
|
writing.sendError(e);
|
|
|
|
throw;
|
|
|
|
}
|
|
|
|
--self->writeThroughCount;
|
|
|
|
self->updateFlushableIndex();
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
writing.send(Void()); // FIXME: This could happen before the wait if AsyncFileKAIO dealt properly with
|
|
|
|
// overlapping write and sync operations
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
self->pageCache->try_evict();
|
|
|
|
|
|
|
|
return Void();
|
|
|
|
}
|
|
|
|
|
|
|
|
Future<Void> flush() {
|
2021-03-11 02:06:03 +08:00
|
|
|
if (!dirty && notFlushing.isReady())
|
|
|
|
return Void();
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
ASSERT(valid || !notReading.isReady() || notReading.isError());
|
|
|
|
|
|
|
|
Promise<Void> writing;
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
notFlushing = writeThrough(this, writing);
|
2017-05-26 04:48:44 +08:00
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
clearDirty(); // Do this last so that if writeThrough immediately calls try_evict, we can't be evicted before
|
|
|
|
// assigning notFlushing
|
2017-05-26 04:48:44 +08:00
|
|
|
return writing.getFuture();
|
|
|
|
}
|
|
|
|
|
|
|
|
Future<Void> quiesce() {
|
2021-03-11 02:06:03 +08:00
|
|
|
if (dirty)
|
|
|
|
flush();
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
// If we are flushing, we will be quiescent when all flushes are finished
|
|
|
|
// Returning flush() isn't right, because flush can return before notFlushing.isReady()
|
|
|
|
if (!notFlushing.isReady()) {
|
|
|
|
return notFlushing;
|
|
|
|
}
|
|
|
|
|
|
|
|
// else if we are reading, we will be quiescent when the read is finished
|
2021-03-11 02:06:03 +08:00
|
|
|
if (!notReading.isReady())
|
2017-05-26 04:48:44 +08:00
|
|
|
return notReading;
|
|
|
|
|
|
|
|
return Void();
|
|
|
|
}
|
|
|
|
|
|
|
|
Future<Void> truncate() {
|
2018-07-05 17:59:13 +08:00
|
|
|
// Allow truncatation during zero copy reads but orphan the previous buffer
|
2021-03-11 02:06:03 +08:00
|
|
|
if (zeroCopyRefCount != 0)
|
2018-07-05 17:59:13 +08:00
|
|
|
orphan();
|
2017-05-26 04:48:44 +08:00
|
|
|
truncated = true;
|
2021-03-11 02:06:03 +08:00
|
|
|
return truncate_impl(this);
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
ACTOR static Future<Void> truncate_impl(AFCPage* self) {
|
|
|
|
wait(self->notReading && self->notFlushing && yield());
|
2017-05-26 04:48:44 +08:00
|
|
|
delete self;
|
|
|
|
return Void();
|
|
|
|
}
|
|
|
|
|
2021-03-11 02:06:03 +08:00
|
|
|
AFCPage(AsyncFileCached* owner, int64_t offset)
|
2021-07-23 13:48:27 +08:00
|
|
|
: EvictablePage(owner->pageCache), owner(owner), pageOffset(offset), notReading(Void()), notFlushing(Void()),
|
|
|
|
dirty(false), valid(false), truncated(false), writeThroughCount(0), flushableIndex(-1), zeroCopyRefCount(0) {
|
2017-05-26 04:48:44 +08:00
|
|
|
pageCache->allocate(this);
|
|
|
|
}
|
|
|
|
|
2021-01-26 09:55:43 +08:00
|
|
|
~AFCPage() override {
|
2017-05-26 04:48:44 +08:00
|
|
|
clearDirty();
|
2021-03-11 02:06:03 +08:00
|
|
|
ASSERT_ABORT(flushableIndex == -1);
|
2017-05-26 04:48:44 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
void setDirty() {
|
|
|
|
dirty = true;
|
|
|
|
updateFlushableIndex();
|
|
|
|
}
|
|
|
|
|
|
|
|
void clearDirty() {
|
|
|
|
dirty = false;
|
|
|
|
updateFlushableIndex();
|
|
|
|
}
|
|
|
|
|
|
|
|
void updateFlushableIndex() {
|
|
|
|
bool flushable = dirty || writeThroughCount;
|
2021-03-11 02:06:03 +08:00
|
|
|
if (flushable == (flushableIndex != -1))
|
|
|
|
return;
|
2017-05-26 04:48:44 +08:00
|
|
|
|
|
|
|
if (flushable) {
|
|
|
|
flushableIndex = owner->flushable.size();
|
|
|
|
owner->flushable.push_back(this);
|
|
|
|
} else {
|
2021-03-11 02:06:03 +08:00
|
|
|
ASSERT(owner->flushable[flushableIndex] == this);
|
2017-05-26 04:48:44 +08:00
|
|
|
owner->flushable[flushableIndex] = owner->flushable.back();
|
|
|
|
owner->flushable[flushableIndex]->flushableIndex = flushableIndex;
|
|
|
|
owner->flushable.pop_back();
|
|
|
|
flushableIndex = -1;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
AsyncFileCached* owner;
|
|
|
|
int64_t pageOffset;
|
|
|
|
|
|
|
|
Future<Void> notReading; // .isReady when a readThrough (or waitAndWrite) is not in progress
|
|
|
|
Future<Void> notFlushing; // .isReady when a writeThrough is not in progress
|
|
|
|
|
|
|
|
bool dirty; // write has been called more recently than flush
|
|
|
|
bool valid; // data contains the file contents
|
|
|
|
bool truncated; // true if this page has been truncated
|
2021-03-11 02:06:03 +08:00
|
|
|
int writeThroughCount; // number of writeThrough actors that are in progress (potentially writing or waiting to
|
|
|
|
// write)
|
|
|
|
int flushableIndex; // index in owner->flushable[]
|
|
|
|
int zeroCopyRefCount; // references held by "zero-copy" reads
|
2017-05-26 04:48:44 +08:00
|
|
|
};
|
|
|
|
|
2018-08-11 06:47:41 +08:00
|
|
|
#include "flow/unactorcompiler.h"
|
2017-05-26 04:48:44 +08:00
|
|
|
#endif
|