Merge pull request #3442 from sfc-gh-almiller/read-after-write

Add a ReadAfterWrite workload, to measure TLog->SS propagation delay
This commit is contained in:
Russell Sears 2020-07-02 16:42:09 -07:00 committed by GitHub
commit 3e2b7e5cf0
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
4 changed files with 132 additions and 0 deletions

View File

@ -171,6 +171,7 @@ set(FDBSERVER_SRCS
workloads/RandomClogging.actor.cpp
workloads/RandomMoveKeys.actor.cpp
workloads/RandomSelector.actor.cpp
workloads/ReadAfterWrite.actor.cpp
workloads/ReadWrite.actor.cpp
workloads/RemoveServersSafely.actor.cpp
workloads/ReportConflictingKeys.actor.cpp

View File

@ -0,0 +1,125 @@
/*
* ReadAfterWrite.actor.cpp
*
* This source file is part of the FoundationDB open source project
*
* Copyright 2013-2020 Apple Inc. and the FoundationDB project authors
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include <vector>
#include "fdbclient/NativeAPI.actor.h"
#include "fdbserver/workloads/workloads.actor.h"
#include "flow/genericactors.actor.h"
#include "flow/actorcompiler.h" // This must be the last #include.
static constexpr int SAMPLE_SIZE = 10000;
// If the log->storage propagation delay is longer than 1 second, then it's likely that our read
// will see a `future_version` error from the storage server. We need to retry the read until
// a value is returned, or a different error is thrown.
ACTOR Future<double> latencyOfRead(Transaction* tr, Key k) {
state double start = timer();
loop {
try {
wait(success(tr->get(k)));
break;
} catch (Error &e) {
if (e.code() == error_code_future_version) {
continue;
}
throw;
}
}
return timer() - start;
}
// Measure the latency of a storage server making a committed value available for reading.
struct ReadAfterWriteWorkload : KVWorkload {
double testDuration;
ContinuousSample<double> propagationLatency;
ReadAfterWriteWorkload(WorkloadContext const& wcx) : KVWorkload(wcx), propagationLatency(SAMPLE_SIZE) {
testDuration = getOption(options, LiteralStringRef("testDuration"), 10.0);
}
virtual std::string description() { return "ReadAfterWriteWorkload"; }
virtual Future<Void> setup(Database const& cx) { return Void(); }
ACTOR static Future<Void> benchmark(Database cx, ReadAfterWriteWorkload* self) {
loop {
state Key key = self->getRandomKey();
state Transaction writeTr(cx);
state Transaction baselineReadTr(cx);
state Transaction afterWriteTr(cx);
try {
state Version readVersion = wait(writeTr.getReadVersion());
// We do a read in this writeTransaction only to enforce that `readVersion` is already on a storage
// server after we commit. Its existence or non-existence is irrelevant. We write back the exact same
// value (or clear the key, if empty) so that the database state is not mutated. This means this
// workload can be paired with any other workload, and it won't affect any results.
Optional<Value> value = wait( writeTr.get(key) );
if (value.present()) {
writeTr.set(key, value.get());
} else {
writeTr.clear(key);
}
wait(writeTr.commit());
Version commitVersion = writeTr.getCommittedVersion();
baselineReadTr.setVersion(readVersion);
afterWriteTr.setVersion(commitVersion);
state double baselineLatency = 0;
state double afterWriteLatency = 0;
wait(store(baselineLatency, latencyOfRead(&baselineReadTr, key)) &&
store(afterWriteLatency, latencyOfRead(&afterWriteTr, key)));
// By reading the same key at two different versions, we should be able to measure the latency of the
// network, the storage server overhead, and the propagation delay, and then with our baseline read,
// subtract out the network and the storage server overhead, leaving only the propagation delay.
self->propagationLatency.addSample(std::max<double>(afterWriteLatency - baselineLatency, 0));
} catch (Error& e) {
wait(writeTr.onError(e));
}
}
}
virtual Future<Void> start(Database const& cx) { return _start(cx, this); }
ACTOR Future<Void> _start(Database cx, ReadAfterWriteWorkload* self) {
state Future<Void> lifetime = benchmark(cx, self);
wait(delay(self->testDuration));
return Void();
}
virtual Future<bool> check(Database const& cx) override { return true; }
virtual void getMetrics(std::vector<PerfMetric>& m) {
m.emplace_back("Mean Latency (ms)", 1000 * propagationLatency.mean(), true);
m.emplace_back("Median Latency (ms, averaged)", 1000 * propagationLatency.median(), true);
m.emplace_back("90% Latency (ms, averaged)", 1000 * propagationLatency.percentile(0.90), true);
m.emplace_back("99% Latency (ms, averaged)", 1000 * propagationLatency.percentile(0.99), true);
m.emplace_back("Max Latency (ms, averaged)", 1000 * propagationLatency.max(), true);
}
};
WorkloadFactory<ReadAfterWriteWorkload> ReadAfterWriteWorkloadFactory("ReadAfterWrite");

View File

@ -65,6 +65,7 @@ if(WITH_PYTHON)
add_fdb_test(TEST_FILES RandomRead.txt IGNORE)
add_fdb_test(TEST_FILES RandomReadWrite.txt IGNORE)
add_fdb_test(TEST_FILES ReadAbsent.txt IGNORE)
add_fdb_test(TEST_FILES ReadAfterWrite.txt IGNORE)
add_fdb_test(TEST_FILES ReadHalfAbsent.txt IGNORE)
add_fdb_test(TEST_FILES fast/ReadHotDetectionCorrectness.txt)
add_fdb_test(TEST_FILES RedwoodCorrectnessUnits.txt IGNORE)

5
tests/ReadAfterWrite.txt Normal file
View File

@ -0,0 +1,5 @@
testTitle=ReadAfterWriteTest
testName=ReadAfterWrite
testDuration=10
waitForQuiescenceBegin=false
waitForQuiescenceEnd=false