Merge pull request #3442 from sfc-gh-almiller/read-after-write

Add a ReadAfterWrite workload, to measure TLog->SS propagation delay
2020-07-02 16:42:09 -07:00 · 2020-07-02 16:42:09 -07:00 · 3e2b7e5cf0
parent b7189f5168 c76e0cfe04
commit 3e2b7e5cf0
4 changed files with 132 additions and 0 deletions
--- a/fdbserver/CMakeLists.txt
+++ b/fdbserver/CMakeLists.txt
@ -171,6 +171,7 @@ set(FDBSERVER_SRCS
  workloads/RandomClogging.actor.cpp
  workloads/RandomMoveKeys.actor.cpp
  workloads/RandomSelector.actor.cpp
+  workloads/ReadAfterWrite.actor.cpp
  workloads/ReadWrite.actor.cpp
  workloads/RemoveServersSafely.actor.cpp
  workloads/ReportConflictingKeys.actor.cpp
--- a/fdbserver/workloads/ReadAfterWrite.actor.cpp
+++ b/fdbserver/workloads/ReadAfterWrite.actor.cpp
@ -0,0 +1,125 @@
+/*
+ * ReadAfterWrite.actor.cpp
+ *
+ * This source file is part of the FoundationDB open source project
+ *
+ * Copyright 2013-2020 Apple Inc. and the FoundationDB project authors
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+#include <vector>
+
+#include "fdbclient/NativeAPI.actor.h"
+#include "fdbserver/workloads/workloads.actor.h"
+#include "flow/genericactors.actor.h"
+#include "flow/actorcompiler.h" // This must be the last #include.
+
+static constexpr int SAMPLE_SIZE = 10000;
+
+// If the log->storage propagation delay is longer than 1 second, then it's likely that our read
+// will see a `future_version` error from the storage server.  We need to retry the read until
+// a value is returned, or a different error is thrown.
+ACTOR Future<double> latencyOfRead(Transaction* tr, Key k) {
+	state double start = timer();
+	loop {
+		try {
+			wait(success(tr->get(k)));
+			break;
+		} catch (Error &e) {
+			if (e.code() == error_code_future_version) {
+				continue;
+			}
+			throw;
+		}
+	}
+	return timer() - start;
+}
+
+// Measure the latency of a storage server making a committed value available for reading.
+struct ReadAfterWriteWorkload : KVWorkload {
+
+	double testDuration;
+	ContinuousSample<double> propagationLatency;
+
+	ReadAfterWriteWorkload(WorkloadContext const& wcx) : KVWorkload(wcx), propagationLatency(SAMPLE_SIZE) {
+		testDuration = getOption(options, LiteralStringRef("testDuration"), 10.0);
+	}
+
+	virtual std::string description() { return "ReadAfterWriteWorkload"; }
+
+	virtual Future<Void> setup(Database const& cx) { return Void(); }
+
+	ACTOR static Future<Void> benchmark(Database cx, ReadAfterWriteWorkload* self) {
+		loop {
+			state Key key = self->getRandomKey();
+			state Transaction writeTr(cx);
+			state Transaction baselineReadTr(cx);
+			state Transaction afterWriteTr(cx);
+
+			try {
+				state Version readVersion = wait(writeTr.getReadVersion());
+
+				// We do a read in this writeTransaction only to enforce that `readVersion` is already on a storage
+				// server after we commit.  Its existence or non-existence is irrelevant.  We write back the exact same
+				// value (or clear the key, if empty) so that the database state is not mutated.  This means this
+				// workload can be paired with any other workload, and it won't affect any results.
+				Optional<Value> value = wait( writeTr.get(key) );
+				if (value.present()) {
+					writeTr.set(key, value.get());
+				} else {
+					writeTr.clear(key);
+				}
+
+				wait(writeTr.commit());
+
+				Version commitVersion = writeTr.getCommittedVersion();
+
+				baselineReadTr.setVersion(readVersion);
+				afterWriteTr.setVersion(commitVersion);
+
+				state double baselineLatency = 0;
+				state double afterWriteLatency = 0;
+
+				wait(store(baselineLatency, latencyOfRead(&baselineReadTr, key)) &&
+				     store(afterWriteLatency, latencyOfRead(&afterWriteTr, key)));
+
+				// By reading the same key at two different versions, we should be able to measure the latency of the
+				// network, the storage server overhead, and the propagation delay, and then with our baseline read,
+				// subtract out the network and the storage server overhead, leaving only the propagation delay.
+				self->propagationLatency.addSample(std::max<double>(afterWriteLatency - baselineLatency, 0));
+			} catch (Error& e) {
+				wait(writeTr.onError(e));
+			}
+		}
+	}
+
+	virtual Future<Void> start(Database const& cx) { return _start(cx, this); }
+	ACTOR Future<Void> _start(Database cx, ReadAfterWriteWorkload* self) {
+		state Future<Void> lifetime = benchmark(cx, self);
+		wait(delay(self->testDuration));
+		return Void();
+	}
+
+	virtual Future<bool> check(Database const& cx) override { return true; }
+
+	virtual void getMetrics(std::vector<PerfMetric>& m) {
+		m.emplace_back("Mean Latency (ms)", 1000 * propagationLatency.mean(), true);
+		m.emplace_back("Median Latency (ms, averaged)", 1000 * propagationLatency.median(), true);
+		m.emplace_back("90% Latency (ms, averaged)", 1000 * propagationLatency.percentile(0.90), true);
+		m.emplace_back("99% Latency (ms, averaged)", 1000 * propagationLatency.percentile(0.99), true);
+		m.emplace_back("Max Latency (ms, averaged)", 1000 * propagationLatency.max(), true);
+	}
+};
+
+WorkloadFactory<ReadAfterWriteWorkload> ReadAfterWriteWorkloadFactory("ReadAfterWrite");
--- a/tests/CMakeLists.txt
+++ b/tests/CMakeLists.txt
@ -65,6 +65,7 @@ if(WITH_PYTHON)
  add_fdb_test(TEST_FILES RandomRead.txt IGNORE)
  add_fdb_test(TEST_FILES RandomReadWrite.txt IGNORE)
  add_fdb_test(TEST_FILES ReadAbsent.txt IGNORE)
+  add_fdb_test(TEST_FILES ReadAfterWrite.txt IGNORE)
  add_fdb_test(TEST_FILES ReadHalfAbsent.txt IGNORE)
  add_fdb_test(TEST_FILES fast/ReadHotDetectionCorrectness.txt)
  add_fdb_test(TEST_FILES RedwoodCorrectnessUnits.txt IGNORE)
--- a/tests/ReadAfterWrite.txt
+++ b/tests/ReadAfterWrite.txt
@ -0,0 +1,5 @@
+testTitle=ReadAfterWriteTest
+testName=ReadAfterWrite
+testDuration=10
+waitForQuiescenceBegin=false
+waitForQuiescenceEnd=false