foundationdb/fdbserver/workloads/IncrementalBackup.actor.cpp

228 lines
8.4 KiB
C++

/*
* IncrementalBackup.actor.cpp
*
* This source file is part of the FoundationDB open source project
*
* Copyright 2013-2018 Apple Inc. and the FoundationDB project authors
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include "fdbclient/FDBTypes.h"
#include "fdbclient/Knobs.h"
#include "fdbclient/SystemData.h"
#include "fdbclient/ReadYourWrites.h"
#include "fdbrpc/simulator.h"
#include "fdbclient/BackupAgent.actor.h"
#include "fdbclient/BackupContainer.h"
#include "fdbserver/workloads/workloads.actor.h"
#include "flow/Arena.h"
#include "flow/serialize.h"
#include "flow/actorcompiler.h" // This must be the last #include.
struct IncrementalBackupWorkload : TestWorkload {
Standalone<StringRef> backupDir;
Standalone<StringRef> tag;
FileBackupAgent backupAgent;
bool submitOnly;
bool restoreOnly;
bool waitForBackup;
int waitRetries;
bool stopBackup;
bool checkBeginVersion;
bool clearBackupAgentKeys;
IncrementalBackupWorkload(WorkloadContext const& wcx) : TestWorkload(wcx) {
backupDir = getOption(options, LiteralStringRef("backupDir"), LiteralStringRef("file://simfdb/backups/"));
tag = getOption(options, LiteralStringRef("tag"), LiteralStringRef("default"));
submitOnly = getOption(options, LiteralStringRef("submitOnly"), false);
restoreOnly = getOption(options, LiteralStringRef("restoreOnly"), false);
waitForBackup = getOption(options, LiteralStringRef("waitForBackup"), false);
waitRetries = getOption(options, LiteralStringRef("waitRetries"), -1);
stopBackup = getOption(options, LiteralStringRef("stopBackup"), false);
checkBeginVersion = getOption(options, LiteralStringRef("checkBeginVersion"), false);
clearBackupAgentKeys = getOption(options, LiteralStringRef("clearBackupAgentKeys"), false);
}
std::string description() const override { return "IncrementalBackup"; }
Future<Void> setup(Database const& cx) override { return Void(); }
Future<Void> start(Database const& cx) override {
if (clientId) {
return Void();
}
return _start(cx, this);
}
Future<bool> check(Database const& cx) override {
if (clientId) {
return true;
}
return _check(cx, this);
}
ACTOR static Future<bool> _check(Database cx, IncrementalBackupWorkload* self) {
if (self->waitForBackup) {
// Undergoing recovery with the snapshot system keys set will pause the backup agent
// Pre-emptively unpause any backup agents before attempting to wait to avoid getting stuck
wait(self->backupAgent.changePause(cx, false));
state Reference<IBackupContainer> backupContainer;
state UID backupUID;
state Version v;
state Transaction tr(cx);
loop {
try {
wait(store(v, tr.getReadVersion()));
break;
} catch (Error& e) {
wait(tr.onError(e));
}
}
loop {
// Wait for backup container to be created and avoid race condition
TraceEvent("IBackupWaitContainer");
wait(success(
self->backupAgent.waitBackup(cx, self->tag.toString(), false, &backupContainer, &backupUID)));
if (!backupContainer.isValid()) {
TraceEvent("IBackupCheckListContainersAttempt");
state std::vector<std::string> containers =
wait(IBackupContainer::listContainers(self->backupDir.toString()));
TraceEvent("IBackupCheckListContainersSuccess")
.detail("Size", containers.size())
.detail("First", containers.front());
if (containers.size()) {
backupContainer = IBackupContainer::openContainer(containers.front());
}
}
state bool e = wait(backupContainer->exists());
if (e) break;
wait(delay(5.0));
}
state int tries = 0;
loop {
tries++;
BackupDescription desc = wait(backupContainer->describeBackup(true));
TraceEvent("IBackupVersionGate")
.detail("MaxLogEndVersion", desc.maxLogEnd.present() ? desc.maxLogEnd.get() : invalidVersion)
.detail("ContiguousLogEndVersion",
desc.contiguousLogEnd.present() ? desc.contiguousLogEnd.get() : invalidVersion)
.detail("TargetVersion", v);
if (!desc.contiguousLogEnd.present()) continue;
if (desc.contiguousLogEnd.get() >= v) break;
if (self->waitRetries != -1 && tries > self->waitRetries) break;
// Avoid spamming requests with a delay
wait(delay(5.0));
}
}
if (self->stopBackup) {
try {
TraceEvent("IBackupDiscontinueBackup");
wait(self->backupAgent.discontinueBackup(cx, self->tag));
} catch (Error& e) {
TraceEvent("IBackupDiscontinueBackupException").error(e);
if (e.code() != error_code_backup_unneeded) {
throw;
}
}
}
return true;
}
ACTOR static Future<Void> _start(Database cx, IncrementalBackupWorkload* self) {
if (self->submitOnly) {
Standalone<VectorRef<KeyRangeRef>> backupRanges;
backupRanges.push_back_deep(backupRanges.arena(), normalKeys);
TraceEvent("IBackupSubmitAttempt");
try {
wait(self->backupAgent.submitBackup(cx, self->backupDir, 1e8, self->tag.toString(), backupRanges, false,
false, true));
} catch (Error& e) {
TraceEvent("IBackupSubmitError").error(e);
if (e.code() != error_code_backup_duplicate) {
throw;
}
}
TraceEvent("IBackupSubmitSuccess");
}
if (self->restoreOnly) {
if (self->clearBackupAgentKeys) {
state Transaction clearTr(cx);
// Clear Relevant System Keys
loop {
try {
clearTr.setOption(FDBTransactionOptions::ACCESS_SYSTEM_KEYS);
clearTr.setOption(FDBTransactionOptions::LOCK_AWARE);
clearTr.clear(fileBackupPrefixRange);
wait(clearTr.commit());
break;
} catch (Error& e) {
wait(clearTr.onError(e));
}
}
}
state Reference<IBackupContainer> backupContainer;
state UID backupUID;
state Version beginVersion = invalidVersion;
wait(success(self->backupAgent.waitBackup(cx, self->tag.toString(), false, &backupContainer, &backupUID)));
if (self->checkBeginVersion) {
TraceEvent("IBackupReadSystemKeys");
state Reference<ReadYourWritesTransaction> tr(new ReadYourWritesTransaction(cx));
loop {
try {
tr->setOption(FDBTransactionOptions::ACCESS_SYSTEM_KEYS);
tr->setOption(FDBTransactionOptions::LOCK_AWARE);
state Optional<Value> writeFlag = wait(tr->get(writeRecoveryKey));
state Optional<Value> versionValue = wait(tr->get(snapshotEndVersionKey));
TraceEvent("IBackupCheckSpecialKeys")
.detail("WriteRecoveryValue", writeFlag.present() ? writeFlag.get().toString() : "N/A")
.detail("EndVersionValue", versionValue.present() ? versionValue.get().toString() : "N/A");
if (!versionValue.present()) {
TraceEvent("IBackupCheckSpecialKeysFailure");
// Snapshot failed to write to special keys, possibly due to snapshot itself failing
throw key_not_found();
}
beginVersion = BinaryReader::fromStringRef<Version>(versionValue.get(), Unversioned());
TraceEvent("IBackupCheckBeginVersion").detail("Version", beginVersion);
break;
} catch (Error& e) {
TraceEvent("IBackupReadSystemKeysError").error(e);
if (e.code() == error_code_key_not_found) {
throw;
}
wait(tr->onError(e));
}
}
}
TraceEvent("IBackupStartListContainersAttempt");
state std::vector<std::string> containers =
wait(IBackupContainer::listContainers(self->backupDir.toString()));
TraceEvent("IBackupStartListContainersSuccess")
.detail("Size", containers.size())
.detail("First", containers.front());
state Key backupURL = Key(containers.front());
TraceEvent("IBackupRestoreAttempt")
.detail("BeginVersion", beginVersion);
wait(success(self->backupAgent.restore(cx, cx, Key(self->tag.toString()), backupURL, true, invalidVersion,
true, normalKeys, Key(), Key(), true, true, beginVersion)));
TraceEvent("IBackupRestoreSuccess");
}
return Void();
}
void getMetrics(vector<PerfMetric>& m) override {}
};
WorkloadFactory<IncrementalBackupWorkload> IncrementalBackupWorkloadFactory("IncrementalBackup");