121 lines
4.4 KiB
C++
121 lines
4.4 KiB
C++
/*
|
|
* KillRegion.actor.cpp
|
|
*
|
|
* This source file is part of the FoundationDB open source project
|
|
*
|
|
* Copyright 2013-2018 Apple Inc. and the FoundationDB project authors
|
|
*
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
* you may not use this file except in compliance with the License.
|
|
* You may obtain a copy of the License at
|
|
*
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
* See the License for the specific language governing permissions and
|
|
* limitations under the License.
|
|
*/
|
|
|
|
#include "fdbclient/NativeAPI.actor.h"
|
|
#include "fdbserver/TesterInterface.actor.h"
|
|
#include "fdbserver/WorkerInterface.actor.h"
|
|
#include "fdbserver/workloads/workloads.actor.h"
|
|
#include "fdbserver/RecoveryState.h"
|
|
#include "fdbserver/ServerDBInfo.h"
|
|
#include "fdbrpc/simulator.h"
|
|
#include "fdbclient/ManagementAPI.actor.h"
|
|
#include "flow/actorcompiler.h" // This must be the last include.
|
|
|
|
struct KillRegionWorkload : TestWorkload {
|
|
bool enabled;
|
|
double testDuration;
|
|
|
|
KillRegionWorkload( WorkloadContext const& wcx )
|
|
: TestWorkload(wcx)
|
|
{
|
|
enabled = !clientId && g_network->isSimulated(); // only do this on the "first" client, and only when in simulation
|
|
testDuration = getOption( options, LiteralStringRef("testDuration"), 10.0 );
|
|
g_simulator.usableRegions = 1;
|
|
}
|
|
|
|
std::string description() const override { return "KillRegionWorkload"; }
|
|
Future<Void> setup(Database const& cx) override {
|
|
if(enabled) {
|
|
return _setup( this, cx );
|
|
}
|
|
return Void();
|
|
}
|
|
Future<Void> start(Database const& cx) override {
|
|
if(enabled) {
|
|
return killRegion( this, cx );
|
|
}
|
|
return Void();
|
|
}
|
|
Future<bool> check(Database const& cx) override { return true; }
|
|
void getMetrics(vector<PerfMetric>& m) override {}
|
|
|
|
ACTOR static Future<Void> _setup( KillRegionWorkload *self, Database cx ) {
|
|
TraceEvent("ForceRecovery_DisablePrimaryBegin");
|
|
wait(success( changeConfig( cx, g_simulator.disablePrimary, true ) ));
|
|
TraceEvent("ForceRecovery_WaitForRemote");
|
|
wait( waitForPrimaryDC(cx, LiteralStringRef("1")) );
|
|
TraceEvent("ForceRecovery_DisablePrimaryComplete");
|
|
return Void();
|
|
}
|
|
|
|
ACTOR static Future<Void> waitForStorageRecovered( KillRegionWorkload *self ) {
|
|
while( self->dbInfo->get().recoveryState < RecoveryState::STORAGE_RECOVERED ) {
|
|
wait( self->dbInfo->onChange() );
|
|
}
|
|
return Void();
|
|
}
|
|
|
|
ACTOR static Future<Void> killRegion( KillRegionWorkload *self, Database cx ) {
|
|
ASSERT( g_network->isSimulated() );
|
|
if(deterministicRandom()->random01() < 0.5) {
|
|
TraceEvent("ForceRecovery_DisableRemoteBegin");
|
|
wait( success( changeConfig( cx, g_simulator.disableRemote, true ) ) );
|
|
TraceEvent("ForceRecovery_WaitForPrimary");
|
|
wait( waitForPrimaryDC(cx, LiteralStringRef("0")) );
|
|
TraceEvent("ForceRecovery_DisableRemoteComplete");
|
|
wait( success( changeConfig( cx, g_simulator.originalRegions, true ) ) );
|
|
}
|
|
TraceEvent("ForceRecovery_Wait");
|
|
wait( delay( deterministicRandom()->random01() * self->testDuration ) );
|
|
|
|
g_simulator.killDataCenter( LiteralStringRef("0"), deterministicRandom()->random01() < 0.5 ? ISimulator::KillInstantly : ISimulator::RebootAndDelete, true );
|
|
g_simulator.killDataCenter( LiteralStringRef("2"), deterministicRandom()->random01() < 0.5 ? ISimulator::KillInstantly : ISimulator::RebootAndDelete, true );
|
|
g_simulator.killDataCenter( LiteralStringRef("4"), deterministicRandom()->random01() < 0.5 ? ISimulator::KillInstantly : ISimulator::RebootAndDelete, true );
|
|
|
|
TraceEvent("ForceRecovery_Begin");
|
|
|
|
wait( forceRecovery(cx->getConnectionFile(), LiteralStringRef("1")) );
|
|
|
|
TraceEvent("ForceRecovery_UsableRegions");
|
|
|
|
DatabaseConfiguration conf = wait(getDatabaseConfiguration(cx));
|
|
|
|
TraceEvent("ForceRecovery_GotConfig").detail("Conf", conf.toString());
|
|
|
|
if(conf.usableRegions>1) {
|
|
loop {
|
|
//only needed if force recovery was unnecessary and we killed the secondary
|
|
wait( success( changeConfig( cx, g_simulator.disablePrimary + " repopulate_anti_quorum=1", true ) ) );
|
|
choose {
|
|
when( wait( waitForStorageRecovered(self) ) ) { break; }
|
|
when( wait( delay(300.0) ) ) { }
|
|
}
|
|
}
|
|
wait( success( changeConfig( cx, "usable_regions=1", true ) ) );
|
|
}
|
|
|
|
TraceEvent("ForceRecovery_Complete");
|
|
|
|
return Void();
|
|
}
|
|
};
|
|
|
|
WorkloadFactory<KillRegionWorkload> KillRegionWorkloadFactory("KillRegion");
|