/*
* Status.actor.cpp
*
* This source file is part of the FoundationDB open source project
*
* Copyright 2013-2018 Apple Inc. and the FoundationDB project authors
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include "Status.h"
#include "flow/actorcompiler.h"
#include "flow/Trace.h"
#include "fdbclient/NativeAPI.h"
#include "fdbclient/SystemData.h"
#include "fdbclient/ReadYourWrites.h"
#include "WorkerInterface.h"
#include "ClusterRecruitmentInterface.h"
#include <time.h>
#include "CoordinationInterface.h"
#include "DataDistribution.h"
#include "flow/UnitTest.h"
#include "QuietDatabase.h"
#include "RecoveryState.h"
const char* RecoveryStatus::names[] = {
"reading_coordinated_state", "locking_coordinated_state", "locking_old_transaction_servers", "reading_transaction_system_state",
"configuration_missing", "configuration_never_created", "configuration_invalid",
"recruiting_transaction_servers", "initializing_transaction_servers", "recovery_transaction",
"writing_coordinated_state", "accepting_commits", "all_logs_recruited", "storage_recovered", "fully_recovered"
};
static_assert( sizeof(RecoveryStatus::names) == sizeof(RecoveryStatus::names[0])*RecoveryStatus::END, "RecoveryStatus::names[] size" );
const char* RecoveryStatus::descriptions[] = {
// reading_coordinated_state
"Requesting information from coordination servers. Verify that a majority of coordination server processes are active.",
// locking_coordinated_state
"Locking coordination state. Verify that a majority of coordination server processes are active.",
// locking_old_transaction_servers
"Locking old transaction servers. Verify that at least one transaction server from the previous generation is running.",
// reading_transaction_system_state
"Recovering transaction server state. Verify that the transaction server processes are active.",
// configuration_missing
"There appears to be a database, but its configuration does not appear to be initialized.",
// configuration_never_created
"The coordinator(s) have no record of this database. Either the coordinator addresses are incorrect, the coordination state on those machines is missing, or no database has been created.",
// configuration_invalid
"The database configuration is invalid. Set a new, valid configuration to recover the database.",
// recruiting_transaction_servers
"Recruiting new transaction servers.",
// initializing_transaction_servers
"Initializing new transaction servers and recovering transaction logs.",
// recovery_transaction
"Performing recovery transaction.",
// writing_coordinated_state
"Writing coordinated state. Verify that a majority of coordination server processes are active.",
// accepting_commits
"Accepting commits.",
// all_logs_recruited
"Accepting commits. All logs recruited.",
// storage_recovered
"Accepting commits. All storage servers are reading from the new logs.",
// fully_recovered
"Recovery complete."
};
static_assert( sizeof(RecoveryStatus::descriptions) == sizeof(RecoveryStatus::descriptions[0])*RecoveryStatus::END, "RecoveryStatus::descriptions[] size" );
// From Ratekeeper.actor.cpp
extern int limitReasonEnd;
extern const char* limitReasonName[];
extern const char* limitReasonDesc[];
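// Maps each worker's network address to the fields of its latest trace event of a requested type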
struct WorkerEvents : std::map<NetworkAddress, TraceEventFields> {};
ACTOR static Future< Optional<TraceEventFields> > latestEventOnWorker(WorkerInterface worker, std::string eventName) {
try {
EventLogRequest req = eventName.size() > 0 ? EventLogRequest(Standalone<StringRef>(eventName)) : EventLogRequest();
ErrorOr<TraceEventFields> eventTrace = wait( errorOr(timeoutError(worker.eventLogRequest.getReply(req), 2.0)));
if (eventTrace.isError()){
return Optional<TraceEventFields>();
}
return eventTrace.get();
}
catch (Error &e){
if (e.code() == error_code_actor_cancelled)
throw;
return Optional<TraceEventFields>();
}
}
ACTOR static Future< Optional< std::pair<WorkerEvents, std::set<std::string>> > > latestEventOnWorkers(std::vector<std::pair<WorkerInterface, ProcessClass>> workers, std::string eventName) {
try {
state vector<Future<ErrorOr<TraceEventFields>>> eventTraces;
for (int c = 0; c < workers.size(); c++) {
EventLogRequest req = eventName.size() > 0 ? EventLogRequest(Standalone<StringRef>(eventName)) : EventLogRequest();
eventTraces.push_back(errorOr(timeoutError(workers[c].first.eventLogRequest.getReply(req), 2.0)));
}
Void _ = wait(waitForAll(eventTraces));
std::set<std::string> failed;
WorkerEvents results;
for (int i = 0; i < eventTraces.size(); i++) {
const ErrorOr<TraceEventFields>& v = eventTraces[i].get();
if (v.isError()){
failed.insert(workers[i].first.address().toString());
results[workers[i].first.address()] = TraceEventFields();
}
else {
results[workers[i].first.address()] = v.get();
}
}
std::pair<WorkerEvents, std::set<std::string>> val;
val.first = results;
val.second = failed;
return val;
}
catch (Error &e){
ASSERT(e.code() == error_code_actor_cancelled); // All errors should be filtered through the errorOr actor above
throw;
}
}
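// An empty event name requests each worker's most recent error event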
static Future< Optional< std::pair<WorkerEvents, std::set<std::string>> > > latestErrorOnWorkers(std::vector<std::pair<WorkerInterface, ProcessClass>> workers) {
return latestEventOnWorkers( workers, "" );
}
static Optional<std::pair<WorkerInterface, ProcessClass>> getWorker(std::vector<std::pair<WorkerInterface, ProcessClass>> const& workers, NetworkAddress const& address) {
try {
for (int c = 0; c < workers.size(); c++)
if (address == workers[c].first.address())
return workers[c];
return Optional<std::pair<WorkerInterface, ProcessClass>>();
}
catch (Error &e){
return Optional<std::pair<WorkerInterface, ProcessClass>>();
}
}
static Optional<std::pair<WorkerInterface, ProcessClass>> getWorker(std::map<NetworkAddress, std::pair<WorkerInterface, ProcessClass>> const& workersMap, NetworkAddress const& address) {
auto itr = workersMap.find(address);
if(itr == workersMap.end()) {
return Optional<std::pair<WorkerInterface, ProcessClass>>();
}
return itr->second;
}
class StatusCounter {
public:
StatusCounter(double hz=0.0, double roughness=0.0, int64_t counter=0) : _hz(hz), _roughness(roughness), _counter(counter) {}
StatusCounter(const std::string& parsableText) {
parseText(parsableText);
}
StatusCounter& parseText(const std::string& parsableText) {
sscanf(parsableText.c_str(), "%lf %lf %lld", &_hz, &_roughness, &_counter);
return *this;
}
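// Merge another sample into this counter: rates and counts add, while roughness
// becomes a rate-weighted average. E.g. merging {hz=10, roughness=2} with
// {hz=30, roughness=4} yields hz=40, roughness=(2*10 + 4*30)/40 = 3.5.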
StatusCounter& updateValues(const StatusCounter& statusCounter) {
double hzNew = _hz + statusCounter._hz;
double roughnessNew = (_hz + statusCounter._hz) ? (_roughness*_hz + statusCounter._roughness*statusCounter._hz) / (_hz + statusCounter._hz) : 0.0;
int64_t counterNew = _counter + statusCounter._counter;
_hz = hzNew;
_roughness = roughnessNew;
_counter = counterNew;
return *this;
}
JsonString getStatus() const {
JsonString statusObject;
statusObject["hz"] = _hz;
statusObject["roughness"] = _roughness;
statusObject["counter"] = _counter;
return statusObject;
}
protected:
double _hz;
double _roughness;
int64_t _counter;
};
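// The parsers below use sscanf's %n conversion to count consumed characters. A
// strict parse requires the entire string to be numeric; a permissive parse
// accepts trailing text (e.g. "1.5 xyz" parses as 1.5).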
static double parseDouble(std::string const& s, bool permissive = false) {
double d = 0;
int consumed = 0;
int r = sscanf(s.c_str(), "%lf%n", &d, &consumed);
if (r == 1 && (consumed == s.size() || permissive))
return d;
throw attribute_not_found();
}
static int parseInt(std::string const& s, bool permissive = false) {
long long int iLong = 0;
int consumed = 0;
int r = sscanf(s.c_str(), "%lld%n", &iLong, &consumed);
if (r == 1 && (consumed == s.size() || permissive)){
if (std::numeric_limits<int>::min() <= iLong && iLong <= std::numeric_limits<int>::max())
return (int)iLong; // Downcast definitely safe
else
throw attribute_too_large();
}
throw attribute_not_found();
}
static int64_t parseInt64(std::string const& s, bool permissive = false) {
long long int i = 0;
int consumed = 0;
int r = sscanf(s.c_str(), "%lld%n", &i, &consumed);
if (r == 1 && (consumed == s.size() || permissive))
return i;
throw attribute_not_found();
}
static JsonString getLocalityInfo(const LocalityData& locality) {
JsonString localityObj;
for(auto it = locality._data.begin(); it != locality._data.end(); it++) {
if(it->second.present()) {
localityObj[it->first.toString()] = it->second.get().toString();
}
else {
localityObj[it->first.toString()] = JsonString();
}
}
return localityObj;
}
static JsonString getError(const TraceEventFields& errorFields) {
JsonString statusObj;
try {
if (errorFields.size()) {
double time = atof(errorFields.getValue("Time").c_str());
statusObj["time"] = time;
statusObj["raw_log_message"] = errorFields.toString();
std::string type = errorFields.getValue("Type");
statusObj["type"] = type;
std::string description = type;
std::string errorName;
if(errorFields.tryGetValue("Error", errorName)) {
statusObj["name"] = errorName;
description += ": " + errorName;
}
else
statusObj["name"] = "process_error";
struct tm* timeinfo;
time_t t = (time_t)time;
timeinfo = localtime(&t);
char buffer[128];
strftime(buffer, 128, "%c", timeinfo);
description += " at " + std::string(buffer);
statusObj["description"] = description;
}
}
catch (Error &e){
TraceEvent(SevError, "StatusGetErrorError").error(e).detail("RawError", errorFields.toString());
}
return statusObj;
}
static JsonString machineStatusFetcher(WorkerEvents mMetrics, vector<std::pair<WorkerInterface, ProcessClass>> workers, Optional<DatabaseConfiguration> configuration, std::set<std::string> *incomplete_reasons) {
JsonString machineMap;
double metric;
int failed = 0;
// map from machine networkAddress to datacenter ID
std::map<NetworkAddress, std::string> dcIds;
std::map<NetworkAddress, LocalityData> locality;
std::map<std::string, bool> notExcludedMap;
std::map<std::string, int32_t> workerContribMap;
std::map<std::string, JsonString> machineJsonMap;
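// These maps accumulate per-machine rollups, keyed by machine ID, while
// iterating over per-process metrics; they are merged into machineMap below.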
for (auto worker : workers){
locality[worker.first.address()] = worker.first.locality;
if (worker.first.locality.dcId().present())
dcIds[worker.first.address()] = worker.first.locality.dcId().get().printable();
}
for(auto it = mMetrics.begin(); it != mMetrics.end(); it++) {
if (!it->second.size()){
continue;
}
JsonString statusObj; // Represents the status for a machine
const TraceEventFields& event = it->second;
try {
std::string address = toIPString(it->first.ip);
// We will use the "physical" calculated machine ID here to limit exposure to machineID repurposing
std::string machineId = event.getValue("MachineID");
// If this machine ID does not already exist in the machineMap, add it
if (!machineMap.isPresent(machineId)) {
statusObj["machine_id"] = machineId;
if (dcIds.count(it->first)){
statusObj["datacenter_id"] = dcIds[it->first];
}
if(locality.count(it->first)) {
statusObj["locality"] = getLocalityInfo(locality[it->first]);
}
statusObj["address"] = address;
JsonString memoryObj;
metric = parseDouble(event.getValue("TotalMemory"));
memoryObj["total_bytes"] = metric;
metric = parseDouble(event.getValue("CommittedMemory"));
memoryObj["committed_bytes"] = metric;
metric = parseDouble(event.getValue("AvailableMemory"));
memoryObj["free_bytes"] = metric;
statusObj["memory"] = memoryObj;
JsonString cpuObj;
metric = parseDouble(event.getValue("CPUSeconds"));
double cpu_seconds = metric;
metric = parseDouble(event.getValue("Elapsed"));
double elapsed = metric;
if (elapsed > 0){
cpuObj["logical_core_utilization"] = std::max(0.0, std::min(cpu_seconds / elapsed, 1.0));
}
statusObj["cpu"] = cpuObj;
JsonString networkObj;
metric = parseDouble(event.getValue("MbpsSent"));
JsonString megabits_sent;
megabits_sent["hz"] = metric;
networkObj["megabits_sent"] = megabits_sent;
metric = parseDouble(event.getValue("MbpsReceived"));
JsonString megabits_received;
megabits_received["hz"] = metric;
networkObj["megabits_received"] = megabits_received;
metric = parseDouble(event.getValue("RetransSegs"));
JsonString retransSegsObj;
if (elapsed > 0){
retransSegsObj["hz"] = metric / elapsed;
}
networkObj["tcp_segments_retransmitted"] = retransSegsObj;
statusObj["network"] = networkObj;
if (configuration.present()){
notExcludedMap[machineId] = true; // Will be set to false below if this or any later process is not excluded
}
workerContribMap[machineId] = 0;
machineJsonMap[machineId] = statusObj;
}
if (configuration.present() && !configuration.get().isExcludedServer(it->first))
notExcludedMap[machineId] = false;
workerContribMap[machineId] ++;
}
catch (Error& e) {
++failed;
}
}
// Add the status json for each machine with tracked values
for (auto mapPair : machineJsonMap) {
auto& machineId = mapPair.first;
machineJsonMap[machineId]["excluded"] = notExcludedMap[machineId];
machineJsonMap[machineId]["contributing_workers"] = workerContribMap[machineId];
machineMap[machineId] = machineJsonMap[machineId];
}
if(failed > 0)
incomplete_reasons->insert("Cannot retrieve all machine status information.");
return machineMap;
}
struct MachineMemoryInfo {
double memoryUsage;
double numProcesses;
MachineMemoryInfo() : memoryUsage(0), numProcesses(0) {}
bool valid() { return memoryUsage >= 0; }
void invalidate() { memoryUsage = -1; }
};
struct RolesInfo {
std::multimap<NetworkAddress, JsonString> roles;
JsonString& addRole( NetworkAddress address, std::string const& role, UID id) {
JsonString obj;
obj["id"] = id.shortString();
obj["role"] = role;
return roles.insert( std::make_pair(address, obj ))->second;
}
JsonString& addRole(std::string const& role, StorageServerInterface& iface, TraceEventFields const& metrics, Version maxTLogVersion, double* pDataLagSeconds) {
JsonString obj;
double dataLagSeconds = -1.0;
obj["id"] = iface.id().shortString();
obj["role"] = role;
try {
obj["stored_bytes"] = parseInt64(metrics.getValue("BytesStored"));
obj["kvstore_used_bytes"] = parseInt64(metrics.getValue("KvstoreBytesUsed"));
obj["kvstore_free_bytes"] = parseInt64(metrics.getValue("KvstoreBytesFree"));
obj["kvstore_available_bytes"] = parseInt64(metrics.getValue("KvstoreBytesAvailable"));
obj["kvstore_total_bytes"] = parseInt64(metrics.getValue("KvstoreBytesTotal"));
obj["input_bytes"] = StatusCounter(metrics.getValue("BytesInput")).getStatus();
obj["durable_bytes"] = StatusCounter(metrics.getValue("BytesDurable")).getStatus();
obj["query_queue_max"] = parseInt(metrics.getValue("QueryQueueMax"));
obj["finished_queries"] = StatusCounter(metrics.getValue("FinishedQueries")).getStatus();
Version version = parseInt64(metrics.getValue("Version"));
obj["data_version"] = version;
int64_t versionLag = parseInt64(metrics.getValue("VersionLag"));
if(maxTLogVersion > 0) {
// It's possible that the storage server hasn't talked to the logs recently, in which case it may not be aware of how far behind it is.
// To account for that, we also compute the version difference between each storage server and the tlog with the largest version.
//
// Because this data is only logged periodically, this difference will likely be an overestimate for the lag. We subtract off the logging interval
// in order to make this estimate a bounded underestimate instead.
versionLag = std::max<int64_t>(versionLag, maxTLogVersion - version - SERVER_KNOBS->STORAGE_LOGGING_DELAY * SERVER_KNOBS->VERSIONS_PER_SECOND);
}
JsonString dataLag;
dataLag["versions"] = versionLag;
dataLagSeconds = versionLag / (double)SERVER_KNOBS->VERSIONS_PER_SECOND;
dataLag["seconds"] = dataLagSeconds;
obj["data_lag"] = dataLag;
} catch (Error& e) {
if(e.code() != error_code_attribute_not_found)
throw e;
}
if (pDataLagSeconds)
*pDataLagSeconds = dataLagSeconds;
return roles.insert( std::make_pair(iface.address(), obj ))->second;
}
JsonString& addRole(std::string const& role, TLogInterface& iface, TraceEventFields const& metrics, Version* pMetricVersion) {
JsonString obj;
Version metricVersion = 0;
obj["id"] = iface.id().shortString();
obj["role"] = role;
try {
obj["kvstore_used_bytes"] = parseInt64(metrics.getValue("KvstoreBytesUsed"));
obj["kvstore_free_bytes"] = parseInt64(metrics.getValue("KvstoreBytesFree"));
obj["kvstore_available_bytes"] = parseInt64(metrics.getValue("KvstoreBytesAvailable"));
obj["kvstore_total_bytes"] = parseInt64(metrics.getValue("KvstoreBytesTotal"));
obj["queue_disk_used_bytes"] = parseInt64(metrics.getValue("QueueDiskBytesUsed"));
obj["queue_disk_free_bytes"] = parseInt64(metrics.getValue("QueueDiskBytesFree"));
obj["queue_disk_available_bytes"] = parseInt64(metrics.getValue("QueueDiskBytesAvailable"));
obj["queue_disk_total_bytes"] = parseInt64(metrics.getValue("QueueDiskBytesTotal"));
obj["input_bytes"] = StatusCounter(metrics.getValue("BytesInput")).getStatus();
obj["durable_bytes"] = StatusCounter(metrics.getValue("BytesDurable")).getStatus();
metricVersion = parseInt64(metrics.getValue("Version"));
obj["data_version"] = metricVersion;
} catch (Error& e) {
if(e.code() != error_code_attribute_not_found)
throw e;
}
if (pMetricVersion)
*pMetricVersion = metricVersion;
return roles.insert( std::make_pair(iface.address(), obj ))->second;
}
template <class InterfaceType>
JsonString& addRole(std::string const& role, InterfaceType& iface) {
return addRole(iface.address(), role, iface.id());
}
JsonStringArray getStatusForAddress( NetworkAddress a ) {
JsonStringArray v;
auto it = roles.lower_bound(a);
while (it != roles.end() && it->first == a) {
v.push_back(it->second);
++it;
}
return v;
}
};
ACTOR static Future<JsonString> processStatusFetcher(
Reference<AsyncVar<struct ServerDBInfo>> db,
std::vector<std::pair<WorkerInterface, ProcessClass>> workers,
WorkerEvents pMetrics,
WorkerEvents mMetrics,
WorkerEvents errors,
WorkerEvents traceFileOpenErrors,
WorkerEvents programStarts,
std::map<std::string, JsonString> processIssues,
vector<std::pair<StorageServerInterface, TraceEventFields>> storageServers,
vector<std::pair<TLogInterface, TraceEventFields>> tLogs,
Database cx,
Optional<DatabaseConfiguration> configuration,
std::set<std::string> *incomplete_reasons) {
// Array to hold one entry for each process
state JsonString processMap;
state double metric;
// construct a map from a process address to a status object containing a trace file open error
// this is later added to the messages subsection
state std::map<std::string, JsonString> tracefileOpenErrorMap;
state WorkerEvents::iterator traceFileErrorsItr;
for(traceFileErrorsItr = traceFileOpenErrors.begin(); traceFileErrorsItr != traceFileOpenErrors.end(); ++traceFileErrorsItr) {
Void _ = wait(yield());
if (traceFileErrorsItr->second.size()){
try {
// We have event fields; parse them into a message object describing the trace file open error
const TraceEventFields& event = traceFileErrorsItr->second;
std::string fileName = event.getValue("Filename");
JsonString msgObj = JsonString::makeMessage("file_open_error", format("Could not open file '%s' (%s).", fileName.c_str(), event.getValue("Error").c_str()).c_str());
msgObj["file_name"] = fileName;
// Map the address of the worker to the error message object
tracefileOpenErrorMap[traceFileErrorsItr->first.toString()] = msgObj;
}
catch(Error &e) {
incomplete_reasons->insert("file_open_error details could not be retrieved");
}
}
}
state std::map<Optional<Standalone<StringRef>>, MachineMemoryInfo> machineMemoryUsage;
state std::vector<std::pair<WorkerInterface, ProcessClass>>::iterator workerItr;
for(workerItr = workers.begin(); workerItr != workers.end(); ++workerItr) {
Void _ = wait(yield());
state std::map<Optional<Standalone<StringRef>>, MachineMemoryInfo>::iterator memInfo = machineMemoryUsage.insert(std::make_pair(workerItr->first.locality.machineId(), MachineMemoryInfo())).first;
try {
ASSERT(pMetrics.count(workerItr->first.address()));
const TraceEventFields& processMetrics = pMetrics[workerItr->first.address()];
if(memInfo->second.valid()) {
if(processMetrics.size() > 0) {
memInfo->second.memoryUsage += parseDouble(processMetrics.getValue("Memory"));
++memInfo->second.numProcesses;
}
else
memInfo->second.invalidate();
}
}
catch(Error &e) {
memInfo->second.invalidate();
}
}
state RolesInfo roles;
roles.addRole("master", db->get().master);
roles.addRole("cluster_controller", db->get().clusterInterface.clientInterface);
state Reference<ProxyInfo> proxies = cx->getMasterProxies();
if (proxies) {
state int proxyIndex;
for(proxyIndex = 0; proxyIndex < proxies->size(); proxyIndex++) {
roles.addRole( "proxy", proxies->getInterface(proxyIndex) );
Void _ = wait(yield());
}
}
state std::vector<std::pair<TLogInterface, TraceEventFields>>::iterator log;
state Version maxTLogVersion = 0;
state Version tLogVersion = 0;
// Get largest TLog version
for(log = tLogs.begin(); log != tLogs.end(); ++log) {
JsonString const& roleStatus = roles.addRole( "log", log->first, log->second, &tLogVersion );
if (roleStatus.isPresent("data_version")) {
maxTLogVersion = std::max(maxTLogVersion, tLogVersion);
}
Void _ = wait(yield());
}
state std::vector<std::pair<StorageServerInterface, TraceEventFields>>::iterator ss;
state std::map<NetworkAddress, double> ssLag;
state double lagSeconds;
for(ss = storageServers.begin(); ss != storageServers.end(); ++ss) {
JsonString const& roleStatus = roles.addRole( "storage", ss->first, ss->second, maxTLogVersion, &lagSeconds );
if (lagSeconds != -1.0) {
ssLag[ss->first.address()] = lagSeconds;
}
Void _ = wait(yield());
}
state std::vector<ResolverInterface>::const_iterator res;
state std::vector<ResolverInterface> resolvers = db->get().resolvers;
for(res = resolvers.begin(); res != resolvers.end(); ++res) {
roles.addRole( "resolver", *res );
Void _ = wait(yield());
}
for(workerItr = workers.begin(); workerItr != workers.end(); ++workerItr) {
Void _ = wait(yield());
state JsonString statusObj;
try {
ASSERT(pMetrics.count(workerItr->first.address()));
NetworkAddress address = workerItr->first.address();
const TraceEventFields& event = pMetrics[workerItr->first.address()];
statusObj["address"] = address.toString();
JsonString memoryObj;
if (event.size() > 0) {
std::string zoneID = event.getValue("ZoneID");
statusObj["fault_domain"] = zoneID;
std::string MachineID = event.getValue("MachineID");
statusObj["machine_id"] = MachineID;
statusObj["locality"] = getLocalityInfo(workerItr->first.locality);
statusObj["uptime_seconds"] = parseDouble(event.getValue("UptimeSeconds"));
metric = parseDouble(event.getValue("CPUSeconds"));
double cpu_seconds = metric;
// rates are calculated over the last elapsed seconds
metric = parseDouble(event.getValue("Elapsed"));
double elapsed = metric;
metric = parseDouble(event.getValue("DiskIdleSeconds"));
double diskIdleSeconds = metric;
metric = parseDouble(event.getValue("DiskReads"));
double diskReads = metric;
metric = parseDouble(event.getValue("DiskWrites"));
double diskWrites = metric;
uint64_t diskReadsCount = parseInt64(event.getValue("DiskReadsCount"));
uint64_t diskWritesCount = parseInt64(event.getValue("DiskWritesCount"));
metric = parseDouble(event.getValue("DiskWriteSectors"));
double diskWriteSectors = metric;
metric = parseDouble(event.getValue("DiskReadSectors"));
double diskReadSectors = metric;
JsonString diskObj;
if (elapsed > 0){
JsonString cpuObj;
cpuObj["usage_cores"] = std::max(0.0, cpu_seconds / elapsed);
statusObj["cpu"] = cpuObj;
diskObj["busy"] = std::max(0.0, std::min((elapsed - diskIdleSeconds) / elapsed, 1.0));
JsonString readsObj;
readsObj["counter"] = diskReadsCount;
if (elapsed > 0)
readsObj["hz"] = diskReads / elapsed;
readsObj["sectors"] = diskReadSectors;
JsonString writesObj;
writesObj["counter"] = diskWritesCount;
if (elapsed > 0)
writesObj["hz"] = diskWrites / elapsed;
writesObj["sectors"] = diskWriteSectors;
diskObj["reads"] = readsObj;
diskObj["writes"] = writesObj;
}
diskObj["total_bytes"] = parseInt64(event.getValue("DiskTotalBytes"));
diskObj["free_bytes"] = parseInt64(event.getValue("DiskFreeBytes"));
statusObj["disk"] = diskObj;
JsonString networkObj;
networkObj["current_connections"] = parseInt64(event.getValue("CurrentConnections"));
JsonString connections_established;
connections_established["hz"] = parseDouble(event.getValue("ConnectionsEstablished"));
networkObj["connections_established"] = connections_established;
JsonString connections_closed;
connections_closed["hz"] = parseDouble(event.getValue("ConnectionsClosed"));
networkObj["connections_closed"] = connections_closed;
JsonString connection_errors;
connection_errors["hz"] = parseDouble(event.getValue("ConnectionErrors"));
networkObj["connection_errors"] = connection_errors;
metric = parseDouble(event.getValue("MbpsSent"));
JsonString megabits_sent;
megabits_sent["hz"] = metric;
networkObj["megabits_sent"] = megabits_sent;
metric = parseDouble(event.getValue("MbpsReceived"));
JsonString megabits_received;
megabits_received["hz"] = metric;
networkObj["megabits_received"] = megabits_received;
statusObj["network"] = networkObj;
metric = parseDouble(event.getValue("Memory"));
memoryObj["used_bytes"] = metric;
metric = parseDouble(event.getValue("UnusedAllocatedMemory"));
memoryObj["unused_allocated_memory"] = metric;
}
if (programStarts.count(address)) {
auto const& psxml = programStarts.at(address);
if(psxml.size() > 0) {
int64_t memLimit = parseInt64(psxml.getValue("MemoryLimit"));
memoryObj["limit_bytes"] = memLimit;
std::string version;
if (psxml.tryGetValue("Version", version)) {
statusObj["version"] = version;
}
std::string commandLine;
if (psxml.tryGetValue("CommandLine", commandLine)) {
statusObj["command_line"] = commandLine;
}
}
}
// if this process address is in the machine metrics
if (mMetrics.count(address) && mMetrics[address].size()){
double availableMemory;
availableMemory = parseDouble(mMetrics[address].getValue("AvailableMemory"));
auto machineMemInfo = machineMemoryUsage[workerItr->first.locality.machineId()];
if (machineMemInfo.valid()) {
ASSERT(machineMemInfo.numProcesses > 0);
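// Estimate this process's share of available machine memory: memory the machine
// reports as free plus memory already used by monitored processes, divided
// evenly among those processes.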
int64_t memory = (availableMemory + machineMemInfo.memoryUsage) / machineMemInfo.numProcesses;
memoryObj["available_bytes"] = std::max<int64_t>(memory, 0);
}
}
statusObj["memory"] = memoryObj;
JsonStringArray messages;
if (errors.count(address) && errors[address].size()) {
// returns status object with type and time of error
messages.push_back(getError(errors.at(address)));
}
// Use the string form of the address so that other fields of a NetworkAddress are not compared
std::string strAddress = address.toString();
// If this process has a process issue, identified by strAddress, then add it to messages array
if (processIssues.count(strAddress)){
messages.push_back(processIssues[strAddress]);
}
// If this process had a trace file open error, identified by strAddress, then add it to messages array
if (tracefileOpenErrorMap.count(strAddress)){
messages.push_back(tracefileOpenErrorMap[strAddress]);
}
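// Note: operator[] default-constructs a zero entry for addresses with no
// recorded storage lag, so the check below is safe for non-storage processes.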
if(ssLag[address] >= 60) {
messages.push_back(JsonString::makeMessage("storage_server_lagging", format("Storage server lagging by %ld seconds.", (int64_t)ssLag[address]).c_str()));
}
// Store the message array into the status object that represents the worker process
statusObj["messages"] = messages;
// Get roles for the worker's address as an array of objects
statusObj["roles"] = roles.getStatusForAddress(address);
if (configuration.present()){
statusObj["excluded"] = configuration.get().isExcludedServer(address);
}
statusObj["class_type"] = workerItr->second.toString();
statusObj["class_source"] = workerItr->second.sourceString();
}
catch (Error& e){
// Something strange occurred; the process list is incomplete, but whatever was built so far will be returned.
incomplete_reasons->insert("Cannot retrieve all process status information.");
}
processMap[printable(workerItr->first.locality.processId())] = statusObj;
}
return processMap;
}
static JsonString clientStatusFetcher(ClientVersionMap clientVersionMap, std::map<NetworkAddress, std::string> traceLogGroupMap) {
JsonString clientStatus;
clientStatus["count"] = (int64_t)clientVersionMap.size();
std::map<ClientVersionRef, std::set<NetworkAddress>> clientVersions;
for(auto client : clientVersionMap) {
for(auto ver : client.second) {
clientVersions[ver].insert(client.first);
}
}
JsonStringArray versionsArray = JsonStringArray();
for(auto cv : clientVersions) {
JsonString ver;
ver["count"] = (int64_t)cv.second.size();
ver["client_version"] = cv.first.clientVersion.toString();
ver["protocol_version"] = cv.first.protocolVersion.toString();
ver["source_version"] = cv.first.sourceVersion.toString();
JsonStringArray clients = JsonStringArray();
for(auto client : cv.second) {
JsonString cli;
cli["address"] = client.toString();
cli["log_group"] = traceLogGroupMap[client];
clients.push_back(cli);
}
ver["connected_clients"] = clients;
versionsArray.push_back(ver);
}
if(versionsArray.size() > 0) {
clientStatus["supported_versions"] = versionsArray;
}
return clientStatus;
}
ACTOR static Future<JsonString> recoveryStateStatusFetcher(std::pair<WorkerInterface, ProcessClass> mWorker, int workerCount, std::set<std::string> *incomplete_reasons, int* statusCode) {
state JsonString message;
try {
TraceEventFields md = wait( timeoutError(mWorker.first.eventLogRequest.getReply( EventLogRequest( LiteralStringRef("MasterRecoveryState") ) ), 1.0) );
state int mStatusCode = parseInt( md.getValue("StatusCode") );
if (mStatusCode < 0 || mStatusCode >= RecoveryStatus::END)
throw attribute_not_found();
message = JsonString::makeMessage(RecoveryStatus::names[mStatusCode], RecoveryStatus::descriptions[mStatusCode]);
*statusCode = mStatusCode;
// Add additional metadata for certain statuses
if (mStatusCode == RecoveryStatus::recruiting_transaction_servers) {
int requiredLogs = atoi( md.getValue("RequiredTLogs").c_str() );
int requiredProxies = atoi( md.getValue("RequiredProxies").c_str() );
int requiredResolvers = atoi( md.getValue("RequiredResolvers").c_str() );
//int requiredProcesses = std::max(requiredLogs, std::max(requiredResolvers, requiredProxies));
//int requiredMachines = std::max(requiredLogs, 1);
message["required_logs"] = requiredLogs;
message["required_proxies"] = requiredProxies;
message["required_resolvers"] = requiredResolvers;
} else if (mStatusCode == RecoveryStatus::locking_old_transaction_servers) {
message["missing_logs"] = md.getValue("MissingIDs").c_str();
}
// TODO: time_in_recovery: 0.5
// time_in_state: 0.1
} catch (Error &e){
if (e.code() == error_code_actor_cancelled)
throw;
}
// If the recovery status name is not known, the status is incomplete
if (!message.isPresent("name"))
incomplete_reasons->insert("Recovery Status unavailable.");
return message;
}
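// Latency probes: doGrvProbe times acquiring a read version, doReadProbe times a
// single key read, and doCommitProbe times a self-conflicting commit. The read
// and commit probes wait on the GRV probe first so that read version acquisition
// is not double-counted in their measurements.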
ACTOR static Future<double> doGrvProbe(Transaction *tr, Optional<FDBTransactionOptions::Option> priority = Optional<FDBTransactionOptions::Option>()) {
state double start = timer_monotonic();
loop {
try {
tr->setOption(FDBTransactionOptions::LOCK_AWARE);
if(priority.present()) {
tr->setOption(priority.get());
}
Version _ = wait(tr->getReadVersion());
return timer_monotonic() - start;
}
catch(Error &e) {
Void _ = wait(tr->onError(e));
}
}
}
ACTOR static Future<double> doReadProbe(Future<double> grvProbe, Transaction *tr) {
ErrorOr<double> grv = wait(errorOr(grvProbe));
if(grv.isError()) {
throw grv.getError();
}
state double start = timer_monotonic();
loop {
tr->setOption(FDBTransactionOptions::LOCK_AWARE);
try {
Optional<Standalone<StringRef> > _ = wait(tr->get(LiteralStringRef("\xff/StatusJsonTestKey62793")));
return timer_monotonic() - start;
}
catch(Error &e) {
Void _ = wait(tr->onError(e));
tr->setOption(FDBTransactionOptions::PRIORITY_SYSTEM_IMMEDIATE);
}
}
}
ACTOR static Future<double> doCommitProbe(Future<double> grvProbe, Transaction *sourceTr, Transaction *tr) {
ErrorOr<double> grv = wait(errorOr(grvProbe));
if(grv.isError()) {
throw grv.getError();
}
ASSERT(sourceTr->getReadVersion().isReady());
tr->setVersion(sourceTr->getReadVersion().get());
state double start = timer_monotonic();
loop {
try {
tr->setOption(FDBTransactionOptions::LOCK_AWARE);
tr->setOption(FDBTransactionOptions::PRIORITY_SYSTEM_IMMEDIATE);
tr->makeSelfConflicting();
Void _ = wait(tr->commit());
return timer_monotonic() - start;
}
catch(Error &e) {
Void _ = wait(tr->onError(e));
}
}
}
ACTOR static Future<Void> doProbe(Future<double> probe, int timeoutSeconds, const char* prefix, const char* description, JsonString *probeObj, JsonStringArray *messages, std::set<std::string> *incomplete_reasons) {
choose {
when(ErrorOr<double> result = wait(errorOr(probe))) {
if(result.isError()) {
incomplete_reasons->insert(format("Unable to retrieve latency probe information (%s: %s).", description, result.getError().what()));
}
else {
(*probeObj)[format("%s_seconds", prefix).c_str()] = result.get();
}
}
when(Void _ = wait(delay(timeoutSeconds))) {
messages->push_back(JsonString::makeMessage(format("%s_probe_timeout", prefix).c_str(), format("Unable to %s after %d seconds.", description, timeoutSeconds).c_str()));
}
}
return Void();
}
ACTOR static Future<JsonString> latencyProbeFetcher(Database cx, JsonStringArray *messages, std::set<std::string> *incomplete_reasons) {
state Transaction trImmediate(cx);
state Transaction trDefault(cx);
state Transaction trBatch(cx);
state Transaction trWrite(cx);
state JsonString statusObj;
try {
Future<double> immediateGrvProbe = doGrvProbe(&trImmediate, FDBTransactionOptions::PRIORITY_SYSTEM_IMMEDIATE);
Future<double> defaultGrvProbe = doGrvProbe(&trDefault);
Future<double> batchGrvProbe = doGrvProbe(&trBatch, FDBTransactionOptions::PRIORITY_BATCH);
Future<double> readProbe = doReadProbe(immediateGrvProbe, &trImmediate);
Future<double> commitProbe = doCommitProbe(immediateGrvProbe, &trImmediate, &trWrite);
int timeoutSeconds = 5;
std::vector<Future<Void>> probes;
probes.push_back(doProbe(immediateGrvProbe, timeoutSeconds, "immediate_priority_transaction_start", "start immediate priority transaction", &statusObj, messages, incomplete_reasons));
probes.push_back(doProbe(defaultGrvProbe, timeoutSeconds, "transaction_start", "start default priority transaction", &statusObj, messages, incomplete_reasons));
probes.push_back(doProbe(batchGrvProbe, timeoutSeconds, "batch_priority_transaction_start", "start batch priority transaction", &statusObj, messages, incomplete_reasons));
probes.push_back(doProbe(readProbe, timeoutSeconds, "read", "read", &statusObj, messages, incomplete_reasons));
probes.push_back(doProbe(commitProbe, timeoutSeconds, "commit", "commit", &statusObj, messages, incomplete_reasons));
Void _ = wait(waitForAll(probes));
}
catch (Error &e) {
incomplete_reasons->insert(format("Unable to retrieve latency probe information (%s).", e.what()));
}
return statusObj;
}
ACTOR static Future<std::pair<Optional<DatabaseConfiguration>,Optional<bool>>> loadConfiguration(Database cx, JsonStringArray *messages, std::set<std::string> *status_incomplete_reasons){
state Optional<DatabaseConfiguration> result;
state Optional<bool> fullReplication;
state Transaction tr(cx);
state Future<Void> getConfTimeout = delay(5.0);
loop{
tr.setOption(FDBTransactionOptions::PRIORITY_SYSTEM_IMMEDIATE);
tr.setOption(FDBTransactionOptions::CAUSAL_READ_RISKY);
try {
choose{
when(Standalone<RangeResultRef> res = wait(tr.getRange(configKeys, SERVER_KNOBS->CONFIGURATION_ROWS_TO_FETCH))) {
DatabaseConfiguration configuration;
if (res.size() == SERVER_KNOBS->CONFIGURATION_ROWS_TO_FETCH) {
status_incomplete_reasons->insert("Too many configuration parameters set.");
}
else {
configuration.fromKeyValues((VectorRef<KeyValueRef>)res);
}
result = configuration;
}
when(Void _ = wait(getConfTimeout)) {
if(!result.present()) {
messages->push_back(JsonString::makeMessage("unreadable_configuration", "Unable to read database configuration."));
} else {
messages->push_back(JsonString::makeMessage("full_replication_timeout", "Unable to read datacenter replicas."));
}
break;
}
}
ASSERT(result.present());
state std::vector<Future<Optional<Value>>> replicasFutures;
for(auto& region : result.get().regions) {
replicasFutures.push_back(tr.get(datacenterReplicasKeyFor(region.dcId)));
}
choose {
when( Void _ = wait( waitForAll(replicasFutures) ) ) {
int unreplicated = 0;
for(int i = 0; i < result.get().regions.size(); i++) {
if( !replicasFutures[i].get().present() || decodeDatacenterReplicasValue(replicasFutures[i].get().get()) < result.get().storageTeamSize ) {
unreplicated++;
}
}
fullReplication = (!unreplicated || (result.get().usableRegions == 1 && unreplicated < result.get().regions.size()));
}
when(Void _ = wait(getConfTimeout)) {
messages->push_back(JsonString::makeMessage("full_replication_timeout", "Unable to read datacenter replicas."));
}
}
break;
}
catch (Error &e) {
Void _ = wait(tr.onError(e));
}
}
return std::make_pair(result, fullReplication);
}
static JsonString configurationFetcher(Optional<DatabaseConfiguration> conf, ServerCoordinators coordinators, std::set<std::string> *incomplete_reasons) {
JsonString statusObj;
try {
if(conf.present()) {
DatabaseConfiguration configuration = conf.get();
statusObj = configuration.toJSON().toJsonString();
JsonStringArray excludedServersArr;
std::set<AddressExclusion> excludedServers = configuration.getExcludedServers();
for (std::set<AddressExclusion>::iterator it = excludedServers.begin(); it != excludedServers.end(); it++) {
JsonString statusObj;
statusObj["address"] = it->toString();
excludedServersArr.push_back(statusObj);
}
statusObj["excluded_servers"] = excludedServersArr;
}
vector< ClientLeaderRegInterface > coordinatorLeaderServers = coordinators.clientLeaderServers;
int count = coordinatorLeaderServers.size();
statusObj["coordinators_count"] = count;
}
catch (Error &e){
incomplete_reasons->insert("Could not retrieve all configuration status information.");
}
return statusObj;
}
ACTOR static Future<JsonString> dataStatusFetcher(std::pair<WorkerInterface, ProcessClass> mWorker, std::string dbName, int *minReplicasRemaining) {
state JsonString statusObjData;
try {
std::vector<Future<TraceEventFields>> futures;
// TODO: Should this be serial?
futures.push_back(timeoutError(mWorker.first.eventLogRequest.getReply(EventLogRequest(StringRef(dbName + "/DDTrackerStarting"))), 1.0));
futures.push_back(timeoutError(mWorker.first.eventLogRequest.getReply(EventLogRequest(StringRef(dbName + "/DDTrackerStats"))), 1.0));
futures.push_back(timeoutError(mWorker.first.eventLogRequest.getReply(EventLogRequest(StringRef(dbName + "/MovingData"))), 1.0));
futures.push_back(timeoutError(mWorker.first.eventLogRequest.getReply(EventLogRequest(LiteralStringRef("TotalDataInFlight"))), 1.0));
futures.push_back(timeoutError(mWorker.first.eventLogRequest.getReply(EventLogRequest(LiteralStringRef("TotalDataInFlightRemote"))), 1.0));
std::vector<TraceEventFields> dataInfo = wait(getAll(futures));
TraceEventFields startingStats = dataInfo[0];
TraceEventFields dataStats = dataInfo[1];
if (startingStats.size() && startingStats.getValue("State") != "Active") {
JsonString stateSectionObj;
stateSectionObj["name"] = "initializing";
stateSectionObj["description"] = "(Re)initializing automatic data distribution";
statusObjData["state"] = stateSectionObj;
return statusObjData;
}
TraceEventFields md = dataInfo[2];
// If we have a MovingData message, parse it.
if (md.size())
{
int64_t partitionsInQueue = parseInt64(md.getValue("InQueue"));
int64_t partitionsInFlight = parseInt64(md.getValue("InFlight"));
int64_t averagePartitionSize = parseInt64(md.getValue("AverageShardSize"));
int64_t totalBytesWritten = parseInt64(md.getValue("BytesWritten"));
int highestPriority = parseInt(md.getValue("HighestPriority"));
if( averagePartitionSize >= 0 ) {
JsonString moving_data;
moving_data["in_queue_bytes"] = partitionsInQueue * averagePartitionSize;
moving_data["in_flight_bytes"] = partitionsInFlight * averagePartitionSize;
moving_data["total_written_bytes"] = totalBytesWritten;
moving_data["highest_priority"] = highestPriority;
// TODO: moving_data["rate_bytes"] = makeCounter(hz, c, r);
statusObjData["moving_data"] = moving_data;
statusObjData["average_partition_size_bytes"] = averagePartitionSize;
}
}
if (dataStats.size())
{
int64_t totalDBBytes = parseInt64(dataStats.getValue("TotalSizeBytes"));
statusObjData["total_kv_size_bytes"] = totalDBBytes;
int shards = parseInt(dataStats.getValue("Shards"));
statusObjData["partitions_count"] = shards;
}
JsonStringArray teamTrackers;
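// dataInfo[3] and dataInfo[4] hold the TotalDataInFlight events for the primary
// and remote regions respectively; emit one team_tracker entry for each present.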
for(int i = 0; i < 2; i++) {
TraceEventFields inFlight = dataInfo[3 + i];
if (!inFlight.size()) {
continue;
}
bool primary = parseInt(inFlight.getValue("Primary"));
int64_t totalDataInFlight = parseInt64(inFlight.getValue("TotalBytes"));
int unhealthyServers = parseInt(inFlight.getValue("UnhealthyServers"));
int highestPriority = parseInt(inFlight.getValue("HighestPriority"));
JsonString team_tracker;
team_tracker["primary"] = primary;
team_tracker["in_flight_bytes"] = totalDataInFlight;
team_tracker["unhealthy_servers"] = unhealthyServers;
JsonString stateSectionObj;
if (highestPriority >= PRIORITY_TEAM_0_LEFT) {
stateSectionObj["healthy"] = false;
stateSectionObj["name"] = "missing_data";
stateSectionObj["description"] = "No replicas remain of some data";
stateSectionObj["min_replicas_remaining"] = 0;
if(primary) {
*minReplicasRemaining = 0;
}
}
else if (highestPriority >= PRIORITY_TEAM_1_LEFT) {
stateSectionObj["healthy"] = false;
stateSectionObj["name"] = "healing";
stateSectionObj["description"] = "Only one replica remains of some data";
stateSectionObj["min_replicas_remaining"] = 1;
if(primary) {
*minReplicasRemaining = 1;
}
}
else if (highestPriority >= PRIORITY_TEAM_2_LEFT) {
stateSectionObj["healthy"] = false;
stateSectionObj["name"] = "healing";
stateSectionObj["description"] = "Only two replicas remain of some data";
stateSectionObj["min_replicas_remaining"] = 2;
if(primary) {
*minReplicasRemaining = 2;
}
}
else if (highestPriority >= PRIORITY_TEAM_UNHEALTHY) {
stateSectionObj["healthy"] = false;
stateSectionObj["name"] = "healing";
stateSectionObj["description"] = "Restoring replication factor";
}
else if (highestPriority >= PRIORITY_MERGE_SHARD) {
stateSectionObj["healthy"] = true;
stateSectionObj["name"] = "healthy_repartitioning";
stateSectionObj["description"] = "Repartitioning.";
}
else if (highestPriority >= PRIORITY_TEAM_CONTAINS_UNDESIRED_SERVER) {
stateSectionObj["healthy"] = true;
stateSectionObj["name"] = "healthy_removing_server";
stateSectionObj["description"] = "Removing storage server";
}
else if (highestPriority >= PRIORITY_REBALANCE_SHARD) {
stateSectionObj["healthy"] = true;
stateSectionObj["name"] = "healthy_rebalancing";
stateSectionObj["description"] = "Rebalancing";
}
else if (highestPriority >= 0) {
stateSectionObj["healthy"] = true;
stateSectionObj["name"] = "healthy";
}
if(!stateSectionObj.empty()) {
team_tracker["state"] = stateSectionObj;
teamTrackers.push_back(team_tracker);
if(primary) {
statusObjData["state"] = stateSectionObj;
}
}
}
statusObjData["team_trackers"] = teamTrackers;
}
catch (Error &e) {
if (e.code() == error_code_actor_cancelled)
throw;
// The most likely reason to be here is a timeout; either way, we have no idea whether the data state is
// healthy from the "cluster" perspective. From the client perspective it is not, but that is indicated elsewhere.
}
return statusObjData;
}
namespace std
{
template <>
struct hash<NetworkAddress>
{
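// A simple combination of IP and port; hash quality matters little for the
// small in-memory maps these keys feed.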
size_t operator()(const NetworkAddress& na) const
{
return (na.ip << 16) + na.port;
}
};
}
ACTOR template <class iface>
static Future<vector<std::pair<iface, TraceEventFields>>> getServerMetrics(vector<iface> servers, std::unordered_map<NetworkAddress, WorkerInterface> address_workers, std::string suffix) {
state vector<Future<Optional<TraceEventFields>>> futures;
for (auto s : servers) {
futures.push_back(latestEventOnWorker(address_workers[s.address()], s.id().toString() + suffix));
}
Void _ = wait(waitForAll(futures));
vector<std::pair<iface, TraceEventFields>> results;
for (int i = 0; i < servers.size(); i++) {
results.push_back(std::make_pair(servers[i], futures[i].get().present() ? futures[i].get().get() : TraceEventFields()));
}
return results;
}
ACTOR static Future<vector<std::pair<StorageServerInterface, TraceEventFields>>> getStorageServersAndMetrics(Database cx, std::unordered_map<NetworkAddress, WorkerInterface> address_workers) {
vector<StorageServerInterface> servers = wait(timeoutError(getStorageServers(cx, true), 5.0));
vector<std::pair<StorageServerInterface, TraceEventFields>> results = wait(getServerMetrics(servers, address_workers, "/StorageMetrics"));
return results;
}
ACTOR static Future<vector<std::pair<TLogInterface, TraceEventFields>>> getTLogsAndMetrics(Reference<AsyncVar<struct ServerDBInfo>> db, std::unordered_map<NetworkAddress, WorkerInterface> address_workers) {
vector<TLogInterface> servers = db->get().logSystemConfig.allPresentLogs();
vector<std::pair<TLogInterface, TraceEventFields>> results = wait(getServerMetrics(servers, address_workers, "/TLogMetrics"));
return results;
}
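// Counts the machines that could host an additional TLog beyond the current
// configuration's worst-case recruitment need (the larger of the log
// replication factor and the storage team size), taken per region when
// regions are configured.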
static int getExtraTLogEligibleMachines(vector<std::pair<WorkerInterface, ProcessClass>> workers, DatabaseConfiguration configuration) {
std::set<StringRef> allMachines;
std::map<Key,std::set<StringRef>> dcId_machine;
for(auto worker : workers) {
if(worker.second.machineClassFitness(ProcessClass::TLog) < ProcessClass::NeverAssign
&& !configuration.isExcludedServer(worker.first.address()))
{
allMachines.insert(worker.first.locality.zoneId().get());
if(worker.first.locality.dcId().present()) {
dcId_machine[worker.first.locality.dcId().get()].insert(worker.first.locality.zoneId().get());
}
}
}
if(configuration.regions.size() == 0) {
return allMachines.size() - std::max(configuration.tLogReplicationFactor, configuration.storageTeamSize);
}
int extraTlogEligibleMachines = std::numeric_limits<int>::max();
for(auto& region : configuration.regions) {
extraTlogEligibleMachines = std::min<int>( extraTlogEligibleMachines, dcId_machine[region.dcId].size() - std::max(configuration.remoteTLogReplicationFactor, std::max(configuration.tLogReplicationFactor, configuration.storageTeamSize) ) );
//FIXME: does not take into account fallback satellite policies
if(region.satelliteTLogReplicationFactor > 0) {
int totalSatelliteEligible = 0;
for(auto& sat : region.satellites) {
totalSatelliteEligible += dcId_machine[sat.dcId].size();
}
extraTlogEligibleMachines = std::min<int>( extraTlogEligibleMachines, totalSatelliteEligible - region.satelliteTLogReplicationFactor );
}
}
return extraTlogEligibleMachines;
}
ACTOR static Future<JsonString> workloadStatusFetcher(Reference<AsyncVar<struct ServerDBInfo>> db, vector<std::pair<WorkerInterface, ProcessClass>> workers, std::pair<WorkerInterface, ProcessClass> mWorker,
std::string dbName, JsonString *qos, JsonString *data_overlay, std::set<std::string> *incomplete_reasons, Future<ErrorOr<vector<std::pair<StorageServerInterface, TraceEventFields>>>> storageServerFuture)
{
state JsonString statusObj;
state JsonString operationsObj;
state JsonString bytesObj;
state JsonString keysObj;
// Writes and conflicts
try {
vector<Future<TraceEventFields>> proxyStatFutures;
std::map<NetworkAddress, std::pair<WorkerInterface, ProcessClass>> workersMap;
for (auto w : workers) {
workersMap[w.first.address()] = w;
}
for (auto &p : db->get().client.proxies) {
auto worker = getWorker(workersMap, p.address());
if (worker.present())
proxyStatFutures.push_back(timeoutError(worker.get().first.eventLogRequest.getReply(EventLogRequest(LiteralStringRef("ProxyMetrics"))), 1.0));
else
throw all_alternatives_failed(); // We need data from all proxies for this result to be trustworthy
}
vector<TraceEventFields> proxyStats = wait(getAll(proxyStatFutures));
StatusCounter mutations, mutationBytes, txnConflicts, txnStartOut, txnCommitOutSuccess;
for (auto &ps : proxyStats) {
mutations.updateValues( StatusCounter(ps.getValue("Mutations")) );
mutationBytes.updateValues( StatusCounter(ps.getValue("MutationBytes")) );
txnConflicts.updateValues( StatusCounter(ps.getValue("TxnConflicts")) );
txnStartOut.updateValues( StatusCounter(ps.getValue("TxnStartOut")) );
txnCommitOutSuccess.updateValues( StatusCounter(ps.getValue("TxnCommitOutSuccess")) );
}
operationsObj["writes"] = mutations.getStatus();
bytesObj["written"] = mutationBytes.getStatus();
JsonString transactions;
transactions["conflicted"] = txnConflicts.getStatus();
transactions["started"] = txnStartOut.getStatus();
transactions["committed"] = txnCommitOutSuccess.getStatus();
statusObj["transactions"] = transactions;
}
catch (Error& e) {
if (e.code() == error_code_actor_cancelled)
throw;
incomplete_reasons->insert("Unknown mutations, conflicts, and transactions state.");
}
// Ratekeeper metrics: transaction rate limits and performance-limiting factors
try {
TraceEventFields md = wait( timeoutError(mWorker.first.eventLogRequest.getReply( EventLogRequest(StringRef(dbName+"/RkUpdate") ) ), 1.0) );
double tpsLimit = parseDouble(md.getValue("TPSLimit"));
double transPerSec = parseDouble(md.getValue("ReleasedTPS"));
int ssCount = parseInt(md.getValue("StorageServers"));
int tlogCount = parseInt(md.getValue("TLogs"));
int64_t worstFreeSpaceStorageServer = parseInt64(md.getValue("WorstFreeSpaceStorageServer"));
int64_t worstFreeSpaceTLog = parseInt64(md.getValue("WorstFreeSpaceTLog"));
int64_t worstStorageServerQueue = parseInt64(md.getValue("WorstStorageServerQueue"));
int64_t limitingStorageServerQueue = parseInt64(md.getValue("LimitingStorageServerQueue"));
int64_t worstTLogQueue = parseInt64(md.getValue("WorstTLogQueue"));
int64_t totalDiskUsageBytes = parseInt64(md.getValue("TotalDiskUsageBytes"));
int64_t worstVersionLag = parseInt64(md.getValue("WorstStorageServerVersionLag"));
int64_t limitingVersionLag = parseInt64(md.getValue("LimitingStorageServerVersionLag"));
(*data_overlay)["total_disk_used_bytes"] = totalDiskUsageBytes;
if(ssCount > 0) {
(*data_overlay)["least_operating_space_bytes_storage_server"] = std::max(worstFreeSpaceStorageServer, (int64_t)0);
(*qos)["worst_queue_bytes_storage_server"] = worstStorageServerQueue;
(*qos)["limiting_queue_bytes_storage_server"] = limitingStorageServerQueue;
(*qos)["worst_version_lag_storage_server"] = worstVersionLag;
(*qos)["limiting_version_lag_storage_server"] = limitingVersionLag;
}
if(tlogCount > 0) {
(*data_overlay)["least_operating_space_bytes_log_server"] = std::max(worstFreeSpaceTLog, (int64_t)0);
(*qos)["worst_queue_bytes_log_server"] = worstTLogQueue;
}
(*qos)["transactions_per_second_limit"] = tpsLimit;
(*qos)["released_transactions_per_second"] = transPerSec;
int reason = parseInt(md.getValue("Reason"));
JsonString perfLimit;
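// Only report a limiting reason when released transactions are within 80% of
// the rate limit; otherwise the workload itself is the limiter.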
if (transPerSec > tpsLimit * 0.8) {
// If reason is known, set qos.performance_limited_by, otherwise omit
if (reason >= 0 && reason < limitReasonEnd) {
perfLimit = JsonString::makeMessage(limitReasonName[reason], limitReasonDesc[reason]);
std::string reason_server_id = md.getValue("ReasonServerID");
if (!reason_server_id.empty())
perfLimit["reason_server_id"] = reason_server_id;
}
}
else {
perfLimit = JsonString::makeMessage("workload", "The database is not being saturated by the workload.");
}
if(!perfLimit.empty()) {
perfLimit["reason_id"] = reason;
(*qos)["performance_limited_by"] = perfLimit;
}
} catch (Error &e){
if (e.code() == error_code_actor_cancelled)
throw;
incomplete_reasons->insert("Unknown performance state.");
}
// Reads
try {
ErrorOr<vector<std::pair<StorageServerInterface, TraceEventFields>>> storageServers = wait(storageServerFuture);
if(!storageServers.present()) {
throw storageServers.getError();
}
StatusCounter reads;
StatusCounter readKeys;
StatusCounter readBytes;
for(auto &ss : storageServers.get()) {
reads.updateValues( StatusCounter(ss.second.getValue("FinishedQueries")));
readKeys.updateValues( StatusCounter(ss.second.getValue("RowsQueried")));
readBytes.updateValues( StatusCounter(ss.second.getValue("BytesQueried")));
}
operationsObj["reads"] = reads.getStatus();
keysObj["read"] = readKeys.getStatus();
bytesObj["read"] = readBytes.getStatus();
}
catch (Error& e) {
if (e.code() == error_code_actor_cancelled)
throw;
incomplete_reasons->insert("Unknown read state.");
}
statusObj["operations"] = operationsObj;
statusObj["keys"] = keysObj;
statusObj["bytes"] = bytesObj;
return statusObj;
}
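// Summarizes the tlog sets of previous generations (kept until recovery fully completes).
// For each old generation this reports per-log health plus the replication factor, write
// anti-quorum, and remaining fault tolerance of its primary, satellite, and remote log sets,
// and lowers *oldLogFaultTolerance to the worst generation's tolerance.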
static JsonStringArray oldTlogFetcher(int* oldLogFaultTolerance, Reference<AsyncVar<struct ServerDBInfo>> db, std::unordered_map<NetworkAddress, WorkerInterface> const& address_workers) {
JsonStringArray oldTlogsArray;
if(db->get().recoveryState >= RecoveryState::ACCEPTING_COMMITS) {
for(auto it : db->get().logSystemConfig.oldTLogs) {
JsonString statusObj;
JsonStringArray logsObj;
Optional<int32_t> sat_log_replication_factor, sat_log_write_anti_quorum, sat_log_fault_tolerance, log_replication_factor, log_write_anti_quorum, log_fault_tolerance, remote_log_replication_factor, remote_log_fault_tolerance;
int maxFaultTolerance = 0;
for(int i = 0; i < it.tLogs.size(); i++) {
int failedLogs = 0;
for(auto& log : it.tLogs[i].tLogs) {
JsonString logObj;
bool failed = !log.present() || !address_workers.count(log.interf().address());
logObj["id"] = log.id().shortString();
logObj["healthy"] = !failed;
if(log.present()) {
logObj["address"] = log.interf().address().toString();
}
logsObj.push_back(logObj);
if(failed) {
failedLogs++;
}
}
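// Remaining fault tolerance of this log set: replication factor - 1, reduced by the write
// anti-quorum and by logs that have already failed.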
maxFaultTolerance = std::max(maxFaultTolerance, it.tLogs[i].tLogReplicationFactor - 1 - it.tLogs[i].tLogWriteAntiQuorum - failedLogs);
if(it.tLogs[i].isLocal && it.tLogs[i].locality == tagLocalitySatellite) {
sat_log_replication_factor = it.tLogs[i].tLogReplicationFactor;
sat_log_write_anti_quorum = it.tLogs[i].tLogWriteAntiQuorum;
sat_log_fault_tolerance = it.tLogs[i].tLogReplicationFactor - 1 - it.tLogs[i].tLogWriteAntiQuorum - failedLogs;
}
else if(it.tLogs[i].isLocal) {
log_replication_factor = it.tLogs[i].tLogReplicationFactor;
log_write_anti_quorum = it.tLogs[i].tLogWriteAntiQuorum;
log_fault_tolerance = it.tLogs[i].tLogReplicationFactor - 1 - it.tLogs[i].tLogWriteAntiQuorum - failedLogs;
}
else {
remote_log_replication_factor = it.tLogs[i].tLogReplicationFactor;
remote_log_fault_tolerance = it.tLogs[i].tLogReplicationFactor - 1 - failedLogs;
}
}
*oldLogFaultTolerance = std::min(*oldLogFaultTolerance, maxFaultTolerance);
statusObj["logs"] = logsObj;
if (sat_log_replication_factor.present())
statusObj["satellite_log_replication_factor"] = sat_log_replication_factor.get();
if (sat_log_write_anti_quorum.present())
statusObj["satellite_log_write_anti_quorum"] = sat_log_write_anti_quorum.get();
if (sat_log_fault_tolerance.present())
statusObj["satellite_log_fault_tolerance"] = sat_log_fault_tolerance.get();
if (log_replication_factor.present())
statusObj["log_replication_factor"] = log_replication_factor.get();
if (log_write_anti_quorum.present())
statusObj["log_write_anti_quorum"] = log_write_anti_quorum.get();
if (log_fault_tolerance.present())
statusObj["log_fault_tolerance"] = log_fault_tolerance.get();
if (remote_log_replication_factor.present())
statusObj["remote_log_replication_factor"] = remote_log_replication_factor.get();
if (remote_log_fault_tolerance.present())
statusObj["remote_log_fault_tolerance"] = remote_log_fault_tolerance.get();
oldTlogsArray.push_back(statusObj);
}
}
return oldTlogsArray;
}
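// Computes how many machines can fail without losing data (limited by the replication
// configuration, the coordinator quorum's zone placement, and the minimum number of replicas
// currently remaining) and without losing availability (additionally limited by the number of
// machines eligible to host replacement tlogs).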
static JsonString faultToleranceStatusFetcher(DatabaseConfiguration configuration, ServerCoordinators coordinators, std::vector<std::pair<WorkerInterface, ProcessClass>>& workers, int extraTlogEligibleMachines, int minReplicasRemaining) {
JsonString statusObj;
// without losing data
int32_t maxMachineFailures = configuration.maxMachineFailuresTolerated();
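// A majority of coordinators must survive, so with N coordinators at most (N-1)/2 may fail.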
int maxCoordinatorFailures = (coordinators.clientLeaderServers.size() - 1) / 2;
std::map<NetworkAddress, StringRef> workerZones;
for(auto& worker : workers) {
workerZones[worker.first.address()] = worker.first.locality.zoneId().orDefault(LiteralStringRef(""));
}
std::map<StringRef, int> coordinatorZoneCounts;
for(auto& coordinator : coordinators.ccf->getConnectionString().coordinators()) {
auto zone = workerZones[coordinator];
coordinatorZoneCounts[zone] += 1;
}
std::vector<std::pair<StringRef, int>> coordinatorZones(coordinatorZoneCounts.begin(), coordinatorZoneCounts.end());
std::sort(coordinatorZones.begin(), coordinatorZones.end(), [] (const std::pair<StringRef,int>& lhs, const std::pair<StringRef,int>& rhs) {
return lhs.second > rhs.second;
});
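// Greedily fail the zones holding the most coordinators first; the number of whole zones that
// can fail before a majority of coordinators is lost bounds the zone fault tolerance.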
int lostCoordinators = 0;
int maxCoordinatorZoneFailures = 0;
for(auto zone : coordinatorZones) {
lostCoordinators += zone.second;
if(lostCoordinators > maxCoordinatorFailures) {
break;
}
maxCoordinatorZoneFailures += 1;
}
int machineFailuresWithoutLosingData = std::min(maxMachineFailures, maxCoordinatorZoneFailures);
if (minReplicasRemaining >= 0){
machineFailuresWithoutLosingData = std::min(machineFailuresWithoutLosingData, minReplicasRemaining - 1);
}
statusObj["max_machine_failures_without_losing_data"] = std::max(machineFailuresWithoutLosingData, 0);
// without losing availability
statusObj["max_machine_failures_without_losing_availability"] = std::max(std::min(extraTlogEligibleMachines, machineFailuresWithoutLosingData), 0);
return statusObj;
}
static std::string getIssueDescription(std::string name) {
if(name == "incorrect_cluster_file_contents") {
return "Cluster file contents do not match current cluster connection string. Verify the cluster file and its parent directory are writable and that the cluster file has not been overwritten externally.";
}
// FIXME: name and description will be the same unless the message is 'incorrect_cluster_file_contents', which is currently the only possible message
return name;
}
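// Renders per-process issues as a map from process address to a name/description message object.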
static std::map<std::string, JsonString> getProcessIssuesAsMessages( ProcessIssuesMap const& _issues ) {
std::map<std::string, JsonString> issuesMap;
try {
ProcessIssuesMap issues = _issues;
for (auto i : issues) {
JsonString message = JsonString::makeMessage(i.second.first.c_str(), getIssueDescription(i.second.first).c_str());
issuesMap[i.first.toString()] = message;
}
}
catch (Error &e) {
TraceEvent(SevError, "ErrorParsingProcessIssues").error(e);
// swallow
}
return issuesMap;
}
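// Deduplicates client-reported issues by issue name and renders each as a message object that
// lists the addresses of the clients reporting it.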
static JsonStringArray getClientIssuesAsMessages( ProcessIssuesMap const& _issues) {
JsonStringArray issuesList;
try {
ProcessIssuesMap issues = _issues;
std::map<std::string, std::vector<std::string>> deduplicatedIssues;
for(auto i : issues) {
deduplicatedIssues[i.second.first].push_back(format("%s:%d", toIPString(i.first.ip).c_str(), i.first.port));
}
for (auto i : deduplicatedIssues) {
JsonString message = JsonString::makeMessage(i.first.c_str(), getIssueDescription(i.first).c_str());
JsonStringArray addresses;
for(auto addr : i.second) {
addresses.push_back(addr);
}
message["addresses"] = addresses;
issuesList.push_back(message);
}
}
catch (Error &e) {
TraceEvent(SevError, "ErrorParsingClientIssues").error(e);
// swallow
}
return issuesList;
}
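// Fetches the JSON status documents that layers (e.g. backup agents) publish under the layer
// status meta keyspace, merges them via JSONDoc::absorb (honoring merge operators such as $sum
// and version-gated $expires fields), and returns the combined "layers" status section.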
ACTOR Future<JsonString> layerStatusFetcher(Database cx, JsonStringArray *messages, std::set<std::string> *incomplete_reasons) {
state StatusObject result;
state JSONDoc json(result);
state double tStart = now();
try {
state ReadYourWritesTransaction tr(cx);
loop {
try {
tr.setOption(FDBTransactionOptions::ACCESS_SYSTEM_KEYS);
int64_t timeout_ms = 3000;
tr.setOption(FDBTransactionOptions::TIMEOUT, StringRef((uint8_t *)&timeout_ms, sizeof(int64_t)));
std::string jsonPrefix = layerStatusMetaPrefixRange.begin.toString() + "json/";
Standalone<RangeResultRef> jsonLayers = wait(tr.getRange(KeyRangeRef(jsonPrefix, strinc(jsonPrefix)), 1000));
// TODO: Also fetch other linked subtrees of meta keys
state std::vector<Future<Standalone<RangeResultRef>>> docFutures;
state int i;
for(i = 0; i < jsonLayers.size(); ++i)
docFutures.push_back(tr.getRange(KeyRangeRef(jsonLayers[i].value, strinc(jsonLayers[i].value)), 1000));
result.clear();
JSONDoc::expires_reference_version = (uint64_t)tr.getReadVersion().get();
for(i = 0; i < docFutures.size(); ++i) {
state Standalone<RangeResultRef> docs = wait(docFutures[i]);
state int j;
for(j = 0; j < docs.size(); ++j) {
state json_spirit::mValue doc;
try {
json_spirit::read_string(docs[j].value.toString(), doc);
Void _ = wait(yield());
json.absorb(doc.get_obj());
Void _ = wait(yield());
} catch(Error &e) {
TraceEvent(SevWarn, "LayerStatusBadJSON").detail("Key", printable(docs[j].key));
}
}
}
json.create("_valid") = true;
break;
} catch(Error &e) {
Void _ = wait(tr.onError(e));
}
}
} catch(Error &e) {
TraceEvent(SevWarn, "LayerStatusError").error(e);
incomplete_reasons->insert(format("Unable to retrieve layer status (%s).", e.what()));
json.create("_error") = format("Unable to retrieve layer status (%s).", e.what());
json.create("_valid") = false;
}
json.cleanOps();
JsonString statusObj = result.toJsonString();
TraceEvent("LayerStatusFetcher").detail("Duration", now()-tStart).detail("StatusSize",statusObj.getLength()).detail("StatusNameTotal",statusObj.getNameTotal());
return statusObj;
}
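// Determines whether the database is locked by attempting to get a read version on a connection
// that is not lock-aware: success means unlocked, error_code_database_locked means locked, and
// after timeoutSeconds the question is recorded as unanswerable in incomplete_reasons.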
ACTOR Future<JsonString> lockedStatusFetcher(Reference<AsyncVar<struct ServerDBInfo>> db, JsonStringArray *messages, std::set<std::string> *incomplete_reasons) {
state JsonString statusObj;
state Database cx = openDBOnServer(db, TaskDefaultEndpoint, true, false); // Open a new database connection that isn't lock-aware
state Transaction tr(cx);
state int timeoutSeconds = 5;
state Future<Void> getTimeout = delay(timeoutSeconds);
loop {
tr.setOption(FDBTransactionOptions::PRIORITY_SYSTEM_IMMEDIATE);
try {
choose{
when(Version f = wait(tr.getReadVersion())) {
statusObj["database_locked"] = false;
}
when(Void _ = wait(getTimeout)) {
incomplete_reasons->insert(format("Unable to determine if database is locked after %d seconds.", timeoutSeconds));
}
}
break;
}
catch (Error &e) {
if (e.code() == error_code_database_locked) {
statusObj["database_locked"] = true;
break;
}
else {
try {
Void _ = wait(tr.onError(e));
}
catch (Error &e) {
incomplete_reasons->insert(format("Unable to determine if database is locked (%s).", e.what()));
break;
}
}
}
}
return statusObj;
}
// constructs the cluster section of the json status output
ACTOR Future<StatusReply> clusterGetStatus(
Reference<AsyncVar<struct ServerDBInfo>> db,
Database cx,
vector<std::pair<WorkerInterface, ProcessClass>> workers,
ProcessIssuesMap workerIssues,
ProcessIssuesMap clientIssues,
ClientVersionMap clientVersionMap,
std::map<NetworkAddress, std::string> traceLogGroupMap,
ServerCoordinators coordinators,
std::vector<NetworkAddress> incompatibleConnections,
Version datacenterVersionDifference )
{
// since we no longer offer multi-database support, all databases must be named DB
state std::string dbName = "DB";
state double tStart = now();
// Check if master worker is present
state JsonStringArray messages;
state std::set<std::string> status_incomplete_reasons;
state std::pair<WorkerInterface, ProcessClass> mWorker;
try {
// Get the master Worker interface
Optional<std::pair<WorkerInterface, ProcessClass>> _mWorker = getWorker( workers, db->get().master.address() );
if (_mWorker.present()) {
mWorker = _mWorker.get();
} else {
messages.push_back(JsonString::makeMessage("unreachable_master_worker", "Unable to locate the master worker."));
}
// Get latest events for various event types from ALL workers
// WorkerEvents is a map of worker's NetworkAddress to its event string
// The pair represents worker responses and a set of worker NetworkAddress strings which did not respond
std::vector< Future< Optional <std::pair<WorkerEvents, std::set<std::string>>> > > futures;
futures.push_back(latestEventOnWorkers(workers, "MachineMetrics"));
futures.push_back(latestEventOnWorkers(workers, "ProcessMetrics"));
futures.push_back(latestErrorOnWorkers(workers));
futures.push_back(latestEventOnWorkers(workers, "TraceFileOpenError"));
futures.push_back(latestEventOnWorkers(workers, "ProgramStart"));
// Wait for all response pairs.
state std::vector< Optional <std::pair<WorkerEvents, std::set<std::string>>> > workerEventsVec = wait(getAll(futures));
// Create a unique set of all workers who were unreachable for 1 or more of the event requests above.
// Since each event request is independent and to all workers, workers can have responded to some
// event requests but still end up in the unreachable set.
std::set<std::string> mergeUnreachable;
// For each (optional) pair, if the pair is present and not empty then add the unreachable workers to the set.
for (auto pair : workerEventsVec)
{
if (pair.present() && pair.get().second.size())
mergeUnreachable.insert(pair.get().second.begin(), pair.get().second.end());
}
// We now have a unique set of workers who were in some way unreachable. If there is anything in that set, create a message
// for it and include the list of unreachable processes.
if (mergeUnreachable.size()){
JsonString message = JsonString::makeMessage("unreachable_processes", "The cluster has some unreachable processes.");
JsonStringArray unreachableProcs;
for (auto m : mergeUnreachable){
unreachableProcs.push_back(JsonString("address", m));
}
message["unreachable_processes"] = unreachableProcs;
messages.push_back(message);
}
// construct status information for cluster subsections
state int statusCode = (int) RecoveryStatus::END;
state JsonString recoveryStateStatus = wait(recoveryStateStatusFetcher(mWorker, workers.size(), &status_incomplete_reasons, &statusCode));
// machine metrics
state WorkerEvents mMetrics = workerEventsVec[0].present() ? workerEventsVec[0].get().first : WorkerEvents();
// process metrics
state WorkerEvents pMetrics = workerEventsVec[1].present() ? workerEventsVec[1].get().first : WorkerEvents();
state WorkerEvents latestError = workerEventsVec[2].present() ? workerEventsVec[2].get().first : WorkerEvents();
state WorkerEvents traceFileOpenErrors = workerEventsVec[3].present() ? workerEventsVec[3].get().first : WorkerEvents();
state WorkerEvents programStarts = workerEventsVec[4].present() ? workerEventsVec[4].get().first : WorkerEvents();
state JsonString statusObj;
if(db->get().recoveryCount > 0) {
statusObj["generation"] = db->get().recoveryCount;
}
state std::map<std::string, JsonString> processIssues = getProcessIssuesAsMessages(workerIssues);
state vector<std::pair<StorageServerInterface, TraceEventFields>> storageServers;
state vector<std::pair<TLogInterface, TraceEventFields>> tLogs;
state JsonString qos;
state JsonString data_overlay;
statusObj["protocol_version"] = format("%llx", currentProtocolVersion);
statusObj["connection_string"] = coordinators.ccf->getConnectionString().toString();
state Optional<DatabaseConfiguration> configuration;
state Optional<bool> fullReplication;
if(!(recoveryStateStatus.isPresent("name") && statusCode == RecoveryStatus::configuration_missing)) {
std::pair<Optional<DatabaseConfiguration>,Optional<bool>> loadResults = wait(loadConfiguration(cx, &messages, &status_incomplete_reasons));
configuration = loadResults.first;
fullReplication = loadResults.second;
}
if(fullReplication.present()) {
statusObj["full_replication"] = fullReplication.get();
}
statusObj["machines"] = machineStatusFetcher(mMetrics, workers, configuration, &status_incomplete_reasons);
if (configuration.present()){
// Do the latency probe by itself to avoid interference from other status activities
JsonString latencyProbeResults = wait(latencyProbeFetcher(cx, &messages, &status_incomplete_reasons));
statusObj["database_available"] = latencyProbeResults.isPresent("immediate_priority_transaction_start_seconds") && latencyProbeResults.isPresent("read_seconds") && latencyProbeResults.isPresent("commit_seconds");
if (!latencyProbeResults.empty()) {
statusObj["latency_probe"] = latencyProbeResults;
}
// Start getting storage servers now (using system priority) concurrently. Using sys priority because having storage servers
// in status output is important to give context to error messages in status that reference a storage server role ID.
state std::unordered_map<NetworkAddress, WorkerInterface> address_workers;
for (auto worker : workers)
address_workers[worker.first.address()] = worker.first;
state Future<ErrorOr<vector<std::pair<StorageServerInterface, TraceEventFields>>>> storageServerFuture = errorOr(getStorageServersAndMetrics(cx, address_workers));
state Future<ErrorOr<vector<std::pair<TLogInterface, TraceEventFields>>>> tLogFuture = errorOr(getTLogsAndMetrics(db, address_workers));
state int minReplicasRemaining = -1;
std::vector<Future<JsonString>> futures2;
futures2.push_back(dataStatusFetcher(mWorker, dbName, &minReplicasRemaining));
futures2.push_back(workloadStatusFetcher(db, workers, mWorker, dbName, &qos, &data_overlay, &status_incomplete_reasons, storageServerFuture));
futures2.push_back(layerStatusFetcher(cx, &messages, &status_incomplete_reasons));
futures2.push_back(lockedStatusFetcher(db, &messages, &status_incomplete_reasons));
state std::vector<JsonString> workerStatuses = wait(getAll(futures2));
int oldLogFaultTolerance = 100;
if(db->get().recoveryState >= RecoveryState::ACCEPTING_COMMITS && db->get().logSystemConfig.oldTLogs.size() > 0) {
statusObj["old_logs"] = oldTlogFetcher(&oldLogFaultTolerance, db, address_workers);
}
if(configuration.present()) {
int extraTlogEligibleMachines = getExtraTLogEligibleMachines(workers, configuration.get());
statusObj["fault_tolerance"] = faultToleranceStatusFetcher(configuration.get(), coordinators, workers, extraTlogEligibleMachines, minReplicasRemaining);
}
JsonString configObj = configurationFetcher(configuration, coordinators, &status_incomplete_reasons);
// configObj could be empty
if (!configObj.empty())
statusObj["configuration"] = configObj;
// workloadStatusFetcher returns the workload section but also optionally writes the qos section and adds to the data_overlay object
if (!workerStatuses[1].empty())
statusObj["workload"] = workerStatuses[1];
statusObj["layers"] = workerStatuses[2];
// Add qos section if it was populated
if (!qos.empty())
statusObj["qos"] = qos;
// Merge data_overlay into data
JsonString &clusterDataSection = workerStatuses[0];
clusterDataSection.append(data_overlay);
// If data section not empty, add it to statusObj
if (!clusterDataSection.empty())
statusObj["data"] = clusterDataSection;
// Insert database_locked section
if(!workerStatuses[3].empty()) {
statusObj.append(workerStatuses[3]);
}
// Need storage servers now for processStatusFetcher() below.
ErrorOr<vector<std::pair<StorageServerInterface, TraceEventFields>>> _storageServers = wait(storageServerFuture);
if (_storageServers.present()) {
storageServers = _storageServers.get();
}
else
messages.push_back(JsonString::makeMessage("storage_servers_error", "Timed out trying to retrieve storage servers."));
// ...also tlogs
ErrorOr<vector<std::pair<TLogInterface, TraceEventFields>>> _tLogs = wait(tLogFuture);
if (_tLogs.present()) {
tLogs = _tLogs.get();
}
else
messages.push_back(JsonString::makeMessage("log_servers_error", "Timed out trying to retrieve log servers."));
}
else {
// Set layers status to { _valid: false, _error: "configurationMissing" }
JsonString jsonString("_valid", false);
jsonString.append("_error", "configurationMissing");
statusObj["layers"] = jsonString;
}
JsonString processStatus = wait(processStatusFetcher(db, workers, pMetrics, mMetrics, latestError, traceFileOpenErrors, programStarts, processIssues, storageServers, tLogs, cx, configuration, &status_incomplete_reasons));
statusObj["processes"] = processStatus;
statusObj["clients"] = clientStatusFetcher(clientVersionMap, traceLogGroupMap);
JsonStringArray incompatibleConnectionsArray;
for(auto it : incompatibleConnections) {
incompatibleConnectionsArray.push_back(it.toString());
}
statusObj["incompatible_connections"] = incompatibleConnectionsArray;
statusObj["datacenter_version_difference"] = datacenterVersionDifference;
if (!recoveryStateStatus.empty())
statusObj["recovery_state"] = recoveryStateStatus;
// Cluster messages subsection
JsonStringArray clientIssuesArr = getClientIssuesAsMessages(clientIssues);
if (clientIssuesArr.size() > 0) {
JsonString clientIssueMessage = JsonString::makeMessage("client_issues", "Some clients of this cluster have issues.");
clientIssueMessage["issues"] = clientIssuesArr;
messages.push_back(clientIssueMessage);
}
// Create the status_incomplete message if there were any reasons that the status is incomplete.
if (!status_incomplete_reasons.empty())
{
JsonString incomplete_message = JsonString::makeMessage("status_incomplete", "Unable to retrieve all status information.");
// Make a JSON array of all of the reasons in the status_incomplete_reasons set.
JsonStringArray reasons;
for (auto i : status_incomplete_reasons) {
reasons.push_back(JsonString("description", i));
}
incomplete_message["reasons"] = reasons;
messages.push_back(incomplete_message);
}
statusObj["messages"] = messages;
int64_t clusterTime = time(0);
if (clusterTime != -1){
statusObj["cluster_controller_timestamp"] = clusterTime;
}
TraceEvent("ClusterGetStatus").detail("Duration", now()-tStart)
.detail("StatusSize",statusObj.getLength()) .detail("StatusNameTotal",statusObj.getNameTotal());
return StatusReply(statusObj);
} catch( Error&e ) {
TraceEvent(SevError, "StatusError").error(e);
throw;
}
}
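// Exercises the JsonString builder: construction, order-sensitive equality, key presence,
// clearing, nested objects, and array handling.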
TEST_CASE("status/json/jsonstring") {
JsonString jsonObj, testObj;
JsonStringArray jsonArray;
JsonString jsonString1;
jsonString1["_valid"] = false;
jsonString1["error"] = "configurationMissing";
JsonString jsonString2("_valid", false);
jsonString2["error"] = "configurationMissing";
JsonString jsonString3("error", "configurationMissing");
jsonString3["_valid"] = false;
JsonString jsonString4("_valid", false);
jsonString4.append("error", "configurationMissing");
std::cout << "Json: " << jsonString1.getJson() << std::endl;
// Validate equality
ASSERT(jsonString1 == jsonString2);
ASSERT(jsonString1 != jsonString3); // wrong order
ASSERT(jsonString1.equals(jsonString4));
ASSERT(jsonString4.equals(jsonString1));
// Check presence of top level keys
ASSERT(jsonString1.isPresent("_valid"));
ASSERT(jsonString1.isPresent("error"));
ASSERT(!jsonString1.isPresent("configurationMissing"));
ASSERT(jsonString1.getNameTotal() == 2);
// Check empty
ASSERT(!jsonString1.empty());
ASSERT(JsonString().empty());
// Check clear
jsonString1.clear();
ASSERT(jsonString1.empty());
// Set object
jsonObj.clear();
testObj.clear();
jsonObj["first"] = "last";
jsonObj["count"] = 3;
testObj["pi"] = 3.14159;
jsonObj["piobj"] = testObj;
// Check presence of top level keys
ASSERT(jsonObj.isPresent("count"));
ASSERT(testObj.isPresent("pi"));
ASSERT(!jsonObj.isPresent("pi"));
ASSERT(jsonObj.getNameTotal() == 3);
testObj.clear();
testObj["val1"] = 7.9;
testObj["val2"] = 34;
jsonArray.push_back(testObj);
testObj.clear();
testObj["name1"] = "robert";
testObj["name2"] = "john";
testObj["name3"] = "eric";
jsonArray.push_back(testObj);
jsonObj.append("name_vals", jsonArray);
std::cout << "Json (complex): " << jsonObj.getJson() << std::endl;
jsonObj.clear();
jsonObj.append(jsonArray);
std::cout << "Json (complex array): " << jsonObj.getJson() << std::endl;
jsonArray.clear();
jsonArray.push_back("nissan");
jsonArray.push_back("honda");
jsonArray.push_back("bmw");
jsonObj.clear();
jsonObj.append(jsonArray);
std::cout << "Array (simple array #1): " << jsonObj.getJson() << std::endl;
jsonObj.clear();
testObj.clear();
jsonArray.clear();
testObj.append("nissan");
testObj.append("honda");
testObj.append("bmw");
jsonArray.push_back(testObj);
jsonObj.append(jsonArray);
std::cout << "Array (simple array #2): " << jsonObj.getJson() << std::endl;
jsonObj.clear();
testObj.clear();
jsonObj["name1"] = "robert";
jsonObj["name2"] = "john";
jsonObj["name3"] = "eric";
testObj["val1"] = 7.9;
testObj["val2"] = 34;
std::cout << "Merge (obj #1): " << jsonObj.getJson() << std::endl;
std::cout << "Merge (obj #2): " << testObj.getJson() << std::endl;
jsonObj.append(testObj);
std::cout << "Merged: " << jsonObj.getJson() << std::endl;
return Void();
}
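// Exercises JSONDoc merge semantics: absorb() combining documents using the $sum, $min, $max,
// $and, $last, $latest, $count_keys, and version-gated $expires operators.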
TEST_CASE("status/json/merging") {
StatusObject objA, objB, objC;
JSONDoc a(objA), b(objB), c(objC);
a.create("int_one") = 1;
a.create("int_unmatched") = 2;
a.create("int_total_30.$sum") = 10;
a.create("bool_true.$and") = true;
a.create("string") = "test";
a.create("subdoc.int_11") = 11;
a.create("a") = "justA";
a.create("subdoc.double_max_5.$max") = 2.0;
a.create("subdoc.double_min_2.$min") = 2.0;
a.create("subdoc.obj_count_3.$count_keys.one") = 1;
a.create("subdoc.obj_count_3.$count_keys.two") = 2;
a.create("expired.$expires") = "I should have expired.";
a.create("expired.version") = 1;
a.create("not_expired_and_merged.$expires.seven.$sum") = 1;
a.create("not_expired_and_merged.$expires.one.$min") = 3;
a.create("not_expired_and_merged.version") = 3;
a.create("mixed_numeric_sum_6.$sum") = 0.5;
a.create("mixed_numeric_min_0.$min") = 1.5;
b.create("int_one") = 1;
b.create("int_unmatched") = 3;
b.create("int_total_30.$sum") = 20;
b.create("bool_true.$and") = true;
b.create("string") = "test";
b.create("subdoc.int_11") = 11;
b.create("b") = "justB";
b.create("subdoc.double_max_5.$max") = 5.0;
b.create("subdoc.double_min_2.$min") = 5.0;
b.create("subdoc.obj_count_3.$count_keys.three") = 3;
b.create("expired.$expires") = "I should have also expired.";
b.create("expired.version") = 1;
b.create("not_expired_and_merged.$expires.seven.$sum") = 2;
b.create("not_expired_and_merged.$expires.one.$min") = 1;
b.create("not_expired_and_merged.version") = 3;
b.create("last_hello.$last") = "blah";
b.create("latest_obj.$latest.a") = 0;
b.create("latest_obj.$latest.b") = 0;
b.create("latest_obj.$latest.c") = 0;
b.create("latest_obj.timestamp") = 2;
b.create("latest_int_5.$latest") = 7;
b.create("latest_int_5.timestamp") = 2;
b.create("mixed_numeric_sum_6.$sum") = 1;
b.create("mixed_numeric_min_0.$min") = 4.5;
c.create("int_total_30.$sum") = 0;
c.create("not_expired.$expires") = "I am still valid";
c.create("not_expired.version") = 3;
c.create("not_expired_and_merged.$expires.seven.$sum") = 4;
c.create("not_expired_and_merged.$expires.one.$min") = 2;
c.create("not_expired_and_merged.version") = 3;
c.create("last_hello.$last") = "hello";
c.create("latest_obj.$latest.a.$max") = "a";
c.create("latest_obj.$latest.b.$min") = "b";
c.create("latest_obj.$latest.expired.$expires") = "I should not be here.";
c.create("latest_obj.$latest.expired.version") = 1;
c.create("latest_obj.$latest.not_expired.$expires") = "Still alive.";
c.create("latest_obj.$latest.not_expired.version") = 3;
c.create("latest_obj.timestamp") = 3;
c.create("latest_int_5.$latest") = 5;
c.create("latest_int_5.timestamp") = 3;
c.create("mixed_numeric_sum_6.$sum") = 4.5;
c.create("mixed_numeric_min_0.$min") = (double)0.0;
printf("a = \n%s\n", json_spirit::write_string(json_spirit::mValue(objA), json_spirit::pretty_print).c_str());
printf("b = \n%s\n", json_spirit::write_string(json_spirit::mValue(objB), json_spirit::pretty_print).c_str());
printf("c = \n%s\n", json_spirit::write_string(json_spirit::mValue(objC), json_spirit::pretty_print).c_str());
JSONDoc::expires_reference_version = 2;
a.absorb(b);
a.absorb(c);
a.cleanOps();
printf("result = \n%s\n", json_spirit::write_string(json_spirit::mValue(objA), json_spirit::pretty_print).c_str());
std::string result = json_spirit::write_string(json_spirit::mValue(objA));
std::string expected = "{\"a\":\"justA\",\"b\":\"justB\",\"bool_true\":true,\"expired\":null,\"int_one\":1,\"int_total_30\":30,\"int_unmatched\":{\"ERROR\":\"Values do not match.\",\"a\":2,\"b\":3},\"last_hello\":\"hello\",\"latest_int_5\":5,\"latest_obj\":{\"a\":\"a\",\"b\":\"b\",\"not_expired\":\"Still alive.\"},\"mixed_numeric_min_0\":0,\"mixed_numeric_sum_6\":6,\"not_expired\":\"I am still valid\",\"not_expired_and_merged\":{\"one\":1,\"seven\":7},\"string\":\"test\",\"subdoc\":{\"double_max_5\":5,\"double_min_2\":2,\"int_11\":11,\"obj_count_3\":3}}";
if(result != expected) {
printf("ERROR: Combined doc does not match expected.\nexpected:\n\n%s\nresult:\n%s\n", expected.c_str(), result.c_str());
ASSERT(false);
}
return Void();
}