2022-02-05 02:59:01 +08:00
|
|
|
/*
|
2022-02-05 05:46:44 +08:00
|
|
|
* TCInfo.h
|
2022-02-05 02:59:01 +08:00
|
|
|
*
|
|
|
|
* This source file is part of the FoundationDB open source project
|
|
|
|
*
|
2022-02-10 05:28:40 +08:00
|
|
|
* Copyright 2013-2022 Apple Inc. and the FoundationDB project authors
|
2022-02-05 02:59:01 +08:00
|
|
|
*
|
|
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
* you may not use this file except in compliance with the License.
|
|
|
|
* You may obtain a copy of the License at
|
|
|
|
*
|
|
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
*
|
|
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
* See the License for the specific language governing permissions and
|
|
|
|
* limitations under the License.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#pragma once
|
|
|
|
|
|
|
|
#include <algorithm>

#include "fdbserver/DDTeamCollection.h"
|
|
|
|
|
|
|
|
// Forward declarations. The classes in this header refer to one another before they are
// defined: TCServerInfo holds Reference<TCTeamInfo> and Reference<TCMachineInfo> members,
// and TCMachineInfo holds Reference<TCMachineTeamInfo> members.
class TCTeamInfo;
|
|
|
|
class TCMachineInfo;
|
|
|
|
class TCMachineTeamInfo;
|
|
|
|
|
|
|
|
// Per-storage-server bookkeeping record. Instances are reference counted and are handed
// around as Reference<TCServerInfo>.
class TCServerInfo : public ReferenceCounted<TCServerInfo> {
    // These two classes are granted access to the private state below.
    friend class TCServerInfoImpl;
    friend class DDTeamCollectionUnitTest;

private:
    UID id; // Exposed through getId()
    bool inDesiredDC; // Exposed through isInDesiredDC()
    DDTeamCollection* collection; // NOTE(review): presumably the collection given to the constructor
    Future<Void> tracker; // Replaced through setTracker()

    // TODO: Remove?
    [[maybe_unused]] Version addedVersion; // Read version when this Server is added

    StorageServerInterface lastKnownInterface; // Exposed through getLastKnownInterface()
    ProcessClass lastKnownClass; // Exposed through getLastKnownClass()

    // A storage server's StoreType does not change.
    // To change storeType for an ip:port, we destroy the old one and create a new one.
    KeyValueStoreType storeType; // Storage engine type

    int64_t dataInFlightToServer; // Adjusted through incrementDataInFlightToServer()
    std::vector<Reference<TCTeamInfo>> teams; // Appended to by addTeam()
    ErrorOr<GetStorageMetricsReply> metrics; // Assigned by setMetrics(); queried by metricsPresent()

    // Unwraps the stored metrics reply.
    // NOTE(review): presumably only meaningful while metricsPresent() is true -- confirm.
    const GetStorageMetricsReply& getMetrics() const { return metrics.get(); }

    // Stores a copy of serverMetrics as the current metrics value.
    void setMetrics(GetStorageMetricsReply serverMetrics) { metrics = serverMetrics; }

    void markTeamUnhealthy(int teamIndex);

public:
    Reference<TCMachineInfo> machine;

    // NOTE(review): each on* future below presumably corresponds to the promise declared
    // next to it; the wiring happens outside this header -- confirm.
    Promise<std::pair<StorageServerInterface, ProcessClass>> interfaceChanged;
    Future<std::pair<StorageServerInterface, ProcessClass>> onInterfaceChanged;
    Promise<Void> removed;
    Future<Void> onRemoved;
    Future<Void> onTSSPairRemoved;
    Promise<Void> killTss;
    Promise<Void> wakeUpTracker;
    LocalityEntry localityEntry;
    Promise<Void> updated;
    AsyncVar<bool> wrongStoreTypeToRemove;
    AsyncVar<bool> ssVersionTooFarBehind;

    // addedVersion defaults to 0 when the caller does not supply it.
    TCServerInfo(StorageServerInterface ssi,
                 DDTeamCollection* collection,
                 ProcessClass processClass,
                 bool inDesiredDC,
                 Reference<LocalitySet> storageServerSet,
                 Version addedVersion = 0);

    ~TCServerInfo();

    // --- identity and placement ---
    const UID& getId() const { return id; }
    bool isInDesiredDC() const { return inDesiredDC; }
    void updateInDesiredDC(const std::vector<Optional<Key>>& includedDCs);

    // --- tracker lifetime ---
    void setTracker(Future<Void> tracker) { this->tracker = tracker; }
    void cancel();

    // --- last known interface / process class ---
    void updateLastKnown(const StorageServerInterface&, ProcessClass);
    const StorageServerInterface& getLastKnownInterface() const { return lastKnownInterface; }
    const ProcessClass& getLastKnownClass() const { return lastKnownClass; }

    // --- store type ---
    Future<Void> updateStoreType();
    KeyValueStoreType getStoreType() const { return storeType; }

    // True when this server's store type equals configStoreType, or is still
    // KeyValueStoreType::END.
    bool isCorrectStoreType(KeyValueStoreType configStoreType) const {
        // A new storage server's store type may not be set immediately.
        // If a storage server does not reply its storeType, it will be tracked by failure monitor and removed.
        if (storeType == KeyValueStoreType::END) {
            return true;
        }
        return storeType == configStoreType;
    }

    // --- in-flight data accounting ---
    int64_t getDataInFlightToServer() const { return dataInFlightToServer; }
    // Adds bytes to the in-flight counter.
    void incrementDataInFlightToServer(int64_t bytes) { dataInFlightToServer += bytes; }

    // --- team membership ---
    const std::vector<Reference<TCTeamInfo>>& getTeams() const { return teams; }
    void addTeam(Reference<TCTeamInfo> team) { teams.push_back(team); }
    void removeTeamsContainingServer(UID removedServer);
    void removeTeam(Reference<TCTeamInfo>);

    // --- metrics ---
    bool metricsPresent() const { return metrics.present(); }
    std::pair<int64_t, int64_t> spaceBytes(bool includeInFlight = true) const;
    int64_t loadBytes() const;
    bool hasHealthyAvailableSpace(double minAvailableSpaceRatio) const;
    Future<Void> updateServerMetrics();
    static Future<Void> updateServerMetrics(Reference<TCServerInfo> server);
    Future<Void> serverMetricsPolling();

    bool isWigglePausedServer() const;
};
|
|
|
|
|
|
|
|
// Per-machine record: the servers located on the machine, the machine's ID, and the
// machine teams it is listed in. Instances are reference counted.
class TCMachineInfo : public ReferenceCounted<TCMachineInfo> {
private:
    // Default construction is private, so only members of this class can create an
    // empty instance.
    TCMachineInfo() = default;

public:
    std::vector<Reference<TCServerInfo>> serversOnMachine; // SOMEDAY: change from vector to set
    Standalone<StringRef> machineID;
    std::vector<Reference<TCMachineTeamInfo>> machineTeams; // SOMEDAY: split good and bad machine teams.
    LocalityEntry localityEntry;

    explicit TCMachineInfo(Reference<TCServerInfo> server, LocalityEntry const& entry);

    // Returns a new reference-counted TCMachineInfo; defined outside this header.
    Reference<TCMachineInfo> clone() const;

    // String form of the IDs of the servers on this machine; defined outside this header.
    std::string getServersIDStr() const;
};
|
|
|
|
|
|
|
|
// TeamCollection's machine team information
|
|
|
|
class TCMachineTeamInfo : public ReferenceCounted<TCMachineTeamInfo> {
|
2022-02-12 14:56:16 +08:00
|
|
|
UID _id;
|
2022-02-05 02:59:01 +08:00
|
|
|
std::vector<Reference<TCMachineInfo>> machines;
|
|
|
|
std::vector<Standalone<StringRef>> machineIDs;
|
|
|
|
std::vector<Reference<TCTeamInfo>> serverTeams;
|
|
|
|
|
2022-02-13 07:50:51 +08:00
|
|
|
public:
|
2022-02-11 11:19:50 +08:00
|
|
|
explicit TCMachineTeamInfo(std::vector<Reference<TCMachineInfo>> const& machines);
|
2022-02-05 02:59:01 +08:00
|
|
|
|
|
|
|
int size() const {
|
2022-02-12 14:56:16 +08:00
|
|
|
ASSERT_EQ(machines.size(), machineIDs.size());
|
2022-02-05 02:59:01 +08:00
|
|
|
return machineIDs.size();
|
|
|
|
}
|
|
|
|
|
2022-02-12 14:56:16 +08:00
|
|
|
UID id() const { return _id; }
|
2022-02-13 07:50:51 +08:00
|
|
|
std::vector<Reference<TCMachineInfo>> const& getMachines() const { return machines; }
|
|
|
|
std::vector<Standalone<StringRef>> const& getMachineIDs() const { return machineIDs; }
|
|
|
|
std::vector<Reference<TCTeamInfo>> const& getServerTeams() const { return serverTeams; }
|
|
|
|
void addServerTeam(Reference<TCTeamInfo> team) { serverTeams.push_back(team); }
|
|
|
|
bool matches(std::vector<Standalone<StringRef>> const& sortedMachineIDs);
|
2022-02-11 11:19:50 +08:00
|
|
|
std::string getMachineIDsStr() const;
|
2022-02-13 07:50:51 +08:00
|
|
|
bool containsMachine(Standalone<StringRef> machineID) const {
|
|
|
|
return std::count(machineIDs.begin(), machineIDs.end(), machineID);
|
|
|
|
}
|
|
|
|
|
|
|
|
// Returns true iff team is found
|
|
|
|
bool removeServerTeam(Reference<TCTeamInfo> team);
|
2022-02-05 02:59:01 +08:00
|
|
|
|
|
|
|
bool operator==(TCMachineTeamInfo& rhs) const { return this->machineIDs == rhs.machineIDs; }
|
|
|
|
};
|
|
|
|
|
|
|
|
// TeamCollection's server team info.
|
|
|
|
class TCTeamInfo final : public ReferenceCounted<TCTeamInfo>, public IDataDistributionTeam {
|
|
|
|
friend class TCTeamInfoImpl;
|
|
|
|
std::vector<Reference<TCServerInfo>> servers;
|
|
|
|
std::vector<UID> serverIDs;
|
|
|
|
bool healthy;
|
|
|
|
bool wrongConfiguration; // True if any of the servers in the team have the wrong configuration
|
|
|
|
int priority;
|
|
|
|
UID id;
|
|
|
|
|
|
|
|
public:
|
|
|
|
Reference<TCMachineTeamInfo> machineTeam;
|
|
|
|
Future<Void> tracker;
|
|
|
|
|
2022-02-11 11:19:50 +08:00
|
|
|
explicit TCTeamInfo(std::vector<Reference<TCServerInfo>> const& servers);
|
2022-02-05 02:59:01 +08:00
|
|
|
|
|
|
|
std::string getTeamID() const override { return id.shortString(); }
|
|
|
|
|
2022-02-11 11:19:50 +08:00
|
|
|
std::vector<StorageServerInterface> getLastKnownServerInterfaces() const override;
|
|
|
|
|
2022-02-05 02:59:01 +08:00
|
|
|
int size() const override {
|
|
|
|
ASSERT(servers.size() == serverIDs.size());
|
|
|
|
return servers.size();
|
|
|
|
}
|
|
|
|
|
2022-02-11 11:19:50 +08:00
|
|
|
std::vector<UID> const& getServerIDs() const override { return serverIDs; }
|
2022-02-05 02:59:01 +08:00
|
|
|
|
2022-02-11 11:19:50 +08:00
|
|
|
const std::vector<Reference<TCServerInfo>>& getServers() const { return servers; }
|
2022-02-05 02:59:01 +08:00
|
|
|
|
2022-02-11 11:19:50 +08:00
|
|
|
std::string getServerIDsStr() const;
|
2022-02-05 02:59:01 +08:00
|
|
|
|
2022-02-11 11:19:50 +08:00
|
|
|
void addDataInFlightToTeam(int64_t delta) override;
|
2022-02-05 02:59:01 +08:00
|
|
|
|
2022-02-11 11:19:50 +08:00
|
|
|
int64_t getDataInFlightToTeam() const override;
|
2022-02-05 02:59:01 +08:00
|
|
|
|
2022-02-11 11:19:50 +08:00
|
|
|
int64_t getLoadBytes(bool includeInFlight = true, double inflightPenalty = 1.0) const override;
|
2022-02-05 02:59:01 +08:00
|
|
|
|
2022-02-11 11:19:50 +08:00
|
|
|
int64_t getMinAvailableSpace(bool includeInFlight = true) const override;
|
2022-02-05 02:59:01 +08:00
|
|
|
|
2022-02-11 11:19:50 +08:00
|
|
|
double getMinAvailableSpaceRatio(bool includeInFlight = true) const override;
|
2022-02-05 02:59:01 +08:00
|
|
|
|
2022-02-11 11:19:50 +08:00
|
|
|
bool hasHealthyAvailableSpace(double minRatio) const override;
|
2022-02-05 02:59:01 +08:00
|
|
|
|
|
|
|
Future<Void> updateStorageMetrics() override;
|
|
|
|
|
2022-02-11 11:19:50 +08:00
|
|
|
bool isOptimal() const override;
|
2022-02-05 02:59:01 +08:00
|
|
|
|
|
|
|
bool isWrongConfiguration() const override { return wrongConfiguration; }
|
|
|
|
void setWrongConfiguration(bool wrongConfiguration) override { this->wrongConfiguration = wrongConfiguration; }
|
|
|
|
bool isHealthy() const override { return healthy; }
|
|
|
|
void setHealthy(bool h) override { healthy = h; }
|
|
|
|
int getPriority() const override { return priority; }
|
|
|
|
void setPriority(int p) override { priority = p; }
|
2022-03-19 01:25:41 +08:00
|
|
|
void addref() const override { ReferenceCounted<TCTeamInfo>::addref(); }
|
|
|
|
void delref() const override { ReferenceCounted<TCTeamInfo>::delref(); }
|
2022-02-05 02:59:01 +08:00
|
|
|
|
2022-02-11 11:19:50 +08:00
|
|
|
bool hasServer(const UID& server) const;
|
2022-03-15 07:02:42 +08:00
|
|
|
bool hasWigglePausedServer() const;
|
2022-02-05 02:59:01 +08:00
|
|
|
|
2022-02-11 11:19:50 +08:00
|
|
|
void addServers(const std::vector<UID>& servers) override;
|
2022-02-05 02:59:01 +08:00
|
|
|
|
|
|
|
private:
|
|
|
|
// Calculate an "average" of the metrics replies that we received. Penalize teams from which we did not receive all
|
|
|
|
// replies.
|
2022-02-11 11:19:50 +08:00
|
|
|
int64_t getLoadAverage() const;
|
2022-02-16 14:43:06 +08:00
|
|
|
|
|
|
|
bool allServersHaveHealthyAvailableSpace() const;
|
2022-02-05 02:59:01 +08:00
|
|
|
};
|