// foundationdb/fdbclient/BlobWorkerInterface.h

/*
* BlobWorkerInterface.h
*
* This source file is part of the FoundationDB open source project
*
* Copyright 2013-2022 Apple Inc. and the FoundationDB project authors
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#ifndef FDBCLIENT_BLOBWORKERINTERFACE_H
#define FDBCLIENT_BLOBWORKERINTERFACE_H
#pragma once
#include "fdbclient/BlobGranuleCommon.h"
#include "fdbclient/FDBTypes.h"
#include "fdbrpc/fdbrpc.h"
#include "fdbrpc/Locality.h"
struct BlobWorkerInterface {
constexpr static FileIdentifier file_identifier = 8358753;
// TODO: mimic what StorageServerInterface does with sequential endpoint IDs
RequestStream<ReplyPromise<Void>> waitFailure;
RequestStream<struct BlobGranuleFileRequest> blobGranuleFileRequest;
RequestStream<struct AssignBlobRangeRequest> assignBlobRangeRequest;
RequestStream<struct RevokeBlobRangeRequest> revokeBlobRangeRequest;
RequestStream<struct GetGranuleAssignmentsRequest> granuleAssignmentsRequest;
RequestStream<struct GranuleStatusStreamRequest> granuleStatusStreamRequest;
2021-10-01 23:08:00 +08:00
RequestStream<struct HaltBlobWorkerRequest> haltBlobWorker;
struct LocalityData locality;
UID myId;
BlobWorkerInterface() {}
explicit BlobWorkerInterface(const struct LocalityData& l, UID id) : locality(l), myId(id) {}
Blob integration (#6808) * Fixing leaked stream with explicit notify failed before destructor * better logic to prevent races in change feed fetching * Found new race that makes assert incorrect * handle server overloaded in initial read from fdb * Handling more blob error types in granule retry * Fixing rollback metadata problem, added better debugging * Fixing version race when fetching change feed metadata * Better racing split request handling * fixing assert * Handle change feed popped check in the blob worker * fix: do not use a RYW transaction for a versionstamp because of randomize API version (#6768) * more merge conflict issues * Change feed destroy fixes * Fixing change feed destroy and move race * Check error condition in BG file req * Using relative endpoints for blob worker interface * Fixing bug in previous fix * More destroy and move race fixes * Don't update empty version on destroy in case it gets rolled back. moved() and removing will take care of ensuring it is not read * Bug fix (#6796) * fix: do not use a RYW transaction for a versionstamp because of randomize API version * fix: if the initialSnapshotVersion was pruned, granule history was incorrect * added a way to compress null bytes in printable() * Fixing durability issue with moving and destroying change feeds * Adding fix for not fully deleting files for a granule that child granules need to re-snapshot * More destroy and move races * Fixing change feed destroy and pop races * Renaming bg prune to purge, and adding a C api and unit test for it * more cleanup * review comments * Observability for granule purging * better handling for change feed not registered * Fixed purging bugs (#6815) * fix: do not use a RYW transaction for a versionstamp because of randomize API version * fix: if the initialSnapshotVersion was pruned, granule history was incorrect * added a way to compress null bytes in printable() * fixed a few purging bugs Co-authored-by: Evan Tschannen 
<evan.tschannen@snowflake.com>
2022-04-09 05:15:25 +08:00
void initEndpoints() {
// TODO: specify endpoint priorities?
std::vector<std::pair<FlowReceiver*, TaskPriority>> streams;
streams.push_back(waitFailure.getReceiver());
streams.push_back(blobGranuleFileRequest.getReceiver());
streams.push_back(assignBlobRangeRequest.getReceiver());
streams.push_back(revokeBlobRangeRequest.getReceiver());
streams.push_back(granuleAssignmentsRequest.getReceiver());
streams.push_back(granuleStatusStreamRequest.getReceiver());
streams.push_back(haltBlobWorker.getReceiver());
FlowTransport::transport().addEndpoints(streams);
}
UID id() const { return myId; }
NetworkAddress address() const { return blobGranuleFileRequest.getEndpoint().getPrimaryAddress(); }
NetworkAddress stableAddress() const { return blobGranuleFileRequest.getEndpoint().getStableAddress(); }
bool operator==(const BlobWorkerInterface& r) const { return id() == r.id(); }
bool operator!=(const BlobWorkerInterface& r) const { return !(*this == r); }
std::string toString() const { return id().shortString(); }
template <class Archive>
void serialize(Archive& ar) {
Blob integration (#6808) * Fixing leaked stream with explicit notify failed before destructor * better logic to prevent races in change feed fetching * Found new race that makes assert incorrect * handle server overloaded in initial read from fdb * Handling more blob error types in granule retry * Fixing rollback metadata problem, added better debugging * Fixing version race when fetching change feed metadata * Better racing split request handling * fixing assert * Handle change feed popped check in the blob worker * fix: do not use a RYW transaction for a versionstamp because of randomize API version (#6768) * more merge conflict issues * Change feed destroy fixes * Fixing change feed destroy and move race * Check error condition in BG file req * Using relative endpoints for blob worker interface * Fixing bug in previous fix * More destroy and move race fixes * Don't update empty version on destroy in case it gets rolled back. moved() and removing will take care of ensuring it is not read * Bug fix (#6796) * fix: do not use a RYW transaction for a versionstamp because of randomize API version * fix: if the initialSnapshotVersion was pruned, granule history was incorrect * added a way to compress null bytes in printable() * Fixing durability issue with moving and destroying change feeds * Adding fix for not fully deleting files for a granule that child granules need to re-snapshot * More destroy and move races * Fixing change feed destroy and pop races * Renaming bg prune to purge, and adding a C api and unit test for it * more cleanup * review comments * Observability for granule purging * better handling for change feed not registered * Fixed purging bugs (#6815) * fix: do not use a RYW transaction for a versionstamp because of randomize API version * fix: if the initialSnapshotVersion was pruned, granule history was incorrect * added a way to compress null bytes in printable() * fixed a few purging bugs Co-authored-by: Evan Tschannen 
<evan.tschannen@snowflake.com>
2022-04-09 05:15:25 +08:00
// use adjusted endpoints
serializer(ar, myId, locality, waitFailure);
if (Archive::isDeserializing) {
blobGranuleFileRequest =
RequestStream<struct BlobGranuleFileRequest>(waitFailure.getEndpoint().getAdjustedEndpoint(1));
assignBlobRangeRequest =
RequestStream<struct AssignBlobRangeRequest>(waitFailure.getEndpoint().getAdjustedEndpoint(2));
revokeBlobRangeRequest =
RequestStream<struct RevokeBlobRangeRequest>(waitFailure.getEndpoint().getAdjustedEndpoint(3));
granuleAssignmentsRequest =
RequestStream<struct GetGranuleAssignmentsRequest>(waitFailure.getEndpoint().getAdjustedEndpoint(4));
granuleStatusStreamRequest =
RequestStream<struct GranuleStatusStreamRequest>(waitFailure.getEndpoint().getAdjustedEndpoint(5));
haltBlobWorker =
RequestStream<struct HaltBlobWorkerRequest>(waitFailure.getEndpoint().getAdjustedEndpoint(6));
}
}
};
// Payload delivered through BlobGranuleFileRequest::reply: a list of granule chunks.
struct BlobGranuleFileReply {
    static constexpr FileIdentifier file_identifier = 6858612;

    // NOTE(review): presumably the arena backs the memory referenced by `chunks` — confirm.
    Arena arena;
    VectorRef<BlobGranuleChunkRef> chunks;

    // Wire order: chunks first, arena last.
    template <class Archive>
    void serialize(Archive& ar) {
        serializer(ar,
                   chunks,
                   arena);
    }
};
// TODO could do a reply promise stream of file mutations to bound memory requirements?
// Have to load whole snapshot file into memory though so it doesn't actually matter too much

// Request for a key range between two versions; answered with a BlobGranuleFileReply.
struct BlobGranuleFileRequest {
    static constexpr FileIdentifier file_identifier = 4150141;

    Arena arena;
    KeyRangeRef keyRange;
    Version beginVersion = 0;
    // NOTE(review): unlike its neighbours, readVersion has no default initializer, so the
    // sender must set it before the request is serialized.
    Version readVersion;
    bool canCollapseBegin = true;
    ReplyPromise<BlobGranuleFileReply> reply;

    BlobGranuleFileRequest() {}

    // Wire order: keyRange, beginVersion, readVersion, canCollapseBegin, reply, arena.
    template <class Archive>
    void serialize(Archive& ar) {
        serializer(ar,
                   keyRange,
                   beginVersion,
                   readVersion,
                   canCollapseBegin,
                   reply,
                   arena);
    }
};
// Request carried on BlobWorkerInterface::revokeBlobRangeRequest. It names a key range and
// is stamped with the manager's epoch and sequence number.
struct RevokeBlobRangeRequest {
    static constexpr FileIdentifier file_identifier = 4844288;

    Arena arena;
    KeyRangeRef keyRange;
    int64_t managerEpoch;
    int64_t managerSeqno;
    // NOTE(review): the meaning of `dispose` is not visible in this header — confirm with the worker code.
    bool dispose;
    ReplyPromise<Void> reply;

    // Leaves the scalar members unset; they are filled in by the sender or by deserialization.
    RevokeBlobRangeRequest() {}

    // Wire order: keyRange, managerEpoch, managerSeqno, dispose, reply, arena.
    template <class Archive>
    void serialize(Archive& ar) {
        serializer(ar,
                   keyRange,
                   managerEpoch,
                   managerSeqno,
                   dispose,
                   reply,
                   arena);
    }
};
/*
 * Kind of assignment carried by an AssignBlobRangeRequest.
 *
 * Continue: Blob worker should continue handling a granule that was evaluated for a split
 * Normal: Blob worker should open the granule and start processing it
 *
 * The numeric values are explicit because the enum is passed to serializer(); do not renumber.
 */
enum AssignRequestType { Normal = 0, Continue = 1 };
struct AssignBlobRangeRequest {
constexpr static FileIdentifier file_identifier = 905381;
Arena arena;
KeyRangeRef keyRange;
int64_t managerEpoch;
int64_t managerSeqno;
2021-09-23 01:46:20 +08:00
// If continueAssignment is true, this is just to instruct the worker that it *still* owns the range, so it should
// re-snapshot it and continue.
AssignRequestType type;
ReplyPromise<Void> reply;
AssignBlobRangeRequest() {}
template <class Ar>
void serialize(Ar& ar) {
serializer(ar, keyRange, managerEpoch, managerSeqno, type, reply, arena);
}
};
// reply per granule
// TODO: could eventually add other types of metrics to report back to the manager here

// One element of the reply stream of a GranuleStatusStreamRequest.
struct GranuleStatusReply : public ReplyPromiseStreamReply {
    static constexpr FileIdentifier file_identifier = 7563104;

    KeyRange granuleRange;
    bool doSplit;
    bool writeHotSplit;
    int64_t epoch;
    int64_t seqno;
    UID granuleID;
    Version startVersion;

    // Leaves the scalar members unset; used when the object is about to be deserialized into.
    GranuleStatusReply() {}

    // Member-wise constructor; every argument is copied into the field of the same name
    // (`range` goes to granuleRange).
    explicit GranuleStatusReply(KeyRange range,
                                bool doSplit,
                                bool writeHotSplit,
                                int64_t epoch,
                                int64_t seqno,
                                UID granuleID,
                                Version startVersion)
      : granuleRange(range),
        doSplit(doSplit),
        writeHotSplit(writeHotSplit),
        epoch(epoch),
        seqno(seqno),
        granuleID(granuleID),
        startVersion(startVersion) {}

    // Size of the struct itself plus whatever granuleRange reports for its own contents.
    int expectedSize() const {
        return sizeof(*this) + granuleRange.expectedSize();
    }

    // The two ReplyPromiseStreamReply base fields go first, followed by this struct's own fields.
    template <class Archive>
    void serialize(Archive& ar) {
        serializer(ar,
                   ReplyPromiseStreamReply::acknowledgeToken,
                   ReplyPromiseStreamReply::sequence,
                   granuleRange,
                   doSplit,
                   writeHotSplit,
                   epoch,
                   seqno,
                   granuleID,
                   startVersion);
    }
};
// manager makes one request per worker, it sends all range updates through this stream
//
// The worker answers with a stream of GranuleStatusReply values.
struct GranuleStatusStreamRequest {
    static constexpr FileIdentifier file_identifier = 2289677;

    int64_t managerEpoch;
    ReplyPromiseStream<GranuleStatusReply> reply;

    // Leaves managerEpoch unset; used when the object is about to be deserialized into.
    GranuleStatusStreamRequest() {}

    explicit GranuleStatusStreamRequest(int64_t managerEpoch)
      : managerEpoch(managerEpoch) {}

    // Wire order: managerEpoch, reply.
    template <class Archive>
    void serialize(Archive& ar) {
        serializer(ar,
                   managerEpoch,
                   reply);
    }
};
2021-10-01 23:08:00 +08:00
struct HaltBlobWorkerRequest {
constexpr static FileIdentifier file_identifier = 1985879;
UID requesterID;
ReplyPromise<Void> reply;
int64_t managerEpoch;
HaltBlobWorkerRequest() {}
explicit HaltBlobWorkerRequest(int64_t managerEpoch, UID uid) : requesterID(uid), managerEpoch(managerEpoch) {}
template <class Ar>
void serialize(Ar& ar) {
serializer(ar, managerEpoch, requesterID, reply);
}
};
// One entry of GetGranuleAssignmentsReply::assignments: a key range together with the
// epoch and sequence number it was assigned under.
struct GranuleAssignmentRef {
    KeyRangeRef range;
    int64_t epochAssigned;
    int64_t seqnoAssigned;

    // Leaves the two integers unset; used when the object is about to be deserialized into.
    GranuleAssignmentRef() {}

    explicit GranuleAssignmentRef(KeyRangeRef range, int64_t epochAssigned, int64_t seqnoAssigned)
      : range(range),
        epochAssigned(epochAssigned),
        seqnoAssigned(seqnoAssigned) {}

    // Wire order: range, epochAssigned, seqnoAssigned.
    template <class Archive>
    void serialize(Archive& ar) {
        serializer(ar,
                   range,
                   epochAssigned,
                   seqnoAssigned);
    }
};
// Payload delivered through GetGranuleAssignmentsRequest::reply: a list of granule assignments.
struct GetGranuleAssignmentsReply {
    static constexpr FileIdentifier file_identifier = 9191718;

    // NOTE(review): presumably the arena backs the memory referenced by `assignments` — confirm.
    Arena arena;
    VectorRef<GranuleAssignmentRef> assignments;

    // Wire order: assignments first, arena last.
    template <class Archive>
    void serialize(Archive& ar) {
        serializer(ar,
                   assignments,
                   arena);
    }
};
// Request carried on BlobWorkerInterface::granuleAssignmentsRequest; answered with a
// GetGranuleAssignmentsReply.
struct GetGranuleAssignmentsRequest {
    static constexpr FileIdentifier file_identifier = 4121494;

    // No constructor is declared, so the sender must set managerEpoch explicitly.
    int64_t managerEpoch;
    ReplyPromise<GetGranuleAssignmentsReply> reply;

    // Wire order: managerEpoch, reply.
    template <class Archive>
    void serialize(Archive& ar) {
        serializer(ar,
                   managerEpoch,
                   reply);
    }
};
#endif