mako: add cpu usage statistics, including some refactoring of statistics accumulation

This commit is contained in:
Christian Wende 2023-01-20 11:14:36 +01:00
parent df0999bee2
commit 7d1e8e10f0
4 changed files with 297 additions and 135 deletions

View File

@ -41,7 +41,7 @@ struct ResumableStateForPopulate : std::enable_shared_from_this<ResumableStateFo
fdb::Transaction tx; fdb::Transaction tx;
boost::asio::io_context& io_context; boost::asio::io_context& io_context;
Arguments const& args; Arguments const& args;
ThreadStatistics& stats; WorkerStatistics& stats;
std::atomic<int>& stopcount; std::atomic<int>& stopcount;
int key_begin; int key_begin;
int key_end; int key_end;
@ -57,7 +57,7 @@ struct ResumableStateForPopulate : std::enable_shared_from_this<ResumableStateFo
fdb::Transaction tx, fdb::Transaction tx,
boost::asio::io_context& io_context, boost::asio::io_context& io_context,
Arguments const& args, Arguments const& args,
ThreadStatistics& stats, WorkerStatistics& stats,
std::atomic<int>& stopcount, std::atomic<int>& stopcount,
int key_begin, int key_begin,
int key_end) int key_end)
@ -79,7 +79,7 @@ struct ResumableStateForRunWorkload : std::enable_shared_from_this<ResumableStat
fdb::Transaction tx; fdb::Transaction tx;
boost::asio::io_context& io_context; boost::asio::io_context& io_context;
Arguments const& args; Arguments const& args;
ThreadStatistics& stats; WorkerStatistics& stats;
int64_t total_xacts; int64_t total_xacts;
std::atomic<int>& stopcount; std::atomic<int>& stopcount;
std::atomic<int> const& signal; std::atomic<int> const& signal;
@ -99,7 +99,7 @@ struct ResumableStateForRunWorkload : std::enable_shared_from_this<ResumableStat
fdb::Transaction tx, fdb::Transaction tx,
boost::asio::io_context& io_context, boost::asio::io_context& io_context,
Arguments const& args, Arguments const& args,
ThreadStatistics& stats, WorkerStatistics& stats,
std::atomic<int>& stopcount, std::atomic<int>& stopcount,
std::atomic<int> const& signal, std::atomic<int> const& signal,
int max_iters, int max_iters,

View File

@ -67,13 +67,14 @@
#include "time.hpp" #include "time.hpp"
#include "rapidjson/document.h" #include "rapidjson/document.h"
#include "rapidjson/error/en.h" #include "rapidjson/error/en.h"
#include "flow/Platform.h"
namespace mako { namespace mako {
/* args for threads */ /* args for threads */
struct alignas(64) ThreadArgs { struct alignas(64) ThreadArgs {
int worker_id; int process_idx;
int thread_id; int thread_idx;
int active_tenants; int active_tenants;
int total_tenants; int total_tenants;
pid_t parent_id; pid_t parent_id;
@ -116,7 +117,7 @@ Transaction createNewTransaction(Database db, Arguments const& args, int id = -1
tr.setOption(FDB_TR_OPTION_AUTHORIZATION_TOKEN, token_map_iter->second); tr.setOption(FDB_TR_OPTION_AUTHORIZATION_TOKEN, token_map_iter->second);
} else { } else {
logr.error("could not find token for tenant '{}'", tenant_name); logr.error("could not find token for tenant '{}'", tenant_name);
exit(1); _exit(1);
} }
} }
return tr; return tr;
@ -179,10 +180,10 @@ int cleanupNormalKeyspace(Database db, Arguments const& args) {
} }
/* populate database */ /* populate database */
int populate(Database db, const ThreadArgs& thread_args, int thread_tps, ThreadStatistics& stats) { int populate(Database db, const ThreadArgs& thread_args, int thread_tps, WorkerStatistics& stats) {
Arguments const& args = *thread_args.args; Arguments const& args = *thread_args.args;
const auto worker_id = thread_args.worker_id; const auto process_idx = thread_args.process_idx;
const auto thread_id = thread_args.thread_id; const auto thread_idx = thread_args.thread_idx;
auto xacts = 0; auto xacts = 0;
auto keystr = ByteString{}; auto keystr = ByteString{};
auto valstr = ByteString{}; auto valstr = ByteString{};
@ -204,8 +205,8 @@ int populate(Database db, const ThreadArgs& thread_args, int thread_tps, ThreadS
// Each tenant should have the same range populated // Each tenant should have the same range populated
for (auto t_id = 0; t_id < populate_iters; ++t_id) { for (auto t_id = 0; t_id < populate_iters; ++t_id) {
Transaction tx = createNewTransaction(db, args, t_id, args.active_tenants > 0 ? tenants : nullptr); Transaction tx = createNewTransaction(db, args, t_id, args.active_tenants > 0 ? tenants : nullptr);
const auto key_begin = insertBegin(args.rows, worker_id, thread_id, args.num_processes, args.num_threads); const auto key_begin = insertBegin(args.rows, process_idx, thread_idx, args.num_processes, args.num_threads);
const auto key_end = insertEnd(args.rows, worker_id, thread_id, args.num_processes, args.num_threads); const auto key_end = insertEnd(args.rows, process_idx, thread_idx, args.num_processes, args.num_threads);
auto key_checkpoint = key_begin; // in case of commit failure, restart from this key auto key_checkpoint = key_begin; // in case of commit failure, restart from this key
double required_keys = (key_end - key_begin + 1) * args.load_factor; double required_keys = (key_end - key_begin + 1) * args.load_factor;
for (auto i = key_begin; i <= key_end; i++) { for (auto i = key_begin; i <= key_end; i++) {
@ -291,7 +292,7 @@ int populate(Database db, const ThreadArgs& thread_args, int thread_tps, ThreadS
return 0; return 0;
} }
void updateErrorStatsRunMode(ThreadStatistics& stats, fdb::Error err, int op) { void updateErrorStatsRunMode(WorkerStatistics& stats, fdb::Error err, int op) {
if (err) { if (err) {
if (err.is(1020 /*not_commited*/)) { if (err.is(1020 /*not_commited*/)) {
stats.incrConflictCount(); stats.incrConflictCount();
@ -306,7 +307,7 @@ void updateErrorStatsRunMode(ThreadStatistics& stats, fdb::Error err, int op) {
/* run one iteration of configured transaction */ /* run one iteration of configured transaction */
int runOneTransaction(Transaction& tx, int runOneTransaction(Transaction& tx,
Arguments const& args, Arguments const& args,
ThreadStatistics& stats, WorkerStatistics& stats,
ByteString& key1, ByteString& key1,
ByteString& key2, ByteString& key2,
ByteString& val) { ByteString& val) {
@ -411,7 +412,7 @@ int runWorkload(Database db,
std::atomic<double> const& throttle_factor, std::atomic<double> const& throttle_factor,
int const thread_iters, int const thread_iters,
std::atomic<int> const& signal, std::atomic<int> const& signal,
ThreadStatistics& stats, WorkerStatistics& stats,
int const dotrace, int const dotrace,
int const dotagging) { int const dotagging) {
auto traceid = std::string{}; auto traceid = std::string{};
@ -528,20 +529,20 @@ int runWorkload(Database db,
return rc; return rc;
} }
std::string getStatsFilename(std::string_view dirname, int worker_id, int thread_id, int op) { std::string getStatsFilename(std::string_view dirname, int process_idx, int thread_id, int op) {
return fmt::format("{}/{}_{}_{}", dirname, worker_id + 1, thread_id + 1, opTable[op].name()); return fmt::format("{}/{}_{}_{}", dirname, process_idx + 1, thread_id + 1, opTable[op].name());
} }
std::string getStatsFilename(std::string_view dirname, int worker_id, int thread_id) { std::string getStatsFilename(std::string_view dirname, int process_idx, int thread_id) {
return fmt::format("{}/{}_{}", dirname, worker_id + 1, thread_id + 1); return fmt::format("{}/{}_{}", dirname, process_idx + 1, thread_id + 1);
} }
void dumpThreadSamples(Arguments const& args, void dumpThreadSamples(Arguments const& args,
pid_t parent_id, pid_t parent_id,
int worker_id, int process_idx,
int thread_id, int thread_id,
const ThreadStatistics& stats, const WorkerStatistics& stats,
bool overwrite = true) { bool overwrite = true) {
const auto dirname = fmt::format("{}{}", TEMP_DATA_STORE, parent_id); const auto dirname = fmt::format("{}{}", TEMP_DATA_STORE, parent_id);
const auto rc = mkdir(dirname.c_str(), S_IRWXU | S_IRWXG | S_IROTH | S_IXOTH); const auto rc = mkdir(dirname.c_str(), S_IRWXU | S_IRWXG | S_IROTH | S_IXOTH);
@ -551,21 +552,21 @@ void dumpThreadSamples(Arguments const& args,
} }
for (auto op = 0; op < MAX_OP; op++) { for (auto op = 0; op < MAX_OP; op++) {
if (args.txnspec.ops[op][OP_COUNT] > 0 || isAbstractOp(op)) { if (args.txnspec.ops[op][OP_COUNT] > 0 || isAbstractOp(op)) {
stats.writeToFile(getStatsFilename(dirname, worker_id, thread_id, op), op); stats.writeToFile(getStatsFilename(dirname, process_idx, thread_id, op), op);
} }
} }
} }
void runAsyncWorkload(Arguments const& args, void runAsyncWorkload(Arguments const& args,
pid_t pid_main, pid_t pid_main,
int worker_id, int process_idx,
shared_memory::Access shm, shared_memory::Access shm,
boost::asio::io_context& io_context, boost::asio::io_context& io_context,
std::vector<Database>& databases) { std::vector<Database>& databases) {
auto dump_samples = [&args, pid_main, worker_id](auto&& states) { auto dump_samples = [&args, pid_main, process_idx](auto&& states) {
auto overwrite = true; /* overwrite or append */ auto overwrite = true; /* overwrite or append */
for (const auto& state : states) { for (const auto& state : states) {
dumpThreadSamples(args, pid_main, worker_id, 0 /*thread_id*/, state->stats, overwrite); dumpThreadSamples(args, pid_main, process_idx, 0 /*thread_id*/, state->stats, overwrite);
overwrite = false; overwrite = false;
} }
}; };
@ -573,16 +574,16 @@ void runAsyncWorkload(Arguments const& args,
if (args.mode == MODE_BUILD) { if (args.mode == MODE_BUILD) {
auto states = std::vector<PopulateStateHandle>(args.async_xacts); auto states = std::vector<PopulateStateHandle>(args.async_xacts);
for (auto i = 0; i < args.async_xacts; i++) { for (auto i = 0; i < args.async_xacts; i++) {
const auto key_begin = insertBegin(args.rows, worker_id, i, args.num_processes, args.async_xacts); const auto key_begin = insertBegin(args.rows, process_idx, i, args.num_processes, args.async_xacts);
const auto key_end = insertEnd(args.rows, worker_id, i, args.num_processes, args.async_xacts); const auto key_end = insertEnd(args.rows, process_idx, i, args.num_processes, args.async_xacts);
auto db = databases[i % args.num_databases]; auto db = databases[i % args.num_databases];
auto state = auto state =
std::make_shared<ResumableStateForPopulate>(Logger(WorkerProcess{}, args.verbose, worker_id, i), std::make_shared<ResumableStateForPopulate>(Logger(WorkerProcess{}, args.verbose, process_idx, i),
db, db,
createNewTransaction(db, args), createNewTransaction(db, args),
io_context, io_context,
args, args,
shm.statsSlot(worker_id, i), shm.workerStatsSlot(process_idx, i),
stopcount, stopcount,
key_begin, key_begin,
key_end); key_end);
@ -605,17 +606,17 @@ void runAsyncWorkload(Arguments const& args,
const auto max_iters = const auto max_iters =
args.iteration == 0 args.iteration == 0
? -1 ? -1
: computeThreadIters(args.iteration, worker_id, i, args.num_processes, args.async_xacts); : computeThreadIters(args.iteration, process_idx, i, args.num_processes, args.async_xacts);
// argument validation should ensure max_iters > 0 // argument validation should ensure max_iters > 0
assert(args.iteration == 0 || max_iters > 0); assert(args.iteration == 0 || max_iters > 0);
auto state = auto state =
std::make_shared<ResumableStateForRunWorkload>(Logger(WorkerProcess{}, args.verbose, worker_id, i), std::make_shared<ResumableStateForRunWorkload>(Logger(WorkerProcess{}, args.verbose, process_idx, i),
db, db,
createNewTransaction(db, args), createNewTransaction(db, args),
io_context, io_context,
args, args,
shm.statsSlot(worker_id, i), shm.workerStatsSlot(process_idx, i),
stopcount, stopcount,
shm.headerConst().signal, shm.headerConst().signal,
max_iters, max_iters,
@ -637,32 +638,34 @@ void runAsyncWorkload(Arguments const& args,
/* mako worker thread */ /* mako worker thread */
void workerThread(const ThreadArgs& thread_args) { void workerThread(const ThreadArgs& thread_args) {
auto time_start = steady_clock::now();
const auto& args = *thread_args.args; const auto& args = *thread_args.args;
const auto parent_id = thread_args.parent_id; const auto parent_id = thread_args.parent_id;
const auto worker_id = thread_args.worker_id; const auto process_idx = thread_args.process_idx;
const auto thread_id = thread_args.thread_id; const auto thread_idx = thread_args.thread_idx;
const auto dotrace = (worker_id == 0 && thread_id == 0 && args.txntrace) ? args.txntrace : 0; const auto dotrace = (process_idx == 0 && thread_idx == 0 && args.txntrace) ? args.txntrace : 0;
auto database = thread_args.database; auto database = thread_args.database;
const auto dotagging = args.txntagging; const auto dotagging = args.txntagging;
const auto& signal = thread_args.shm.headerConst().signal; const auto& signal = thread_args.shm.headerConst().signal;
const auto& throttle_factor = thread_args.shm.headerConst().throttle_factor; const auto& throttle_factor = thread_args.shm.headerConst().throttle_factor;
auto& readycount = thread_args.shm.header().readycount; auto& readycount = thread_args.shm.header().readycount;
auto& stopcount = thread_args.shm.header().stopcount; auto& stopcount = thread_args.shm.header().stopcount;
auto& stats = thread_args.shm.statsSlot(worker_id, thread_id); auto& stats = thread_args.shm.workerStatsSlot(process_idx, thread_idx);
logr = Logger(WorkerProcess{}, args.verbose, worker_id, thread_id); logr = Logger(WorkerProcess{}, args.verbose, process_idx, thread_idx);
logr.debug("started, tid: {}", reinterpret_cast<uint64_t>(pthread_self())); logr.debug("started, tid: {}", reinterpret_cast<uint64_t>(pthread_self()));
const auto thread_tps = const auto thread_tps =
args.tpsmax == 0 ? 0 args.tpsmax == 0 ? 0
: computeThreadTps(args.tpsmax, worker_id, thread_id, args.num_processes, args.num_threads); : computeThreadTps(args.tpsmax, process_idx, thread_idx, args.num_processes, args.num_threads);
// argument validation should ensure thread_tps > 0 // argument validation should ensure thread_tps > 0
assert(args.tpsmax == 0 || thread_tps > 0); assert(args.tpsmax == 0 || thread_tps > 0);
const auto thread_iters = const auto thread_iters =
args.iteration == 0 args.iteration == 0
? -1 ? -1
: computeThreadIters(args.iteration, worker_id, thread_id, args.num_processes, args.num_threads); : computeThreadIters(args.iteration, process_idx, thread_idx, args.num_processes, args.num_threads);
// argument validation should ensure thread_iters > 0 // argument validation should ensure thread_iters > 0
assert(args.iteration == 0 || thread_iters > 0); assert(args.iteration == 0 || thread_iters > 0);
@ -692,12 +695,15 @@ void workerThread(const ThreadArgs& thread_args) {
} }
if (args.mode == MODE_BUILD || args.mode == MODE_RUN) { if (args.mode == MODE_BUILD || args.mode == MODE_RUN) {
dumpThreadSamples(args, parent_id, worker_id, thread_id, stats); dumpThreadSamples(args, parent_id, process_idx, thread_idx, stats);
} }
thread_args.shm.threadStatsSlot(process_idx, thread_idx)
.setCPUUtilization(getProcessorTimeThread() / toDoubleSeconds(steady_clock::now() - time_start) * 100.);
} }
/* mako worker process */ /* mako worker process */
int workerProcessMain(Arguments const& args, int worker_id, shared_memory::Access shm, pid_t pid_main) { int workerProcessMain(Arguments const& args, int process_idx, shared_memory::Access shm, pid_t pid_main) {
logr.debug("started"); logr.debug("started");
auto err = Error{}; auto err = Error{};
@ -712,12 +718,18 @@ int workerProcessMain(Arguments const& args, int worker_id, shared_memory::Acces
/* Each worker process will have its own network thread */ /* Each worker process will have its own network thread */
logr.debug("creating network thread"); logr.debug("creating network thread");
auto network_thread = std::thread([parent_logr = logr]() { auto network_thread = std::thread([parent_logr = logr, process_idx, shm]() {
auto time_start = steady_clock::now();
logr = parent_logr; logr = parent_logr;
logr.debug("network thread started"); logr.debug("network thread started");
if (auto err = network::run()) { if (auto err = network::run()) {
logr.error("network::run(): {}", err.what()); logr.error("network::run(): {}", err.what());
} }
shm.processStatsSlot(process_idx)
.setFDBNetworkCPUUtilization(getProcessorTimeThread() / toDoubleSeconds(steady_clock::now() - time_start) *
100.);
}); });
#if defined(__linux__) #if defined(__linux__)
pthread_setname_np(network_thread.native_handle(), "mako_network"); pthread_setname_np(network_thread.native_handle(), "mako_network");
@ -762,8 +774,8 @@ int workerProcessMain(Arguments const& args, int worker_id, shared_memory::Acces
for (auto i = 0; i < args.num_threads; i++) { for (auto i = 0; i < args.num_threads; i++) {
auto& this_args = thread_args[i]; auto& this_args = thread_args[i];
this_args.worker_id = worker_id; this_args.process_idx = process_idx;
this_args.thread_id = i; this_args.thread_idx = i;
this_args.parent_id = pid_main; this_args.parent_id = pid_main;
this_args.active_tenants = args.active_tenants; this_args.active_tenants = args.active_tenants;
this_args.total_tenants = args.total_tenants; this_args.total_tenants = args.total_tenants;
@ -788,11 +800,17 @@ int workerProcessMain(Arguments const& args, int worker_id, shared_memory::Acces
auto wg = WorkGuard(ctx.get_executor()); auto wg = WorkGuard(ctx.get_executor());
auto worker_threads = std::vector<std::thread>(args.num_threads); auto worker_threads = std::vector<std::thread>(args.num_threads);
for (auto i = 0; i < args.num_threads; i++) { for (auto i = 0; i < args.num_threads; i++) {
worker_threads[i] = std::thread([&ctx, &args, worker_id, i]() { worker_threads[i] = std::thread([&ctx, &args, process_idx, i, shm]() {
logr = Logger(WorkerProcess{}, args.verbose, worker_id); auto time_start = steady_clock::now();
logr = Logger(WorkerProcess{}, args.verbose, process_idx);
logr.debug("Async-mode worker thread {} started", i + 1); logr.debug("Async-mode worker thread {} started", i + 1);
ctx.run(); ctx.run();
logr.debug("Async-mode worker thread {} finished", i + 1); logr.debug("Async-mode worker thread {} finished", i + 1);
shm.threadStatsSlot(process_idx, i)
.setCPUUtilization(getProcessorTimeThread() / toDoubleSeconds(steady_clock::now() - time_start) *
100.);
}); });
#if defined(__linux__) #if defined(__linux__)
const auto thread_name = "mako_worker_" + std::to_string(i); const auto thread_name = "mako_worker_" + std::to_string(i);
@ -800,7 +818,7 @@ int workerProcessMain(Arguments const& args, int worker_id, shared_memory::Acces
#endif #endif
} }
shm.header().readycount.fetch_add(args.num_threads); shm.header().readycount.fetch_add(args.num_threads);
runAsyncWorkload(args, pid_main, worker_id, shm, ctx, databases); runAsyncWorkload(args, pid_main, process_idx, shm, ctx, databases);
wg.reset(); wg.reset();
for (auto& thread : worker_threads) for (auto& thread : worker_threads)
thread.join(); thread.join();
@ -1387,7 +1405,7 @@ int parseArguments(int argc, char* argv[], Arguments& args) {
break; break;
case ARG_VERSION: case ARG_VERSION:
logr.error("Version: {}", FDB_API_VERSION); logr.error("Version: {}", FDB_API_VERSION);
exit(0); _exit(0);
break; break;
case ARG_COMMITGET: case ARG_COMMITGET:
args.commit_get = 1; args.commit_get = 1;
@ -1452,7 +1470,7 @@ int parseArguments(int argc, char* argv[], Arguments& args) {
case ARG_TXNTAGGINGPREFIX: case ARG_TXNTAGGINGPREFIX:
if (strlen(optarg) > TAGPREFIXLENGTH_MAX) { if (strlen(optarg) > TAGPREFIXLENGTH_MAX) {
logr.error("the length of txntagging_prefix is larger than {}", TAGPREFIXLENGTH_MAX); logr.error("the length of txntagging_prefix is larger than {}", TAGPREFIXLENGTH_MAX);
exit(0); _exit(0);
} }
memcpy(args.txntagging_prefix, optarg, strlen(optarg)); memcpy(args.txntagging_prefix, optarg, strlen(optarg));
break; break;
@ -1698,15 +1716,13 @@ void Arguments::generateAuthorizationTokens() {
logr.info("generated {} tokens in {:6.3f} seconds", active_tenants, toDoubleSeconds(stopwatch.stop().diff())); logr.info("generated {} tokens in {:6.3f} seconds", active_tenants, toDoubleSeconds(stopwatch.stop().diff()));
} }
void printStats(Arguments const& args, ThreadStatistics const* stats, double const duration_sec, FILE* fp) { void printStats(Arguments const& args, WorkerStatistics const* stats, double const duration_sec, FILE* fp) {
static ThreadStatistics prev; static WorkerStatistics prev;
const auto num_effective_threads = args.async_xacts > 0 ? args.async_xacts : args.num_threads; const auto num_workers = args.async_xacts > 0 ? args.async_xacts : args.num_threads;
auto current = ThreadStatistics{}; auto current = WorkerStatistics{};
for (auto i = 0; i < args.num_processes; i++) { for (auto i = 0; i < args.num_processes * num_workers; i++) {
for (auto j = 0; j < num_effective_threads; j++) { current.combine(stats[i]);
current.combine(stats[(i * num_effective_threads) + j]);
}
} }
if (fp) { if (fp) {
@ -1803,7 +1819,7 @@ void printStatsHeader(Arguments const& args, bool show_commit, bool is_first_hea
fmt::print("\n"); fmt::print("\n");
} }
void printThreadStats(ThreadStatistics& final_stats, Arguments args, FILE* fp, bool is_report = false) { void printWorkerStats(WorkerStatistics& final_stats, Arguments args, FILE* fp, bool is_report = false) {
if (is_report) { if (is_report) {
for (auto op = 0; op < MAX_OP; op++) { for (auto op = 0; op < MAX_OP; op++) {
@ -2046,18 +2062,26 @@ void loadSample(int pid_main, int op, std::vector<DDSketchMako>& data_points, in
} }
void printReport(Arguments const& args, void printReport(Arguments const& args,
ThreadStatistics const* stats, WorkerStatistics const* worker_stats,
ThreadStatistics const* thread_stats,
ProcessStatistics const* process_stats,
double const duration_sec, double const duration_sec,
pid_t pid_main, pid_t pid_main,
FILE* fp) { FILE* fp) {
auto final_stats = ThreadStatistics{}; auto final_worker_stats = WorkerStatistics{};
const auto num_effective_threads = args.async_xacts > 0 ? args.async_xacts : args.num_threads; auto final_thread_stats = ThreadStatistics{};
auto final_process_stats = ProcessStatistics{};
const auto num_workers = args.async_xacts > 0 ? args.async_xacts : args.num_threads;
for (auto i = 0; i < args.num_processes * num_workers; i++) {
final_worker_stats.combine(worker_stats[i]);
}
for (auto i = 0; i < args.num_processes * args.num_threads; i++) {
final_thread_stats.combine(thread_stats[i]);
}
for (auto i = 0; i < args.num_processes; i++) { for (auto i = 0; i < args.num_processes; i++) {
for (auto j = 0; j < num_effective_threads; j++) { final_process_stats.combine(process_stats[i]);
const auto idx = i * num_effective_threads + j;
final_stats.combine(stats[idx]);
}
} }
/* overall stats */ /* overall stats */
@ -2084,13 +2108,21 @@ void printReport(Arguments const& args,
break; break;
} }
} }
const auto tps_f = final_stats.getOpCount(OP_TRANSACTION) / duration_sec; const auto tps_f = final_worker_stats.getOpCount(OP_TRANSACTION) / duration_sec;
const auto tps_i = static_cast<uint64_t>(tps_f); const auto tps_i = static_cast<uint64_t>(tps_f);
fmt::printf("Total Xacts: %8lu\n", final_stats.getOpCount(OP_TRANSACTION)); const auto cpu_external_network = final_process_stats.getTotalCPUUtilization() -
fmt::printf("Total Conflicts: %8lu\n", final_stats.getConflictCount()); final_thread_stats.getCPUUtilization() -
fmt::printf("Total Errors: %8lu\n", final_stats.getTotalErrorCount()); final_process_stats.getFDBNetworkCPUUtilization();
fmt::printf("Total Timeouts: %8lu\n", final_stats.getTotalTimeoutCount());
fmt::printf("Total Xacts: %8lu\n", final_worker_stats.getOpCount(OP_TRANSACTION));
fmt::printf("Total Conflicts: %8lu\n", final_worker_stats.getConflictCount());
fmt::printf("Total Errors: %8lu\n", final_worker_stats.getTotalErrorCount());
fmt::printf("Total Timeouts: %8lu\n", final_worker_stats.getTotalTimeoutCount());
fmt::printf("Overall TPS: %8lu\n\n", tps_i); fmt::printf("Overall TPS: %8lu\n\n", tps_i);
fmt::printf("%%CPU Worker Processes: %6.2f \n", final_process_stats.getTotalCPUUtilization());
fmt::printf("%%CPU Worker Threads: %6.2f \n", final_thread_stats.getCPUUtilization());
fmt::printf("%%CPU Local Network Threads: %6.2f \n", final_process_stats.getFDBNetworkCPUUtilization());
fmt::printf("%%CPU External Network Threads: %6.2f \n\n", cpu_external_network);
if (fp) { if (fp) {
fmt::fprintf(fp, "\"results\": {"); fmt::fprintf(fp, "\"results\": {");
@ -2099,11 +2131,15 @@ void printReport(Arguments const& args,
fmt::fprintf(fp, "\"totalThreads\": %d,", args.num_threads); fmt::fprintf(fp, "\"totalThreads\": %d,", args.num_threads);
fmt::fprintf(fp, "\"totalAsyncXacts\": %d,", args.async_xacts); fmt::fprintf(fp, "\"totalAsyncXacts\": %d,", args.async_xacts);
fmt::fprintf(fp, "\"targetTPS\": %d,", args.tpsmax); fmt::fprintf(fp, "\"targetTPS\": %d,", args.tpsmax);
fmt::fprintf(fp, "\"totalXacts\": %lu,", final_stats.getOpCount(OP_TRANSACTION)); fmt::fprintf(fp, "\"totalXacts\": %lu,", final_worker_stats.getOpCount(OP_TRANSACTION));
fmt::fprintf(fp, "\"totalConflicts\": %lu,", final_stats.getConflictCount()); fmt::fprintf(fp, "\"totalConflicts\": %lu,", final_worker_stats.getConflictCount());
fmt::fprintf(fp, "\"totalErrors\": %lu,", final_stats.getTotalErrorCount()); fmt::fprintf(fp, "\"totalErrors\": %lu,", final_worker_stats.getTotalErrorCount());
fmt::fprintf(fp, "\"totalTimeouts\": %lu,", final_stats.getTotalTimeoutCount()); fmt::fprintf(fp, "\"totalTimeouts\": %lu,", final_worker_stats.getTotalTimeoutCount());
fmt::fprintf(fp, "\"overallTPS\": %lu,", tps_i); fmt::fprintf(fp, "\"overallTPS\": %lu,", tps_i);
fmt::fprintf(fp, "\"workerProcesseCPU\": %.8f,", final_process_stats.getTotalCPUUtilization());
fmt::fprintf(fp, "\"workerThreadCPU\": %.8f,", final_thread_stats.getCPUUtilization());
fmt::fprintf(fp, "\"localNetworkCPU\": %.8f,", final_process_stats.getFDBNetworkCPUUtilization());
fmt::fprintf(fp, "\"externalNetworkCPU\": %.8f,", cpu_external_network);
} }
/* per-op stats */ /* per-op stats */
@ -2117,24 +2153,24 @@ void printReport(Arguments const& args,
auto first_op = true; auto first_op = true;
for (auto op = 0; op < MAX_OP; op++) { for (auto op = 0; op < MAX_OP; op++) {
if ((args.txnspec.ops[op][OP_COUNT] > 0 && op != OP_TRANSACTION) || op == OP_COMMIT) { if ((args.txnspec.ops[op][OP_COUNT] > 0 && op != OP_TRANSACTION) || op == OP_COMMIT) {
putField(final_stats.getOpCount(op)); putField(final_worker_stats.getOpCount(op));
if (fp) { if (fp) {
if (first_op) { if (first_op) {
first_op = false; first_op = false;
} else { } else {
fmt::fprintf(fp, ","); fmt::fprintf(fp, ",");
} }
fmt::fprintf(fp, "\"%s\": %lu", getOpName(op), final_stats.getOpCount(op)); fmt::fprintf(fp, "\"%s\": %lu", getOpName(op), final_worker_stats.getOpCount(op));
} }
} }
} }
/* TPS */ /* TPS */
const auto tps = final_stats.getOpCount(OP_TRANSACTION) / duration_sec; const auto tps = final_worker_stats.getOpCount(OP_TRANSACTION) / duration_sec;
putFieldFloat(tps, 2); putFieldFloat(tps, 2);
/* Conflicts */ /* Conflicts */
const auto conflicts_rate = final_stats.getConflictCount() / duration_sec; const auto conflicts_rate = final_worker_stats.getConflictCount() / duration_sec;
putFieldFloat(conflicts_rate, 2); putFieldFloat(conflicts_rate, 2);
fmt::print("\n"); fmt::print("\n");
@ -2147,14 +2183,14 @@ void printReport(Arguments const& args,
first_op = true; first_op = true;
for (auto op = 0; op < MAX_OP; op++) { for (auto op = 0; op < MAX_OP; op++) {
if ((args.txnspec.ops[op][OP_COUNT] > 0 && op != OP_TRANSACTION) || op == OP_COMMIT) { if ((args.txnspec.ops[op][OP_COUNT] > 0 && op != OP_TRANSACTION) || op == OP_COMMIT) {
putField(final_stats.getErrorCount(op)); putField(final_worker_stats.getErrorCount(op));
if (fp) { if (fp) {
if (first_op) { if (first_op) {
first_op = false; first_op = false;
} else { } else {
fmt::fprintf(fp, ","); fmt::fprintf(fp, ",");
} }
fmt::fprintf(fp, "\"%s\": %lu", getOpName(op), final_stats.getErrorCount(op)); fmt::fprintf(fp, "\"%s\": %lu", getOpName(op), final_worker_stats.getErrorCount(op));
} }
} }
} }
@ -2168,14 +2204,14 @@ void printReport(Arguments const& args,
first_op = true; first_op = true;
for (auto op = 0; op < MAX_OP; op++) { for (auto op = 0; op < MAX_OP; op++) {
if ((args.txnspec.ops[op][OP_COUNT] > 0 && op != OP_TRANSACTION) || op == OP_COMMIT) { if ((args.txnspec.ops[op][OP_COUNT] > 0 && op != OP_TRANSACTION) || op == OP_COMMIT) {
putField(final_stats.getTimeoutCount(op)); putField(final_worker_stats.getTimeoutCount(op));
if (fp) { if (fp) {
if (first_op) { if (first_op) {
first_op = false; first_op = false;
} else { } else {
fmt::fprintf(fp, ","); fmt::fprintf(fp, ",");
} }
fmt::fprintf(fp, "\"%s\": %lu", getOpName(op), final_stats.getTimeoutCount(op)); fmt::fprintf(fp, "\"%s\": %lu", getOpName(op), final_worker_stats.getTimeoutCount(op));
} }
} }
} }
@ -2200,14 +2236,14 @@ void printReport(Arguments const& args,
} }
} }
} }
final_stats.updateLatencies(data_points); final_worker_stats.updateLatencies(data_points);
printThreadStats(final_stats, args, fp); printWorkerStats(final_worker_stats, args, fp);
// export the ddsketch if the flag was set // export the ddsketch if the flag was set
if (args.stats_export_path[0] != 0) { if (args.stats_export_path[0] != 0) {
std::ofstream f(args.stats_export_path); std::ofstream f(args.stats_export_path);
f << final_stats; f << final_worker_stats;
} }
const auto command_remove = fmt::format("rm -rf {}{}", TEMP_DATA_STORE, pid_main); const auto command_remove = fmt::format("rm -rf {}{}", TEMP_DATA_STORE, pid_main);
@ -2218,7 +2254,9 @@ void printReport(Arguments const& args,
} }
int statsProcessMain(Arguments const& args, int statsProcessMain(Arguments const& args,
ThreadStatistics const* stats, WorkerStatistics const* worker_stats,
ThreadStatistics const* thread_stats,
ProcessStatistics const* process_stats,
std::atomic<double>& throttle_factor, std::atomic<double>& throttle_factor,
std::atomic<int> const& signal, std::atomic<int> const& signal,
std::atomic<int> const& stopcount, std::atomic<int> const& stopcount,
@ -2327,7 +2365,7 @@ int statsProcessMain(Arguments const& args,
if (fp) if (fp)
fmt::fprintf(fp, ","); fmt::fprintf(fp, ",");
} }
printStats(args, stats, toDoubleSeconds(time_now - time_prev), fp); printStats(args, worker_stats, toDoubleSeconds(time_now - time_prev), fp);
} }
time_prev = time_now; time_prev = time_now;
} }
@ -2343,7 +2381,8 @@ int statsProcessMain(Arguments const& args,
while (stopcount.load() < args.num_threads * args.num_processes) { while (stopcount.load() < args.num_threads * args.num_processes) {
usleep(10000); /* 10ms */ usleep(10000); /* 10ms */
} }
printReport(args, stats, toDoubleSeconds(time_now - time_start), pid_main, fp); printReport(
args, worker_stats, thread_stats, process_stats, toDoubleSeconds(time_now - time_start), pid_main, fp);
} }
if (fp) { if (fp) {
@ -2354,12 +2393,12 @@ int statsProcessMain(Arguments const& args,
return 0; return 0;
} }
ThreadStatistics mergeSketchReport(Arguments& args) { WorkerStatistics mergeSketchReport(Arguments& args) {
ThreadStatistics stats; WorkerStatistics stats;
for (int i = 0; i < args.num_report_files; i++) { for (int i = 0; i < args.num_report_files; i++) {
std::ifstream f{ args.report_files[i] }; std::ifstream f{ args.report_files[i] };
ThreadStatistics tmp; WorkerStatistics tmp;
f >> tmp; f >> tmp;
stats.combine(tmp); stats.combine(tmp);
} }
@ -2442,8 +2481,8 @@ int main(int argc, char* argv[]) {
} }
if (args.mode == MODE_REPORT) { if (args.mode == MODE_REPORT) {
ThreadStatistics stats = mergeSketchReport(args); WorkerStatistics stats = mergeSketchReport(args);
printThreadStats(stats, args, NULL, true); printWorkerStats(stats, args, NULL, true);
return 0; return 0;
} }
@ -2502,9 +2541,9 @@ int main(int argc, char* argv[]) {
}); });
const auto async_mode = args.async_xacts > 0; const auto async_mode = args.async_xacts > 0;
const auto nthreads_for_shm = async_mode ? args.async_xacts : args.num_threads; const auto num_workers = async_mode ? args.async_xacts : args.num_threads;
/* allocate */ /* allocate */
const auto shmsize = shared_memory::storageSize(args.num_processes, nthreads_for_shm); const auto shmsize = shared_memory::storageSize(args.num_processes, args.num_threads, num_workers);
auto shm = std::add_pointer_t<void>{}; auto shm = std::add_pointer_t<void>{};
if (ftruncate(shmfd, shmsize) < 0) { if (ftruncate(shmfd, shmsize) < 0) {
@ -2521,7 +2560,7 @@ int main(int argc, char* argv[]) {
} }
auto munmap_guard = ExitGuard([=]() { munmap(shm, shmsize); }); auto munmap_guard = ExitGuard([=]() { munmap(shm, shmsize); });
auto shm_access = shared_memory::Access(shm, args.num_processes, nthreads_for_shm); auto shm_access = shared_memory::Access(shm, args.num_processes, args.num_threads, num_workers);
/* initialize the shared memory */ /* initialize the shared memory */
shm_access.initMemory(); shm_access.initMemory();
@ -2537,7 +2576,7 @@ int main(int argc, char* argv[]) {
/* fork worker processes + 1 stats process */ /* fork worker processes + 1 stats process */
auto worker_pids = std::vector<pid_t>(args.num_processes + 1); auto worker_pids = std::vector<pid_t>(args.num_processes + 1);
auto worker_id = int{}; auto process_idx = int{};
/* forking (num_process + 1) children */ /* forking (num_process + 1) children */
/* last process is the stats handler */ /* last process is the stats handler */
@ -2554,7 +2593,7 @@ int main(int argc, char* argv[]) {
/* worker process */ /* worker process */
logr = Logger(WorkerProcess{}, args.verbose, p); logr = Logger(WorkerProcess{}, args.verbose, p);
proc_type = ProcKind::WORKER; proc_type = ProcKind::WORKER;
worker_id = p; process_idx = p;
} else { } else {
/* stats */ /* stats */
logr = Logger(StatsProcess{}, args.verbose); logr = Logger(StatsProcess{}, args.verbose);
@ -2574,18 +2613,29 @@ int main(int argc, char* argv[]) {
if (proc_type == ProcKind::WORKER) { if (proc_type == ProcKind::WORKER) {
/* worker process */ /* worker process */
workerProcessMain(args, worker_id, shm_access, pid_main); auto time_start = steady_clock::now();
workerProcessMain(args, process_idx, shm_access, pid_main);
shm_access.processStatsSlot(process_idx)
.setCPUUtilization(getProcessorTimeProcess() / toDoubleSeconds(steady_clock::now() - time_start) * 100.);
/* worker can exit here */ /* worker can exit here */
exit(0); _exit(0);
} else if (proc_type == ProcKind::STATS) { } else if (proc_type == ProcKind::STATS) {
/* stats */ /* stats */
if (args.mode == MODE_CLEAN) { if (args.mode == MODE_CLEAN) {
/* no stats needed for clean mode */ /* no stats needed for clean mode */
exit(0); _exit(0);
} }
statsProcessMain( statsProcessMain(args,
args, shm_access.statsConstArray(), shm_hdr.throttle_factor, shm_hdr.signal, shm_hdr.stopcount, pid_main); shm_access.workerStatsConstArray(),
exit(0); shm_access.threadStatsConstArray(),
shm_access.processStatsConstArray(),
shm_hdr.throttle_factor,
shm_hdr.signal,
shm_hdr.stopcount,
pid_main);
_exit(0);
} }
/* master */ /* master */

View File

@ -43,63 +43,136 @@ struct Header {
struct LayoutHelper { struct LayoutHelper {
Header hdr; Header hdr;
ThreadStatistics stats; WorkerStatistics stats;
}; };
inline size_t storageSize(int num_processes, int num_threads) noexcept { inline size_t storageSize(int num_processes, int num_threads, int num_workers) noexcept {
assert(num_processes >= 1 && num_threads >= 1); assert(num_processes >= 1 && num_threads >= 1);
return sizeof(LayoutHelper) + sizeof(ThreadStatistics) * ((num_processes * num_threads) - 1); return sizeof(LayoutHelper) + sizeof(WorkerStatistics) * ((num_processes * num_workers) - 1) +
sizeof(ThreadStatistics) * (num_threads * num_processes) + sizeof(ProcessStatistics) * num_processes;
} }
// class Access memory layout:
// Header | WorkerStatistics | WorkerStatistics * (num_processes * num_workers - 1) | ThreadStatistics * (num_processes
// * num_threads) | ProcessStatistics * (num_processes)
// all Statistics classes have alignas(64)
class Access { class Access {
void* base; void* base;
int num_processes; int num_processes;
int num_threads; int num_threads;
int num_workers;
static inline ThreadStatistics& statsSlot(void* shm_base, static inline WorkerStatistics& workerStatsSlot(void* shm_base,
int num_threads, int num_workers,
int process_idx, int process_idx,
int thread_idx) noexcept { int worker_idx) noexcept {
return (&static_cast<LayoutHelper*>(shm_base)->stats)[process_idx * num_threads + thread_idx]; return (&static_cast<LayoutHelper*>(shm_base)->stats)[process_idx * num_workers + worker_idx];
}
static inline ThreadStatistics& threadStatsSlot(void* shm_base,
int num_processes,
int num_threads,
int num_workers,
int process_idx,
int thread_idx) noexcept {
ThreadStatistics* thread_stat_base =
reinterpret_cast<ThreadStatistics*>(static_cast<char*>(shm_base) + sizeof(LayoutHelper) +
sizeof(WorkerStatistics) * num_processes * num_workers);
return thread_stat_base[process_idx * num_threads + thread_idx];
}
static inline ProcessStatistics& processStatsSlot(void* shm_base,
int num_processes,
int num_threads,
int num_workers,
int process_idx) noexcept {
ProcessStatistics* proc_stat_base =
reinterpret_cast<ProcessStatistics*>(static_cast<char*>(shm_base) + sizeof(LayoutHelper) +
sizeof(WorkerStatistics) * num_processes * num_workers +
sizeof(ThreadStatistics) * num_processes * num_threads);
return proc_stat_base[process_idx];
} }
public: public:
Access(void* shm, int num_processes, int num_threads) noexcept Access(void* shm, int num_processes, int num_threads, int num_workers) noexcept
: base(shm), num_processes(num_processes), num_threads(num_threads) {} : base(shm), num_processes(num_processes), num_threads(num_threads), num_workers(num_workers) {}
Access() noexcept : Access(nullptr, 0, 0) {} Access() noexcept : Access(nullptr, 0, 0, 0) {}
Access(const Access&) noexcept = default; Access(const Access&) noexcept = default;
Access& operator=(const Access&) noexcept = default; Access& operator=(const Access&) noexcept = default;
size_t size() const noexcept { return storageSize(num_processes, num_threads); } size_t size() const noexcept { return storageSize(num_processes, num_threads, num_workers); }
void initMemory() noexcept { void initMemory() noexcept {
new (&header()) Header{}; new (&header()) Header{};
for (auto i = 0; i < num_processes; i++) for (auto i = 0; i < num_processes; i++)
for (auto j = 0; j < num_threads; j++) for (auto j = 0; j < num_workers; j++) {
new (&statsSlot(i, j)) ThreadStatistics(); new (&workerStatsSlot(i, j)) WorkerStatistics();
}
for (auto i = 0; i < num_processes; i++)
for (auto j = 0; j < num_threads; j++) {
new (&threadStatsSlot(i, j)) ThreadStatistics();
}
for (auto i = 0; i < num_processes; i++) {
new (&processStatsSlot(i)) ProcessStatistics();
}
} }
Header const& headerConst() const noexcept { return *static_cast<Header const*>(base); } Header const& headerConst() const noexcept { return *static_cast<Header const*>(base); }
Header& header() const noexcept { return *static_cast<Header*>(base); } Header& header() const noexcept { return *static_cast<Header*>(base); }
ThreadStatistics const* statsConstArray() const noexcept { WorkerStatistics const* workerStatsConstArray() const noexcept {
return &statsSlot(base, num_threads, 0 /*process_id*/, 0 /*thread_id*/); return &workerStatsSlot(base, num_workers, 0 /*process_idx*/, 0 /*worker_idx*/);
} }
ThreadStatistics* statsArray() const noexcept { WorkerStatistics* workerStatsArray() const noexcept {
return &statsSlot(base, num_threads, 0 /*process_id*/, 0 /*thread_id*/); return &workerStatsSlot(base, num_workers, 0 /*process_idx*/, 0 /*worker_idx*/);
} }
ThreadStatistics const& statsConstSlot(int process_idx, int thread_idx) const noexcept { WorkerStatistics const& workerStatsConstSlot(int process_idx, int worker_idx) const noexcept {
return statsSlot(base, num_threads, process_idx, thread_idx); return workerStatsSlot(base, num_workers, process_idx, worker_idx);
} }
ThreadStatistics& statsSlot(int process_idx, int thread_idx) const noexcept { WorkerStatistics& workerStatsSlot(int process_idx, int worker_idx) const noexcept {
return statsSlot(base, num_threads, process_idx, thread_idx); return workerStatsSlot(base, num_workers, process_idx, worker_idx);
}
ThreadStatistics const* threadStatsConstArray() const noexcept {
return &threadStatsSlot(base, num_processes, num_threads, num_workers, 0 /*process_idx*/, 0 /*thread_idx*/);
}
ThreadStatistics* threadStatsArray() const noexcept {
return &threadStatsSlot(base, num_processes, num_threads, num_workers, 0 /*process_idx*/, 0 /*thread_idx*/);
}
ThreadStatistics const& threadStatsConstSlot(int process_idx, int thread_idx) const noexcept {
return threadStatsSlot(base, num_processes, num_threads, num_workers, process_idx, thread_idx);
}
ThreadStatistics& threadStatsSlot(int process_idx, int thread_idx) const noexcept {
return threadStatsSlot(base, num_processes, num_threads, num_workers, process_idx, thread_idx);
}
ProcessStatistics const* processStatsConstArray() const noexcept {
return &processStatsSlot(base, num_processes, num_threads, num_workers, 0 /*process_idx*/);
}
ProcessStatistics* processStatsArray() const noexcept {
return &processStatsSlot(base, num_processes, num_threads, num_workers, 0 /*process_idx*/);
}
ProcessStatistics const& processStatsConstSlot(int process_idx) const noexcept {
return processStatsSlot(base, num_processes, num_threads, num_workers, process_idx);
}
ProcessStatistics& processStatsSlot(int process_idx) const noexcept {
return processStatsSlot(base, num_processes, num_threads, num_workers, process_idx);
} }
}; };

View File

@ -88,7 +88,7 @@ public:
} }
}; };
class alignas(64) ThreadStatistics { class alignas(64) WorkerStatistics {
uint64_t conflicts{ 0 }; uint64_t conflicts{ 0 };
uint64_t total_errors{ 0 }; uint64_t total_errors{ 0 };
uint64_t total_timeouts{ 0 }; uint64_t total_timeouts{ 0 };
@ -100,7 +100,7 @@ class alignas(64) ThreadStatistics {
std::vector<DDSketchMako> sketches; std::vector<DDSketchMako> sketches;
public: public:
ThreadStatistics() noexcept { WorkerStatistics() noexcept {
std::fill(ops.begin(), ops.end(), 0); std::fill(ops.begin(), ops.end(), 0);
std::fill(errors.begin(), errors.end(), 0); std::fill(errors.begin(), errors.end(), 0);
std::fill(timeouts.begin(), timeouts.end(), 0); std::fill(timeouts.begin(), timeouts.end(), 0);
@ -109,8 +109,8 @@ public:
sketches.resize(MAX_OP); sketches.resize(MAX_OP);
} }
ThreadStatistics(const ThreadStatistics& other) = default; WorkerStatistics(const WorkerStatistics& other) = default;
ThreadStatistics& operator=(const ThreadStatistics& other) = default; WorkerStatistics& operator=(const WorkerStatistics& other) = default;
uint64_t getConflictCount() const noexcept { return conflicts; } uint64_t getConflictCount() const noexcept { return conflicts; }
@ -137,7 +137,7 @@ public:
uint64_t mean(int op) const noexcept { return sketches[op].mean(); } uint64_t mean(int op) const noexcept { return sketches[op].mean(); }
// with 'this' as final aggregation, factor in 'other' // with 'this' as final aggregation, factor in 'other'
void combine(const ThreadStatistics& other) { void combine(const WorkerStatistics& other) {
conflicts += other.conflicts; conflicts += other.conflicts;
for (auto op = 0; op < MAX_OP; op++) { for (auto op = 0; op < MAX_OP; op++) {
sketches[op].mergeWith(other.sketches[op]); sketches[op].mergeWith(other.sketches[op]);
@ -183,11 +183,11 @@ public:
void updateLatencies(const std::vector<DDSketchMako> other_sketches) { sketches = other_sketches; } void updateLatencies(const std::vector<DDSketchMako> other_sketches) { sketches = other_sketches; }
friend std::ofstream& operator<<(std::ofstream& os, ThreadStatistics& stats); friend std::ofstream& operator<<(std::ofstream& os, WorkerStatistics& stats);
friend std::ifstream& operator>>(std::ifstream& is, ThreadStatistics& stats); friend std::ifstream& operator>>(std::ifstream& is, WorkerStatistics& stats);
}; };
inline std::ofstream& operator<<(std::ofstream& os, ThreadStatistics& stats) { inline std::ofstream& operator<<(std::ofstream& os, WorkerStatistics& stats) {
rapidjson::StringBuffer ss; rapidjson::StringBuffer ss;
rapidjson::Writer<rapidjson::StringBuffer> writer(ss); rapidjson::Writer<rapidjson::StringBuffer> writer(ss);
writer.StartObject(); writer.StartObject();
@ -254,7 +254,7 @@ inline void populateArray(std::array<uint64_t, MAX_OP>& arr,
} }
} }
inline std::ifstream& operator>>(std::ifstream& is, ThreadStatistics& stats) { inline std::ifstream& operator>>(std::ifstream& is, WorkerStatistics& stats) {
std::stringstream buffer; std::stringstream buffer;
buffer << is.rdbuf(); buffer << is.rdbuf();
rapidjson::Document doc; rapidjson::Document doc;
@ -282,6 +282,45 @@ inline std::ifstream& operator>>(std::ifstream& is, ThreadStatistics& stats) {
return is; return is;
} }
class alignas(64) ThreadStatistics {
double cpu_utilization{ 0.0 };
public:
ThreadStatistics() noexcept {}
ThreadStatistics(const ThreadStatistics& other) = default;
ThreadStatistics& operator=(const ThreadStatistics& other) = default;
double getCPUUtilization() { return cpu_utilization; }
void setCPUUtilization(double cpu_utilization) { this->cpu_utilization = cpu_utilization; }
void combine(const ThreadStatistics& other) { cpu_utilization += other.cpu_utilization; }
};
class alignas(64) ProcessStatistics {
double total_cpu_utilization{ 0.0 };
double fdb_network_cpu_utilization{ 0.0 };
public:
ProcessStatistics() noexcept {}
ProcessStatistics(const ProcessStatistics& other) = default;
ProcessStatistics& operator=(const ProcessStatistics& other) = default;
double getTotalCPUUtilization() { return total_cpu_utilization; }
double getFDBNetworkCPUUtilization() { return fdb_network_cpu_utilization; }
void setCPUUtilization(double total_cpu_utilization) { this->total_cpu_utilization = total_cpu_utilization; }
void setFDBNetworkCPUUtilization(double fdb_network_cpu_utilization) {
this->fdb_network_cpu_utilization = fdb_network_cpu_utilization;
}
void combine(const ProcessStatistics& other) {
total_cpu_utilization += other.total_cpu_utilization;
fdb_network_cpu_utilization += other.fdb_network_cpu_utilization;
}
};
} // namespace mako } // namespace mako
#endif /* MAKO_STATS_HPP */ #endif /* MAKO_STATS_HPP */