foundationdb/flow/Histogram.h

175 lines
5.1 KiB
C
Raw Normal View History

/*
* Histogram.h
*
* This source file is part of the FoundationDB open source project
*
* Copyright 2013-2018 Apple Inc. and the FoundationDB project authors
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#ifndef FLOW_HISTOGRAM_H
#define FLOW_HISTOGRAM_H
#pragma once
2020-11-03 03:09:45 +08:00
#include <flow/Arena.h>
#include <string>
#include <map>
#include <unordered_map>
#include <iostream>
#include <iomanip>
#ifdef _WIN32
#include <intrin.h>
#pragma intrinsic(_BitScanReverse)
#endif
class Histogram;
class HistogramRegistry {
2020-11-06 02:26:51 +08:00
public:
void registerHistogram(Histogram* h);
void unregisterHistogram(Histogram* h);
Histogram* lookupHistogram(std::string const& name);
2020-11-06 02:26:51 +08:00
void logReport();
private:
// This map is ordered by key so that ops within the same group end up
// next to each other in the trace log.
2020-11-06 02:26:51 +08:00
std::map<std::string, Histogram*> histograms;
};
2020-11-06 02:26:51 +08:00
HistogramRegistry& GetHistogramRegistry();
/*
* A fast histogram with power-of-two spaced buckets.
*
* For more information about this technique, see:
* https://www.fsl.cs.stonybrook.edu/project-osprof.html
*/
2020-11-24 03:40:24 +08:00
class Histogram final : public ReferenceCounted<Histogram> {
public:
enum class Unit { microseconds, bytes, bytes_per_second, percentage, record_counter };
private:
//static const std::unordered_map<Unit, std::string> UnitToStringMapper;
const std::unordered_map<Unit, std::string> UnitToStringMapper;
Histogram(std::string const& group, std::string const& op, Unit unit, HistogramRegistry& registry, uint32_t lower, uint32_t upper)
: UnitToStringMapper (
2021-06-29 03:23:09 +08:00
{ { Histogram::Unit::microseconds, "microseconds" },
{ Histogram::Unit::bytes, "bytes" },
{ Histogram::Unit::bytes_per_second, "bytes_per_second" },
{ Histogram::Unit::percentage, "percentage" },
{ Histogram::Unit::record_counter, "record_counter" },
2021-06-29 03:23:09 +08:00
}),
group(group), op(op), unit(unit), registry(registry), lowerBound(lower), upperBound(upper), ReferenceCounted<Histogram>() {
ASSERT(UnitToStringMapper.find(unit) != UnitToStringMapper.end());
2020-11-06 02:26:51 +08:00
clear();
}
static std::string generateName(std::string const& group, std::string const& op) { return group + ":" + op; }
public:
2020-11-06 02:26:51 +08:00
~Histogram() { registry.unregisterHistogram(this); }
static Reference<Histogram> getHistogram(StringRef group, StringRef op, Unit unit, uint32_t lower = 0, uint32_t upper = UINT32_MAX) {
2020-11-06 02:26:51 +08:00
std::string group_str = group.toString();
std::string op_str = op.toString();
std::string name = generateName(group_str, op_str);
HistogramRegistry& registry = GetHistogramRegistry();
Histogram* h = registry.lookupHistogram(name);
if (!h) {
h = new Histogram(group_str, op_str, unit, registry, lower, upper);
registry.registerHistogram(h);
return Reference<Histogram>(h);
} else {
return Reference<Histogram>::addRef(h);
2020-11-06 02:26:51 +08:00
}
}
// This histogram buckets samples into powers of two.
2020-11-06 02:26:51 +08:00
inline void sample(uint32_t sample) {
size_t idx;
#ifdef _WIN32
2020-11-06 02:26:51 +08:00
unsigned long index;
// _BitScanReverse sets index to the position of the first non-zero bit, so
// _BitScanReverse(sample) ~= log_2(sample). _BitScanReverse returns false if
// sample is zero.
idx = _BitScanReverse(&index, sample) ? index : 0;
#else
// __builtin_clz counts the leading zeros in its uint32_t argument. So, 31-clz ~= log_2(sample).
// __builtin_clz(0) is undefined.
idx = sample ? (31 - __builtin_clz(sample)) : 0;
#endif
ASSERT(idx < 32);
buckets[idx]++;
2020-11-06 02:26:51 +08:00
}
inline void sampleSeconds(double delta) {
uint64_t delta_usec = (delta * 1000000);
if (delta_usec > UINT32_MAX) {
sample(UINT32_MAX);
} else {
sample((uint32_t)(delta * 1000000)); // convert to microseconds and truncate to integer
}
}
// Histogram buckets samples into linear interval of size 4 percent.
2021-06-24 05:54:41 +08:00
inline void samplePercentage(double pct) {
ASSERT(unit==Histogram::Unit::percentage);
ASSERT(pct>=0.0);
if (pct >= 1.28){
pct = 1.24;
}
size_t idx = (pct*100) / 4;
ASSERT(idx < 32);
buckets[idx]++;
}
2020-11-06 02:26:51 +08:00
// Histogram buckets samples into one of the same sized buckets
// This is used when the distance b/t upperBound and lowerBound are relativly small
inline void sampleRecordCounter(uint32_t sample) {
ASSERT(unit==Histogram::Unit::record_counter);
size_t idx = ( (sample - lowerBound) * 31.0 ) / (upperBound - lowerBound);
2021-06-29 05:16:41 +08:00
if(idx >= 32){ idx = 31;}
2021-06-29 04:55:22 +08:00
ASSERT(idx < 32);
buckets[idx]++;
}
2020-11-06 02:26:51 +08:00
void clear() {
for (uint32_t& i : buckets) {
i = 0;
}
}
void writeToLog();
std::string name() const { return generateName(this->group, this->op); }
2020-11-06 02:26:51 +08:00
std::string drawHistogram();
2020-11-06 02:26:51 +08:00
std::string const group;
std::string const op;
Unit const unit;
HistogramRegistry& registry;
uint32_t buckets[32];
uint32_t lowerBound;
uint32_t upperBound;
};
2020-11-24 03:40:24 +08:00
#endif // FLOW_HISTOGRAM_H