forked from OSchip/llvm-project
305 lines
9.2 KiB
C
305 lines
9.2 KiB
C
|
//===-- xray_fdr_controller.h ---------------------------------------------===//
|
||
|
//
|
||
|
// The LLVM Compiler Infrastructure
|
||
|
//
|
||
|
// This file is distributed under the University of Illinois Open Source
|
||
|
// License. See LICENSE.TXT for details.
|
||
|
//
|
||
|
//===----------------------------------------------------------------------===//
|
||
|
//
|
||
|
// This file is a part of XRay, a function call tracing system.
|
||
|
//
|
||
|
//===----------------------------------------------------------------------===//
|
||
|
#ifndef COMPILER_RT_LIB_XRAY_XRAY_FDR_CONTROLLER_H_
|
||
|
#define COMPILER_RT_LIB_XRAY_XRAY_FDR_CONTROLLER_H_
|
||
|
|
||
|
#include <time.h>
|
||
|
|
||
|
#include "xray/xray_interface.h"
|
||
|
#include "xray/xray_records.h"
|
||
|
#include "xray_buffer_queue.h"
|
||
|
#include "xray_fdr_log_writer.h"
|
||
|
|
||
|
namespace __xray {
|
||
|
|
||
|
template <size_t Version = 3> class FDRController {
|
||
|
BufferQueue *BQ;
|
||
|
BufferQueue::Buffer &B;
|
||
|
FDRLogWriter &W;
|
||
|
int (*WallClockReader)(clockid_t, struct timespec *) = 0;
|
||
|
uint64_t CycleThreshold = 0;
|
||
|
|
||
|
uint64_t LastFunctionEntryTSC = 0;
|
||
|
uint64_t LatestTSC = 0;
|
||
|
uint16_t LatestCPU = 0;
|
||
|
tid_t TId = 0;
|
||
|
pid_t PId = 0;
|
||
|
bool First = true;
|
||
|
|
||
|
uint32_t UndoableFunctionEnters = 0;
|
||
|
uint32_t UndoableTailExits = 0;
|
||
|
|
||
|
bool finalized() const { return BQ == nullptr || BQ->finalizing(); }
|
||
|
|
||
|
bool hasSpace(size_t S) {
|
||
|
return B.Data != nullptr &&
|
||
|
W.getNextRecord() + S <= reinterpret_cast<char *>(B.Data) + B.Size;
|
||
|
}
|
||
|
|
||
|
constexpr int32_t mask(int32_t FuncId) const {
|
||
|
return FuncId & ((1 << 29) - 1);
|
||
|
}
|
||
|
|
||
|
bool getNewBuffer() {
|
||
|
if (!returnBuffer())
|
||
|
return false;
|
||
|
if (BQ->getBuffer(B) != BufferQueue::ErrorCode::Ok)
|
||
|
return false;
|
||
|
|
||
|
W.resetRecord();
|
||
|
DCHECK_EQ(W.getNextRecord(), B.Data);
|
||
|
LatestTSC = 0;
|
||
|
LatestCPU = 0;
|
||
|
atomic_store(&B.Extents, 0, memory_order_release);
|
||
|
return true;
|
||
|
}
|
||
|
|
||
|
bool setupNewBuffer() {
|
||
|
if (finalized())
|
||
|
return false;
|
||
|
|
||
|
DCHECK(hasSpace(sizeof(MetadataRecord) * 3));
|
||
|
TId = GetTid();
|
||
|
PId = internal_getpid();
|
||
|
struct timespec TS {
|
||
|
0, 0
|
||
|
};
|
||
|
WallClockReader(CLOCK_MONOTONIC, &TS);
|
||
|
|
||
|
MetadataRecord Metadata[] = {
|
||
|
// Write out a MetadataRecord to signify that this is the start of a new
|
||
|
// buffer, associated with a particular thread, with a new CPU. For the
|
||
|
// data, we have 15 bytes to squeeze as much information as we can. At
|
||
|
// this point we only write down the following bytes:
|
||
|
// - Thread ID (tid_t, cast to 4 bytes type due to Darwin being 8
|
||
|
// bytes)
|
||
|
createMetadataRecord<MetadataRecord::RecordKinds::NewBuffer>(
|
||
|
static_cast<int32_t>(TId)),
|
||
|
|
||
|
// Also write the WalltimeMarker record. We only really need microsecond
|
||
|
// precision here, and enforce across platforms that we need 64-bit
|
||
|
// seconds and 32-bit microseconds encoded in the Metadata record.
|
||
|
createMetadataRecord<MetadataRecord::RecordKinds::WalltimeMarker>(
|
||
|
static_cast<int64_t>(TS.tv_sec),
|
||
|
static_cast<int32_t>(TS.tv_nsec / 1000)),
|
||
|
|
||
|
// Also write the Pid record.
|
||
|
createMetadataRecord<MetadataRecord::RecordKinds::Pid>(
|
||
|
static_cast<int32_t>(PId)),
|
||
|
};
|
||
|
|
||
|
if (finalized())
|
||
|
return false;
|
||
|
return W.writeMetadataRecords(Metadata);
|
||
|
}
|
||
|
|
||
|
bool prepareBuffer(size_t S) {
|
||
|
if (finalized())
|
||
|
return returnBuffer();
|
||
|
|
||
|
if (UNLIKELY(!hasSpace(S))) {
|
||
|
if (!getNewBuffer())
|
||
|
return false;
|
||
|
if (!setupNewBuffer())
|
||
|
return false;
|
||
|
}
|
||
|
|
||
|
if (First) {
|
||
|
First = false;
|
||
|
W.resetRecord();
|
||
|
atomic_store(&B.Extents, 0, memory_order_release);
|
||
|
return setupNewBuffer();
|
||
|
}
|
||
|
|
||
|
return true;
|
||
|
}
|
||
|
|
||
|
bool returnBuffer() {
|
||
|
if (BQ == nullptr)
|
||
|
return false;
|
||
|
|
||
|
if (finalized()) {
|
||
|
BQ->releaseBuffer(B); // ignore result.
|
||
|
return false;
|
||
|
}
|
||
|
|
||
|
First = true;
|
||
|
if (BQ->releaseBuffer(B) != BufferQueue::ErrorCode::Ok)
|
||
|
return false;
|
||
|
return true;
|
||
|
}
|
||
|
|
||
|
enum class PreambleResult { NoChange, WroteMetadata };
|
||
|
PreambleResult functionPreamble(uint64_t TSC, uint16_t CPU) {
|
||
|
if (UNLIKELY(LatestCPU != CPU || LatestTSC == 0)) {
|
||
|
// We update our internal tracking state for the Latest TSC and CPU we've
|
||
|
// seen, then write out the appropriate metadata and function records.
|
||
|
LatestTSC = TSC;
|
||
|
LatestCPU = CPU;
|
||
|
W.writeMetadata<MetadataRecord::RecordKinds::NewCPUId>(CPU, TSC);
|
||
|
return PreambleResult::WroteMetadata;
|
||
|
}
|
||
|
|
||
|
if (UNLIKELY(LatestCPU == LatestCPU && LatestTSC > TSC)) {
|
||
|
// The TSC has wrapped around, from the last TSC we've seen.
|
||
|
LatestTSC = TSC;
|
||
|
W.writeMetadata<MetadataRecord::RecordKinds::TSCWrap>(TSC);
|
||
|
return PreambleResult::WroteMetadata;
|
||
|
}
|
||
|
|
||
|
return PreambleResult::NoChange;
|
||
|
}
|
||
|
|
||
|
void rewindRecords(int32_t FuncId, uint64_t TSC, uint16_t CPU) {
|
||
|
// Undo one enter record, because at this point we are either at the state
|
||
|
// of:
|
||
|
// - We are exiting a function that we recently entered.
|
||
|
// - We are exiting a function that was the result of a sequence of tail
|
||
|
// exits, and we can check whether the tail exits can be re-wound.
|
||
|
//
|
||
|
FunctionRecord F;
|
||
|
W.undoWrites(sizeof(FunctionRecord));
|
||
|
internal_memcpy(&F, W.getNextRecord(), sizeof(FunctionRecord));
|
||
|
|
||
|
DCHECK(F.RecordKind ==
|
||
|
uint8_t(FunctionRecord::RecordKinds::FunctionEnter) &&
|
||
|
"Expected to find function entry recording when rewinding.");
|
||
|
DCHECK_EQ(F.FuncId, FuncId & ~(0x0F << 28));
|
||
|
|
||
|
LatestTSC -= F.TSCDelta;
|
||
|
if (--UndoableFunctionEnters != 0) {
|
||
|
LastFunctionEntryTSC -= F.TSCDelta;
|
||
|
return;
|
||
|
}
|
||
|
|
||
|
LastFunctionEntryTSC = 0;
|
||
|
auto RewindingTSC = LatestTSC;
|
||
|
auto RewindingRecordPtr = W.getNextRecord() - sizeof(FunctionRecord);
|
||
|
while (UndoableTailExits) {
|
||
|
internal_memcpy(&F, RewindingRecordPtr, sizeof(FunctionRecord));
|
||
|
DCHECK_EQ(F.RecordKind,
|
||
|
uint8_t(FunctionRecord::RecordKinds::FunctionTailExit));
|
||
|
RewindingTSC -= F.TSCDelta;
|
||
|
RewindingRecordPtr -= sizeof(FunctionRecord);
|
||
|
internal_memcpy(&F, RewindingRecordPtr, sizeof(FunctionRecord));
|
||
|
|
||
|
// This tail call exceeded the threshold duration. It will not be erased.
|
||
|
if ((TSC - RewindingTSC) >= CycleThreshold) {
|
||
|
UndoableTailExits = 0;
|
||
|
return;
|
||
|
}
|
||
|
|
||
|
--UndoableTailExits;
|
||
|
W.undoWrites(sizeof(FunctionRecord) * 2);
|
||
|
LatestTSC = RewindingTSC;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
public:
|
||
|
template <class WallClockFunc>
|
||
|
FDRController(BufferQueue *BQ, BufferQueue::Buffer &B, FDRLogWriter &W,
|
||
|
WallClockFunc R, uint64_t C)
|
||
|
: BQ(BQ), B(B), W(W), WallClockReader(R), CycleThreshold(C) {}
|
||
|
|
||
|
bool functionEnter(int32_t FuncId, uint64_t TSC, uint16_t CPU) {
|
||
|
if (finalized())
|
||
|
return returnBuffer();
|
||
|
|
||
|
if (!prepareBuffer(sizeof(MetadataRecord) + sizeof(FunctionRecord)))
|
||
|
return returnBuffer();
|
||
|
|
||
|
if (functionPreamble(TSC, CPU) == PreambleResult::WroteMetadata) {
|
||
|
UndoableFunctionEnters = 1;
|
||
|
} else {
|
||
|
++UndoableFunctionEnters;
|
||
|
}
|
||
|
|
||
|
LastFunctionEntryTSC = TSC;
|
||
|
LatestTSC = TSC;
|
||
|
return W.writeFunction(FDRLogWriter::FunctionRecordKind::Enter,
|
||
|
mask(FuncId), TSC - LatestTSC);
|
||
|
}
|
||
|
|
||
|
bool functionTailExit(int32_t FuncId, uint64_t TSC, uint16_t CPU) {
|
||
|
if (finalized())
|
||
|
return returnBuffer();
|
||
|
|
||
|
if (!prepareBuffer(sizeof(MetadataRecord) + sizeof(FunctionRecord)))
|
||
|
return returnBuffer();
|
||
|
|
||
|
if (functionPreamble(TSC, CPU) == PreambleResult::NoChange &&
|
||
|
UndoableFunctionEnters != 0 &&
|
||
|
TSC - LastFunctionEntryTSC < CycleThreshold) {
|
||
|
rewindRecords(FuncId, TSC, CPU);
|
||
|
return true;
|
||
|
}
|
||
|
|
||
|
UndoableTailExits = UndoableFunctionEnters ? UndoableTailExits + 1 : 0;
|
||
|
UndoableFunctionEnters = 0;
|
||
|
LatestTSC = TSC;
|
||
|
return W.writeFunction(FDRLogWriter::FunctionRecordKind::TailExit,
|
||
|
mask(FuncId), TSC - LatestTSC);
|
||
|
}
|
||
|
|
||
|
bool functionEnterArg(int32_t FuncId, uint64_t TSC, uint16_t CPU,
|
||
|
uint64_t Arg) {
|
||
|
if (finalized())
|
||
|
return returnBuffer();
|
||
|
|
||
|
if (!prepareBuffer((2 * sizeof(MetadataRecord)) + sizeof(FunctionRecord)))
|
||
|
return returnBuffer();
|
||
|
|
||
|
// Ignore the result of writing out the preamble.
|
||
|
functionPreamble(TSC, CPU);
|
||
|
|
||
|
LatestTSC = TSC;
|
||
|
LastFunctionEntryTSC = 0;
|
||
|
UndoableFunctionEnters = 0;
|
||
|
UndoableTailExits = 0;
|
||
|
|
||
|
W.writeFunction(FDRLogWriter::FunctionRecordKind::EnterArg, mask(FuncId),
|
||
|
TSC - LatestTSC);
|
||
|
return W.writeMetadata<MetadataRecord::RecordKinds::CallArgument>(Arg);
|
||
|
}
|
||
|
|
||
|
bool functionExit(int32_t FuncId, uint64_t TSC, uint16_t CPU) {
|
||
|
if (finalized())
|
||
|
return returnBuffer();
|
||
|
|
||
|
if (functionPreamble(TSC, CPU) == PreambleResult::NoChange &&
|
||
|
UndoableFunctionEnters != 0 &&
|
||
|
TSC - LastFunctionEntryTSC < CycleThreshold) {
|
||
|
rewindRecords(FuncId, TSC, CPU);
|
||
|
return true;
|
||
|
}
|
||
|
|
||
|
LatestTSC = TSC;
|
||
|
UndoableFunctionEnters = 0;
|
||
|
UndoableTailExits = 0;
|
||
|
return W.writeFunction(FDRLogWriter::FunctionRecordKind::Exit, mask(FuncId),
|
||
|
TSC - LatestTSC);
|
||
|
}
|
||
|
|
||
|
bool flush() {
|
||
|
if (finalized()) {
|
||
|
returnBuffer(); // ignore result.
|
||
|
return true;
|
||
|
}
|
||
|
return returnBuffer();
|
||
|
}
|
||
|
};
|
||
|
|
||
|
} // namespace __xray
|
||
|
|
||
|
#endif // COMPILER-RT_LIB_XRAY_XRAY_FDR_CONTROLLER_H_
|