llvm-project/compiler-rt/lib/xray/xray_profile_collector.h

89 lines
3.5 KiB
C++

//===-- xray_profile_collector.h -------------------------------*- C++ -*-===//
//
// The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This file is a part of XRay, a dynamic runtime instrumentation system.
//
// This file defines the interface for a data collection service, for XRay
// profiling. What we implement here is an in-process service where
// FunctionCallTrie instances can be handed off by threads, to be
// consolidated/collected.
//
//===----------------------------------------------------------------------===//
#ifndef XRAY_XRAY_PROFILE_COLLECTOR_H
#define XRAY_XRAY_PROFILE_COLLECTOR_H
#include "xray_function_call_trie.h"
#include "xray/xray_log_interface.h"
namespace __xray {
/// The ProfileCollectorService implements a centralised mechanism for
/// collecting FunctionCallTrie instances, indexed by thread ID. On demand, the
/// ProfileCollectorService can be queried for the most recent state of the
/// data, in a form that allows traversal.
namespace profileCollectorService {
/// Posts the FunctionCallTrie associated with a specific Thread ID. This
/// will:
///
/// - Make a copy of the FunctionCallTrie and store that against the Thread
/// ID. This will use the global allocator for the service-managed
/// FunctionCallTrie instances.
/// - Queue up a pointer to the FunctionCallTrie.
/// - If the queue is long enough (longer than some arbitrary threshold) we
/// then pre-calculate a single FunctionCallTrie for the whole process.
///
///
/// We are making a copy of the FunctionCallTrie because the intent is to have
/// this function be called at thread exit, or soon after the profiling
/// handler is finalized through the XRay APIs. By letting threads each
/// process their own thread-local FunctionCallTrie instances, we're removing
/// the need for synchronisation across threads while we're profiling.
/// However, once we're done profiling, we can then collect copies of these
/// FunctionCallTrie instances and pay the cost of the copy.
///
/// NOTE: In the future, if this turns out to be more costly than "moving" the
/// FunctionCallTrie instances from the owning thread to the collector
/// service, then we can change the implementation to do it this way (moving)
/// instead.
void post(const FunctionCallTrie &T, tid_t TId);
/// The serialize will process all FunctionCallTrie instances in memory, and
/// turn those into specifically formatted blocks, each describing the
/// function call trie's contents in a compact form. In memory, this looks
/// like the following layout:
///
/// - block size (32 bits)
/// - block number (32 bits)
/// - thread id (64 bits)
/// - list of records:
/// - function ids in leaf to root order, terminated by
/// 0 (32 bits per function id)
/// - call count (64 bit)
/// - cumulative local time (64 bit)
/// - record delimiter (64 bit, 0x0)
///
void serialize();
/// The reset function will clear out any internal memory held by the
/// service. The intent is to have the resetting be done in calls to the
/// initialization routine, or explicitly through the flush log API.
void reset();
/// This nextBuffer function is meant to implement the iterator functionality,
/// provided in the XRay API.
XRayBuffer nextBuffer(XRayBuffer B);
} // namespace profileCollectorService
} // namespace __xray
#endif // XRAY_XRAY_PROFILE_COLLECTOR_H