2014-01-07 06:27:43 +08:00
|
|
|
//===--- CodeGenPGO.h - PGO Instrumentation for LLVM CodeGen ----*- C++ -*-===//
|
|
|
|
//
|
|
|
|
// The LLVM Compiler Infrastructure
|
|
|
|
//
|
|
|
|
// This file is distributed under the University of Illinois Open Source
|
|
|
|
// License. See LICENSE.TXT for details.
|
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
//
|
|
|
|
// Instrumentation-based profile-guided optimization
|
|
|
|
//
|
|
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
|
|
|
|
#ifndef CLANG_CODEGEN_CODEGENPGO_H
|
|
|
|
#define CLANG_CODEGEN_CODEGENPGO_H
|
|
|
|
|
|
|
|
#include "CGBuilder.h"
|
|
|
|
#include "CodeGenModule.h"
|
|
|
|
#include "CodeGenTypes.h"
|
|
|
|
#include "clang/Frontend/CodeGenOptions.h"
|
|
|
|
#include "llvm/ADT/OwningPtr.h"
|
|
|
|
#include "llvm/ADT/StringMap.h"
|
|
|
|
#include "llvm/Support/MemoryBuffer.h"
|
|
|
|
|
|
|
|
namespace clang {
|
|
|
|
namespace CodeGen {
|
|
|
|
class RegionCounter;
|
|
|
|
|
|
|
|
/// The raw counter data from an instrumented PGO binary
|
|
|
|
class PGOProfileData {
|
|
|
|
private:
|
|
|
|
/// The PGO data
|
|
|
|
llvm::OwningPtr<llvm::MemoryBuffer> DataBuffer;
|
|
|
|
/// Offsets into DataBuffer for each function's counters
|
|
|
|
llvm::StringMap<unsigned> DataOffsets;
|
2014-02-06 04:40:15 +08:00
|
|
|
/// Execution counts for each function.
|
|
|
|
llvm::StringMap<uint64_t> FunctionCounts;
|
|
|
|
/// The maximal execution count among all functions.
|
|
|
|
uint64_t MaxFunctionCount;
|
2014-01-07 06:27:43 +08:00
|
|
|
CodeGenModule &CGM;
|
|
|
|
public:
|
|
|
|
PGOProfileData(CodeGenModule &CGM, std::string Path);
|
|
|
|
/// Fill Counts with the profile data for the given function name. Returns
|
|
|
|
/// false on success.
|
|
|
|
bool getFunctionCounts(StringRef MangledName, std::vector<uint64_t> &Counts);
|
2014-02-06 04:40:15 +08:00
|
|
|
/// Return true if a function is hot. If we know nothing about the function,
|
|
|
|
/// return false.
|
|
|
|
bool isHotFunction(StringRef MangledName);
|
|
|
|
/// Return true if a function is cold. If we know nothing about the function,
|
|
|
|
/// return false.
|
|
|
|
bool isColdFunction(StringRef MangledName);
|
2014-01-07 06:27:43 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
/// Per-function PGO state. This class should generally not be used directly,
|
|
|
|
/// but instead through the CodeGenFunction and RegionCounter types.
|
|
|
|
class CodeGenPGO {
|
|
|
|
private:
|
|
|
|
CodeGenModule &CGM;
|
|
|
|
|
|
|
|
unsigned NumRegionCounters;
|
|
|
|
llvm::GlobalVariable *RegionCounters;
|
|
|
|
llvm::DenseMap<const Stmt*, unsigned> *RegionCounterMap;
|
|
|
|
std::vector<uint64_t> *RegionCounts;
|
|
|
|
uint64_t CurrentRegionCount;
|
|
|
|
|
|
|
|
public:
|
|
|
|
CodeGenPGO(CodeGenModule &CGM)
|
|
|
|
: CGM(CGM), NumRegionCounters(0), RegionCounters(0), RegionCounterMap(0),
|
|
|
|
RegionCounts(0), CurrentRegionCount(0) {}
|
|
|
|
~CodeGenPGO() {}
|
|
|
|
|
|
|
|
/// Whether or not we have PGO region data for the current function. This is
|
|
|
|
/// false both when we have no data at all and when our data has been
|
|
|
|
/// discarded.
|
|
|
|
bool haveRegionCounts() const { return RegionCounts != 0; }
|
|
|
|
|
|
|
|
/// Return the counter value of the current region.
|
|
|
|
uint64_t getCurrentRegionCount() const { return CurrentRegionCount; }
|
|
|
|
/// Return the counter value of the current region, or \p Min if it is larger.
|
|
|
|
uint64_t getCurrentRegionCountWithMin(uint64_t Min) {
|
|
|
|
return std::max(Min, CurrentRegionCount);
|
|
|
|
}
|
|
|
|
/// Set the counter value for the current region. This is used to keep track
|
|
|
|
/// of changes to the most recent counter from control flow and non-local
|
|
|
|
/// exits.
|
|
|
|
void setCurrentRegionCount(uint64_t Count) { CurrentRegionCount = Count; }
|
2014-01-14 05:24:18 +08:00
|
|
|
/// Indicate that the current region is never reached, and thus should have a
|
|
|
|
/// counter value of zero. This is important so that subsequent regions can
|
|
|
|
/// correctly track their parent counts.
|
|
|
|
void setCurrentRegionUnreachable() { setCurrentRegionCount(0); }
|
2014-01-07 06:27:43 +08:00
|
|
|
|
|
|
|
/// Calculate branch weights appropriate for PGO data
|
|
|
|
llvm::MDNode *createBranchWeights(uint64_t TrueCount, uint64_t FalseCount);
|
|
|
|
llvm::MDNode *createBranchWeights(ArrayRef<uint64_t> Weights);
|
|
|
|
|
|
|
|
/// Assign counters to regions and configure them for PGO of a given
|
|
|
|
/// function. Does nothing if instrumentation is not enabled and either
|
|
|
|
/// generates global variables or associates PGO data with each of the
|
|
|
|
/// counters depending on whether we are generating or using instrumentation.
|
|
|
|
void assignRegionCounters(GlobalDecl &GD);
|
|
|
|
/// Emit code to write counts for a given function to disk, if necessary.
|
|
|
|
void emitWriteoutFunction(GlobalDecl &GD);
|
|
|
|
/// Clean up region counter state. Must be called if assignRegionCounters is
|
|
|
|
/// used.
|
|
|
|
void destroyRegionCounters();
|
|
|
|
/// Emit the logic to register region counter write out functions. Returns a
|
|
|
|
/// function that implements this logic.
|
|
|
|
static llvm::Function *emitInitialization(CodeGenModule &CGM);
|
|
|
|
|
|
|
|
private:
|
|
|
|
void mapRegionCounters(const Decl *D);
|
|
|
|
void loadRegionCounts(GlobalDecl &GD, PGOProfileData *PGOData);
|
|
|
|
void emitCounterVariables();
|
|
|
|
|
|
|
|
/// Emit code to increment the counter at the given index
|
|
|
|
void emitCounterIncrement(CGBuilderTy &Builder, unsigned Counter);
|
|
|
|
|
|
|
|
/// Return the region counter for the given statement. This should only be
|
|
|
|
/// called on statements that have a dedicated counter.
|
|
|
|
unsigned getRegionCounter(const Stmt *S) {
|
|
|
|
if (RegionCounterMap == 0)
|
|
|
|
return 0;
|
|
|
|
return (*RegionCounterMap)[S];
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Return the region count for the counter at the given index.
|
|
|
|
uint64_t getRegionCount(unsigned Counter) {
|
|
|
|
if (!haveRegionCounts())
|
|
|
|
return 0;
|
|
|
|
return (*RegionCounts)[Counter];
|
|
|
|
}
|
|
|
|
|
|
|
|
friend class RegionCounter;
|
|
|
|
};
|
|
|
|
|
|
|
|
/// A counter for a particular region. This is the primary interface through
|
|
|
|
/// which clients manage PGO counters and their values.
|
|
|
|
class RegionCounter {
|
|
|
|
CodeGenPGO *PGO;
|
|
|
|
unsigned Counter;
|
|
|
|
uint64_t Count;
|
|
|
|
uint64_t ParentCount;
|
|
|
|
uint64_t RegionCount;
|
|
|
|
int64_t Adjust;
|
|
|
|
|
|
|
|
RegionCounter(CodeGenPGO &PGO, unsigned CounterIndex)
|
|
|
|
: PGO(&PGO), Counter(CounterIndex), Count(PGO.getRegionCount(Counter)),
|
|
|
|
ParentCount(PGO.getCurrentRegionCount()), Adjust(0) {}
|
|
|
|
|
|
|
|
public:
|
|
|
|
RegionCounter(CodeGenPGO &PGO, const Stmt *S)
|
|
|
|
: PGO(&PGO), Counter(PGO.getRegionCounter(S)),
|
|
|
|
Count(PGO.getRegionCount(Counter)),
|
|
|
|
ParentCount(PGO.getCurrentRegionCount()), Adjust(0) {}
|
|
|
|
|
|
|
|
/// Get the value of the counter. In most cases this is the number of times
|
|
|
|
/// the region of the counter was entered, but for switch labels it's the
|
|
|
|
/// number of direct jumps to that label.
|
|
|
|
uint64_t getCount() const { return Count; }
|
|
|
|
/// Get the value of the counter with adjustments applied. Adjustments occur
|
2014-02-18 03:21:03 +08:00
|
|
|
/// when control enters or leaves the region abnormally; i.e., if there is a
|
2014-01-07 06:27:43 +08:00
|
|
|
/// jump to a label within the region, or if the function can return from
|
|
|
|
/// within the region. The adjusted count, then, is the value of the counter
|
|
|
|
/// at the end of the region.
|
|
|
|
uint64_t getAdjustedCount() const {
|
2014-01-07 14:52:12 +08:00
|
|
|
assert((Adjust > 0 || (uint64_t)(-Adjust) <= Count) && "Negative count");
|
2014-01-07 06:27:43 +08:00
|
|
|
return Count + Adjust;
|
|
|
|
}
|
2014-02-18 03:21:03 +08:00
|
|
|
/// Get the value of the counter in this region's parent, i.e., the region
|
|
|
|
/// that was active when this region began. This is useful for deriving
|
|
|
|
/// counts in implicitly counted regions, like the false case of a condition
|
|
|
|
/// or the normal exits of a loop.
|
2014-01-07 06:27:43 +08:00
|
|
|
uint64_t getParentCount() const { return ParentCount; }
|
|
|
|
|
|
|
|
/// Get the number of times the condition of a loop will evaluate false. This
|
|
|
|
/// is the number of times we enter the loop, adjusted by the difference
|
|
|
|
/// between entering and exiting the loop body normally, excepting that
|
|
|
|
/// 'continue' statements also bring us back here.
|
|
|
|
///
|
|
|
|
/// Undefined if this counter is not counting a loop.
|
|
|
|
uint64_t getLoopExitCount() const {
|
|
|
|
return getParentCount() + getContinueCounter().getCount() +
|
|
|
|
getAdjustedCount() - getCount();
|
|
|
|
}
|
|
|
|
/// Get the associated break counter. Undefined if this counter is not
|
|
|
|
/// counting a loop.
|
|
|
|
RegionCounter getBreakCounter() const {
|
|
|
|
return RegionCounter(*PGO, Counter + 1);
|
|
|
|
}
|
|
|
|
/// Get the associated continue counter. Undefined if this counter is not
|
|
|
|
/// counting a loop.
|
|
|
|
RegionCounter getContinueCounter() const {
|
|
|
|
return RegionCounter(*PGO, Counter + 2);
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Activate the counter by emitting an increment and starting to track
|
|
|
|
/// adjustments. If AddIncomingFallThrough is true, the current region count
|
|
|
|
/// will be added to the counter for the purposes of tracking the region.
|
|
|
|
void beginRegion(CGBuilderTy &Builder, bool AddIncomingFallThrough=false) {
|
|
|
|
RegionCount = Count;
|
|
|
|
if (AddIncomingFallThrough)
|
|
|
|
RegionCount += PGO->getCurrentRegionCount();
|
|
|
|
PGO->setCurrentRegionCount(RegionCount);
|
|
|
|
PGO->emitCounterIncrement(Builder, Counter);
|
|
|
|
}
|
|
|
|
/// For counters on boolean branches, begins tracking adjustments for the
|
|
|
|
/// uncounted path.
|
|
|
|
void beginElseRegion() {
|
|
|
|
RegionCount = ParentCount - Count;
|
|
|
|
PGO->setCurrentRegionCount(RegionCount);
|
|
|
|
}
|
|
|
|
|
2014-01-14 05:24:22 +08:00
|
|
|
/// Adjust for non-local control flow after emitting a subexpression or
|
|
|
|
/// substatement. This must be called to account for constructs such as gotos,
|
|
|
|
/// labels, and returns, so that we can ensure that our region's count is
|
|
|
|
/// correct in the code that follows.
|
|
|
|
void adjustForControlFlow() {
|
2014-01-07 06:27:43 +08:00
|
|
|
Adjust += PGO->getCurrentRegionCount() - RegionCount;
|
|
|
|
}
|
|
|
|
/// Commit all adjustments to the current region. This should be called after
|
2014-01-14 05:24:22 +08:00
|
|
|
/// all blocks that adjust for control flow count have been emitted.
|
2014-01-07 06:27:43 +08:00
|
|
|
void applyAdjustmentsToRegion() {
|
|
|
|
PGO->setCurrentRegionCount(ParentCount + Adjust);
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
} // end namespace CodeGen
|
|
|
|
} // end namespace clang
|
|
|
|
|
|
|
|
#endif
|