2015-12-11 04:24:09 +08:00
|
|
|
/*===- InstrProfilingValue.c - Support library for PGO instrumentation ----===*\
|
|
|
|
|*
|
|
|
|
|* The LLVM Compiler Infrastructure
|
|
|
|
|*
|
|
|
|
|* This file is distributed under the University of Illinois Open Source
|
|
|
|
|* License. See LICENSE.TXT for details.
|
|
|
|
|*
|
|
|
|
\*===----------------------------------------------------------------------===*/
|
|
|
|
|
|
|
|
#include "InstrProfiling.h"
|
|
|
|
#include "InstrProfilingInternal.h"
|
2016-05-20 14:13:07 +08:00
|
|
|
#include "InstrProfilingUtil.h" /* For PS4 getenv shim. */
|
2015-12-11 04:24:09 +08:00
|
|
|
#include <limits.h>
|
|
|
|
#include <stdio.h>
|
|
|
|
#include <stdlib.h>
|
|
|
|
#include <string.h>
|
|
|
|
#define INSTR_PROF_VALUE_PROF_DATA
|
|
|
|
#define INSTR_PROF_COMMON_API_IMPL
|
|
|
|
#include "InstrProfData.inc"
|
|
|
|
|
|
|
|
#define PROF_OOM(Msg) PROF_ERR(Msg ":%s\n", "Out of memory");
|
|
|
|
#define PROF_OOM_RETURN(Msg) \
|
|
|
|
{ \
|
|
|
|
PROF_OOM(Msg) \
|
2015-12-29 15:13:59 +08:00
|
|
|
return NULL; \
|
2015-12-11 04:24:09 +08:00
|
|
|
}
|
|
|
|
|
2016-05-19 06:34:05 +08:00
|
|
|
COMPILER_RT_VISIBILITY uint32_t VPMaxNumValsPerSite =
|
|
|
|
INSTR_PROF_MAX_NUM_VAL_PER_SITE;
|
|
|
|
|
|
|
|
COMPILER_RT_VISIBILITY void lprofSetupValueProfiler() {
|
|
|
|
const char *Str = 0;
|
|
|
|
Str = getenv("LLVM_VP_MAX_NUM_VALS_PER_SITE");
|
|
|
|
if (Str && Str[0])
|
|
|
|
VPMaxNumValsPerSite = atoi(Str);
|
|
|
|
if (VPMaxNumValsPerSite > INSTR_PROF_MAX_NUM_VAL_PER_SITE)
|
|
|
|
VPMaxNumValsPerSite = INSTR_PROF_MAX_NUM_VAL_PER_SITE;
|
|
|
|
}
|
|
|
|
|
2016-05-20 05:35:34 +08:00
|
|
|
COMPILER_RT_VISIBILITY void lprofSetMaxValsPerSite(uint32_t MaxVals) {
|
|
|
|
VPMaxNumValsPerSite = MaxVals;
|
|
|
|
}
|
|
|
|
|
2015-12-11 04:24:09 +08:00
|
|
|
/* This method is only used in value profiler mock testing. */
|
2015-12-16 11:29:15 +08:00
|
|
|
COMPILER_RT_VISIBILITY void
|
2015-12-11 04:24:09 +08:00
|
|
|
__llvm_profile_set_num_value_sites(__llvm_profile_data *Data,
|
|
|
|
uint32_t ValueKind, uint16_t NumValueSites) {
|
|
|
|
*((uint16_t *)&Data->NumValueSites[ValueKind]) = NumValueSites;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* This method is only used in value profiler mock testing. */
|
2015-12-16 11:29:15 +08:00
|
|
|
COMPILER_RT_VISIBILITY const __llvm_profile_data *
|
2015-12-11 04:24:09 +08:00
|
|
|
__llvm_profile_iterate_data(const __llvm_profile_data *Data) {
|
|
|
|
return Data + 1;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* This method is only used in value profiler mock testing. */
|
2015-12-16 11:29:15 +08:00
|
|
|
COMPILER_RT_VISIBILITY void *
|
2015-12-11 04:24:09 +08:00
|
|
|
__llvm_get_function_addr(const __llvm_profile_data *Data) {
|
|
|
|
return Data->FunctionPointer;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Allocate an array that holds the pointers to the linked lists of
|
|
|
|
* value profile counter nodes. The number of element of the array
|
|
|
|
* is the total number of value profile sites instrumented. Returns
|
|
|
|
* 0 if allocation fails.
|
|
|
|
*/
|
|
|
|
|
|
|
|
static int allocateValueProfileCounters(__llvm_profile_data *Data) {
|
|
|
|
uint64_t NumVSites = 0;
|
|
|
|
uint32_t VKI;
|
|
|
|
for (VKI = IPVK_First; VKI <= IPVK_Last; ++VKI)
|
|
|
|
NumVSites += Data->NumValueSites[VKI];
|
|
|
|
|
|
|
|
ValueProfNode **Mem =
|
|
|
|
(ValueProfNode **)calloc(NumVSites, sizeof(ValueProfNode *));
|
|
|
|
if (!Mem)
|
|
|
|
return 0;
|
2015-12-16 11:29:15 +08:00
|
|
|
if (!COMPILER_RT_BOOL_CMPXCHG(&Data->Values, 0, Mem)) {
|
2015-12-11 04:24:09 +08:00
|
|
|
free(Mem);
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
return 1;
|
|
|
|
}
|
|
|
|
|
2015-12-16 11:29:15 +08:00
|
|
|
COMPILER_RT_VISIBILITY void
|
2015-12-11 04:24:09 +08:00
|
|
|
__llvm_profile_instrument_target(uint64_t TargetValue, void *Data,
|
|
|
|
uint32_t CounterIndex) {
|
|
|
|
|
|
|
|
__llvm_profile_data *PData = (__llvm_profile_data *)Data;
|
|
|
|
if (!PData)
|
|
|
|
return;
|
|
|
|
|
|
|
|
if (!PData->Values) {
|
|
|
|
if (!allocateValueProfileCounters(PData))
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
ValueProfNode **ValueCounters = (ValueProfNode **)PData->Values;
|
|
|
|
ValueProfNode *PrevVNode = NULL;
|
2016-05-20 05:35:34 +08:00
|
|
|
ValueProfNode *MinCountVNode = NULL;
|
2015-12-11 04:24:09 +08:00
|
|
|
ValueProfNode *CurrentVNode = ValueCounters[CounterIndex];
|
2016-05-20 05:35:34 +08:00
|
|
|
uint64_t MinCount = UINT64_MAX;
|
2015-12-11 04:24:09 +08:00
|
|
|
|
|
|
|
uint8_t VDataCount = 0;
|
|
|
|
while (CurrentVNode) {
|
2016-05-17 04:33:30 +08:00
|
|
|
if (TargetValue == CurrentVNode->Value) {
|
|
|
|
CurrentVNode->Count++;
|
2015-12-11 04:24:09 +08:00
|
|
|
return;
|
|
|
|
}
|
2016-05-20 05:35:34 +08:00
|
|
|
if (CurrentVNode->Count < MinCount) {
|
|
|
|
MinCount = CurrentVNode->Count;
|
|
|
|
MinCountVNode = CurrentVNode;
|
|
|
|
}
|
2015-12-11 04:24:09 +08:00
|
|
|
PrevVNode = CurrentVNode;
|
|
|
|
CurrentVNode = CurrentVNode->Next;
|
|
|
|
++VDataCount;
|
|
|
|
}
|
|
|
|
|
2016-05-20 05:35:34 +08:00
|
|
|
if (VDataCount >= VPMaxNumValsPerSite) {
|
|
|
|
/* Bump down the min count node's count. If it reaches 0,
|
|
|
|
* evict it. This eviction/replacement policy makes hot
|
|
|
|
* targets more sticky while cold targets less so. In other
|
|
|
|
* words, it makes it less likely for the hot targets to be
|
|
|
|
* prematurally evicted during warmup/establishment period,
|
|
|
|
* when their counts are still low. In a special case when
|
|
|
|
* the number of values tracked is reduced to only one, this
|
|
|
|
* policy will guarantee that the dominating target with >50%
|
|
|
|
* total count will survive in the end. Note that this scheme
|
|
|
|
* allows the runtime to track the min count node in an adaptive
|
|
|
|
* manner. It can correct previous mistakes and eventually
|
|
|
|
* lock on a cold target that is alread in stable state.
|
|
|
|
*
|
|
|
|
* In very rare cases, this replacement scheme may still lead
|
|
|
|
* to target loss. For instance, out of \c N value slots, \c N-1
|
|
|
|
* slots are occupied by luke warm targets during the warmup
|
|
|
|
* period and the remaining one slot is competed by two or more
|
|
|
|
* very hot targets. If those hot targets occur in an interleaved
|
|
|
|
* way, none of them will survive (gain enough weight to throw out
|
|
|
|
* other established entries) due to the ping-pong effect.
|
|
|
|
* To handle this situation, user can choose to increase the max
|
|
|
|
* number of tracked values per value site. Alternatively, a more
|
|
|
|
* expensive eviction mechanism can be implemented. It requires
|
|
|
|
* the runtime to track the total number of evictions per-site.
|
|
|
|
* When the total number of evictions reaches certain threshold,
|
|
|
|
* the runtime can wipe out more than one lowest count entries
|
|
|
|
* to give space for hot targets.
|
|
|
|
*/
|
|
|
|
if (!(--MinCountVNode->Count)) {
|
|
|
|
CurrentVNode = MinCountVNode;
|
|
|
|
CurrentVNode->Value = TargetValue;
|
|
|
|
CurrentVNode->Count++;
|
|
|
|
}
|
2015-12-11 04:24:09 +08:00
|
|
|
return;
|
2016-05-20 05:35:34 +08:00
|
|
|
}
|
2015-12-11 04:24:09 +08:00
|
|
|
|
|
|
|
CurrentVNode = (ValueProfNode *)calloc(1, sizeof(ValueProfNode));
|
|
|
|
if (!CurrentVNode)
|
|
|
|
return;
|
|
|
|
|
2016-05-17 04:33:30 +08:00
|
|
|
CurrentVNode->Value = TargetValue;
|
|
|
|
CurrentVNode->Count++;
|
2015-12-11 04:24:09 +08:00
|
|
|
|
|
|
|
uint32_t Success = 0;
|
|
|
|
if (!ValueCounters[CounterIndex])
|
2015-12-16 11:29:15 +08:00
|
|
|
Success =
|
|
|
|
COMPILER_RT_BOOL_CMPXCHG(&ValueCounters[CounterIndex], 0, CurrentVNode);
|
2015-12-11 04:24:09 +08:00
|
|
|
else if (PrevVNode && !PrevVNode->Next)
|
2015-12-16 11:29:15 +08:00
|
|
|
Success = COMPILER_RT_BOOL_CMPXCHG(&(PrevVNode->Next), 0, CurrentVNode);
|
2015-12-11 04:24:09 +08:00
|
|
|
|
|
|
|
if (!Success) {
|
|
|
|
free(CurrentVNode);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-05-13 05:43:49 +08:00
|
|
|
/*
|
2016-05-15 04:12:42 +08:00
|
|
|
* A wrapper struct that represents value profile runtime data.
|
|
|
|
* Like InstrProfRecord class which is used by profiling host tools,
|
|
|
|
* ValueProfRuntimeRecord also implements the abstract intefaces defined in
|
|
|
|
* ValueProfRecordClosure so that the runtime data can be serialized using
|
|
|
|
* shared C implementation.
|
2016-05-13 05:43:49 +08:00
|
|
|
*/
|
2016-05-15 04:12:42 +08:00
|
|
|
typedef struct ValueProfRuntimeRecord {
|
|
|
|
const __llvm_profile_data *Data;
|
|
|
|
ValueProfNode **NodesKind[IPVK_Last + 1];
|
|
|
|
uint8_t **SiteCountArray;
|
|
|
|
} ValueProfRuntimeRecord;
|
2016-05-13 05:43:49 +08:00
|
|
|
|
2016-05-15 04:12:42 +08:00
|
|
|
/* ValueProfRecordClosure Interface implementation. */
|
2016-05-13 05:43:49 +08:00
|
|
|
|
2016-05-15 04:12:42 +08:00
|
|
|
static uint32_t getNumValueSitesRT(const void *R, uint32_t VK) {
|
|
|
|
return ((const ValueProfRuntimeRecord *)R)->Data->NumValueSites[VK];
|
2016-05-13 05:43:49 +08:00
|
|
|
}
|
|
|
|
|
2016-05-15 04:12:42 +08:00
|
|
|
static uint32_t getNumValueDataRT(const void *R, uint32_t VK) {
|
|
|
|
uint32_t S = 0, I;
|
|
|
|
const ValueProfRuntimeRecord *Record = (const ValueProfRuntimeRecord *)R;
|
|
|
|
if (Record->SiteCountArray[VK] == INSTR_PROF_NULLPTR)
|
|
|
|
return 0;
|
|
|
|
for (I = 0; I < Record->Data->NumValueSites[VK]; I++)
|
|
|
|
S += Record->SiteCountArray[VK][I];
|
|
|
|
return S;
|
2016-05-13 05:43:49 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
static uint32_t getNumValueDataForSiteRT(const void *R, uint32_t VK,
|
|
|
|
uint32_t S) {
|
|
|
|
const ValueProfRuntimeRecord *Record = (const ValueProfRuntimeRecord *)R;
|
2016-05-15 04:12:42 +08:00
|
|
|
return Record->SiteCountArray[VK][S];
|
2016-05-13 05:43:49 +08:00
|
|
|
}
|
|
|
|
|
2016-05-15 04:12:42 +08:00
|
|
|
static ValueProfRuntimeRecord RTRecord;
|
|
|
|
static ValueProfRecordClosure RTRecordClosure = {
|
|
|
|
&RTRecord, INSTR_PROF_NULLPTR, /* GetNumValueKinds */
|
|
|
|
getNumValueSitesRT, getNumValueDataRT, getNumValueDataForSiteRT,
|
|
|
|
INSTR_PROF_NULLPTR, /* RemapValueData */
|
|
|
|
INSTR_PROF_NULLPTR, /* GetValueForSite, */
|
|
|
|
INSTR_PROF_NULLPTR /* AllocValueProfData */
|
|
|
|
};
|
|
|
|
|
|
|
|
static uint32_t
|
|
|
|
initializeValueProfRuntimeRecord(const __llvm_profile_data *Data,
|
|
|
|
uint8_t *SiteCountArray[]) {
|
|
|
|
unsigned I, J, S = 0, NumValueKinds = 0;
|
|
|
|
ValueProfNode **Nodes = (ValueProfNode **)Data->Values;
|
|
|
|
RTRecord.Data = Data;
|
|
|
|
RTRecord.SiteCountArray = SiteCountArray;
|
|
|
|
for (I = 0; I <= IPVK_Last; I++) {
|
|
|
|
uint16_t N = Data->NumValueSites[I];
|
|
|
|
if (!N)
|
|
|
|
continue;
|
|
|
|
|
|
|
|
NumValueKinds++;
|
|
|
|
|
|
|
|
RTRecord.NodesKind[I] = Nodes ? &Nodes[S] : INSTR_PROF_NULLPTR;
|
|
|
|
for (J = 0; J < N; J++) {
|
|
|
|
/* Compute value count for each site. */
|
|
|
|
uint32_t C = 0;
|
|
|
|
ValueProfNode *Site =
|
|
|
|
Nodes ? RTRecord.NodesKind[I][J] : INSTR_PROF_NULLPTR;
|
|
|
|
while (Site) {
|
|
|
|
C++;
|
|
|
|
Site = Site->Next;
|
|
|
|
}
|
|
|
|
if (C > UCHAR_MAX)
|
|
|
|
C = UCHAR_MAX;
|
|
|
|
RTRecord.SiteCountArray[I][J] = C;
|
|
|
|
}
|
|
|
|
S += N;
|
|
|
|
}
|
|
|
|
return NumValueKinds;
|
2016-05-13 05:43:49 +08:00
|
|
|
}
|
|
|
|
|
2016-05-15 04:12:42 +08:00
|
|
|
static ValueProfNode *getNextNValueData(uint32_t VK, uint32_t Site,
|
|
|
|
InstrProfValueData *Dst,
|
|
|
|
ValueProfNode *StartNode, uint32_t N) {
|
|
|
|
unsigned I;
|
|
|
|
ValueProfNode *VNode = StartNode ? StartNode : RTRecord.NodesKind[VK][Site];
|
2016-05-13 05:43:49 +08:00
|
|
|
for (I = 0; I < N; I++) {
|
2016-05-17 04:33:30 +08:00
|
|
|
Dst[I].Value = VNode->Value;
|
|
|
|
Dst[I].Count = VNode->Count;
|
2016-05-13 05:43:49 +08:00
|
|
|
VNode = VNode->Next;
|
|
|
|
}
|
2016-05-15 04:12:42 +08:00
|
|
|
return VNode;
|
2016-05-13 05:43:49 +08:00
|
|
|
}
|
|
|
|
|
2016-05-15 04:12:42 +08:00
|
|
|
static uint32_t getValueProfDataSizeWrapper() {
|
|
|
|
return getValueProfDataSize(&RTRecordClosure);
|
2016-05-13 05:43:49 +08:00
|
|
|
}
|
|
|
|
|
2016-05-15 04:12:42 +08:00
|
|
|
static uint32_t getNumValueDataForSiteWrapper(uint32_t VK, uint32_t S) {
|
|
|
|
return getNumValueDataForSiteRT(&RTRecord, VK, S);
|
2016-05-13 05:43:49 +08:00
|
|
|
}
|
|
|
|
|
2016-05-15 04:12:42 +08:00
|
|
|
static VPDataReaderType TheVPDataReader = {
|
|
|
|
initializeValueProfRuntimeRecord, getValueProfRecordHeaderSize,
|
|
|
|
getFirstValueProfRecord, getNumValueDataForSiteWrapper,
|
|
|
|
getValueProfDataSizeWrapper, getNextNValueData};
|
2015-12-11 04:24:09 +08:00
|
|
|
|
2016-05-15 04:12:42 +08:00
|
|
|
COMPILER_RT_VISIBILITY VPDataReaderType *lprofGetVPDataReader() {
|
|
|
|
return &TheVPDataReader;
|
2015-12-11 04:24:09 +08:00
|
|
|
}
|