2016-01-04 09:22:55 +08:00
|
|
|
/*===-- InstrProfData.inc - instr profiling runtime structures -*- C++ -*-=== *\
|
2015-11-23 13:47:05 +08:00
|
|
|
|*
|
2019-01-19 16:50:56 +08:00
|
|
|
|* Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
|
|
|* See https://llvm.org/LICENSE.txt for license information.
|
|
|
|
|* SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
2015-11-23 13:47:05 +08:00
|
|
|
|*
|
|
|
|
\*===----------------------------------------------------------------------===*/
|
|
|
|
/*
|
2021-02-12 13:46:35 +08:00
|
|
|
* This is the main file that defines all the data structures, signatures,
|
2015-11-23 13:47:05 +08:00
|
|
|
* constant literals that are shared across profiling runtime library,
|
|
|
|
* compiler (instrumentation), and host tools (reader/writer). The entities
|
|
|
|
* defined in this file affect the profile runtime ABI, the raw profile format,
|
|
|
|
* or both.
|
|
|
|
*
|
2021-02-12 13:46:35 +08:00
|
|
|
* The file has two identical copies. The primary copy lives in LLVM and
|
2015-11-23 13:47:05 +08:00
|
|
|
* the other one sits in compiler-rt/lib/profile directory. To make changes
|
2021-02-12 13:46:35 +08:00
|
|
|
* in this file, first modify the primary copy and copy it over to compiler-rt.
|
2015-11-23 13:47:05 +08:00
|
|
|
* Testing of any change in this file can start only after the two copies are
|
|
|
|
* synced up.
|
|
|
|
*
|
|
|
|
* The first part of the file includes macros that define types, names, and
|
|
|
|
* initializers for the member fields of the core data structures. The field
|
|
|
|
* declarations for one structure are enabled by defining the field activation
|
|
|
|
* macro associated with that structure. Only one field activation record
|
|
|
|
* can be defined at one time and the rest definitions will be filtered out by
|
|
|
|
* the preprocessor.
|
|
|
|
*
|
|
|
|
* Examples of how the template is used to instantiate structure definition:
|
|
|
|
* 1. To declare a structure:
|
2016-01-08 08:39:51 +08:00
|
|
|
*
|
2015-11-23 13:47:05 +08:00
|
|
|
* struct ProfData {
|
|
|
|
* #define INSTR_PROF_DATA(Type, LLVMType, Name, Initializer) \
|
|
|
|
* Type Name;
|
|
|
|
* #include "llvm/ProfileData/InstrProfData.inc"
|
|
|
|
* };
|
|
|
|
*
|
|
|
|
* 2. To construct LLVM type arrays for the struct type:
|
|
|
|
*
|
|
|
|
* Type *DataTypes[] = {
|
|
|
|
* #define INSTR_PROF_DATA(Type, LLVMType, Name, Initializer) \
|
|
|
|
* LLVMType,
|
|
|
|
* #include "llvm/ProfileData/InstrProfData.inc"
|
|
|
|
* };
|
|
|
|
*
|
|
|
|
* 3. To construct constant array for the initializers:
|
|
|
|
* #define INSTR_PROF_DATA(Type, LLVMType, Name, Initializer) \
|
|
|
|
* Initializer,
|
|
|
|
* Constant *ConstantVals[] = {
|
|
|
|
* #include "llvm/ProfileData/InstrProfData.inc"
|
|
|
|
* };
|
|
|
|
*
|
|
|
|
*
|
|
|
|
* The second part of the file includes definitions of all other entities that
|
|
|
|
* are related to runtime ABI and format. When no field activation macro is
|
|
|
|
* defined, this file can be included to introduce the definitions.
|
|
|
|
*
|
|
|
|
\*===----------------------------------------------------------------------===*/
|
|
|
|
|
2016-06-09 00:39:43 +08:00
|
|
|
/* Functions marked with INSTR_PROF_VISIBILITY must have hidden visibility in
 * the compiler runtime. A definition supplied by the includer is kept as is;
 * when none is supplied the macro expands to nothing. */
#ifndef INSTR_PROF_VISIBILITY
#define INSTR_PROF_VISIBILITY
#endif
|
|
|
|
|
2015-11-23 13:47:05 +08:00
|
|
|
/* INSTR_PROF_DATA start. */
/* Definition of member fields of the per-function control structure.
 *
 * Each entry has the form INSTR_PROF_DATA(Type, LLVMType, Name, Initializer).
 * If the includer did not define INSTR_PROF_DATA, an empty definition is
 * supplied so that the entries expand to nothing; otherwise
 * INSTR_PROF_DATA_DEFINED is set. The macro is always undefined again at the
 * end of the section. Consumers build structures from this list, so the order
 * of the entries must not be changed.
 */
#ifndef INSTR_PROF_DATA
#define INSTR_PROF_DATA(Type, LLVMType, Name, Initializer)
#else
#define INSTR_PROF_DATA_DEFINED
#endif
INSTR_PROF_DATA(const uint64_t, llvm::Type::getInt64Ty(Ctx), NameRef, \
                ConstantInt::get(llvm::Type::getInt64Ty(Ctx), \
                IndexedInstrProf::ComputeHash(getPGOFuncNameVarInitializer(Inc->getName()))))
INSTR_PROF_DATA(const uint64_t, llvm::Type::getInt64Ty(Ctx), FuncHash, \
                ConstantInt::get(llvm::Type::getInt64Ty(Ctx), \
                Inc->getHash()->getZExtValue()))
INSTR_PROF_DATA(const IntPtrT, llvm::Type::getInt64PtrTy(Ctx), CounterPtr, \
                ConstantExpr::getBitCast(CounterPtr, \
                llvm::Type::getInt64PtrTy(Ctx)))
/* This is used to map function pointers for the indirect call targets to
 * function name hashes during the conversion from raw to merged profile
 * data.
 */
INSTR_PROF_DATA(const IntPtrT, llvm::Type::getInt8PtrTy(Ctx), FunctionPointer, \
                FunctionAddr)
INSTR_PROF_DATA(IntPtrT, llvm::Type::getInt8PtrTy(Ctx), Values, \
                ValuesPtrExpr)
INSTR_PROF_DATA(const uint32_t, llvm::Type::getInt32Ty(Ctx), NumCounters, \
                ConstantInt::get(llvm::Type::getInt32Ty(Ctx), NumCounters))
INSTR_PROF_DATA(const uint16_t, Int16ArrayTy, NumValueSites[IPVK_Last+1], \
                ConstantArray::get(Int16ArrayTy, Int16ArrayVals))
#undef INSTR_PROF_DATA
/* INSTR_PROF_DATA end. */
|
|
|
|
|
2016-05-17 04:33:30 +08:00
|
|
|
|
|
|
|
/* This is an internal data structure used by value profiler. It
 * is defined here to allow serialization code sharing by LLVM
 * to be used in unit test.
 *
 * typedef struct ValueProfNode {
 *   // InstrProfValueData VData;
 *   uint64_t Value;
 *   uint64_t Count;
 *   struct ValueProfNode *Next;
 * } ValueProfNode;
 */
/* INSTR_PROF_VALUE_NODE start. */
/* Each entry has the form
 * INSTR_PROF_VALUE_NODE(Type, LLVMType, Name, Initializer). An empty
 * definition is supplied when the includer did not provide one; otherwise
 * INSTR_PROF_DATA_DEFINED is set. The macro is undefined at the end of the
 * section.
 *
 * The initializers use the lower-camel llvm::Type accessors (getInt64Ty,
 * getInt8PtrTy), matching the LLVMType argument of the same entry.
 *
 * NOTE(review): the Next initializer passes a pointer type to
 * ConstantInt::get; confirm whether a null-pointer constant was intended.
 */
#ifndef INSTR_PROF_VALUE_NODE
#define INSTR_PROF_VALUE_NODE(Type, LLVMType, Name, Initializer)
#else
#define INSTR_PROF_DATA_DEFINED
#endif
INSTR_PROF_VALUE_NODE(uint64_t, llvm::Type::getInt64Ty(Ctx), Value, \
                      ConstantInt::get(llvm::Type::getInt64Ty(Ctx), 0))
INSTR_PROF_VALUE_NODE(uint64_t, llvm::Type::getInt64Ty(Ctx), Count, \
                      ConstantInt::get(llvm::Type::getInt64Ty(Ctx), 0))
INSTR_PROF_VALUE_NODE(PtrToNodeT, llvm::Type::getInt8PtrTy(Ctx), Next, \
                      ConstantInt::get(llvm::Type::getInt8PtrTy(Ctx), 0))
#undef INSTR_PROF_VALUE_NODE
/* INSTR_PROF_VALUE_NODE end. */
|
|
|
|
|
2015-11-23 13:47:05 +08:00
|
|
|
/* INSTR_PROF_RAW_HEADER start */
/* Definition of member fields of the raw profile header data structure.
 *
 * Each entry has the form INSTR_PROF_RAW_HEADER(Type, Name, Initializer).
 * An empty definition is supplied when the includer did not provide one;
 * otherwise INSTR_PROF_DATA_DEFINED is set. The macro is undefined at the end
 * of the section. Every field is a uint64_t; the order of the entries must
 * not be changed because consumers build the header from this list.
 */
#ifndef INSTR_PROF_RAW_HEADER
#define INSTR_PROF_RAW_HEADER(Type, Name, Initializer)
#else
#define INSTR_PROF_DATA_DEFINED
#endif
INSTR_PROF_RAW_HEADER(uint64_t, Magic, __llvm_profile_get_magic())
INSTR_PROF_RAW_HEADER(uint64_t, Version, __llvm_profile_get_version())
INSTR_PROF_RAW_HEADER(uint64_t, DataSize, DataSize)
INSTR_PROF_RAW_HEADER(uint64_t, PaddingBytesBeforeCounters, PaddingBytesBeforeCounters)
INSTR_PROF_RAW_HEADER(uint64_t, CountersSize, CountersSize)
INSTR_PROF_RAW_HEADER(uint64_t, PaddingBytesAfterCounters, PaddingBytesAfterCounters)
INSTR_PROF_RAW_HEADER(uint64_t, NamesSize, NamesSize)
INSTR_PROF_RAW_HEADER(uint64_t, CountersDelta, (uintptr_t)CountersBegin)
INSTR_PROF_RAW_HEADER(uint64_t, NamesDelta, (uintptr_t)NamesBegin)
INSTR_PROF_RAW_HEADER(uint64_t, ValueKindLast, IPVK_Last)
INSTR_PROF_RAW_HEADER(uint64_t, BinaryIdsSize, __llvm_write_binary_ids(NULL))
#undef INSTR_PROF_RAW_HEADER
/* INSTR_PROF_RAW_HEADER end */
|
|
|
|
|
|
|
|
/* VALUE_PROF_FUNC_PARAM start */
/* Definition of parameter types of the runtime API used to do value profiling
 * for a given value site.
 *
 * Each entry has the form VALUE_PROF_FUNC_PARAM(ArgType, ArgName, ArgLLVMType).
 * INSTR_PROF_COMMA separates consecutive entries: it expands to ',' when the
 * includer supplied VALUE_PROF_FUNC_PARAM and to nothing when the empty
 * default definition is in effect. Both macros are undefined at the end of
 * the section.
 */
#ifndef VALUE_PROF_FUNC_PARAM
#define VALUE_PROF_FUNC_PARAM(ArgType, ArgName, ArgLLVMType)
#define INSTR_PROF_COMMA
#else
#define INSTR_PROF_DATA_DEFINED
#define INSTR_PROF_COMMA ,
#endif
VALUE_PROF_FUNC_PARAM(uint64_t, TargetValue, Type::getInt64Ty(Ctx)) \
                      INSTR_PROF_COMMA
VALUE_PROF_FUNC_PARAM(void *, Data, Type::getInt8PtrTy(Ctx)) INSTR_PROF_COMMA
VALUE_PROF_FUNC_PARAM(uint32_t, CounterIndex, Type::getInt32Ty(Ctx))
#undef VALUE_PROF_FUNC_PARAM
#undef INSTR_PROF_COMMA
/* VALUE_PROF_FUNC_PARAM end */
|
|
|
|
|
|
|
|
/* VALUE_PROF_KIND start */
/* Each entry has the form VALUE_PROF_KIND(Enumerator, Value, Descr). An empty
 * definition is supplied when the includer did not provide one; otherwise
 * INSTR_PROF_DATA_DEFINED is set. The macro is undefined at the end of the
 * section.
 */
#ifndef VALUE_PROF_KIND
#define VALUE_PROF_KIND(Enumerator, Value, Descr)
#else
#define INSTR_PROF_DATA_DEFINED
#endif
/* For indirect function call value profiling, the addresses of the target
 * functions are profiled by the instrumented code. The target addresses are
 * written in the raw profile data and converted to target function name's MD5
 * hash by the profile reader during deserialization.  Typically, this happens
 * when the raw profile data is read during profile merging.
 *
 * For this remapping the ProfData is used.  ProfData contains both the function
 * name hash and the function address.
 */
VALUE_PROF_KIND(IPVK_IndirectCallTarget, 0, "indirect call target")
/* For memory intrinsic functions size profiling. */
VALUE_PROF_KIND(IPVK_MemOPSize, 1, "memory intrinsic functions size")
/* These two kinds must be the last to be
 * declared. This is to make sure the string
 * array created with the template can be
 * indexed with the kind value.
 */
VALUE_PROF_KIND(IPVK_First, IPVK_IndirectCallTarget, "first")
VALUE_PROF_KIND(IPVK_Last, IPVK_MemOPSize, "last")

#undef VALUE_PROF_KIND
/* VALUE_PROF_KIND end */
|
|
|
|
|
2019-10-22 02:48:38 +08:00
|
|
|
/* COVMAP_V2_OR_V3 is recomputed on every inclusion: any earlier definition is
 * dropped first, then the macro is defined exactly when the includer has
 * defined COVMAP_V2 or COVMAP_V3. */
#undef COVMAP_V2_OR_V3
#if defined(COVMAP_V2) || defined(COVMAP_V3)
#define COVMAP_V2_OR_V3
#endif
|
|
|
|
|
2015-11-23 13:47:05 +08:00
|
|
|
/* COVMAP_FUNC_RECORD start */
/* Definition of member fields of the function record structure in coverage
 * map.
 *
 * Each entry has the form
 * COVMAP_FUNC_RECORD(Type, LLVMType, Name, Initializer). An empty definition
 * is supplied when the includer did not provide one; otherwise
 * INSTR_PROF_DATA_DEFINED is set. Which entries are emitted depends on the
 * COVMAP_V1 / COVMAP_V2_OR_V3 / COVMAP_V3 macros: NamePtr and NameSize only
 * for V1, NameRef for V2 or V3, FilenamesRef and CoverageMapping only for V3;
 * DataSize and FuncHash are always emitted. The macro is undefined at the end
 * of the section.
 */
#ifndef COVMAP_FUNC_RECORD
#define COVMAP_FUNC_RECORD(Type, LLVMType, Name, Initializer)
#else
#define INSTR_PROF_DATA_DEFINED
#endif
#ifdef COVMAP_V1
COVMAP_FUNC_RECORD(const IntPtrT, llvm::Type::getInt8PtrTy(Ctx), \
                   NamePtr, llvm::ConstantExpr::getBitCast(NamePtr, \
                   llvm::Type::getInt8PtrTy(Ctx)))
COVMAP_FUNC_RECORD(const uint32_t, llvm::Type::getInt32Ty(Ctx), NameSize, \
                   llvm::ConstantInt::get(llvm::Type::getInt32Ty(Ctx), \
                   NameValue.size()))
#endif
#ifdef COVMAP_V2_OR_V3
/* NOTE(review): NameRef is declared as a signed const int64_t here, while the
 * NameRef entry of INSTR_PROF_DATA uses const uint64_t; confirm whether the
 * difference is intentional before relying on its signedness. */
COVMAP_FUNC_RECORD(const int64_t, llvm::Type::getInt64Ty(Ctx), NameRef, \
                   llvm::ConstantInt::get( \
                     llvm::Type::getInt64Ty(Ctx), NameHash))
#endif
COVMAP_FUNC_RECORD(const uint32_t, llvm::Type::getInt32Ty(Ctx), DataSize, \
                   llvm::ConstantInt::get( \
                     llvm::Type::getInt32Ty(Ctx), CoverageMapping.size()))
COVMAP_FUNC_RECORD(const uint64_t, llvm::Type::getInt64Ty(Ctx), FuncHash, \
                   llvm::ConstantInt::get( \
                     llvm::Type::getInt64Ty(Ctx), FuncHash))
#ifdef COVMAP_V3
COVMAP_FUNC_RECORD(const uint64_t, llvm::Type::getInt64Ty(Ctx), FilenamesRef, \
                   llvm::ConstantInt::get( \
                     llvm::Type::getInt64Ty(Ctx), FilenamesRef))
COVMAP_FUNC_RECORD(const char, \
                   llvm::ArrayType::get(llvm::Type::getInt8Ty(Ctx), \
                                        CoverageMapping.size()), \
                   CoverageMapping, \
                   llvm::ConstantDataArray::getRaw( \
                     CoverageMapping, CoverageMapping.size(), \
                     llvm::Type::getInt8Ty(Ctx)))
#endif
#undef COVMAP_FUNC_RECORD
/* COVMAP_FUNC_RECORD end.  */
|
|
|
|
|
2016-01-04 02:36:30 +08:00
|
|
|
/* COVMAP_HEADER start */
/* Definition of member fields of coverage map header.
 *
 * Each entry has the form COVMAP_HEADER(Type, LLVMType, Name, Initializer).
 * An empty definition is supplied when the includer did not provide one;
 * otherwise INSTR_PROF_DATA_DEFINED is set. The macro is undefined at the end
 * of the section. All four fields are uint32_t.
 */
#ifndef COVMAP_HEADER
#define COVMAP_HEADER(Type, LLVMType, Name, Initializer)
#else
#define INSTR_PROF_DATA_DEFINED
#endif
COVMAP_HEADER(uint32_t, Int32Ty, NRecords, \
              llvm::ConstantInt::get(Int32Ty, NRecords))
COVMAP_HEADER(uint32_t, Int32Ty, FilenamesSize, \
              llvm::ConstantInt::get(Int32Ty, FilenamesSize))
COVMAP_HEADER(uint32_t, Int32Ty, CoverageSize, \
              llvm::ConstantInt::get(Int32Ty, CoverageMappingSize))
COVMAP_HEADER(uint32_t, Int32Ty, Version, \
              llvm::ConstantInt::get(Int32Ty, CovMapVersion::CurrentVersion))
#undef COVMAP_HEADER
/* COVMAP_HEADER end.  */
|
|
|
|
|
2015-11-23 13:47:05 +08:00
|
|
|
|
2017-04-14 07:37:15 +08:00
|
|
|
/* Section table. Unlike the field tables, this section is active only when
 * the includer defines INSTR_PROF_SECT_ENTRY; no empty default is supplied.
 * Each entry passes four arguments: the IPSK_* kind, the quoted *_COMMON
 * name, the *_COFF name, and a prefix string ("__DATA," or "__LLVM_COV,").
 * The macro is undefined at the end of the section.
 */
#ifdef INSTR_PROF_SECT_ENTRY
#define INSTR_PROF_DATA_DEFINED
INSTR_PROF_SECT_ENTRY(IPSK_data, \
                      INSTR_PROF_QUOTE(INSTR_PROF_DATA_COMMON), \
                      INSTR_PROF_DATA_COFF, "__DATA,")
INSTR_PROF_SECT_ENTRY(IPSK_cnts, \
                      INSTR_PROF_QUOTE(INSTR_PROF_CNTS_COMMON), \
                      INSTR_PROF_CNTS_COFF, "__DATA,")
INSTR_PROF_SECT_ENTRY(IPSK_name, \
                      INSTR_PROF_QUOTE(INSTR_PROF_NAME_COMMON), \
                      INSTR_PROF_NAME_COFF, "__DATA,")
INSTR_PROF_SECT_ENTRY(IPSK_vals, \
                      INSTR_PROF_QUOTE(INSTR_PROF_VALS_COMMON), \
                      INSTR_PROF_VALS_COFF, "__DATA,")
INSTR_PROF_SECT_ENTRY(IPSK_vnodes, \
                      INSTR_PROF_QUOTE(INSTR_PROF_VNODES_COMMON), \
                      INSTR_PROF_VNODES_COFF, "__DATA,")
INSTR_PROF_SECT_ENTRY(IPSK_covmap, \
                      INSTR_PROF_QUOTE(INSTR_PROF_COVMAP_COMMON), \
                      INSTR_PROF_COVMAP_COFF, "__LLVM_COV,")
INSTR_PROF_SECT_ENTRY(IPSK_covfun, \
                      INSTR_PROF_QUOTE(INSTR_PROF_COVFUN_COMMON), \
                      INSTR_PROF_COVFUN_COFF, "__LLVM_COV,")
/* NOTE(review): this is the only entry that wraps its *_COFF argument in
 * INSTR_PROF_QUOTE; presumably INSTR_PROF_ORDERFILE_COFF is defined unquoted
 * -- confirm against its definition. */
INSTR_PROF_SECT_ENTRY(IPSK_orderfile, \
                      INSTR_PROF_QUOTE(INSTR_PROF_ORDERFILE_COMMON), \
                      INSTR_PROF_QUOTE(INSTR_PROF_ORDERFILE_COFF), "__DATA,")

#undef INSTR_PROF_SECT_ENTRY
#endif
|
|
|
|
|
|
|
|
|
2015-11-29 03:12:23 +08:00
|
|
|
#ifdef INSTR_PROF_VALUE_PROF_DATA
|
|
|
|
#define INSTR_PROF_DATA_DEFINED
|
|
|
|
|
2016-01-08 08:39:51 +08:00
|
|
|
/* NOTE(review): presumably the cap on the number of values recorded per value
 * site; 255 is also the largest count a uint8_t SiteCountArray entry can hold
 * -- confirm against the users of this macro. */
#define INSTR_PROF_MAX_NUM_VAL_PER_SITE 255
|
|
|
|
/*!
 * This is the header of the data structure that defines the on-disk
 * layout of the value profile data of a particular kind for one function.
 *
 * Only the three leading fields are real members; the padding and the value
 * data that follow them are described in comments because their sizes vary
 * per record. The member functions are declared for C++ includers only.
 */
typedef struct ValueProfRecord {
  /* The kind of the value profile record. */
  uint32_t Kind;
  /*
   * The number of value profile sites. It is guaranteed to be non-zero;
   * otherwise the record for this kind won't be emitted.
   */
  uint32_t NumValueSites;
  /*
   * The first element of the array that stores the number of profiled
   * values for each value site. The size of the array is NumValueSites.
   * Since NumValueSites is greater than zero, there is at least one
   * element in the array.
   */
  uint8_t SiteCountArray[1];

  /*
   * The fake declaration is for documentation purpose only.
   * Align the start of next field to be on 8 byte boundaries.
  uint8_t Padding[X];
   */

  /* The array of value profile data. The size of the array is the sum
   * of all elements in SiteCountArray[].
  InstrProfValueData ValueData[];
   */

#ifdef __cplusplus
  /*!
   * Return the number of value sites.
   */
  uint32_t getNumValueSites() const { return NumValueSites; }
  /*!
   * Read data from this record and save it to Record.
   */
  void deserializeTo(InstrProfRecord &Record,
                     InstrProfSymtab *SymTab);
  /*
   * In-place byte swap:
   * Do byte swap for this instance. \c Old is the original order before
   * the swap, and \c New is the New byte order.
   */
  void swapBytes(support::endianness Old, support::endianness New);
#endif
} ValueProfRecord;
|
|
|
|
|
|
|
|
/*!
 * Per-function header/control data structure for value profiling
 * data in indexed format.
 *
 * Only TotalSize and NumValueKinds are real members; the variable-length
 * records that follow are described in a comment. The member functions are
 * declared for C++ includers only.
 */
typedef struct ValueProfData {
  /*
   * Total size in bytes including this field. It must be a multiple
   * of sizeof(uint64_t).
   */
  uint32_t TotalSize;
  /*
   * The number of value profile kinds that has value profile data.
   * In this implementation, a value profile kind is considered to
   * have profile data if the number of value profile sites for the
   * kind is not zero. More aggressively, the implementation can
   * choose to check the actual data value: if none of the value sites
   * has any profiled values, the kind can be skipped.
   */
  uint32_t NumValueKinds;

  /*
   * Following are a sequence of variable length records. The prefix/header
   * of each record is defined by ValueProfRecord type. The number of
   * records is NumValueKinds.
   * ValueProfRecord Record_1;
   * ValueProfRecord Record_N;
   */

  /* Tested with #ifdef (as ValueProfRecord does) so that C includers never
   * evaluate the undefined identifier __cplusplus in an #if expression. */
#ifdef __cplusplus
  /*!
   * Return the total size in bytes of the on-disk value profile data
   * given the data stored in Record.
   */
  static uint32_t getSize(const InstrProfRecord &Record);
  /*!
   * Return a pointer to \c ValueProfData instance ready to be streamed.
   */
  static std::unique_ptr<ValueProfData>
  serializeFrom(const InstrProfRecord &Record);
  /*!
   * Check the integrity of the record.
   */
  Error checkIntegrity();
  /*!
   * Return a pointer to \c ValueProfData instance ready to be read.
   * All data in the instance are properly byte swapped. The input
   * data is assumed to be in little endian order.
   */
  static Expected<std::unique_ptr<ValueProfData>>
  getValueProfData(const unsigned char *SrcBuffer,
                   const unsigned char *const SrcBufferEnd,
                   support::endianness SrcDataEndianness);
  /*!
   * Swap byte order from \c Endianness order to host byte order.
   */
  void swapBytesToHost(support::endianness Endianness);
  /*!
   * Swap byte order from host byte order to \c Endianness order.
   */
  void swapBytesFromHost(support::endianness Endianness);
  /*!
   * Return the total size of \c ValueProfData.
   */
  uint32_t getSize() const { return TotalSize; }
  /*!
   * Read data from this data and save it to \c Record.
   */
  void deserializeTo(InstrProfRecord &Record,
                     InstrProfSymtab *SymTab);
  /* Forwards to the global operator delete. */
  void operator delete(void *ptr) { ::operator delete(ptr); }
#endif
} ValueProfData;
|
|
|
|
|
2016-01-08 08:39:51 +08:00
|
|
|
/*
|
2015-11-29 03:12:23 +08:00
|
|
|
* The closure is designed to abstact away two types of value profile data:
|
2015-11-29 12:53:15 +08:00
|
|
|
* - InstrProfRecord which is the primary data structure used to
|
|
|
|
* represent profile data in host tools (reader, writer, and profile-use)
|
2015-11-29 03:12:23 +08:00
|
|
|
* - value profile runtime data structure suitable to be used by C
|
2015-11-29 12:53:15 +08:00
|
|
|
* runtime library.
|
2015-11-29 03:12:23 +08:00
|
|
|
*
|
|
|
|
* Both sources of data need to serialize to disk/memory-buffer in common
|
|
|
|
* format: ValueProfData. The abstraction allows compiler-rt's raw profiler
|
2015-11-29 12:53:15 +08:00
|
|
|
* writer to share the same format and code with indexed profile writer.
|
2015-11-29 03:12:23 +08:00
|
|
|
*
|
|
|
|
* For documentation of the member methods below, refer to corresponding methods
|
|
|
|
* in class InstrProfRecord.
|
|
|
|
*/
|
|
|
|
typedef struct ValueProfRecordClosure {
|
|
|
|
const void *Record;
|
|
|
|
uint32_t (*GetNumValueKinds)(const void *Record);
|
|
|
|
uint32_t (*GetNumValueSites)(const void *Record, uint32_t VKind);
|
|
|
|
uint32_t (*GetNumValueData)(const void *Record, uint32_t VKind);
|
|
|
|
uint32_t (*GetNumValueDataForSite)(const void *R, uint32_t VK, uint32_t S);
|
|
|
|
|
2016-01-08 08:39:51 +08:00
|
|
|
/*
|
2015-11-29 03:12:23 +08:00
|
|
|
* After extracting the value profile data from the value profile record,
|
|
|
|
* this method is used to map the in-memory value to on-disk value. If
|
|
|
|
* the method is null, value will be written out untranslated.
|
|
|
|
*/
|
|
|
|
uint64_t (*RemapValueData)(uint32_t, uint64_t Value);
|
|
|
|
void (*GetValueForSite)(const void *R, InstrProfValueData *Dst, uint32_t K,
|
2016-02-09 02:14:02 +08:00
|
|
|
uint32_t S);
|
2015-11-29 03:12:23 +08:00
|
|
|
ValueProfData *(*AllocValueProfData)(size_t TotalSizeInBytes);
|
|
|
|
} ValueProfRecordClosure;
|
|
|
|
|
2016-06-09 00:39:43 +08:00
|
|
|
INSTR_PROF_VISIBILITY ValueProfRecord *
|
|
|
|
getFirstValueProfRecord(ValueProfData *VPD);
|
|
|
|
INSTR_PROF_VISIBILITY ValueProfRecord *
|
|
|
|
getValueProfRecordNext(ValueProfRecord *VPR);
|
|
|
|
INSTR_PROF_VISIBILITY InstrProfValueData *
|
|
|
|
getValueProfRecordValueData(ValueProfRecord *VPR);
|
|
|
|
INSTR_PROF_VISIBILITY uint32_t
|
|
|
|
getValueProfRecordHeaderSize(uint32_t NumValueSites);
|
2015-11-29 12:53:15 +08:00
|
|
|
|
2015-11-29 03:12:23 +08:00
|
|
|
#undef INSTR_PROF_VALUE_PROF_DATA
|
2016-01-08 08:39:51 +08:00
|
|
|
#endif /* INSTR_PROF_VALUE_PROF_DATA */
|
2015-11-29 03:12:23 +08:00
|
|
|
|
|
|
|
|
|
|
|
#ifdef INSTR_PROF_COMMON_API_IMPL
|
|
|
|
#define INSTR_PROF_DATA_DEFINED
|
|
|
|
#ifdef __cplusplus
|
|
|
|
#define INSTR_PROF_INLINE inline
|
2016-01-27 08:14:15 +08:00
|
|
|
#define INSTR_PROF_NULLPTR nullptr
|
2015-11-29 03:12:23 +08:00
|
|
|
#else
|
|
|
|
#define INSTR_PROF_INLINE
|
2016-01-27 08:14:15 +08:00
|
|
|
#define INSTR_PROF_NULLPTR NULL
|
2015-11-29 03:12:23 +08:00
|
|
|
#endif
|
|
|
|
|
|
|
|
#ifndef offsetof
|
|
|
|
#define offsetof(TYPE, MEMBER) ((size_t) &((TYPE *)0)->MEMBER)
|
|
|
|
#endif
|
|
|
|
|
|
|
|
/*!
|
2019-01-16 05:59:17 +08:00
|
|
|
* Return the \c ValueProfRecord header size including the
|
2015-11-29 03:12:23 +08:00
|
|
|
* padding bytes.
|
|
|
|
*/
|
2016-06-09 00:39:43 +08:00
|
|
|
INSTR_PROF_VISIBILITY INSTR_PROF_INLINE
|
2015-11-29 03:12:23 +08:00
|
|
|
uint32_t getValueProfRecordHeaderSize(uint32_t NumValueSites) {
|
|
|
|
uint32_t Size = offsetof(ValueProfRecord, SiteCountArray) +
|
|
|
|
sizeof(uint8_t) * NumValueSites;
|
|
|
|
/* Round the size to multiple of 8 bytes. */
|
|
|
|
Size = (Size + 7) & ~7;
|
|
|
|
return Size;
|
|
|
|
}
|
|
|
|
|
2016-01-08 08:39:51 +08:00
|
|
|
/*!
|
2019-01-16 05:59:17 +08:00
|
|
|
* Return the total size of the value profile record including the
|
2015-11-29 03:12:23 +08:00
|
|
|
* header and the value data.
|
|
|
|
*/
|
2016-06-09 00:39:43 +08:00
|
|
|
INSTR_PROF_VISIBILITY INSTR_PROF_INLINE
|
2015-11-29 03:12:23 +08:00
|
|
|
uint32_t getValueProfRecordSize(uint32_t NumValueSites,
|
|
|
|
uint32_t NumValueData) {
|
|
|
|
return getValueProfRecordHeaderSize(NumValueSites) +
|
|
|
|
sizeof(InstrProfValueData) * NumValueData;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*!
|
2019-01-16 05:59:17 +08:00
|
|
|
* Return the pointer to the start of value data array.
|
2015-11-29 03:12:23 +08:00
|
|
|
*/
|
2016-06-09 00:39:43 +08:00
|
|
|
INSTR_PROF_VISIBILITY INSTR_PROF_INLINE
|
2015-11-29 03:12:23 +08:00
|
|
|
InstrProfValueData *getValueProfRecordValueData(ValueProfRecord *This) {
|
|
|
|
return (InstrProfValueData *)((char *)This + getValueProfRecordHeaderSize(
|
|
|
|
This->NumValueSites));
|
|
|
|
}
|
|
|
|
|
2016-01-08 08:39:51 +08:00
|
|
|
/*!
|
2019-01-16 05:59:17 +08:00
|
|
|
* Return the total number of value data for \c This record.
|
2015-11-29 03:12:23 +08:00
|
|
|
*/
|
2016-06-09 00:39:43 +08:00
|
|
|
INSTR_PROF_VISIBILITY INSTR_PROF_INLINE
|
2015-11-29 03:12:23 +08:00
|
|
|
uint32_t getValueProfRecordNumValueData(ValueProfRecord *This) {
|
|
|
|
uint32_t NumValueData = 0;
|
|
|
|
uint32_t I;
|
|
|
|
for (I = 0; I < This->NumValueSites; I++)
|
|
|
|
NumValueData += This->SiteCountArray[I];
|
|
|
|
return NumValueData;
|
|
|
|
}
|
|
|
|
|
2016-01-08 08:39:51 +08:00
|
|
|
/*!
|
2019-01-16 05:59:17 +08:00
|
|
|
* Use this method to advance to the next \c This \c ValueProfRecord.
|
2015-11-29 03:12:23 +08:00
|
|
|
*/
|
2016-06-09 00:39:43 +08:00
|
|
|
INSTR_PROF_VISIBILITY INSTR_PROF_INLINE
|
2015-11-29 03:12:23 +08:00
|
|
|
ValueProfRecord *getValueProfRecordNext(ValueProfRecord *This) {
|
|
|
|
uint32_t NumValueData = getValueProfRecordNumValueData(This);
|
|
|
|
return (ValueProfRecord *)((char *)This +
|
|
|
|
getValueProfRecordSize(This->NumValueSites,
|
|
|
|
NumValueData));
|
|
|
|
}
|
|
|
|
|
|
|
|
/*!
|
2019-01-16 05:59:17 +08:00
|
|
|
* Return the first \c ValueProfRecord instance.
|
2015-11-29 03:12:23 +08:00
|
|
|
*/
|
2016-06-09 00:39:43 +08:00
|
|
|
INSTR_PROF_VISIBILITY INSTR_PROF_INLINE
|
2015-11-29 03:12:23 +08:00
|
|
|
ValueProfRecord *getFirstValueProfRecord(ValueProfData *This) {
|
|
|
|
return (ValueProfRecord *)((char *)This + sizeof(ValueProfData));
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Closure based interfaces. */
|
|
|
|
|
2016-01-08 08:39:51 +08:00
|
|
|
/*!
|
2015-11-29 03:12:23 +08:00
|
|
|
* Return the total size in bytes of the on-disk value profile data
|
|
|
|
* given the data stored in Record.
|
|
|
|
*/
|
2016-06-09 00:39:43 +08:00
|
|
|
INSTR_PROF_VISIBILITY uint32_t
|
|
|
|
getValueProfDataSize(ValueProfRecordClosure *Closure) {
|
2015-11-29 03:12:23 +08:00
|
|
|
uint32_t Kind;
|
|
|
|
uint32_t TotalSize = sizeof(ValueProfData);
|
|
|
|
const void *Record = Closure->Record;
|
|
|
|
|
|
|
|
for (Kind = IPVK_First; Kind <= IPVK_Last; Kind++) {
|
|
|
|
uint32_t NumValueSites = Closure->GetNumValueSites(Record, Kind);
|
|
|
|
if (!NumValueSites)
|
|
|
|
continue;
|
|
|
|
TotalSize += getValueProfRecordSize(NumValueSites,
|
|
|
|
Closure->GetNumValueData(Record, Kind));
|
|
|
|
}
|
|
|
|
return TotalSize;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*!
|
|
|
|
* Extract value profile data of a function for the profile kind \c ValueKind
|
|
|
|
* from the \c Closure and serialize the data into \c This record instance.
|
|
|
|
*/
|
2016-06-09 00:39:43 +08:00
|
|
|
INSTR_PROF_VISIBILITY void
|
|
|
|
serializeValueProfRecordFrom(ValueProfRecord *This,
|
|
|
|
ValueProfRecordClosure *Closure,
|
|
|
|
uint32_t ValueKind, uint32_t NumValueSites) {
|
2015-11-29 03:12:23 +08:00
|
|
|
uint32_t S;
|
|
|
|
const void *Record = Closure->Record;
|
|
|
|
This->Kind = ValueKind;
|
|
|
|
This->NumValueSites = NumValueSites;
|
|
|
|
InstrProfValueData *DstVD = getValueProfRecordValueData(This);
|
|
|
|
|
|
|
|
for (S = 0; S < NumValueSites; S++) {
|
|
|
|
uint32_t ND = Closure->GetNumValueDataForSite(Record, ValueKind, S);
|
|
|
|
This->SiteCountArray[S] = ND;
|
2016-02-09 02:14:02 +08:00
|
|
|
Closure->GetValueForSite(Record, DstVD, ValueKind, S);
|
2015-11-29 03:12:23 +08:00
|
|
|
DstVD += ND;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/*!
|
|
|
|
* Extract value profile data of a function from the \c Closure
|
|
|
|
* and serialize the data into \c DstData if it is not NULL or heap
|
2016-05-12 05:16:11 +08:00
|
|
|
* memory allocated by the \c Closure's allocator method. If \c
|
|
|
|
* DstData is not null, the caller is expected to set the TotalSize
|
|
|
|
* in DstData.
|
2015-11-29 03:12:23 +08:00
|
|
|
*/
|
2016-06-09 00:39:43 +08:00
|
|
|
INSTR_PROF_VISIBILITY ValueProfData *
|
|
|
|
serializeValueProfDataFrom(ValueProfRecordClosure *Closure,
|
|
|
|
ValueProfData *DstData) {
|
2015-11-29 03:12:23 +08:00
|
|
|
uint32_t Kind;
|
2016-05-15 04:12:42 +08:00
|
|
|
uint32_t TotalSize =
|
2016-05-12 05:16:11 +08:00
|
|
|
DstData ? DstData->TotalSize : getValueProfDataSize(Closure);
|
2015-11-29 03:12:23 +08:00
|
|
|
|
|
|
|
ValueProfData *VPD =
|
|
|
|
DstData ? DstData : Closure->AllocValueProfData(TotalSize);
|
|
|
|
|
|
|
|
VPD->TotalSize = TotalSize;
|
|
|
|
VPD->NumValueKinds = Closure->GetNumValueKinds(Closure->Record);
|
|
|
|
ValueProfRecord *VR = getFirstValueProfRecord(VPD);
|
|
|
|
for (Kind = IPVK_First; Kind <= IPVK_Last; Kind++) {
|
|
|
|
uint32_t NumValueSites = Closure->GetNumValueSites(Closure->Record, Kind);
|
|
|
|
if (!NumValueSites)
|
|
|
|
continue;
|
|
|
|
serializeValueProfRecordFrom(VR, Closure, Kind, NumValueSites);
|
|
|
|
VR = getValueProfRecordNext(VR);
|
|
|
|
}
|
|
|
|
return VPD;
|
|
|
|
}
|
|
|
|
|
|
|
|
#undef INSTR_PROF_COMMON_API_IMPL
|
|
|
|
#endif /* INSTR_PROF_COMMON_API_IMPL */
|
2015-11-23 13:47:05 +08:00
|
|
|
|
|
|
|
/*============================================================================*/
|
|
|
|
|
|
|
|
#ifndef INSTR_PROF_DATA_DEFINED
|
|
|
|
|
2016-01-27 08:14:15 +08:00
|
|
|
#ifndef INSTR_PROF_DATA_INC
|
|
|
|
#define INSTR_PROF_DATA_INC
|
2015-11-23 13:47:05 +08:00
|
|
|
|
|
|
|
/* Helper macros.
 *
 * The SIMPLE variants apply # / ## directly to their arguments. The
 * non-SIMPLE variants add one level of indirection so that macro arguments
 * are expanded before being stringified or pasted.
 */
#define INSTR_PROF_SIMPLE_QUOTE(Tok) #Tok
#define INSTR_PROF_QUOTE(Tok) INSTR_PROF_SIMPLE_QUOTE(Tok)
#define INSTR_PROF_SIMPLE_CONCAT(Lhs,Rhs) Lhs ## Rhs
#define INSTR_PROF_CONCAT(Lhs,Rhs) INSTR_PROF_SIMPLE_CONCAT(Lhs,Rhs)
|
|
|
|
|
|
|
|
/* Magic number to detect file format and endianness.
 * Use 255 at one end, since no UTF-8 file can use that character. Avoid 0,
 * so that utilities, like strings, don't grab it as a string. 129 is also
 * invalid UTF-8, and high enough to be interesting.
 * Use "lprofr" in the centre to stand for "LLVM Profile Raw", or "lprofR"
 * for 32-bit platforms.
 *
 * Each expansion is wrapped in parentheses so that the macro behaves as a
 * single value inside larger expressions (e.g. `x == MAGIC`, `MAGIC & m`).
 */
#define INSTR_PROF_RAW_MAGIC_64                                               \
  ((uint64_t)255 << 56 | (uint64_t)'l' << 48 | (uint64_t)'p' << 40 |          \
   (uint64_t)'r' << 32 | (uint64_t)'o' << 24 | (uint64_t)'f' << 16 |          \
   (uint64_t)'r' << 8 | (uint64_t)129)
#define INSTR_PROF_RAW_MAGIC_32                                               \
  ((uint64_t)255 << 56 | (uint64_t)'l' << 48 | (uint64_t)'p' << 40 |          \
   (uint64_t)'r' << 32 | (uint64_t)'o' << 24 | (uint64_t)'f' << 16 |          \
   (uint64_t)'R' << 8 | (uint64_t)129)
|
|
|
|
|
2016-02-09 02:14:02 +08:00
|
|
|
/* Raw profile format version (start from 1). */
|
2021-05-07 00:09:12 +08:00
|
|
|
#define INSTR_PROF_RAW_VERSION 6
|
2016-02-09 02:14:02 +08:00
|
|
|
/* Indexed profile format version (start from 1). */
|
2020-12-29 01:20:48 +08:00
|
|
|
#define INSTR_PROF_INDEX_VERSION 7
|
2019-10-22 02:48:38 +08:00
|
|
|
/* Coverage mapping format version (start from 0). */
|
2021-02-10 16:25:34 +08:00
|
|
|
#define INSTR_PROF_COVMAP_VERSION 5
|
2015-11-23 13:47:05 +08:00
|
|
|
|
2016-01-26 04:38:40 +08:00
|
|
|
/* Profile version is always of type uint64_t. Reserve the upper 8 bits in the
|
2016-01-09 06:55:54 +08:00
|
|
|
* version for other variants of profile. We set the lowest bit of the upper 8
|
|
|
|
* bits (i.e. bit 56) to 1 to indicate if this is an IR-level instrumentation
|
|
|
|
* generated profile, and 0 if this is a Clang FE generated profile.
|
2019-03-01 03:06:02 +08:00
|
|
|
* 1 in bit 57 indicates there are context-sensitive records in the profile.
|
2016-02-09 05:18:18 +08:00
|
|
|
*/
|
2016-01-09 06:55:54 +08:00
|
|
|
#define VARIANT_MASKS_ALL 0xff00000000000000ULL
|
|
|
|
#define GET_VERSION(V) ((V) & ~VARIANT_MASKS_ALL)
|
2016-02-09 05:18:18 +08:00
|
|
|
#define VARIANT_MASK_IR_PROF (0x1ULL << 56)
|
2019-03-01 03:06:02 +08:00
|
|
|
#define VARIANT_MASK_CSIR_PROF (0x1ULL << 57)
|
2020-10-03 04:00:40 +08:00
|
|
|
#define VARIANT_MASK_INSTR_ENTRY (0x1ULL << 58)
|
2016-07-22 12:08:16 +08:00
|
|
|
#define INSTR_PROF_RAW_VERSION_VAR __llvm_profile_raw_version
|
|
|
|
#define INSTR_PROF_PROFILE_RUNTIME_VAR __llvm_profile_runtime
|
2021-07-09 04:44:05 +08:00
|
|
|
#define INSTR_PROF_PROFILE_COUNTER_BIAS_VAR __llvm_profile_counter_bias
|
2016-01-09 06:55:54 +08:00
|
|
|
|
2016-07-22 07:19:18 +08:00
|
|
|
/* The variable that holds the name of the profile data
|
|
|
|
* specified via command line. */
|
|
|
|
#define INSTR_PROF_PROFILE_NAME_VAR __llvm_profile_filename
|
|
|
|
|
2017-04-14 07:37:15 +08:00
|
|
|
/* section name strings common to all targets other
|
|
|
|
than WIN32 */
|
|
|
|
#define INSTR_PROF_DATA_COMMON __llvm_prf_data
|
|
|
|
#define INSTR_PROF_NAME_COMMON __llvm_prf_names
|
|
|
|
#define INSTR_PROF_CNTS_COMMON __llvm_prf_cnts
|
|
|
|
#define INSTR_PROF_VALS_COMMON __llvm_prf_vals
|
|
|
|
#define INSTR_PROF_VNODES_COMMON __llvm_prf_vnds
|
|
|
|
#define INSTR_PROF_COVMAP_COMMON __llvm_covmap
|
2019-10-22 02:48:38 +08:00
|
|
|
#define INSTR_PROF_COVFUN_COMMON __llvm_covfun
|
2019-03-08 23:30:56 +08:00
|
|
|
#define INSTR_PROF_ORDERFILE_COMMON __llvm_orderfile
|
[InstrProf] Implement static profdata registration
Summary:
The motivating use case is eliminating duplicate profile data registered
for the same inline function in two object files. Before this change,
users would observe multiple symbol definition errors with VC link, but
links with LLD would succeed.
Users (Mozilla) have reported that PGO works well with clang-cl and LLD,
but when using LLD without this static registration, we would get into a
"relocation against a discarded section" situation. I'm not sure what
happens in that situation, but I suspect that duplicate, unused profile
information was retained. If so, this change will reduce the size of
such binaries with LLD.
Now, Windows uses static registration and is in line with all the other
platforms.
Reviewers: davidxl, wmi, inglorion, void, calixte
Subscribers: mgorny, krytarowski, eraman, fedor.sergeev, hiraditya, #sanitizers, dmajor, llvm-commits
Tags: #sanitizers, #llvm
Differential Revision: https://reviews.llvm.org/D57929
llvm-svn: 353547
2019-02-09 03:03:50 +08:00
|
|
|
/* Windows section names. Because these section names contain dollar characters,
|
|
|
|
* they must be quoted.
|
|
|
|
*/
|
|
|
|
#define INSTR_PROF_DATA_COFF ".lprfd$M"
|
|
|
|
#define INSTR_PROF_NAME_COFF ".lprfn$M"
|
|
|
|
#define INSTR_PROF_CNTS_COFF ".lprfc$M"
|
|
|
|
#define INSTR_PROF_VALS_COFF ".lprfv$M"
|
|
|
|
#define INSTR_PROF_VNODES_COFF ".lprfnd$M"
|
|
|
|
#define INSTR_PROF_COVMAP_COFF ".lcovmap$M"
|
2019-10-22 02:48:38 +08:00
|
|
|
#define INSTR_PROF_COVFUN_COFF ".lcovfun$M"
|
2019-03-08 23:30:56 +08:00
|
|
|
#define INSTR_PROF_ORDERFILE_COFF ".lorderfile$M"
|
2017-04-14 07:37:15 +08:00
|
|
|
|
|
|
|
#ifdef _WIN32
|
2015-11-23 13:47:05 +08:00
|
|
|
/* Runtime section names and name strings. */
|
2017-04-14 07:37:15 +08:00
|
|
|
#define INSTR_PROF_DATA_SECT_NAME INSTR_PROF_DATA_COFF
|
|
|
|
#define INSTR_PROF_NAME_SECT_NAME INSTR_PROF_NAME_COFF
|
|
|
|
#define INSTR_PROF_CNTS_SECT_NAME INSTR_PROF_CNTS_COFF
|
2016-05-22 06:55:45 +08:00
|
|
|
/* Array of pointers. Each pointer points to a list
|
|
|
|
* of value nodes associated with one value site.
|
|
|
|
*/
|
2017-04-14 07:37:15 +08:00
|
|
|
#define INSTR_PROF_VALS_SECT_NAME INSTR_PROF_VALS_COFF
|
2016-05-22 06:55:45 +08:00
|
|
|
/* Value profile nodes section. */
|
2017-04-14 07:37:15 +08:00
|
|
|
#define INSTR_PROF_VNODES_SECT_NAME INSTR_PROF_VNODES_COFF
|
|
|
|
#define INSTR_PROF_COVMAP_SECT_NAME INSTR_PROF_COVMAP_COFF
|
2019-10-22 02:48:38 +08:00
|
|
|
#define INSTR_PROF_COVFUN_SECT_NAME INSTR_PROF_COVFUN_COFF
|
2019-03-08 23:30:56 +08:00
|
|
|
#define INSTR_PROF_ORDERFILE_SECT_NAME INSTR_PROF_ORDERFILE_COFF
|
2017-04-14 07:37:15 +08:00
|
|
|
#else
|
|
|
|
/* Runtime section names and name strings. */
|
[InstrProf] Implement static profdata registration
Summary:
The motivating use case is eliminating duplicate profile data registered
for the same inline function in two object files. Before this change,
users would observe multiple symbol definition errors with VC link, but
links with LLD would succeed.
Users (Mozilla) have reported that PGO works well with clang-cl and LLD,
but when using LLD without this static registration, we would get into a
"relocation against a discarded section" situation. I'm not sure what
happens in that situation, but I suspect that duplicate, unused profile
information was retained. If so, this change will reduce the size of
such binaries with LLD.
Now, Windows uses static registration and is in line with all the other
platforms.
Reviewers: davidxl, wmi, inglorion, void, calixte
Subscribers: mgorny, krytarowski, eraman, fedor.sergeev, hiraditya, #sanitizers, dmajor, llvm-commits
Tags: #sanitizers, #llvm
Differential Revision: https://reviews.llvm.org/D57929
llvm-svn: 353547
2019-02-09 03:03:50 +08:00
|
|
|
#define INSTR_PROF_DATA_SECT_NAME INSTR_PROF_QUOTE(INSTR_PROF_DATA_COMMON)
|
|
|
|
#define INSTR_PROF_NAME_SECT_NAME INSTR_PROF_QUOTE(INSTR_PROF_NAME_COMMON)
|
|
|
|
#define INSTR_PROF_CNTS_SECT_NAME INSTR_PROF_QUOTE(INSTR_PROF_CNTS_COMMON)
|
2017-04-14 07:37:15 +08:00
|
|
|
/* Array of pointers. Each pointer points to a list
|
|
|
|
* of value nodes associated with one value site.
|
|
|
|
*/
|
[InstrProf] Implement static profdata registration
Summary:
The motivating use case is eliminating duplicate profile data registered
for the same inline function in two object files. Before this change,
users would observe multiple symbol definition errors with VC link, but
links with LLD would succeed.
Users (Mozilla) have reported that PGO works well with clang-cl and LLD,
but when using LLD without this static registration, we would get into a
"relocation against a discarded section" situation. I'm not sure what
happens in that situation, but I suspect that duplicate, unused profile
information was retained. If so, this change will reduce the size of
such binaries with LLD.
Now, Windows uses static registration and is in line with all the other
platforms.
Reviewers: davidxl, wmi, inglorion, void, calixte
Subscribers: mgorny, krytarowski, eraman, fedor.sergeev, hiraditya, #sanitizers, dmajor, llvm-commits
Tags: #sanitizers, #llvm
Differential Revision: https://reviews.llvm.org/D57929
llvm-svn: 353547
2019-02-09 03:03:50 +08:00
|
|
|
#define INSTR_PROF_VALS_SECT_NAME INSTR_PROF_QUOTE(INSTR_PROF_VALS_COMMON)
|
2017-04-14 07:37:15 +08:00
|
|
|
/* Value profile nodes section. */
|
[InstrProf] Implement static profdata registration
Summary:
The motivating use case is eliminating duplicate profile data registered
for the same inline function in two object files. Before this change,
users would observe multiple symbol definition errors with VC link, but
links with LLD would succeed.
Users (Mozilla) have reported that PGO works well with clang-cl and LLD,
but when using LLD without this static registration, we would get into a
"relocation against a discarded section" situation. I'm not sure what
happens in that situation, but I suspect that duplicate, unused profile
information was retained. If so, this change will reduce the size of
such binaries with LLD.
Now, Windows uses static registration and is in line with all the other
platforms.
Reviewers: davidxl, wmi, inglorion, void, calixte
Subscribers: mgorny, krytarowski, eraman, fedor.sergeev, hiraditya, #sanitizers, dmajor, llvm-commits
Tags: #sanitizers, #llvm
Differential Revision: https://reviews.llvm.org/D57929
llvm-svn: 353547
2019-02-09 03:03:50 +08:00
|
|
|
#define INSTR_PROF_VNODES_SECT_NAME INSTR_PROF_QUOTE(INSTR_PROF_VNODES_COMMON)
|
|
|
|
#define INSTR_PROF_COVMAP_SECT_NAME INSTR_PROF_QUOTE(INSTR_PROF_COVMAP_COMMON)
|
2019-10-22 02:48:38 +08:00
|
|
|
#define INSTR_PROF_COVFUN_SECT_NAME INSTR_PROF_QUOTE(INSTR_PROF_COVFUN_COMMON)
|
2019-03-08 23:30:56 +08:00
|
|
|
/* Order file instrumentation. */
|
|
|
|
#define INSTR_PROF_ORDERFILE_SECT_NAME \
|
|
|
|
INSTR_PROF_QUOTE(INSTR_PROF_ORDERFILE_COMMON)
|
2017-04-14 07:37:15 +08:00
|
|
|
#endif
|
2016-01-08 06:47:04 +08:00
|
|
|
|
2019-03-08 23:30:56 +08:00
|
|
|
#define INSTR_PROF_ORDERFILE_BUFFER_NAME _llvm_order_file_buffer
|
|
|
|
#define INSTR_PROF_ORDERFILE_BUFFER_NAME_STR \
|
|
|
|
INSTR_PROF_QUOTE(INSTR_PROF_ORDERFILE_BUFFER_NAME)
|
|
|
|
#define INSTR_PROF_ORDERFILE_BUFFER_IDX_NAME _llvm_order_file_buffer_idx
|
|
|
|
#define INSTR_PROF_ORDERFILE_BUFFER_IDX_NAME_STR \
|
|
|
|
INSTR_PROF_QUOTE(INSTR_PROF_ORDERFILE_BUFFER_IDX_NAME)
|
|
|
|
|
2015-11-23 13:47:05 +08:00
|
|
|
/* Macros to define start/stop section symbol for a given
|
|
|
|
* section on Linux. For instance
|
|
|
|
* INSTR_PROF_SECT_START(INSTR_PROF_DATA_COMMON) will
|
|
|
|
* expand to __start___llvm_prf_data
|
|
|
|
*/
|
|
|
|
#define INSTR_PROF_SECT_START(Sect) \
|
|
|
|
INSTR_PROF_CONCAT(__start_,Sect)
|
|
|
|
#define INSTR_PROF_SECT_STOP(Sect) \
|
|
|
|
INSTR_PROF_CONCAT(__stop_,Sect)
|
|
|
|
|
|
|
|
/* Value Profiling API linkage name. */
|
|
|
|
#define INSTR_PROF_VALUE_PROF_FUNC __llvm_profile_instrument_target
|
|
|
|
#define INSTR_PROF_VALUE_PROF_FUNC_STR \
|
|
|
|
INSTR_PROF_QUOTE(INSTR_PROF_VALUE_PROF_FUNC)
|
2020-08-04 01:35:47 +08:00
|
|
|
#define INSTR_PROF_VALUE_PROF_MEMOP_FUNC __llvm_profile_instrument_memop
|
|
|
|
#define INSTR_PROF_VALUE_PROF_MEMOP_FUNC_STR \
|
|
|
|
INSTR_PROF_QUOTE(INSTR_PROF_VALUE_PROF_MEMOP_FUNC)
|
2015-11-23 13:47:05 +08:00
|
|
|
|
2015-11-24 02:03:25 +08:00
|
|
|
/* InstrProfile per-function control data alignment. */
|
|
|
|
#define INSTR_PROF_DATA_ALIGNMENT 8
|
|
|
|
|
2015-11-23 13:47:05 +08:00
|
|
|
/* The data structure that represents a tracked value by the
|
|
|
|
* value profiler.
|
|
|
|
*/
|
|
|
|
typedef struct InstrProfValueData {
|
2015-11-24 01:06:44 +08:00
|
|
|
/* Profiled value. */
|
2015-11-23 13:47:05 +08:00
|
|
|
uint64_t Value;
|
2015-11-24 01:06:44 +08:00
|
|
|
/* Number of times the value appears in the training run. */
|
2015-11-23 13:47:05 +08:00
|
|
|
uint64_t Count;
|
|
|
|
} InstrProfValueData;
|
|
|
|
|
2016-01-27 08:14:15 +08:00
|
|
|
#endif /* INSTR_PROF_DATA_INC */
|
2015-11-23 13:47:05 +08:00
|
|
|
|
2019-03-08 23:30:56 +08:00
|
|
|
#ifndef INSTR_ORDER_FILE_INC
|
2019-05-10 22:15:13 +08:00
|
|
|
/* The maximal # of functions: 128*1024 (the buffer size will be 128*4 KB). */
|
2019-03-08 23:30:56 +08:00
|
|
|
#define INSTR_ORDER_FILE_BUFFER_SIZE 131072
|
|
|
|
#define INSTR_ORDER_FILE_BUFFER_BITS 17
|
|
|
|
#define INSTR_ORDER_FILE_BUFFER_MASK 0x1ffff
|
|
|
|
#endif /* INSTR_ORDER_FILE_INC */
|
2015-11-23 13:47:05 +08:00
|
|
|
#else
|
|
|
|
#undef INSTR_PROF_DATA_DEFINED
|
|
|
|
#endif
|
2019-10-22 02:48:38 +08:00
|
|
|
|
|
|
|
#undef COVMAP_V2_OR_V3
|
2020-08-04 01:35:47 +08:00
|
|
|
|
|
|
|
#ifdef INSTR_PROF_VALUE_PROF_MEMOP_API
|
|
|
|
|
|
|
|
#ifdef __cplusplus
|
|
|
|
#define INSTR_PROF_INLINE inline
|
|
|
|
#else
|
|
|
|
#define INSTR_PROF_INLINE
|
|
|
|
#endif
|
|
|
|
|
|
|
|
/* The value range buckets (22 buckets) for the memop size value profiling look
|
|
|
|
* like:
|
|
|
|
*
|
|
|
|
* [0, 0]
|
|
|
|
* [1, 1]
|
|
|
|
* [2, 2]
|
|
|
|
* [3, 3]
|
|
|
|
* [4, 4]
|
|
|
|
* [5, 5]
|
|
|
|
* [6, 6]
|
|
|
|
* [7, 7]
|
|
|
|
* [8, 8]
|
|
|
|
* [9, 15]
|
|
|
|
* [16, 16]
|
|
|
|
* [17, 31]
|
|
|
|
* [32, 32]
|
|
|
|
* [33, 63]
|
|
|
|
* [64, 64]
|
|
|
|
* [65, 127]
|
|
|
|
* [128, 128]
|
|
|
|
* [129, 255]
|
|
|
|
* [256, 256]
|
|
|
|
* [257, 511]
|
|
|
|
* [512, 512]
|
|
|
|
* [513, UINT64_MAX]
|
|
|
|
*
|
|
|
|
* Each range has a 'representative value' which is the lower end value of the
|
|
|
|
* range and used to store in the runtime profile data records and the VP
|
|
|
|
* metadata. For example, it's 2 for [2, 2] and 65 for [65, 127].
|
|
|
|
*/
|
[PGO] Fix two issues in PGOMemOPSizeOpt.
1. PGOMemOPSizeOpt grabs only the first, up to five (by default) entries from
the value profile metadata and preserves the remaining entries for the fallback
memop call site. If there are more than five entries, the rest of the entries
would get dropped. This is fine for PGOMemOPSizeOpt itself as it only promotes
up to 3 (by default) values, but potentially not for other downstream passes
that may use the value profile metadata.
2. PGOMemOPSizeOpt originally assumed that only values 0 through 8 are kept
track of. When the range buckets were introduced, it was changed to skip the
range buckets, but since it does not grab all entries (only five), if some range
buckets exist in the first five entries, it could potentially cause fewer
promotion opportunities (eg. if 4 out of 5 were range buckets, it may be able to
promote up to one non-range bucket, as opposed to 3.) Also, combined with 1, it
means that wrong entries may be preserved, as it didn't correctly keep track of
which were entries were skipped.
To fix this, PGOMemOPSizeOpt now grabs all the entries (up to the maximum number
of value profile buckets), keeps track of which entries were skipped, and
preserves all the remaining entries.
Differential Revision: https://reviews.llvm.org/D97592
2021-02-27 06:44:20 +08:00
|
|
|
#define INSTR_PROF_NUM_BUCKETS 22
|
2020-08-04 01:35:47 +08:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Clz and Popcount. This code was copied from
|
|
|
|
* compiler-rt/lib/fuzzer/{FuzzerBuiltins.h,FuzzerBuiltinsMsvc.h} and
|
|
|
|
* llvm/include/llvm/Support/MathExtras.h.
|
|
|
|
*/
|
|
|
|
#if defined(_MSC_VER) && !defined(__clang__)
|
|
|
|
|
|
|
|
#include <intrin.h>
|
|
|
|
INSTR_PROF_VISIBILITY INSTR_PROF_INLINE
|
|
|
|
int InstProfClzll(unsigned long long X) {
|
|
|
|
unsigned long LeadZeroIdx = 0;
|
|
|
|
#if !defined(_M_ARM64) && !defined(_M_X64)
|
|
|
|
// Scan the high 32 bits.
|
|
|
|
if (_BitScanReverse(&LeadZeroIdx, (unsigned long)(X >> 32)))
|
|
|
|
return (int)(63 - (LeadZeroIdx + 32)); // Create a bit offset
|
|
|
|
// from the MSB.
|
|
|
|
// Scan the low 32 bits.
|
|
|
|
if (_BitScanReverse(&LeadZeroIdx, (unsigned long)(X)))
|
|
|
|
return (int)(63 - LeadZeroIdx);
|
|
|
|
#else
|
|
|
|
if (_BitScanReverse64(&LeadZeroIdx, X)) return 63 - LeadZeroIdx;
|
|
|
|
#endif
|
|
|
|
return 64;
|
|
|
|
}
|
|
|
|
INSTR_PROF_VISIBILITY INSTR_PROF_INLINE
|
|
|
|
int InstProfPopcountll(unsigned long long X) {
|
|
|
|
// This code originates from https://reviews.llvm.org/rG30626254510f.
|
|
|
|
unsigned long long v = X;
|
|
|
|
v = v - ((v >> 1) & 0x5555555555555555ULL);
|
|
|
|
v = (v & 0x3333333333333333ULL) + ((v >> 2) & 0x3333333333333333ULL);
|
|
|
|
v = (v + (v >> 4)) & 0x0F0F0F0F0F0F0F0FULL;
|
|
|
|
return (int)((unsigned long long)(v * 0x0101010101010101ULL) >> 56);
|
|
|
|
}
|
|
|
|
|
|
|
|
#else
|
|
|
|
|
|
|
|
INSTR_PROF_VISIBILITY INSTR_PROF_INLINE
|
|
|
|
int InstProfClzll(unsigned long long X) { return __builtin_clzll(X); }
|
|
|
|
INSTR_PROF_VISIBILITY INSTR_PROF_INLINE
|
|
|
|
int InstProfPopcountll(unsigned long long X) { return __builtin_popcountll(X); }
|
|
|
|
|
|
|
|
#endif /* defined(_MSC_VER) && !defined(__clang__) */
|
|
|
|
|
|
|
|
/* Map an (observed) memop size value to the representative value of its range.
|
|
|
|
* For example, 5 -> 5, 22 -> 17, 99 -> 65, 256 -> 256, 1001 -> 513. */
|
|
|
|
INSTR_PROF_VISIBILITY INSTR_PROF_INLINE uint64_t
|
|
|
|
InstrProfGetRangeRepValue(uint64_t Value) {
|
|
|
|
if (Value <= 8)
|
|
|
|
// The first ranges are individually tracked. Use the value as is.
|
|
|
|
return Value;
|
|
|
|
else if (Value >= 513)
|
|
|
|
// The last range is mapped to its lowest value.
|
|
|
|
return 513;
|
|
|
|
else if (InstProfPopcountll(Value) == 1)
|
|
|
|
// If it's a power of two, use it as is.
|
|
|
|
return Value;
|
|
|
|
else
|
|
|
|
// Otherwise, take to the previous power of two + 1.
|
2021-03-10 04:46:13 +08:00
|
|
|
return (UINT64_C(1) << (64 - InstProfClzll(Value) - 1)) + 1;
|
2020-08-04 01:35:47 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
/* Return true if the range that an (observed) memop size value belongs to has
|
|
|
|
* only a single value in the range. For example, 0 -> true, 8 -> true, 10 ->
|
|
|
|
* false, 64 -> true, 100 -> false, 513 -> false. */
|
|
|
|
INSTR_PROF_VISIBILITY INSTR_PROF_INLINE unsigned
|
|
|
|
InstrProfIsSingleValRange(uint64_t Value) {
|
|
|
|
if (Value <= 8)
|
|
|
|
// The first ranges are individually tracked.
|
|
|
|
return 1;
|
|
|
|
else if (InstProfPopcountll(Value) == 1)
|
|
|
|
// If it's a power of two, there's only one value.
|
|
|
|
return 1;
|
|
|
|
else
|
|
|
|
// Otherwise, there's more than one value in the range.
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
#endif /* INSTR_PROF_VALUE_PROF_MEMOP_API */
|