forked from OSchip/llvm-project
1057 lines
38 KiB
C++
1057 lines
38 KiB
C++
//===-- AMDGPULibFunc.cpp -------------------------------------------------===//
|
|
//
|
|
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
|
// See https://llvm.org/LICENSE.txt for license information.
|
|
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
//
|
|
// This file contains utility functions to work with Itanium mangled names
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "AMDGPULibFunc.h"
#include "AMDGPU.h"
#include "llvm/ADT/StringExtras.h"
#include "llvm/ADT/StringMap.h"
#include "llvm/ADT/StringSwitch.h"
#include "llvm/IR/DerivedTypes.h"
#include "llvm/IR/Function.h"
#include "llvm/IR/Module.h"
#include "llvm/IR/ValueSymbolTable.h"
#include "llvm/Support/CommandLine.h"
#include "llvm/Support/raw_ostream.h"
#include <limits>
|
|
|
|
using namespace llvm;
|
|
|
|
// Hidden command-line switch, enabled by default. While it is set, the Itanium
// mangler in this file emits the "U3AS<n>" address-space qualifier for every
// pointer parameter, including those whose address space is 0.
static cl::opt<bool> EnableOCLManglingMismatchWA(
    "amdgpu-enable-ocl-mangling-mismatch-workaround",
    cl::desc("Enable the workaround for OCL name mangling mismatch."),
    cl::init(true), cl::ReallyHidden);
|
|
|
|
namespace {
|
|
|
|
// Per-argument rules stored in ManglingRule::Param. The enumerator values are
// stored in unsigned char table cells, and zero (E_NONE) terminates a rule
// list. See ParamIterator::getNextParam() for how each rule is expanded.
enum EManglingParam {
  // End-of-list marker.
  E_NONE = 0,

  // EX_*: fixed types that do not depend on a lead argument.
  EX_EVENT,      // EVENT
  EX_FLOAT4,     // F32, vector of 4
  EX_INTV4,      // I32, vector of 4
  EX_RESERVEDID, // TBD: no type is produced for this rule yet
  EX_SAMPLER,    // SAMPLER
  EX_SIZET,      // U64
  EX_UINT,       // U32
  EX_UINTV4,     // U32, vector of 4

  // E_*: types derived from a lead argument.
  E_ANY,             // the lead type unchanged
  E_CONSTPTR_ANY,    // the lead type with CONST added to its pointer kind
  E_CONSTPTR_SWAPGL, // CONST pointer with global/local address space swapped
  E_COPY,            // the lead type unchanged
  E_IMAGECOORDS,     // by-value I32 coordinates sized by the lead image type
  E_POINTEE,         // the lead type passed by value
  E_SETBASE_I32,     // the lead type with ArgType replaced by I32
  E_SETBASE_U32,     // the lead type with ArgType replaced by U32
  E_MAKEBASE_UNS,    // the lead type with its base type bits set to UINT
  E_V16_OF_POINTEE,  // by-value vector of 16 of the lead type
  E_V2_OF_POINTEE,   // by-value vector of 2 of the lead type
  E_V3_OF_POINTEE,   // by-value vector of 3 of the lead type
  E_V4_OF_POINTEE,   // by-value vector of 4 of the lead type
  E_V8_OF_POINTEE,   // by-value vector of 8 of the lead type
  E_VLTLPTR_ANY,     // the lead type with VOLATILE added to its pointer kind
};
|
|
|
|
struct ManglingRule {
|
|
const char *Name;
|
|
unsigned char Lead[2];
|
|
unsigned char Param[5];
|
|
|
|
int maxLeadIndex() const { return (std::max)(Lead[0], Lead[1]); }
|
|
int getNumLeads() const { return (Lead[0] ? 1 : 0) + (Lead[1] ? 1 : 0); }
|
|
|
|
unsigned getNumArgs() const;
|
|
|
|
static StringMap<int> buildManglingRulesMap();
|
|
};
|
|
|
|
// Information about library functions with unmangled names.
|
|
class UnmangledFuncInfo {
|
|
const char *Name;
|
|
unsigned NumArgs;
|
|
|
|
// Table for all lib functions with unmangled names.
|
|
static const UnmangledFuncInfo Table[];
|
|
|
|
// Number of entries in Table.
|
|
static const unsigned TableSize;
|
|
|
|
static StringMap<unsigned> buildNameMap();
|
|
|
|
public:
|
|
using ID = AMDGPULibFunc::EFuncId;
|
|
constexpr UnmangledFuncInfo(const char *_Name, unsigned _NumArgs)
|
|
: Name(_Name), NumArgs(_NumArgs) {}
|
|
// Get index to Table by function name.
|
|
static bool lookup(StringRef Name, ID &Id);
|
|
static unsigned toIndex(ID Id) {
|
|
assert(static_cast<unsigned>(Id) >
|
|
static_cast<unsigned>(AMDGPULibFunc::EI_LAST_MANGLED) &&
|
|
"Invalid unmangled library function");
|
|
return static_cast<unsigned>(Id) - 1 -
|
|
static_cast<unsigned>(AMDGPULibFunc::EI_LAST_MANGLED);
|
|
}
|
|
static ID toFuncId(unsigned Index) {
|
|
assert(Index < TableSize &&
|
|
"Invalid unmangled library function");
|
|
return static_cast<ID>(
|
|
Index + 1 + static_cast<unsigned>(AMDGPULibFunc::EI_LAST_MANGLED));
|
|
}
|
|
static unsigned getNumArgs(ID Id) { return Table[toIndex(Id)].NumArgs; }
|
|
static StringRef getName(ID Id) { return Table[toIndex(Id)].Name; }
|
|
};
|
|
|
|
unsigned ManglingRule::getNumArgs() const {
|
|
unsigned I=0;
|
|
while (I < (sizeof Param/sizeof Param[0]) && Param[I]) ++I;
|
|
return I;
|
|
}
|
|
|
|
// This table describes function formal argument type rules. The order of rules
|
|
// corresponds to the EFuncId enum at AMDGPULibFunc.h
|
|
//
|
|
// "<func name>", { <leads> }, { <param rules> }
|
|
// where:
|
|
// <leads> - list of integers that are one-based indexes of formal argument
|
|
// used to mangle a function name. Other argument types are derived from types
|
|
// of these 'leads'. The order of integers in this list corresponds to the
|
|
// order in which these arguments are mangled in the EDG mangling scheme. The
|
|
// same order should be preserved for arguments in the AMDGPULibFunc structure
|
|
// when it is used for mangling. For example:
|
|
// { "vstorea_half", {3,1}, {E_ANY,EX_SIZET,E_ANY}},
|
|
// will be mangled in EDG scheme as vstorea_half_<3rdparam>_<1stparam>
|
|
// When mangling from code use:
|
|
// AMDGPULibFunc insc;
|
|
// insc.param[0] = ... // describe 3rd parameter
|
|
// insc.param[1] = ... // describe 1st parameter
|
|
//
|
|
// <param rules> - list of rules used to derive all of the function formal
|
|
// argument types. EX_ prefixed are simple types, other derived from the
|
|
// latest 'lead' argument type in the order of encoding from first to last.
|
|
// E_ANY - use prev lead type, E_CONSTPTR_ANY - make const pointer out of
|
|
// prev lead type, etc. see ParamIterator::getNextParam() for details.
|
|
|
|
// Formal-argument rules for every mangled library function, laid out as
//   { name, { lead positions }, { per-argument rules } }.
// Entry 0 is an empty placeholder. The table is indexed by function id, so the
// order of the rows must not change.
static constexpr ManglingRule manglingRules[] = {
    {"", {0}, {0}},
    {"abs", {1}, {E_ANY}},
    {"abs_diff", {1}, {E_ANY, E_COPY}},
    {"acos", {1}, {E_ANY}},
    {"acosh", {1}, {E_ANY}},
    {"acospi", {1}, {E_ANY}},
    {"add_sat", {1}, {E_ANY, E_COPY}},
    {"all", {1}, {E_ANY}},
    {"any", {1}, {E_ANY}},
    {"asin", {1}, {E_ANY}},
    {"asinh", {1}, {E_ANY}},
    {"asinpi", {1}, {E_ANY}},
    {"async_work_group_copy",
     {1},
     {E_ANY, E_CONSTPTR_SWAPGL, EX_SIZET, EX_EVENT}},
    {"async_work_group_strided_copy",
     {1},
     {E_ANY, E_CONSTPTR_SWAPGL, EX_SIZET, EX_SIZET, EX_EVENT}},
    {"atan", {1}, {E_ANY}},
    {"atan2", {1}, {E_ANY, E_COPY}},
    {"atan2pi", {1}, {E_ANY, E_COPY}},
    {"atanh", {1}, {E_ANY}},
    {"atanpi", {1}, {E_ANY}},
    {"atomic_add", {1}, {E_VLTLPTR_ANY, E_POINTEE}},
    {"atomic_and", {1}, {E_VLTLPTR_ANY, E_POINTEE}},
    {"atomic_cmpxchg", {1}, {E_VLTLPTR_ANY, E_POINTEE, E_POINTEE}},
    {"atomic_dec", {1}, {E_VLTLPTR_ANY}},
    {"atomic_inc", {1}, {E_VLTLPTR_ANY}},
    {"atomic_max", {1}, {E_VLTLPTR_ANY, E_POINTEE}},
    {"atomic_min", {1}, {E_VLTLPTR_ANY, E_POINTEE}},
    {"atomic_or", {1}, {E_VLTLPTR_ANY, E_POINTEE}},
    {"atomic_sub", {1}, {E_VLTLPTR_ANY, E_POINTEE}},
    {"atomic_xchg", {1}, {E_VLTLPTR_ANY, E_POINTEE}},
    {"atomic_xor", {1}, {E_VLTLPTR_ANY, E_POINTEE}},
    {"bitselect", {1}, {E_ANY, E_COPY, E_COPY}},
    {"cbrt", {1}, {E_ANY}},
    {"ceil", {1}, {E_ANY}},
    {"clamp", {1}, {E_ANY, E_COPY, E_COPY}},
    {"clz", {1}, {E_ANY}},
    {"commit_read_pipe", {1}, {E_ANY, EX_RESERVEDID}},
    {"commit_write_pipe", {1}, {E_ANY, EX_RESERVEDID}},
    {"copysign", {1}, {E_ANY, E_COPY}},
    {"cos", {1}, {E_ANY}},
    {"cosh", {1}, {E_ANY}},
    {"cospi", {1}, {E_ANY}},
    {"cross", {1}, {E_ANY, E_COPY}},
    {"ctz", {1}, {E_ANY}},
    {"degrees", {1}, {E_ANY}},
    {"distance", {1}, {E_ANY, E_COPY}},
    {"divide", {1}, {E_ANY, E_COPY}},
    {"dot", {1}, {E_ANY, E_COPY}},
    {"erf", {1}, {E_ANY}},
    {"erfc", {1}, {E_ANY}},
    {"exp", {1}, {E_ANY}},
    {"exp10", {1}, {E_ANY}},
    {"exp2", {1}, {E_ANY}},
    {"expm1", {1}, {E_ANY}},
    {"fabs", {1}, {E_ANY}},
    {"fast_distance", {1}, {E_ANY, E_COPY}},
    {"fast_length", {1}, {E_ANY}},
    {"fast_normalize", {1}, {E_ANY}},
    {"fdim", {1}, {E_ANY, E_COPY}},
    {"floor", {1}, {E_ANY}},
    {"fma", {1}, {E_ANY, E_COPY, E_COPY}},
    {"fmax", {1}, {E_ANY, E_COPY}},
    {"fmin", {1}, {E_ANY, E_COPY}},
    {"fmod", {1}, {E_ANY, E_COPY}},
    {"fract", {2}, {E_POINTEE, E_ANY}},
    {"frexp", {1, 2}, {E_ANY, E_ANY}},
    {"get_image_array_size", {1}, {E_ANY}},
    {"get_image_channel_data_type", {1}, {E_ANY}},
    {"get_image_channel_order", {1}, {E_ANY}},
    {"get_image_dim", {1}, {E_ANY}},
    {"get_image_height", {1}, {E_ANY}},
    {"get_image_width", {1}, {E_ANY}},
    {"get_pipe_max_packets", {1}, {E_ANY}},
    {"get_pipe_num_packets", {1}, {E_ANY}},
    {"hadd", {1}, {E_ANY, E_COPY}},
    {"hypot", {1}, {E_ANY, E_COPY}},
    {"ilogb", {1}, {E_ANY}},
    {"isequal", {1}, {E_ANY, E_COPY}},
    {"isfinite", {1}, {E_ANY}},
    {"isgreater", {1}, {E_ANY, E_COPY}},
    {"isgreaterequal", {1}, {E_ANY, E_COPY}},
    {"isinf", {1}, {E_ANY}},
    {"isless", {1}, {E_ANY, E_COPY}},
    {"islessequal", {1}, {E_ANY, E_COPY}},
    {"islessgreater", {1}, {E_ANY, E_COPY}},
    {"isnan", {1}, {E_ANY}},
    {"isnormal", {1}, {E_ANY}},
    {"isnotequal", {1}, {E_ANY, E_COPY}},
    {"isordered", {1}, {E_ANY, E_COPY}},
    {"isunordered", {1}, {E_ANY, E_COPY}},
    {"ldexp", {1}, {E_ANY, E_SETBASE_I32}},
    {"length", {1}, {E_ANY}},
    {"lgamma", {1}, {E_ANY}},
    {"lgamma_r", {1, 2}, {E_ANY, E_ANY}},
    {"log", {1}, {E_ANY}},
    {"log10", {1}, {E_ANY}},
    {"log1p", {1}, {E_ANY}},
    {"log2", {1}, {E_ANY}},
    {"logb", {1}, {E_ANY}},
    {"mad", {1}, {E_ANY, E_COPY, E_COPY}},
    {"mad24", {1}, {E_ANY, E_COPY, E_COPY}},
    {"mad_hi", {1}, {E_ANY, E_COPY, E_COPY}},
    {"mad_sat", {1}, {E_ANY, E_COPY, E_COPY}},
    {"max", {1}, {E_ANY, E_COPY}},
    {"maxmag", {1}, {E_ANY, E_COPY}},
    {"min", {1}, {E_ANY, E_COPY}},
    {"minmag", {1}, {E_ANY, E_COPY}},
    {"mix", {1}, {E_ANY, E_COPY, E_COPY}},
    {"modf", {2}, {E_POINTEE, E_ANY}},
    {"mul24", {1}, {E_ANY, E_COPY}},
    {"mul_hi", {1}, {E_ANY, E_COPY}},
    {"nan", {1}, {E_ANY}},
    {"nextafter", {1}, {E_ANY, E_COPY}},
    {"normalize", {1}, {E_ANY}},
    {"popcount", {1}, {E_ANY}},
    {"pow", {1}, {E_ANY, E_COPY}},
    {"pown", {1}, {E_ANY, E_SETBASE_I32}},
    {"powr", {1}, {E_ANY, E_COPY}},
    {"prefetch", {1}, {E_CONSTPTR_ANY, EX_SIZET}},
    {"radians", {1}, {E_ANY}},
    {"recip", {1}, {E_ANY}},
    {"remainder", {1}, {E_ANY, E_COPY}},
    {"remquo", {1, 3}, {E_ANY, E_COPY, E_ANY}},
    {"reserve_read_pipe", {1}, {E_ANY, EX_UINT}},
    {"reserve_write_pipe", {1}, {E_ANY, EX_UINT}},
    {"rhadd", {1}, {E_ANY, E_COPY}},
    {"rint", {1}, {E_ANY}},
    {"rootn", {1}, {E_ANY, E_SETBASE_I32}},
    {"rotate", {1}, {E_ANY, E_COPY}},
    {"round", {1}, {E_ANY}},
    {"rsqrt", {1}, {E_ANY}},
    {"select", {1, 3}, {E_ANY, E_COPY, E_ANY}},
    {"shuffle", {1, 2}, {E_ANY, E_ANY}},
    {"shuffle2", {1, 3}, {E_ANY, E_COPY, E_ANY}},
    {"sign", {1}, {E_ANY}},
    {"signbit", {1}, {E_ANY}},
    {"sin", {1}, {E_ANY}},
    {"sincos", {2}, {E_POINTEE, E_ANY}},
    {"sinh", {1}, {E_ANY}},
    {"sinpi", {1}, {E_ANY}},
    {"smoothstep", {1}, {E_ANY, E_COPY, E_COPY}},
    {"sqrt", {1}, {E_ANY}},
    {"step", {1}, {E_ANY, E_COPY}},
    {"sub_group_broadcast", {1}, {E_ANY, EX_UINT}},
    {"sub_group_commit_read_pipe", {1}, {E_ANY, EX_RESERVEDID}},
    {"sub_group_commit_write_pipe", {1}, {E_ANY, EX_RESERVEDID}},
    {"sub_group_reduce_add", {1}, {E_ANY}},
    {"sub_group_reduce_max", {1}, {E_ANY}},
    {"sub_group_reduce_min", {1}, {E_ANY}},
    {"sub_group_reserve_read_pipe", {1}, {E_ANY, EX_UINT}},
    {"sub_group_reserve_write_pipe", {1}, {E_ANY, EX_UINT}},
    {"sub_group_scan_exclusive_add", {1}, {E_ANY}},
    {"sub_group_scan_exclusive_max", {1}, {E_ANY}},
    {"sub_group_scan_exclusive_min", {1}, {E_ANY}},
    {"sub_group_scan_inclusive_add", {1}, {E_ANY}},
    {"sub_group_scan_inclusive_max", {1}, {E_ANY}},
    {"sub_group_scan_inclusive_min", {1}, {E_ANY}},
    {"sub_sat", {1}, {E_ANY, E_COPY}},
    {"tan", {1}, {E_ANY}},
    {"tanh", {1}, {E_ANY}},
    {"tanpi", {1}, {E_ANY}},
    {"tgamma", {1}, {E_ANY}},
    {"trunc", {1}, {E_ANY}},
    {"upsample", {1}, {E_ANY, E_MAKEBASE_UNS}},
    {"vec_step", {1}, {E_ANY}},
    {"vstore", {3}, {E_POINTEE, EX_SIZET, E_ANY}},
    {"vstore16", {3}, {E_V16_OF_POINTEE, EX_SIZET, E_ANY}},
    {"vstore2", {3}, {E_V2_OF_POINTEE, EX_SIZET, E_ANY}},
    {"vstore3", {3}, {E_V3_OF_POINTEE, EX_SIZET, E_ANY}},
    {"vstore4", {3}, {E_V4_OF_POINTEE, EX_SIZET, E_ANY}},
    {"vstore8", {3}, {E_V8_OF_POINTEE, EX_SIZET, E_ANY}},
    {"work_group_commit_read_pipe", {1}, {E_ANY, EX_RESERVEDID}},
    {"work_group_commit_write_pipe", {1}, {E_ANY, EX_RESERVEDID}},
    {"work_group_reduce_add", {1}, {E_ANY}},
    {"work_group_reduce_max", {1}, {E_ANY}},
    {"work_group_reduce_min", {1}, {E_ANY}},
    {"work_group_reserve_read_pipe", {1}, {E_ANY, EX_UINT}},
    {"work_group_reserve_write_pipe", {1}, {E_ANY, EX_UINT}},
    {"work_group_scan_exclusive_add", {1}, {E_ANY}},
    {"work_group_scan_excl​usive_max", {1}, {E_ANY}},
    {"work_group_scan_exclusive_min", {1}, {E_ANY}},
    {"work_group_scan_inclusive_add", {1}, {E_ANY}},
    {"work_group_scan_inclusive_max", {1}, {E_ANY}},
    {"work_group_scan_inclusive_min", {1}, {E_ANY}},
    {"write_imagef", {1}, {E_ANY, E_IMAGECOORDS, EX_FLOAT4}},
    {"write_imagei", {1}, {E_ANY, E_IMAGECOORDS, EX_INTV4}},
    {"write_imageui", {1}, {E_ANY, E_IMAGECOORDS, EX_UINTV4}},
    {"ncos", {1}, {E_ANY}},
    {"nexp2", {1}, {E_ANY}},
    {"nfma", {1}, {E_ANY, E_COPY, E_COPY}},
    {"nlog2", {1}, {E_ANY}},
    {"nrcp", {1}, {E_ANY}},
    {"nrsqrt", {1}, {E_ANY}},
    {"nsin", {1}, {E_ANY}},
    {"nsqrt", {1}, {E_ANY}},
    {"ftz", {1}, {E_ANY}},
    {"fldexp", {1}, {E_ANY, EX_UINT}},
    {"class", {1}, {E_ANY, EX_UINT}},
    {"rcbrt", {1}, {E_ANY}},
};
|
|
|
|
// Library functions with unmangled name.
|
|
const UnmangledFuncInfo UnmangledFuncInfo::Table[] = {
|
|
{"__read_pipe_2", 4},
|
|
{"__read_pipe_4", 6},
|
|
{"__write_pipe_2", 4},
|
|
{"__write_pipe_4", 6},
|
|
};
|
|
|
|
const unsigned UnmangledFuncInfo::TableSize =
|
|
array_lengthof(UnmangledFuncInfo::Table);
|
|
|
|
// Derives the return type of a library function from its first lead argument.
// For sincos the lead is turned into a by-value type; every other function
// returns the first lead type as is.
// TBD - This special-casing may need to be extended for other intrinsics.
static AMDGPULibFunc::Param getRetType(AMDGPULibFunc::EFuncId id,
                                       const AMDGPULibFunc::Param (&Leads)[2]) {
  AMDGPULibFunc::Param RetTy = Leads[0];
  if (id == AMDGPULibFunc::EI_SINCOS)
    RetTy.PtrKind = AMDGPULibFunc::BYVALUE;
  return RetTy;
}
|
|
|
|
class ParamIterator {
|
|
const AMDGPULibFunc::Param (&Leads)[2];
|
|
const ManglingRule& Rule;
|
|
int Index;
|
|
public:
|
|
ParamIterator(const AMDGPULibFunc::Param (&leads)[2],
|
|
const ManglingRule& rule)
|
|
: Leads(leads), Rule(rule), Index(0) {}
|
|
|
|
AMDGPULibFunc::Param getNextParam();
|
|
};
|
|
|
|
// Expands the rule at the current position into a parameter description and
// advances the iterator.
//
// A default-constructed Param is returned once the rule list is exhausted, for
// E_NONE, and for EX_RESERVEDID (still TBD). EX_* rules produce a fixed type.
// Every other rule starts from a copy of a lead parameter (Leads[1] when the
// current position is the second lead's position, otherwise Leads[0]) and
// then adjusts it.
AMDGPULibFunc::Param ParamIterator::getNextParam() {
  AMDGPULibFunc::Param P;
  const int NumRules = int(sizeof Rule.Param / sizeof Rule.Param[0]);
  if (Index >= NumRules)
    return P;

  const int Pos = Index++;
  const char R = Rule.Param[Pos];

  // Stage 1: rules that do not depend on a lead parameter.
  switch (R) {
  case E_NONE:
  case EX_RESERVEDID: // TBD
    return P;
  case EX_UINT:
    P.ArgType = AMDGPULibFunc::U32;
    return P;
  case EX_INTV4:
    P.ArgType = AMDGPULibFunc::I32;
    P.VectorSize = 4;
    return P;
  case EX_UINTV4:
    P.ArgType = AMDGPULibFunc::U32;
    P.VectorSize = 4;
    return P;
  case EX_FLOAT4:
    P.ArgType = AMDGPULibFunc::F32;
    P.VectorSize = 4;
    return P;
  case EX_SIZET:
    P.ArgType = AMDGPULibFunc::U64;
    return P;
  case EX_EVENT:
    P.ArgType = AMDGPULibFunc::EVENT;
    return P;
  case EX_SAMPLER:
    P.ArgType = AMDGPULibFunc::SAMPLER;
    return P;
  default:
    break;
  }

  // Stage 2: rules derived from a lead parameter.
  if (Pos == (Rule.Lead[1] - 1))
    P = Leads[1];
  else
    P = Leads[0];

  switch (R) {
  case E_ANY:
  case E_COPY:
    break;

  case E_POINTEE:
    P.PtrKind = AMDGPULibFunc::BYVALUE;
    break;
  case E_V2_OF_POINTEE:
    P.VectorSize = 2;
    P.PtrKind = AMDGPULibFunc::BYVALUE;
    break;
  case E_V3_OF_POINTEE:
    P.VectorSize = 3;
    P.PtrKind = AMDGPULibFunc::BYVALUE;
    break;
  case E_V4_OF_POINTEE:
    P.VectorSize = 4;
    P.PtrKind = AMDGPULibFunc::BYVALUE;
    break;
  case E_V8_OF_POINTEE:
    P.VectorSize = 8;
    P.PtrKind = AMDGPULibFunc::BYVALUE;
    break;
  case E_V16_OF_POINTEE:
    P.VectorSize = 16;
    P.PtrKind = AMDGPULibFunc::BYVALUE;
    break;

  case E_CONSTPTR_ANY:
    P.PtrKind |= AMDGPULibFunc::CONST;
    break;
  case E_VLTLPTR_ANY:
    P.PtrKind |= AMDGPULibFunc::VOLATILE;
    break;

  case E_SETBASE_I32:
    P.ArgType = AMDGPULibFunc::I32;
    break;
  case E_SETBASE_U32:
    P.ArgType = AMDGPULibFunc::U32;
    break;

  case E_MAKEBASE_UNS:
    P.ArgType &= ~AMDGPULibFunc::BASE_TYPE_MASK;
    P.ArgType |= AMDGPULibFunc::UINT;
    break;

  case E_IMAGECOORDS:
    // The coordinate vector width depends on the image kind of the lead; the
    // coordinates themselves are always by-value I32.
    switch (P.ArgType) {
    case AMDGPULibFunc::IMG1DA: P.VectorSize = 2; break;
    case AMDGPULibFunc::IMG1DB: P.VectorSize = 1; break;
    case AMDGPULibFunc::IMG2DA: P.VectorSize = 4; break;
    case AMDGPULibFunc::IMG1D:  P.VectorSize = 1; break;
    case AMDGPULibFunc::IMG2D:  P.VectorSize = 2; break;
    case AMDGPULibFunc::IMG3D:  P.VectorSize = 4; break;
    }
    P.PtrKind = AMDGPULibFunc::BYVALUE;
    P.ArgType = AMDGPULibFunc::I32;
    break;

  case E_CONSTPTR_SWAPGL: {
    // Swap global <-> local; any other address space is kept.
    unsigned AS = AMDGPULibFunc::getAddrSpaceFromEPtrKind(P.PtrKind);
    if (AS == AMDGPUAS::GLOBAL_ADDRESS)
      AS = AMDGPUAS::LOCAL_ADDRESS;
    else if (AS == AMDGPUAS::LOCAL_ADDRESS)
      AS = AMDGPUAS::GLOBAL_ADDRESS;
    P.PtrKind = AMDGPULibFunc::getEPtrKindFromAddrSpace(AS);
    P.PtrKind |= AMDGPULibFunc::CONST;
    break;
  }

  default:
    llvm_unreachable("Unhandeled param rule");
  }
  return P;
}
|
|
|
|
// In-place variant of StringRef::drop_front: removes the first n characters
// (one by default) from str.
inline static void drop_front(StringRef &str, size_t n = 1) {
  const StringRef Remainder = str.drop_front(n);
  str = Remainder;
}
|
|
|
|
// Consumes the single character c from the front of mangledName.
// Returns true and advances mangledName when it starts with c. Returns false
// and leaves mangledName untouched otherwise, including when it is empty
// (StringRef::front() must not be called on an empty string).
static bool eatTerm(StringRef& mangledName, const char c) {
  if (mangledName.empty() || mangledName.front() != c)
    return false;
  drop_front(mangledName);
  return true;
}
|
|
|
|
template <size_t N>
|
|
static bool eatTerm(StringRef& mangledName, const char (&str)[N]) {
|
|
if (mangledName.startswith(StringRef(str, N-1))) {
|
|
drop_front(mangledName, N-1);
|
|
return true;
|
|
}
|
|
return false;
|
|
}
|
|
|
|
// Consumes a run of decimal digits from the front of s and returns its value.
// Returns -1, leaving s untouched, when s does not start with a digit.
// All digits of the run are always consumed. A value that does not fit in an
// int saturates at the largest int instead of overflowing (signed overflow is
// undefined behaviour, and mangled names come from the module being compiled).
static int eatNumber(StringRef& s) {
  const int MaxValue = std::numeric_limits<int>::max();
  bool SawDigit = false;
  int n = 0;
  while (!s.empty() && isDigit(s.front())) {
    const int Digit = s.front() - '0';
    // n * 10 + Digit <= MaxValue  <=>  n <= (MaxValue - Digit) / 10
    if (n > (MaxValue - Digit) / 10)
      n = MaxValue;
    else
      n = n * 10 + Digit;
    SawDigit = true;
    drop_front(s);
  }
  return SawDigit ? n : -1;
}
|
|
|
|
// Consumes a "<length><name>" token from the front of mangledName and returns
// the name part. Returns an empty StringRef when there is no positive length
// or the remaining text is shorter than that length; digits that were read
// stay consumed in that case.
static StringRef eatLengthPrefixedName(StringRef& mangledName) {
  const int Len = eatNumber(mangledName);
  if (Len <= 0)
    return StringRef();
  if (static_cast<size_t>(Len) > mangledName.size())
    return StringRef();

  const StringRef Name = mangledName.substr(0, Len);
  drop_front(mangledName, Len);
  return Name;
}
|
|
|
|
} // end anonymous namespace
|
|
|
|
// Creates an empty descriptor: no function id, no name prefix, both lead
// parameters reset and an empty name.
AMDGPUMangledLibFunc::AMDGPUMangledLibFunc() {
  FuncId = EI_NONE;
  FKind = NOPFX;
  for (Param &Lead : Leads)
    Lead.reset();
  Name.clear();
}
|
|
|
|
// Creates an empty descriptor: no function type and no function id.
AMDGPUUnmangledLibFunc::AMDGPUUnmangledLibFunc() {
  FuncTy = nullptr;
  FuncId = EI_NONE;
}
|
|
|
|
// Creates a descriptor for function `id` that reuses the name prefix kind and
// both lead parameters of `copyFrom`. The stored name is not copied.
AMDGPUMangledLibFunc::AMDGPUMangledLibFunc(
    EFuncId id, const AMDGPUMangledLibFunc &copyFrom) {
  FuncId = id;
  FKind = copyFrom.FKind;
  Leads[0] = copyFrom.Leads[0];
  Leads[1] = copyFrom.Leads[1];
}
|
|
|
|
///////////////////////////////////////////////////////////////////////////////
|
|
// Demangling
|
|
|
|
// Consumes a decimal vector width from the front of mangledName. Returns the
// width when it is one of 2, 3, 4, 8 or 16; returns 1 for anything else,
// including a missing number.
static int parseVecSize(StringRef& mangledName) {
  const int Width = eatNumber(mangledName);
  const bool IsSupported =
      Width == 2 || Width == 3 || Width == 4 || Width == 8 || Width == 16;
  return IsSupported ? Width : 1;
}
|
|
|
|
// Recognises a "native_" or "half_" prefix. The text before the first '_' (or
// the whole name when there is no '_') is compared against "native" and
// "half"; on a match mangledName is replaced by the text after that '_' and
// the matching prefix kind is returned. Otherwise mangledName is left alone
// and NOPFX is returned.
static AMDGPULibFunc::ENamePrefix parseNamePrefix(StringRef& mangledName) {
  const std::pair<StringRef, StringRef> Parts = mangledName.split('_');

  if (Parts.first == "native") {
    mangledName = Parts.second;
    return AMDGPULibFunc::NATIVE;
  }
  if (Parts.first == "half") {
    mangledName = Parts.second;
    return AMDGPULibFunc::HALF;
  }
  return AMDGPULibFunc::NOPFX;
}
|
|
|
|
// Builds a lookup table from rule name to the rule's index in manglingRules.
StringMap<int> ManglingRule::buildManglingRulesMap() {
  const size_t NumRules = array_lengthof(manglingRules);
  StringMap<int> Map(NumRules);
  for (size_t Idx = 0; Idx != NumRules; ++Idx)
    Map.insert({manglingRules[Idx].Name, static_cast<int>(Idx)});
  return Map;
}
|
|
|
|
// Looks FullName up in the mangling rules and stores the resulting function
// id. Returns true when the stored id is not EI_NONE. The name-to-index map is
// built once, on first use.
bool AMDGPUMangledLibFunc::parseUnmangledName(StringRef FullName) {
  static const StringMap<int> RulesByName =
      ManglingRule::buildManglingRulesMap();
  const int RuleIndex = RulesByName.lookup(FullName);
  FuncId = static_cast<EFuncId>(RuleIndex);
  return FuncId != EI_NONE;
}
|
|
|
|
///////////////////////////////////////////////////////////////////////////////
|
|
// Itanium Demangling
|
|
|
|
namespace {
|
|
struct ItaniumParamParser {
|
|
AMDGPULibFunc::Param Prev;
|
|
bool parseItaniumParam(StringRef& param, AMDGPULibFunc::Param &res);
|
|
};
|
|
} // namespace
|
|
|
|
// Parses one Itanium-mangled parameter type from the front of `param`.
//
// Accepted shape, in order:
//   [P [K] [V] [U3AS<digit>]]   pointer prefix with optional const/volatile
//                               qualifiers and address space (default 0)
//   [Dv<2|3|4|8|16>_]           vector prefix
//   <type>                      a length-prefixed OpenCL type name, a builtin
//                               type code, or a substitution (S_ / S<n>_)
//                               that repeats the previous parameter's vector
//                               size and argument type
//
// On success `res` describes the parameter, the consumed text is removed from
// `param`, and true is returned. Returns false on empty, truncated or
// unrecognised input; `param` may have been partially consumed in that case.
//
// The string-literal eatTerm overload is used for single characters too: it is
// prefix-based, so it is safe to call when the remaining text is empty.
bool ItaniumParamParser::parseItaniumParam(StringRef& param,
                                           AMDGPULibFunc::Param &res) {
  res.reset();
  if (param.empty()) return false;

  // parse pointer prefix
  if (eatTerm(param, "P")) {
    if (eatTerm(param, "K")) res.PtrKind |= AMDGPULibFunc::CONST;
    if (eatTerm(param, "V")) res.PtrKind |= AMDGPULibFunc::VOLATILE;
    unsigned AS = 0;
    if (eatTerm(param, "U3AS")) {
      // The address space must be present and must be a decimal digit.
      if (param.empty() || !isDigit(param.front())) return false;
      AS = param.front() - '0';
      drop_front(param, 1);
    }
    res.PtrKind |= AMDGPULibFuncBase::getEPtrKindFromAddrSpace(AS);
  } else {
    res.PtrKind = AMDGPULibFunc::BYVALUE;
  }

  // parse vector size
  if (eatTerm(param, "Dv")) {
    res.VectorSize = parseVecSize(param);
    if (res.VectorSize == 1 || !eatTerm(param, "_")) return false;
  }

  // parse type
  // A pointer or vector prefix with nothing after it is a truncated name.
  if (param.empty()) return false;
  char const TC = param.front();
  if (isDigit(TC)) {
    res.ArgType = StringSwitch<AMDGPULibFunc::EType>
      (eatLengthPrefixedName(param))
      .Case("ocl_image1darray" , AMDGPULibFunc::IMG1DA)
      .Case("ocl_image1dbuffer", AMDGPULibFunc::IMG1DB)
      .Case("ocl_image2darray" , AMDGPULibFunc::IMG2DA)
      .Case("ocl_image1d"      , AMDGPULibFunc::IMG1D)
      .Case("ocl_image2d"      , AMDGPULibFunc::IMG2D)
      .Case("ocl_image3d"      , AMDGPULibFunc::IMG3D)
      .Case("ocl_event"        , AMDGPULibFunc::DUMMY)
      .Case("ocl_sampler"      , AMDGPULibFunc::DUMMY)
      .Default(AMDGPULibFunc::DUMMY);
  } else {
    drop_front(param);
    switch (TC) {
    case 'h': res.ArgType = AMDGPULibFunc::U8; break;
    case 't': res.ArgType = AMDGPULibFunc::U16; break;
    case 'j': res.ArgType = AMDGPULibFunc::U32; break;
    case 'm': res.ArgType = AMDGPULibFunc::U64; break;
    case 'c': res.ArgType = AMDGPULibFunc::I8; break;
    case 's': res.ArgType = AMDGPULibFunc::I16; break;
    case 'i': res.ArgType = AMDGPULibFunc::I32; break;
    case 'l': res.ArgType = AMDGPULibFunc::I64; break;
    case 'f': res.ArgType = AMDGPULibFunc::F32; break;
    case 'd': res.ArgType = AMDGPULibFunc::F64; break;
    case 'D': if (!eatTerm(param, "h")) return false;
              res.ArgType = AMDGPULibFunc::F16; break;
    case 'S':
      // Substitution: "S_" or "S<number>_". The number itself is ignored; the
      // previous parameter's vector size and type are reused.
      if (!eatTerm(param, "_")) {
        eatNumber(param);
        if (!eatTerm(param, "_")) return false;
      }
      res.VectorSize = Prev.VectorSize;
      res.ArgType = Prev.ArgType;
      break;
    default:;
    }
  }
  if (res.ArgType == 0) return false;
  Prev.VectorSize = res.VectorSize;
  Prev.ArgType = res.ArgType;
  return true;
}
|
|
|
|
// Parses the part of an Itanium-mangled name that follows "_Z": the
// length-prefixed function name (with an optional native_/half_ prefix) and
// then as many parameters as are needed to recover the rule's lead arguments.
// Fills in FKind, FuncId and Leads. Returns false when the name is unknown or
// a parameter cannot be parsed.
bool AMDGPUMangledLibFunc::parseFuncName(StringRef &mangledName) {
  StringRef BaseName = eatLengthPrefixedName(mangledName);
  FKind = parseNamePrefix(BaseName);
  if (!parseUnmangledName(BaseName))
    return false;

  const ManglingRule &Rule = manglingRules[FuncId];
  const int NumToParse = Rule.maxLeadIndex();
  ItaniumParamParser Parser;
  // ArgNo is one-based to match the lead positions stored in the rule.
  for (int ArgNo = 1; ArgNo <= NumToParse; ++ArgNo) {
    Param Parsed;
    if (!Parser.parseItaniumParam(mangledName, Parsed))
      return false;

    if (ArgNo == Rule.Lead[0])
      Leads[0] = Parsed;
    if (ArgNo == Rule.Lead[1])
      Leads[1] = Parsed;
  }
  return true;
}
|
|
|
|
// Looks Name up among the unmangled library functions. On success the function
// id is stored, the name is recorded via setName, and true is returned.
bool AMDGPUUnmangledLibFunc::parseFuncName(StringRef &Name) {
  const bool IsKnown = UnmangledFuncInfo::lookup(Name, FuncId);
  if (IsKnown)
    setName(Name);
  return IsKnown;
}
|
|
|
|
// Parses FuncName into F. Names starting with "_Z" are handled by the mangled
// implementation (with the "_Z" stripped), all others by the unmangled one.
// Returns true on success; on failure, or for an empty name, F.Impl is left
// null and false is returned.
bool AMDGPULibFunc::parse(StringRef FuncName, AMDGPULibFunc &F) {
  if (!FuncName.empty()) {
    if (eatTerm(FuncName, "_Z"))
      F.Impl = std::make_unique<AMDGPUMangledLibFunc>();
    else
      F.Impl = std::make_unique<AMDGPUUnmangledLibFunc>();

    if (F.Impl->parseFuncName(FuncName))
      return true;
  }

  F.Impl = std::unique_ptr<AMDGPULibFuncImpl>();
  return false;
}
|
|
|
|
// Returns the length-prefixed name that follows "_Z" in mangledName, or an
// empty StringRef when mangledName does not start with "_Z".
StringRef AMDGPUMangledLibFunc::getUnmangledName(StringRef mangledName) {
  StringRef Rest = mangledName;
  if (!eatTerm(Rest, "_Z"))
    return StringRef();
  return eatLengthPrefixedName(Rest);
}
|
|
|
|
///////////////////////////////////////////////////////////////////////////////
|
|
// Mangling
|
|
|
|
template <typename Stream>
|
|
void AMDGPUMangledLibFunc::writeName(Stream &OS) const {
|
|
const char *Pfx = "";
|
|
switch (FKind) {
|
|
case NATIVE: Pfx = "native_"; break;
|
|
case HALF: Pfx = "half_"; break;
|
|
default: break;
|
|
}
|
|
if (!Name.empty()) {
|
|
OS << Pfx << Name;
|
|
} else if (FuncId != EI_NONE) {
|
|
OS << Pfx;
|
|
const StringRef& S = manglingRules[FuncId].Name;
|
|
OS.write(S.data(), S.size());
|
|
}
|
|
}
|
|
|
|
// Returns the mangled name of this function; Itanium mangling is the only
// scheme used.
std::string AMDGPUMangledLibFunc::mangle() const {
  return mangleNameItanium();
}
|
|
|
|
///////////////////////////////////////////////////////////////////////////////
|
|
// Itanium Mangling
|
|
|
|
// Maps an argument type to its Itanium encoding: a one- or two-letter builtin
// code for integer and floating-point types, and a length-prefixed "ocl_*"
// name for image, sampler and event types. Any other type is unreachable.
static const char *getItaniumTypeName(AMDGPULibFunc::EType T) {
  switch (T) {
  // Unsigned integers.
  case AMDGPULibFunc::U8:      return "h";
  case AMDGPULibFunc::U16:     return "t";
  case AMDGPULibFunc::U32:     return "j";
  case AMDGPULibFunc::U64:     return "m";
  // Signed integers.
  case AMDGPULibFunc::I8:      return "c";
  case AMDGPULibFunc::I16:     return "s";
  case AMDGPULibFunc::I32:     return "i";
  case AMDGPULibFunc::I64:     return "l";
  // Floating point.
  case AMDGPULibFunc::F16:     return "Dh";
  case AMDGPULibFunc::F32:     return "f";
  case AMDGPULibFunc::F64:     return "d";
  // OpenCL object types.
  case AMDGPULibFunc::IMG1DA:  return "16ocl_image1darray";
  case AMDGPULibFunc::IMG1DB:  return "17ocl_image1dbuffer";
  case AMDGPULibFunc::IMG2DA:  return "16ocl_image2darray";
  case AMDGPULibFunc::IMG1D:   return "11ocl_image1d";
  case AMDGPULibFunc::IMG2D:   return "11ocl_image2d";
  case AMDGPULibFunc::IMG3D:   return "11ocl_image3d";
  case AMDGPULibFunc::SAMPLER: return "11ocl_sampler";
  case AMDGPULibFunc::EVENT:   return "9ocl_event";
  default:
    llvm_unreachable("Unhandeled param type");
  }
  return nullptr;
}
|
|
|
|
namespace {
|
|
// Itanium mangling ABI says:
|
|
// "5.1.8. Compression
|
|
// ... Each non-terminal in the grammar for which <substitution> appears on the
|
|
// right-hand side is both a source of future substitutions and a candidate
|
|
// for being substituted. There are two exceptions that appear to be
|
|
// substitution candidates from the grammar, but are explicitly excluded:
|
|
// 1. <builtin-type> other than vendor extended types ..."
|
|
|
|
// For the purpose of functions the following productions make sense for the
|
|
// substitution:
|
|
// <type> ::= <builtin-type>
|
|
// ::= <class-enum-type>
|
|
// ::= <array-type>
|
|
// ::=<CV-qualifiers> <type>
|
|
// ::= P <type> # pointer-to
|
|
// ::= <substitution>
|
|
//
|
|
// Note that while types like images, samplers and events are by the ABI encoded
|
|
// using <class-enum-type> production rule they're not used for substitution
|
|
// because clang consider them as builtin types.
|
|
//
|
|
// DvNN_ type is GCC extension for vectors and is a subject for the substitution.
|
|
|
|
|
|
class ItaniumMangler {
|
|
SmallVector<AMDGPULibFunc::Param, 10> Str; // list of accumulated substitutions
|
|
bool UseAddrSpace;
|
|
|
|
int findSubst(const AMDGPULibFunc::Param& P) const {
|
|
for(unsigned I = 0; I < Str.size(); ++I) {
|
|
const AMDGPULibFunc::Param& T = Str[I];
|
|
if (P.PtrKind == T.PtrKind &&
|
|
P.VectorSize == T.VectorSize &&
|
|
P.ArgType == T.ArgType) {
|
|
return I;
|
|
}
|
|
}
|
|
return -1;
|
|
}
|
|
|
|
template <typename Stream>
|
|
bool trySubst(Stream& os, const AMDGPULibFunc::Param& p) {
|
|
int const subst = findSubst(p);
|
|
if (subst < 0) return false;
|
|
// Substitutions are mangled as S(XX)?_ where XX is a hexadecimal number
|
|
// 0 1 2
|
|
// S_ S0_ S1_
|
|
if (subst == 0) os << "S_";
|
|
else os << 'S' << (subst-1) << '_';
|
|
return true;
|
|
}
|
|
|
|
public:
|
|
ItaniumMangler(bool useAddrSpace)
|
|
: UseAddrSpace(useAddrSpace) {}
|
|
|
|
template <typename Stream>
|
|
void operator()(Stream& os, AMDGPULibFunc::Param p) {
|
|
|
|
// Itanium mangling ABI 5.1.8. Compression:
|
|
// Logically, the substitutable components of a mangled name are considered
|
|
// left-to-right, components before the composite structure of which they
|
|
// are a part. If a component has been encountered before, it is substituted
|
|
// as described below. This decision is independent of whether its components
|
|
// have been substituted, so an implementation may optimize by considering
|
|
// large structures for substitution before their components. If a component
|
|
// has not been encountered before, its mangling is identified, and it is
|
|
// added to a dictionary of substitution candidates. No entity is added to
|
|
// the dictionary twice.
|
|
AMDGPULibFunc::Param Ptr;
|
|
|
|
if (p.PtrKind) {
|
|
if (trySubst(os, p)) return;
|
|
os << 'P';
|
|
if (p.PtrKind & AMDGPULibFunc::CONST) os << 'K';
|
|
if (p.PtrKind & AMDGPULibFunc::VOLATILE) os << 'V';
|
|
unsigned AS = UseAddrSpace
|
|
? AMDGPULibFuncBase::getAddrSpaceFromEPtrKind(p.PtrKind)
|
|
: 0;
|
|
if (EnableOCLManglingMismatchWA || AS != 0)
|
|
os << "U3AS" << AS;
|
|
Ptr = p;
|
|
p.PtrKind = 0;
|
|
}
|
|
|
|
if (p.VectorSize > 1) {
|
|
if (trySubst(os, p)) goto exit;
|
|
Str.push_back(p);
|
|
os << "Dv" << static_cast<unsigned>(p.VectorSize) << '_';
|
|
}
|
|
|
|
os << getItaniumTypeName((AMDGPULibFunc::EType)p.ArgType);
|
|
|
|
exit:
|
|
if (Ptr.ArgType) Str.push_back(Ptr);
|
|
}
|
|
};
|
|
} // namespace
|
|
|
|
std::string AMDGPUMangledLibFunc::mangleNameItanium() const {
|
|
SmallString<128> Buf;
|
|
raw_svector_ostream S(Buf);
|
|
SmallString<128> NameBuf;
|
|
raw_svector_ostream Name(NameBuf);
|
|
writeName(Name);
|
|
const StringRef& NameStr = Name.str();
|
|
S << "_Z" << static_cast<int>(NameStr.size()) << NameStr;
|
|
|
|
ItaniumMangler Mangler(true);
|
|
ParamIterator I(Leads, manglingRules[FuncId]);
|
|
Param P;
|
|
while ((P = I.getNextParam()).ArgType != 0)
|
|
Mangler(S, P);
|
|
return std::string(S.str());
|
|
}
|
|
|
|
///////////////////////////////////////////////////////////////////////////////
|
|
// Misc
|
|
|
|
// Translates a parameter description into an LLVM type.
//
// Signed and unsigned integers of the same width map to the same integer
// type. Image, sampler and event parameters become pointers to newly created
// named struct types. The element type is wrapped in a fixed vector when
// VectorSize > 1 and in a pointer when the parameter is not passed by value;
// with useAddrSpace the pointer's address space is the ADDR_SPACE bits of
// PtrKind minus one, otherwise the default address space is used.
static Type* getIntrinsicParamType(
  LLVMContext& C,
  const AMDGPULibFunc::Param& P,
  bool useAddrSpace) {
  Type* T = nullptr;
  switch (P.ArgType) {
  case AMDGPULibFunc::U8:
  case AMDGPULibFunc::I8:
    T = Type::getInt8Ty(C);
    break;
  case AMDGPULibFunc::U16:
  case AMDGPULibFunc::I16:
    T = Type::getInt16Ty(C);
    break;
  case AMDGPULibFunc::U32:
  case AMDGPULibFunc::I32:
    T = Type::getInt32Ty(C);
    break;
  case AMDGPULibFunc::U64:
  case AMDGPULibFunc::I64:
    T = Type::getInt64Ty(C);
    break;
  case AMDGPULibFunc::F16:
    T = Type::getHalfTy(C);
    break;
  case AMDGPULibFunc::F32:
    T = Type::getFloatTy(C);
    break;
  case AMDGPULibFunc::F64:
    T = Type::getDoubleTy(C);
    break;

  case AMDGPULibFunc::IMG1DA:
  case AMDGPULibFunc::IMG1DB:
  case AMDGPULibFunc::IMG2DA:
  case AMDGPULibFunc::IMG1D:
  case AMDGPULibFunc::IMG2D:
  case AMDGPULibFunc::IMG3D:
    T = StructType::create(C,"ocl_image")->getPointerTo();
    break;
  case AMDGPULibFunc::SAMPLER:
    T = StructType::create(C,"ocl_sampler")->getPointerTo();
    break;
  case AMDGPULibFunc::EVENT:
    T = StructType::create(C,"ocl_event")->getPointerTo();
    break;
  default:
    llvm_unreachable("Unhandeled param type");
    return nullptr;
  }

  if (P.VectorSize > 1)
    T = FixedVectorType::get(T, P.VectorSize);

  if (P.PtrKind != AMDGPULibFunc::BYVALUE) {
    if (useAddrSpace)
      T = T->getPointerTo((P.PtrKind & AMDGPULibFunc::ADDR_SPACE) - 1);
    else
      T = T->getPointerTo();
  }
  return T;
}
|
|
|
|
// Builds the non-variadic LLVM function type of this library function: the
// argument types come from expanding the mangling rule over the lead
// parameters, the return type from getRetType.
FunctionType *AMDGPUMangledLibFunc::getFunctionType(Module &M) const {
  LLVMContext& C = M.getContext();

  std::vector<Type*> Args;
  ParamIterator I(Leads, manglingRules[FuncId]);
  // A parameter with a zero ArgType marks the end of the list.
  for (Param P = I.getNextParam(); P.ArgType != 0; P = I.getNextParam())
    Args.push_back(getIntrinsicParamType(C, P, true));

  // The return type is created after the argument types, as before.
  Type *RetTy = getIntrinsicParamType(C, getRetType(FuncId, Leads), true);
  return FunctionType::get(RetTy, Args, false);
}
|
|
|
|
unsigned AMDGPUMangledLibFunc::getNumArgs() const {
|
|
return manglingRules[FuncId].getNumArgs();
|
|
}
|
|
|
|
unsigned AMDGPUUnmangledLibFunc::getNumArgs() const {
|
|
return UnmangledFuncInfo::getNumArgs(FuncId);
|
|
}
|
|
|
|
std::string AMDGPUMangledLibFunc::getName() const {
|
|
SmallString<128> Buf;
|
|
raw_svector_ostream OS(Buf);
|
|
writeName(OS);
|
|
return std::string(OS.str());
|
|
}
|
|
|
|
/// Find an existing definition of the library function described by fInfo.
///
/// \param M     module whose value symbol table is searched.
/// \param fInfo library function; its mangled name is the lookup key.
/// \returns the function found under that name when it has a body, is not
///          variadic and takes exactly fInfo.getNumArgs() arguments;
///          nullptr otherwise.
Function *AMDGPULibFunc::getFunction(Module *M, const AMDGPULibFunc &fInfo) {
  const std::string MangledName = fInfo.mangle();
  auto *Candidate =
      dyn_cast_or_null<Function>(M->getValueSymbolTable().lookup(MangledName));

  // No symbol of that name, or the symbol is not a function.
  if (!Candidate)
    return nullptr;

  // Conformance check between formal and actual signature: only definitions
  // with a fixed, matching argument count are accepted.
  if (Candidate->isDeclaration() || Candidate->isVarArg())
    return nullptr;
  if (Candidate->arg_size() != fInfo.getNumArgs())
    return nullptr;

  return Candidate;
}
|
|
|
|
/// Return a callee for the library function described by fInfo, declaring it
/// in M when no suitable definition exists.
///
/// An existing non-variadic definition with a matching argument count is
/// returned as is. Otherwise the function is obtained through
/// Module::getOrInsertFunction with the type from fInfo.getFunctionType();
/// when none of its parameters is a pointer, the ReadOnly and NoUnwind
/// function attributes are passed along.
FunctionCallee AMDGPULibFunc::getOrInsertFunction(Module *M,
                                                  const AMDGPULibFunc &fInfo) {
  const std::string MangledName = fInfo.mangle();

  auto *Existing =
      dyn_cast_or_null<Function>(M->getValueSymbolTable().lookup(MangledName));

  // Conformance check between formal and actual signature.
  const bool Reusable = Existing && !Existing->isDeclaration() &&
                        !Existing->isVarArg() &&
                        Existing->arg_size() == fInfo.getNumArgs();
  if (Reusable)
    return Existing;

  FunctionType *FnTy = fInfo.getFunctionType(*M);

  bool TakesPointer = false;
  for (const Type *ParamTy : FnTy->params()) {
    if (ParamTy->isPointerTy()) {
      TakesPointer = true;
      break;
    }
  }

  // Do not set extra attributes for functions with pointer arguments.
  if (TakesPointer)
    return M->getOrInsertFunction(MangledName, FnTy);

  LLVMContext &Ctx = M->getContext();
  AttributeList Attrs;
  Attrs = Attrs.addFnAttribute(Ctx, Attribute::ReadOnly);
  Attrs = Attrs.addFnAttribute(Ctx, Attribute::NoUnwind);
  return M->getOrInsertFunction(MangledName, FnTy, Attrs);
}
|
|
|
|
/// Build a map from each Table entry's name to its index in Table.
///
/// If a name occurs more than once, the highest index is the one kept.
StringMap<unsigned> UnmangledFuncInfo::buildNameMap() {
  StringMap<unsigned> NameToIndex;
  for (unsigned Idx = 0; Idx < TableSize; ++Idx) {
    const UnmangledFuncInfo &Entry = Table[Idx];
    NameToIndex[Entry.Name] = Idx;
  }
  return NameToIndex;
}
|
|
|
|
/// Resolve an unmangled function name to its identifier.
///
/// \param Name name to search for.
/// \param Id   receives the matching identifier, or AMDGPULibFunc::EI_NONE
///             when the name is unknown.
/// \returns true when Name was found.
bool UnmangledFuncInfo::lookup(StringRef Name, ID &Id) {
  // The name map is built once, on the first call.
  static const StringMap<unsigned> NameToIndex = buildNameMap();

  const auto Found = NameToIndex.find(Name);
  if (Found == NameToIndex.end()) {
    Id = AMDGPULibFunc::EI_NONE;
    return false;
  }

  Id = toFuncId(Found->second);
  return true;
}
|
|
|
|
/// Copy constructor: deep-copies the implementation object owned by F.
///
/// The copy has the same dynamic type as the source implementation (mangled
/// or unmangled). When F owns no implementation, the new object owns none
/// either.
AMDGPULibFunc::AMDGPULibFunc(const AMDGPULibFunc &F) {
  AMDGPULibFuncImpl *Src = F.Impl.get();

  // Src may be null, and plain dyn_cast<> must not be given a null pointer,
  // so the null-tolerant form is required for the empty case below to be
  // reachable.
  if (auto *MF = dyn_cast_or_null<AMDGPUMangledLibFunc>(Src))
    Impl.reset(new AMDGPUMangledLibFunc(*MF));
  else if (auto *UMF = dyn_cast_or_null<AMDGPUUnmangledLibFunc>(Src))
    Impl.reset(new AMDGPUUnmangledLibFunc(*UMF));
  else
    Impl.reset(); // F is empty: stay empty.
}
|
|
|
|
/// Copy assignment: replaces this object's implementation with a deep copy
/// of F's.
///
/// \returns *this.
AMDGPULibFunc &AMDGPULibFunc::operator=(const AMDGPULibFunc &F) {
  if (this == &F)
    return *this;

  // Copy first, then swap. The implementation previously owned by *this ends
  // up in Copy and is released by Copy's destructor. Constructing a new object
  // in place over *this would overwrite Impl without destroying it and leak
  // the old implementation.
  // NOTE(review): assumes Impl is the only state of AMDGPULibFunc, as the
  // copy constructor suggests - confirm against the class declaration.
  AMDGPULibFunc Copy(F);
  Impl.swap(Copy.Impl);
  return *this;
}
|
|
|
|
/// Construct a mangled library function with identifier Id from the mangled
/// implementation of CopyFrom.
///
/// Both Id and CopyFrom must be mangled; this is asserted.
AMDGPULibFunc::AMDGPULibFunc(EFuncId Id, const AMDGPULibFunc &CopyFrom) {
  assert(AMDGPULibFuncBase::isMangled(Id) && CopyFrom.isMangled() &&
         "not supported");

  const auto *Source = cast<AMDGPUMangledLibFunc>(CopyFrom.Impl.get());
  Impl.reset(new AMDGPUMangledLibFunc(Id, *Source));
}
|
|
|
|
/// Construct an unmangled library function from its name and function type.
AMDGPULibFunc::AMDGPULibFunc(StringRef Name, FunctionType *FT)
    : Impl(new AMDGPUUnmangledLibFunc(Name, FT)) {}
|
|
|
|
/// Replace the current implementation with a default-constructed mangled one.
void AMDGPULibFunc::initMangled() {
  Impl.reset(new AMDGPUMangledLibFunc());
}
|
|
|
|
/// Mutable access to the Leads array of the mangled implementation.
///
/// A mangled implementation is created first when none exists yet. An
/// existing implementation must be a mangled one (enforced by cast<>).
AMDGPULibFunc::Param *AMDGPULibFunc::getLeads() {
  if (!Impl)
    initMangled();

  auto *Mangled = cast<AMDGPUMangledLibFunc>(Impl.get());
  return Mangled->Leads;
}
|
|
|
|
/// Read-only access to the Leads array of the mangled implementation.
///
/// Unlike the non-const overload, no implementation is created here; the
/// object must already hold a mangled implementation (enforced by cast<>).
const AMDGPULibFunc::Param *AMDGPULibFunc::getLeads() const {
  const auto *Mangled = cast<const AMDGPUMangledLibFunc>(Impl.get());
  return Mangled->Leads;
}
|