forked from OSchip/llvm-project
[CUDA][HIP] Mark device var used by host only
Add device variables to llvm.compiler.used if they are ODR-used by either host or device functions. This is necessary to prevent them from being eliminated by whole-program optimization where the compiler has no way to know a device variable is used by some host code. Reviewed by: Artem Belevich Differential Revision: https://reviews.llvm.org/D98814
This commit is contained in:
parent
3597f02fd5
commit
d5c0f00e21
|
@ -1089,6 +1089,28 @@ void CGNVCUDARuntime::transformManagedVars() {
|
|||
llvm::Function *CGNVCUDARuntime::finalizeModule() {
|
||||
if (CGM.getLangOpts().CUDAIsDevice) {
|
||||
transformManagedVars();
|
||||
|
||||
// Mark ODR-used device variables as compiler used to prevent it from being
|
||||
// eliminated by optimization. This is necessary for device variables
|
||||
// ODR-used by host functions. Sema correctly marks them as ODR-used no
|
||||
// matter whether they are ODR-used by device or host functions.
|
||||
//
|
||||
// We do not need to do this if the variable has used attribute since it
|
||||
// has already been added.
|
||||
//
|
||||
// Static device variables have been externalized at this point, therefore
|
||||
// variables with LLVM private or internal linkage need not be added.
|
||||
for (auto &&Info : DeviceVars) {
|
||||
auto Kind = Info.Flags.getKind();
|
||||
if (!Info.Var->isDeclaration() &&
|
||||
!llvm::GlobalValue::isLocalLinkage(Info.Var->getLinkage()) &&
|
||||
(Kind == DeviceVarFlags::Variable ||
|
||||
Kind == DeviceVarFlags::Surface ||
|
||||
Kind == DeviceVarFlags::Texture) &&
|
||||
Info.D->isUsed() && !Info.D->hasAttr<UsedAttr>()) {
|
||||
CGM.addCompilerUsedGlobal(Info.Var);
|
||||
}
|
||||
}
|
||||
return nullptr;
|
||||
}
|
||||
return makeModuleCtorFunction();
|
||||
|
|
|
@ -0,0 +1,47 @@
|
|||
// REQUIRES: amdgpu-registered-target
|
||||
// RUN: %clang_cc1 -triple amdgcn-amd-amdhsa -fcuda-is-device -x hip %s \
|
||||
// RUN: -std=c++11 -O3 -mllvm -amdgpu-internalize-symbols -emit-llvm -o - \
|
||||
// RUN: | FileCheck %s
|
||||
|
||||
#include "Inputs/cuda.h"
|
||||
|
||||
// Check device variables used by neither host nor device functioins are not kept.
|
||||
|
||||
// CHECK-NOT: @v1
|
||||
__device__ int v1;
|
||||
|
||||
// CHECK-NOT: @v2
|
||||
__constant__ int v2;
|
||||
|
||||
// CHECK-NOT: @_ZL2v3
|
||||
static __device__ int v3;
|
||||
|
||||
// Check device variables used by host functions are kept.
|
||||
|
||||
// CHECK-DAG: @u1
|
||||
__device__ int u1;
|
||||
|
||||
// CHECK-DAG: @u2
|
||||
__constant__ int u2;
|
||||
|
||||
// Check host-used static device var is in llvm.compiler.used.
|
||||
// CHECK-DAG: @_ZL2u3
|
||||
static __device__ int u3;
|
||||
|
||||
// Check device-used static device var is emitted but is not in llvm.compiler.used.
|
||||
// CHECK-DAG: @_ZL2u4
|
||||
static __device__ int u4;
|
||||
|
||||
// Check device variables with used attribute are always kept.
|
||||
// CHECK-DAG: @u5
|
||||
__device__ __attribute__((used)) int u5;
|
||||
|
||||
int fun1() {
|
||||
return u1 + u2 + u3;
|
||||
}
|
||||
|
||||
__global__ void kern1(int **x) {
|
||||
*x = &u4;
|
||||
}
|
||||
// Check the exact list of variables to ensure @_ZL2u4 is not among them.
|
||||
// CHECK: @llvm.compiler.used = {{[^@]*}} @_ZL2u3 {{[^@]*}} @u1 {{[^@]*}} @u2 {{[^@]*}} @u5
|
Loading…
Reference in New Issue