forked from OSchip/llvm-project
[CUDA][HIP] Allow function-scope static const variable
CUDA 8.0 E.3.9.4 says: Within the body of a __device__ or __global__ function, only __shared__ variables or variables without any device memory qualifiers may be declared with static storage class. It is unclear how a function-scope non-const static variable without device memory qualifier is implemented, therefore only static const variable without device memory qualifier is allowed, which can be emitted as a global variable in constant address space. Currently clang only allows function-scope static variable with __shared__ qualifier. This patch also allows function-scope static const variable without device memory qualifier and emits it as a global variable in constant address space. Differential Revision: https://reviews.llvm.org/D49931 llvm-svn: 338188
This commit is contained in:
parent
39e5137f43
commit
a4005e13f7
clang
include/clang/Basic
lib
test
|
@ -7129,7 +7129,8 @@ def err_shared_var_init : Error<
|
||||||
"initialization is not supported for __shared__ variables.">;
|
"initialization is not supported for __shared__ variables.">;
|
||||||
def err_device_static_local_var : Error<
|
def err_device_static_local_var : Error<
|
||||||
"within a %select{__device__|__global__|__host__|__host__ __device__}0 "
|
"within a %select{__device__|__global__|__host__|__host__ __device__}0 "
|
||||||
"function, only __shared__ variables may be marked 'static'">;
|
"function, only __shared__ variables or const variables without device "
|
||||||
|
"memory qualifier may be marked 'static'">;
|
||||||
def err_cuda_vla : Error<
|
def err_cuda_vla : Error<
|
||||||
"cannot use variable-length arrays in "
|
"cannot use variable-length arrays in "
|
||||||
"%select{__device__|__global__|__host__|__host__ __device__}0 functions">;
|
"%select{__device__|__global__|__host__|__host__ __device__}0 functions">;
|
||||||
|
|
|
@ -3176,6 +3176,10 @@ LangAS CodeGenModule::GetGlobalVarAddressSpace(const VarDecl *D) {
|
||||||
return LangAS::cuda_constant;
|
return LangAS::cuda_constant;
|
||||||
else if (D && D->hasAttr<CUDASharedAttr>())
|
else if (D && D->hasAttr<CUDASharedAttr>())
|
||||||
return LangAS::cuda_shared;
|
return LangAS::cuda_shared;
|
||||||
|
else if (D && D->hasAttr<CUDADeviceAttr>())
|
||||||
|
return LangAS::cuda_device;
|
||||||
|
else if (D && D->getType().isConstQualified())
|
||||||
|
return LangAS::cuda_constant;
|
||||||
else
|
else
|
||||||
return LangAS::cuda_device;
|
return LangAS::cuda_device;
|
||||||
}
|
}
|
||||||
|
|
|
@ -11914,14 +11914,25 @@ void Sema::FinalizeDeclaration(Decl *ThisDecl) {
|
||||||
NewAttr->setInherited(true);
|
NewAttr->setInherited(true);
|
||||||
VD->addAttr(NewAttr);
|
VD->addAttr(NewAttr);
|
||||||
}
|
}
|
||||||
// CUDA E.2.9.4: Within the body of a __device__ or __global__
|
// CUDA 8.0 E.3.9.4: Within the body of a __device__ or __global__
|
||||||
// function, only __shared__ variables may be declared with
|
// function, only __shared__ variables or variables without any device
|
||||||
// static storage class.
|
// memory qualifiers may be declared with static storage class.
|
||||||
if (getLangOpts().CUDA && !VD->hasAttr<CUDASharedAttr>() &&
|
// Note: It is unclear how a function-scope non-const static variable
|
||||||
CUDADiagIfDeviceCode(VD->getLocation(),
|
// without device memory qualifier is implemented, therefore only static
|
||||||
diag::err_device_static_local_var)
|
// const variable without device memory qualifier is allowed.
|
||||||
<< CurrentCUDATarget())
|
[&]() {
|
||||||
VD->setInvalidDecl();
|
if (!getLangOpts().CUDA)
|
||||||
|
return;
|
||||||
|
if (VD->hasAttr<CUDASharedAttr>())
|
||||||
|
return;
|
||||||
|
if (VD->getType().isConstQualified() &&
|
||||||
|
!(VD->hasAttr<CUDADeviceAttr>() || VD->hasAttr<CUDAConstantAttr>()))
|
||||||
|
return;
|
||||||
|
if (CUDADiagIfDeviceCode(VD->getLocation(),
|
||||||
|
diag::err_device_static_local_var)
|
||||||
|
<< CurrentCUDATarget())
|
||||||
|
VD->setInvalidDecl();
|
||||||
|
}();
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -112,6 +112,9 @@ __constant__ EC_I_EC c_ec_i_ec;
|
||||||
// CHECK: @_ZZ2dfvE4s_ec = internal addrspace(3) global %struct.EC undef
|
// CHECK: @_ZZ2dfvE4s_ec = internal addrspace(3) global %struct.EC undef
|
||||||
// CHECK: @_ZZ2dfvE5s_etc = internal addrspace(3) global %struct.ETC undef
|
// CHECK: @_ZZ2dfvE5s_etc = internal addrspace(3) global %struct.ETC undef
|
||||||
|
|
||||||
|
// CHECK: @_ZZ2dfvE11const_array = internal addrspace(4) constant [5 x i32] [i32 1, i32 2, i32 3, i32 4, i32 5]
|
||||||
|
// CHECK: @_ZZ2dfvE9const_int = internal addrspace(4) constant i32 123
|
||||||
|
|
||||||
// We should not emit global initializers for device-side variables.
|
// We should not emit global initializers for device-side variables.
|
||||||
// CHECK-NOT: @__cxx_global_var_init
|
// CHECK-NOT: @__cxx_global_var_init
|
||||||
|
|
||||||
|
@ -234,6 +237,9 @@ __device__ void df() {
|
||||||
static __shared__ ETC s_etc;
|
static __shared__ ETC s_etc;
|
||||||
// CHECK-NOT: call void @_ZN3ETCC1IJEEEDpT_(%struct.ETC* addrspacecast (%struct.ETC addrspace(3)* @_ZZ2dfvE5s_etc to %struct.ETC*))
|
// CHECK-NOT: call void @_ZN3ETCC1IJEEEDpT_(%struct.ETC* addrspacecast (%struct.ETC addrspace(3)* @_ZZ2dfvE5s_etc to %struct.ETC*))
|
||||||
|
|
||||||
|
static const int const_array[] = {1, 2, 3, 4, 5};
|
||||||
|
static const int const_int = 123;
|
||||||
|
|
||||||
// anchor point separating constructors and destructors
|
// anchor point separating constructors and destructors
|
||||||
df(); // CHECK: call void @_Z2dfv()
|
df(); // CHECK: call void @_Z2dfv()
|
||||||
|
|
||||||
|
|
|
@ -207,17 +207,22 @@ __device__ void df_sema() {
|
||||||
// expected-error@-1 {{initialization is not supported for __shared__ variables.}}
|
// expected-error@-1 {{initialization is not supported for __shared__ variables.}}
|
||||||
|
|
||||||
static __device__ int ds;
|
static __device__ int ds;
|
||||||
// expected-error@-1 {{within a __device__ function, only __shared__ variables may be marked 'static'}}
|
// expected-error@-1 {{within a __device__ function, only __shared__ variables or const variables without device memory qualifier may be marked 'static'}}
|
||||||
static __constant__ int dc;
|
static __constant__ int dc;
|
||||||
// expected-error@-1 {{within a __device__ function, only __shared__ variables may be marked 'static'}}
|
// expected-error@-1 {{within a __device__ function, only __shared__ variables or const variables without device memory qualifier may be marked 'static'}}
|
||||||
static int v;
|
static int v;
|
||||||
// expected-error@-1 {{within a __device__ function, only __shared__ variables may be marked 'static'}}
|
// expected-error@-1 {{within a __device__ function, only __shared__ variables or const variables without device memory qualifier may be marked 'static'}}
|
||||||
|
static const int cv = 1;
|
||||||
|
static const __device__ int cds = 1;
|
||||||
|
// expected-error@-1 {{within a __device__ function, only __shared__ variables or const variables without device memory qualifier may be marked 'static'}}
|
||||||
|
static const __constant__ int cdc = 1;
|
||||||
|
// expected-error@-1 {{within a __device__ function, only __shared__ variables or const variables without device memory qualifier may be marked 'static'}}
|
||||||
}
|
}
|
||||||
|
|
||||||
__host__ __device__ void hd_sema() {
|
__host__ __device__ void hd_sema() {
|
||||||
static int x = 42;
|
static int x = 42;
|
||||||
#ifdef __CUDA_ARCH__
|
#ifdef __CUDA_ARCH__
|
||||||
// expected-error@-2 {{within a __host__ __device__ function, only __shared__ variables may be marked 'static'}}
|
// expected-error@-2 {{within a __host__ __device__ function, only __shared__ variables or const variables without device memory qualifier may be marked 'static'}}
|
||||||
#endif
|
#endif
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
Loading…
Reference in New Issue