llvm-project/clang/lib/Headers/__clang_cuda_builtin_vars.h

/*===---- __clang_cuda_builtin_vars.h - CUDA built-in variables -------------===
 *
 * Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
 * See https://llvm.org/LICENSE.txt for license information.
 * SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
 *
 *===-----------------------------------------------------------------------===
 */

#ifndef __CUDA_BUILTIN_VARS_H
#define __CUDA_BUILTIN_VARS_H

// Forward declares from vector_types.h.
// Only the type names are needed at this point: the conversion operators
// declared on the built-in variable types below mention uint3/dim3 as return
// types but are not defined in this header.
struct uint3;
struct dim3;

// The file implements built-in CUDA variables using __declspec(property).
// https://msdn.microsoft.com/en-us/library/yhfk0thd.aspx
// All read accesses of built-in variable fields get converted into calls to a
// getter function which in turn calls the appropriate builtin to fetch the
// value.
//
// Example:
//    int x = threadIdx.x;
// IR output:
//  %0 = call i32 @llvm.nvvm.read.ptx.sreg.tid.x() #3
// PTX output:
//  mov.u32     %r2, %tid.x;

// Adds a read-only pseudo-member FIELD (unsigned int) to the enclosing struct.
// FIELD is a __declspec(property) whose getter is the static member function
// __fetch_builtin_<FIELD>; that getter is forced inline, is a device function,
// and just returns INTRINSIC.  No setter is registered for the property.
#define __CUDA_DEVICE_BUILTIN(FIELD, INTRINSIC)                                \
  __declspec(property(get = __fetch_builtin_##FIELD)) unsigned int FIELD;      \
  __attribute__((device)) __attribute__((always_inline)) static inline         \
      unsigned int __fetch_builtin_##FIELD() {                                 \
    return INTRINSIC;                                                          \
  }

// __DELETE marks a member function as deleted where the dialect supports it
// (C++11 and newer) and expands to nothing in older dialects.
#if __cplusplus < 201103L
#define __DELETE
#else
#define __DELETE =delete
#endif

// Make sure nobody can create instances of the special variable types.  nvcc
// also disallows taking address of special variables, so we disable address-of
// operator as well.
//
// Expands to device-side declarations of TypeName's default constructor, copy
// constructor, copy-assignment operator and unary operator&, each followed by
// __DELETE.  With C++11 or newer these become deleted functions; in older
// dialects __DELETE is empty, so they are only declared, with no definition in
// this header.  The assignment and address-of operators are const-qualified.
// The expansion ends without a semicolon; the invocation supplies it.
#define __CUDA_DISALLOW_BUILTINVAR_ACCESS(TypeName)                            \
  __attribute__((device)) TypeName() __DELETE;                                 \
  __attribute__((device)) TypeName(const TypeName &) __DELETE;                 \
  __attribute__((device)) void operator=(const TypeName &) const __DELETE;     \
  __attribute__((device)) TypeName *operator&() const __DELETE

// Type of the built-in `threadIdx` variable.  Its x/y/z members are read-only
// properties that return the tid.{x,y,z} special-register builtins.
struct __cuda_builtin_threadIdx_t {
  __CUDA_DEVICE_BUILTIN(x, __nvvm_read_ptx_sreg_tid_x());
  __CUDA_DEVICE_BUILTIN(y, __nvvm_read_ptx_sreg_tid_y());
  __CUDA_DEVICE_BUILTIN(z, __nvvm_read_ptx_sreg_tid_z());

  // In nvcc threadIdx *is* a uint3, so it must at least convert to one.  Only
  // the declaration lives here; the definition follows once vector_types.h has
  // been pulled in.
  __attribute__((device)) operator uint3() const;

private:
  // Construction, copying, assignment and address-of are all disallowed.
  __CUDA_DISALLOW_BUILTINVAR_ACCESS(__cuda_builtin_threadIdx_t);
};

// Type of the built-in `blockIdx` variable.  Its x/y/z members are read-only
// properties that return the ctaid.{x,y,z} special-register builtins.
struct __cuda_builtin_blockIdx_t {
  __CUDA_DEVICE_BUILTIN(x, __nvvm_read_ptx_sreg_ctaid_x());
  __CUDA_DEVICE_BUILTIN(y, __nvvm_read_ptx_sreg_ctaid_y());
  __CUDA_DEVICE_BUILTIN(z, __nvvm_read_ptx_sreg_ctaid_z());

  // In nvcc blockIdx *is* a uint3, so it must at least convert to one.  Only
  // the declaration lives here; the definition follows once vector_types.h has
  // been pulled in.
  __attribute__((device)) operator uint3() const;

private:
  // Construction, copying, assignment and address-of are all disallowed.
  __CUDA_DISALLOW_BUILTINVAR_ACCESS(__cuda_builtin_blockIdx_t);
};

// Type of the built-in `blockDim` variable.  Its x/y/z members are read-only
// properties that return the ntid.{x,y,z} special-register builtins.
struct __cuda_builtin_blockDim_t {
  __CUDA_DEVICE_BUILTIN(x, __nvvm_read_ptx_sreg_ntid_x());
  __CUDA_DEVICE_BUILTIN(y, __nvvm_read_ptx_sreg_ntid_y());
  __CUDA_DEVICE_BUILTIN(z, __nvvm_read_ptx_sreg_ntid_z());

  // In nvcc blockDim *is* a dim3, so it must at least convert to one.  Only
  // the declaration lives here; the definition follows once vector_types.h has
  // been pulled in.
  __attribute__((device)) operator dim3() const;

private:
  // Construction, copying, assignment and address-of are all disallowed.
  __CUDA_DISALLOW_BUILTINVAR_ACCESS(__cuda_builtin_blockDim_t);
};

// Type of the built-in `gridDim` variable.  Its x/y/z members are read-only
// properties that return the nctaid.{x,y,z} special-register builtins.
struct __cuda_builtin_gridDim_t {
  __CUDA_DEVICE_BUILTIN(x, __nvvm_read_ptx_sreg_nctaid_x());
  __CUDA_DEVICE_BUILTIN(y, __nvvm_read_ptx_sreg_nctaid_y());
  __CUDA_DEVICE_BUILTIN(z, __nvvm_read_ptx_sreg_nctaid_z());

  // In nvcc gridDim *is* a dim3, so it must at least convert to one.  Only
  // the declaration lives here; the definition follows once vector_types.h has
  // been pulled in.
  __attribute__((device)) operator dim3() const;

private:
  // Construction, copying, assignment and address-of are all disallowed.
  __CUDA_DISALLOW_BUILTINVAR_ACCESS(__cuda_builtin_gridDim_t);
};

// Declarations (not definitions) of the four built-in variables.  Each one is
// an extern, const, weak, device-side object of the matching struct type
// defined above.  The x/y/z getters generated by __CUDA_DEVICE_BUILTIN are
// static member functions that return an intrinsic, so reading a field does
// not touch the object itself.
#define __CUDA_BUILTIN_VAR                                                     \
  extern const __attribute__((device)) __attribute__((weak))
__CUDA_BUILTIN_VAR __cuda_builtin_threadIdx_t threadIdx;
__CUDA_BUILTIN_VAR __cuda_builtin_blockIdx_t blockIdx;
__CUDA_BUILTIN_VAR __cuda_builtin_blockDim_t blockDim;
__CUDA_BUILTIN_VAR __cuda_builtin_gridDim_t gridDim;

// warpSize should translate to read of %WARP_SZ but there's currently no
// builtin to do so. According to PTX v4.2 docs 'to date, all target
// architectures have a WARP_SZ value of 32'.
// Until such a builtin exists, the value is hard-coded here as a device-side
// constant instead of being read from the hardware.
__attribute__((device)) const int warpSize = 32;

// Remove every helper macro this header defined so that none of them leaks
// into code that includes it.  __DELETE is one of those helpers (it is defined
// above alongside __CUDA_DISALLOW_BUILTINVAR_ACCESS) and has to be dropped
// with the rest; otherwise it would stay visible as a macro in every
// translation unit that includes this header.
#undef __CUDA_DEVICE_BUILTIN
#undef __CUDA_BUILTIN_VAR
#undef __CUDA_DISALLOW_BUILTINVAR_ACCESS
#undef __DELETE

#endif /* __CUDA_BUILTIN_VARS_H */
[cuda] Added support for CUDA built-in variables. Added cuda_builtin_vars.h which implements built-in CUDA variables using __declattr(property). Fields of built-in variables (except for warpSize) are implemented using __declattr(property) which replaces read/write of a member field with a call to a getter/setter member function, in this case with appropriate NVPTX builtin. Added a test case to check diagnostics on attempt to construct or improperly access a built-in variable. Differential Revision: http://reviews.llvm.org/D9064 llvm-svn: 235448 2015-04-22 06:14:13 +08:00			`/*===---- cuda_builtin_vars.h - CUDA built-in variables ---------------------===`
			`*`
Move the builtin headers to use the new license file header. Summary: These all had somewhat custom file headers with different text from the ones I searched for previously, and so I missed them. Thanks to Hal and Kristina and others who prompted me to fix this, and sorry it took so long. Reviewers: hfinkel Subscribers: mcrosier, javed.absar, cfe-commits Tags: #clang Differential Revision: https://reviews.llvm.org/D60406 llvm-svn: 357941 2019-04-09 04:51:30 +08:00			`* Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.`
			`* See https://llvm.org/LICENSE.txt for license information.`
			`* SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception`
[cuda] Added support for CUDA built-in variables. Added cuda_builtin_vars.h which implements built-in CUDA variables using __declattr(property). Fields of built-in variables (except for warpSize) are implemented using __declattr(property) which replaces read/write of a member field with a call to a getter/setter member function, in this case with appropriate NVPTX builtin. Added a test case to check diagnostics on attempt to construct or improperly access a built-in variable. Differential Revision: http://reviews.llvm.org/D9064 llvm-svn: 235448 2015-04-22 06:14:13 +08:00			`*`
			`*===-----------------------------------------------------------------------===`
			`*/`

			`#ifndef __CUDA_BUILTIN_VARS_H`
			`#define __CUDA_BUILTIN_VARS_H`

[CUDA] Add conversion operators for threadIdx, blockIdx, gridDim, and blockDim to uint3 and dim3. Summary: This lets you write, e.g. uint3 a = threadIdx; uint3 b = blockIdx; dim3 c = gridDim; dim3 d = blockDim; which is legal in nvcc, but was not legal in clang. The fact that e.g. the type of threadIdx is not actually uint3 is still observable, but now you have to try to observe it. Reviewers: tra Subscribers: echristo, cfe-commits Differential Revision: http://reviews.llvm.org/D17561 llvm-svn: 261777 2016-02-25 05:49:33 +08:00			`// Forward declares from vector_types.h.`
			`struct uint3;`
			`struct dim3;`

[cuda] Added support for CUDA built-in variables. Added cuda_builtin_vars.h which implements built-in CUDA variables using __declattr(property). Fields of built-in variables (except for warpSize) are implemented using __declattr(property) which replaces read/write of a member field with a call to a getter/setter member function, in this case with appropriate NVPTX builtin. Added a test case to check diagnostics on attempt to construct or improperly access a built-in variable. Differential Revision: http://reviews.llvm.org/D9064 llvm-svn: 235448 2015-04-22 06:14:13 +08:00			`// The file implements built-in CUDA variables using __declspec(property).`
			`// https://msdn.microsoft.com/en-us/library/yhfk0thd.aspx`
			`// All read accesses of built-in variable fields get converted into calls to a`
[CUDA] Add conversion operators for threadIdx, blockIdx, gridDim, and blockDim to uint3 and dim3. Summary: This lets you write, e.g. uint3 a = threadIdx; uint3 b = blockIdx; dim3 c = gridDim; dim3 d = blockDim; which is legal in nvcc, but was not legal in clang. The fact that e.g. the type of threadIdx is not actually uint3 is still observable, but now you have to try to observe it. Reviewers: tra Subscribers: echristo, cfe-commits Differential Revision: http://reviews.llvm.org/D17561 llvm-svn: 261777 2016-02-25 05:49:33 +08:00			`// getter function which in turn calls the appropriate builtin to fetch the`
[cuda] Added support for CUDA built-in variables. Added cuda_builtin_vars.h which implements built-in CUDA variables using __declattr(property). Fields of built-in variables (except for warpSize) are implemented using __declattr(property) which replaces read/write of a member field with a call to a getter/setter member function, in this case with appropriate NVPTX builtin. Added a test case to check diagnostics on attempt to construct or improperly access a built-in variable. Differential Revision: http://reviews.llvm.org/D9064 llvm-svn: 235448 2015-04-22 06:14:13 +08:00			`// value.`
			`//`
			`// Example:`
			`// int x = threadIdx.x;`
			`// IR output:`
NVPTX: Use the nvvm builtins to read SRegs rather than the legacy ptx ones The ptx spellings were removed from LLVM in r274769. llvm-svn: 274770 2016-07-08 00:41:08 +08:00			`// %0 = call i32 @llvm.nvvm.read.ptx.sreg.tid.x() #3`
[cuda] Added support for CUDA built-in variables. Added cuda_builtin_vars.h which implements built-in CUDA variables using __declattr(property). Fields of built-in variables (except for warpSize) are implemented using __declattr(property) which replaces read/write of a member field with a call to a getter/setter member function, in this case with appropriate NVPTX builtin. Added a test case to check diagnostics on attempt to construct or improperly access a built-in variable. Differential Revision: http://reviews.llvm.org/D9064 llvm-svn: 235448 2015-04-22 06:14:13 +08:00			`// PTX output:`
			`// mov.u32 %r2, %tid.x;`

			`#define __CUDA_DEVICE_BUILTIN(FIELD, INTRINSIC) \`
			`__declspec(property(get = __fetch_builtin_##FIELD)) unsigned int FIELD; \`
			`static inline __attribute__((always_inline)) \`
			`__attribute__((device)) unsigned int __fetch_builtin_##FIELD(void) { \`
			`return INTRINSIC; \`
			`}`

			`#if __cplusplus >= 201103L`
			`#define __DELETE =delete`
			`#else`
			`#define __DELETE`
			`#endif`

Fix typos in clang Found via codespell -q 3 -I ../clang-whitelist.txt Where whitelist consists of: archtype cas classs checkk compres definit frome iff inteval ith lod methode nd optin ot pres statics te thru Patch by luzpaz! (This is a subset of D44188 that applies cleanly with a few files that have dubious fixes reverted.) Differential revision: https://reviews.llvm.org/D44188 llvm-svn: 329399 2018-04-06 23:14:32 +08:00			`// Make sure nobody can create instances of the special variable types. nvcc`
[cuda] Added support for CUDA built-in variables. Added cuda_builtin_vars.h which implements built-in CUDA variables using __declattr(property). Fields of built-in variables (except for warpSize) are implemented using __declattr(property) which replaces read/write of a member field with a call to a getter/setter member function, in this case with appropriate NVPTX builtin. Added a test case to check diagnostics on attempt to construct or improperly access a built-in variable. Differential Revision: http://reviews.llvm.org/D9064 llvm-svn: 235448 2015-04-22 06:14:13 +08:00			`// also disallows taking address of special variables, so we disable address-of`
			`// operator as well.`
			`#define __CUDA_DISALLOW_BUILTINVAR_ACCESS(TypeName) \`
			`__attribute__((device)) TypeName() __DELETE; \`
			`__attribute__((device)) TypeName(const TypeName &) __DELETE; \`
			`__attribute__((device)) void operator=(const TypeName &) const __DELETE; \`
			`__attribute__((device)) TypeName *operator&() const __DELETE`

			`struct __cuda_builtin_threadIdx_t {`
NVPTX: Use the nvvm builtins to read SRegs rather than the legacy ptx ones The ptx spellings were removed from LLVM in r274769. llvm-svn: 274770 2016-07-08 00:41:08 +08:00			`__CUDA_DEVICE_BUILTIN(x,__nvvm_read_ptx_sreg_tid_x());`
			`__CUDA_DEVICE_BUILTIN(y,__nvvm_read_ptx_sreg_tid_y());`
			`__CUDA_DEVICE_BUILTIN(z,__nvvm_read_ptx_sreg_tid_z());`
[CUDA] Add conversion operators for threadIdx, blockIdx, gridDim, and blockDim to uint3 and dim3. Summary: This lets you write, e.g. uint3 a = threadIdx; uint3 b = blockIdx; dim3 c = gridDim; dim3 d = blockDim; which is legal in nvcc, but was not legal in clang. The fact that e.g. the type of threadIdx is not actually uint3 is still observable, but now you have to try to observe it. Reviewers: tra Subscribers: echristo, cfe-commits Differential Revision: http://reviews.llvm.org/D17561 llvm-svn: 261777 2016-02-25 05:49:33 +08:00			`// threadIdx should be convertible to uint3 (in fact in nvcc, it is a`
			`// uint3). This function is defined after we pull in vector_types.h.`
			`__attribute__((device)) operator uint3() const;`
[cuda] Added support for CUDA built-in variables. Added cuda_builtin_vars.h which implements built-in CUDA variables using __declattr(property). Fields of built-in variables (except for warpSize) are implemented using __declattr(property) which replaces read/write of a member field with a call to a getter/setter member function, in this case with appropriate NVPTX builtin. Added a test case to check diagnostics on attempt to construct or improperly access a built-in variable. Differential Revision: http://reviews.llvm.org/D9064 llvm-svn: 235448 2015-04-22 06:14:13 +08:00			`private:`
			`__CUDA_DISALLOW_BUILTINVAR_ACCESS(__cuda_builtin_threadIdx_t);`
			`};`

			`struct __cuda_builtin_blockIdx_t {`
NVPTX: Use the nvvm builtins to read SRegs rather than the legacy ptx ones The ptx spellings were removed from LLVM in r274769. llvm-svn: 274770 2016-07-08 00:41:08 +08:00			`__CUDA_DEVICE_BUILTIN(x,__nvvm_read_ptx_sreg_ctaid_x());`
			`__CUDA_DEVICE_BUILTIN(y,__nvvm_read_ptx_sreg_ctaid_y());`
			`__CUDA_DEVICE_BUILTIN(z,__nvvm_read_ptx_sreg_ctaid_z());`
[CUDA] Add conversion operators for threadIdx, blockIdx, gridDim, and blockDim to uint3 and dim3. Summary: This lets you write, e.g. uint3 a = threadIdx; uint3 b = blockIdx; dim3 c = gridDim; dim3 d = blockDim; which is legal in nvcc, but was not legal in clang. The fact that e.g. the type of threadIdx is not actually uint3 is still observable, but now you have to try to observe it. Reviewers: tra Subscribers: echristo, cfe-commits Differential Revision: http://reviews.llvm.org/D17561 llvm-svn: 261777 2016-02-25 05:49:33 +08:00			`// blockIdx should be convertible to uint3 (in fact in nvcc, it is a`
			`// uint3). This function is defined after we pull in vector_types.h.`
			`__attribute__((device)) operator uint3() const;`
[cuda] Added support for CUDA built-in variables. Added cuda_builtin_vars.h which implements built-in CUDA variables using __declattr(property). Fields of built-in variables (except for warpSize) are implemented using __declattr(property) which replaces read/write of a member field with a call to a getter/setter member function, in this case with appropriate NVPTX builtin. Added a test case to check diagnostics on attempt to construct or improperly access a built-in variable. Differential Revision: http://reviews.llvm.org/D9064 llvm-svn: 235448 2015-04-22 06:14:13 +08:00			`private:`
			`__CUDA_DISALLOW_BUILTINVAR_ACCESS(__cuda_builtin_blockIdx_t);`
			`};`

			`struct __cuda_builtin_blockDim_t {`
NVPTX: Use the nvvm builtins to read SRegs rather than the legacy ptx ones The ptx spellings were removed from LLVM in r274769. llvm-svn: 274770 2016-07-08 00:41:08 +08:00			`__CUDA_DEVICE_BUILTIN(x,__nvvm_read_ptx_sreg_ntid_x());`
			`__CUDA_DEVICE_BUILTIN(y,__nvvm_read_ptx_sreg_ntid_y());`
			`__CUDA_DEVICE_BUILTIN(z,__nvvm_read_ptx_sreg_ntid_z());`
[CUDA] Add conversion operators for threadIdx, blockIdx, gridDim, and blockDim to uint3 and dim3. Summary: This lets you write, e.g. uint3 a = threadIdx; uint3 b = blockIdx; dim3 c = gridDim; dim3 d = blockDim; which is legal in nvcc, but was not legal in clang. The fact that e.g. the type of threadIdx is not actually uint3 is still observable, but now you have to try to observe it. Reviewers: tra Subscribers: echristo, cfe-commits Differential Revision: http://reviews.llvm.org/D17561 llvm-svn: 261777 2016-02-25 05:49:33 +08:00			`// blockDim should be convertible to dim3 (in fact in nvcc, it is a`
			`// dim3). This function is defined after we pull in vector_types.h.`
			`__attribute__((device)) operator dim3() const;`
[cuda] Added support for CUDA built-in variables. Added cuda_builtin_vars.h which implements built-in CUDA variables using __declattr(property). Fields of built-in variables (except for warpSize) are implemented using __declattr(property) which replaces read/write of a member field with a call to a getter/setter member function, in this case with appropriate NVPTX builtin. Added a test case to check diagnostics on attempt to construct or improperly access a built-in variable. Differential Revision: http://reviews.llvm.org/D9064 llvm-svn: 235448 2015-04-22 06:14:13 +08:00			`private:`
			`__CUDA_DISALLOW_BUILTINVAR_ACCESS(__cuda_builtin_blockDim_t);`
			`};`

			`struct __cuda_builtin_gridDim_t {`
NVPTX: Use the nvvm builtins to read SRegs rather than the legacy ptx ones The ptx spellings were removed from LLVM in r274769. llvm-svn: 274770 2016-07-08 00:41:08 +08:00			`__CUDA_DEVICE_BUILTIN(x,__nvvm_read_ptx_sreg_nctaid_x());`
			`__CUDA_DEVICE_BUILTIN(y,__nvvm_read_ptx_sreg_nctaid_y());`
			`__CUDA_DEVICE_BUILTIN(z,__nvvm_read_ptx_sreg_nctaid_z());`
[CUDA] Add conversion operators for threadIdx, blockIdx, gridDim, and blockDim to uint3 and dim3. Summary: This lets you write, e.g. uint3 a = threadIdx; uint3 b = blockIdx; dim3 c = gridDim; dim3 d = blockDim; which is legal in nvcc, but was not legal in clang. The fact that e.g. the type of threadIdx is not actually uint3 is still observable, but now you have to try to observe it. Reviewers: tra Subscribers: echristo, cfe-commits Differential Revision: http://reviews.llvm.org/D17561 llvm-svn: 261777 2016-02-25 05:49:33 +08:00			`// gridDim should be convertible to dim3 (in fact in nvcc, it is a`
			`// dim3). This function is defined after we pull in vector_types.h.`
			`__attribute__((device)) operator dim3() const;`
[cuda] Added support for CUDA built-in variables. Added cuda_builtin_vars.h which implements built-in CUDA variables using __declattr(property). Fields of built-in variables (except for warpSize) are implemented using __declattr(property) which replaces read/write of a member field with a call to a getter/setter member function, in this case with appropriate NVPTX builtin. Added a test case to check diagnostics on attempt to construct or improperly access a built-in variable. Differential Revision: http://reviews.llvm.org/D9064 llvm-svn: 235448 2015-04-22 06:14:13 +08:00			`private:`
			`__CUDA_DISALLOW_BUILTINVAR_ACCESS(__cuda_builtin_gridDim_t);`
			`};`

			`#define __CUDA_BUILTIN_VAR \`
			`extern const __attribute__((device)) __attribute__((weak))`
			`__CUDA_BUILTIN_VAR __cuda_builtin_threadIdx_t threadIdx;`
			`__CUDA_BUILTIN_VAR __cuda_builtin_blockIdx_t blockIdx;`
			`__CUDA_BUILTIN_VAR __cuda_builtin_blockDim_t blockDim;`
			`__CUDA_BUILTIN_VAR __cuda_builtin_gridDim_t gridDim;`

			`// warpSize should translate to read of %WARP_SZ but there's currently no`
			`// builtin to do so. According to PTX v4.2 docs 'to date, all target`
			`// architectures have a WARP_SZ value of 32'.`
			`__attribute__((device)) const int warpSize = 32;`

			`#undef __CUDA_DEVICE_BUILTIN`
			`#undef __CUDA_BUILTIN_VAR`
			`#undef __CUDA_DISALLOW_BUILTINVAR_ACCESS`

			`#endif /* __CUDA_BUILTIN_VARS_H */`