CbC/CbC_llvm: clang/lib/Headers/__clang_cuda_builtin_vars.h

annotate clang/lib/Headers/__clang_cuda_builtin_vars.h @ 150:1d019706d866

LLVM10

author	anatofuz
date	Thu, 13 Feb 2020 15:10:13 +0900
parents
children	2e18cbf3894f

rev	line source
150 1d019706d866 LLVM10 anatofuz parents: diff changeset	1 /*===---- cuda_builtin_vars.h - CUDA built-in variables ---------------------===
1d019706d866 LLVM10 anatofuz parents: diff changeset	2 *
1d019706d866 LLVM10 anatofuz parents: diff changeset	3 * Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
1d019706d866 LLVM10 anatofuz parents: diff changeset	4 * See https://llvm.org/LICENSE.txt for license information.
1d019706d866 LLVM10 anatofuz parents: diff changeset	5 * SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
1d019706d866 LLVM10 anatofuz parents: diff changeset	6 *
1d019706d866 LLVM10 anatofuz parents: diff changeset	7 *===-----------------------------------------------------------------------===
1d019706d866 LLVM10 anatofuz parents: diff changeset	8 */
1d019706d866 LLVM10 anatofuz parents: diff changeset	9
1d019706d866 LLVM10 anatofuz parents: diff changeset	10 #ifndef __CUDA_BUILTIN_VARS_H
1d019706d866 LLVM10 anatofuz parents: diff changeset	11 #define __CUDA_BUILTIN_VARS_H
1d019706d866 LLVM10 anatofuz parents: diff changeset	12
1d019706d866 LLVM10 anatofuz parents: diff changeset	13 // Forward declares from vector_types.h.
1d019706d866 LLVM10 anatofuz parents: diff changeset	14 struct uint3;
1d019706d866 LLVM10 anatofuz parents: diff changeset	15 struct dim3;
1d019706d866 LLVM10 anatofuz parents: diff changeset	16
1d019706d866 LLVM10 anatofuz parents: diff changeset	17 // This file implements built-in CUDA variables using __declspec(property).
1d019706d866 LLVM10 anatofuz parents: diff changeset	18 // https://msdn.microsoft.com/en-us/library/yhfk0thd.aspx
1d019706d866 LLVM10 anatofuz parents: diff changeset	19 // All read accesses of built-in variable fields get converted into calls to a
1d019706d866 LLVM10 anatofuz parents: diff changeset	20 // getter function which in turn calls the appropriate builtin to fetch the
1d019706d866 LLVM10 anatofuz parents: diff changeset	21 // value.
1d019706d866 LLVM10 anatofuz parents: diff changeset	22 //
1d019706d866 LLVM10 anatofuz parents: diff changeset	23 // Example:
1d019706d866 LLVM10 anatofuz parents: diff changeset	24 // int x = threadIdx.x;
1d019706d866 LLVM10 anatofuz parents: diff changeset	25 // IR output:
1d019706d866 LLVM10 anatofuz parents: diff changeset	26 // %0 = call i32 @llvm.nvvm.read.ptx.sreg.tid.x() #3
1d019706d866 LLVM10 anatofuz parents: diff changeset	27 // PTX output:
1d019706d866 LLVM10 anatofuz parents: diff changeset	28 // mov.u32 %r2, %tid.x;
1d019706d866 LLVM10 anatofuz parents: diff changeset	29
// Declares an `unsigned int` member named FIELD as a __declspec(property)
// whose getter is the static device function __fetch_builtin_<FIELD>; that
// getter returns the value of the INTRINSIC expression. Only a getter is
// registered for the property (no `put`). Meant to be expanded inside a
// struct body.
#define __CUDA_DEVICE_BUILTIN(FIELD, INTRINSIC) \
  __declspec(property(get = __fetch_builtin_##FIELD)) unsigned int FIELD; \
  static inline __attribute__((always_inline, device)) unsigned int \
      __fetch_builtin_##FIELD(void) { \
    return INTRINSIC; \
  }
1d019706d866 LLVM10 anatofuz parents: diff changeset	36
// __DELETE expands to `=delete` when compiling as C++11 or newer and to
// nothing for older dialects, so the declarations that use it stay valid in
// both cases.
#if __cplusplus < 201103L
#define __DELETE
#else
#define __DELETE =delete
#endif
1d019706d866 LLVM10 anatofuz parents: diff changeset	42
// Prevents user code from creating objects of a special variable type.
// Expands to declarations of TypeName's default constructor, copy
// constructor, copy assignment operator and address-of operator, each
// followed by __DELETE. The address-of operator is included because nvcc
// also rejects taking the address of the special variables.
// The last declaration has no trailing semicolon; the expansion site
// supplies it.
#define __CUDA_DISALLOW_BUILTINVAR_ACCESS(TypeName) \
  __attribute__((device)) TypeName() __DELETE; \
  __attribute__((device)) TypeName(const TypeName &) __DELETE; \
  __attribute__((device)) void operator=(const TypeName &) const __DELETE; \
  __attribute__((device)) TypeName *operator&() const __DELETE
1d019706d866 LLVM10 anatofuz parents: diff changeset	51
1d019706d866 LLVM10 anatofuz parents: diff changeset	52 struct __cuda_builtin_threadIdx_t {
1d019706d866 LLVM10 anatofuz parents: diff changeset	53 __CUDA_DEVICE_BUILTIN(x,__nvvm_read_ptx_sreg_tid_x());
1d019706d866 LLVM10 anatofuz parents: diff changeset	54 __CUDA_DEVICE_BUILTIN(y,__nvvm_read_ptx_sreg_tid_y());
1d019706d866 LLVM10 anatofuz parents: diff changeset	55 __CUDA_DEVICE_BUILTIN(z,__nvvm_read_ptx_sreg_tid_z());
1d019706d866 LLVM10 anatofuz parents: diff changeset	56 // threadIdx should be convertible to uint3 (in fact in nvcc, it is a
1d019706d866 LLVM10 anatofuz parents: diff changeset	57 // uint3). This function is defined after we pull in vector_types.h.
1d019706d866 LLVM10 anatofuz parents: diff changeset	58 __attribute__((device)) operator uint3() const;
1d019706d866 LLVM10 anatofuz parents: diff changeset	59 private:
1d019706d866 LLVM10 anatofuz parents: diff changeset	60 __CUDA_DISALLOW_BUILTINVAR_ACCESS(__cuda_builtin_threadIdx_t);
1d019706d866 LLVM10 anatofuz parents: diff changeset	61 };
1d019706d866 LLVM10 anatofuz parents: diff changeset	62
1d019706d866 LLVM10 anatofuz parents: diff changeset	63 struct __cuda_builtin_blockIdx_t {
1d019706d866 LLVM10 anatofuz parents: diff changeset	64 __CUDA_DEVICE_BUILTIN(x,__nvvm_read_ptx_sreg_ctaid_x());
1d019706d866 LLVM10 anatofuz parents: diff changeset	65 __CUDA_DEVICE_BUILTIN(y,__nvvm_read_ptx_sreg_ctaid_y());
1d019706d866 LLVM10 anatofuz parents: diff changeset	66 __CUDA_DEVICE_BUILTIN(z,__nvvm_read_ptx_sreg_ctaid_z());
1d019706d866 LLVM10 anatofuz parents: diff changeset	67 // blockIdx should be convertible to uint3 (in fact in nvcc, it is a
1d019706d866 LLVM10 anatofuz parents: diff changeset	68 // uint3). This function is defined after we pull in vector_types.h.
1d019706d866 LLVM10 anatofuz parents: diff changeset	69 __attribute__((device)) operator uint3() const;
1d019706d866 LLVM10 anatofuz parents: diff changeset	70 private:
1d019706d866 LLVM10 anatofuz parents: diff changeset	71 __CUDA_DISALLOW_BUILTINVAR_ACCESS(__cuda_builtin_blockIdx_t);
1d019706d866 LLVM10 anatofuz parents: diff changeset	72 };
1d019706d866 LLVM10 anatofuz parents: diff changeset	73
1d019706d866 LLVM10 anatofuz parents: diff changeset	74 struct __cuda_builtin_blockDim_t {
1d019706d866 LLVM10 anatofuz parents: diff changeset	75 __CUDA_DEVICE_BUILTIN(x,__nvvm_read_ptx_sreg_ntid_x());
1d019706d866 LLVM10 anatofuz parents: diff changeset	76 __CUDA_DEVICE_BUILTIN(y,__nvvm_read_ptx_sreg_ntid_y());
1d019706d866 LLVM10 anatofuz parents: diff changeset	77 __CUDA_DEVICE_BUILTIN(z,__nvvm_read_ptx_sreg_ntid_z());
1d019706d866 LLVM10 anatofuz parents: diff changeset	78 // blockDim should be convertible to dim3 (in fact in nvcc, it is a
1d019706d866 LLVM10 anatofuz parents: diff changeset	79 // dim3). This function is defined after we pull in vector_types.h.
1d019706d866 LLVM10 anatofuz parents: diff changeset	80 __attribute__((device)) operator dim3() const;
1d019706d866 LLVM10 anatofuz parents: diff changeset	81 private:
1d019706d866 LLVM10 anatofuz parents: diff changeset	82 __CUDA_DISALLOW_BUILTINVAR_ACCESS(__cuda_builtin_blockDim_t);
1d019706d866 LLVM10 anatofuz parents: diff changeset	83 };
1d019706d866 LLVM10 anatofuz parents: diff changeset	84
1d019706d866 LLVM10 anatofuz parents: diff changeset	85 struct __cuda_builtin_gridDim_t {
1d019706d866 LLVM10 anatofuz parents: diff changeset	86 __CUDA_DEVICE_BUILTIN(x,__nvvm_read_ptx_sreg_nctaid_x());
1d019706d866 LLVM10 anatofuz parents: diff changeset	87 __CUDA_DEVICE_BUILTIN(y,__nvvm_read_ptx_sreg_nctaid_y());
1d019706d866 LLVM10 anatofuz parents: diff changeset	88 __CUDA_DEVICE_BUILTIN(z,__nvvm_read_ptx_sreg_nctaid_z());
1d019706d866 LLVM10 anatofuz parents: diff changeset	89 // gridDim should be convertible to dim3 (in fact in nvcc, it is a
1d019706d866 LLVM10 anatofuz parents: diff changeset	90 // dim3). This function is defined after we pull in vector_types.h.
1d019706d866 LLVM10 anatofuz parents: diff changeset	91 __attribute__((device)) operator dim3() const;
1d019706d866 LLVM10 anatofuz parents: diff changeset	92 private:
1d019706d866 LLVM10 anatofuz parents: diff changeset	93 __CUDA_DISALLOW_BUILTINVAR_ACCESS(__cuda_builtin_gridDim_t);
1d019706d866 LLVM10 anatofuz parents: diff changeset	94 };
1d019706d866 LLVM10 anatofuz parents: diff changeset	95
1d019706d866 LLVM10 anatofuz parents: diff changeset	96 #define __CUDA_BUILTIN_VAR \
1d019706d866 LLVM10 anatofuz parents: diff changeset	97 extern const __attribute__((device)) __attribute__((weak))
1d019706d866 LLVM10 anatofuz parents: diff changeset	98 __CUDA_BUILTIN_VAR __cuda_builtin_threadIdx_t threadIdx;
1d019706d866 LLVM10 anatofuz parents: diff changeset	99 __CUDA_BUILTIN_VAR __cuda_builtin_blockIdx_t blockIdx;
1d019706d866 LLVM10 anatofuz parents: diff changeset	100 __CUDA_BUILTIN_VAR __cuda_builtin_blockDim_t blockDim;
1d019706d866 LLVM10 anatofuz parents: diff changeset	101 __CUDA_BUILTIN_VAR __cuda_builtin_gridDim_t gridDim;
1d019706d866 LLVM10 anatofuz parents: diff changeset	102
// Ideally warpSize would be lowered to a read of %WARP_SZ, but no builtin
// for that exists at present. The constant 32 is used instead, relying on
// the PTX v4.2 documentation's statement that 'to date, all target
// architectures have a WARP_SZ value of 32'.
__attribute__((device)) const int warpSize = 32;
1d019706d866 LLVM10 anatofuz parents: diff changeset	107
// Remove the helper macros so that none of them leaks into code that
// includes this header. __DELETE is defined earlier in this file just like
// the other three and has to be undefined here as well; otherwise the
// macro would remain visible to every includer.
#undef __CUDA_DEVICE_BUILTIN
#undef __CUDA_BUILTIN_VAR
#undef __CUDA_DISALLOW_BUILTINVAR_ACCESS
#undef __DELETE
1d019706d866 LLVM10 anatofuz parents: diff changeset	111
1d019706d866 LLVM10 anatofuz parents: diff changeset	112 #endif /* __CUDA_BUILTIN_VARS_H */

Mercurial > hg > CbC > CbC_llvm

annotate clang/lib/Headers/__clang_cuda_builtin_vars.h @ 150:1d019706d866