cuda_utils.h 481 Bytes
Newer Older
1
2
#pragma once

#include <cstdint>

3
4
5
6
7
8
9
10
11
12
// Inline/execution-space qualifier macros.
//
// HOST_INLINE, DEVICE_INLINE and HOST_DEVICE_INLINE are always defined after
// this block. When neither __CUDACC__ nor _NVHPC_CUDA is defined, all three
// expand to plain `inline`; otherwise they expand to `__forceinline__`
// combined with the matching `__host__` / `__device__` qualifiers.
#if !defined(__CUDACC__) && !defined(_NVHPC_CUDA)
  // No CUDA compiler macro present: fall back to the standard keyword.
  #define HOST_INLINE inline
  #define DEVICE_INLINE inline
  #define HOST_DEVICE_INLINE inline
#else
  // CUDA compiler macro present: add execution-space qualifiers.
  #define HOST_INLINE __forceinline__ __host__
  #define DEVICE_INLINE __forceinline__ __device__
  #define HOST_DEVICE_INLINE __forceinline__ __host__ __device__
#endif

13
// Prototype only; no definition is visible in this part of the file.
// Takes an attribute selector and a device index (both int64_t) and returns
// an int64_t.
// NOTE(review): presumably `attribute` is a cudaDeviceAttr value forwarded to
// cudaDeviceGetAttribute and the result is that attribute's value for
// `device_id` -- confirm against the definition, including how errors are
// reported.
int64_t get_device_attribute(int64_t attribute, int64_t device_id);
14

15
// Prototype only; no definition is visible in this part of the file.
// Takes a device index (int64_t) and returns an int64_t.
// NOTE(review): judging by the name, this presumably returns the maximum
// shared memory per block for `device_id`; the unit (likely bytes) and whether
// it is the default or the opt-in limit are not shown here -- confirm against
// the definition.
int64_t get_max_shared_memory_per_block_device_attribute(int64_t device_id);