Unverified commit 4f4cad7e, authored by Weile and committed by GitHub
Browse files

Add CUDA support for hipDeviceAttributeWarpSize (#205)

Add macro definition to map hipDeviceAttributeWarpSize to cudaDevAttrWarpSize
for CUDA compatibility in the GetWarpSize() function.
parent fbb3a80e
...@@ -460,6 +460,7 @@ namespace TransferBench ...@@ -460,6 +460,7 @@ namespace TransferBench
// Enumerations // Enumerations
#define hipDeviceAttributeClockRate cudaDevAttrClockRate #define hipDeviceAttributeClockRate cudaDevAttrClockRate
#define hipDeviceAttributeMultiprocessorCount cudaDevAttrMultiProcessorCount #define hipDeviceAttributeMultiprocessorCount cudaDevAttrMultiProcessorCount
#define hipDeviceAttributeWarpSize cudaDevAttrWarpSize
#define hipErrorPeerAccessAlreadyEnabled cudaErrorPeerAccessAlreadyEnabled #define hipErrorPeerAccessAlreadyEnabled cudaErrorPeerAccessAlreadyEnabled
#define hipFuncCachePreferShared cudaFuncCachePreferShared #define hipFuncCachePreferShared cudaFuncCachePreferShared
#define hipMemcpyDefault cudaMemcpyDefault #define hipMemcpyDefault cudaMemcpyDefault
...@@ -4104,6 +4105,7 @@ static bool IsConfiguredGid(union ibv_gid const& gid) ...@@ -4104,6 +4105,7 @@ static bool IsConfiguredGid(union ibv_gid const& gid)
#undef hipDeviceAttributeClockRate #undef hipDeviceAttributeClockRate
#undef hipDeviceAttributeMaxSharedMemoryPerMultiprocessor #undef hipDeviceAttributeMaxSharedMemoryPerMultiprocessor
#undef hipDeviceAttributeMultiprocessorCount #undef hipDeviceAttributeMultiprocessorCount
#undef hipDeviceAttributeWarpSize
#undef hipErrorPeerAccessAlreadyEnabled #undef hipErrorPeerAccessAlreadyEnabled
#undef hipFuncCachePreferShared #undef hipFuncCachePreferShared
#undef hipMemcpyDefault #undef hipMemcpyDefault
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment