Unverified commit 7e099371, authored by Peng and committed by GitHub
Browse files

Merge pull request #23 from ashishfarmer/launch_bounds_fix

Fix launch bounds for cleanup(...) call
parents f2fcce58 a640c63b
......@@ -194,7 +194,11 @@ struct MaxNormFunctor
};
__global__ void cleanup(
__global__ void
#ifdef __HIP_PLATFORM_HCC__
__launch_bounds__(1024)
#endif
cleanup(
float* output,
float* output_per_tensor,
float* ret,
......@@ -231,7 +235,11 @@ __global__ void cleanup(
}
}
__global__ void cleanup_v2(
__global__ void
#ifdef __HIP_PLATFORM_HCC__
__launch_bounds__(1024)
#endif
cleanup_v2(
float* output,
float* output_per_tensor,
float* ret,
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment