Unverified commit ceeab469, authored by gilbertlee-amd and committed by GitHub
Browse files

Another fix for CUDA kernel (#84)

parent 47480a59
...@@ -284,7 +284,9 @@ __global__ void __launch_bounds__(BLOCKSIZE) ...@@ -284,7 +284,9 @@ __global__ void __launch_bounds__(BLOCKSIZE)
__threadfence_system(); __threadfence_system();
p.stopCycle = GetTimestamp(); p.stopCycle = GetTimestamp();
p.startCycle = startCycle; p.startCycle = startCycle;
#if !defined(__NVCC__)
p.xccId = xccId; p.xccId = xccId;
#endif
__trace_hwreg(); __trace_hwreg();
} }
} }
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment