Commit 59b0fb60 authored by xiabo
Browse files

mmcv编译不过修改

parent f7e64e20
...@@ -78,7 +78,11 @@ __global__ void correlation_forward_cuda_kernel( ...@@ -78,7 +78,11 @@ __global__ void correlation_forward_cuda_kernel(
} }
// accumulate // accumulate
for (int offset = 16; offset > 0; offset /= 2) for (int offset = 16; offset > 0; offset /= 2)
#ifdef HIP_DIFF
prod_sum += __shfl_down(FULL_MASK, prod_sum, offset);
#else
prod_sum += __shfl_down_sync(FULL_MASK, float(prod_sum), offset); prod_sum += __shfl_down_sync(FULL_MASK, float(prod_sum), offset);
#endif
if (thread == 0) { if (thread == 0) {
output[n][ph][pw][h][w] = prod_sum; output[n][ph][pw][h][w] = prod_sum;
} }
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment