"src/git@developer.sourcefind.cn:renzhc/diffusers_dcu.git" did not exist on "64b3e0f5390728f62887be7820a5e2724d0fb419"
Unverified commit 7d05704c, authored by mcarilli and committed by GitHub
Browse files

Merge pull request #126 from NVIDIA/nhwc_sbn_patch_Pr

patching grid reduction to be volta-safe
parents 438f6f9f 38bada23
...@@ -508,6 +508,7 @@ welford_kernel_c_last( ...@@ -508,6 +508,7 @@ welford_kernel_c_last(
} }
__threadfence(); __threadfence();
__syncthreads(); // ensuring writes to staging_ is visible to all blocks
__shared__ bool is_last_block_done; __shared__ bool is_last_block_done;
// mark block done // mark block done
...@@ -724,6 +725,7 @@ __global__ void reduce_bn_c_last_kernel( ...@@ -724,6 +725,7 @@ __global__ void reduce_bn_c_last_kernel(
} }
__threadfence(); __threadfence();
__syncthreads(); // ensuring writes to staging_ is visible to all blocks
__shared__ bool is_last_block_done; __shared__ bool is_last_block_done;
// mark block done // mark block done
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment