Commit f1295380 authored by Eddie Yan
Browse files

Update layer_norm_cuda_kernel.cu

parent 1ec6b0e9
...@@ -645,6 +645,8 @@ void cuComputeGradInput( ...@@ -645,6 +645,8 @@ void cuComputeGradInput(
k_grad_input[l] = static_cast<T>(f_grad_input); k_grad_input[l] = static_cast<T>(f_grad_input);
} }
} }
// prevent race where buf is written again before reads are done
__syncthreads();
} }
} }
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment