Commit f1295380 authored by Eddie Yan
Browse files

Update layer_norm_cuda_kernel.cu

parent 1ec6b0e9
......@@ -645,6 +645,8 @@ void cuComputeGradInput(
k_grad_input[l] = static_cast<T>(f_grad_input);
}
}
// prevent race where buf is written again before reads are done
__syncthreads();
}
}
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment