"git@developer.sourcefind.cn:OpenDAS/torchaudio.git" did not exist on "9912e54df0522915f0f15dd637636327301b9d75"
Commit dfd9b5d5 authored by Rick Ho
Browse files

fix smart schedule shadow sync bug

parent 0a6becae
......@@ -338,7 +338,7 @@ void fmoe_cuda_fused_backward_impl(
collect_fn(si, i / num_expert, 0);
if (i / num_expert == rank) {
cudaEventCreate(evt_reduce + i % num_expert);
cudaEventRecord(evt_reduce[i % num_expert], smgr->stream(num_expert));
cudaEventRecord(evt_reduce[i % num_expert], smgr->stream(0));
}
++si;
}
......@@ -367,7 +367,6 @@ void fmoe_cuda_fused_backward_impl(
for (long i = 0, si = 0; i < world_size * num_expert; ++i) {
if (stored_models[i]) {
if (i / num_expert == rank) {
FMOE_SWE(smgr->stream(0), evt_reduce[i % num_expert]);
FMOE_SWE(smgr->torchStream(), evt_reduce[i % num_expert]);
set_grad_fn(si, i % num_expert);
}
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment