Commit 945004e7 authored by Rick Ho

fix shadow

parent 226e0779
@@ -44,10 +44,9 @@ void _reduce_grad(
         long expert_size) {
     auto smgr = getCudaStreamManager(t.device().index());
-    auto torch_stream = c10::cuda::getCurrentCUDAStream().stream();
     cudaEvent_t evt_stash;
     cudaEventCreate(&evt_stash);
-    cudaEventRecord(evt_stash, torch_stream);
+    cudaEventRecord(evt_stash, smgr->torchStream());
     FMOE_SWE(smgr->stream(0), evt_stash);
     cudaEventDestroy(evt_stash);
...
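The hunk above records the stash event on the stream reported by the stream manager (smgr->torchStream()) rather than querying c10::cuda::getCurrentCUDAStream() locally, and then FMOE_SWE makes fastmoe's stream 0 wait on that event before reducing the gradient. A minimal Python sketch of the same record-then-wait pattern, assuming FMOE_SWE wraps cudaStreamWaitEvent and that torchStream()/stream(0) correspond to PyTorch's current stream and a separate worker stream (names below are illustrative, not fastmoe's API):

    import torch

    # Stand-ins for smgr->torchStream() and smgr->stream(0).
    torch_stream = torch.cuda.current_stream()
    worker_stream = torch.cuda.Stream()

    x = torch.randn(1024, 1024, device="cuda")
    y = x @ x  # work queued on the torch stream

    # Record an event on the torch stream, then make the worker stream wait
    # on it, mirroring cudaEventRecord(evt_stash, smgr->torchStream()) followed
    # by FMOE_SWE(smgr->stream(0), evt_stash).
    evt = torch.cuda.Event()
    evt.record(torch_stream)
    worker_stream.wait_event(evt)

    with torch.cuda.stream(worker_stream):
        z = y.sum()  # safe: this runs only after y is produced on the torch stream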
@@ -37,7 +37,7 @@ class MoEForward(Function):
         try:
             # To skip torch autograd's version check.
             with torch.autograd.graph.saved_tensors_hooks(nothing, nothing):
-                y0 = expert_fn(x, torch.tensor([x.shape[0]], dtype=torch.int64))
+                y0 = expert_fn(x, torch.tensor([x.shape[0]], dtype=torch.int64), expert_idx)
         except Exception as e:
             # Ignore the error and fall back for compatibility to older
             # versions of PyTorch
...
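This hunk passes the expert index through to expert_fn when the shadowed expert's forward is replayed, so an expert_fn that dispatches on that index runs the intended expert instead of a default one. A minimal sketch of a compatible expert_fn, under assumed conventions (the experts list and the dispatch logic are hypothetical, not fastmoe's actual implementation):

    import torch

    def make_expert_fn(experts):
        # Hypothetical: `experts` is a list of per-expert modules.
        def expert_fn(x, fwd_expert_count, expert_idx=None):
            # fwd_expert_count[i] tokens are routed to expert i; the shadow
            # call above sends all x.shape[0] tokens to one expert.
            if expert_idx is not None:
                return experts[expert_idx](x)
            # Fallback matching the older two-argument call handled by the
            # except branch in the original code.
            outputs, base = [], 0
            for i, count in enumerate(fwd_expert_count.tolist()):
                outputs.append(experts[i](x[base:base + count]))
                base += count
            return torch.cat(outputs, dim=0)
        return expert_fn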