Commit 90c4bccf authored by Rich Ho

fix scatter bug across GPUs

parent 670d70ed
@@ -117,7 +117,7 @@ class MOEScatter(Function):
             )
         else:
             global_input_buf = local_input_buf
-        ctx.moe_args = inp.shape[0], world_size
+        ctx.moe_args = inp.shape[0], pos.shape[0], world_size
         variables = (pos, local_expert_count, global_expert_count)
         ctx.save_for_backward(*variables)
         return global_input_buf
@@ -125,19 +125,19 @@ class MOEScatter(Function):
     @staticmethod
     def backward(ctx, global_grad_in):
         (pos, local_expert_count, global_expert_count) = ctx.saved_tensors
-        (local_batch_size, world_size) = ctx.moe_args
+        (inp_batch_size, buf_batch_size, world_size) = ctx.moe_args
         if world_size > 1:
             (local_grad_in,) = fmoe_cuda.global_gather(
                 global_grad_in,
                 local_expert_count,
                 global_expert_count,
-                local_batch_size,
+                buf_batch_size,
                 world_size,
             )
         else:
             local_grad_in = global_grad_in
-        grad_in = _local_gather(local_grad_in, pos, local_batch_size)
+        grad_in = _local_gather(local_grad_in, pos, inp_batch_size)
         return grad_in, None, None, None, None, None
...
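Why this matters: the forward pass previously saved only inp.shape[0] and world_size, and the backward pass reused that single local_batch_size both as the buffer size for fmoe_cuda.global_gather and as the output size of _local_gather. Those two sizes agree only when every input row occupies exactly one slot in the scatter buffer; when they differ, e.g. with top-k gating scattering each row to k experts so that pos.shape[0] exceeds inp.shape[0], the multi-GPU gather ran with the wrong buffer size. The fix saves both sizes (inp_batch_size from inp.shape[0], buf_batch_size from pos.shape[0]) and uses each where it belongs.

Below is a minimal, self-contained sketch of the local gather step, not the fastmoe source; the name _local_gather_sketch and the top-k example are illustrative, assuming (as the forward scatter suggests) that pos[i] is the input row that buffer row i was copied from.

import torch

def _local_gather_sketch(grad_buf: torch.Tensor, pos: torch.Tensor,
                         out_batch_size: int) -> torch.Tensor:
    # grad_buf: [buf_batch_size, d], one gradient row per scattered slot.
    # pos:      [buf_batch_size], the input row each slot was copied from.
    # out_batch_size must be inp.shape[0], not pos.shape[0], because the
    # result is the gradient w.r.t. the original input.
    grad_in = grad_buf.new_zeros(out_batch_size, grad_buf.shape[-1])
    # Duplicate indices (top-k > 1) must accumulate, hence index_add_.
    grad_in.index_add_(0, pos, grad_buf)
    return grad_in

# Example: 2 input rows with k = 2 gating, so the buffer holds 4 rows.
inp_batch_size, d = 2, 3
pos = torch.tensor([0, 1, 0, 1])          # buf_batch_size == pos.shape[0] == 4
grad_buf = torch.ones(pos.shape[0], d)    # stand-in upstream gradients
grad_in = _local_gather_sketch(grad_buf, pos, inp_batch_size)
print(grad_in.shape)  # torch.Size([2, 3]); each entry 2.0 (k slots summed)

Conversely, the communication buffer handed to global_gather must be sized by buf_batch_size: sizing it by inp_batch_size, as the old code effectively did whenever the two differed, makes it too small to hold one row per scattered slot.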