update

c5d719cf · Jiezhong Qiu · 79f16297 · c5d719cf
Commit c5d719cf authored Dec 29, 2020 by Jiezhong Qiu
Hide whitespace changes
Inline Side-by-side

Showing with 3 additions and 3 deletions

pytorch/cuda/moe.py pytorch/cuda/moe.py +3 -3

No files found.
--- a/pytorch/cuda/moe.py
+++ b/pytorch/cuda/moe.py
@@ -20,8 +20,8 @@ class MOEFunction(Function):
    @staticmethod
    def backward(ctx, grad_out):
        grad_input, grad_weight = moe_cuda.backward(
-            grad_out.contiguous(), *ctx.saved_variables)
-        return grad_input, grad_weight
+            grad_out.contiguous(), *ctx.saved_tensors)
+        return grad_input, None, grad_weight


 class MOELayer(nn.Module):
@@ -46,7 +46,7 @@ out_feat = 512
 moe = MOELayer(num_expert, in_feat, out_feat).cuda()

 input = torch.rand(batch_size, in_feat).cuda()
-gate = torch.randint(low=0, high=num_expert, size=(batch_size, )).int().cuda()
+gate = torch.randint(low=0, high=num_expert, size=(batch_size, ), requires_grad=False).int().cuda()

 output = moe(input, gate)