Commit 3be6ac10 authored by Jiezhong Qiu
Browse files

update

parent 6212aa28
...@@ -133,7 +133,6 @@ def test_dp(): ...@@ -133,7 +133,6 @@ def test_dp():
moe = MOELayer(num_expert, in_feat, out_feat).cuda() moe = MOELayer(num_expert, in_feat, out_feat).cuda()
moe_dp = torch.nn.DataParallel(moe, device_ids=[0,1,2]) moe_dp = torch.nn.DataParallel(moe, device_ids=[0,1,2])
for i in range(5): for i in range(5):
print(i, "forward")
output = moe_dp(inp, gate) output = moe_dp(inp, gate)
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment