Fix expert number: size the gate output as num_expert * world_size

bc8e8181 · Rick Ho · 761b4ffc · bc8e8181
Commit bc8e8181 authored Jan 27, 2021 by Rick Ho
Hide whitespace changes
Inline Side-by-side

Showing 1 changed file with 1 addition and 1 deletion

fmoe/moe.py fmoe/moe.py +1 -1

No files found.
--- a/fmoe/moe.py
+++ b/fmoe/moe.py
@@ -43,7 +43,7 @@ class FFFN(nn.Module):
                world_size=world_size)
        self.h4toh = FMoE(num_expert, d_hidden, d_model, 
                world_size=world_size)
-        self.gate = nn.Linear(d_model, num_expert)
+        self.gate = nn.Linear(d_model, num_expert * world_size)
        self.layer_norm = nn.LayerNorm(d_model)
        self.bias = torch.nn.parameter.Parameter(torch.zeros(d_model,
                dtype=torch.float32))