Commit a43caff7 authored by Jiezhong Qiu
Browse files

update

parent 4f7a182b
...@@ -98,7 +98,7 @@ class HierarchicalMoEPositionwiseFF(nn.Module): ...@@ -98,7 +98,7 @@ class HierarchicalMoEPositionwiseFF(nn.Module):
self.d_inner = d_inner self.d_inner = d_inner
self.dropout = dropout self.dropout = dropout
self.block_net = nn.Linear(n_block, d_inner) self.block_net = nn.Linear(d_model, n_block)
self.W1 = nn.Parameter(torch.Tensor(n_block, d_block, d_model)) self.W1 = nn.Parameter(torch.Tensor(n_block, d_block, d_model))
self.b1 = nn.Parameter(torch.Tensor(n_block, d_block)) self.b1 = nn.Parameter(torch.Tensor(n_block, d_block))
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment