Commit 6429fa29 authored by Jiezhong Qiu
Browse files

2 out of 32 experts

parent 1bde1726
......@@ -34,7 +34,7 @@ class PositionalEmbedding(nn.Module):
return pos_emb[:,None,:]
class CustomizedMoEPositionwiseFF(nn.Module):
def __init__(self, d_model, d_inner, dropout, pre_lnorm=False, top_k=2, num_expert=4):
def __init__(self, d_model, d_inner, dropout, pre_lnorm=False, top_k=2, num_expert=32):
super(CustomizedMoEPositionwiseFF, self).__init__()
print("CustomizedMoEPositionwiseFF num_expert=%d top_k=%d" % (num_expert, top_k))
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment