Commit 09379ad8 authored by alexeib, committed by Myle Ott
Browse files

add big en_fr transformer architecture

parent e774fda7
...@@ -432,6 +432,11 @@ def transformer_vaswani_wmt_en_de_big(args): ...@@ -432,6 +432,11 @@ def transformer_vaswani_wmt_en_de_big(args):
args.dropout = getattr(args, 'dropout', 0.3) args.dropout = getattr(args, 'dropout', 0.3)
base_architecture(args) base_architecture(args)
@register_model_architecture('transformer', 'transformer_vaswani_wmt_en_fr_big')
def transformer_vaswani_wmt_en_fr_big(args):
    """Apply the big Vaswani-style WMT En-Fr transformer preset to ``args``.

    Defaults ``args.dropout`` to 0.1 when the caller has not already set it,
    then applies the ``transformer_vaswani_wmt_en_de_big`` preset to ``args``.
    """
    # The dropout default has to be in place before delegating: the En-De
    # preset only falls back to its own dropout default (0.3) when the
    # attribute is still missing, so setting it here makes 0.1 win.
    en_fr_dropout = 0.1
    args.dropout = getattr(args, 'dropout', en_fr_dropout)
    transformer_vaswani_wmt_en_de_big(args)
@register_model_architecture('transformer', 'transformer_wmt_en_de_big') @register_model_architecture('transformer', 'transformer_wmt_en_de_big')
def transformer_wmt_en_de_big(args): def transformer_wmt_en_de_big(args):
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment