"git@developer.sourcefind.cn:chenpangpang/transformers.git" did not exist on "f03c0c1423d4635f3e71a6c24053f01f6f02063c"
Commit bcd4aa8f authored by thomwolf's avatar thomwolf
Browse files

update evaluation example

parent a69ec2c7
...@@ -44,18 +44,18 @@ parser = argparse.ArgumentParser(description='PyTorch Transformer Language Model ...@@ -44,18 +44,18 @@ parser = argparse.ArgumentParser(description='PyTorch Transformer Language Model
parser.add_argument('--model_name', type=str, default='transfo-xl-wt103', parser.add_argument('--model_name', type=str, default='transfo-xl-wt103',
choices=['transfo-xl-wt103'], #, 'lm1b', 'enwik8', 'text8'], choices=['transfo-xl-wt103'], #, 'lm1b', 'enwik8', 'text8'],
help='pretrained model name') help='pretrained model name')
parser.add_argument('--split', type=str, default='all', parser.add_argument('--split', type=str, default='test',
choices=['all', 'valid', 'test'], choices=['all', 'valid', 'test'],
help='which split to evaluate') help='which split to evaluate')
parser.add_argument('--batch_size', type=int, default=10, parser.add_argument('--batch_size', type=int, default=10,
help='batch size') help='batch size')
parser.add_argument('--tgt_len', type=int, default=5, parser.add_argument('--tgt_len', type=int, default=128,
help='number of tokens to predict') help='number of tokens to predict')
parser.add_argument('--ext_len', type=int, default=0, parser.add_argument('--ext_len', type=int, default=0,
help='length of the extended context') help='length of the extended context')
parser.add_argument('--mem_len', type=int, default=0, parser.add_argument('--mem_len', type=int, default=1600,
help='length of the retained previous heads') help='length of the retained previous heads')
parser.add_argument('--clamp_len', type=int, default=-1, parser.add_argument('--clamp_len', type=int, default=1000,
help='max positional embedding index') help='max positional embedding index')
parser.add_argument('--cuda', action='store_true', parser.add_argument('--cuda', action='store_true',
help='use CUDA') help='use CUDA')
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment