help="A path to a directory containing vocabulary files required by the tokenizer or the model id of a predefined tokenizer hosted inside a model repo on the Hugging Face Hub.",
)
group.add_argument(
"--eos-token",
type=str,
default=None,
help="EOS token to add after each document. Default: None",