Commit 0bab56b7 authored by Yoach Lacombe
Browse files

fix name and add min new tokens

parent a0bc9e78
......@@ -126,7 +126,7 @@ def main():
"adam_beta2": training_args.adam_beta2,
"temperature": model_args.temperature,
},
init_kwargs={"wandb": {"name": data_args.wandb_run_name}} if data_args.wandb_run_name else None,
init_kwargs={"wandb": {"name": data_args.wandb_run_name}} if data_args.wandb_run_name else {},
)
# Detect the last checkpoint and possibly continue from it
......@@ -750,6 +750,10 @@ def main():
"do_sample": model_args.do_sample,
"temperature": model_args.temperature,
"max_length": model_args.max_length,
# Because of the delayed pattern mask, generation might stop early due to unexpected behaviour
# on the first tokens of the codebooks that are delayed.
# Setting `min_new_tokens` fixes the issue.
"min_new_tokens": num_codebooks + 1,
}
# Define gradient update step fn
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment