Commit c380000e authored by Mostofa Patwary
Browse files

fixed exit interval

parent 097fa65b
...@@ -884,9 +884,9 @@ def train(forward_step_func, model, optimizer, lr_scheduler, ...@@ -884,9 +884,9 @@ def train(forward_step_func, model, optimizer, lr_scheduler,
# Exiting based on iterations # Exiting based on iterations
if args.exit_interval and iteration % args.exit_interval == 0: if args.exit_interval and iteration % args.exit_interval == 0:
#if not saved_checkpoint: if not saved_checkpoint:
# save_checkpoint_and_time(iteration, model, optimizer, save_checkpoint_and_time(iteration, model, optimizer,
# lr_scheduler) lr_scheduler)
torch.distributed.barrier() torch.distributed.barrier()
print_datetime('exiting program at iteration {}'.format(iteration)) print_datetime('exiting program at iteration {}'.format(iteration))
sys.exit() sys.exit()
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment