Unverified Commit 28f7ca1f authored by Zeyao Du's avatar Zeyao Du Committed by GitHub
Browse files

Swap optimizer.step and scheduler.step: call optimizer.step() before scheduler.step()

parent c589862b
...@@ -602,8 +602,8 @@ def main(): ...@@ -602,8 +602,8 @@ def main():
nb_tr_examples += input_ids.size(0) nb_tr_examples += input_ids.size(0)
nb_tr_steps += 1 nb_tr_steps += 1
if (step + 1) % args.gradient_accumulation_steps == 0: if (step + 1) % args.gradient_accumulation_steps == 0:
scheduler.step() # Update learning rate schedule
optimizer.step() optimizer.step()
scheduler.step() # Update learning rate schedule
optimizer.zero_grad() optimizer.zero_grad()
global_step += 1 global_step += 1
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment