Merge pull request #1056 from Morizeyao/master

Swap of optimizer.step and scheduler.step for lm finetuning examples

Merge pull request #1056 from Morizeyao/master
Swap of optimizer.step and scheduler.step for lm finetuning examples
933841d9 · Thomas Wolf · GitHub · b0b9b809 · d86b49ac · 933841d9
Unverified commit 933841d9, authored Aug 20, 2019 by Thomas Wolf; committed by GitHub on Aug 20, 2019.
Showing 2 changed files with 2 additions and 2 deletions.

examples/lm_finetuning/finetune_on_pregenerated.py (+1 -1)

examples/lm_finetuning/simple_lm_finetuning.py (+1 -1)

No files found.
--- a/examples/lm_finetuning/finetune_on_pregenerated.py
+++ b/examples/lm_finetuning/finetune_on_pregenerated.py
@@ -314,8 +314,8 @@ def main():
                mean_loss = tr_loss * args.gradient_accumulation_steps / nb_tr_steps
                pbar.set_postfix_str(f"Loss: {mean_loss:.5f}")
                if (step + 1) % args.gradient_accumulation_steps == 0:
-                    scheduler.step()  # Update learning rate schedule
                    optimizer.step()
+                    scheduler.step()  # Update learning rate schedule
                    optimizer.zero_grad()
                    global_step += 1

--- a/examples/lm_finetuning/simple_lm_finetuning.py
+++ b/examples/lm_finetuning/simple_lm_finetuning.py
@@ -602,8 +602,8 @@ def main():
                nb_tr_examples += input_ids.size(0)
                nb_tr_steps += 1
                if (step + 1) % args.gradient_accumulation_steps == 0:
-                    scheduler.step()  # Update learning rate schedule
                    optimizer.step()
+                    scheduler.step()  # Update learning rate schedule
                    optimizer.zero_grad()
                    global_step += 1