Commit ed8fad73 authored by Mathieu Prouveur

Update example files so that tr_loss is not affected by args.gradient_accumulation_steps

parent c36cca07
@@ -845,7 +845,7 @@ def main():
             else:
                 loss.backward()
-            tr_loss += loss.item()
+            tr_loss += loss.item() * args.gradient_accumulation_steps
             nb_tr_examples += input_ids.size(0)
             nb_tr_steps += 1
             if (step + 1) % args.gradient_accumulation_steps == 0:
@@ -452,7 +452,7 @@ def main():
                 loss = loss * args.loss_scale
             if args.gradient_accumulation_steps > 1:
                 loss = loss / args.gradient_accumulation_steps
-            tr_loss += loss.item()
+            tr_loss += loss.item() * args.gradient_accumulation_steps
             nb_tr_examples += input_ids.size(0)
             nb_tr_steps += 1
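For context, here is a minimal sketch of the pattern this commit corrects, assuming a standard PyTorch training loop with gradient accumulation. The model, optimizer, and data below are hypothetical stand-ins for the example scripts. Because the loss is divided by gradient_accumulation_steps before backward() (so accumulated gradients average over the window), the raw loss.item() is scaled down by the same factor; multiplying it back restores the unscaled per-batch loss for reporting.

```python
# Minimal sketch of gradient accumulation with corrected loss logging.
# The model, optimizer, and dataloader are hypothetical stand-ins.
import torch
import torch.nn as nn

model = nn.Linear(10, 2)
optimizer = torch.optim.SGD(model.parameters(), lr=0.01)
loss_fn = nn.CrossEntropyLoss()
gradient_accumulation_steps = 4

tr_loss, nb_tr_steps = 0.0, 0
dataloader = [(torch.randn(8, 10), torch.randint(0, 2, (8,)))
              for _ in range(8)]

for step, (input_ids, labels) in enumerate(dataloader):
    loss = loss_fn(model(input_ids), labels)
    if gradient_accumulation_steps > 1:
        # Scale the loss so the gradients accumulated over the window
        # average rather than sum.
        loss = loss / gradient_accumulation_steps
    loss.backward()
    # Multiply back so the logged value reflects the unscaled batch loss;
    # without this, tr_loss shrinks as gradient_accumulation_steps grows.
    tr_loss += loss.item() * gradient_accumulation_steps
    nb_tr_steps += 1
    if (step + 1) % gradient_accumulation_steps == 0:
        optimizer.step()
        optimizer.zero_grad()

print(f"mean training loss: {tr_loss / nb_tr_steps:.4f}")
```

The rescaling only affects what is logged; the gradient computation is unchanged, since backward() still sees the divided loss.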