Unverified Commit fe6ff4a9 authored by wulu473, committed by GitHub

Add substep callbacks (#12951)


Co-authored-by: Lukas Wutschitz <lukas.wutschitz@microsoft.com>
parent f84226b7
@@ -1334,6 +1334,8 @@ class Trainer:
                     self.control = self.callback_handler.on_step_end(args, self.state, self.control)
 
                     self._maybe_log_save_evaluate(tr_loss, model, trial, epoch, ignore_keys_for_eval)
+                else:
+                    self.control = self.callback_handler.on_substep_end(args, self.state, self.control)
 
                 if self.control.should_epoch_stop or self.control.should_training_stop:
                     break
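For context, the hunk above sits inside Trainer's gradient-accumulation branch: on_step_end fires only on the micro-batch that completes an optimizer step, and the new else branch emits on_substep_end for every intermediate micro-batch. A minimal standalone sketch of that dispatch pattern (illustrative variable names, not the actual Trainer code):

# Illustrative sketch of when each event fires under gradient accumulation.
# Variable names here are hypothetical, not copied from Trainer.
gradient_accumulation_steps = 4

for step in range(10):  # 10 micro-batches
    # ... forward/backward on one micro-batch, gradients accumulate ...
    if (step + 1) % gradient_accumulation_steps == 0:
        # optimizer step completed -> existing on_step_end event
        print(f"micro-batch {step}: on_step_end")
    else:
        # gradients only accumulated -> new on_substep_end event
        print(f"micro-batch {step}: on_substep_end")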
@@ -242,6 +242,12 @@ class TrainerCallback:
         """
         pass
 
+    def on_substep_end(self, args: TrainingArguments, state: TrainerState, control: TrainerControl, **kwargs):
+        """
+        Event called at the end of a substep during gradient accumulation.
+        """
+        pass
+
     def on_step_end(self, args: TrainingArguments, state: TrainerState, control: TrainerControl, **kwargs):
         """
         Event called at the end of a training step. If using gradient accumulation, one training step might take
@@ -355,6 +361,9 @@ class CallbackHandler(TrainerCallback):
         control.should_save = False
         return self.call_event("on_step_begin", args, state, control)
 
+    def on_substep_end(self, args: TrainingArguments, state: TrainerState, control: TrainerControl):
+        return self.call_event("on_substep_end", args, state, control)
+
     def on_step_end(self, args: TrainingArguments, state: TrainerState, control: TrainerControl):
         return self.call_event("on_step_end", args, state, control)
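A hedged usage sketch of the new hook from the user side: the callback class below and its counter are illustrative only, not part of this PR; TrainerCallback itself and the callbacks argument of Trainer are existing Transformers APIs.

from transformers import TrainerCallback

class SubstepCounter(TrainerCallback):
    """Illustrative callback: tracks gradient-accumulation substeps per optimizer step."""

    def __init__(self):
        self.substeps = 0

    def on_substep_end(self, args, state, control, **kwargs):
        # Fires after micro-batches that only accumulate gradients.
        self.substeps += 1

    def on_step_end(self, args, state, control, **kwargs):
        # Fires after the micro-batch that completes the optimizer step.
        self.substeps = 0

Such a callback is registered like any other, e.g. Trainer(model=model, args=training_args, train_dataset=train_dataset, callbacks=[SubstepCounter()]), and gives per-micro-batch bookkeeping a place to run even when no optimizer step occurs.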