Commit 7ba6a038 authored by Thor Johnsen

Add option to skip overflow check in step() method

parent c7b34549
@@ -538,7 +538,7 @@ class DistributedFusedAdam(torch.optim.Optimizer):
         for block_id in range(self._num_blocks):
             self._partial_step_single_shard(block_id, undo=True)
 
-    def step(self, closure=None):
+    def step(self, closure=None, skip_overflow_check=False):
         loss = None
         if closure is not None:
             loss = closure()
@@ -560,8 +560,12 @@ class DistributedFusedAdam(torch.optim.Optimizer):
         # Check for overflow
         # Store state for loss scaler calculation
-        self.strided_check_finite(self._new_params, stride=self._shard_size, start=0, end=self._net_total_param_size)
-        if self.peek_overflow:
+        if skip_overflow_check:
+            has_overflow = False
+        else:
+            self.strided_check_finite(self._new_params, stride=self._shard_size, start=0, end=self._net_total_param_size)
+            has_overflow = self.peek_overflow
+        if has_overflow:
             print("Reverting step")
             self.revert_step()
         else:
...
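For context, a minimal usage sketch of the new parameter follows. The import path, constructor arguments, and single-GPU setup are assumptions for illustration only; DistributedFusedAdam normally requires an initialized distributed process group and its own gradient flattening and hook setup, which this sketch omits.

# Hypothetical sketch, not part of the commit: shows the effect of the new
# skip_overflow_check flag on step(). Import path and setup are assumptions.
import torch
from apex.contrib.optimizers.distributed_fused_adam import DistributedFusedAdam

model = torch.nn.Linear(1024, 1024).cuda()                # placeholder model
optimizer = DistributedFusedAdam(model.parameters(), lr=1e-3)

loss = model(torch.randn(8, 1024, device="cuda")).sum()   # placeholder forward pass
loss.backward()

# Default behavior: step() runs strided_check_finite over the new parameters
# and reverts the step if an overflow (inf/NaN) is detected.
optimizer.step()

# With the option added in this commit, the check is bypassed entirely:
# has_overflow is forced to False, so the step is never reverted. This can be
# useful when the caller (e.g. a loss scaler) has already verified the
# gradients are finite.
optimizer.step(skip_overflow_check=True)

Note that the default behavior is unchanged: callers that do not pass the flag still get the overflow check and the automatic revert.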