Commit 03b0eeb8 authored by Michael Carilli

Only warn once in LossScaler constructor

parent a153c41a
@@ -31,13 +31,15 @@ class LossScaler(object):
         try:
             import amp_C
             LossScaler.has_fused_kernel = True
-            LossScaler.scale_check_overflow = amp_C.scale_check_overflow
+            LossScaler.scale_check_overflow_cuda = amp_C.scale_check_overflow
             self._overflow_buf = torch.cuda.ByteTensor(1024,)
         except ImportError as err:
-            print("Warning: Amp fused downscale kernel is unavailable, possibly because apex "
-                  "was installed without --cuda_ext. Using Python fallback. ImportError was: ", err)
+            if not LossScaler.warned_no_fused_kernel:
+                print("Warning: Amp fused downscale kernel is unavailable, possibly because apex "
+                      "was installed without --cuda_ext. Using Python fallback. ImportError was: ",
+                      err)
             LossScaler.has_fused_kernel = False
-            LossScaler.scale_check_overflow = scale_check_overflow_python
+            LossScaler.warned_no_fused_kernel = True
 
     def loss_scale(self):
         return self._loss_scale
@@ -49,19 +51,19 @@ class LossScaler(object):
         for p in iter_params(param_groups):
             if p.grad is not None:
                 if LossScaler.has_fused_kernel and p.grad.data.type() == "torch.cuda.FloatTensor":
-                    LossScaler.scale_check_overflow(p.grad.data,
-                                                    1. / scale,
-                                                    self._overflow_buf)
+                    LossScaler.scale_check_overflow_cuda(p.grad.data,
+                                                         1./scale,
+                                                         self._overflow_buf)
                 else:
-                    if p.grad.data.type() != "torch.cuda.FloatTensor"
-                       and not LossScaler.warned_fp16_grad:
+                    if (p.grad.data.type() != "torch.cuda.FloatTensor"
+                            and not LossScaler.warned_fp16_grad):
                         logger = logging.getLogger("apex.amp")
                         logger.warning("Incoming grads are not fp32 (not master grads). "
                                        "Downscaling non-fp32 grads may indicate an error. "
                                        "When using Amp, you don't need to call .half() on your model.")
                         LossScaler.warned_fp16_grad = True
-                    self._has_overflow = LossScaler.scale_check_overflow(p.grad.data,
-                                                                         1. / scale)
+                    self._has_overflow = scale_check_overflow_python(p.grad.data,
+                                                                     1./scale)
                     if self._has_overflow:
                         break
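For context, the pattern this commit settles on is class-level flags so each warning is printed at most once per process, plus explicit dispatch between the fused CUDA kernel (amp_C) and a pure-Python fallback. The sketch below is a simplified illustration of that pattern, not the actual apex source; the body of scale_check_overflow_python is an assumed stand-in abbreviated for clarity.

```python
import torch

def scale_check_overflow_python(grad_data, scale):
    # Assumed, simplified fallback: downscale in place and report inf/nan overflow.
    grad_data.mul_(scale)
    cpu_sum = float(grad_data.float().sum())
    return cpu_sum in (float('inf'), -float('inf')) or cpu_sum != cpu_sum

class LossScaler(object):
    # Class-level flags: shared by all instances, so each warning fires at most
    # once per process even if many LossScaler objects are constructed.
    warned_no_fused_kernel = False
    warned_fp16_grad = False
    has_fused_kernel = False

    def __init__(self):
        try:
            import amp_C
            LossScaler.has_fused_kernel = True
            LossScaler.scale_check_overflow_cuda = amp_C.scale_check_overflow
            self._overflow_buf = torch.cuda.ByteTensor(1024,)
        except ImportError as err:
            if not LossScaler.warned_no_fused_kernel:
                print("Warning: fused kernel unavailable, using Python fallback:", err)
            LossScaler.has_fused_kernel = False
            LossScaler.warned_no_fused_kernel = True
```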