Commit a5289067 authored by jjsjann123, committed by mcarilli

[syncbn update] (#287)

Update the input size check to fix GitHub issue #262.

Update the SyncBatchNorm count check so that a size-1 input with cross-GPU
synchronization runs fine.
parent ffbb52ba
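For context, a sketch of the rationale (not apex's CUDA implementation): batch norm needs more than one value per channel to estimate variance, since the unbiased correction count/(count-1) divides by zero at count == 1. Under cross-GPU synchronization, however, the effective count is aggregated over the process group, so one value per channel per GPU is legitimate whenever world_size > 1. The `combine_stats` helper below is hypothetical, a stand-in for the `syncbn.welford_parallel` reduction, and assumes equal counts on every GPU:

```python
import torch

def combine_stats(means, biased_vars, count_per_gpu):
    # Merge per-GPU (mean, biased variance) statistics, as if the tensors
    # had been gathered with torch.distributed.all_gather. Hypothetical
    # stand-in for syncbn.welford_parallel; assumes equal per-GPU counts.
    world_size = means.size(0)
    total_count = count_per_gpu * world_size        # aggregated sample count
    mean = means.mean(0)
    # E[x^2] - E[x]^2 over the combined population
    var_biased = (biased_vars + means.pow(2)).mean(0) - mean.pow(2)
    return mean, var_biased, total_count

# One value per channel on each of four "GPUs": the local biased variance
# is 0 and the local correction count/(count-1) would divide by zero.
per_gpu_means = torch.randn(4, 8)                   # world_size=4, 8 channels
mean, var_biased, total = combine_stats(per_gpu_means, torch.zeros(4, 8), 1)

# After aggregation the count is world_size * 1 = 4 > 1, so the unbiased
# variance is well defined and training can proceed.
var = var_biased * total / (total - 1)
```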
```diff
@@ -26,9 +26,6 @@ class SyncBatchnormFunction(Function):
         count = int(input.numel()/input.size(1))
         mean, var_biased = syncbn.welford_mean_var(input)
-        if count == 1:
-            raise ValueError('Expected more than 1 value per channel when training, got input size{}'.format(input.size()))
         if torch.distributed.is_initialized():
             if not process_group:
                 process_group = torch.distributed.group.WORLD
@@ -45,6 +42,9 @@ class SyncBatchnormFunction(Function):
             inv_std = 1.0 / torch.sqrt(var_biased + eps)
             var = var_biased * (count) / (count-1)
+        if count == 1 and world_size < 2:
+            raise ValueError('Expected more than 1 value per channel when training, got input size{}'.format(input.size()))
         r_m_inc = mean if running_mean.dtype != torch.float16 else mean.half()
         r_v_inc = var if running_variance.dtype != torch.float16 else var.half()
         running_mean.data = running_mean.data * (1-momentum) + momentum*r_m_inc
```
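In terms of user-visible behavior, a sketch of what this change enables; it assumes a process group launched with one process per GPU (e.g. via `python -m torch.distributed.launch`) and uses `apex.parallel.SyncBatchNorm`:

```python
# Sketch of the behavior after this commit; run under a distributed
# launcher with one process per GPU, not as a standalone script.
import torch
from apex.parallel import SyncBatchNorm

bn = SyncBatchNorm(8).cuda()
x = torch.randn(1, 8, 1, 1).cuda()  # a single value per channel on this GPU

# Before: raised ValueError even with multiple GPUs, because the check
# ran before the cross-GPU reduction.
# After: succeeds whenever world_size >= 2, since the per-channel count
# is aggregated across the group; a single process still raises, as the
# variance of one sample is undefined.
out = bn(x)
```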