[syncBN]

Test update to resolve https://github.com/NVIDIA/apex/issues/134#issue-403525480: use an identical learning rate for both DDP with sync BN and single-process BN. The previous configuration left the impression that sync BN requires adjusting the lr in the script, which is not true.

[syncBN]
Test update to resolve https://github.com/NVIDIA/apex/issues/134#issue-403525480: use an identical learning rate for both DDP with sync BN and single-process BN. The previous configuration left the impression that sync BN requires adjusting the lr in the script, which is not true.
63e47d29 · jiej · c8bc3e62 · 63e47d29
Commit 63e47d29 authored Jan 28, 2019 by jiej
Hide whitespace changes
Inline Side-by-side

Showing with 3 additions and 5 deletions

tests/synced_batchnorm/two_gpu_unit_test.py tests/synced_batchnorm/two_gpu_unit_test.py +3 -5

No files found.
--- a/tests/synced_batchnorm/two_gpu_unit_test.py
+++ b/tests/synced_batchnorm/two_gpu_unit_test.py
@@ -92,6 +92,8 @@ inp_bn = inp_t.clone().requires_grad_()
 grad_bn = grad_output_t.clone().detach()
 out_bn = bn(inp_bn)
 out_bn.backward(grad_bn)
+for param in bn.parameters():
+    param.grad = param.grad / args.world_size
 bn_opt = optim.SGD(bn.parameters(), lr=1.0)

 sbn = apex.parallel.SyncBatchNorm(feature_size).cuda()
@@ -103,7 +105,7 @@ if args.fp16:
 if args.fp64:
    sbn.double()
 sbn = DDP(sbn)
-sbn_opt = optim.SGD(sbn.parameters(), lr=1.0*args.world_size)
+sbn_opt = optim.SGD(sbn.parameters(), lr=1.0)
 inp_sbn = inp_t.clone().requires_grad_()
 grad_sbn = grad_output_t.clone().detach()
 out_sbn = sbn(inp_sbn[start:finish])
@@ -159,11 +161,7 @@ sbn_opt.step()

 if args.local_rank == 0:
    compare("comparing bn vs sbn bias: ", bn.bias, sbn.module.bias, error)
-    compare("comparing bn vs ref bias: ", bn.bias, bias_r.view(-1) - grad_bias_r, error)
-    sbn_result = compare("comparing sbn vs ref bias: ", sbn.module.bias, bias_r.view(-1) - grad_bias_r, error) and sbn_result
    compare("comparing bn vs sbn weight: ", bn.weight, sbn.module.weight, error)
-    compare("comparing bn vs ref weight: ", bn.weight, (weight_r.view(-1) - grad_weight_r), error)
-    sbn_result = compare("comparing sbn vs ref weight: ", sbn.module.weight, (weight_r.view(-1) - grad_weight_r), error) and sbn_result


 if sbn_result: