Commit 72bce160 authored by Michael Carilli

allreduce_different_streams is now hidden

parent 3b4a0a23
@@ -200,10 +200,10 @@ class DistributedDataParallel(Module):
         if self.allreduce_communicators:
             assert len(allreduce_communicators[0]) == num_allreduce_streams
             assert len(allreduce_communicators[0]) == len(allreduce_communicators[1])
-            assert allreduce_different_streams
+            assert self.allreduce_different_streams
 
         if self.allreduce_different_streams and delay_allreduce:
-            raise ValueError("allreduce_different_streams may only be used if delay_allreduce=False.")
+            raise ValueError("self.allreduce_different_streams may only be used if delay_allreduce=False.")
 
         if shared_param is not None:
             raise ValueError("shared_param is no longer supported as an option. It was misleadingly named from the start. It turns out overlapping communication with computation should work fine with shared parameters. If you still wish to delay communication to the end of the backward pass, use delay_allreduce=True|False instead.")
@@ -259,8 +259,8 @@ class DistributedDataParallel(Module):
     def __setstate__(self, state):
         super(DistributedDataParallel, self).__setstate__(state)
 
-        if allreduce_different_streams and delay_allreduce:
-            raise ValueError("allreduce_different_streams may only be used if delay_allreduce=False.")
+        if self.allreduce_different_streams and delay_allreduce:
+            raise ValueError("self.allreduce_different_streams may only be used if delay_allreduce=False.")
 
         if self.delay_allreduce:
             self.needs_refresh = True
@@ -35,8 +35,9 @@ class Model(Module):
 model = Model()
 # model = DDP(model, message_size=1, gradient_predivide_factor=8.0)
-model = DDP(model, delay_allreduce=True)
+# model = DDP(model, delay_allreduce=True)
 # model = DDP(model, message_size=1, allreduce_trigger_params=[model.b])
+model = DDP(model, message_size=1, allreduce_trigger_params=[model.b], num_allreduce_streams=3)
 
 x = torch.cuda.FloatTensor(4096*4096)
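
The updated test constructs apex's DistributedDataParallel with num_allreduce_streams rather than passing allreduce_different_streams directly, which is the point of this commit: the multi-stream flag becomes an internal detail. Below is a minimal, self-contained sketch of that usage pattern (not the repo's actual test file). It assumes apex is installed and the script is launched with one process per GPU, e.g. via torch.distributed.launch, so that init_process_group with init_method="env://" can read RANK and WORLD_SIZE from the environment.

    # Sketch only: exercises apex DDP with multiple allreduce streams,
    # mirroring the constructor call in the diff above.
    import torch
    import torch.distributed as dist
    from torch.nn import Module, Parameter
    from apex.parallel import DistributedDataParallel as DDP

    dist.init_process_group(backend="nccl", init_method="env://")
    torch.cuda.set_device(dist.get_rank() % torch.cuda.device_count())

    class Model(Module):
        # Two large parameters so gradients arrive in more than one allreduce bucket.
        def __init__(self):
            super(Model, self).__init__()
            self.a = Parameter(torch.cuda.FloatTensor(4096 * 4096).fill_(1.0))
            self.b = Parameter(torch.cuda.FloatTensor(4096 * 4096).fill_(2.0))

        def forward(self, input):
            return (input * self.a) * self.b

    model = Model()
    # allreduce_different_streams is no longer passed by the caller; asking for
    # num_allreduce_streams > 1 enables the multi-stream path internally.
    model = DDP(model, message_size=1, allreduce_trigger_params=[model.b],
                num_allreduce_streams=3)

    x = torch.cuda.FloatTensor(4096 * 4096).fill_(1.0)
    model(x).sum().backward()  # backward hooks launch the allreduces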