fix typos (#446)

6f28ea30 · Haibin Lin · GitHub · 5412a334 · 6f28ea30 · 6f28ea30
Commit 6f28ea30 (unverified), authored Sep 28, 2020 by Haibin Lin; committed by GitHub on Sep 28, 2020
Hide whitespace changes
Inline Side-by-side

Showing with 4 additions and 4 deletions

deepspeed/runtime/pipe/p2p.py deepspeed/runtime/pipe/p2p.py +1 -1

deepspeed/runtime/zero/stage2.py deepspeed/runtime/zero/stage2.py +3 -3

No files found.
--- a/deepspeed/runtime/pipe/p2p.py
+++ b/deepspeed/runtime/pipe/p2p.py
@@ -14,7 +14,7 @@ def init_process_groups(grid):
    global _groups, _grid
    _grid = grid

-    assert _grid.pipe_parallel_size > 1, "There is no model parallelism"
+    assert _grid.pipe_parallel_size > 1, "There is no pipeline parallelism"

    _groups = [dist.new_group(ranks=group) for group in _grid.p2p_groups]


--- a/deepspeed/runtime/zero/stage2.py
+++ b/deepspeed/runtime/zero/stage2.py
@@ -260,7 +260,7 @@ class FP16_DeepSpeedZeroOptimizer(object):
            for p, q in zip(self.fp16_groups[i], updated_params):
                p.data = q.data

-            #divide the flat weights into near equal paritition equal to the data parallel degree
+            #divide the flat weights into near equal partition equal to the data parallel degree
            #each process will compute on a different part of the partition
            data_parallel_partitions = self.get_data_parallel_partitions(
                self.fp16_groups_flat[i])
@@ -367,10 +367,10 @@ class FP16_DeepSpeedZeroOptimizer(object):
        #stores the offset at which a parameter gradient needs to be inserted in a partition
        self.grad_partition_insertion_offset = {}

-        #the offset in the gradient at which it must be inserted at the beginning of the paritition
+        #the offset in the gradient at which it must be inserted at the beginning of the partition
        self.grad_start_offset = {}

-        #will store the averaged gradients required by this parititon
+        #will store the averaged gradients required by this partition
        self.averaged_gradients = {}

        # store index of first parameter in each partition