only support pp=1

7b585440 · mshoeybi · e923ec52 · 7b585440 · 7b585440
Commit 7b585440 authored Aug 19, 2021 by mshoeybi
Hide whitespace changes
Inline Side-by-side

Showing with 4 additions and 2 deletions

megatron/arguments.py megatron/arguments.py +1 -0

megatron/mpu/random.py megatron/mpu/random.py +3 -2

No files found.
--- a/megatron/arguments.py
+++ b/megatron/arguments.py
@@ -236,6 +236,7 @@ def parse_args(extra_args_provider=None, defaults={},
        assert args.checkpoint_activations, \
            'for distribute-checkpointed-activations to work you '\
            'need to enable checkpoint-activations'
+        assert args.pipeline_model_parallel_size == 1

    _print_args(args)
    return args

--- a/megatron/mpu/random.py
+++ b/megatron/mpu/random.py
@@ -289,7 +289,8 @@ class CheckpointFunction(torch.autograd.Function):
        return (None, None) + grads


-def checkpoint(function, *args):
+def checkpoint(function, distribute_checkpointed_activations, *args):
    """Checkpoint a model or part of the model.
    This has been directly copied from torch.utils.checkpoint."""
-    return CheckpointFunction.apply(function, *args)
+    return CheckpointFunction.apply(function,
+                                    distribute_checkpointed_activations, *args)