Unverified commit 2205cff2, authored by eqy, committed by GitHub
Browse files

check in (#1210)

parent fa8bd7e6
......@@ -49,10 +49,6 @@ def _forward_backward_pipelining_with_interleaving(
"""
if not isinstance(model, list):
raise RuntimeError("`model` must be a list of `nn.Module`'s'")
# TODO (mkozuki): Sanity check the following condition.
if len(batch) != len(model):
msg = f"`batch` and `model` must have the same number of elements. Actual {len(batch)} and {len(model)}"
raise RuntimeError(msg)
num_model_chunks = len(model)
input_tensors = [[] for _ in range(num_model_chunks)]
......@@ -122,7 +118,7 @@ def _forward_backward_pipelining_with_interleaving(
input_tensor = input_tensors[model_chunk_id][-1]
output_tensor = forward_step(
forward_step_func,
get_kth_microbatch(batch[model_chunk_id], curr_iters[model_chunk_id]),
get_kth_microbatch(batch, curr_iters[model_chunk_id]),
model[model_chunk_id],
input_tensor,
losses_reduced,
......
......@@ -125,10 +125,7 @@ def forward_backward_func_template(
torch.optim.Adam(_param_groups)
tensor_shape = [batch_size // parallel_state.get_data_parallel_world_size(), hidden_size]
if virtual_pipeline_model_parallel_size is None:
batch = (torch.randn(tensor_shape).cuda(),)
else:
batch = [(torch.randn(tensor_shape).cuda(),) for _ in range(virtual_pipeline_model_parallel_size)]
batch = (torch.randn(tensor_shape).cuda(),)
tensor_shape[0] = micro_batch_size
update_num_microbatches(0)
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment