Commit 113c6362 authored by Jared Casper

Add temporary assert to finetuning until it can be fixed.

parent 42c1cf42
...
@@ -19,7 +19,7 @@ from functools import partial
 import torch
-from megatron import get_args
+from megatron import get_args, get_num_microbatches
 from megatron import print_rank_0
 from megatron import get_timers
 from megatron import mpu
...
@@ -154,6 +154,8 @@ def _train(model, optimizer, lr_scheduler, forward_step,
     args = get_args()
     timers = get_timers()
+    assert get_num_microbatches() == 1, \
+        "finetuning with gradient accumulation doesn't currently work"
     # Turn on training mode which enables dropout.
     for m in model:
         m.train()
...
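For context, a minimal sketch of what the new assert guards against, assuming Megatron's usual batch-size bookkeeping where the microbatch count (i.e. the number of gradient-accumulation steps) is derived from the global batch size, micro batch size, and data-parallel size. The helper below is illustrative only, not the actual get_num_microbatches implementation:

# Illustrative only: the microbatch count is roughly the number of
# gradient-accumulation steps per optimizer step.
def num_microbatches(global_batch_size, micro_batch_size, data_parallel_size):
    return global_batch_size // (micro_batch_size * data_parallel_size)

# Passes the new assert: one microbatch, no gradient accumulation.
assert num_microbatches(global_batch_size=16, micro_batch_size=2, data_parallel_size=8) == 1

# Would trip the new assert: 4 accumulation steps per optimizer step.
assert num_microbatches(global_batch_size=64, micro_batch_size=2, data_parallel_size=8) == 4

In other words, until gradient accumulation is supported in the finetuning path, the batch-size arguments must be chosen so that only a single microbatch is used.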