Commit 82945c1a authored by mohammad

fixed assert issue in clip grads for None grads

parent 571f10a0
@@ -53,14 +53,14 @@ def clip_grad_norm_fp32(parameters, max_norm, norm_type=2):
     grads = []
     grads_for_norm = []
     for param in parameters:
-        # Make sure the grads are in fp32
-        assert param.grad.type() == 'torch.cuda.FloatTensor'
         grad_not_none = param.grad is not None
         is_not_shared = not hasattr(param, 'shared') or not param.shared
         is_not_tp_duplicate = param.tensor_model_parallel or \
             (mpu.get_tensor_model_parallel_rank() == 0)
         grad = param.grad.detach()
         if grad_not_none:
+            # Make sure the grads are in fp32
+            assert param.grad.type() == 'torch.cuda.FloatTensor'
             grads.append(grad)
         if grad_not_none and is_not_shared and is_not_tp_duplicate:
             grads_for_norm.append(grad)
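Why the assert had to move, as a minimal sketch (a hypothetical reproduction, not code from this repo): a parameter that has not yet received a backward pass has param.grad set to None, so the old unconditional param.grad.type() call raised an AttributeError before the grad_not_none guard could skip the parameter. The commit defers the fp32 check until after the None test. CUDA is not needed to see the failure, so the sketch uses a CPU tensor.

import torch

# A freshly created parameter has no gradient yet: param.grad is None.
param = torch.nn.Parameter(torch.zeros(4))
assert param.grad is None

# Old code path: the unconditional type check dereferences a None grad.
try:
    assert param.grad.type() == 'torch.cuda.FloatTensor'
except AttributeError as err:
    print('old assert crashes:', err)  # 'NoneType' object has no attribute 'type'

# New code path: the fp32 check runs only when a grad actually exists.
grad_not_none = param.grad is not None
if grad_not_none:
    assert param.grad.type() == 'torch.cuda.FloatTensor'

With gradients present but in the wrong dtype the assert still fires as intended; the guard only prevents the spurious crash on parameters that never received a gradient.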