Unverified Commit 92c1e500 authored by Tim Moon, committed by GitHub

[PyTorch] Fix incorrect variable name in LayerNormMLP backward (#548)



Fix incorrect variable name in LayerNormMLP backward
Signed-off-by: Tim Moon <tmoon@nvidia.com>
parent 4f1d70fb
@@ -914,7 +914,7 @@ class _LayerNormMLP(torch.autograd.Function):
            # Handle custom DDP from mcore.
            if ctx.fuse_wgrad_accumulation and hasattr(fc1_weight, 'grad_added_to_main_grad'):
                fc1_weight.grad_added_to_main_grad = True
-               if getattr(weight, 'zero_out_wgrad', False):
+               if getattr(fc1_weight, 'zero_out_wgrad', False):
                    fc1_wgrad = torch.zeros(fc1_weight.main_grad.shape,
                                            dtype=fc1_weight.dtype,
                                            device=torch.cuda.current_device(),
@@ -935,7 +935,7 @@ class _LayerNormMLP(torch.autograd.Function):
            # Handle custom DDP from mcore.
            if ctx.fuse_wgrad_accumulation and hasattr(fc2_weight, 'grad_added_to_main_grad'):
                fc2_weight.grad_added_to_main_grad = True
-               if getattr(weight, 'zero_out_wgrad', False):
+               if getattr(fc2_weight, 'zero_out_wgrad', False):
                    fc2_wgrad = torch.zeros(fc2_weight.main_grad.shape,
                                            dtype=fc2_weight.dtype,
                                            device=torch.cuda.current_device(),
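
For readers unfamiliar with the pattern being fixed: when wgrad accumulation is fused into a Megatron-core-style main_grad buffer, the real gradient accumulates into weight.main_grad and the tensor returned to autograd is only a placeholder; the zero_out_wgrad attribute (attached externally, e.g. by mcore's DDP wrapper) decides whether that placeholder is zero-filled or left uninitialized. Before this commit the attribute was read from a variable named weight (apparently carried over from the single-GEMM code path), so the check did not apply to fc1_weight or fc2_weight. Below is a minimal sketch of the corrected logic, not the library's actual code; the helper name dummy_wgrad is hypothetical, and it assumes main_grad and zero_out_wgrad have been attached to the parameter.

import torch

def dummy_wgrad(weight: torch.nn.Parameter) -> torch.Tensor:
    # Hypothetical helper mirroring the corrected check. Assumes the caller
    # (e.g. an mcore-style DDP wrapper) attached `main_grad` and, optionally,
    # `zero_out_wgrad` to the parameter; the real gradient lives in main_grad.
    if getattr(weight, 'zero_out_wgrad', False):
        # Zero-filled placeholder, safe if downstream code ever reads it.
        return torch.zeros(weight.main_grad.shape,
                           dtype=weight.dtype,
                           device=weight.device,
                           requires_grad=False)
    # Uninitialized placeholder, cheaper when the values are never read.
    return torch.empty(weight.main_grad.shape,
                       dtype=weight.dtype,
                       device=weight.device,
                       requires_grad=False)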