Commit 031a4157 authored by wxj

Update transformer.py

parent a45f4c2a
Pipeline #2227 passed with stage
@@ -165,7 +165,7 @@ class ParallelMLP(MegatronModule):
             is_expert=is_expert,
         )
-    @torch.compile(mode="max-autotune-no-cudagraphs")
+    # @torch.compile(mode="max-autotune-no-cudagraphs")
     def forward(self, hidden_states):
         # [s, b, 4hp]
@@ -1213,7 +1213,7 @@ class ParallelTransformerLayer(MegatronModule):
         return retriever_output, norm_input, norm_output
-    @torch.compile(mode="max-autotune-no-cudagraphs")
+    # @torch.compile(mode="max-autotune-no-cudagraphs")
     def forward(self, hidden_states, attention_mask,
                 encoder_output=None, enc_dec_attn_mask=None,
                 retriever_input=None,
......
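Both hunks make the same change: the @torch.compile(mode="max-autotune-no-cudagraphs") decorator is commented out, so ParallelMLP.forward and ParallelTransformerLayer.forward run eagerly again. A minimal sketch of an alternative, assuming a hypothetical USE_TORCH_COMPILE environment flag (not part of this repository), that toggles compilation without editing the source each time:

import os

import torch


# Hypothetical flag, not part of this repository: set USE_TORCH_COMPILE=1
# to re-enable compilation instead of uncommenting the decorator by hand.
_USE_TORCH_COMPILE = os.environ.get("USE_TORCH_COMPILE", "0") == "1"


def maybe_compile(fn):
    # torch.compile (PyTorch >= 2.0) returns an optimized wrapper around fn;
    # when the flag is off, fn is returned unchanged, matching the
    # commented-out decorator in this commit.
    if _USE_TORCH_COMPILE:
        return torch.compile(fn, mode="max-autotune-no-cudagraphs")
    return fn


class ParallelMLP(torch.nn.Module):  # illustrative stand-in, not the real class
    @maybe_compile
    def forward(self, hidden_states):
        return hidden_states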