Update transformer.py: disable torch.compile for the whole model (关闭整个模型的torch.compile)

c5369391 · wxj · 473449d8 · c5369391
Commit c5369391 authored Jan 16, 2025 by wxj
Hide whitespace changes
Inline Side-by-side

Showing with 2 additions and 2 deletions

megatron/legacy/model/transformer.py megatron/legacy/model/transformer.py +2 -2

No files found.
--- a/megatron/legacy/model/transformer.py
+++ b/megatron/legacy/model/transformer.py
@@ -165,7 +165,7 @@ class ParallelMLP(MegatronModule):
            is_expert=is_expert,
        )
-    @torch.compile(mode="max-autotune-no-cudagraphs")
+    # @torch.compile(mode="max-autotune-no-cudagraphs")
    def forward(self, hidden_states):
        # [s, b, 4hp]
@@ -1213,7 +1213,7 @@ class ParallelTransformerLayer(MegatronModule):
        return retriever_output, norm_input, norm_output
-    @torch.compile(mode="max-autotune-no-cudagraphs")
+    # @torch.compile(mode="max-autotune-no-cudagraphs")
    def forward(self, hidden_states, attention_mask,
                encoder_output=None, enc_dec_attn_mask=None,
                retriever_input=None,