Update transformer.py: add torch.compile

473449d8 · wxj · 50fe58fa · 473449d8
Commit 473449d8 authored Dec 31, 2024 by wxj
Hide whitespace changes
Inline Side-by-side

Showing 1 changed file with 1 addition and 0 deletions

megatron/legacy/model/transformer.py megatron/legacy/model/transformer.py +1 -0

No files found.
--- a/megatron/legacy/model/transformer.py
+++ b/megatron/legacy/model/transformer.py
@@ -1213,6 +1213,7 @@ class ParallelTransformerLayer(MegatronModule):

        return retriever_output, norm_input, norm_output

+    @torch.compile(mode="max-autotune-no-cudagraphs")
    def forward(self, hidden_states, attention_mask,
                encoder_output=None, enc_dec_attn_mask=None,
                retriever_input=None,