[Fix] Fix sage-attn distribute bug (#235)

0dd7ca09 · gushiqiao · GitHub · 79c3caa2 · 0dd7ca09 · 0dd7ca09
Commit 0dd7ca09, authored Aug 21, 2025 by gushiqiao; committed by GitHub on Aug 21, 2025
Showing 2 changed files with 3 additions and 2 deletions

lightx2v/common/ops/attn/ulysses_attn.py +2 -2

lightx2v/models/networks/wan/infer/transformer_infer.py +1 -0

No files found.
--- a/lightx2v/common/ops/attn/ulysses_attn.py
+++ b/lightx2v/common/ops/attn/ulysses_attn.py
@@ -12,7 +12,7 @@ class UlyssesAttnWeight(AttnWeightTemplate):
    def __init__(self):
        self.config = {}
-    def apply(self, q, k, v, img_qkv_len, cu_seqlens_qkv, attention_module=None, seq_p_group=None):
+    def apply(self, q, k, v, img_qkv_len, cu_seqlens_qkv, attention_module=None, seq_p_group=None, model_cls=None):
        """
        执行 Ulysses 注意力机制，结合图像和文本的查询、键和值。
@@ -77,7 +77,7 @@ class UlyssesAttnWeight(AttnWeightTemplate):
        # 调用注意力函数计算注意力结果
        # attn = attention(attention_type=attention_type, q=q, k=k, v=v, cu_seqlens_q=cu_seqlens_qkv, cu_seqlens_kv=cu_seqlens_qkv, max_seqlen_q=max_seqlen_qkv, max_seqlen_kv=max_seqlen_qkv)
-        attn = attention_module.apply(q=q, k=k, v=v, cu_seqlens_q=cu_seqlens_qkv, cu_seqlens_kv=cu_seqlens_qkv, max_seqlen_q=max_seqlen_qkv, max_seqlen_kv=max_seqlen_qkv)
+        attn = attention_module.apply(q=q, k=k, v=v, cu_seqlens_q=cu_seqlens_qkv, cu_seqlens_kv=cu_seqlens_qkv, max_seqlen_q=max_seqlen_qkv, max_seqlen_kv=max_seqlen_qkv, model_cls=model_cls)
        # 分割图像和文本的注意力结果
        img_attn, txt_attn = attn[: img_q.shape[0], :], attn[img_q.shape[0] :,]

--- a/lightx2v/models/networks/wan/infer/transformer_infer.py
+++ b/lightx2v/models/networks/wan/infer/transformer_infer.py
@@ -164,6 +164,7 @@ class WanTransformerInfer(BaseTransformerInfer):
                cu_seqlens_qkv=cu_seqlens_q,
                attention_module=weights.self_attn_1,
                seq_p_group=self.seq_p_group,
+                model_cls=self.config["model_cls"],
            )
        else:
            attn_out = weights.self_attn_1.apply(