Fix attention mask expansion so masks are applied correctly across multiple batches.

6bcf57ff · comfyanonymous · 11e3221f · 6bcf57ff
Commit 6bcf57ff authored Feb 17, 2024 by comfyanonymous
Hide whitespace changes
Inline Side-by-side

Showing with 3 additions and 3 deletions

comfy/ldm/modules/attention.py +3 -3

No files found.
--- a/comfy/ldm/modules/attention.py
+++ b/comfy/ldm/modules/attention.py
@@ -118,7 +118,7 @@ def attention_basic(q, k, v, heads, mask=None):
                bs = 1
            else:
                bs = mask.shape[0]
-            mask = mask.reshape(bs, -1, mask.shape[-2], mask.shape[-1]).expand(-1, heads, -1, -1).reshape(-1, mask.shape[-2], mask.shape[-1])
+            mask = mask.reshape(bs, -1, mask.shape[-2], mask.shape[-1]).expand(b, heads, -1, -1).reshape(-1, mask.shape[-2], mask.shape[-1])
            sim.add_(mask)

    # attention, what we cannot get enough of
@@ -175,7 +175,7 @@ def attention_sub_quad(query, key, value, heads, mask=None):
            bs = 1
        else:
            bs = mask.shape[0]
-        mask = mask.reshape(bs, -1, mask.shape[-2], mask.shape[-1]).expand(-1, heads, -1, -1).reshape(-1, mask.shape[-2], mask.shape[-1])
+        mask = mask.reshape(bs, -1, mask.shape[-2], mask.shape[-1]).expand(b, heads, -1, -1).reshape(-1, mask.shape[-2], mask.shape[-1])

    hidden_states = efficient_dot_product_attention(
        query,
@@ -240,7 +240,7 @@ def attention_split(q, k, v, heads, mask=None):
            bs = 1
        else:
            bs = mask.shape[0]
-        mask = mask.reshape(bs, -1, mask.shape[-2], mask.shape[-1]).expand(-1, heads, -1, -1).reshape(-1, mask.shape[-2], mask.shape[-1])
+        mask = mask.reshape(bs, -1, mask.shape[-2], mask.shape[-1]).expand(b, heads, -1, -1).reshape(-1, mask.shape[-2], mask.shape[-1])

    # print("steps", steps, mem_required, mem_free_total, modifier, q.element_size(), tensor_size)
    first_op_done = False