Commit 19d12610 authored by Tri Dao

Add back need_weights in FlashMHA

parent 6cc73425
@@ -98,7 +98,7 @@ class FlashMHA(nn.Module):
         self.inner_attn = FlashAttention(attention_dropout=attention_dropout, **factory_kwargs)
         self.out_proj = nn.Linear(embed_dim, embed_dim, bias=bias, **factory_kwargs)
 
-    def forward(self, x, key_padding_mask=None):
+    def forward(self, x, key_padding_mask=None, need_weights=False):
         """x: (batch, seqlen, hidden_dim) (where hidden_dim = num heads * head dim)
         key_padding_mask: bool tensor of shape (batch, seqlen)
         """
...
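
For context, need_weights mirrors the flag on torch.nn.MultiheadAttention, so restoring it in FlashMHA.forward lets callers written against that interface keep passing the argument without a TypeError. Below is a minimal sketch of that calling convention using nn.MultiheadAttention as the reference module; only the forward signature above is taken from this diff, and FlashMHA's return convention is not shown in the hunk, so treat the tuple-return pattern here as an assumption.

    import torch
    import torch.nn as nn

    # Reference module whose forward interface FlashMHA partially mirrors.
    # need_weights=False tells the module it may skip returning the
    # (batch, seqlen, seqlen) attention matrix.
    mha = nn.MultiheadAttention(embed_dim=512, num_heads=8, batch_first=True)

    x = torch.randn(2, 128, 512)                              # (batch, seqlen, hidden_dim)
    key_padding_mask = torch.zeros(2, 128, dtype=torch.bool)  # True marks padded positions

    out, attn_weights = mha(x, x, x,
                            key_padding_mask=key_padding_mask,
                            need_weights=False)
    print(out.shape)     # torch.Size([2, 128, 512])
    print(attn_weights)  # None when need_weights=False

Since FlashAttention's fused kernel avoids materializing the full attention matrix, callers would typically leave need_weights at its default of False; how FlashMHA handles need_weights=True is not visible in this hunk.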