Unverified Commit 4d35d7fe authored by Patrick von Platen, committed by GitHub

Allow disabling torch 2_0 attention (#3273)

* Allow disabling torch 2_0 attention

* make style

* Update src/diffusers/models/attention.py
parent a7b0671c
@@ -71,6 +71,7 @@ class AttentionBlock(nn.Module):
         self.proj_attn = nn.Linear(channels, channels, bias=True)

         self._use_memory_efficient_attention_xformers = False
+        self._use_2_0_attn = True
         self._attention_op = None

     def reshape_heads_to_batch_dim(self, tensor, merge_head_and_batch=True):
@@ -142,9 +143,8 @@ class AttentionBlock(nn.Module):
         scale = 1 / math.sqrt(self.channels / self.num_heads)

-        use_torch_2_0_attn = (
-            hasattr(F, "scaled_dot_product_attention") and not self._use_memory_efficient_attention_xformers
-        )
+        _use_2_0_attn = self._use_2_0_attn and not self._use_memory_efficient_attention_xformers
+        use_torch_2_0_attn = hasattr(F, "scaled_dot_product_attention") and _use_2_0_attn

         query_proj = self.reshape_heads_to_batch_dim(query_proj, merge_head_and_batch=not use_torch_2_0_attn)
         key_proj = self.reshape_heads_to_batch_dim(key_proj, merge_head_and_batch=not use_torch_2_0_attn)
...
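With this change, the PyTorch 2.0 F.scaled_dot_product_attention path can be switched off per block through the new _use_2_0_attn flag, forcing the baseline attention math even when torch 2.0 is installed. A minimal sketch of toggling the flag follows; the constructor arguments and tensor shape are illustrative assumptions, not part of this diff:

import torch
from diffusers.models.attention import AttentionBlock

# Illustrative setup: channels/num_head_channels are assumed values, not from this commit.
block = AttentionBlock(channels=64, num_head_channels=32)

# By default the block prefers torch 2.0 scaled_dot_product_attention when it exists.
assert block._use_2_0_attn is True

# Flip the new flag to fall back to the plain attention implementation.
block._use_2_0_attn = False

hidden_states = torch.randn(1, 64, 16, 16)  # (batch, channels, height, width)
out = block(hidden_states)
print(out.shape)  # torch.Size([1, 64, 16, 16])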