Commit 13403e81 authored by Tri Dao

Relax assert to allow both bf16 and fp16

parent 64f42cd0
@@ -34,7 +34,7 @@ class FlashAttention(nn.Module):
         key_padding_mask: a bool tensor of shape (B, S)
         """
         assert not need_weights
-        assert qkv.dtype == torch.float16
+        assert qkv.dtype in [torch.float16, torch.bfloat16]
         assert qkv.is_cuda
         if cu_seqlens is None:
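The change above widens the input-dtype guard so that bfloat16 tensors are accepted alongside float16. A minimal sketch of the relaxed check (the helper name `check_qkv_dtype` is illustrative, not part of the repository; the CUDA check from the original code is omitted so the sketch runs on CPU):

```python
import torch


def check_qkv_dtype(qkv: torch.Tensor) -> None:
    # Before this commit only fp16 passed; now fp16 and bf16 both do.
    assert qkv.dtype in [torch.float16, torch.bfloat16], (
        f"FlashAttention expects fp16 or bf16 input, got {qkv.dtype}"
    )


# Both half-precision dtypes now pass the assert.
check_qkv_dtype(torch.zeros(2, 8, 3, 4, 16, dtype=torch.float16))
check_qkv_dtype(torch.zeros(2, 8, 3, 4, 16, dtype=torch.bfloat16))
```

A full-precision tensor (e.g. `torch.float32`) still trips the assertion, since the FlashAttention kernels only support half-precision inputs.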