"examples/multimodal/vscode:/vscode.git/clone" did not exist on "1412e44ba92a38afef5d026ab5225189c280014b"
Commit 965934b8 authored by zhuwenwen
Browse files

support sinks

parent 8b1077ba
......@@ -453,8 +453,9 @@ class FlashAttentionImpl(AttentionImpl):
         self.sinks = sinks
         if self.sinks is not None:
-            assert self.vllm_flash_attn_version == 3, (
-                "Sinks are only supported in FlashAttention 3")
+            if not current_platform.is_rocm():
+                assert self.vllm_flash_attn_version == 3, (
+                    "Sinks are only supported in FlashAttention 3")
             assert self.sinks.shape[0] == num_heads, (
                 "Sinks must have the same number of heads as the number of "
                 "heads in the layer")
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment