Unverified commit 41cfa506, authored by vllmellm, committed by GitHub
Browse files

[ROCm][AITER] fix wrong argument passed to AITER `flash_attn_varlen_func` (#31880)


Signed-off-by: vllmellm <vllm.ellm@embeddedllm.com>
parent d111bc53
......@@ -54,7 +54,7 @@ class AiterTritonMLAImpl(AiterMLAImpl):
k,
v,
softmax_scale=softmax_scale,
-return_softmax_lse=return_softmax_lse,
+return_lse=return_softmax_lse,
**kwargs,
)
# Transpose the LSE if Triton MHA is used:
......
......@@ -236,7 +236,7 @@ class AiterMLAImpl(MLACommonImpl[AiterMLAMetadata]):
k=k,
v=v,
softmax_scale=softmax_scale,
-return_softmax_lse=return_softmax_lse,
+return_lse=return_softmax_lse,
**kwargs,
)
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment