update common.py

2da6fd72 · zhuwenwen · f246ee95 · 2da6fd72 · 2da6fd72
Commit 2da6fd72 authored Jun 23, 2025 by zhuwenwen
Hide whitespace changes
Inline Side-by-side

Showing with 1 addition and 2 deletions

vllm/attention/backends/mla/common.py vllm/attention/backends/mla/common.py +0 -1

vllm/v1/attention/backends/mla/common.py vllm/v1/attention/backends/mla/common.py +1 -1

No files found.
--- a/vllm/attention/backends/mla/common.py
+++ b/vllm/attention/backends/mla/common.py
@@ -1031,7 +1031,6 @@ class MLACommonImpl(MLAAttentionImpl[T], Generic[T]):
        # and the one from vllm_flash_attn. The former is used on ROCm and the
        # latter has an additional parameter to control FA2 vs FA3
        self.flash_attn_varlen_func = flash_attn_varlen_func
-        # self.vllm_flash_attn_version = None
        self.vllm_flash_attn_version = get_flash_attn_version()
        if self.vllm_flash_attn_version is not None:
            self.flash_attn_varlen_func = \

--- a/vllm/v1/attention/backends/mla/common.py
+++ b/vllm/v1/attention/backends/mla/common.py
@@ -656,7 +656,7 @@ class MLACommonImpl(MLAAttentionImpl[M], Generic[M]):
            q=q,
            k=k,
            v=maybe_padded_v,
-            return_softmax_lse=return_softmax_lse,
+            # return_softmax_lse=return_softmax_lse,
            softmax_scale=softmax_scale,
            **kwargs,
        )