Update fp8_mqa_logits and fp8_paged_mqa_logits dispatch: invert the current_platform.is_rocm() check guarding both calls

259605da · zhuwenwen · a55b8f91 · 259605da
Commit 259605da authored Dec 12, 2025 by zhuwenwen
Show whitespace changes
Inline Side-by-side

Showing 1 changed file with 2 additions and 2 deletions

vllm/model_executor/models/deepseek_v2.py +2 -2

No files found.
--- a/vllm/model_executor/models/deepseek_v2.py
+++ b/vllm/model_executor/models/deepseek_v2.py
@@ -627,7 +627,7 @@ def sparse_attn_indexer(
                chunk.cu_seq_lens,
                chunk.num_reqs,
            )
-            if current_platform.is_rocm():
+            if not current_platform.is_rocm():
                logits = fp8_mqa_logits(
                    q_fp8[chunk.token_start:chunk.token_end],
                    (k_fp8, k_scale),
@@ -680,7 +680,7 @@ def sparse_attn_indexer(
        next_n = padded_q_fp8_decode_tokens.shape[1]
        assert batch_size == decode_metadata.seq_lens.shape[0]
        num_padded_tokens = batch_size * next_n
-        if current_platform.is_rocm():
+        if not current_platform.is_rocm():
            logits = fp8_paged_mqa_logits(
                padded_q_fp8_decode_tokens,
                kv_cache,