Unverified Commit 42e1a72e authored by hlu1's avatar hlu1 Committed by GitHub
Browse files

[Deepseek V3.2] Enable flashmla_auto with MTP (#12294)


Signed-off-by: default avatarHao Lu <14827759+hlu1@users.noreply.github.com>
parent 83a7c89c
......@@ -1222,11 +1222,9 @@ class NativeSparseAttnBackend(AttentionBackend):
if self.enable_auto_select_prefill_impl:
if self.nsa_kv_cache_store_fp8:
if (
# TODO(hlu1): enable MTP
is_blackwell()
and forward_batch is not None
and forward_batch.forward_mode.is_extend()
and forward_batch.spec_algorithm.is_none()
and forward_batch.forward_mode == ForwardMode.EXTEND
):
total_kv_tokens = forward_batch.seq_lens_sum
total_q_tokens = forward_batch.extend_num_tokens
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment