Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
67475a6e
Unverified
Commit 67475a6e authored Dec 09, 2025 by Jaya Yuan
Committed by GitHub Dec 09, 2025
Browse files
[DCP][Bugfix][CI] Fix accuracy issue of DCP when using FLASH_ATTN_MLA (#30309)
Signed-off-by: FENP <yuanyongjie.yyj@antgroup.com>
parent
9c32df61
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing 2 changed files with 6 additions and 2 deletions
+6
-2
tests/distributed/test_context_parallel.py
tests/distributed/test_context_parallel.py
+4
-1
vllm/v1/attention/backends/mla/flashattn_mla.py
vllm/v1/attention/backends/mla/flashattn_mla.py
+2
-1
No files found.
tests/distributed/test_context_parallel.py
View file @
67475a6e
...
...
@@ -123,8 +123,11 @@ class CPTestSettings:
CP_TEXT_GENERATION_MODELS
=
{
"deepseek-ai/DeepSeek-V2-Lite-Chat"
:
[
CPTestSettings
.
detailed
(
dcp_multipliers
=
[
1
]),
CPTestSettings
.
detailed
(
dcp_multipliers
=
[
0.5
,
1
],
cp_kv_cache_interleave_size
=
64
dcp_multipliers
=
[
0.5
],
cp_kv_cache_interleave_size
=
64
,
attn_backend
=
"FLASHMLA"
,
),
],
"Qwen/Qwen2.5-1.5B-Instruct"
:
[
...
...
vllm/v1/attention/backends/mla/flashattn_mla.py
View file @
67475a6e
...
...
@@ -105,13 +105,14 @@ class FlashAttnMLAMetadataBuilder(MLACommonMetadataBuilder[FlashAttnMLAMetadata]
vllm_config
:
VllmConfig
,
device
:
torch
.
device
,
):
interleave_size
=
vllm_config
.
parallel_config
.
cp_kv_cache_interleave_size
super
().
__init__
(
kv_cache_spec
,
layer_names
,
vllm_config
,
device
,
FlashAttnMLAMetadata
,
supports_dcp_with_varlen
=
True
,
supports_dcp_with_varlen
=
(
interleave_size
==
1
)
,
)
self
.
max_num_splits
=
0
# No upper bound on the number of splits.
self
.
fa_aot_schedule
=
get_flash_attn_version
()
==
3
...
...
Write
Preview
Markdown
is supported
0%
Try again or attach a new file.
Attach a file
Cancel
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please register or sign in to comment.