Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
96abd293
Commit
96abd293
authored
Mar 11, 2026
by
yangql
Browse files
dpsk_v32的mtp层的dense加载适配
parent
0daa00fb
Changes
2
Show whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
12 additions
and
2 deletions
+12
-2
vllm/model_executor/models/deepseek_mtp.py
vllm/model_executor/models/deepseek_mtp.py
+12
-1
vllm/v1/attention/ops/flashmla.py
vllm/v1/attention/ops/flashmla.py
+0
-1
No files found.
vllm/model_executor/models/deepseek_mtp.py
View file @
96abd293
...
...
@@ -78,7 +78,9 @@ class DeepSeekMultiTokenPredictorLayer(nn.Module):
self
.
device
=
current_platform
.
device_type
self
.
is_v32
=
hasattr
(
config
,
"index_topk"
)
#添加判断,默认开启DSA
force_disable_dsa
=
os
.
environ
.
get
(
"VLLM_DISABLE_DSA"
,
"0"
)
==
"1"
self
.
is_v32
=
hasattr
(
config
,
"index_topk"
)
and
not
force_disable_dsa
if
self
.
is_v32
:
topk_tokens
=
config
.
index_topk
topk_indices_buffer
=
torch
.
empty
(
...
...
@@ -282,9 +284,18 @@ class DeepSeekMTP(nn.Module, DeepseekV2MixtureOfExperts):
params_dict
=
dict
(
self
.
named_parameters
())
loaded_params
:
set
[
str
]
=
set
()
# 判断是否加载"indexer"权重
model_has_indexer
=
any
(
"indexer"
in
param_name
for
param_name
in
params_dict
.
keys
())
for
name
,
loaded_weight
in
weights
:
if
"rotary_emb.inv_freq"
in
name
:
continue
# 跳过加载"indexer"权重
if
"indexer"
in
name
and
not
model_has_indexer
:
logger
.
info
(
f
"Skipping indexer weight (DSA disabled):
{
name
}
"
)
continue
spec_layer
=
get_spec_layer_idx_from_weight_name
(
self
.
config
,
name
)
if
spec_layer
is
None
:
continue
...
...
vllm/v1/attention/ops/flashmla.py
View file @
96abd293
...
...
@@ -136,7 +136,6 @@ def get_mla_metadata_dense_fp8(
cache_seqlens
,
num_q_tokens_per_head_k
,
num_heads_k
,
# 16,
)
else
:
return
torch
.
ops
.
_flashmla_extension_C
.
get_mla_decoding_metadata_dense_fp8
(
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment