Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
a3f4b5b8
Commit
a3f4b5b8
authored
Dec 22, 2025
by
zhuwenwen
Browse files
update weights_not_loaded and flash_mla_with_kvcache
parent
d89f7579
Changes
2
Show whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
3 additions
and
0 deletions
+3
-0
vllm/model_executor/model_loader/default_loader.py
vllm/model_executor/model_loader/default_loader.py
+1
-0
vllm/v1/attention/backends/mla/flashmla.py
vllm/v1/attention/backends/mla/flashmla.py
+2
-0
No files found.
vllm/model_executor/model_loader/default_loader.py
View file @
a3f4b5b8
...
@@ -272,6 +272,7 @@ class DefaultModelLoader(BaseModelLoader):
...
@@ -272,6 +272,7 @@ class DefaultModelLoader(BaseModelLoader):
# that have loaded weights tracking currently.
# that have loaded weights tracking currently.
if
model_config
.
quantization
is
None
and
loaded_weights
is
not
None
:
if
model_config
.
quantization
is
None
and
loaded_weights
is
not
None
:
weights_not_loaded
=
weights_to_load
-
loaded_weights
weights_not_loaded
=
weights_to_load
-
loaded_weights
weights_not_loaded
=
{
k
for
k
in
weights_not_loaded
if
not
k
.
endswith
(
"indexer.weights_proj.bias"
)}
if
weights_not_loaded
:
if
weights_not_loaded
:
raise
ValueError
(
"Following weights were not initialized from "
raise
ValueError
(
"Following weights were not initialized from "
f
"checkpoint:
{
weights_not_loaded
}
"
)
f
"checkpoint:
{
weights_not_loaded
}
"
)
vllm/v1/attention/backends/mla/flashmla.py
View file @
a3f4b5b8
...
@@ -210,6 +210,8 @@ class FlashMLAImpl(MLACommonImpl[FlashMLAMetadata]):
...
@@ -210,6 +210,8 @@ class FlashMLAImpl(MLACommonImpl[FlashMLAMetadata]):
causal
=
True
,
causal
=
True
,
descale_q
=
layer
.
_q_scale
.
reshape
(
1
),
descale_q
=
layer
.
_q_scale
.
reshape
(
1
),
descale_k
=
layer
.
_k_scale
.
reshape
(
1
),
descale_k
=
layer
.
_k_scale
.
reshape
(
1
),
is_fp8_kvcache
=
False
,
indices
=
None
,
)
)
return
o
,
lse
return
o
,
lse
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment