Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
bfffd59a
Commit
bfffd59a
authored
Sep 02, 2025
by
lizhigong
Browse files
fix deepseek pp + mtp issue
parent
4a62a3eb
Changes
1
Show whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
6 additions
and
4 deletions
+6
-4
vllm/v1/worker/gpu_model_runner.py
vllm/v1/worker/gpu_model_runner.py
+6
-4
No files found.
vllm/v1/worker/gpu_model_runner.py
View file @
bfffd59a
...
...
@@ -2088,7 +2088,8 @@ class GPUModelRunner(LoRAModelRunnerMixin):
hidden_states
=
outputs
if
self
.
speculative_config
and
self
.
speculative_config
.
use_eagle
()
and
not
is_profile
:
assert
isinstance
(
self
.
drafter
,
EagleProposer
)
#assert isinstance(self.drafter, EagleProposer)
if
hasattr
(
self
,
'drafter'
)
and
isinstance
(
self
.
drafter
,
EagleProposer
):
self
.
drafter
.
dummy_run
(
num_tokens
,
attn_metadata
)
# This is necessary to avoid blocking DP.
...
...
@@ -2677,9 +2678,10 @@ class GPUModelRunner(LoRAModelRunnerMixin):
kv_caches
=
self
.
initialize_kv_cache_tensors
(
kv_cache_config
)
if
self
.
speculative_config
and
self
.
speculative_config
.
use_eagle
():
assert
isinstance
(
self
.
drafter
,
EagleProposer
)
#
assert isinstance(self.drafter, EagleProposer)
# validate all draft model layers belong to the same kv cache
# group
if
hasattr
(
self
,
'drafter'
)
and
isinstance
(
self
.
drafter
,
EagleProposer
):
self
.
drafter
.
validate_same_kv_cache_group
(
kv_cache_config
)
if
has_kv_transfer_group
():
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment