Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
3adffd5b
Unverified
Commit
3adffd5b
authored
Jan 09, 2026
by
Nick Hill
Committed by
GitHub
Jan 09, 2026
Browse files
[Misc] Enable async scheduling by default with spec decoding (#31998)
Signed-off-by:
Nick Hill
<
nickhill123@gmail.com
>
parent
97ba96fb
Changes
1
Show whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
27 additions
and
22 deletions
+27
-22
vllm/config/vllm.py
vllm/config/vllm.py
+27
-22
No files found.
vllm/config/vllm.py
View file @
3adffd5b
...
@@ -582,11 +582,8 @@ class VllmConfig:
...
@@ -582,11 +582,8 @@ class VllmConfig:
)
)
if
self
.
speculative_config
.
disable_padded_drafter_batch
:
if
self
.
speculative_config
.
disable_padded_drafter_batch
:
raise
ValueError
(
raise
ValueError
(
"async scheduling for EAGLE/MTP kind of speculative "
"Async scheduling is not compatible with "
"decoding is enabled, but disable_padded_drafter_batch=True "
"disable_padded_drafter_batch=True."
"disable_padded_drafter_batch=True is not supported for "
"this situation now. please set "
"disable_padded_drafter_batch=Fasle"
)
)
if
not
executor_supports_async_sched
:
if
not
executor_supports_async_sched
:
raise
ValueError
(
raise
ValueError
(
...
@@ -597,32 +594,40 @@ class VllmConfig:
...
@@ -597,32 +594,40 @@ class VllmConfig:
elif
self
.
scheduler_config
.
async_scheduling
is
None
:
elif
self
.
scheduler_config
.
async_scheduling
is
None
:
# Enable async scheduling unless there is an incompatible option.
# Enable async scheduling unless there is an incompatible option.
if
self
.
parallel_config
.
pipeline_parallel_size
>
1
:
if
self
.
parallel_config
.
pipeline_parallel_size
>
1
:
logger
.
warning
(
logger
.
warning
_once
(
"Async scheduling is not yet supported with "
"Async scheduling is not yet supported with "
"pipeline_parallel_size > 1 and will be disabled."
"pipeline_parallel_size > 1 and will be disabled."
,
scope
=
"local"
,
)
)
self
.
scheduler_config
.
async_scheduling
=
False
self
.
scheduler_config
.
async_scheduling
=
False
elif
self
.
speculative_config
is
not
None
:
elif
(
if
self
.
speculative_config
.
method
not
in
get_args
(
EagleModelTypes
):
self
.
speculative_config
is
not
None
logger
.
warning
(
and
self
.
speculative_config
.
method
not
in
get_args
(
EagleModelTypes
)
):
logger
.
warning_once
(
"Async scheduling not supported with %s-based "
"Async scheduling not supported with %s-based "
"speculative decoding and will be disabled."
,
"speculative decoding and will be disabled."
,
self
.
speculative_config
.
method
,
self
.
speculative_config
.
method
,
scope
=
"local"
,
)
)
else
:
self
.
scheduler_config
.
async_scheduling
=
False
logger
.
warning
(
elif
(
"Async scheduling will be disabled because some features do "
self
.
speculative_config
is
not
None
"not currently work in conjunction with speculative decoding. "
and
self
.
speculative_config
.
disable_padded_drafter_batch
"To use async scheduling with spec decoding anyway, "
):
"enable it explicitly via async_scheduling=True."
logger
.
warning_once
(
"Async scheduling is not compatible with "
"disable_padded_drafter_batch=True and will be disabled."
,
scope
=
"local"
,
)
)
self
.
scheduler_config
.
async_scheduling
=
False
self
.
scheduler_config
.
async_scheduling
=
False
elif
not
executor_supports_async_sched
:
elif
not
executor_supports_async_sched
:
logger
.
warning
(
logger
.
warning
_once
(
"Async scheduling will be disabled because it is not supported "
"Async scheduling will be disabled because it is not supported "
"with the `%s` distributed executor backend (only `mp`, `uni`, and "
"with the `%s` distributed executor backend (only `mp`, `uni`, and "
"`external_launcher` are supported)."
,
"`external_launcher` are supported)."
,
executor_backend
,
executor_backend
,
scope
=
"local"
,
)
)
self
.
scheduler_config
.
async_scheduling
=
False
self
.
scheduler_config
.
async_scheduling
=
False
else
:
else
:
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment