Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
02a58803
Unverified
Commit
02a58803
authored
Dec 12, 2025
by
Wentao Ye
Committed by
GitHub
Dec 12, 2025
Browse files
[CI] Fix mypy for vllm/v1/executor (#30517)
Signed-off-by:
yewentao256
<
zhyanwentao@126.com
>
parent
d2c919dc
Changes
5
Hide whitespace changes
Inline
Side-by-side
Showing
5 changed files
with
20 additions
and
13 deletions
+20
-13
tools/pre_commit/mypy.py
tools/pre_commit/mypy.py
+1
-1
vllm/v1/executor/abstract.py
vllm/v1/executor/abstract.py
+1
-1
vllm/v1/executor/multiproc_executor.py
vllm/v1/executor/multiproc_executor.py
+7
-3
vllm/v1/executor/ray_executor.py
vllm/v1/executor/ray_executor.py
+3
-3
vllm/v1/executor/uniproc_executor.py
vllm/v1/executor/uniproc_executor.py
+8
-5
No files found.
tools/pre_commit/mypy.py
View file @
02a58803
...
...
@@ -43,6 +43,7 @@ FILES = [
"vllm/worker"
,
"vllm/v1/core"
,
"vllm/v1/engine"
,
"vllm/v1/executor"
,
"vllm/v1/metrics"
,
"vllm/v1/pool"
,
"vllm/v1/sample"
,
...
...
@@ -60,7 +61,6 @@ SEPARATE_GROUPS = [
"vllm/model_executor"
,
# v1 related
"vllm/v1/attention"
,
"vllm/v1/executor"
,
"vllm/v1/kv_offload"
,
"vllm/v1/spec_decode"
,
"vllm/v1/structured_output"
,
...
...
vllm/v1/executor/abstract.py
View file @
02a58803
...
...
@@ -219,7 +219,7 @@ class Executor(ABC):
def
sample_tokens
(
self
,
grammar_output
:
GrammarOutput
|
None
,
non_block
:
bool
=
False
)
->
ModelRunnerOutput
|
None
|
Future
[
ModelRunnerOutput
|
None
]:
)
->
ModelRunnerOutput
|
Future
[
ModelRunnerOutput
]:
output
=
self
.
collective_rpc
(
# type: ignore[call-overload]
"sample_tokens"
,
args
=
(
grammar_output
,),
non_block
=
non_block
)
...
...
vllm/v1/executor/multiproc_executor.py
View file @
02a58803
...
...
@@ -294,8 +294,8 @@ class MultiprocExecutor(Executor):
kwargs
:
dict
|
None
=
None
,
non_block
:
bool
=
False
,
unique_reply_rank
:
int
|
None
=
None
,
kv_output_aggregator
:
KVOutputAggregator
=
None
,
)
->
Any
|
list
[
Any
]
|
Future
[
Any
|
list
[
Any
]]
:
kv_output_aggregator
:
KVOutputAggregator
|
None
=
None
,
)
->
Any
:
"""Returns single result if unique_reply_rank and/or kv_output_aggregator
is provided, otherwise list."""
assert
self
.
rpc_broadcast_mq
is
not
None
,
(
...
...
@@ -476,6 +476,8 @@ class WorkerProc:
"""Wrapper that runs one Worker in a separate process."""
READY_STR
=
"READY"
rpc_broadcast_mq
:
MessageQueue
|
None
worker_response_mq
:
MessageQueue
|
None
def
_init_message_queues
(
self
,
input_shm_handle
:
Handle
,
vllm_config
:
VllmConfig
...
...
@@ -487,7 +489,7 @@ class WorkerProc:
)
# Initializes a message queue for sending the model output
self
.
worker_response_mq
:
MessageQueue
=
MessageQueue
(
1
,
1
)
self
.
worker_response_mq
=
MessageQueue
(
1
,
1
)
self
.
peer_response_handles
=
[]
else
:
# Initialize remote MessageQueue for receiving SchedulerOutput across nodes
...
...
@@ -720,6 +722,7 @@ class WorkerProc:
try
:
reader
.
close
()
worker
=
WorkerProc
(
*
args
,
**
kwargs
)
assert
worker
.
worker_response_mq
is
not
None
# Send READY once we know everything is loaded
ready_writer
.
send
(
...
...
@@ -804,6 +807,7 @@ class WorkerProc:
def
worker_busy_loop
(
self
,
cancel
:
threading
.
Event
|
None
=
None
):
"""Main busy loop for Multiprocessing Workers"""
assert
self
.
rpc_broadcast_mq
is
not
None
while
True
:
method
,
args
,
kwargs
,
output_rank
=
self
.
rpc_broadcast_mq
.
dequeue
(
cancel
=
cancel
,
indefinite
=
True
...
...
vllm/v1/executor/ray_executor.py
View file @
02a58803
...
...
@@ -413,7 +413,7 @@ class RayDistributedExecutor(Executor):
self
,
grammar_output
:
"GrammarOutput | None"
,
non_block
:
bool
=
False
,
)
->
ModelRunnerOutput
|
Future
[
ModelRunnerOutput
]:
)
->
ModelRunnerOutput
|
None
|
Future
[
ModelRunnerOutput
|
None
]:
"""Execute the model on the Ray workers.
The scheduler output to use should have been provided in
...
...
@@ -428,7 +428,7 @@ class RayDistributedExecutor(Executor):
"""
scheduler_output
=
self
.
scheduler_output
if
scheduler_output
is
None
:
return
COMPLETED_NONE_FUTURE
if
non_block
else
None
# noqa
return
COMPLETED_NONE_FUTURE
if
non_block
else
None
self
.
scheduler_output
=
None
...
...
@@ -439,7 +439,7 @@ class RayDistributedExecutor(Executor):
scheduler_output
:
SchedulerOutput
,
grammar_output
:
"GrammarOutput | None"
,
non_block
:
bool
=
False
,
)
->
ModelRunnerOutput
|
Future
[
ModelRunnerOutput
]:
)
->
ModelRunnerOutput
|
None
|
Future
[
ModelRunnerOutput
|
None
]:
# Build the compiled DAG for the first time.
if
self
.
forward_dag
is
None
:
# type: ignore
self
.
forward_dag
=
self
.
_compiled_ray_dag
(
enable_asyncio
=
False
)
...
...
vllm/v1/executor/uniproc_executor.py
View file @
02a58803
...
...
@@ -67,7 +67,7 @@ class UniProcExecutor(Executor):
kwargs
:
dict
|
None
=
None
,
non_block
:
bool
=
False
,
single_value
:
bool
=
False
,
)
->
Any
|
list
[
Any
]
|
Future
[
Any
|
list
[
Any
]]
:
)
->
Any
:
if
kwargs
is
None
:
kwargs
=
{}
...
...
@@ -79,10 +79,13 @@ class UniProcExecutor(Executor):
result
=
run_method
(
self
.
driver_worker
,
method
,
args
,
kwargs
)
if
isinstance
(
result
,
AsyncModelRunnerOutput
):
if
(
async_thread
:
=
self
.
async_output_thread
)
is
not
None
:
get_output
=
result
.
get_output
if
not
single_value
:
get_output
=
lambda
go
=
result
.
get_output
:
[
go
()]
return
async_thread
.
submit
(
get_output
)
if
single_value
:
return
async_thread
.
submit
(
result
.
get_output
)
def
get_output_list
()
->
list
[
Any
]:
return
[
result
.
get_output
()]
return
async_thread
.
submit
(
get_output_list
)
result
=
result
.
get_output
()
future
=
Future
[
Any
]()
future
.
set_result
(
result
if
single_value
else
[
result
])
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment