Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
3d13ca0e
Unverified
Commit
3d13ca0e
authored
May 07, 2025
by
Nick Hill
Committed by
GitHub
May 08, 2025
Browse files
[BugFix] Fix `--disable-log-stats` in V1 server mode (#17600)
Signed-off-by:
Nick Hill
<
nhill@redhat.com
>
parent
66ab3b13
Changes
2
Show whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
7 additions
and
5 deletions
+7
-5
vllm/v1/engine/async_llm.py
vllm/v1/engine/async_llm.py
+3
-2
vllm/v1/engine/core_client.py
vllm/v1/engine/core_client.py
+4
-3
No files found.
vllm/v1/engine/async_llm.py
View file @
3d13ca0e
...
@@ -120,6 +120,7 @@ class AsyncLLM(EngineClient):
...
@@ -120,6 +120,7 @@ class AsyncLLM(EngineClient):
executor_class
=
executor_class
,
executor_class
=
executor_class
,
log_stats
=
self
.
log_stats
,
log_stats
=
self
.
log_stats
,
)
)
if
self
.
stat_loggers
:
for
stat_logger
in
self
.
stat_loggers
[
0
]:
for
stat_logger
in
self
.
stat_loggers
[
0
]:
stat_logger
.
log_engine_initialized
()
stat_logger
.
log_engine_initialized
()
self
.
output_handler
:
Optional
[
asyncio
.
Task
]
=
None
self
.
output_handler
:
Optional
[
asyncio
.
Task
]
=
None
...
...
vllm/v1/engine/core_client.py
View file @
3d13ca0e
...
@@ -442,9 +442,10 @@ class MPClient(EngineCoreClient):
...
@@ -442,9 +442,10 @@ class MPClient(EngineCoreClient):
logger
.
info
(
"Core engine process %d ready."
,
eng_id
)
logger
.
info
(
"Core engine process %d ready."
,
eng_id
)
identities
.
discard
(
eng_id
)
identities
.
discard
(
eng_id
)
# Setup KV cache config with initialization state from
# Setup KV cache config with initialization state from
# engine core process.
# engine core process. Sum values from all engines in DP case.
self
.
vllm_config
.
cache_config
.
num_gpu_blocks
=
message_dict
[
num_gpu_blocks
=
self
.
vllm_config
.
cache_config
.
num_gpu_blocks
or
0
'num_gpu_blocks'
]
num_gpu_blocks
+=
message_dict
[
'num_gpu_blocks'
]
self
.
vllm_config
.
cache_config
.
num_gpu_blocks
=
num_gpu_blocks
def
_init_core_engines
(
def
_init_core_engines
(
self
,
self
,
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment