Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
dynamo
Commits
7802f969
Unverified
Commit
7802f969
authored
Nov 10, 2025
by
Biswa Panda
Committed by
GitHub
Nov 10, 2025
Browse files
feat: disable kv events in vLLM when lora is enabled (#4128)
parent
5c46fa4c
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
21 additions
and
0 deletions
+21
-0
components/src/dynamo/vllm/args.py
components/src/dynamo/vllm/args.py
+18
-0
components/src/dynamo/vllm/main.py
components/src/dynamo/vllm/main.py
+3
-0
No files found.
components/src/dynamo/vllm/args.py
View file @
7802f969
...
@@ -326,6 +326,24 @@ def create_kv_events_config(config: Config) -> Optional[KVEventsConfig]:
...
@@ -326,6 +326,24 @@ def create_kv_events_config(config: Config) -> Optional[KVEventsConfig]:
if
not
config
.
engine_args
.
enable_prefix_caching
:
if
not
config
.
engine_args
.
enable_prefix_caching
:
return
None
return
None
# There is a bug with KV events publishing when LoRA is enabled.
# It is fixed in https://github.com/vllm-project/vllm/pull/27728, but the fix has not been released yet.
# Remove the check below once a vLLM version containing the fix is released.
if
config
.
engine_args
.
enable_lora
:
if
config
.
engine_args
.
kv_events_config
is
None
:
# No explicit kv events config was provided by the user, so disable KV events: they are not supported yet while LoRA is enabled.
return
None
else
:
# The user provided their own kv events config, which will not work while LoRA is enabled.
message
=
(
"KV events doesn't work when LoRA is enabled due to upstream vLLM bug. "
"Please see https://github.com/vllm-project/vllm/pull/27728."
"For now, either disable lora or dont use explicit kv envents config."
"Dont set both --kv-events-config and --enable-lora in vllm command line args."
)
logger
.
error
(
message
)
raise
ValueError
(
message
)
# If user provided their own config, use that
# If user provided their own config, use that
if
c
:
=
getattr
(
config
.
engine_args
,
"kv_events_config"
):
if
c
:
=
getattr
(
config
.
engine_args
,
"kv_events_config"
):
logger
.
info
(
f
"Using user-provided kv_events_config
{
c
}
"
)
logger
.
info
(
f
"Using user-provided kv_events_config
{
c
}
"
)
...
...
components/src/dynamo/vllm/main.py
View file @
7802f969
...
@@ -153,6 +153,9 @@ def setup_kv_event_publisher(
...
@@ -153,6 +153,9 @@ def setup_kv_event_publisher(
logger
.
info
(
"Skipping KV event publisher setup for decode worker"
)
logger
.
info
(
"Skipping KV event publisher setup for decode worker"
)
return
None
return
None
if
config
.
engine_args
.
kv_events_config
is
None
:
return
None
# Get data_parallel_size to create publishers for all dp_ranks
# Get data_parallel_size to create publishers for all dp_ranks
data_parallel_size
=
getattr
(
vllm_config
.
parallel_config
,
"data_parallel_size"
,
1
)
data_parallel_size
=
getattr
(
vllm_config
.
parallel_config
,
"data_parallel_size"
,
1
)
kv_publishers
=
[]
kv_publishers
=
[]
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment