Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
dynamo
Commits
b5fa0a34
"lib/runtime/src/vscode:/vscode.git/clone" did not exist on "74221fd716d1edbad2a102cb5c5c8d52e64e4631"
Unverified
Commit
b5fa0a34
authored
Aug 21, 2025
by
Alec
Committed by
GitHub
Aug 21, 2025
Browse files
fix: --kv-event-config now respects command line (#2627)
parent
4c380caa
Changes
1
Show whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
32 additions
and
14 deletions
+32
-14
components/backends/vllm/src/dynamo/vllm/args.py
components/backends/vllm/src/dynamo/vllm/args.py
+32
-14
No files found.
components/backends/vllm/src/dynamo/vllm/args.py
View file @
b5fa0a34
...
@@ -254,6 +254,32 @@ async def configure_ports_with_etcd(config: Config, etcd_client):
...
@@ -254,6 +254,32 @@ async def configure_ports_with_etcd(config: Config, etcd_client):
set_side_channel_host_and_port
(
base_side_channel_port
)
set_side_channel_host_and_port
(
base_side_channel_port
)
def create_kv_events_config(config: Config) -> Optional[KVEventsConfig]:
    """Create the Dynamo default KVEventsConfig for prefix caching, if needed.

    Args:
        config: Dynamo vLLM configuration. This function reads
            ``config.engine_args.enable_prefix_caching``,
            ``config.engine_args.kv_events_config``,
            ``config.engine_args.data_parallel_rank`` and ``config.kv_port``.

    Returns:
        A ``KVEventsConfig`` that publishes over ZMQ on
        ``tcp://*:<kv_port - dp_rank>``, or ``None`` when no default should be
        applied: either prefix caching is disabled, or the engine args already
        carry a ``kv_events_config`` that must be left untouched.

    Raises:
        ValueError: If a default config is required but ``config.kv_port`` is
            ``None``.
    """
    engine_args = config.engine_args

    # If prefix caching is not enabled, no events config is needed.
    if not engine_args.enable_prefix_caching:
        return None

    # If the user provided their own config, return None so the caller does not
    # override it with a Dynamo default. The explicit ``None`` default keeps
    # this lookup safe when the engine args object has no such attribute.
    if getattr(engine_args, "kv_events_config", None):
        logger.info("Using user-provided kv_events_config")
        return None

    # Create default events config for prefix caching.
    logger.info("Creating Dynamo default kv_events_config for prefix caching")
    if config.kv_port is None:
        raise ValueError(
            "config.kv_port is not set; call configure_ports_with_etcd(...) before overwrite_args "
            "or provide --kv-event-config to supply an explicit endpoint."
        )

    dp_rank = engine_args.data_parallel_rank or 0
    return KVEventsConfig(
        enable_kv_cache_events=True,
        publisher="zmq",
        # vLLM will iterate dp_rank for us, so we need to subtract it out TODO: fix in vLLM
        endpoint=f"tcp://*:{config.kv_port - dp_rank}",
    )
def
create_kv_transfer_config
(
config
:
Config
)
->
Optional
[
KVTransferConfig
]:
def
create_kv_transfer_config
(
config
:
Config
)
->
Optional
[
KVTransferConfig
]:
"""Create KVTransferConfig based on user config or connector list.
"""Create KVTransferConfig based on user config or connector list.
...
@@ -313,24 +339,16 @@ def overwrite_args(config):
...
@@ -313,24 +339,16 @@ def overwrite_args(config):
# a NoneType error when the processor accesses the tokenizer.
# a NoneType error when the processor accesses the tokenizer.
"skip_tokenizer_init"
:
False
,
"skip_tokenizer_init"
:
False
,
"disable_log_requests"
:
True
,
"disable_log_requests"
:
True
,
# KV routing relies on logging KV metrics
"disable_log_stats"
:
False
,
"disable_log_stats"
:
False
,
}
}
kv_config
=
create_kv_transfer_config
(
config
)
kv_
transfer_
config
=
create_kv_transfer_config
(
config
)
if
kv_config
:
if
kv_
transfer_
config
:
defaults
[
"kv_transfer_config"
]
=
kv_config
defaults
[
"kv_transfer_config"
]
=
kv_
transfer_
config
if
config
.
engine_args
.
enable_prefix_caching
:
kv_events_config
=
create_kv_events_config
(
config
)
dp_rank
=
config
.
engine_args
.
data_parallel_rank
or
0
if
kv_events_config
:
defaults
|=
{
defaults
[
"kv_events_config"
]
=
kv_events_config
# Always setting up kv events if enable prefix cache.
"kv_events_config"
:
KVEventsConfig
(
enable_kv_cache_events
=
True
,
publisher
=
"zmq"
,
endpoint
=
f
"tcp://*:
{
config
.
kv_port
-
dp_rank
}
"
,
# vLLM will iterate dp_rank for us, so we need to subtract it out TODO: fix in vLLM
)
}
logger
.
debug
(
"Setting Dynamo defaults for vLLM"
)
logger
.
debug
(
"Setting Dynamo defaults for vLLM"
)
for
key
,
value
in
defaults
.
items
():
for
key
,
value
in
defaults
.
items
():
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment