Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
7d44c691
Unverified
Commit
7d44c691
authored
Jul 28, 2025
by
Nick Hill
Committed by
GitHub
Jul 28, 2025
Browse files
[P/D] Log warnings related to prefill KV expiry (#21753)
Signed-off-by: Nick Hill <nhill@redhat.com>
parent
e17a4d3b
Changes
1
Show whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
12 additions
and
0 deletions
+12
-0
vllm/distributed/kv_transfer/kv_connector/v1/nixl_connector.py
...distributed/kv_transfer/kv_connector/v1/nixl_connector.py
+12
-0
No files found.
vllm/distributed/kv_transfer/kv_connector/v1/nixl_connector.py
View file @
7d44c691
...
...
@@ -1025,6 +1025,11 @@ class NixlConnectorWorker:
# Sorted dict, oldest requests are put first so we can exit early.
if
now
<
expires
:
break
count
=
self
.
consumer_notification_counts_by_req
.
pop
(
req_id
,
0
)
logger
.
warning
(
"Releasing expired KV blocks for request %s which were "
"retrieved by %d decode worker(s) within %d seconds."
,
req_id
,
count
,
envs
.
VLLM_NIXL_ABORT_REQUEST_TIMEOUT
)
del
self
.
_reqs_to_send
[
req_id
]
done_sending
.
add
(
req_id
)
...
...
@@ -1040,6 +1045,13 @@ class NixlConnectorWorker:
for
notifs
in
self
.
nixl_wrapper
.
get_new_notifs
().
values
():
for
notif
in
notifs
:
req_id
,
tp_ratio
=
notif
.
decode
(
"utf-8"
).
rsplit
(
":"
,
1
)
if
req_id
not
in
self
.
_reqs_to_send
:
logger
.
error
(
"Potentially invalid KV blocks for "
"unrecognized request %s were retrieved by "
"a decode worker. They may have expired."
,
req_id
)
continue
self
.
consumer_notification_counts_by_req
[
req_id
]
+=
1
# Wait for all consumers (D) to finish reading before freeing.
if
self
.
consumer_notification_counts_by_req
[
req_id
]
==
int
(
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment