Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
10d9872d
Unverified
Commit
10d9872d
authored Apr 13, 2026 by zhanqiuhu
Committed by
GitHub
Apr 13, 2026
Browse files
[CI][Metrics] Fix local_cache_hit assertion after prompt tokens metrics updates (#39709)
Signed-off-by: ZhanqiuHu <zhu@redhat.com>
parent
ccd0d1d9
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing 1 changed file with 4 additions and 4 deletions
+4
-4
tests/v1/kv_connector/nixl_integration/test_multi_connector_edge_cases.py
...ector/nixl_integration/test_multi_connector_edge_cases.py
+4
-4
No files found.
tests/v1/kv_connector/nixl_integration/test_multi_connector_edge_cases.py
View file @
10d9872d
...
@@ -341,8 +341,8 @@ def test_full_decode_gpu_cache_hit_metrics():
...
@@ -341,8 +341,8 @@ def test_full_decode_gpu_cache_hit_metrics():
    print(f"FULL CACHE HIT: {P} tokens, cached={cached}, nixl={expected_nixl}")
    print(f"FULL CACHE HIT: {P} tokens, cached={cached}, nixl={expected_nixl}")
    print(f" metrics delta: {d}, nixl_bytes_delta={n1 - n0}")
    print(f" metrics delta: {d}, nixl_bytes_delta={n1 - n0}")
    assert len(proxy_text) > 0, "proxy returned empty response"
    assert len(proxy_text) > 0, "proxy returned empty response"
    assert d["local_cache_hit"] == cached, (
    assert d["local_cache_hit"] == cached - 1, (
        f"expected local_cache_hit={cached}, got {d['local_cache_hit']}"
        f"expected local_cache_hit={cached - 1}, got {d['local_cache_hit']}"
    )
    )
    assert d["external_kv_transfer"] == expected_nixl, (
    assert d["external_kv_transfer"] == expected_nixl, (
        f"expected external_kv_transfer={expected_nixl}, "
        f"expected external_kv_transfer={expected_nixl}, "
...
@@ -383,8 +383,8 @@ def test_partial_decode_gpu_cache_hit_metrics():
...
@@ -383,8 +383,8 @@ def test_partial_decode_gpu_cache_hit_metrics():
        f"expected external_kv_transfer={expected_nixl}, "
        f"expected external_kv_transfer={expected_nixl}, "
        f"got {d['external_kv_transfer']}"
        f"got {d['external_kv_transfer']}"
    )
    )
    assert d["local_cache_hit"] == cached, (
    assert d["local_cache_hit"] == cached - 1, (
        f"expected local_cache_hit={cached}, got {d['local_cache_hit']}"
        f"expected local_cache_hit={cached - 1}, got {d['local_cache_hit']}"
    )
    )
    assert d["local_compute"] == 1, (
    assert d["local_compute"] == 1, (
        f"expected local_compute=1 (recomputed last token), got {d['local_compute']}"
        f"expected local_compute=1 (recomputed last token), got {d['local_compute']}"
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment