Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
5bdd1552
Unverified
Commit
5bdd1552
authored
Nov 17, 2025
by
Nick Hill
Committed by
GitHub
Nov 18, 2025
Browse files
[CI] Fix async scheduling + spec decoding test flake (#28902)
Signed-off-by:
Nick Hill
<
nhill@redhat.com
>
parent
0168f69e
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
5 additions
and
3 deletions
+5
-3
tests/v1/e2e/test_async_scheduling.py
tests/v1/e2e/test_async_scheduling.py
+5
-3
No files found.
tests/v1/e2e/test_async_scheduling.py
View file @
5bdd1552
...
@@ -84,6 +84,7 @@ def test_with_spec_decoding(monkeypatch: pytest.MonkeyPatch):
...
@@ -84,6 +84,7 @@ def test_with_spec_decoding(monkeypatch: pytest.MonkeyPatch):
"num_speculative_tokens"
:
2
,
"num_speculative_tokens"
:
2
,
"model"
:
"nm-testing/Llama3_2_1B_speculator.eagle3"
,
"model"
:
"nm-testing/Llama3_2_1B_speculator.eagle3"
,
}
}
# Set small draft model len to force doesn't-fit-in-drafter case.
spec_config_short
=
spec_config
|
{
"max_model_len"
:
50
}
spec_config_short
=
spec_config
|
{
"max_model_len"
:
50
}
# test_preemption, executor, async_scheduling,
# test_preemption, executor, async_scheduling,
...
@@ -174,13 +175,14 @@ def run_tests(
...
@@ -174,13 +175,14 @@ def run_tests(
):
):
if
"spec_mml=None"
in
test_config
:
if
"spec_mml=None"
in
test_config
:
assert
(
assert
(
pytest
.
approx
(
test_acceptance_rate
,
rel
=
5e-2
)
test_acceptance_rate
>
base_acceptance_rate
==
base_acceptance_rate
or
test_acceptance_rate
==
pytest
.
approx
(
base_acceptance_rate
,
rel
=
5e-2
)
)
)
else
:
else
:
# Currently the reported acceptance rate is expected to be
# Currently the reported acceptance rate is expected to be
# lower when we sometimes skip drafting altogether.
# lower when we sometimes skip drafting altogether.
assert
test_acceptance_rate
>
0.
05
assert
test_acceptance_rate
>
0.
1
print
(
print
(
f
"PASSED: config=[
{
test_config
}
], params=
{
params
}
"
f
"PASSED: config=[
{
test_config
}
], params=
{
params
}
"
f
" accept_rate=
{
test_acceptance_rate
}
"
f
" accept_rate=
{
test_acceptance_rate
}
"
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment