Unverified commit e6ce4db3, authored by Dmitry Tokarev and committed by GitHub
Browse files

test(fault_tolerance): skip flaky sglang migration NATS combo, drop stale...


test(fault_tolerance): skip flaky sglang migration NATS combo, drop stale graceful_shutdown xfail (#8404)
Signed-off-by: Dmitry Tokarev <dtokarev@nvidia.com>
Co-authored-by: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
parent d795e1a4
......@@ -46,13 +46,7 @@ pytestmark = [
"immediate_kill",
[
pytest.param(True, id="worker_failure"),
pytest.param(
False,
id="graceful_shutdown",
marks=pytest.mark.xfail(
strict=False, reason="SGLang graceful shutdown not yet implemented"
),
),
pytest.param(False, id="graceful_shutdown"),
],
),
pytest.mark.parametrize(
......@@ -241,6 +235,22 @@ def test_request_migration_sglang_aggregated(
stream: True for streaming, False for non-streaming
"""
# TODO(OPS-4446): Flaky on NATS transport — first-token delay routinely
# exceeds the 6s threshold in utils.validate_response. Other parameter
# combinations (including the TCP variant) are stable.
if (
migration_limit == 3
and migration_max_seq_len is None
and immediate_kill is True
and request_api == "chat"
and stream is True
and request.getfixturevalue("request_plane") == "nats"
):
pytest.skip(
"Flaky on NATS transport: first-token delay > 6s threshold. "
"OPS-4446"
)
# Step 1: Start the frontend
with DynamoFrontendProcess(
request,
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment