Unverified Commit 44a40a0b authored by Jacky, committed by GitHub
Browse files

test: Allow prefill cancellation tests to fail (#3300)


Signed-off-by: Jacky <18255193+kthui@users.noreply.github.com>
parent 3aa30778
......@@ -344,6 +344,11 @@ def test_request_cancellation_trtllm_decode_first_decode_cancel(
@pytest.mark.gpu_1
@pytest.mark.e2e
@pytest.mark.model(FAULT_TOLERANCE_MODEL_NAME)
@pytest.mark.xfail(
reason="Time-sensitive test: Relies on request timeout (0.1s) to cancel during remote prefill phase. "
"May fail if prefill completes too quickly or timeout triggers at a different phase.",
strict=False,
)
def test_request_cancellation_trtllm_decode_first_remote_prefill_cancel(
request, runtime_services, predownload_models
):
......@@ -403,6 +408,11 @@ def test_request_cancellation_trtllm_decode_first_remote_prefill_cancel(
@pytest.mark.gpu_1
@pytest.mark.e2e
@pytest.mark.model(FAULT_TOLERANCE_MODEL_NAME)
@pytest.mark.xfail(
reason="Time-sensitive test: Relies on request timeout (0.1s) to cancel during prefill phase. "
"May fail if prefill completes too quickly or timeout triggers at a different phase.",
strict=False,
)
def test_request_cancellation_trtllm_prefill_first_prefill_cancel(
request, runtime_services, predownload_models
):
......
......@@ -316,6 +316,11 @@ def test_request_cancellation_vllm_decode(
@pytest.mark.gpu_1
@pytest.mark.e2e
@pytest.mark.model(FAULT_TOLERANCE_MODEL_NAME)
@pytest.mark.xfail(
reason="Time-sensitive test: Relies on request timeout (0.1s) to cancel during prefill phase. "
"May fail if prefill completes too quickly or timeout triggers at a different phase.",
strict=False,
)
def test_request_cancellation_vllm_prefill(
request, runtime_services, predownload_models
):
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment