Unverified commit 44cfbb68, authored by Yan Ru Pei, committed by GitHub
Browse files

test(router): add single-worker mocker soak test (#8234)


Signed-off-by: PeaBrane <yanrpei@gmail.com>
parent 2ac22df7
......@@ -120,6 +120,17 @@ TEST_PAYLOAD: Dict[str, Any] = {
"stream": True,
"max_tokens": 10,
}
# Request body used by the soak test. Compared with TEST_PAYLOAD it is
# non-streaming and asks for a single token, so each request is as small as
# possible and the run is dominated by request count rather than generation.
SOAK_TEST_PAYLOAD: Dict[str, Any] = {
    "model": MODEL_NAME,
    "messages": [
        {"role": "user", "content": "one two three four five six seven eight nine ten"},
    ],
    "stream": False,
    "max_tokens": 1,
}
def _build_mocker_command(
......@@ -824,6 +835,49 @@ def test_mocker_router(
)
@pytest.mark.timeout(180)
@pytest.mark.parametrize("router_mode", ["kv", "round-robin", "random"])
@pytest.mark.parametrize(
    "durable_kv_events", [False], ids=["nondurable"], indirect=True
)
@pytest.mark.parametrize("request_plane", ["nats", "tcp"], indirect=True)
def test_mocker_router_soak(
    request,
    runtime_services_dynamic_ports,
    predownload_tokenizers,
    router_mode,
    durable_kv_events,
    request_plane,
):
    """Soak a single mocker worker with 1024 minimal requests via the router.

    Starts one mocker worker, then drives ``_test_router_basic`` with
    ``SOAK_TEST_PAYLOAD`` for every combination of router mode
    (``kv``, ``round-robin``, ``random``) and request plane (``nats``,
    ``tcp``). Only the non-durable KV-events configuration is exercised.

    Args:
        request: pytest ``request`` object, forwarded to the helpers.
        runtime_services_dynamic_ports: fixture requested for its setup
            side effects; not referenced in the body.
        predownload_tokenizers: fixture requested for its setup side
            effects; not referenced in the body.
        router_mode: routing strategy under test.
        durable_kv_events: value resolved by the indirect fixture and passed
            through to the mocker arguments.
        request_plane: transport resolved by the indirect fixture.
    """
    mocker_args = {
        "speedup_ratio": 1000.0,
        "block_size": BLOCK_SIZE,
        "durable_kv_events": durable_kv_events,
    }

    # This is the single-worker soak test, so exactly one mocker is started.
    with MockerProcess(
        request,
        mocker_args=mocker_args,
        num_mockers=1,
        request_plane=request_plane,
    ) as mockers:
        frontend_port = get_unique_ports(
            request, num_ports=1, request_plane=request_plane
        )[0]

        _test_router_basic(
            engine_workers=mockers,
            block_size=BLOCK_SIZE,
            request=request,
            frontend_port=frontend_port,
            test_payload=SOAK_TEST_PAYLOAD,
            num_requests=1024,
            request_plane=request_plane,
            router_mode=router_mode,
            # Derived from the process group rather than hard-coded so it
            # always matches the number of workers actually started.
            min_initial_workers=mockers.num_workers,
        )
@pytest.mark.parametrize("store_backend", ["etcd", "file"])
@pytest.mark.parametrize(
"durable_kv_events", [False], ids=["nondurable"], indirect=True
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment