test: Remove completions endpoint from vllm tests. (#1575)

Signed-off-by: Pavithra Vijayakrishnan <160681768+pvijayakrish@users.noreply.github.com>

test: Remove completions endpoint from vllm tests. (#1575)
Signed-off-by: Pavithra Vijayakrishnan <160681768+pvijayakrish@users.noreply.github.com>
e7cfe0f6 · Pavithra Vijayakrishnan · GitHub · 2528ea2c · e7cfe0f6
Unverified commit e7cfe0f6, authored Jun 18, 2025 by Pavithra Vijayakrishnan; committed by GitHub on Jun 18, 2025.
Hide whitespace changes
Inline Side-by-side

Showing 1 changed file with 5 additions and 10 deletions

tests/serve/test_dynamo_serve.py (+5 -10)

No files found.
--- a/tests/serve/test_dynamo_serve.py
+++ b/tests/serve/test_dynamo_serve.py
@@ -87,10 +87,9 @@ deployment_graphs = {
            module="graphs.agg:Frontend",
            config="configs/agg.yaml",
            directory="/workspace/examples/llm",
-            endpoints=["v1/chat/completions", "v1/completions"],
+            endpoints=["v1/chat/completions"],
            response_handlers=[
                chat_completions_response_handler,
-                completions_response_handler,
            ],
            marks=[pytest.mark.gpu_1, pytest.mark.vllm],
        ),
@@ -115,10 +114,9 @@ deployment_graphs = {
            module="graphs.disagg:Frontend",
            config="configs/disagg.yaml",
            directory="/workspace/examples/llm",
-            endpoints=["v1/chat/completions", "v1/completions"],
+            endpoints=["v1/chat/completions"],
            response_handlers=[
                chat_completions_response_handler,
-                completions_response_handler,
            ],
            marks=[pytest.mark.gpu_2, pytest.mark.vllm],
        ),
@@ -129,10 +127,9 @@ deployment_graphs = {
            module="graphs.agg_router:Frontend",
            config="configs/agg_router.yaml",
            directory="/workspace/examples/llm",
-            endpoints=["v1/chat/completions", "v1/completions"],
+            endpoints=["v1/chat/completions"],
            response_handlers=[
                chat_completions_response_handler,
-                completions_response_handler,
            ],
            marks=[pytest.mark.gpu_1, pytest.mark.vllm],
            # FIXME: This is a hack to allow deployments to start before sending any requests.
@@ -147,10 +144,9 @@ deployment_graphs = {
            module="graphs.disagg_router:Frontend",
            config="configs/disagg_router.yaml",
            directory="/workspace/examples/llm",
-            endpoints=["v1/chat/completions", "v1/completions"],
+            endpoints=["v1/chat/completions"],
            response_handlers=[
                chat_completions_response_handler,
-                completions_response_handler,
            ],
            marks=[pytest.mark.gpu_2, pytest.mark.vllm],
            # FIXME: This is a hack to allow deployments to start before sending any requests.
@@ -165,10 +161,9 @@ deployment_graphs = {
            module="graphs.agg:Frontend",
            config="configs/agg.yaml",
            directory="/workspace/examples/multimodal",
-            endpoints=["v1/chat/completions", "v1/completions"],
+            endpoints=["v1/chat/completions"],
            response_handlers=[
                chat_completions_response_handler,
-                completions_response_handler,
            ],
            marks=[pytest.mark.gpu_2, pytest.mark.vllm],
        ),