Commit e7cfe0f6 (unverified), authored by Pavithra Vijayakrishnan, committed by GitHub
Browse files

test: Remove completions endpoint from vllm tests. (#1575)


Signed-off-by: Pavithra Vijayakrishnan <160681768+pvijayakrish@users.noreply.github.com>
parent 2528ea2c
...@@ -87,10 +87,9 @@ deployment_graphs = { ...@@ -87,10 +87,9 @@ deployment_graphs = {
module="graphs.agg:Frontend", module="graphs.agg:Frontend",
config="configs/agg.yaml", config="configs/agg.yaml",
directory="/workspace/examples/llm", directory="/workspace/examples/llm",
endpoints=["v1/chat/completions", "v1/completions"], endpoints=["v1/chat/completions"],
response_handlers=[ response_handlers=[
chat_completions_response_handler, chat_completions_response_handler,
completions_response_handler,
], ],
marks=[pytest.mark.gpu_1, pytest.mark.vllm], marks=[pytest.mark.gpu_1, pytest.mark.vllm],
), ),
...@@ -115,10 +114,9 @@ deployment_graphs = { ...@@ -115,10 +114,9 @@ deployment_graphs = {
module="graphs.disagg:Frontend", module="graphs.disagg:Frontend",
config="configs/disagg.yaml", config="configs/disagg.yaml",
directory="/workspace/examples/llm", directory="/workspace/examples/llm",
endpoints=["v1/chat/completions", "v1/completions"], endpoints=["v1/chat/completions"],
response_handlers=[ response_handlers=[
chat_completions_response_handler, chat_completions_response_handler,
completions_response_handler,
], ],
marks=[pytest.mark.gpu_2, pytest.mark.vllm], marks=[pytest.mark.gpu_2, pytest.mark.vllm],
), ),
...@@ -129,10 +127,9 @@ deployment_graphs = { ...@@ -129,10 +127,9 @@ deployment_graphs = {
module="graphs.agg_router:Frontend", module="graphs.agg_router:Frontend",
config="configs/agg_router.yaml", config="configs/agg_router.yaml",
directory="/workspace/examples/llm", directory="/workspace/examples/llm",
endpoints=["v1/chat/completions", "v1/completions"], endpoints=["v1/chat/completions"],
response_handlers=[ response_handlers=[
chat_completions_response_handler, chat_completions_response_handler,
completions_response_handler,
], ],
marks=[pytest.mark.gpu_1, pytest.mark.vllm], marks=[pytest.mark.gpu_1, pytest.mark.vllm],
# FIXME: This is a hack to allow deployments to start before sending any requests. # FIXME: This is a hack to allow deployments to start before sending any requests.
...@@ -147,10 +144,9 @@ deployment_graphs = { ...@@ -147,10 +144,9 @@ deployment_graphs = {
module="graphs.disagg_router:Frontend", module="graphs.disagg_router:Frontend",
config="configs/disagg_router.yaml", config="configs/disagg_router.yaml",
directory="/workspace/examples/llm", directory="/workspace/examples/llm",
endpoints=["v1/chat/completions", "v1/completions"], endpoints=["v1/chat/completions"],
response_handlers=[ response_handlers=[
chat_completions_response_handler, chat_completions_response_handler,
completions_response_handler,
], ],
marks=[pytest.mark.gpu_2, pytest.mark.vllm], marks=[pytest.mark.gpu_2, pytest.mark.vllm],
# FIXME: This is a hack to allow deployments to start before sending any requests. # FIXME: This is a hack to allow deployments to start before sending any requests.
...@@ -165,10 +161,9 @@ deployment_graphs = { ...@@ -165,10 +161,9 @@ deployment_graphs = {
module="graphs.agg:Frontend", module="graphs.agg:Frontend",
config="configs/agg.yaml", config="configs/agg.yaml",
directory="/workspace/examples/multimodal", directory="/workspace/examples/multimodal",
endpoints=["v1/chat/completions", "v1/completions"], endpoints=["v1/chat/completions"],
response_handlers=[ response_handlers=[
chat_completions_response_handler, chat_completions_response_handler,
completions_response_handler,
], ],
marks=[pytest.mark.gpu_2, pytest.mark.vllm], marks=[pytest.mark.gpu_2, pytest.mark.vllm],
), ),
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment