Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
be292b7c
Unverified
Commit
be292b7c
authored
Mar 09, 2026
by
Wentao Ye
Committed by
GitHub
Mar 09, 2026
Browse files
[Bug] Fix pooling model benchmark script (#36300)
Signed-off-by:
yewentao256
<
zhyanwentao@126.com
>
parent
77a73458
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
13 additions
and
5 deletions
+13
-5
vllm/benchmarks/lib/endpoint_request_func.py
vllm/benchmarks/lib/endpoint_request_func.py
+11
-0
vllm/benchmarks/serve.py
vllm/benchmarks/serve.py
+2
-5
No files found.
vllm/benchmarks/lib/endpoint_request_func.py
View file @
be292b7c
...
@@ -795,6 +795,17 @@ ASYNC_REQUEST_FUNCS: dict[str, RequestFunc] = {
...
@@ -795,6 +795,17 @@ ASYNC_REQUEST_FUNCS: dict[str, RequestFunc] = {
"vllm-rerank"
:
async_request_vllm_rerank
,
"vllm-rerank"
:
async_request_vllm_rerank
,
}
}
POOLING_BACKENDS
=
{
"openai-embeddings"
,
"openai-embeddings-chat"
,
"openai-embeddings-clip"
,
"openai-embeddings-vlm2vec"
,
"infinity-embeddings"
,
"infinity-embeddings-clip"
,
"vllm-pooling"
,
"vllm-rerank"
,
}
OPENAI_COMPATIBLE_BACKENDS
=
[
OPENAI_COMPATIBLE_BACKENDS
=
[
k
k
for
k
,
v
in
ASYNC_REQUEST_FUNCS
.
items
()
for
k
,
v
in
ASYNC_REQUEST_FUNCS
.
items
()
...
...
vllm/benchmarks/serve.py
View file @
be292b7c
...
@@ -45,6 +45,7 @@ from vllm.benchmarks.datasets import SampleRequest, add_dataset_parser, get_samp
...
@@ -45,6 +45,7 @@ from vllm.benchmarks.datasets import SampleRequest, add_dataset_parser, get_samp
from
vllm.benchmarks.lib.endpoint_request_func
import
(
from
vllm.benchmarks.lib.endpoint_request_func
import
(
ASYNC_REQUEST_FUNCS
,
ASYNC_REQUEST_FUNCS
,
OPENAI_COMPATIBLE_BACKENDS
,
OPENAI_COMPATIBLE_BACKENDS
,
POOLING_BACKENDS
,
RequestFuncInput
,
RequestFuncInput
,
RequestFuncOutput
,
RequestFuncOutput
,
)
)
...
@@ -1721,11 +1722,7 @@ async def main_async(args: argparse.Namespace) -> dict[str, Any]:
...
@@ -1721,11 +1722,7 @@ async def main_async(args: argparse.Namespace) -> dict[str, Any]:
goodput_config_dict
=
check_goodput_args
(
args
)
goodput_config_dict
=
check_goodput_args
(
args
)
backend
=
args
.
backend
backend
=
args
.
backend
task_type
=
(
task_type
=
TaskType
.
POOLING
if
backend
in
POOLING_BACKENDS
else
TaskType
.
GENERATION
TaskType
.
POOLING
if
"embeddings"
in
backend
or
"rerank"
in
backend
else
TaskType
.
GENERATION
)
# Collect the sampling parameters.
# Collect the sampling parameters.
if
task_type
==
TaskType
.
GENERATION
:
if
task_type
==
TaskType
.
GENERATION
:
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment