Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
fd1ce98c
Unverified
Commit
fd1ce98c
authored
Sep 11, 2025
by
wang.yuqi
Committed by
GitHub
Sep 11, 2025
Browse files
[CI] Split mteb test from Language Models Test (#24634)
Signed-off-by: wang.yuqi <noooop@126.com>
parent
d11ec124
Changes
16
Show whitespace changes
Inline
Side-by-side
Showing 16 changed files with 56 additions and 40 deletions
+56
-40
.buildkite/test-pipeline.yaml
.buildkite/test-pipeline.yaml
+10
-0
tests/entrypoints/pooling/correctness/test_mteb_embed.py
tests/entrypoints/pooling/correctness/test_mteb_embed.py
+3
-4
tests/entrypoints/pooling/correctness/test_mteb_score.py
tests/entrypoints/pooling/correctness/test_mteb_score.py
+3
-9
tests/models/language/pooling_mteb_test/__init__.py
tests/models/language/pooling_mteb_test/__init__.py
+0
-0
tests/models/language/pooling_mteb_test/mteb_utils.py
tests/models/language/pooling_mteb_test/mteb_utils.py
+0
-0
tests/models/language/pooling_mteb_test/test_baai.py
tests/models/language/pooling_mteb_test/test_baai.py
+6
-4
tests/models/language/pooling_mteb_test/test_bge_reranker_v2_gemma.py
.../language/pooling_mteb_test/test_bge_reranker_v2_gemma.py
+3
-3
tests/models/language/pooling_mteb_test/test_cross_encoder.py
...s/models/language/pooling_mteb_test/test_cross_encoder.py
+3
-2
tests/models/language/pooling_mteb_test/test_gte.py
tests/models/language/pooling_mteb_test/test_gte.py
+6
-4
tests/models/language/pooling_mteb_test/test_intfloat.py
tests/models/language/pooling_mteb_test/test_intfloat.py
+4
-2
tests/models/language/pooling_mteb_test/test_jina.py
tests/models/language/pooling_mteb_test/test_jina.py
+5
-4
tests/models/language/pooling_mteb_test/test_mxbai_rerank.py
tests/models/language/pooling_mteb_test/test_mxbai_rerank.py
+1
-1
tests/models/language/pooling_mteb_test/test_nomic.py
tests/models/language/pooling_mteb_test/test_nomic.py
+4
-2
tests/models/language/pooling_mteb_test/test_qwen3_reranker.py
.../models/language/pooling_mteb_test/test_qwen3_reranker.py
+1
-1
tests/models/language/pooling_mteb_test/test_snowflake_arctic_embed.py
...language/pooling_mteb_test/test_snowflake_arctic_embed.py
+4
-2
tests/models/language/pooling_mteb_test/test_st_projector.py
tests/models/language/pooling_mteb_test/test_st_projector.py
+3
-2
No files found.
.buildkite/test-pipeline.yaml
View file @
fd1ce98c
...
...
@@ -642,6 +642,16 @@ steps:
commands
:
-
pytest -v -s models/language/pooling -m 'not core_model'
-
label
:
Language Models Test (MTEB)
timeout_in_minutes
:
110
mirror_hardwares
:
[
amdexperimental
]
optional
:
true
source_file_dependencies
:
-
vllm/
-
tests/models/language/pooling_mteb_test
commands
:
-
pytest -v -s models/language/pooling_mteb_test
-
label
:
Multi-Modal Processor Test
# 44min
timeout_in_minutes
:
60
source_file_dependencies
:
...
...
tests/entrypoints/pooling/correctness/test_mteb_embed.py
View file @
fd1ce98c
...
...
@@ -4,9 +4,8 @@ import os
import
pytest
from
tests.models.language.pooling.mteb_utils
import
(
MTEB_EMBED_TASKS
,
MTEB_EMBED_TOL
,
OpenAIClientMtebEncoder
,
from
tests.models.language.pooling_mteb_test.mteb_utils
import
(
MTEB_EMBED_TASKS
,
MTEB_EMBED_TOL
,
OpenAIClientMtebEncoder
,
run_mteb_embed_task
)
from
tests.utils
import
RemoteOpenAIServer
...
...
tests/entrypoints/pooling/correctness/test_mteb_score.py
View file @
fd1ce98c
...
...
@@ -4,15 +4,9 @@ import os
import
pytest
# yapf conflicts with isort for this block
# yapf: disable
from
tests.models.language.pooling.mteb_utils
import
(
MTEB_RERANK_LANGS
,
MTEB_RERANK_TASKS
,
MTEB_RERANK_TOL
,
RerankClientMtebEncoder
,
ScoreClientMtebEncoder
,
run_mteb_rerank
)
# yapf: enable
from
tests.models.language.pooling_mteb_test.mteb_utils
import
(
MTEB_RERANK_LANGS
,
MTEB_RERANK_TASKS
,
MTEB_RERANK_TOL
,
RerankClientMtebEncoder
,
ScoreClientMtebEncoder
,
run_mteb_rerank
)
from
tests.utils
import
RemoteOpenAIServer
os
.
environ
[
"VLLM_LOGGING_LEVEL"
]
=
"WARNING"
...
...
tests/models/language/pooling_mteb_test/__init__.py
0 → 100644
View file @
fd1ce98c
tests/models/language/pooling/mteb_utils.py → tests/models/language/pooling_mteb_test/mteb_utils.py
View file @
fd1ce98c
File moved
tests/models/language/pooling/test_baai.py → tests/models/language/pooling_mteb_test/test_baai.py
View file @
fd1ce98c
...
...
@@ -2,10 +2,12 @@
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
import
pytest
from
...utils
import
(
CLSPoolingEmbedModelInfo
,
CLSPoolingRerankModelInfo
,
EmbedModelInfo
,
LASTPoolingEmbedModelInfo
,
RerankModelInfo
)
from
.embed_utils
import
correctness_test_embed_models
from
tests.models.language.pooling.embed_utils
import
(
correctness_test_embed_models
)
from
tests.models.utils
import
(
CLSPoolingEmbedModelInfo
,
CLSPoolingRerankModelInfo
,
EmbedModelInfo
,
LASTPoolingEmbedModelInfo
,
RerankModelInfo
)
from
.mteb_utils
import
mteb_test_embed_models
,
mteb_test_rerank_models
MODELS
=
[
...
...
tests/models/language/pooling/test_bge_reranker_v2_gemma.py → tests/models/language/pooling_mteb_test/test_bge_reranker_v2_gemma.py
View file @
fd1ce98c
...
...
@@ -7,9 +7,9 @@ import pytest
import
torch
from
tests.conftest
import
HfRunner
from
...utils
import
LASTPoolingRerankModelInfo
,
RerankModelInfo
from
.mteb_utils
import
VllmMtebEncoder
,
mteb_test_rerank_models
from
tests.models.language.pooling_mteb_test.mteb_utils
import
(
VllmMtebEncoder
,
mteb_test_rerank_models
)
from
tests.models.utils
import
LASTPoolingRerankModelInfo
,
RerankModelInfo
RERANK_MODELS
=
[
LASTPoolingRerankModelInfo
(
"BAAI/bge-reranker-v2-gemma"
,
...
...
tests/models/language/pooling/test_cross_encoder.py → tests/models/language/pooling_mteb_test/test_cross_encoder.py
View file @
fd1ce98c
...
...
@@ -2,8 +2,9 @@
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
import
pytest
from
...utils
import
(
CLSPoolingRerankModelInfo
,
LASTPoolingRerankModelInfo
,
RerankModelInfo
)
from
tests.models.utils
import
(
CLSPoolingRerankModelInfo
,
LASTPoolingRerankModelInfo
,
RerankModelInfo
)
from
.mteb_utils
import
mteb_test_rerank_models
RERANK_MODELS
=
[
...
...
tests/models/language/pooling/test_gte.py → tests/models/language/pooling_mteb_test/test_gte.py
View file @
fd1ce98c
...
...
@@ -3,10 +3,12 @@
import
pytest
from
...utils
import
(
CLSPoolingEmbedModelInfo
,
CLSPoolingRerankModelInfo
,
EmbedModelInfo
,
LASTPoolingEmbedModelInfo
,
RerankModelInfo
)
from
.embed_utils
import
correctness_test_embed_models
from
tests.models.language.pooling.embed_utils
import
(
correctness_test_embed_models
)
from
tests.models.utils
import
(
CLSPoolingEmbedModelInfo
,
CLSPoolingRerankModelInfo
,
EmbedModelInfo
,
LASTPoolingEmbedModelInfo
,
RerankModelInfo
)
from
.mteb_utils
import
mteb_test_embed_models
,
mteb_test_rerank_models
MODELS
=
[
...
...
tests/models/language/pooling/test_intfloat.py → tests/models/language/pooling_mteb_test/test_intfloat.py
View file @
fd1ce98c
...
...
@@ -2,8 +2,10 @@
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
import
pytest
from
...utils
import
CLSPoolingEmbedModelInfo
,
EmbedModelInfo
from
.embed_utils
import
correctness_test_embed_models
from
tests.models.language.pooling.embed_utils
import
(
correctness_test_embed_models
)
from
tests.models.utils
import
CLSPoolingEmbedModelInfo
,
EmbedModelInfo
from
.mteb_utils
import
mteb_test_embed_models
MODELS
=
[
...
...
tests/models/language/pooling/test_jina.py → tests/models/language/pooling_mteb_test/test_jina.py
View file @
fd1ce98c
...
...
@@ -4,12 +4,13 @@ from functools import partial
import
pytest
from
tests.models.language.pooling.embed_utils
import
(
check_embeddings_close
,
correctness_test_embed_models
,
matryoshka_fy
)
from
tests.models.utils
import
(
CLSPoolingEmbedModelInfo
,
CLSPoolingRerankModelInfo
,
EmbedModelInfo
,
RerankModelInfo
)
from
vllm
import
PoolingParams
from
...utils
import
(
CLSPoolingEmbedModelInfo
,
CLSPoolingRerankModelInfo
,
EmbedModelInfo
,
RerankModelInfo
)
from
.embed_utils
import
(
check_embeddings_close
,
correctness_test_embed_models
,
matryoshka_fy
)
from
.mteb_utils
import
mteb_test_embed_models
,
mteb_test_rerank_models
EMBEDDING_MODELS
=
[
...
...
tests/models/language/pooling/test_mxbai_rerank.py → tests/models/language/pooling_mteb_test/test_mxbai_rerank.py
View file @
fd1ce98c
...
...
@@ -6,8 +6,8 @@ import pytest
import
torch
from
tests.conftest
import
HfRunner
from
tests.models.utils
import
LASTPoolingRerankModelInfo
,
RerankModelInfo
from
...utils
import
LASTPoolingRerankModelInfo
,
RerankModelInfo
from
.mteb_utils
import
mteb_test_rerank_models
mxbai_rerank_hf_overrides
=
{
...
...
tests/models/language/pooling/test_nomic.py → tests/models/language/pooling_mteb_test/test_nomic.py
View file @
fd1ce98c
...
...
@@ -3,8 +3,10 @@
import
pytest
from
...utils
import
CLSPoolingEmbedModelInfo
,
EmbedModelInfo
from
.embed_utils
import
correctness_test_embed_models
from
tests.models.language.pooling.embed_utils
import
(
correctness_test_embed_models
)
from
tests.models.utils
import
CLSPoolingEmbedModelInfo
,
EmbedModelInfo
from
.mteb_utils
import
mteb_test_embed_models
MODELS
=
[
...
...
tests/models/language/pooling/test_qwen3_reranker.py → tests/models/language/pooling_mteb_test/test_qwen3_reranker.py
View file @
fd1ce98c
...
...
@@ -6,9 +6,9 @@ import pytest
import
torch
from
tests.conftest
import
HfRunner
from
tests.models.utils
import
LASTPoolingRerankModelInfo
,
RerankModelInfo
from
tests.utils
import
multi_gpu_test
from
...utils
import
LASTPoolingRerankModelInfo
,
RerankModelInfo
from
.mteb_utils
import
mteb_test_rerank_models
qwen3_reranker_hf_overrides
=
{
...
...
tests/models/language/pooling/test_snowflake_arctic_embed.py → tests/models/language/pooling_mteb_test/test_snowflake_arctic_embed.py
View file @
fd1ce98c
...
...
@@ -3,8 +3,10 @@
import
pytest
from
...utils
import
CLSPoolingEmbedModelInfo
,
EmbedModelInfo
from
.embed_utils
import
correctness_test_embed_models
from
tests.models.language.pooling.embed_utils
import
(
correctness_test_embed_models
)
from
tests.models.utils
import
CLSPoolingEmbedModelInfo
,
EmbedModelInfo
from
.mteb_utils
import
mteb_test_embed_models
MODELS
=
[
...
...
tests/models/language/pooling/test_st_projector.py → tests/models/language/pooling_mteb_test/test_st_projector.py
View file @
fd1ce98c
...
...
@@ -2,8 +2,9 @@
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
import
pytest
from
...utils
import
(
CLSPoolingEmbedModelInfo
,
EmbedModelInfo
,
from
tests.models.utils
import
(
CLSPoolingEmbedModelInfo
,
EmbedModelInfo
,
LASTPoolingEmbedModelInfo
)
from
.mteb_utils
import
mteb_test_embed_models
# ST models with projector (Dense) layers
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please register or sign in to comment