Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
045b396d
Unverified
Commit
045b396d
authored
Oct 12, 2025
by
Isotr0py
Committed by
GitHub
Oct 12, 2025
Browse files
[Bugfix][CI/Build] Fix failing Mteb CI (#26638)
Signed-off-by:
Isotr0py
<
mozf@mail2.sysu.edu.cn
>
parent
76852017
Changes
5
Hide whitespace changes
Inline
Side-by-side
Showing
5 changed files
with
13 additions
and
2 deletions
+13
-2
tests/models/language/pooling_mteb_test/mteb_utils.py
tests/models/language/pooling_mteb_test/mteb_utils.py
+1
-1
tests/models/language/pooling_mteb_test/test_jina.py
tests/models/language/pooling_mteb_test/test_jina.py
+5
-0
tests/models/language/pooling_mteb_test/test_st_projector.py
tests/models/language/pooling_mteb_test/test_st_projector.py
+1
-0
tests/models/utils.py
tests/models/utils.py
+1
-0
vllm/model_executor/layers/layernorm.py
vllm/model_executor/layers/layernorm.py
+5
-1
No files found.
tests/models/language/pooling_mteb_test/mteb_utils.py
View file @
045b396d
...
...
@@ -191,7 +191,7 @@ def mteb_test_embed_models(
with
vllm_runner
(
model_info
.
name
,
runner
=
"pooling"
,
max_model_len
=
None
,
max_model_len
=
model_info
.
max_model_len
,
**
vllm_extra_kwargs
,
)
as
vllm_model
:
model_config
=
vllm_model
.
llm
.
llm_engine
.
model_config
...
...
tests/models/language/pooling_mteb_test/test_jina.py
View file @
045b396d
...
...
@@ -25,6 +25,11 @@ EMBEDDING_MODELS = [
mteb_score
=
0.824413164
,
architecture
=
"XLMRobertaModel"
,
is_matryoshka
=
True
,
# The default max length of the model is 8194, which will crash
# CUDAGraph due to odd length for Gemm. We set it to 8192 to
# avoid this issue.
max_model_len
=
8192
,
dtype
=
"float32"
,
)
]
...
...
tests/models/language/pooling_mteb_test/test_st_projector.py
View file @
045b396d
...
...
@@ -23,6 +23,7 @@ ST_PROJECTOR_MODELS = [
architecture
=
"Gemma3TextModel"
,
mteb_score
=
0.7473819294684156
,
enable_test
=
True
,
dtype
=
"float32"
,
),
]
...
...
tests/models/utils.py
View file @
045b396d
...
...
@@ -369,6 +369,7 @@ class ModelInfo:
name
:
str
architecture
:
str
=
""
dtype
:
str
=
"auto"
max_model_len
:
Optional
[
int
]
=
None
hf_dtype
:
str
=
"float32"
hf_overrides
:
Optional
[
dict
[
str
,
Any
]]
=
None
default_pooling_type
:
str
=
""
...
...
vllm/model_executor/layers/layernorm.py
View file @
045b396d
...
...
@@ -318,7 +318,11 @@ class GemmaRMSNorm(CustomOp):
"""PyTorch-native implementation equivalent to forward()."""
orig_dtype
=
x
.
dtype
if
residual
is
not
None
:
x
=
x
+
residual
.
float
()
if
orig_dtype
==
torch
.
float16
else
x
+
residual
x
=
(
x
.
float
()
+
residual
.
float
()
if
orig_dtype
==
torch
.
float16
else
x
+
residual
)
residual
=
x
x
=
x
.
float
()
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment