Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
c90fb03d
Unverified
Commit
c90fb03d
authored
Aug 12, 2025
by
Isotr0py
Committed by
GitHub
Aug 11, 2025
Browse files
[CI/Build] Skip Mllama HF runner tests with Transformers v4.55.0 (#22659)
Signed-off-by:
Isotr0py
<
2037008807@qq.com
>
parent
84cf78ac
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
17 additions
and
0 deletions
+17
-0
tests/models/multimodal/generation/test_mllama.py
tests/models/multimodal/generation/test_mllama.py
+17
-0
No files found.
tests/models/multimodal/generation/test_mllama.py
View file @
c90fb03d
...
@@ -6,6 +6,7 @@ from typing import Optional, overload
...
@@ -6,6 +6,7 @@ from typing import Optional, overload
import
pytest
import
pytest
import
torch
import
torch
from
transformers
import
AutoConfig
,
AutoModelForImageTextToText
,
AutoTokenizer
from
transformers
import
AutoConfig
,
AutoModelForImageTextToText
,
AutoTokenizer
from
transformers
import
__version__
as
TRANSFORMERS_VERSION
from
vllm
import
LLM
,
SamplingParams
from
vllm
import
LLM
,
SamplingParams
from
vllm.attention.backends.flash_attn
import
FlashAttentionMetadata
from
vllm.attention.backends.flash_attn
import
FlashAttentionMetadata
...
@@ -285,6 +286,10 @@ def clear_cache():
...
@@ -285,6 +286,10 @@ def clear_cache():
@
pytest
.
mark
.
parametrize
(
"max_tokens"
,
[
128
])
@
pytest
.
mark
.
parametrize
(
"max_tokens"
,
[
128
])
@
pytest
.
mark
.
parametrize
(
"num_logprobs"
,
[
5
])
@
pytest
.
mark
.
parametrize
(
"num_logprobs"
,
[
5
])
@
pytest
.
mark
.
parametrize
(
"attn_backend"
,
LIST_ENC_DEC_SUPPORTED_BACKENDS
)
@
pytest
.
mark
.
parametrize
(
"attn_backend"
,
LIST_ENC_DEC_SUPPORTED_BACKENDS
)
@
pytest
.
mark
.
skipif
(
TRANSFORMERS_VERSION
==
"4.55.0"
,
reason
=
"Transformers v4.55.0 has a regression issue on mllama, "
"see: https://github.com/huggingface/transformers/pull/40083"
)
def
test_models_single_leading_image
(
hf_runner
,
vllm_runner
,
image_assets
,
def
test_models_single_leading_image
(
hf_runner
,
vllm_runner
,
image_assets
,
model
,
sizes
,
dtype
,
max_tokens
,
model
,
sizes
,
dtype
,
max_tokens
,
num_logprobs
,
num_logprobs
,
...
@@ -313,6 +318,10 @@ def test_models_single_leading_image(hf_runner, vllm_runner, image_assets,
...
@@ -313,6 +318,10 @@ def test_models_single_leading_image(hf_runner, vllm_runner, image_assets,
@
pytest
.
mark
.
parametrize
(
"max_tokens"
,
[
128
])
@
pytest
.
mark
.
parametrize
(
"max_tokens"
,
[
128
])
@
pytest
.
mark
.
parametrize
(
"num_logprobs"
,
[
5
])
@
pytest
.
mark
.
parametrize
(
"num_logprobs"
,
[
5
])
@
pytest
.
mark
.
parametrize
(
"attn_backend"
,
LIST_ENC_DEC_SUPPORTED_BACKENDS
)
@
pytest
.
mark
.
parametrize
(
"attn_backend"
,
LIST_ENC_DEC_SUPPORTED_BACKENDS
)
@
pytest
.
mark
.
skipif
(
TRANSFORMERS_VERSION
==
"4.55.0"
,
reason
=
"Transformers v4.55.0 has a regression issue on mllama, "
"see: https://github.com/huggingface/transformers/pull/40083"
)
def
test_models_multi_leading_images
(
hf_runner
,
vllm_runner
,
image_assets
,
def
test_models_multi_leading_images
(
hf_runner
,
vllm_runner
,
image_assets
,
model
,
dtype
,
max_tokens
,
num_logprobs
,
model
,
dtype
,
max_tokens
,
num_logprobs
,
attn_backend
:
_Backend
)
->
None
:
attn_backend
:
_Backend
)
->
None
:
...
@@ -362,6 +371,10 @@ def test_models_multi_leading_images(hf_runner, vllm_runner, image_assets,
...
@@ -362,6 +371,10 @@ def test_models_multi_leading_images(hf_runner, vllm_runner, image_assets,
@
pytest
.
mark
.
parametrize
(
"max_tokens"
,
[
128
])
@
pytest
.
mark
.
parametrize
(
"max_tokens"
,
[
128
])
@
pytest
.
mark
.
parametrize
(
"num_logprobs"
,
[
5
])
@
pytest
.
mark
.
parametrize
(
"num_logprobs"
,
[
5
])
@
pytest
.
mark
.
parametrize
(
"attn_backend"
,
LIST_ENC_DEC_SUPPORTED_BACKENDS
)
@
pytest
.
mark
.
parametrize
(
"attn_backend"
,
LIST_ENC_DEC_SUPPORTED_BACKENDS
)
@
pytest
.
mark
.
skipif
(
TRANSFORMERS_VERSION
==
"4.55.0"
,
reason
=
"Transformers v4.55.0 has a regression issue on mllama, "
"see: https://github.com/huggingface/transformers/pull/40083"
)
def
test_models_interleaved_images
(
hf_runner
,
vllm_runner
,
image_assets
,
model
,
def
test_models_interleaved_images
(
hf_runner
,
vllm_runner
,
image_assets
,
model
,
dtype
,
max_tokens
,
num_logprobs
,
dtype
,
max_tokens
,
num_logprobs
,
attn_backend
:
_Backend
)
->
None
:
attn_backend
:
_Backend
)
->
None
:
...
@@ -402,6 +415,10 @@ def test_models_interleaved_images(hf_runner, vllm_runner, image_assets, model,
...
@@ -402,6 +415,10 @@ def test_models_interleaved_images(hf_runner, vllm_runner, image_assets, model,
@
pytest
.
mark
.
parametrize
(
"dtype"
,
[
"bfloat16"
])
@
pytest
.
mark
.
parametrize
(
"dtype"
,
[
"bfloat16"
])
@
pytest
.
mark
.
parametrize
(
"max_tokens"
,
[
64
])
@
pytest
.
mark
.
parametrize
(
"max_tokens"
,
[
64
])
@
pytest
.
mark
.
parametrize
(
"num_logprobs"
,
[
5
])
@
pytest
.
mark
.
parametrize
(
"num_logprobs"
,
[
5
])
@
pytest
.
mark
.
skipif
(
TRANSFORMERS_VERSION
==
"4.55.0"
,
reason
=
"Transformers v4.55.0 has a regression issue on mllama, "
"see: https://github.com/huggingface/transformers/pull/40083"
)
def
test_models_distributed
(
def
test_models_distributed
(
hf_runner
,
hf_runner
,
vllm_runner
,
vllm_runner
,
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment