Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
cc7f22a8
Commit
cc7f22a8
authored
Jun 11, 2025
by
zhuwenwen
Browse files
Merge tag 'v0.9.1' into v0.9.1-ori
parents
b9ea0c09
b6553be1
Changes
1000
Show whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
21 additions
and
1 deletion
+21
-1
tests/models/multimodal/processing/test_internvl.py
tests/models/multimodal/processing/test_internvl.py
+1
-0
tests/models/multimodal/processing/test_llama4.py
tests/models/multimodal/processing/test_llama4.py
+1
-0
tests/models/multimodal/processing/test_llava_next.py
tests/models/multimodal/processing/test_llava_next.py
+1
-0
tests/models/multimodal/processing/test_llava_onevision.py
tests/models/multimodal/processing/test_llava_onevision.py
+1
-0
tests/models/multimodal/processing/test_minimax_vl_01.py
tests/models/multimodal/processing/test_minimax_vl_01.py
+1
-0
tests/models/multimodal/processing/test_mllama.py
tests/models/multimodal/processing/test_mllama.py
+1
-0
tests/models/multimodal/processing/test_phi3v.py
tests/models/multimodal/processing/test_phi3v.py
+1
-0
tests/models/multimodal/processing/test_phi4mm.py
tests/models/multimodal/processing/test_phi4mm.py
+1
-0
tests/models/multimodal/processing/test_qwen2_vl.py
tests/models/multimodal/processing/test_qwen2_vl.py
+1
-0
tests/models/multimodal/processing/test_smolvlm.py
tests/models/multimodal/processing/test_smolvlm.py
+1
-0
tests/models/quantization/test_aqlm.py
tests/models/quantization/test_aqlm.py
+1
-0
tests/models/quantization/test_awq.py
tests/models/quantization/test_awq.py
+1
-0
tests/models/quantization/test_bitblas.py
tests/models/quantization/test_bitblas.py
+1
-0
tests/models/quantization/test_fp8.py
tests/models/quantization/test_fp8.py
+1
-0
tests/models/quantization/test_gguf.py
tests/models/quantization/test_gguf.py
+2
-1
tests/models/quantization/test_gptq_bitblas.py
tests/models/quantization/test_gptq_bitblas.py
+1
-0
tests/models/quantization/test_gptq_marlin.py
tests/models/quantization/test_gptq_marlin.py
+1
-0
tests/models/quantization/test_gptq_marlin_24.py
tests/models/quantization/test_gptq_marlin_24.py
+1
-0
tests/models/quantization/test_modelopt.py
tests/models/quantization/test_modelopt.py
+1
-0
tests/models/quantization/test_mxfp4.py
tests/models/quantization/test_mxfp4.py
+1
-0
No files found.
Too many changes to show.
To preserve performance only
1000 of 1000+
files are displayed.
Plain diff
Email patch
tests/models/multimodal/processing/test_internvl.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
"""Tests for InternVL's multimodal preprocessing kwargs."""
from
collections.abc
import
Mapping
from
typing
import
Optional
...
...
tests/models/multimodal/processing/test_llama4.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
"""Tests for Llama4's multimodal preprocessing kwargs."""
import
pytest
...
...
tests/models/multimodal/processing/test_llava_next.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
import
itertools
from
functools
import
partial
...
...
tests/models/multimodal/processing/test_llava_onevision.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
import
itertools
from
functools
import
partial
...
...
tests/models/multimodal/processing/test_minimax_vl_01.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
import
pytest
from
PIL
import
Image
...
...
tests/models/multimodal/processing/test_mllama.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
"""Tests for mllama's multimodal preprocessing and profiling."""
import
pytest
from
transformers
import
MllamaConfig
...
...
tests/models/multimodal/processing/test_phi3v.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
"""Tests for phi3v's multimodal preprocessing kwargs."""
import
pytest
...
...
tests/models/multimodal/processing/test_phi4mm.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
"""Tests for phi4mm's multimodal preprocessing kwargs."""
import
pytest
...
...
tests/models/multimodal/processing/test_qwen2_vl.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
import
pytest
...
...
tests/models/multimodal/processing/test_smolvlm.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
"""Tests for smolvlm's multimodal preprocessing kwargs."""
import
pytest
from
transformers
import
SmolVLMConfig
...
...
tests/models/quantization/test_aqlm.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
import
pytest
from
tests.quantization.utils
import
is_quant_method_supported
...
...
tests/models/quantization/test_awq.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
from
typing
import
Optional
...
...
tests/models/quantization/test_bitblas.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
"""Compare the outputs of a GPTQ model to a bitblas model.
Note: GPTQ and bitblas do not have bitwise correctness.
...
...
tests/models/quantization/test_fp8.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
# flake8: noqa
"""Tests fp8 models against ground truth generation
...
...
tests/models/quantization/test_gguf.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
"""
Tests gguf models against unquantized models generations
Note: To pass the test, quantization higher than Q4 should be used
...
...
@@ -37,7 +38,7 @@ class GGUFTestConfig(NamedTuple):
LLAMA_CONFIG
=
GGUFTestConfig
(
original_model
=
"meta-llama/Llama-3.2-1B-Instruct"
,
gguf_repo
=
"bartowski/Llama-3.2-1B-Instruct-GGUF"
,
gguf_filename
=
"Llama-3.2-1B-Instruct-
IQ4_XS
.gguf"
,
gguf_filename
=
"Llama-3.2-1B-Instruct-
Q6_K
.gguf"
,
)
QWEN2_CONFIG
=
GGUFTestConfig
(
...
...
tests/models/quantization/test_gptq_bitblas.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
"""Compare the outputs of a GPTQ model to a bitblas model.
Note: GPTQ and bitblas do not have bitwise correctness.
...
...
tests/models/quantization/test_gptq_marlin.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
"""Compares the outputs of gptq vs gptq_marlin.
Note: GPTQ and Marlin do not have bitwise correctness.
...
...
tests/models/quantization/test_gptq_marlin_24.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
"""Compare the outputs of a GPTQ model to a Marlin_24 model.
Note: GPTQ and Marlin_24 do not have bitwise correctness.
...
...
tests/models/quantization/test_modelopt.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
# flake8: noqa
"""Tests Model Optimizer fp8 models against ground truth generation
...
...
tests/models/quantization/test_mxfp4.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
# flake8: noqa
"""Tests Quark mxfp4 models against ground truth generation
"""
...
...
Prev
1
…
24
25
26
27
28
29
30
31
32
…
50
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment