Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
cc7f22a8
Commit
cc7f22a8
authored
Jun 11, 2025
by
zhuwenwen
Browse files
Merge tag 'v0.9.1' into v0.9.1-ori
parents
b9ea0c09
b6553be1
Changes
1000
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
21 additions
and
1 deletion
+21
-1
tests/models/multimodal/processing/test_internvl.py
tests/models/multimodal/processing/test_internvl.py
+1
-0
tests/models/multimodal/processing/test_llama4.py
tests/models/multimodal/processing/test_llama4.py
+1
-0
tests/models/multimodal/processing/test_llava_next.py
tests/models/multimodal/processing/test_llava_next.py
+1
-0
tests/models/multimodal/processing/test_llava_onevision.py
tests/models/multimodal/processing/test_llava_onevision.py
+1
-0
tests/models/multimodal/processing/test_minimax_vl_01.py
tests/models/multimodal/processing/test_minimax_vl_01.py
+1
-0
tests/models/multimodal/processing/test_mllama.py
tests/models/multimodal/processing/test_mllama.py
+1
-0
tests/models/multimodal/processing/test_phi3v.py
tests/models/multimodal/processing/test_phi3v.py
+1
-0
tests/models/multimodal/processing/test_phi4mm.py
tests/models/multimodal/processing/test_phi4mm.py
+1
-0
tests/models/multimodal/processing/test_qwen2_vl.py
tests/models/multimodal/processing/test_qwen2_vl.py
+1
-0
tests/models/multimodal/processing/test_smolvlm.py
tests/models/multimodal/processing/test_smolvlm.py
+1
-0
tests/models/quantization/test_aqlm.py
tests/models/quantization/test_aqlm.py
+1
-0
tests/models/quantization/test_awq.py
tests/models/quantization/test_awq.py
+1
-0
tests/models/quantization/test_bitblas.py
tests/models/quantization/test_bitblas.py
+1
-0
tests/models/quantization/test_fp8.py
tests/models/quantization/test_fp8.py
+1
-0
tests/models/quantization/test_gguf.py
tests/models/quantization/test_gguf.py
+2
-1
tests/models/quantization/test_gptq_bitblas.py
tests/models/quantization/test_gptq_bitblas.py
+1
-0
tests/models/quantization/test_gptq_marlin.py
tests/models/quantization/test_gptq_marlin.py
+1
-0
tests/models/quantization/test_gptq_marlin_24.py
tests/models/quantization/test_gptq_marlin_24.py
+1
-0
tests/models/quantization/test_modelopt.py
tests/models/quantization/test_modelopt.py
+1
-0
tests/models/quantization/test_mxfp4.py
tests/models/quantization/test_mxfp4.py
+1
-0
No files found.
Too many changes to show.
To preserve performance only
1000 of 1000+
files are displayed.
Plain diff
Email patch
tests/models/multimodal/processing/test_internvl.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
"""Tests for InternVL's multimodal preprocessing kwargs."""
"""Tests for InternVL's multimodal preprocessing kwargs."""
from
collections.abc
import
Mapping
from
collections.abc
import
Mapping
from
typing
import
Optional
from
typing
import
Optional
...
...
tests/models/multimodal/processing/test_llama4.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
"""Tests for Llama4's multimodal preprocessing kwargs."""
"""Tests for Llama4's multimodal preprocessing kwargs."""
import
pytest
import
pytest
...
...
tests/models/multimodal/processing/test_llava_next.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
import
itertools
import
itertools
from
functools
import
partial
from
functools
import
partial
...
...
tests/models/multimodal/processing/test_llava_onevision.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
import
itertools
import
itertools
from
functools
import
partial
from
functools
import
partial
...
...
tests/models/multimodal/processing/test_minimax_vl_01.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
import
pytest
import
pytest
from
PIL
import
Image
from
PIL
import
Image
...
...
tests/models/multimodal/processing/test_mllama.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
"""Tests for mllama's multimodal preprocessing and profiling."""
"""Tests for mllama's multimodal preprocessing and profiling."""
import
pytest
import
pytest
from
transformers
import
MllamaConfig
from
transformers
import
MllamaConfig
...
...
tests/models/multimodal/processing/test_phi3v.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
"""Tests for phi3v's multimodal preprocessing kwargs."""
"""Tests for phi3v's multimodal preprocessing kwargs."""
import
pytest
import
pytest
...
...
tests/models/multimodal/processing/test_phi4mm.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
"""Tests for phi4mm's multimodal preprocessing kwargs."""
"""Tests for phi4mm's multimodal preprocessing kwargs."""
import
pytest
import
pytest
...
...
tests/models/multimodal/processing/test_qwen2_vl.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
import
pytest
import
pytest
...
...
tests/models/multimodal/processing/test_smolvlm.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
"""Tests for smolvlm's multimodal preprocessing kwargs."""
"""Tests for smolvlm's multimodal preprocessing kwargs."""
import
pytest
import
pytest
from
transformers
import
SmolVLMConfig
from
transformers
import
SmolVLMConfig
...
...
tests/models/quantization/test_aqlm.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
import
pytest
import
pytest
from
tests.quantization.utils
import
is_quant_method_supported
from
tests.quantization.utils
import
is_quant_method_supported
...
...
tests/models/quantization/test_awq.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
from
typing
import
Optional
from
typing
import
Optional
...
...
tests/models/quantization/test_bitblas.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
"""Compare the outputs of a GPTQ model to a bitblas model.
"""Compare the outputs of a GPTQ model to a bitblas model.
Note: GPTQ and bitblas do not have bitwise correctness.
Note: GPTQ and bitblas do not have bitwise correctness.
...
...
tests/models/quantization/test_fp8.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
# flake8: noqa
# flake8: noqa
"""Tests fp8 models against ground truth generation
"""Tests fp8 models against ground truth generation
...
...
tests/models/quantization/test_gguf.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
"""
"""
Tests gguf models against unquantized models generations
Tests gguf models against unquantized models generations
Note: To pass the test, quantization higher than Q4 should be used
Note: To pass the test, quantization higher than Q4 should be used
...
@@ -37,7 +38,7 @@ class GGUFTestConfig(NamedTuple):
...
@@ -37,7 +38,7 @@ class GGUFTestConfig(NamedTuple):
LLAMA_CONFIG
=
GGUFTestConfig
(
LLAMA_CONFIG
=
GGUFTestConfig
(
original_model
=
"meta-llama/Llama-3.2-1B-Instruct"
,
original_model
=
"meta-llama/Llama-3.2-1B-Instruct"
,
gguf_repo
=
"bartowski/Llama-3.2-1B-Instruct-GGUF"
,
gguf_repo
=
"bartowski/Llama-3.2-1B-Instruct-GGUF"
,
gguf_filename
=
"Llama-3.2-1B-Instruct-
IQ4_XS
.gguf"
,
gguf_filename
=
"Llama-3.2-1B-Instruct-
Q6_K
.gguf"
,
)
)
QWEN2_CONFIG
=
GGUFTestConfig
(
QWEN2_CONFIG
=
GGUFTestConfig
(
...
...
tests/models/quantization/test_gptq_bitblas.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
"""Compare the outputs of a GPTQ model to a bitblas model.
"""Compare the outputs of a GPTQ model to a bitblas model.
Note: GPTQ and bitblas do not have bitwise correctness.
Note: GPTQ and bitblas do not have bitwise correctness.
...
...
tests/models/quantization/test_gptq_marlin.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
"""Compares the outputs of gptq vs gptq_marlin.
"""Compares the outputs of gptq vs gptq_marlin.
Note: GPTQ and Marlin do not have bitwise correctness.
Note: GPTQ and Marlin do not have bitwise correctness.
...
...
tests/models/quantization/test_gptq_marlin_24.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
"""Compare the outputs of a GPTQ model to a Marlin_24 model.
"""Compare the outputs of a GPTQ model to a Marlin_24 model.
Note: GPTQ and Marlin_24 do not have bitwise correctness.
Note: GPTQ and Marlin_24 do not have bitwise correctness.
...
...
tests/models/quantization/test_modelopt.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
# flake8: noqa
# flake8: noqa
"""Tests Model Optimizer fp8 models against ground truth generation
"""Tests Model Optimizer fp8 models against ground truth generation
...
...
tests/models/quantization/test_mxfp4.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
# flake8: noqa
# flake8: noqa
"""Tests Quark mxfp4 models against ground truth generation
"""Tests Quark mxfp4 models against ground truth generation
"""
"""
...
...
Prev
1
…
24
25
26
27
28
29
30
31
32
…
50
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment