Unverified Commit c973ecde authored by Marc Sun, committed by GitHub
Browse files

[bnb] Skip moe + bnb test (#36896)


Signed-off-by: Marc Sun <marc@huggingface.co>
parent e39257a5
...@@ -6,7 +6,9 @@ Run `pytest tests/quantization/test_bitsandbytes.py`. ...@@ -6,7 +6,9 @@ Run `pytest tests/quantization/test_bitsandbytes.py`.
""" """
import pytest import pytest
from packaging.version import Version
from transformers import BitsAndBytesConfig from transformers import BitsAndBytesConfig
from transformers import __version__ as TRANSFORMERS_VERSION
from tests.quantization.utils import is_quant_method_supported from tests.quantization.utils import is_quant_method_supported
from vllm.platforms import current_platform from vllm.platforms import current_platform
...@@ -138,6 +140,12 @@ def test_load_pp_4bit_bnb_model(model_name, description) -> None: ...@@ -138,6 +140,12 @@ def test_load_pp_4bit_bnb_model(model_name, description) -> None:
compare_two_settings(model_name, common_args, pp_args) compare_two_settings(model_name, common_args, pp_args)
@pytest.mark.skipif(
Version(TRANSFORMERS_VERSION) >= Version("5.0.0"),
reason="Need to add support for quantizing MoE experts with bnb"
" in transformers v5. See"
" https://github.com/bitsandbytes-foundation/bitsandbytes/issues/1849",
)
@pytest.mark.skipif( @pytest.mark.skipif(
not is_quant_method_supported("bitsandbytes"), not is_quant_method_supported("bitsandbytes"),
reason="bitsandbytes is not supported on this GPU type.", reason="bitsandbytes is not supported on this GPU type.",
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment