utils.py 604 Bytes
Newer Older
1
2
# SPDX-License-Identifier: Apache-2.0

3
from vllm.model_executor.layers.quantization import get_quantization_config
4
from vllm.platforms import current_platform
5
6
7
8


def is_quant_method_supported(quant_method: str) -> bool:
    """Report whether ``quant_method`` is usable on the current platform.

    Args:
        quant_method: Name of the quantization method, passed unchanged to
            ``get_quantization_config``.

    Returns:
        ``False`` when the current platform is neither CUDA nor ROCm.
        Otherwise ``True`` if the device capability (as an int) is at least
        the minimum capability declared by the method's quantization config.

    Raises:
        AssertionError: If the platform reports no device capability.
    """
    # Currently, all quantization methods require Nvidia or AMD GPUs
    if not (current_platform.is_cuda() or current_platform.is_rocm()):
        return False

    capability = current_platform.get_device_capability()
    # Internal invariant; also narrows the value from "maybe None" before
    # ``to_int()`` is called on it.
    assert capability is not None

    min_capability = get_quantization_config(quant_method).get_min_capability()

    return capability.to_int() >= min_capability