# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project

from vllm.model_executor.layers.quantization import get_quantization_config
from vllm.platforms import current_platform


def is_quant_method_supported(quant_method: str) -> bool:
    """Return whether the current platform can run ``quant_method``.

    Args:
        quant_method: Name of the quantization method; it is passed to
            ``get_quantization_config`` to look up the method's config.

    Returns:
        ``False`` when the current platform is neither CUDA nor ROCm.
        Otherwise ``True`` if the device capability, converted with
        ``to_int()``, is at least the minimum capability reported by the
        quantization config, and ``False`` if it is lower.

    Raises:
        AssertionError: If the platform reports no device capability
            (``get_device_capability()`` returns ``None``).
    """
    # Currently, all quantization methods require Nvidia or AMD GPUs
    if not (current_platform.is_cuda() or current_platform.is_rocm()):
        return False

    capability = current_platform.get_device_capability()
    # Narrowing assert: the comparison below needs a concrete capability.
    assert capability is not None

    min_capability = get_quantization_config(quant_method).get_min_capability()

    return capability.to_int() >= min_capability