fix awq_dequantize import (#5669)

fbb5f229 · Yineng Zhang · GitHub · 15fabcc0 · fbb5f229
Unverified commit fbb5f229, authored Apr 23, 2025 by Yineng Zhang; committed by GitHub on Apr 23, 2025.
Hide whitespace changes
Inline Side-by-side

Showing 1 changed file with 5 additions and 1 deletion

python/sglang/srt/layers/quantization/awq.py (+5 -1)

No files found.
--- a/python/sglang/srt/layers/quantization/awq.py
+++ b/python/sglang/srt/layers/quantization/awq.py
@@ -3,7 +3,6 @@ import logging
 from typing import Any, Dict, List, Optional

 import torch
-from sgl_kernel import awq_dequantize

 from sglang.srt.layers.linear import (
    LinearBase,
@@ -12,6 +11,11 @@ from sglang.srt.layers.linear import (
 )
 from sglang.srt.layers.parameter import GroupQuantScaleParameter, PackedvLLMParameter
 from sglang.srt.layers.quantization.base_config import QuantizationConfig
+from sglang.srt.utils import is_cuda
+
+_is_cuda = is_cuda()
+if _is_cuda:
+    from sgl_kernel import awq_dequantize

 logger = logging.getLogger(__name__)