Remove references to squeezellm (#1603)

3ff64113 · Jani Monoses · GitHub · 2b302b93 · 3ff64113 · 3ff64113
Unverified commit 3ff64113, authored Oct 07, 2024 by Jani Monoses; committed by GitHub on Oct 07, 2024.
Show whitespace changes
Inline Side-by-side

Showing 2 changed files with 0 additions and 3 deletions

python/sglang/srt/layers/quantization/__init__.py +0 -2

python/sglang/srt/server_args.py +0 -1

No files found.
--- a/python/sglang/srt/layers/quantization/__init__.py
+++ b/python/sglang/srt/layers/quantization/__init__.py
@@ -19,7 +19,6 @@ from vllm.model_executor.layers.quantization.gptq_marlin import GPTQMarlinConfig
 from vllm.model_executor.layers.quantization.gptq_marlin_24 import GPTQMarlin24Config
 from vllm.model_executor.layers.quantization.marlin import MarlinConfig
 from vllm.model_executor.layers.quantization.qqq import QQQConfig
-from vllm.model_executor.layers.quantization.squeezellm import SqueezeLLMConfig
 from vllm.model_executor.layers.quantization.tpu_int8 import Int8TpuConfig
 from sglang.srt.layers.quantization.base_config import QuantizationConfig
@@ -39,7 +38,6 @@ QUANTIZATION_METHODS: Dict[str, Type[QuantizationConfig]] = {
    "gptq_marlin": GPTQMarlinConfig,
    "awq_marlin": AWQMarlinConfig,
    "gptq": GPTQConfig,
-    "squeezellm": SqueezeLLMConfig,
    "compressed-tensors": CompressedTensorsConfig,
    "bitsandbytes": BitsAndBytesConfig,
    "qqq": QQQConfig,

--- a/python/sglang/srt/server_args.py
+++ b/python/sglang/srt/server_args.py
@@ -266,7 +266,6 @@ class ServerArgs:
                "marlin",
                "gptq_marlin",
                "awq_marlin",
-                "squeezellm",
                "bitsandbytes",
            ],
            help="The quantization method.",