Commit 4c584fc6 (unverified), authored by Stefan He, committed by GitHub
Browse files

Fix circular imports in gptq.py and unblock test explorer (#4736)

parent 77cf771e
...@@ -6,7 +6,6 @@ import torch ...@@ -6,7 +6,6 @@ import torch
from sglang.srt.layers.linear import LinearBase from sglang.srt.layers.linear import LinearBase
from sglang.srt.layers.quantization.base_config import QuantizationConfig from sglang.srt.layers.quantization.base_config import QuantizationConfig
from sglang.srt.layers.vocab_parallel_embedding import ParallelLMHead
from sglang.srt.utils import is_cuda from sglang.srt.utils import is_cuda
_is_cuda = is_cuda() _is_cuda = is_cuda()
...@@ -434,6 +433,9 @@ class MarlinConfig(QuantizationConfig): ...@@ -434,6 +433,9 @@ class MarlinConfig(QuantizationConfig):
from vllm.model_executor.layers.quantization.marlin import MarlinLinearMethod from vllm.model_executor.layers.quantization.marlin import MarlinLinearMethod
# Delay import to avoid circular dependency
from sglang.srt.layers.vocab_parallel_embedding import ParallelLMHead
if isinstance(layer, LinearBase) or ( if isinstance(layer, LinearBase) or (
isinstance(layer, ParallelLMHead) and self.lm_head_quantized isinstance(layer, ParallelLMHead) and self.lm_head_quantized
): ):
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment