Unverified commit 197c47a3, authored by Daniël de Kok, committed by GitHub
Browse files

Fix `text-generation-server quantize` (#2103)

The subcommand did not work due to some broken imports.
parent bcb3faa1
......@@ -316,7 +316,7 @@ def quantize(
logger_level=logger_level,
json_output=json_output,
)
-from text_generation_server.utils.gptq.quantize import quantize
+from text_generation_server.layers.gptq.quantize import quantize
quantize(
model_id=model_id,
......
......@@ -12,7 +12,7 @@ from huggingface_hub import HfApi
from accelerate import init_empty_weights
from text_generation_server.utils import initialize_torch_distributed, Weights
from text_generation_server.utils.hub import weight_files
-from text_generation_server.utils.gptq.quant_linear import QuantLinear
+from text_generation_server.layers.gptq.quant_linear import QuantLinear
from loguru import logger
from typing import Optional
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment