Unverified commit 197c47a3, authored by Daniël de Kok, committed by GitHub
Browse files

Fix `text-generation-server quantize` (#2103)

The subcommand did not work due to some broken imports.
parent bcb3faa1
...@@ -316,7 +316,7 @@ def quantize( ...@@ -316,7 +316,7 @@ def quantize(
logger_level=logger_level, logger_level=logger_level,
json_output=json_output, json_output=json_output,
) )
from text_generation_server.utils.gptq.quantize import quantize from text_generation_server.layers.gptq.quantize import quantize
quantize( quantize(
model_id=model_id, model_id=model_id,
......
...@@ -12,7 +12,7 @@ from huggingface_hub import HfApi ...@@ -12,7 +12,7 @@ from huggingface_hub import HfApi
from accelerate import init_empty_weights from accelerate import init_empty_weights
from text_generation_server.utils import initialize_torch_distributed, Weights from text_generation_server.utils import initialize_torch_distributed, Weights
from text_generation_server.utils.hub import weight_files from text_generation_server.utils.hub import weight_files
from text_generation_server.utils.gptq.quant_linear import QuantLinear from text_generation_server.layers.gptq.quant_linear import QuantLinear
from loguru import logger from loguru import logger
from typing import Optional from typing import Optional
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment