Unverified commit e03b6bee, authored by Liana Koleva, committed by GitHub
Browse files

doc: improve modelopt error description (#12269)

parent 5e36a0b4
......@@ -590,14 +590,20 @@ class ModelConfig:
return
# Check if ModelOpt quantization is specified
modelopt_quantization_specified = self.quantization in [
_MODELOPT_QUANTIZATION_METHODS = [
"modelopt",
"modelopt_fp8",
"modelopt_fp4",
]
modelopt_quantization_specified = (
self.quantization in _MODELOPT_QUANTIZATION_METHODS
)
if not modelopt_quantization_specified:
raise ValueError("quantize_and_serve requires ModelOpt quantization")
raise ValueError(
"quantize_and_serve requires ModelOpt quantization (set with --quantization "
f"{{{', '.join(sorted(_MODELOPT_QUANTIZATION_METHODS))}}})"
)
# quantize_and_serve is disabled due to compatibility issues
raise NotImplementedError(
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment