Unverified commit e03b6bee, authored by Liana Koleva, committed by GitHub
Browse files

doc: improve modelopt error description (#12269)

parent 5e36a0b4
...@@ -590,14 +590,20 @@ class ModelConfig: ...@@ -590,14 +590,20 @@ class ModelConfig:
return return
# Check if ModelOpt quantization is specified # Check if ModelOpt quantization is specified
modelopt_quantization_specified = self.quantization in [ _MODELOPT_QUANTIZATION_METHODS = [
"modelopt", "modelopt",
"modelopt_fp8", "modelopt_fp8",
"modelopt_fp4", "modelopt_fp4",
] ]
modelopt_quantization_specified = (
self.quantization in _MODELOPT_QUANTIZATION_METHODS
)
if not modelopt_quantization_specified: if not modelopt_quantization_specified:
raise ValueError("quantize_and_serve requires ModelOpt quantization") raise ValueError(
"quantize_and_serve requires ModelOpt quantization (set with --quantization "
f"{{{', '.join(sorted(_MODELOPT_QUANTIZATION_METHODS))}}})"
)
# quantize_and_serve is disabled due to compatibility issues # quantize_and_serve is disabled due to compatibility issues
raise NotImplementedError( raise NotImplementedError(
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment