Unverified commit 382f66fb, authored by Helena Kloosterman and committed by GitHub
Browse files

[Bugfix] Fix boolean conversion for OpenVINO env variable (#13615)

parent 8354f664
@@ -360,8 +360,9 @@ environment_variables: Dict[str, Callable[[], Any]] = {
 # Enables weights compression during model export via HF Optimum
 # default is False
 "VLLM_OPENVINO_ENABLE_QUANTIZED_WEIGHTS":
-lambda: bool(os.getenv("VLLM_OPENVINO_ENABLE_QUANTIZED_WEIGHTS", False)),
+lambda:
+(os.environ.get("VLLM_OPENVINO_ENABLE_QUANTIZED_WEIGHTS", "0").lower() in
+("on", "true", "1")),
 # If the env var is set, then all workers will execute as separate
 # processes from the engine, and we use the same mechanism to trigger
 # execution on all workers.
......
@@ -125,7 +125,8 @@ class OpenVINOCausalLM(nn.Module):
 "as-is, all possible options that may affect model conversion "
 "are ignored.")
-load_in_8bit = envs.VLLM_OPENVINO_ENABLE_QUANTIZED_WEIGHTS
+load_in_8bit = (envs.VLLM_OPENVINO_ENABLE_QUANTIZED_WEIGHTS
+if export else False)
 pt_model = OVModelForCausalLM.from_pretrained(
 model_config.model,
 export=export,
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment