Unverified Commit bb549467 authored by chenqianfzh's avatar chenqianfzh Committed by GitHub
Browse files

enforce eager mode with bnb quantization temporarily (#6846)

parent b5f49ee5
......@@ -282,6 +282,10 @@ class ModelConfig:
raise ValueError(
"BitAndBytes quantization with TP or PP is not supported yet.")
if self.quantization == "bitsandbytes" and self.enforce_eager is False:
raise ValueError(
"BitAndBytes with enforce_eager = False is not supported yet.")
def get_hf_config_sliding_window(self) -> Optional[int]:
"""Get the sliding window size, or None if disabled."""
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment