Unverified commit 2d69bacb, authored by Sayak Paul and committed by GitHub
Browse files

handle offload_state_dict when initing transformers models (#12438)

parent 0974b4c6
...@@ -838,6 +838,9 @@ def load_sub_model( ...@@ -838,6 +838,9 @@ def load_sub_model(
else: else:
loading_kwargs["low_cpu_mem_usage"] = False loading_kwargs["low_cpu_mem_usage"] = False
if is_transformers_model and is_transformers_version(">=", "4.57.0"):
loading_kwargs.pop("offload_state_dict")
if ( if (
quantization_config is not None quantization_config is not None
and isinstance(quantization_config, PipelineQuantizationConfig) and isinstance(quantization_config, PipelineQuantizationConfig)
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment