Merge pull request #80 from casper-hansen/low_cpu_mem_example

Add low_cpu_mem_usage=True in example

Merge pull request #80 from casper-hansen/low_cpu_mem_example
Add low_cpu_mem_usage=True in example
8793a9f7 · Casper · GitHub · 1c5ccc79 · aa6497cd · 8793a9f7
Unverified commit 8793a9f7, authored Sep 27, 2023 by Casper; committed by GitHub on Sep 27, 2023.
Hide whitespace changes
Inline Side-by-side

Showing 1 changed file with 1 addition and 1 deletion

examples/basic_quant.py examples/basic_quant.py +1 -1

No files found.
--- a/examples/basic_quant.py
+++ b/examples/basic_quant.py
@@ -7,7 +7,7 @@ quant_config = { "zero_point": True, "q_group_size": 128, "w_bit": 4, "version":
 # Load model
 # NOTE: pass safetensors=True to load safetensors
-model = AutoAWQForCausalLM.from_pretrained(model_path)
+model = AutoAWQForCausalLM.from_pretrained(model_path, **{"low_cpu_mem_usage": True})
 tokenizer = AutoTokenizer.from_pretrained(model_path, trust_remote_code=True)
 # Quantize