Add basic quant example

60296077 · Casper · c39ac59b · 60296077
Commit 60296077 authored Aug 27, 2023 by Casper
Hide whitespace changes
Inline Side-by-side

Showing with 19 additions and 0 deletions

examples/basic_quant.py examples/basic_quant.py +19 -0

No files found.
--- a/examples/basic_quant.py
+++ b/examples/basic_quant.py
+from awq import AutoAWQForCausalLM
+from transformers import AutoTokenizer
+
+model_path = 'lmsys/vicuna-7b-v1.5'  # source model identifier, passed to both from_pretrained() calls below
+quant_path = 'vicuna-7b-v1.5-awq'  # destination passed to save_quantized() and save_pretrained() below
+quant_config = { "zero_point": True, "q_group_size": 128, "w_bit": 4 }  # presumably 4-bit weights, group size 128, zero-point enabled; verify against AutoAWQ docs
+
+# Load the model and its tokenizer from model_path
+model = AutoAWQForCausalLM.from_pretrained(model_path)
+tokenizer = AutoTokenizer.from_pretrained(model_path, trust_remote_code=True)  # NOTE(review): trust_remote_code presumably allows repo-supplied code to run; confirm it is needed
+
+# Quantize the model with the settings in quant_config; the tokenizer is passed to quantize() as well
+model.quantize(tokenizer, quant_config=quant_config)
+
+# Save the quantized model and the tokenizer to the same quant_path
+model.save_quantized(quant_path)
+tokenizer.save_pretrained(quant_path)
+
+print(f'Model is quantized and saved at "{quant_path}"')
\ No newline at end of file