Unverified commit 5eb1d2f0, authored by jundolc and committed by GitHub
Browse files

Fixed an issue where the Qwen model had too much error after quantization (#243)

parent 5a673bf8
@@ -26,7 +26,7 @@ class QwenAWQForCausalLM(BaseAWQForCausalLM):
 layers.append(
 dict(
 prev_op=module.ln_1,
-layers=[module.attn.c_attn, module.attn.c_proj],
+layers=[module.attn.c_attn],
 inp=input_feat["attn.c_attn"],
 module2inspect=module.attn,
 kwargs=module_kwargs,
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment