Fixed an issue where the Qwen model showed excessive error after quantization (#243)

5eb1d2f0 · jundolc · GitHub · 5a673bf8 · 5eb1d2f0
Unverified commit 5eb1d2f0, authored Dec 08, 2023 by jundolc; committed by GitHub on Dec 08, 2023
Hide whitespace changes
Inline Side-by-side

Showing 1 changed file with 1 addition and 1 deletion

awq/models/qwen.py awq/models/qwen.py +1 -1

No files found.
--- a/awq/models/qwen.py
+++ b/awq/models/qwen.py
@@ -26,7 +26,7 @@ class QwenAWQForCausalLM(BaseAWQForCausalLM):
        layers.append(
            dict(
                prev_op=module.ln_1,
-                layers=[module.attn.c_attn, module.attn.c_proj],
+                layers=[module.attn.c_attn],
                inp=input_feat["attn.c_attn"],
                module2inspect=module.attn,
                kwargs=module_kwargs,