Commit b190df35 authored by Jiaming Tang
Browse files

[Minor] add a comment

parent 9b427ebc
...@@ -213,6 +213,7 @@ def auto_scale_block(module, module_kwargs, ...@@ -213,6 +213,7 @@ def auto_scale_block(module, module_kwargs,
module2inspect=module.self_attn, kwargs=module_kwargs, module2inspect=module.self_attn, kwargs=module_kwargs,
)) ))
# attn out # attn out
# Please refer to https://github.com/mit-han-lab/llm-awq/pull/67#issue-1850622696
if module.self_attn.v_proj.weight.shape == module.self_attn.o_proj.weight.shape: if module.self_attn.v_proj.weight.shape == module.self_attn.o_proj.weight.shape:
scales_list.append(_auto_get_scale( scales_list.append(_auto_get_scale(
prev_op=module.self_attn.v_proj, prev_op=module.self_attn.v_proj,
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment