OpenDAS / AutoAWQ · Commits

Commit 5bd6fbc7, authored Sep 09, 2023 by Casper Hansen
Parent: adc5304b

    Update module name
Showing 1 changed file with 2 additions and 2 deletions

awq/models/llama.py (+2 -2)
@@ -70,7 +70,7 @@ from typing import List, Tuple, Union
 from awq.utils.utils import set_module_name
 from awq.modules.fused.mlp import QuantLlamaMLP
 from awq.modules.fused.norm import FTLlamaRMSNorm
-from awq.modules.fused.attn import QuantLlamaAttentionFused
+from awq.modules.fused.attn import QuantAttentionFused
 from awq.modules.linear import WQLinear_GEMM, WQLinear_GEMV
 from transformers.models.llama.modeling_llama import LlamaAttention, LlamaRMSNorm, LlamaMLP
@@ -97,7 +97,7 @@ class LlamaFuser:
     def fuse_attention(self):
         for name, module in self.attention_modules:
             qkv_layer: Union[WQLinear_GEMM, WQLinear_GEMV] = self._fuse_qkv(module)
-            attn = QuantLlamaAttentionFused(
+            attn = QuantAttentionFused(
                 module.hidden_size,
                 module.num_heads,
                 qkv_layer,
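The commit itself only renames the fused attention class (QuantLlamaAttentionFused to QuantAttentionFused); the surrounding fuse_attention code constructs a fused replacement for each attention module and installs it via set_module_name. A minimal sketch of that replace-by-dotted-name pattern follows; note the Module class and the set_module_name body below are simplified illustrative stand-ins, not AutoAWQ's actual implementation (which lives in awq.utils.utils and operates on torch.nn.Module trees).

```python
# Illustrative sketch of the module-swap pattern used by LlamaFuser.fuse_attention:
# locate a sub-module by its dotted name and replace it with a fused equivalent.
# All names here are stand-ins for this example.

class Module:
    """Minimal container mimicking a module with named sub-modules."""
    pass

def set_module_name(model, name, new_module):
    # Resolve the dotted path (e.g. "layer0.attn") down to the parent
    # object, then rebind the leaf attribute to the new module.
    *parents, leaf = name.split(".")
    target = model
    for part in parents:
        target = getattr(target, part)
    setattr(target, leaf, new_module)

# Build a toy model: model.layer0.attn holds the unfused attention.
model = Module()
model.layer0 = Module()
model.layer0.attn = "LlamaAttention"

# Swap it out, as fuse_attention does for each attention module it finds.
set_module_name(model, "layer0.attn", "QuantAttentionFused")
print(model.layer0.attn)  # QuantAttentionFused
```

Replacing modules in place like this keeps the rest of the model graph untouched, which is why only the class name had to change in this commit.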