Get correct devices

7cf0d987 · Casper Hansen · ab7d68e7 · 7cf0d987
Commit 7cf0d987 authored Sep 06, 2023 by Casper Hansen
Hide whitespace changes
Inline Side-by-side

Showing with 3 additions and 3 deletions

awq/models/llama.py awq/models/llama.py +3 -3

No files found.
--- a/awq/models/llama.py
+++ b/awq/models/llama.py
@@ -102,7 +102,7 @@ class LlamaFuser:
                module.num_key_value_heads,
                qkv_layer,
                module.o_proj,
-                qkv_layer.qweight.device,
+                next(iter(qkv_layer.state_dict().values())).device,
                self.model.config.max_new_tokens
            )
            set_module_name(self.model, name, attn)
@@ -111,7 +111,7 @@ class LlamaFuser:
        # get qkv and bias
        q_proj, k_proj, v_proj = module.q_proj, module.k_proj, module.v_proj
        bias = torch.cat([q_proj.bias, k_proj.bias, v_proj.bias], dim=0) if q_proj.bias is not None else None
        # create module
        qkv_layer = WQLinear(
            q_proj.w_bit, 
@@ -119,7 +119,7 @@ class LlamaFuser:
            q_proj.in_features, 
            q_proj.out_features + k_proj.out_features + v_proj.out_features, 
            q_proj.bias is not None,
-            q_proj.qweight.device
+            next(iter(module.state_dict().values())).device
        )
        # replace buffers with real weights