[`PEFT`] Fix PEFT batch size > 1 (#338)

c69d3b65 · Younes Belkada · GitHub · 29ee66d9 · c69d3b65
Unverified Commit c69d3b65 authored Feb 14, 2024 by Younes Belkada Committed by GitHub Feb 14, 2024
Show whitespace changes
Inline Side-by-side

Showing 1 changed file with 4 additions and 4 deletions

awq/modules/linear/gemm.py awq/modules/linear/gemm.py +4 -4

No files found.
--- a/awq/modules/linear/gemm.py
+++ b/awq/modules/linear/gemm.py
@@ -89,10 +89,10 @@ class WQLinearMMFunction(Function):
        )

        if ctx.needs_input_grad[0]:
-            # 2D matrix multiplication, unsqueeze to 3D
-            grad_input = grad_output.squeeze(0).mm(
-                weights.transpose(0, 1)
-            ).unsqueeze(0)
+            # 3D matmul using torch.bmm: https://pytorch.org/docs/stable/generated/torch.bmm.html#torch.bmm
+            # to propagate gradient across all batch sizes.
+            batch_size = grad_output.shape[0]
+            grad_input = grad_output.bmm(weights.transpose(0, 1).unsqueeze(0).repeat(batch_size, 1, 1))

        return grad_input, None, None, None, None, None, None, None