Correct comments

9848b6a4 · Casper Hansen · c9d01ac3 · 9848b6a4
Commit 9848b6a4 authored Sep 20, 2023 by Casper Hansen
Hide whitespace changes
Inline Side-by-side

Showing with 2 additions and 3 deletions

awq/quantize/quantizer.py +2 -3

No files found.
--- a/awq/quantize/quantizer.py
+++ b/awq/quantize/quantizer.py
@@ -176,14 +176,13 @@ class AwqQuantizer:
            # create new scales
            ratio = ratio / n_grid
-            # s^-1
+            # NOTE: s^-1 * x is fused here, according to paper
            scales = (x_max.pow(ratio) / w_max.pow(1-ratio)).clamp(min=1e-4)
            scales = scales / (scales.max() * scales.min()).sqrt()
            scales_view = scales.view(1, -1).to(device)
-            # NOTE: s^-1 * x is fused here, according to paper
+            # Q(W * s)
            for fc in linears2scale:
-                # Q(W * s)
                fc.weight.mul_(scales_view)
                fc.weight.data = self.pseudo_quantize_tensor(fc.weight.data) / scales_view