Unverified Commit 78b59d73 authored by Younes Belkada, committed by GitHub

[`core`] Fix quantization issues with transformers==4.36.0 (#249)

parent ae24f424
@@ -342,6 +342,13 @@ class AwqQuantizer:
             self.model(samples.to(next(self.model.parameters()).device))
         except ValueError:  # work with early exit
             pass
+
+        # Update the layer kwargs with `prepare_inputs_for_generation` method
+        # that takes care of everything to avoid unexpected errors.
+        layer_kwargs = self.model.prepare_inputs_for_generation(samples, **layer_kwargs)
+        # Pop the input_ids as they are not needed at all.
+        layer_kwargs.pop("input_ids")
+
         del samples
         modules[0] = modules[0].module  # restore
         inps = inps[0]
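
For context, here is a minimal sketch (not part of the commit) of what `prepare_inputs_for_generation` returns and why `input_ids` is popped afterwards: the model assembles the extra forward kwargs (typically `attention_mask`, `past_key_values`, `use_cache`) that the decoder layers expect under transformers==4.36.0, while the quantizer feeds the hidden states it already captured instead of token ids. The checkpoint name below is only an illustrative assumption; in the quantizer the kwargs captured by the Catcher module are additionally passed through as `**layer_kwargs`.

```python
from transformers import AutoModelForCausalLM, AutoTokenizer

# Hypothetical small model used only for illustration.
model = AutoModelForCausalLM.from_pretrained("facebook/opt-125m")
tokenizer = AutoTokenizer.from_pretrained("facebook/opt-125m")

enc = tokenizer("some calibration text", return_tensors="pt")

# Ask the model to build the kwargs its forward pass expects.
layer_kwargs = model.prepare_inputs_for_generation(
    enc.input_ids, attention_mask=enc.attention_mask
)

# The quantizer passes captured hidden states (`inps`) to the first
# decoder layer, so the token ids themselves are not needed.
layer_kwargs.pop("input_ids")

print(list(layer_kwargs.keys()))  # e.g. past_key_values, use_cache, attention_mask
```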