Unverified Commit 3a6911fa authored by Matthew Douglas's avatar Matthew Douglas Committed by GitHub
Browse files

Merge pull request #1295 from matthewdouglas/fsdp-load-prequantized

[FSDP] Enable loading prequantized weights with bf16/fp16/fp32 quant_storage
parents 5cc91b1b a96d2f05
...@@ -273,6 +273,7 @@ class Params4bit(torch.nn.Parameter):
        quantized_stats: Dict[str, Any],
        requires_grad: bool = False,
        device="cuda",
        module: Optional["Linear4bit"] = None,
        **kwargs,
    ) -> "Params4bit":
        self = torch.Tensor._make_subclass(cls, data.to(device))
...@@ -284,6 +285,10 @@ class Params4bit(torch.nn.Parameter):
        self.bnb_quantized = True
        self.quant_storage = data.dtype
self.module = module
if self.module is not None:
self.module.quant_state = self.quant_state
        return self
...
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment