Commit 5d658171 authored by justheuristic

debug

parent 4da2227f
@@ -370,8 +370,6 @@ class MatMul8bitLt(torch.autograd.Function):
             if state.threshold > 0.0 and subA is not None:
                 grad_B[:, idx] += torch.matmul(grad_output.t(), subA)
-        raise NotImplementedError("!!")
         if req_gradA:
             if state.CBt is not None:
                 C32grad, Sgrad = F.transform(Cgrad, "col32")
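This hunk drops a leftover debug guard: the raise NotImplementedError("!!") sat between the weight-gradient update and the req_gradA branch, so every backward pass aborted there. The snippet below is a minimal, self-contained sketch of the outlier-gradient update that the removal un-blocks; it uses plain PyTorch with invented shapes, and idx / subA merely stand in for the outlier column indices and matching fp16 activations named in the diffed line.

import torch

# Illustrative (assumed) shapes: batch of 4, 8 input features, 6 output features.
batch, in_features, out_features = 4, 8, 6
grad_output = torch.randn(batch, out_features)    # upstream gradient dL/d(output)
grad_B = torch.zeros(out_features, in_features)   # gradient w.r.t. the weight matrix B

# `idx` marks the outlier input columns handled in fp16; `subA` holds the
# corresponding activation columns (names borrowed from the diffed line).
idx = torch.tensor([1, 5])
subA = torch.randn(batch, idx.numel())

# Same accumulation pattern as in the backward pass: only the outlier columns
# of grad_B receive the dense fp16 contribution.
grad_B[:, idx] += torch.matmul(grad_output.t(), subA)
print(grad_B[:, idx].shape)  # torch.Size([6, 2])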
@@ -237,7 +237,9 @@ class Linear8bitLt(nn.Linear):
         if threshold > 0.0 and not has_fp16_weights:
             self.state.use_pool = True

-        self.weight = Int8Params(self.weight.data, has_fp16_weights=has_fp16_weights)
+        self.weight = Int8Params(
+            self.weight.data, has_fp16_weights=has_fp16_weights, requires_grad=has_fp16_weights
+        )

     def init_8bit_state(self):
         self.state.CB = self.weight.CB
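The second hunk makes the Int8Params wrapper take its requires_grad flag from has_fp16_weights, so a layer built without fp16 master weights no longer advertises a trainable weight to autograd. Below is a rough illustration of the intended effect using a plain torch.nn.Parameter rather than the real Int8Params class; the shapes and the tiny forward/backward are invented for the example.

import torch
import torch.nn as nn

has_fp16_weights = False  # the case this change targets: int8 weights stay frozen

# Stand-in for Int8Params: an ordinary Parameter whose requires_grad flag
# now follows has_fp16_weights instead of defaulting to True.
weight = nn.Parameter(torch.randn(6, 8), requires_grad=has_fp16_weights)
x = torch.randn(4, 8, requires_grad=True)

out = x @ weight.t()
out.sum().backward()

print(weight.grad)   # None -> autograd skips the frozen weight entirely
print(x.grad.shape)  # torch.Size([4, 8]) -> activations still receive gradients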