Unverified Commit 49609323 authored by Matthew Douglas's avatar Matthew Douglas Committed by GitHub
Browse files

Fix torch.compile issue for LLM.int8() with threshold=0 (#1581)

parent 90bbe147
@@ -84,6 +84,13 @@ def get_inverse_transform_indices(
     return permuted_tile_indices
# torch.compiler.is_compiling() was added in torch 2.3; older releases
# expose the equivalent check as torch._dynamo.is_compiling.
try:
    _is_compiling = torch.compiler.is_compiling
except AttributeError:
    _is_compiling = torch._dynamo.is_compiling
 @deprecated(
     "This function is deprecated and will be removed in a future release.",
     category=FutureWarning,
@@ -174,7 +181,7 @@ class MatMul8bitLt(torch.autograd.Function):
         input_shape = A.shape

         # Cast A to fp16
-        if A.dtype != torch.float16:
+        if A.dtype != torch.float16 and not _is_compiling():
             warnings.warn(f"MatMul8bitLt: inputs will be cast from {A.dtype} to float16 during quantization")

         if len(A.shape) == 3:
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment