Merge pull request #670 from akemimadoka/fix-win

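Fix RuntimeError on Windows caused by integer overflow in np.prod. On Windows, NumPy versions before 2.0 use a 32-bit default integer, so np.prod(shape) can silently wrap around for tensors with more than 2^31 - 1 elements; math.prod operates on Python's arbitrary-precision integers and cannot overflow.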

Merge pull request #670 from akemimadoka/fix-win
Fix RuntimeError on Windows caused by integer overflow in np.prod
0422152c · Atream · GitHub · 798e1d0c · 8817777e · 0422152c
Unverified commit 0422152c, authored by Atream on Feb 27, 2025; committed by GitHub on Feb 27, 2025.
Hide whitespace changes
Inline Side-by-side

Showing with 2 additions and 1 deletion

ktransformers/util/custom_gguf.py (+2 -1)

No files found.
--- a/ktransformers/util/custom_gguf.py
+++ b/ktransformers/util/custom_gguf.py
@@ -27,6 +27,7 @@ import torch
 import KTransformersOps
 from .custom_loader import SafeTensorLoader
 import ctypes
+import math
 class GGMLQuantizationType(IntEnum):
    F32     = 0
@@ -230,7 +231,7 @@ class GGUFLoader:
            shape = [read_value(f, DATA_TYPES["uint64"]) for _ in range(shape_len)]
            ggml_type = read_value(f, DATA_TYPES["uint32"])
            bad_offset = read_value(f, DATA_TYPES["uint64"])
-            n_elems = int(np.prod(shape))
+            n_elems = int(math.prod(shape))
            block_size, type_size = GGML_QUANT_SIZES[ggml_type]
            n_bytes = n_elems * type_size // block_size
            np_dims = tuple(reversed(shape))