Merge pull request #670 from akemimadoka/fix-win

Fix RuntimeError on Windows caused by integer overflow in np.prod
2025-09-08 05:29:29 +00:00 · 2025-02-27 17:40:27 +08:00 · 2025-02-27 17:40:27 +08:00 · 0422152cf3
commit 0422152cf3
parent 798e1d0cfa 8817777e11
1 changed file with 2 additions and 1 deletion
--- a/ktransformers/util/custom_gguf.py
+++ b/ktransformers/util/custom_gguf.py
@@ -27,6 +27,7 @@ import torch
 import KTransformersOps
 from .custom_loader import SafeTensorLoader
 import ctypes
+import math
 class GGMLQuantizationType(IntEnum):
    F32     = 0
@@ -230,7 +231,7 @@ class GGUFLoader:
            shape = [read_value(f, DATA_TYPES["uint64"]) for _ in range(shape_len)]
            ggml_type = read_value(f, DATA_TYPES["uint32"])
            bad_offset = read_value(f, DATA_TYPES["uint64"])
-            n_elems = int(np.prod(shape))
+            n_elems = int(math.prod(shape))
            block_size, type_size = GGML_QUANT_SIZES[ggml_type]
            n_bytes = n_elems * type_size // block_size
            np_dims = tuple(reversed(shape))