
Fix ggml to gguf conversion on Windows (#2733)

This fixes `RuntimeWarning: overflow encountered in long_scalars`

Credit: anon (not mine)
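
For context, a minimal sketch (not part of the commit) of why the original line overflowed and how the cast fixes it: with the NumPy releases of that era, the default integer type on Windows is 32-bit, so `np.prod()` over plain Python ints yields an `int32` scalar and the element-count × type-size product wraps once it passes 2**31 − 1, emitting the `RuntimeWarning` above. The tensor shape and block sizes below are illustrative assumptions, not values from the commit.

```python
import numpy as np

# Illustrative values: a large tensor and a k-quant block layout
# (256 elements per block). These numbers are assumptions.
dims = [8192, 32000]
blksize, tysize = 256, 176

n_elems = np.prod(dims)  # int32 on Windows (NumPy < 2.0), int64 elsewhere

# Old computation: stays in the platform's default integer type, so on Windows
# n_elems * tysize (~46 billion) wraps and emits
# "RuntimeWarning: overflow encountered in long_scalars".
# n_bytes = (n_elems * tysize) // blksize

# Patched computation: force 64-bit arithmetic regardless of platform defaults.
n_bytes = np.int64(np.int64(n_elems) * np.int64(tysize)) // np.int64(blksize)
print(n_bytes)  # 180224000 on every platform
```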
IgnacioFDM, 2 years ago
Commit 7f7ddd5002
1 file changed, 3 insertions(+), 9 deletions(-):
  convert-llama-ggmlv3-to-gguf.py

convert-llama-ggmlv3-to-gguf.py (+3, -9)

@@ -1,12 +1,10 @@
-import sys, struct, math, argparse, warnings
+import sys, struct, math, argparse
 from pathlib import Path
 
 import numpy as np
 
 import gguf
 
-warnings.filterwarnings('error')
-
 # Note: Does not support GGML_QKK_64
 QK_K = 256
 # Items here are (block size, type size)
@@ -95,7 +93,7 @@ class Tensor:
         pad = ((offset + 31) & ~31) - offset
         offset += pad
         n_elems = np.prod(self.dims)
-        n_bytes = (n_elems * tysize) // blksize
+        n_bytes = np.int64(np.int64(n_elems) * np.int64(tysize)) // np.int64(blksize)
         self.start_offset = offset
         self.len_bytes = n_bytes
         offset += n_bytes
@@ -327,11 +325,7 @@ def main():
     data = np.memmap(cfg.input, mode = 'r')
     model = GGMLV3Model()
     print('* Scanning GGML input file')
-    try:
-        offset = model.load(data, 0)
-    except OverflowError:
-        print(f'!!! Caught overflow loading tensors. The most likely issue is running on Windows but not in WSL. Try running in WSL if possible.', file = sys.stderr)
-        raise
+    offset = model.load(data, 0)
     print(f'* GGML model hyperparameters: {model.hyperparameters}')
     vocab_override = None
     params_override = None
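
As a usage-level illustration (not part of the commit), the same 64-bit arithmetic can be exercised together with the 32-byte alignment step visible in the `Tensor` hunk above. The helper name and sample values below are hypothetical.

```python
import numpy as np

def tensor_extent(offset, dims, blksize, tysize):
    """Hypothetical helper mirroring the patched size/offset arithmetic."""
    # Round the data offset up to the next 32-byte boundary, as in the script.
    pad = ((offset + 31) & ~31) - offset
    offset += pad
    n_elems = np.prod(dims)
    # 64-bit multiply and divide, so large tensors do not wrap on Windows.
    n_bytes = np.int64(np.int64(n_elems) * np.int64(tysize)) // np.int64(blksize)
    return offset, offset + n_bytes  # data start, first byte past the tensor

start, end = tensor_extent(offset=1000, dims=[4096, 4096], blksize=32, tysize=18)
print(start, end)  # 1024 9438208
```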