Explorar o código

falcon : write file type

Georgi Gerganov hai 2 anos
pai
achega
01f2224682
Modificáronse 2 ficheiros con 2 adicións e 1 borrados
  1. 1 0
      convert-falcon-hf-to-gguf.py
  2. 1 1
      scripts/run-all-ppl.sh

+ 1 - 0
convert-falcon-hf-to-gguf.py

@@ -107,6 +107,7 @@ if "n_head_kv" in hparams:
 else:
     gguf_writer.add_head_count_kv(1)
 gguf_writer.add_layer_norm_eps(hparams["layer_norm_epsilon"])
+gguf_writer.add_file_type(ftype)
 
 # TOKENIZATION
 

+ 1 - 1
scripts/run-all-ppl.sh

@@ -1,7 +1,7 @@
 #!/bin/bash
 
 qnt=(f16 q8_0 q6_k q5_k q5_1 q5_0 q4_k q4_1 q4_0 q3_k q2_k)
-args="--no-mmap -ngl 999 -t 8"
+args="-ngl 999 -t 8"
 
 if [ -z "$1" ]; then
     echo "usage: $0 <model> [qnt] [args]"