git.djapps.eu Git - pkg/ggml/sources/llama.cpp/commitdiff
falcon : write file type
author: Georgi Gerganov <redacted>
Thu, 24 Aug 2023 16:58:30 +0000 (19:58 +0300)
committer: Georgi Gerganov <redacted>
Thu, 24 Aug 2023 16:58:30 +0000 (19:58 +0300)
convert-falcon-hf-to-gguf.py
scripts/run-all-ppl.sh

index 43e208497a7bc14d5ada46a1902b1d4b24001afd..411cbf682d67d1f61e9f7bfe7ecc295e3c1f4ed4 100755 (executable)
@@ -107,6 +107,7 @@ if "n_head_kv" in hparams:
 else:
     gguf_writer.add_head_count_kv(1)
 gguf_writer.add_layer_norm_eps(hparams["layer_norm_epsilon"])
+gguf_writer.add_file_type(ftype)
 
 # TOKENIZATION
 
index bdbbb19c9472e0054e2a3275adc6f42c9297bf3b..366d0866cb280e6ad3a1c0fa48d65168aeefa9e5 100755 (executable)
@@ -1,7 +1,7 @@
 #!/bin/bash
 
 qnt=(f16 q8_0 q6_k q5_k q5_1 q5_0 q4_k q4_1 q4_0 q3_k q2_k)
-args="--no-mmap -ngl 999 -t 8"
+args="-ngl 999 -t 8"
 
 if [ -z "$1" ]; then
     echo "usage: $0 <model> [qnt] [args]"