falcon : write file type

author Georgi Gerganov <redacted>

Thu, 24 Aug 2023 16:58:30 +0000 (19:58 +0300)

committer Georgi Gerganov <redacted>

Thu, 24 Aug 2023 16:58:30 +0000 (19:58 +0300)
author Georgi Gerganov <redacted>
Thu, 24 Aug 2023 16:58:30 +0000 (19:58 +0300)
committer Georgi Gerganov <redacted>
Thu, 24 Aug 2023 16:58:30 +0000 (19:58 +0300)
diff --git a/convert-falcon-hf-to-gguf.py b/convert-falcon-hf-to-gguf.py

index 43e208497a7bc14d5ada46a1902b1d4b24001afd..411cbf682d67d1f61e9f7bfe7ecc295e3c1f4ed4 100755 (executable)
--- a/convert-falcon-hf-to-gguf.py
+++ b/convert-falcon-hf-to-gguf.py
@@ -107,6 +107,7 @@ if "n_head_kv" in hparams:
  else:
      gguf_writer.add_head_count_kv(1)
  gguf_writer.add_layer_norm_eps(hparams["layer_norm_epsilon"])
+gguf_writer.add_file_type(ftype)
  
  # TOKENIZATION
  
diff --git a/scripts/run-all-ppl.sh b/scripts/run-all-ppl.sh

index bdbbb19c9472e0054e2a3275adc6f42c9297bf3b..366d0866cb280e6ad3a1c0fa48d65168aeefa9e5 100755 (executable)
--- a/scripts/run-all-ppl.sh
+++ b/scripts/run-all-ppl.sh
@@ -1,7 +1,7 @@
  #!/bin/bash
  
  qnt=(f16 q8_0 q6_k q5_k q5_1 q5_0 q4_k q4_1 q4_0 q3_k q2_k)
-args="--no-mmap -ngl 999 -t 8"
+args="-ngl 999 -t 8"
  
  if [ -z "$1" ]; then
      echo "usage: $0 <model> [qnt] [args]"
author	Georgi Gerganov <redacted>
	Thu, 24 Aug 2023 16:58:30 +0000 (19:58 +0300)
committer	Georgi Gerganov <redacted>
	Thu, 24 Aug 2023 16:58:30 +0000 (19:58 +0300)
convert-falcon-hf-to-gguf.py		patch | blob | history
scripts/run-all-ppl.sh		patch | blob | history