summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author Georgi Gerganov <ggerganov@gmail.com> 2023-08-24 19:58:30 +0300
committer Georgi Gerganov <ggerganov@gmail.com> 2023-08-24 19:58:30 +0300
commit 01f2224682b08185af609b28b1268b95c8b4cfa2 (patch)
tree 729f6e761fa83f2692837aa738f393da74741fbd
parent 38b16dfca6e5032e6cfb90c1653bf1ba4cf647b4 (diff)
falcon : write file type
-rwxr-xr-x convert-falcon-hf-to-gguf.py 1
-rwxr-xr-x scripts/run-all-ppl.sh 2
2 files changed, 2 insertions, 1 deletions
diff --git a/convert-falcon-hf-to-gguf.py b/convert-falcon-hf-to-gguf.py
index 43e20849..411cbf68 100755
--- a/convert-falcon-hf-to-gguf.py
+++ b/convert-falcon-hf-to-gguf.py
@@ -107,6 +107,7 @@ if "n_head_kv" in hparams:
else:
gguf_writer.add_head_count_kv(1)
gguf_writer.add_layer_norm_eps(hparams["layer_norm_epsilon"])
+gguf_writer.add_file_type(ftype)
# TOKENIZATION
diff --git a/scripts/run-all-ppl.sh b/scripts/run-all-ppl.sh
index bdbbb19c..366d0866 100755
--- a/scripts/run-all-ppl.sh
+++ b/scripts/run-all-ppl.sh
@@ -1,7 +1,7 @@
#!/bin/bash
qnt=(f16 q8_0 q6_k q5_k q5_1 q5_0 q4_k q4_1 q4_0 q3_k q2_k)
-args="--no-mmap -ngl 999 -t 8"
+args="-ngl 999 -t 8"
if [ -z "$1" ]; then
echo "usage: $0 <model> [qnt] [args]"