summaryrefslogtreecommitdiff
path: root/scripts/qnt-all.sh
diff options
context:
space:
mode:
Diffstat (limited to 'scripts/qnt-all.sh')
-rwxr-xr-xscripts/qnt-all.sh27
1 files changed, 27 insertions, 0 deletions
diff --git a/scripts/qnt-all.sh b/scripts/qnt-all.sh
new file mode 100755
index 00000000..1b3d07da
--- /dev/null
+++ b/scripts/qnt-all.sh
@@ -0,0 +1,27 @@
+#!/bin/bash
+# Quantize ../models/<model>/ggml-model-f16.gguf to each listed type with
+# ./bin/quantize, logging each run to ../tmp/results-<model>/qnt-<type>.txt.
+# $1 model dir name; $2 space-separated types (optional); $3 extra args (optional).
+
+qnt=(q8_0 q6_k q5_k q5_1 q5_0 q4_k q4_1 q4_0 q3_k q2_k)
+args=()
+
+if [ -z "$1" ]; then
+ echo "usage: $0 <model> [qnt] [args]"
+ echo "default: $0 <model> \"${qnt[*]}\" \"${args[*]}\""
+ exit 1
+fi
+
+# $2 and $3 are single strings, deliberately word-split (without globbing) into arrays.
+[ -n "$2" ] && read -r -a qnt <<< "$2"
+[ -n "$3" ] && read -r -a args <<< "$3"
+
+model="$1"
+out="../tmp/results-${model}"
+
+mkdir -p -- "${out}"
+
+for q in "${qnt[@]}"; do
+ # Extra args follow the quantize type; stderr is merged so tee logs it too.
+ time ./bin/quantize "../models/${model}/ggml-model-f16.gguf" "../models/${model}/ggml-model-${q}.gguf" "${q}" "${args[@]}" 2>&1 | tee "${out}/qnt-${q}.txt"
+done