IQ2_S_R4 (#156)

* iq2_s_r4: Zen4
* Minor
* iq2_s_r4: NEON

---------

Co-authored-by: Iwan Kawrakow <iwan.kawrakow@gmail.com>
author: Kawrakow <iwankawrakow@gmail.com> 2024-12-21 11:26:35 +0100
committer: GitHub <noreply@github.com> 2024-12-21 11:26:35 +0100
commit: 93419de68f90fede135480a2717785d519df9f42 (patch)
tree: 615164646770d7fdb596f04af2d887a8441f3afb /examples/quantize/quantize.cpp
parent: a867b919ca1e26cc828f98c35b4c6926e8e54762 (diff)
1 file changed, 1 insertion, 0 deletions
diff --git a/examples/quantize/quantize.cpp b/examples/quantize/quantize.cpp
index dbae9792..1599405b 100644
--- a/examples/quantize/quantize.cpp
+++ b/examples/quantize/quantize.cpp
@@ -27,6 +27,7 @@ static const std::vector<struct quant_option> QUANT_OPTIONS = {
     { "IQ2_XS_R4",LLAMA_FTYPE_MOSTLY_IQ2_XS_R4,"IQ2_XS repacked",            },
     { "IQ2_S",    LLAMA_FTYPE_MOSTLY_IQ2_S,    " 2.5  bpw quantization",            },
     { "IQ2_M",    LLAMA_FTYPE_MOSTLY_IQ2_M,    " 2.7  bpw quantization",            },
+    { "IQ2_M_R4", LLAMA_FTYPE_MOSTLY_IQ2_M_R4, " 2.7  bpw quantization",            },
     { "IQ1_S",    LLAMA_FTYPE_MOSTLY_IQ1_S,    " 1.56 bpw quantization",            },
     { "IQ1_M",    LLAMA_FTYPE_MOSTLY_IQ1_M,    " 1.75 bpw quantization",            },
     { "IQ1_BN",   LLAMA_FTYPE_MOSTLY_IQ1_BN,   " 1.62 bpw quantization (Bitnet)",   },
author	Kawrakow <iwankawrakow@gmail.com>	2024-12-21 11:26:35 +0100
committer	GitHub <noreply@github.com>	2024-12-21 11:26:35 +0100
commit	93419de68f90fede135480a2717785d519df9f42 (patch)
tree	615164646770d7fdb596f04af2d887a8441f3afb /examples/quantize/quantize.cpp
parent	a867b919ca1e26cc828f98c35b4c6926e8e54762 (diff)