summary | refs | log | tree | commit | diff
path: root/ggml/src
diff options
context:
space:
mode:
author: Kawrakow <iwankawrakow@gmail.com> 2025-04-25 19:48:08 +0200
committer: GitHub <noreply@github.com> 2025-04-25 19:48:08 +0200
commit: 770892086c15471a397a6a1a196986de906cdc91 (patch)
tree: d74bac28ba73fb8f335b8d1d6da486c3ffe7f6e8 /ggml/src
parent: c817160d0395ddbc2ad79d3c0ce52a4da63ac81d (diff)
Fix q4_1 and q5_1 on Arm (#348)
Co-authored-by: Iwan Kawrakow <iwan.kawrakow@gmail.com>
Diffstat (limited to 'ggml/src')
-rw-r--r-- ggml/src/ggml.c 8
1 files changed, 8 insertions, 0 deletions
diff --git a/ggml/src/ggml.c b/ggml/src/ggml.c
index 83a48cb6..ad9393cc 100644
--- a/ggml/src/ggml.c
+++ b/ggml/src/ggml.c
@@ -741,8 +741,12 @@ static const ggml_type_traits_t type_traits[GGML_TYPE_COUNT] = {
.from_float_ref = (ggml_from_float_t) quantize_row_q4_1_ref,
.vec_dot = ggml_vec_dot_q4_1_q8_1,
#if GGML_USE_IQK_MULMAT
+#if defined __AVX2__
.vec_dot_type = GGML_TYPE_Q8_2_X4,
#else
+ .vec_dot_type = GGML_TYPE_Q8_1_X4,
+#endif
+#else
.vec_dot_type = GGML_TYPE_Q8_1,
#endif
#if defined (__ARM_FEATURE_MATMUL_INT8)
@@ -809,8 +813,12 @@ static const ggml_type_traits_t type_traits[GGML_TYPE_COUNT] = {
.from_float_ref = (ggml_from_float_t) quantize_row_q5_1_ref,
.vec_dot = ggml_vec_dot_q5_1_q8_1,
#if GGML_USE_IQK_MULMAT
+#ifdef __AVX2__
.vec_dot_type = GGML_TYPE_Q8_2_X4,
#else
+ .vec_dot_type = GGML_TYPE_Q8_1_X4,
+#endif
+#else
.vec_dot_type = GGML_TYPE_Q8_1,
#endif
.nrows = 1,