diff options
author | Kawrakow <iwankawrakow@gmail.com> | 2025-07-20 09:49:59 +0200 |
---|---|---|
committer | GitHub <noreply@github.com> | 2025-07-20 09:49:59 +0200 |
commit | 07673c6c33753487dd054dcff37f19d93d6c56d3 (patch) | |
tree | e406416d8581fc7d6a82d8b4eb31c4dccb375bc5 /ggml/src/iqk/iqk_mul_mat.cpp | |
parent | 38012f7290f1761f151c415d2dc11d1af04da927 (diff) |
IQ1_M GEMM for ARM_NEON (#631)
* iq1_m GEMM on NEON
* Set repacking threshold
---------
Co-authored-by: Iwan Kawrakow <iwan.kawrakow@gmail.com>
Diffstat (limited to 'ggml/src/iqk/iqk_mul_mat.cpp')
-rw-r--r-- | ggml/src/iqk/iqk_mul_mat.cpp | 2 |
1 file changed, 1 insertion, 1 deletion
```diff
diff --git a/ggml/src/iqk/iqk_mul_mat.cpp b/ggml/src/iqk/iqk_mul_mat.cpp
index 75ca87df..d7a5c1d8 100644
--- a/ggml/src/iqk/iqk_mul_mat.cpp
+++ b/ggml/src/iqk/iqk_mul_mat.cpp
@@ -279,7 +279,7 @@ struct MulMat {
 case GGML_TYPE_Q5_K : return nrc_y >= 32 ? GGML_TYPE_Q8_1 : type;
 case GGML_TYPE_Q6_K : return nrc_y >= 64 ? GGML_TYPE_Q8_0_R8 : type;
 case GGML_TYPE_IQ1_S : return nrc_y >= 32 ? GGML_TYPE_Q8_K_R8 : type;
-case GGML_TYPE_IQ1_M : return nrc_y >= 8 ? GGML_TYPE_Q8_K_R8 : type;
+case GGML_TYPE_IQ1_M : return nrc_y >= 32 ? GGML_TYPE_Q8_K_R8 : type;
 case GGML_TYPE_IQ2_XXS: return nrc_y >= 32 ? GGML_TYPE_Q8_K_R8 : type;
 case GGML_TYPE_IQ2_XS : return nrc_y >= 32 ? GGML_TYPE_Q8_K_R8 : type;
 case GGML_TYPE_IQ2_S : return nrc_y >= 32 ? GGML_TYPE_Q8_K_R8 : type;
```