diff options
Diffstat (limited to 'ggml/src/ggml.c')
-rw-r--r-- | ggml/src/ggml.c | 4 |
1 files changed, 2 insertions, 2 deletions
diff --git a/ggml/src/ggml.c b/ggml/src/ggml.c index 0aee8dd4..ad092923 100644 --- a/ggml/src/ggml.c +++ b/ggml/src/ggml.c @@ -14,6 +14,7 @@ #include "iqk/iqk_quantize.h" #if GGML_USE_IQK_MULMAT #include "iqk/iqk_mul_mat.h" +#include "iqk/iqk_config.h" #endif #if defined(_MSC_VER) || defined(__MINGW32__) @@ -847,11 +848,10 @@ static const ggml_type_traits_t type_traits[GGML_TYPE_COUNT] = { .from_float_to_mat = quantize_mat_q8_0, .vec_dot = ggml_vec_dot_q8_0_q8_0, #if GGML_USE_IQK_MULMAT -#if defined(__AVX512F__) && defined(__AVX512VNNI__) && defined(__AVX512VL__) && defined(__AVX512BW__) && defined(__AVX512DQ__) +#ifdef HAVE_FANCY_SIMD // Remember: we cannot add 128 to the Q8 quants and use iblock sum in Q8_1 to subtract as we do on Zen4 for pure AVX2 // because there the result of the _mm256_maddubs_epi16() instruction may overflow the int16_t range // (and it gets satured if it does), leading to wrong results. - // TODO: expose HAVE_FANCY_SIMD from iqk_mul_mat.cpp and use #ifdef HAVE_FANCY_SIMD instead of the above. .vec_dot_type = GGML_TYPE_Q8_1_X4, #else .vec_dot_type = GGML_TYPE_Q8_0_X4, |