summaryrefslogtreecommitdiff
path: root/iqk-quantize.cpp
diff options
context:
space:
mode:
authorIwan Kawrakow <iwan.kawrakow@gmail.com>2024-07-17 16:51:34 +0300
committerIwan Kawrakow <iwan.kawrakow@gmail.com>2024-07-17 16:51:34 +0300
commit6a132862fd3826d241c0c6f43e5f91450626eeb2 (patch)
tree2b542136ad9d67f86cfaaa8f32d4ade725aa8c0d /iqk-quantize.cpp
parenta4017cc04733361838e7380d529c4a6d3ff215c6 (diff)
Fix Makefile, add GGML_USE_IQK_MULMAT ifdefs to iqk-quantize
Diffstat (limited to 'iqk-quantize.cpp')
-rw-r--r--iqk-quantize.cpp4
1 files changed, 4 insertions, 0 deletions
diff --git a/iqk-quantize.cpp b/iqk-quantize.cpp
index c7b868a5..f0b6eec4 100644
--- a/iqk-quantize.cpp
+++ b/iqk-quantize.cpp
@@ -14,7 +14,9 @@
// limitations under the License.
#include "iqk-quantize.h"
+#if GGML_USE_IQK_MULMAT
#include "iqk_mul_mat.h"
+#endif
#include "ggml-quants.h"
#include "ggml-impl.h"
#define GGML_COMMON_IMPL_C
@@ -243,9 +245,11 @@ void ggml_vec_dot_iq1_bn_q8_K64(int n, float * s, size_t bs, const void * vx, si
static_assert(QK_IQ1BN == 64, "This dot product implementation for iq1_bn requires a block size of 64");
+#if GGML_USE_IQK_MULMAT
if (iqk_mul_mat(GGML_TASK_TYPE_COMPUTE, 1, 1, n, GGML_TYPE_IQ1_BN, vx, 0, GGML_TYPE_Q8_K64, vy, 0, s, 0, 0, 1)) {
return;
}
+#endif
const block_iq1_bn * x = (const block_iq1_bn *)vx;