From 8ffad187abbb93b74db8ef813b6fdceec80e02b0 Mon Sep 17 00:00:00 2001
From: Kawrakow
Date: Thu, 5 Jun 2025 08:31:20 +0300
Subject: MMQ implementation for IQ4_KS_R4 and IQ5_KS_R4 (#493)

* MMQ for iq4_ks_r4

* MMQ for iq5_ks_r4

* Add forgotten file

* Another forgotten file

---------

Co-authored-by: Iwan Kawrakow
---
 ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_ks_r4.cu | 5 +++++
 ggml/src/ggml-cuda/template-instances/mmq-instance-iq5_ks_r4.cu | 5 +++++
 2 files changed, 10 insertions(+)
 create mode 100644 ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_ks_r4.cu
 create mode 100644 ggml/src/ggml-cuda/template-instances/mmq-instance-iq5_ks_r4.cu

(limited to 'ggml/src/ggml-cuda/template-instances')

diff --git a/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_ks_r4.cu b/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_ks_r4.cu
new file mode 100644
index 00000000..d0f08ce8
--- /dev/null
+++ b/ggml/src/ggml-cuda/template-instances/mmq-instance-iq4_ks_r4.cu
@@ -0,0 +1,5 @@
+// This file has been autogenerated by generate_cu_files.py, do not edit manually.
+
+#include "../mmq.cuh"
+
+DECL_MMQ_CASE(GGML_TYPE_IQ4_KS_R4);
diff --git a/ggml/src/ggml-cuda/template-instances/mmq-instance-iq5_ks_r4.cu b/ggml/src/ggml-cuda/template-instances/mmq-instance-iq5_ks_r4.cu
new file mode 100644
index 00000000..0cc77dc0
--- /dev/null
+++ b/ggml/src/ggml-cuda/template-instances/mmq-instance-iq5_ks_r4.cu
@@ -0,0 +1,5 @@
+// This file has been autogenerated by generate_cu_files.py, do not edit manually.
+
+#include "../mmq.cuh"
+
+DECL_MMQ_CASE(GGML_TYPE_IQ5_KS_R4);
--
cgit v1.2.3