summary refs log tree commit diff
path: root/ggml/src/ggml-cuda/common.cuh
diff options
context:
space:
mode:
author Iwan Kawrakow <iwan.kawrakow@gmail.com> 2024-08-01 16:08:32 +0300
committer Kawrakow <48489457+ikawrakow@users.noreply.github.com> 2024-08-09 16:00:31 +0200
commit cfb0410067be051dd8ea76c08280a3b04d5a5188 (patch)
tree 64ffc06e18f75a8cfc4d04b98875f68cd7fa99d4 /ggml/src/ggml-cuda/common.cuh
parent a9f302ebe2373321c12b01d8760904901aa064a4 (diff)
iq6_k: WIP (nothing works)
Diffstat (limited to 'ggml/src/ggml-cuda/common.cuh')
-rw-r--r-- ggml/src/ggml-cuda/common.cuh | 7
1 files changed, 7 insertions, 0 deletions
diff --git a/ggml/src/ggml-cuda/common.cuh b/ggml/src/ggml-cuda/common.cuh
index c18e865a..07a53bcd 100644
--- a/ggml/src/ggml-cuda/common.cuh
+++ b/ggml/src/ggml-cuda/common.cuh
@@ -705,6 +705,13 @@ struct ggml_cuda_type_traits<GGML_TYPE_IQ5_K> {
};
template<>
+struct ggml_cuda_type_traits<GGML_TYPE_IQ6_K> {
+ static constexpr int qk = QK_K;
+ static constexpr int qr = QR6_XS;
+ static constexpr int qi = QI6_XS;
+};
+
+template<>
struct ggml_cuda_type_traits<GGML_TYPE_IQ3_S> {
static constexpr int qk = QK_K;
static constexpr int qr = QR3_S;