diff options
author | Iwan Kawrakow <iwan.kawrakow@gmail.com> | 2024-08-01 16:08:32 +0300 |
---|---|---|
committer | Kawrakow <48489457+ikawrakow@users.noreply.github.com> | 2024-08-09 16:00:31 +0200 |
commit | cfb0410067be051dd8ea76c08280a3b04d5a5188 (patch) | |
tree | 64ffc06e18f75a8cfc4d04b98875f68cd7fa99d4 /ggml/src/ggml-cuda/common.cuh | |
parent | a9f302ebe2373321c12b01d8760904901aa064a4 (diff) |
iq6_k: WIP (nothing works)
Diffstat (limited to 'ggml/src/ggml-cuda/common.cuh')
-rw-r--r-- | ggml/src/ggml-cuda/common.cuh | 7 |
1 file changed, 7 insertions, 0 deletions
diff --git a/ggml/src/ggml-cuda/common.cuh b/ggml/src/ggml-cuda/common.cuh
index c18e865a..07a53bcd 100644
--- a/ggml/src/ggml-cuda/common.cuh
+++ b/ggml/src/ggml-cuda/common.cuh
@@ -705,6 +705,13 @@ struct ggml_cuda_type_traits<GGML_TYPE_IQ5_K> {
 };
 
 template<>
+struct ggml_cuda_type_traits<GGML_TYPE_IQ6_K> {
+    static constexpr int qk = QK_K;
+    static constexpr int qr = QR6_XS;
+    static constexpr int qi = QI6_XS;
+};
+
+template<>
 struct ggml_cuda_type_traits<GGML_TYPE_IQ3_S> {
     static constexpr int qk = QK_K;
     static constexpr int qr = QR3_S;