diff options
Diffstat (limited to 'ggml/src/ggml-common.h')
-rw-r--r-- | ggml/src/ggml-common.h | 18 |
1 files changed, 18 insertions, 0 deletions
diff --git a/ggml/src/ggml-common.h b/ggml/src/ggml-common.h
index 26041ac2..5fe27b29 100644
--- a/ggml/src/ggml-common.h
+++ b/ggml/src/ggml-common.h
@@ -621,6 +621,24 @@ typedef struct {
 static_assert(sizeof(block_iq2_ks) == sizeof(uint16_t) + QK_K/64 + QK_K/4, "wrong iq2_ks block size/padding");
 
 typedef struct {
+    uint8_t scales[QK_K/64];
+    uint8_t ql[QK_K/4];
+} block_iq2_kt;
+static_assert(sizeof(block_iq2_kt) == QK_K/4 + QK_K/64, "wrong iq2_kt block size/padding");
+
+typedef struct {
+    uint8_t scales[QK_K/64];
+    uint8_t ql[QK_K/4];
+    uint8_t qh[QK_K/8];
+} block_iq3_kt;
+static_assert(sizeof(block_iq3_kt) == QK_K/4 + QK_K/8 + QK_K/64, "wrong iq3_kt block size/padding");
+
+typedef struct {
+    uint32_t qs[QK_K/8];
+} block_iq4_kt;
+static_assert(sizeof(block_iq4_kt) == QK_K/2, "wrong iq4_kt block size/padding");
+
+typedef struct {
     ggml_half d;
     uint16_t extra;
     uint16_t scales_h;