summary | refs | log | tree | commit | diff
path: root/gguf-py
diff options
context:
space:
mode:
author: pmysl <piotr.myslinski@outlook.com> 2024-04-21 14:49:30 +0200
committer: GitHub <noreply@github.com> 2024-04-21 15:49:30 +0300
commit: c1386c936e9fbc38eb2816c711ab28f13355708e (patch)
tree: 9dcb24cb7039c0747127ea39f1f905dcafcbee4d /gguf-py
parent: e8d35f47cb8cb4002fca02e18aaa1cb9fa21d6f1 (diff)
gguf-py : add IQ1_M to GGML_QUANT_SIZES (#6761)
Diffstat (limited to 'gguf-py')
-rw-r--r-- gguf-py/gguf/constants.py | 1
1 file changed, 1 insertion, 0 deletions
diff --git a/gguf-py/gguf/constants.py b/gguf-py/gguf/constants.py
index ba24065a..06cb26a7 100644
--- a/gguf-py/gguf/constants.py
+++ b/gguf-py/gguf/constants.py
@@ -872,6 +872,7 @@ GGML_QUANT_SIZES = {
GGMLQuantizationType.I32: (1, 4),
GGMLQuantizationType.I64: (1, 8),
GGMLQuantizationType.F64: (1, 8),
+ GGMLQuantizationType.IQ1_M: (256, QK_K // 8 + QK_K // 16 + QK_K // 32),
}