From c1386c936e9fbc38eb2816c711ab28f13355708e Mon Sep 17 00:00:00 2001 From: pmysl Date: Sun, 21 Apr 2024 14:49:30 +0200 Subject: [PATCH] gguf-py : add IQ1_M to GGML_QUANT_SIZES (#6761) --- gguf-py/gguf/constants.py | 1 + 1 file changed, 1 insertion(+) diff --git a/gguf-py/gguf/constants.py b/gguf-py/gguf/constants.py index ba24065a8..06cb26a7d 100644 --- a/gguf-py/gguf/constants.py +++ b/gguf-py/gguf/constants.py @@ -872,6 +872,7 @@ GGML_QUANT_SIZES = { GGMLQuantizationType.I32: (1, 4), GGMLQuantizationType.I64: (1, 8), GGMLQuantizationType.F64: (1, 8), + GGMLQuantizationType.IQ1_M: (256, QK_K // 8 + QK_K // 16 + QK_K // 32), }