gguf-py: Add IQ1_M to GGML_QUANT_SIZES

This commit is contained in:
Piotr Myśliński 2024-04-19 06:59:07 +02:00
parent bca40e9814
commit 5622e3aa22

View file

@@ -859,6 +859,7 @@ GGML_QUANT_SIZES = {
     GGMLQuantizationType.I32: (1, 4),
     GGMLQuantizationType.I64: (1, 8),
     GGMLQuantizationType.F64: (1, 8),
+    GGMLQuantizationType.IQ1_M: (256, QK_K // 8 + QK_K // 16 + QK_K // 32),
 }