gguf-py: Add IQ1_M to GGML_QUANT_SIZES
This commit is contained in:
parent
bca40e9814
commit
5622e3aa22
1 changed file with 1 addition and 0 deletions
|
@@ -859,6 +859,7 @@ GGML_QUANT_SIZES = {
|
|||
GGMLQuantizationType.I32: (1, 4),
|
||||
GGMLQuantizationType.I64: (1, 8),
|
||||
GGMLQuantizationType.F64: (1, 8),
|
||||
GGMLQuantizationType.IQ1_M: (256, QK_K // 8 + QK_K // 16 + QK_K // 32),
|
||||
}
|
||||
|
||||
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue