imatrix : use GGUF to store imatrix data

2024-09-06 17:17:25 -04:00 · 2024-09-06 17:17:25 -04:00 · 3de9300c37
commit 3de9300c37
parent 347247a24e
4 changed files with 352 additions and 149 deletions
--- a/gguf-py/gguf/constants.py
+++ b/gguf-py/gguf/constants.py
@@ -167,6 +167,12 @@ class Keys:
        TYPE       = "adapter.type"
        LORA_ALPHA = "adapter.lora.alpha"

+    class IMatrix:
+        CHUNK_COUNT = "imatrix.chunk_count"
+        CHUNK_SIZE  = "imatrix.chunk_size"
+        DATASET     = "imatrix.dataset"
+
+
 #
 # recommended mapping of model tensor names for storage in gguf
 #
@@ -175,6 +181,7 @@ class Keys:
 class GGUFType:
    MODEL   = "model"
    ADAPTER = "adapter"
+    IMATRIX = "imatrix"


 class MODEL_ARCH(IntEnum):