Add support for I8, I16 and I32 to gguf_writer

2024-03-13 14:06:33 -06:00 · 2024-03-13 14:06:33 -06:00 · c5423753f7
commit c5423753f7
parent dc0e4d8e74
1 changed file with 7 additions and 1 deletion
--- a/gguf-py/gguf/gguf_writer.py
+++ b/gguf-py/gguf/gguf_writer.py
@@ -208,8 +208,14 @@ class GGUFWriter:
                dtype = GGMLQuantizationType.F32
            elif tensor_dtype == np.float16:
                dtype = GGMLQuantizationType.F16
            elif tensor_dtype == np.int8:
                dtype = GGMLQuantizationType.I8
            elif tensor_dtype == np.int16:
                dtype = GGMLQuantizationType.I16
            elif tensor_dtype == np.int32:
                dtype = GGMLQuantizationType.I32
            else:
-                raise ValueError("Only F32 and F16 tensors are supported for now")
+                raise ValueError("Only F32, F16, I8, I16, I32 tensors are supported for now")
        else:
            dtype = raw_dtype
        self.ti_data += self._pack("I", dtype)