imatrix : offload to GPU support

2024-01-15 16:18:11 +02:00 · 2024-01-15 16:18:11 +02:00 · 0b2fca9a9f
commit 0b2fca9a9f
parent e0493800ce
3 changed files with 48 additions and 33 deletions
--- a/ggml.h
+++ b/ggml.h
@@ -2075,12 +2075,6 @@ extern "C" {
    GGML_API void ggml_init_iq2_quantization(enum ggml_type type);
    GGML_API void ggml_deinit_iq2_quantization(enum ggml_type type);

-    //
-    // Importance matrix
-    //
-    typedef void(*ggml_collect_imatrix_t)(const struct ggml_tensor * src0, const struct ggml_tensor * src1);
-    GGML_API void ggml_set_imatrix_collection(ggml_collect_imatrix_t imatrix_collect);
-
    //
    // gguf
    //