quantize: be able to override metadata by key

2024-03-26 11:53:42 +02:00 · 2024-03-26 11:53:42 +02:00 · fc4c2a6fc3
commit fc4c2a6fc3
parent e190f1fca6
3 changed files with 83 additions and 2 deletions
--- a/llama.h
+++ b/llama.h
@@ -284,6 +284,7 @@ extern "C" {
        bool only_copy;                      // only copy tensors - ftype, allow_requantize and quantize_output_tensor are ignored
        bool pure;                           // quantize all tensors to the default type
        void * imatrix;                      // pointer to importance matrix data
+        void * kv_overrides;                 // pointer to vector containing overrides
    } llama_model_quantize_params;

    // grammar types