quantize: be able to override metadata by key
This commit is contained in:
parent
e190f1fca6
commit
fc4c2a6fc3
3 changed files with 83 additions and 2 deletions
1
llama.h
1
llama.h
|
@@ -284,6 +284,7 @@ extern "C" {
|
|||
bool only_copy; // only copy tensors - ftype, allow_requantize and quantize_output_tensor are ignored
|
||||
bool pure; // quantize all tensors to the default type
|
||||
void * imatrix; // pointer to importance matrix data
|
||||
void * kv_overrides; // pointer to vector containing overrides
|
||||
} llama_model_quantize_params;
|
||||
|
||||
// grammar types
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue