imatrix : offload to GPU support
This commit is contained in:
parent
e0493800ce
commit
0b2fca9a9f
3 changed files with 48 additions and 33 deletions
6
ggml.h
6
ggml.h
|
@@ -2075,12 +2075,6 @@ extern "C" {
|
|||
GGML_API void ggml_init_iq2_quantization(enum ggml_type type);
|
||||
GGML_API void ggml_deinit_iq2_quantization(enum ggml_type type);
|
||||
|
||||
//
|
||||
// Importance matrix
|
||||
//
|
||||
typedef void(*ggml_collect_imatrix_t)(const struct ggml_tensor * src0, const struct ggml_tensor * src1);
|
||||
GGML_API void ggml_set_imatrix_collection(ggml_collect_imatrix_t imatrix_collect);
|
||||
|
||||
//
|
||||
// gguf
|
||||
//
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue