llama : add n_expert and n_expert_used to hparams + change quants

2023-12-10 13:57:54 +02:00 · 2023-12-10 13:57:54 +02:00 · e640cbe055
commit e640cbe055
parent d1259b7b35
6 changed files with 111 additions and 54 deletions
--- a/ggml.h
+++ b/ggml.h
@@ -1051,7 +1051,7 @@ extern "C" {
    //  ggml_mul_mat_id(ctx, as, ids, id, b) ~= ggml_mul_mat(as[ids[id]], b)
    GGML_API struct ggml_tensor * ggml_mul_mat_id(
            struct ggml_context * ctx,
-            struct ggml_tensor  * as[],
+            struct ggml_tensor  * const as[],
            int                   n_as,
            struct ggml_tensor  * ids,
            int                   id,