llama : add n_expert and n_expert_used to hparams + change quants

2023-12-10 13:57:54 +02:00 · 2023-12-10 13:57:54 +02:00 · e640cbe055
commit e640cbe055
parent d1259b7b35
6 changed files with 111 additions and 54 deletions
--- a/ggml.c
+++ b/ggml.c
@@ -4075,7 +4075,7 @@ struct ggml_tensor * ggml_mul_mat(

 struct ggml_tensor * ggml_mul_mat_id(
        struct ggml_context * ctx,
-        struct ggml_tensor  * as[],
+        struct ggml_tensor  * const as[],
        int                   n_as,
        struct ggml_tensor  * ids,
        int                   id,