llama : add n_expert and n_expert_used to hparams + change quants
This commit is contained in:
parent
d1259b7b35
commit
e640cbe055
6 changed files with 111 additions and 54 deletions
2
ggml.c
2
ggml.c
|
@@ -4075,7 +4075,7 @@ struct ggml_tensor * ggml_mul_mat(
|
|||
|
||||
struct ggml_tensor * ggml_mul_mat_id(
|
||||
struct ggml_context * ctx,
|
||||
struct ggml_tensor * as[],
|
||||
struct ggml_tensor * const as[],
|
||||
int n_as,
|
||||
struct ggml_tensor * ids,
|
||||
int id,
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue