llama : add n_expert and n_expert_used to hparams + change quants
This commit is contained in:
parent
d1259b7b35
commit
e640cbe055
6 changed files with 111 additions and 54 deletions
2
ggml.h
2
ggml.h
|
@@ -1051,7 +1051,7 @@ extern "C" {
|
|||
// ggml_mul_mat_id(ctx, as, ids, id, b) ~= ggml_mul_mat(as[ids[id]], b)
|
||||
GGML_API struct ggml_tensor * ggml_mul_mat_id(
|
||||
struct ggml_context * ctx,
|
||||
- struct ggml_tensor * as[],
|
||||
+ struct ggml_tensor * const as[],
|
||||
int n_as,
|
||||
struct ggml_tensor * ids,
|
||||
int id,
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue