llama : add n_expert and n_expert_used to hparams + change quants

This commit is contained in:
Georgi Gerganov 2023-12-10 13:57:54 +02:00
parent d1259b7b35
commit e640cbe055
No known key found for this signature in database
GPG key ID: 449E073F9DC10735
6 changed files with 111 additions and 54 deletions

2
ggml.h
View file

@@ -1051,7 +1051,7 @@ extern "C" {
// ggml_mul_mat_id(ctx, as, ids, id, b) ~= ggml_mul_mat(as[ids[id]], b)
GGML_API struct ggml_tensor * ggml_mul_mat_id(
struct ggml_context * ctx,
- struct ggml_tensor * as[],
+ struct ggml_tensor * const as[],
int n_as,
struct ggml_tensor * ids,
int id,