metal : support Q > 8
This commit is contained in:
parent
134c81c78d
commit
1db22d7032
3 changed files with 55 additions and 34 deletions
|
@ -104,7 +104,7 @@ int main(int argc, char ** argv) {
|
|||
|
||||
ctx_params.seed = 1234;
|
||||
ctx_params.n_ctx = n_kv_max;
|
||||
ctx_params.n_batch = 512;
|
||||
ctx_params.n_batch = 2048;
|
||||
ctx_params.mul_mat_q = mmq;
|
||||
|
||||
ctx_params.n_threads = params.n_threads;
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue