use mmq

2023-08-30 16:42:01 +02:00 · 2023-08-30 16:42:01 +02:00 · c436f18cc4
commit c436f18cc4
parent 3ef3cf8c3d
1 changed file with 1 addition and 0 deletions
--- a/examples/llama2-chat/llama2-chat.cpp
+++ b/examples/llama2-chat/llama2-chat.cpp
@@ -25,6 +25,7 @@ struct chat {
        lparams = llama_context_default_params();
        lparams.n_ctx = 4096;
        lparams.n_gpu_layers = 99;
        lparams.mul_mat_q = true;
        model = llama_load_model_from_file(model_file.c_str(), lparams);
        if (model == NULL) {