Update src/llama.cpp

Co-authored-by: compilade <git@compilade.net>
2024-08-09 02:06:04 -07:00 · 2024-08-09 02:06:04 -07:00 · 092382fee3
commit 092382fee3
parent b841554d0c
1 changed file with 1 addition and 1 deletion
--- a/src/llama.cpp
+++ b/src/llama.cpp
@@ -13854,7 +13854,7 @@ struct llm_build_context {
            // self-attention
            {
                // compute Q and K and RoPE them
-                struct ggml_tensor * Qcur = ggml_mul_mat(ctx0, model.layers[il].wq, cur);
+                struct ggml_tensor * Qcur = llm_build_lora_mm(lctx, ctx0, model.layers[il].wq, cur);
                cb(Qcur, "Qcur", il);
                if (model.layers[il].bq) {
                    Qcur = ggml_add(ctx0, Qcur, model.layers[il].bq);