diff --git a/src/llama.cpp b/src/llama.cpp index a4ceb0959..b42cc5fb4 100644 --- a/src/llama.cpp +++ b/src/llama.cpp @@ -7867,10 +7867,9 @@ static struct ggml_tensor * llm_build_lora_mm( continue; } // TODO: check if lora_a need transpose - struct ggml_tensor * a = ggml_cont(ctx0, ggml_transpose(ctx0, lora->a)); struct ggml_tensor * ab_cur = ggml_mul_mat( ctx0, lora->b, - ggml_mul_mat(ctx0, a, cur) + ggml_mul_mat(ctx0, lora->a, cur) ); ab_cur = ggml_scale_inplace(ctx0, ab_cur, scale); res = ggml_add(ctx0, res, ab_cur);