diff --git a/src/llama.cpp b/src/llama.cpp index aae3c69b5..3d5a928a8 100644 --- a/src/llama.cpp +++ b/src/llama.cpp @@ -7217,7 +7217,7 @@ struct llm_build_context { struct ggml_tensor * Qcur = nullptr; struct ggml_tensor * Kcur = nullptr; struct ggml_tensor * Vcur = nullptr; - if (model.type == LLM_TYPE_1_5B || model.type == LLM_TYPE_4B || model.type == LLM_TYPE_9B) { + if (model.layers[il].wqkv == nullptr) { Qcur = llm_build_lora_mm(lctx, ctx0, model.layers[il].wq, cur); if (model.layers[il].bq) { Qcur = ggml_add(ctx0, Qcur, model.layers[il].bq);