From c033958d7c0055f89f0dcf738054342935c09652 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Stanis=C5=82aw=20Szymczyk?=
Date: Tue, 21 May 2024 17:53:37 +0200
Subject: [PATCH] Removed usage of output bias tensor since it's not present in DeepSeek-V2 models.

---
 llama.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/llama.cpp b/llama.cpp
index b13290b04..03bf77fa0 100644
--- a/llama.cpp
+++ b/llama.cpp
@@ -11080,7 +11080,7 @@ struct llm_build_context {
 key_states = ggml_set_inplace(ctx0, key_states, k_pe, key_states->nb[1], key_states->nb[2], key_states->nb[3], ggml_element_size(key_states) * qk_nope_head_dim);
 
 cur = llm_build_kv(ctx0, model, hparams, cparams, kv_self, gf,
- model.layers[il].wo, model.layers[il].bo,
+ model.layers[il].wo, NULL,
 key_states, value_states, query_states, KQ_mask, n_tokens, kv_head, n_kv, kq_scale, cb, il);
 }
 