From 06f1ba410eb2e47e20d5dbf573bbe6f9a36baa4a Mon Sep 17 00:00:00 2001 From: Andrei Betlen Date: Thu, 27 Jun 2024 13:43:45 -0400 Subject: [PATCH] cleanup --- src/llama.cpp | 5 ++--- 1 file changed, 2 insertions(+), 3 deletions(-) diff --git a/src/llama.cpp b/src/llama.cpp index f036fb637..1e7d5a1ea 100644 --- a/src/llama.cpp +++ b/src/llama.cpp @@ -10992,7 +10992,7 @@ struct llm_build_context { return gf; } - + struct ggml_cgraph * build_gemma2() { struct ggml_cgraph * gf = ggml_new_graph_custom(ctx0, LLAMA_MAX_NODES, false); @@ -11050,8 +11050,7 @@ struct llm_build_context { model.layers[il].wo, NULL, Kcur, Vcur, Qcur, KQ_mask, n_tokens, kv_head, n_kv, 1.0f, cb, il); } - - // is this the right place for it? + cur = llm_build_norm(ctx0, cur, hparams, model.layers[il].attn_post_norm, NULL, LLM_NORM_RMS, cb, il);