From e20765534d3b098afb804c7660c66b5e1d4719cb Mon Sep 17 00:00:00 2001
From: Ebey Abraham <ebeyabraham@microsoft.com>
Date: Sat, 16 Dec 2023 00:41:06 +0000
Subject: [PATCH] Fix breaking change: label pre-bias output "result_norm" and read embeddings from nodes[n_nodes - 2]

---
 llama.cpp | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/llama.cpp b/llama.cpp
index e229ecfe3..162692ce8 100644
--- a/llama.cpp
+++ b/llama.cpp
@@ -5591,7 +5591,7 @@ struct llm_build_context {
         cb(cur, "result_norm", -1);
         
         cur = ggml_mul_mat(ctx0, model.output, cur);
-        cb(cur, "result_output", -1);
+        cb(cur, "result_norm", -1);
 
         cur = ggml_add(ctx0, cur, model.output_b);
         cb(cur, "result_output", -1);
@@ -6236,7 +6236,7 @@ static int llama_decode_internal(
     ggml_allocr_alloc_graph(lctx.alloc, gf);
 
     struct ggml_tensor * res        = gf->nodes[gf->n_nodes - 1];
-    struct ggml_tensor * embeddings = gf->nodes[gf->n_nodes - 3];
+    struct ggml_tensor * embeddings = gf->nodes[gf->n_nodes - 2];
 
     GGML_ASSERT(strcmp(res->name,        "result_output") == 0);
     GGML_ASSERT(strcmp(embeddings->name, "result_norm")   == 0);