From 408fcb0f91dba87386d9bf02a12eb0cf71c08559 Mon Sep 17 00:00:00 2001
From: Francis Couture-Harpin
Date: Sun, 17 Mar 2024 15:34:56 -0400
Subject: [PATCH] llama : fix llama_get_embeddings_ith when the resulting id is 0

---
 llama.cpp | 10 +++++++---
 1 file changed, 7 insertions(+), 3 deletions(-)

diff --git a/llama.cpp b/llama.cpp
index 538a3af32..b82b56059 100644
--- a/llama.cpp
+++ b/llama.cpp
@@ -14650,11 +14650,13 @@ float * llama_get_logits_ith(struct llama_context * ctx, int32_t i) {
     const int32_t j = ctx->output_ids[i];
 
     llama_synchronize(ctx);
+
     if (ctx->logits && 0 <= j && (size_t) j < ctx->output_size) {
         return ctx->logits + j*ctx->model.hparams.n_vocab;
     }
     LLAMA_LOG_ERROR("%s: invalid logits id %i, reason: %s (j=%i, output_size=%li)\n",
-        __func__, i, !ctx->logits ? "no logits" : j < 0 ? "batch.logits[i] wasn't true" : "too big", j, ctx->output_size);
+        __func__, i, !ctx->logits ? "no logits" : j < 0 ? "batch.logits[i] wasn't true" : "too big",
+        j, ctx->output_size);
 #ifndef NDEBUG
     GGML_ASSERT(false);
 #endif
@@ -14672,10 +14674,12 @@ float * llama_get_embeddings_ith(struct llama_context * ctx, int32_t i) {
 
     llama_synchronize(ctx);
 
-    if (ctx->embd && 0 < j && (size_t) j < ctx->output_size) {
+    if (ctx->embd && 0 <= j && (size_t) j < ctx->output_size) {
         return ctx->embd + j*ctx->model.hparams.n_embd;
     }
-    LLAMA_LOG_ERROR("%s: invalid embeddings id %i\n", __func__, i);
+    LLAMA_LOG_ERROR("%s: invalid embeddings id %i, reason: %s (j=%i, output_size=%li)\n",
+        __func__, i, !ctx->embd ? "no embeddings" : j < 0 ? "batch.logits[i] wasn't true" : "too big",
+        j, ctx->output_size);
 #ifndef NDEBUG
     GGML_ASSERT(false);
 #endif
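
Note (illustration only, not part of the applied patch): the actual fix is the change
from 0 < j to 0 <= j in llama_get_embeddings_ith. When a batch requests a single
output, ctx->output_ids[i] maps it to row 0 of the output buffer, which the old
check rejected; llama_get_logits_ith already used 0 <= j, so only the embeddings
path failed. A minimal standalone reduction of the two checks, with hypothetical
helper names that do not exist in llama.cpp:

    #include <stdio.h>
    #include <stddef.h>

    /* Hypothetical reduction of the bounds check: j is the row index looked
     * up from ctx->output_ids[i], output_size the number of rows in the
     * output buffer. */
    static int row_valid_old(int j, size_t output_size) {
        return 0 < j && (size_t) j < output_size;  /* bug: rejects j == 0 */
    }

    static int row_valid_new(int j, size_t output_size) {
        return 0 <= j && (size_t) j < output_size; /* fix: row 0 is valid */
    }

    int main(void) {
        /* A batch with a single requested output stores it at row 0, so the
         * old check made the lookup fail exactly when id 0 was returned. */
        printf("old: %d, new: %d\n", row_valid_old(0, 1), row_valid_new(0, 1));
        return 0;
    }

This prints "old: 0, new: 1": the old predicate rejects the only valid row of a
single-output batch, while the fixed one accepts it.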