From 2927cca6113313762a78b8f5cd4048d795198130 Mon Sep 17 00:00:00 2001 From: Jonas Templestein <242550+jonastemplestein@users.noreply.github.com> Date: Fri, 10 Nov 2023 21:26:48 +0100 Subject: [PATCH] Fix bug where POST /infill doesn't work without prompt argument Fixes https://github.com/ggerganov/llama.cpp/issues/4027 --- examples/server/server.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/examples/server/server.cpp b/examples/server/server.cpp index cbf36ad67..c096ebf57 100644 --- a/examples/server/server.cpp +++ b/examples/server/server.cpp @@ -1510,7 +1510,7 @@ struct llama_server_context const bool has_prompt = slot.prompt.is_array() || (slot.prompt.is_string() && !slot.prompt.get<std::string>().empty()) || !slot.images.empty(); // empty prompt passed -> release the slot and send empty response - if (slot.state == IDLE && slot.command == LOAD_PROMPT && !has_prompt) + if (slot.state == IDLE && slot.command == LOAD_PROMPT && !has_prompt && !slot.infill) { slot.release(); slot.print_timings();