From 6cfa0809506123715216ad4e06fc03068c83324d Mon Sep 17 00:00:00 2001
From: HanClinto
Date: Tue, 9 Jul 2024 16:50:45 -0400
Subject: [PATCH] Load server sampling parameters from the server context by default.

---
 examples/server/server.cpp | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/examples/server/server.cpp b/examples/server/server.cpp
index 47bea1591..28b511303 100644
--- a/examples/server/server.cpp
+++ b/examples/server/server.cpp
@@ -884,7 +884,8 @@ struct server_context {
 
     bool launch_slot_with_task(server_slot & slot, const server_task & task) {
         slot_params default_params;
-        llama_sampling_params default_sparams;
+        // Default sampling parameters are loaded from the server context unless overridden by individual requests
+        llama_sampling_params default_sparams = params.sparams;
         auto & data = task.data;
 
         if (data.count("__oaicompat") != 0) {