Load server sampling parameters from the server context by default.
This commit is contained in:
parent
fd560fe680
commit
6cfa080950
1 changed file with 2 additions and 1 deletion
|
@@ -884,7 +884,8 @@ struct server_context {
|
||||||
|
|
||||||
bool launch_slot_with_task(server_slot & slot, const server_task & task) {
|
bool launch_slot_with_task(server_slot & slot, const server_task & task) {
|
||||||
slot_params default_params;
|
slot_params default_params;
|
||||||
llama_sampling_params default_sparams;
|
// Default sampling parameters are loaded from the server context unless overridden by individual requests
|
||||||
|
llama_sampling_params default_sparams = params.sparams;
|
||||||
auto & data = task.data;
|
auto & data = task.data;
|
||||||
|
|
||||||
if (data.count("__oaicompat") != 0) {
|
if (data.count("__oaicompat") != 0) {
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue