server : return error on too large embedding input

This commit is contained in:
Georgi Gerganov 2024-05-19 19:01:34 +03:00
parent f030ec1f7a
commit 85137247b2
No known key found for this signature in database
GPG key ID: 449E073F9DC10735

View file

@@ -1981,8 +1981,7 @@ struct server_context {
 slot.state = SLOT_STATE_PROCESSING;
 slot.command = SLOT_COMMAND_NONE;
 slot.release();
-slot.print_timings();
-send_final_response(slot);
+send_error(slot, "input is too large to process. increase the physical batch size", ERROR_TYPE_SERVER);
 continue;
 }
 } else {