From f1710b90dcd4fb47a170e8e05faceb26ed594580 Mon Sep 17 00:00:00 2001
From: anon
Date: Wed, 31 May 2023 10:35:25 -0300
Subject: [PATCH] add infinite generation when n_predict is -1

---
 examples/server/server.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/examples/server/server.cpp b/examples/server/server.cpp
index b42333228..b0f0486b7 100644
--- a/examples/server/server.cpp
+++ b/examples/server/server.cpp
@@ -250,7 +250,7 @@ struct llama_server_context
             return result;
         }
 
-        has_next_token = n_remain != 0;
+        has_next_token = params.n_predict == -1 ? true : n_remain != 0;
         return result;
     }
 