From 4e5b6293aba4528eee9b165a21f248d1ae50ecec Mon Sep 17 00:00:00 2001 From: Concedo <39025047+LostRuins@users.noreply.github.com> Date: Sun, 8 Oct 2023 23:12:45 +0800 Subject: [PATCH] adjust streaming timings --- koboldcpp.py | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/koboldcpp.py b/koboldcpp.py index 0fc72c1fa..0b0b9f31f 100755 --- a/koboldcpp.py +++ b/koboldcpp.py @@ -361,7 +361,7 @@ maxhordelen = 256 modelbusy = threading.Lock() requestsinqueue = 0 defaultport = 5001 -KcppVersion = "1.46" +KcppVersion = "1.46.1" showdebug = True showsamplerwarning = True showmaxctxwarning = True @@ -540,8 +540,9 @@ class ServerRequestHandler(http.server.SimpleHTTPRequestHandler): # flush buffers, sleep a bit to make sure all data sent, and then force close the connection self.wfile.flush() - await asyncio.sleep(0.1) + await asyncio.sleep(0.2) self.close_connection = True + await asyncio.sleep(0.1) async def handle_request(self, genparams, api_format, stream_flag):