From 2cf6d16c403bc1feb84666db68b6258f429ee917 Mon Sep 17 00:00:00 2001 From: Concedo <39025047+LostRuins@users.noreply.github.com> Date: Wed, 21 Aug 2024 01:06:41 +0800 Subject: [PATCH] adjust sleep time --- koboldcpp.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/koboldcpp.py b/koboldcpp.py index d1e0b0c98..786d9682b 100644 --- a/koboldcpp.py +++ b/koboldcpp.py @@ -1482,7 +1482,7 @@ class ServerRequestHandler(http.server.SimpleHTTPRequestHandler): current_token = 0 incomplete_token_buffer = bytearray() async_sleep_short = 0.02 - await asyncio.sleep(0.5) #anti race condition, prevent check from overtaking generate + await asyncio.sleep(0.35) #anti race condition, prevent check from overtaking generate try: tokenReserve = "" #keeps fully formed tokens that we cannot send out yet while True: