mirror of
https://github.com/kvcache-ai/ktransformers.git
synced 2025-09-10 15:29:39 +00:00
[fix] thread context bug
This commit is contained in:
parent
299c4dca64
commit
08a8b553d6
1 changed file with 11 additions and 6 deletions
|
@@ -15,6 +15,7 @@ from ktransformers.server.schemas.assistants.assistants import AssistantObject
|
||||||
from ktransformers.server.schemas.assistants.messages import MessageCreate, MessageObject, Role
|
from ktransformers.server.schemas.assistants.messages import MessageCreate, MessageObject, Role
|
||||||
from ktransformers.server.schemas.assistants.runs import RunObject
|
from ktransformers.server.schemas.assistants.runs import RunObject
|
||||||
from ktransformers.server.schemas.assistants.threads import ThreadObject
|
from ktransformers.server.schemas.assistants.threads import ThreadObject
|
||||||
|
from ktransformers.server.schemas.endpoints.chat import RawUsage
|
||||||
from ktransformers.server.schemas.base import ObjectID, Order
|
from ktransformers.server.schemas.base import ObjectID, Order
|
||||||
from ktransformers.server.utils.multi_timer import Profiler
|
from ktransformers.server.utils.multi_timer import Profiler
|
||||||
|
|
||||||
|
@@ -142,7 +143,11 @@ class ThreadContext:
|
||||||
yield reply_message.stream_response_with_event(MessageObject.Status.in_progress)
|
yield reply_message.stream_response_with_event(MessageObject.Status.in_progress)
|
||||||
yield self.run.stream_response_with_event(RunObject.Status.in_progress)
|
yield self.run.stream_response_with_event(RunObject.Status.in_progress)
|
||||||
|
|
||||||
async for token, finish_reason in self.interface.inference(local_messages,self.thread.id):
|
async for res in self.interface.inference(local_messages,self.thread.id):
|
||||||
|
if isinstance(res, RawUsage):
|
||||||
|
raw_usage = res
|
||||||
|
else:
|
||||||
|
token, finish_reason = res
|
||||||
if self.run.status == RunObject.Status.cancelling:
|
if self.run.status == RunObject.Status.cancelling:
|
||||||
logger.warn(f'Run {self.run.id} cancelling')
|
logger.warn(f'Run {self.run.id} cancelling')
|
||||||
break
|
break
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue