Update completions.py

This commit is contained in:
Yuhao Tsui 2025-03-26 15:39:46 +08:00 committed by GitHub
parent 52fa671c10
commit 84164f584c
No known key found for this signature in database
GPG key ID: B5690EEEBB952194

View file

@@ -85,7 +85,11 @@ async def generate(request: Request, input: OllamaGenerateCompletionRequest):
return check_link_response(request, inner()) return check_link_response(request, inner())
else: else:
complete_response = "" complete_response = ""
async for token in interface.inference(input.prompt, id): async for res in interface.inference(input.prompt, id):
if isinstance(res, RawUsage):
raw_usage = res
else:
token, finish_reason = res
complete_response += token complete_response += token
response = OllamaGenerationResponse( response = OllamaGenerationResponse(
model=config.model_name, model=config.model_name,
@@ -187,7 +191,11 @@ async def chat(request: Request, input: OllamaChatCompletionRequest):
complete_response = "" complete_response = ""
eval_count = 0 eval_count = 0
async for token in interface.inference(prompt, id): async for res in interface.inference(prompt, id):
if isinstance(res, RawUsage):
raw_usage = res
else:
token, finish_reason = res
complete_response += token complete_response += token
eval_count += 1 eval_count += 1