Revert repetition_penalty as it is not in API spec

2025-09-10 06:14:58 +00:00 · 2025-02-24 21:30:03 +08:00 · 2025-02-24 21:30:03 +08:00 · 76487c4dcb
commit 76487c4dcb
parent 05ad288453
5 changed files with 12 additions and 14 deletions
--- a/ktransformers/server/api/openai/endpoints/chat.py
+++ b/ktransformers/server/api/openai/endpoints/chat.py
@@ -28,13 +28,13 @@ async def chat_completion(request:Request,create:ChatCompletionCreate):
    if create.stream:
        async def inner():
            chunk = ChatCompletionChunk(id=id,object='chat.completion.chunk',created=int(time()))
-            async for token in interface.inference(input_message,id,create.temperature,create.top_p,create.repetition_penalty):
+            async for token in interface.inference(input_message,id,create.temperature,create.top_p):
                chunk.set_token(token)
                yield chunk
        return chat_stream_response(request,inner())
    else:
        comp = ChatCompletionObject(id=id,object='chat.completion',created=int(time()))
        comp.usage = Usage(completion_tokens=1, prompt_tokens=1, total_tokens=2)
-        async for token in interface.inference(input_message,id,create.temperature,create.top_p,create.repetition_penalty):
+        async for token in interface.inference(input_message,id,create.temperature,create.top_p):
            comp.append_token(token)
        return comp