mirror of
https://github.com/kvcache-ai/ktransformers.git
synced 2025-09-11 15:54:37 +00:00
Update balance_serve.py
This commit is contained in:
parent
dc59af6167
commit
a2e95e467a
1 changed file with 1 addition and 1 deletion
|
@@ -445,7 +445,7 @@ class BalanceServeInterface(BackendInterfaceBase):
|
||||||
query_add.query_length = query_length
|
query_add.query_length = query_length
|
||||||
profiler.set_counter("prefill", query_length)
|
profiler.set_counter("prefill", query_length)
|
||||||
#@TODO add server
|
#@TODO add server
|
||||||
stop_criteria = [self.tokenizer.encode(self.tokenizer.eos_token, add_special_tokens=False),self.tokenizer.encode("<|im_end|>")]
|
stop_criteria = [self.tokenizer.encode(self.tokenizer.eos_token, add_special_tokens=False),self.tokenizer.encode("<|im_end|>", add_special_tokens=True)]
|
||||||
query_add.stop_criteria = stop_criteria
|
query_add.stop_criteria = stop_criteria
|
||||||
|
|
||||||
temperature, top_p, max_new_tokens = self.get_params(temperature, top_p, max_tokens, max_completion_tokens)
|
temperature, top_p, max_new_tokens = self.get_params(temperature, top_p, max_tokens, max_completion_tokens)
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue