mirror of
https://github.com/kvcache-ai/ktransformers.git
synced 2025-09-10 06:14:58 +00:00
clean PR code and disable flashinfer
This commit is contained in:
parent
cf4da5fd47
commit
a529518346
3 changed files with 13 additions and 23 deletions
|
@ -381,13 +381,13 @@ class TransformersInterface(BackendInterfaceBase):
|
|||
|
||||
self.profiler.create_and_start_timer("prefill")
|
||||
|
||||
|
||||
if Config().user_force_think:
|
||||
think = '<think>\n'
|
||||
print(think, end="",flush=True)
|
||||
yield think
|
||||
|
||||
for t in self.prefill(input_ids, self.check_is_new(thread_id)):
|
||||
# output think token after prefill done
|
||||
if Config().user_force_think:
|
||||
think = '<think>\n'
|
||||
print(think, end="",flush=True)
|
||||
yield think
|
||||
if t is not None:
|
||||
print(t, end="",flush=True)
|
||||
yield t
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue