clean PR code and disable flashinfer

2025-09-10 06:14:58 +00:00 · 2025-02-19 04:42:47 +00:00 · 2025-02-19 04:42:47 +00:00 · a529518346
commit a529518346
parent cf4da5fd47
3 changed files with 13 additions and 23 deletions
--- a/ktransformers/server/backend/interfaces/transformers.py
+++ b/ktransformers/server/backend/interfaces/transformers.py
@ -381,13 +381,13 @@ class TransformersInterface(BackendInterfaceBase):

        self.profiler.create_and_start_timer("prefill")

-               
+        if Config().user_force_think:
+            think = '<think>\n'
+            print(think, end="",flush=True)
+            yield think
+        
        for t in self.prefill(input_ids, self.check_is_new(thread_id)):
            # output think token after prefill done
-            if Config().user_force_think:
-                think = '<think>\n'
-                print(think, end="",flush=True)
-                yield think
            if t is not None:
                print(t, end="",flush=True)
                yield t