Fixed a bug with drafting tokens: the logit sampling loop now also exits when early_abort is set

2026-05-22 03:10:03 +00:00 · 2024-12-23 11:36:08 +08:00 · 2024-12-23 11:36:08 +08:00 · 10d4fc637d
commit 10d4fc637d
parent fd5100c382
1 changed file with 1 addition and 1 deletion
--- a/gpttype_adapter.cpp
+++ b/gpttype_adapter.cpp
@@ -3611,7 +3611,7 @@ generation_outputs gpttype_generate(const generation_inputs inputs)
            {
                logits_to_sample = draft_results.drafted_amount;
            }
-            while(logits_sampled<logits_to_sample && remaining_tokens>0 && !abort_draft)
+            while(logits_sampled<logits_to_sample && remaining_tokens>0 && !abort_draft && !early_abort)
            {
                if(logits_sampled>0)
                {