From 10d4fc637d05c218515e5fb1488a308e616d0f51 Mon Sep 17 00:00:00 2001
From: Concedo <39025047+LostRuins@users.noreply.github.com>
Date: Mon, 23 Dec 2024 11:36:08 +0800
Subject: [PATCH] fixed a bug with drafting tokens

---
 gpttype_adapter.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/gpttype_adapter.cpp b/gpttype_adapter.cpp
index 5b76b7492..4e0140b7c 100644
--- a/gpttype_adapter.cpp
+++ b/gpttype_adapter.cpp
@@ -3611,7 +3611,7 @@ generation_outputs gpttype_generate(const generation_inputs inputs)
                 logits_to_sample = draft_results.drafted_amount;
             }
 
-            while(logits_sampled0 && !abort_draft)
+            while(logits_sampled0 && !abort_draft && !early_abort)
             {
                 if(logits_sampled>0)
                 {