From b0541f36523ace67770e56dd5daaeaca099bc469 Mon Sep 17 00:00:00 2001 From: Concedo <39025047+LostRuins@users.noreply.github.com> Date: Mon, 10 Mar 2025 22:03:20 +0800 Subject: [PATCH] added draft results --- gpttype_adapter.cpp | 9 +++++++++ 1 file changed, 9 insertions(+) diff --git a/gpttype_adapter.cpp b/gpttype_adapter.cpp index 134c4297d..51526a194 100644 --- a/gpttype_adapter.cpp +++ b/gpttype_adapter.cpp @@ -3357,6 +3357,8 @@ generation_outputs gpttype_generate(const generation_inputs inputs) speculative_draft_result draft_results; //only use if drafting was used bool draft_used = false; + int draft_successes = 0; + int draft_failures = 0; time0 = timer_check(); timer_start(); @@ -3665,7 +3667,10 @@ generation_outputs gpttype_generate(const generation_inputs inputs) } if(draftedid!=id) //draft mismatch, abort { + draft_failures += 1; abort_draft = true; + } else { + draft_successes += 1; } } @@ -3983,6 +3988,10 @@ generation_outputs gpttype_generate(const generation_inputs inputs) float ts2 = (1000.0/pt2); float tokens_per_second = (realnpredict <= 0 ? 0 : realnpredict / (time1 + time2)); printf("\n[%s] CtxLimit:%d/%d, Amt:%d/%d, Init:%.2fs, Process:%.2fs (%.1fms/T = %.2fT/s), Generate:%.2fs (%.1fms/T = %.2fT/s), Total:%.2fs (%.2fT/s)",get_timestamp_str().c_str(),(int)current_context_tokens.size(),(int)nctx, realnpredict, kcpp_data->n_predict, time0, time1, pt1, ts1, time2, pt2, ts2, (time1 + time2), tokens_per_second); + if(debugmode==1 && !is_quiet && (draft_successes+draft_failures)>0) + { + printf("\n(Draft Results - Success:%d, Failure:%d)",draft_successes,draft_failures); + } fflush(stdout); output.status = 1; int finaltokcount = (int)current_context_tokens.size()-realnpredict;