mirror of
https://github.com/LostRuins/koboldcpp.git
synced 2025-09-10 00:54:41 +00:00
added draft results
This commit is contained in:
parent
3a406b37a7
commit
b0541f3652
1 changed files with 9 additions and 0 deletions
|
@ -3357,6 +3357,8 @@ generation_outputs gpttype_generate(const generation_inputs inputs)
|
|||
|
||||
speculative_draft_result draft_results; //only use if drafting was used
|
||||
bool draft_used = false;
|
||||
int draft_successes = 0;
|
||||
int draft_failures = 0;
|
||||
|
||||
time0 = timer_check();
|
||||
timer_start();
|
||||
|
@ -3665,7 +3667,10 @@ generation_outputs gpttype_generate(const generation_inputs inputs)
|
|||
}
|
||||
if(draftedid!=id) //draft mismatch, abort
|
||||
{
|
||||
draft_failures += 1;
|
||||
abort_draft = true;
|
||||
} else {
|
||||
draft_successes += 1;
|
||||
}
|
||||
}
|
||||
|
||||
|
@ -3983,6 +3988,10 @@ generation_outputs gpttype_generate(const generation_inputs inputs)
|
|||
float ts2 = (1000.0/pt2);
|
||||
float tokens_per_second = (realnpredict <= 0 ? 0 : realnpredict / (time1 + time2));
|
||||
printf("\n[%s] CtxLimit:%d/%d, Amt:%d/%d, Init:%.2fs, Process:%.2fs (%.1fms/T = %.2fT/s), Generate:%.2fs (%.1fms/T = %.2fT/s), Total:%.2fs (%.2fT/s)",get_timestamp_str().c_str(),(int)current_context_tokens.size(),(int)nctx, realnpredict, kcpp_data->n_predict, time0, time1, pt1, ts1, time2, pt2, ts2, (time1 + time2), tokens_per_second);
|
||||
if(debugmode==1 && !is_quiet && (draft_successes+draft_failures)>0)
|
||||
{
|
||||
printf("\n(Draft Results - Success:%d, Failure:%d)",draft_successes,draft_failures);
|
||||
}
|
||||
fflush(stdout);
|
||||
output.status = 1;
|
||||
int finaltokcount = (int)current_context_tokens.size()-realnpredict;
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue