added more perf stats

This commit is contained in:
Concedo 2025-06-21 12:12:28 +08:00
parent ea21a9d749
commit 65ff041827
4 changed files with 39 additions and 2 deletions

View file

@ -59,6 +59,7 @@ bool generation_finished;
float last_process_time = 0;
float last_eval_time = 0;
int last_token_count = 0;
int last_input_count = 0;
int last_seed = -1;
int total_gens = 0;
int last_draft_success = 0;
@ -1596,7 +1597,7 @@ void sample_grammar(FileFormat file_format, int32_t n_vocab, llama_token_data_ar
for (auto reject: llama_grammar_reject_candidates(grammar->rules, grammar->stacks, candidates_grammar)) {
rejects[reject.index] = true;
}
auto first = candidates->data;
auto last = first + candidates->size;
last = std::remove_if(first, last,
@ -4318,6 +4319,7 @@ generation_outputs gpttype_generate(const generation_inputs inputs)
last_eval_time = pt2;
last_process_time = pt1;
last_token_count = realnpredict;
last_input_count = (finaltokcount<0?0:finaltokcount);
last_seed = kcpp_data->seed;
last_draft_failed = draft_failures;
last_draft_success = draft_successes;