fix: args in speculative

This commit is contained in:
DeEMO 2025-06-30 04:35:59 +00:00
parent 9bf6565df4
commit b4929d510a
3 changed files with 19 additions and 6 deletions

View file

@@ -169,7 +169,7 @@ int main(int argc, char ** argv) {
const auto t_enc_end = ggml_time_us();
// how many tokens to draft each time
-int n_draft = params.n_draft;
+int n_draft = params.speculative.n_max;
int n_predict = 0;
int n_drafted = 0;