llama_profile_device: add arg n_predict

This commit is contained in:
Lizonghang 2024-12-06 16:37:25 +04:00
parent a46d56cc60
commit cd823546dd
3 changed files with 4 additions and 3 deletions

View file

@@ -896,7 +896,7 @@ struct llama_init_result llama_init_from_gpt_params(gpt_params & params) {
device_info dev_info;
dev_info.rank = params.rank;
-llama_profile_device(&dev_info, model, ml, params.cpuparams.n_threads);
+llama_profile_device(&dev_info, model, ml, params.n_predict, params.cpuparams.n_threads);
// create llama context
struct llama_context_params cparams = llama_context_params_from_gpt_params(params);