count model flops for f32xf32, f16xf32, q4kxf32, q6kxf32

This commit is contained in:
Lizonghang 2024-11-24 13:13:32 +04:00
parent a5ba34169a
commit 3fe00a16a0
4 changed files with 188 additions and 119 deletions

View file

@@ -528,7 +528,8 @@ extern "C" {
LLAMA_API void llama_model_n_flops(
struct llama_model * model,
struct llama_model_loader * ml,
- struct model_flops * ffo,
+ struct model_flops * n_flops,
+ struct model_params * n_params,
const int64_t n_input,
const int64_t n_history);