fix: add warm-up run before timed profiling to exclude init delay from measurements

2025-09-10 03:24:35 +00:00 · 2025-06-03 17:10:09 +04:00 · 2025-06-03 17:10:09 +04:00 · 1b3b6a506f
commit 1b3b6a506f
parent b30f749e5e
2 changed files with 9 additions and 6 deletions
--- a/common/profiler.cpp
+++ b/common/profiler.cpp
@@ -439,7 +439,7 @@ float device_inp_embd_delay(struct llama_model * model, enum ggml_type src0t, in
    }

    // warm-up
-    // ggml_backend_graph_compute(backend, gf);
+    ggml_backend_graph_compute(backend, gf);

    const int64_t t_start = ggml_time_us();
    ggml_backend_graph_compute(backend, gf);
@@ -1288,6 +1288,9 @@ static float device_mem_copy(struct llama_model * model, enum profiler_backend_t
        ggml_backend_cpu_set_n_threads(backend, n_threads);
    }

+    // warm-up
+    ggml_backend_graph_compute(backend, gf);
+
    const int64_t t_start = ggml_time_us();
    ggml_backend_graph_compute(backend, gf);
    const int64_t t_end = ggml_time_us();