llama-bench: print -n-cpu-moe when offloaded layers > 1 (#20984)

2026-05-19 08:00:25 +00:00 · 2026-03-25 21:17:27 +08:00 · 2026-03-25 21:17:27 +08:00 · 9c600bcd4b
commit 9c600bcd4b
parent b2704f9028
1 changed file with 1 addition and 1 deletion
--- a/tools/llama-bench/llama-bench.cpp
+++ b/tools/llama-bench/llama-bench.cpp
@@ -1807,7 +1807,7 @@ struct markdown_printer : public printer {
        if (!is_cpu_backend) {
            fields.emplace_back("n_gpu_layers");
        }
-        if (params.n_cpu_moe.size() > 1) {
+        if (params.n_cpu_moe.size() > 1 || params.n_cpu_moe != cmd_params_defaults.n_cpu_moe) {
            fields.emplace_back("n_cpu_moe");
        }
        if (params.n_threads.size() > 1 || params.n_threads != cmd_params_defaults.n_threads || is_cpu_backend) {