Merge branch 'upstream' into concedo_experimental

# Conflicts:
#	CODEOWNERS
#	common/CMakeLists.txt
#	ggml/CMakeLists.txt
#	ggml/src/ggml-webgpu/ggml-webgpu-shader-lib.hpp
#	ggml/src/ggml-webgpu/ggml-webgpu.cpp
#	ggml/src/ggml-webgpu/wgsl-shaders/common_decls.tmpl
#	ggml/src/ggml-webgpu/wgsl-shaders/mul_mat_vec.wgsl
#	scripts/sync-ggml.last
#	tools/cli/cli.cpp
#	tools/llama-bench/llama-bench.cpp
#	tools/perplexity/perplexity.cpp
2026-05-17 04:09:19 +00:00 · 2026-04-21 18:53:03 +08:00 · 2026-04-21 18:53:03 +08:00 · 19a12bb080
commit 19a12bb080
parent 1feba4e4ea 82209efb7e
31 changed files with 1594 additions and 1172 deletions
--- a/common/common.cpp
+++ b/common/common.cpp
@@ -3,6 +3,7 @@

 #include "build-info.h"
 #include "common.h"
+#include "fit.h"
 #include "log.h"
 #include "log.cpp"
 // Change JSON_ASSERT from assert() to GGML_ASSERT:
@@ -1153,7 +1154,7 @@ common_init_result::common_init_result(common_params & params) :

    if (params.fit_params) {
        LOG_INF("%s: fitting params to device memory, for bugs during this step try to reproduce them with -fit off, or provide --verbose logs if the bug only occurs with -fit on\n", __func__);
-        llama_params_fit(params.model.path.c_str(), &mparams, &cparams,
+        common_fit_params(params.model.path.c_str(), &mparams, &cparams,
            params.tensor_split,
            params.tensor_buft_overrides.data(),
            params.fit_params_target.data(),