llama : remove KV cache defragmentation logic (#15473)

ggml-ci
2025-09-13 02:19:41 +00:00 · 2025-08-22 12:22:13 +03:00 · 2025-08-22 12:22:13 +03:00 · 9ebebef62f
commit 9ebebef62f
parent ad5c975c2d
16 changed files with 32 additions and 440 deletions
--- a/common/arg.cpp
+++ b/common/arg.cpp
@@ -2254,9 +2254,11 @@ common_params_context common_params_parser_init(common_params & params, llama_ex
    ).set_examples({LLAMA_EXAMPLE_PERPLEXITY}));
    add_opt(common_arg(
        {"-dt", "--defrag-thold"}, "N",
-        string_format("KV cache defragmentation threshold (default: %.1f, < 0 - disabled)", (double)params.defrag_thold),
+        string_format("KV cache defragmentation threshold (DEPRECATED)"),
        [](common_params & params, const std::string & value) {
-            params.defrag_thold = std::stof(value);
+            GGML_UNUSED(params);
+            GGML_UNUSED(value);
+            LOG_WRN("DEPRECATED: --defrag-thold is deprecated and no longer necessary to specify\n");
        }
    ).set_env("LLAMA_ARG_DEFRAG_THOLD"));
    add_opt(common_arg(