Merge commit '2b6dfe824d' into concedo_experimental

# Conflicts:
#	.github/workflows/release.yml
#	examples/save-load-state/save-load-state.cpp
#	src/llama-context.cpp
#	tools/cli/cli.cpp
2026-05-08 09:59:50 +00:00 · 2026-02-26 15:07:23 +08:00 · 2026-02-26 15:07:23 +08:00 · 7e53bfd28d
commit 7e53bfd28d
parent d400b37215 2b6dfe824d
17 changed files with 258 additions and 194 deletions
--- a/src/llama-model.cpp
+++ b/src/llama-model.cpp
@@ -1816,8 +1816,8 @@ void llama_model::load_hparams(llama_model_loader & ml) {
            } break;
        case LLM_ARCH_DEEPSEEK2:
            {
-                // lite variants include DeepSeek-V2-Lite, GigaChat3-10B-A1.8B
-                const bool is_lite = (hparams.n_layer == 27 || hparams.n_layer == 26);
+                // lite variants include DeepSeek-V2-Lite, GigaChat3-10B-A1.8B, Kanana-2-30B-A3B
+                const bool is_lite = (hparams.n_layer == 27 || hparams.n_layer == 26 || (hparams.n_layer == 48 && n_vocab == 128256));

                ml.get_key(LLM_KV_ATTENTION_LAYERNORM_RMS_EPS, hparams.f_norm_rms_eps);
                ml.get_key(LLM_KV_LEADING_DENSE_BLOCK_COUNT,   hparams.n_layer_dense_lead);