Merge branch 'upstream' into concedo_experimental

# Conflicts:
#	.devops/llama-server.Dockerfile
#	README.md
#	flake.lock
#	ggml/src/ggml-vulkan.cpp
#	ggml/src/vulkan-shaders/concat.comp
#	ggml/src/vulkan-shaders/pad.comp
#	ggml/src/vulkan-shaders/vulkan-shaders-gen.cpp
#	scripts/sync-ggml-am.sh
#	scripts/sync-ggml.last
#	src/llama.cpp
#	tests/test-backend-ops.cpp
2025-09-11 01:24:36 +00:00 · 2024-08-06 16:33:26 +08:00 · 2024-08-06 16:33:26 +08:00 · e1f97f7fb5
commit e1f97f7fb5
parent 6b8b50b350 2d5dd7bb3f
55 changed files with 112612 additions and 111077 deletions
--- a/examples/main/main.cpp
+++ b/examples/main/main.cpp
@@ -208,7 +208,10 @@ int main(int argc, char ** argv) {

    // load the model and apply lora adapter, if any
    LOG("%s: load the model and apply lora adapter, if any\n", __func__);
-    std::tie(model, ctx) = llama_init_from_gpt_params(params);
+    llama_init_result llama_init = llama_init_from_gpt_params(params);
+
+    model = llama_init.model;
+    ctx = llama_init.context;
    if (sparams.cfg_scale > 1.f) {
        struct llama_context_params lparams = llama_context_params_from_gpt_params(params);
        ctx_guidance = llama_new_context_with_model(model, lparams);