Merge branch 'upstream' into concedo_experimental

# Conflicts:
#   .devops/llama-server-cuda.Dockerfile
#   .devops/llama-server-rocm.Dockerfile
#   .devops/llama-server-vulkan.Dockerfile
#   .devops/llama-server.Dockerfile
#   .github/workflows/docker.yml
#   README.md
#   llama.cpp
#   tests/test-chat-template.cpp
#   tests/test-grammar-integration.cpp
#   tests/test-json-schema-to-grammar.cpp
#   tests/test-llama-grammar.cpp
2025-09-11 01:24:36 +00:00 · 2024-06-26 18:59:10 +08:00 · 2024-06-26 18:59:10 +08:00 · f3dfa96dbc
commit f3dfa96dbc
parent 24bfa54f3c 8854044561
29 changed files with 2097 additions and 431 deletions
--- a/examples/server/server.cpp
+++ b/examples/server/server.cpp
@@ -2607,17 +2607,9 @@ int main(int argc, char ** argv) {

    // print sample chat example to make it clear which template is used
    {
-        json chat;
-        chat.push_back({{"role", "system"},    {"content", "You are a helpful assistant"}});
-        chat.push_back({{"role", "user"},      {"content", "Hello"}});
-        chat.push_back({{"role", "assistant"}, {"content", "Hi there"}});
-        chat.push_back({{"role", "user"},      {"content", "How are you?"}});
-
-        const std::string chat_example = format_chat(ctx_server.model, params.chat_template, chat);
-
        LOG_INFO("chat template", {
-            {"chat_example", chat_example},
-            {"built_in", params.chat_template.empty()},
+            {"chat_example", llama_chat_format_example(ctx_server.model, params.chat_template)},
+            {"built_in",     params.chat_template.empty()},
        });
    }