Merge commit '451ef08432' into concedo_experimental

# Conflicts:
#	.github/workflows/build.yml
#	README.md
#	docs/ops.md
#	docs/ops/Vulkan.csv
#	src/llama-model-loader.cpp
#	src/llama-model.cpp
#	src/llama.cpp
#	tests/CMakeLists.txt
#	tests/peg-parser/test-basic.cpp
#	tests/peg-parser/test-json-parser.cpp
#	tests/peg-parser/test-python-dict-parser.cpp
#	tests/peg-parser/test-unicode.cpp
#	tests/test-chat-auto-parser.cpp
#	tests/test-chat-peg-parser.cpp
#	tests/test-chat.cpp
#	tools/CMakeLists.txt
2026-05-20 09:25:53 +00:00 · 2026-03-13 23:33:37 +08:00 · 2026-03-13 23:33:37 +08:00 · 04915d99ee
commit 04915d99ee
parent d2c911884d 451ef08432
36 changed files with 1001 additions and 725 deletions
--- a/src/llama-context.cpp
+++ b/src/llama-context.cpp
@@ -1168,6 +1168,7 @@ llm_graph_result * llama_context::process_ubatch(const llama_ubatch & ubatch, ll
    {
        //const auto t_start_us = ggml_time_us();

+        // FIXME this call causes a crash if any model inputs were not used in the graph and were therefore not allocated
        res->set_inputs(&ubatch);

        //LLAMA_LOG_INFO("graph set inputs time: %.3f ms\n", (ggml_time_us() - t_start_us)/1000.0);