Merge branch 'upstream' into concedo_experimental

# Conflicts: # .devops/cpu.Dockerfile # .devops/cuda.Dockerfile # .devops/intel.Dockerfile # .devops/llama-cli-cann.Dockerfile # .devops/musa.Dockerfile # .devops/rocm.Dockerfile # .devops/vulkan.Dockerfile # examples/llama-bench/llama-bench.cpp # examples/rpc/rpc-server.cpp # scripts/compare-llama-bench.py # tests/test-quantize-stats.cpp
2025-09-13 18:39:48 +00:00 · 2025-04-30 17:22:18 +08:00 · 2025-04-30 17:22:18 +08:00 · 8273739412
commit 8273739412
parent 5d382970ec 5933e6fdc9
9 changed files with 210 additions and 98 deletions
--- a/include/llama.h
+++ b/include/llama.h
@ -1234,6 +1234,7 @@ extern "C" {
        "will be removed in the future (see https://github.com/ggml-org/llama.cpp/pull/9896#discussion_r1800920915)");

    /// @details Top-K sampling described in academic paper "The Curious Case of Neural Text Degeneration" https://arxiv.org/abs/1904.09751
+    /// Setting k <= 0 makes this a noop
    LLAMA_API struct llama_sampler * llama_sampler_init_top_k      (int32_t k);

    /// @details Nucleus sampling described in academic paper "The Curious Case of Neural Text Degeneration" https://arxiv.org/abs/1904.09751