Merge branch 'upstream' into concedo_experimental

# Conflicts:
#	.github/workflows/build.yml
#	CMakeLists.txt
#	README.md
#	ci/run.sh
#	llama.cpp
#	models/ggml-vocab-llama-bpe.gguf.inp
#	models/ggml-vocab-llama-bpe.gguf.out
#	requirements.txt
#	scripts/compare-llama-bench.py
#	scripts/sync-ggml.last
#	tests/CMakeLists.txt
#	tests/test-backend-ops.cpp
#	tests/test-grammar-integration.cpp
#	tests/test-tokenizer-1-bpe.cpp
2025-09-11 09:34:37 +00:00 · 2024-05-14 19:28:47 +08:00 · 2024-05-14 19:28:47 +08:00 · 2ee808a747
commit 2ee808a747
parent 5d15f8f76a 541600201e
66 changed files with 3034 additions and 1821 deletions
--- a/common/sampling.h
+++ b/common/sampling.h
@@ -82,7 +82,7 @@ struct llama_sampling_context {
    // TODO: replace with ring-buffer
    std::vector<llama_token>      prev;
    std::vector<llama_token_data> cur;
-    size_t n_considered;
+    size_t n_valid; // Number of correct top tokens with correct probabilities.

    std::mt19937 rng;
 };