Merge commit '32c8486e1f' into concedo_experimental

# Conflicts:
#	.devops/nix/package.nix
#	CMakeLists.txt
#	Makefile
#	Package.swift
#	README.md
#	build.zig
#	llama.cpp
#	tests/test-backend-ops.cpp
2025-09-11 09:34:37 +00:00 · 2024-04-07 20:39:17 +08:00 · 2024-04-07 20:39:17 +08:00 · 22f543d09b
commit 22f543d09b
parent a530afa1e4 32c8486e1f
32 changed files with 3521 additions and 1792 deletions
--- a/examples/imatrix/imatrix.cpp
+++ b/examples/imatrix/imatrix.cpp
@@ -425,6 +425,7 @@ static bool compute_imatrix(llama_context * ctx, const gpt_params & params, bool
                tokens[batch_start] = llama_token_bos(llama_get_model(ctx));
            }

+            // TODO: use batch.logits to save computations instead of relying on logits_all == true
            if (llama_decode(ctx, llama_batch_get_one(tokens.data() + batch_start, batch_size, j * n_batch, 0))) {
                fprintf(stderr, "%s : failed to eval\n", __func__);
                return false;