Merge branch 'master' into concedo_experimental

# Conflicts:
#	.flake8
#	.github/workflows/python-lint.yml
#	flake.lock
#	ggml-cuda.cu
#	ggml-quants.c
#	llama.cpp
#	pocs/vdot/q8dot.cpp
#	pocs/vdot/vdot.cpp
#	tests/test-quantize-fns.cpp
#	tests/test-quantize-perf.cpp
2025-09-10 17:14:36 +00:00 · 2024-02-13 00:14:22 +08:00 · 2024-02-13 00:14:22 +08:00 · 3cec37c2e0
commit 3cec37c2e0
parent fdc54efcf0 43fe07c1a4
35 changed files with 2814 additions and 1749 deletions
--- a/examples/embedding/embedding.cpp
+++ b/examples/embedding/embedding.cpp
@@ -88,7 +88,17 @@ int main(int argc, char ** argv) {
    }

    const int n_embd = llama_n_embd(model);
-    const auto * embeddings = llama_get_embeddings(ctx);
+    auto * embeddings = llama_get_embeddings(ctx);
+
+    // l2-normalize embeddings
+    float norm = 0;
+    for (int i = 0; i < n_embd; i++) {
+        norm += embeddings[i] * embeddings[i];
+    }
+    norm = sqrt(norm);
+    for (int i = 0; i < n_embd; i++) {
+        embeddings[i] /= norm;
+    }

    for (int i = 0; i < n_embd; i++) {
        printf("%f ", embeddings[i]);