Merge branch 'master' into concedo_experimental

# Conflicts:
#	CMakeLists.txt
#	Makefile
#	README.md
#	pocs/vdot/vdot.cpp
#	scripts/verify-checksum-models.py
#	tests/test-quantize-fns.cpp
#	tests/test-quantize-perf.cpp
#	tests/test-sampling.cpp
#	tests/test-tokenizer-0.cpp
2026-05-09 19:46:11 +00:00 · 2023-06-17 20:02:32 +08:00 · 2023-06-17 20:02:32 +08:00 · 9f8e2f8a18
commit 9f8e2f8a18
parent 795b35546b 794db3e7b9
25 changed files with 1829 additions and 1252 deletions
--- a/llama.cpp
+++ b/llama.cpp
@@ -40,6 +40,10 @@
 #include <sstream>
 #include <numeric>

+#if defined(_MSC_VER)
+#pragma warning(disable: 4244 4267) // possible loss of data
+#endif
+
 #define LLAMA_USE_SCRATCH
 #define LLAMA_MAX_SCRATCH_BUFFERS 16

@@ -1654,7 +1658,7 @@ static bool llama_eval_internal(

        // cur = cur*norm(broadcasted)
        cur = ggml_mul(ctx0, cur, model.norm);
-        offload_func_nr(cur);
+        // offload_func_nr(cur); // TODO CPU + GPU mirrored backend
        ggml_set_name(cur, "result_norm");

        embeddings = cur;