Merge commit '6986c7835a' into concedo_experimental

# Conflicts:
#	README.md
2025-09-10 17:14:36 +00:00 · 2023-05-20 11:30:51 +08:00 · 2023-05-20 11:30:51 +08:00 · 010b2753d9
commit 010b2753d9
parent 1225fab2ec 6986c7835a
11 changed files with 192 additions and 36 deletions
--- a/llama.cpp
+++ b/llama.cpp
@@ -829,10 +829,9 @@ static bool kv_cache_init(
 struct llama_context_params llama_context_default_params() {
    struct llama_context_params result = {
        /*.n_ctx                       =*/ 512,
-        /*.n_parts                     =*/ -1,
        /*.gpu_layers                  =*/ 0,
        /*.seed                        =*/ -1,
-        /*.f16_kv                      =*/ false,
+        /*.f16_kv                      =*/ true,
        /*.logits_all                  =*/ false,
        /*.vocab_only                  =*/ false,
        /*.use_mmap                    =*/ true,
@@ -965,7 +964,7 @@ static void llama_model_load_internal(
    size_t ctx_size;
    size_t mmapped_size;
    ml->calc_sizes(&ctx_size, &mmapped_size);
-    fprintf(stderr, "%s: ggml ctx size = %6.2f KB\n", __func__, ctx_size/1024.0);
+    fprintf(stderr, "%s: ggml ctx size = %6.2f MB\n", __func__, ctx_size/1024.0/1024.0);

    // print memory requirements
    {