diff --git a/src/llama.cpp b/src/llama.cpp
index aa497843..321855ca 100644
--- a/src/llama.cpp
+++ b/src/llama.cpp
@@ -4599,7 +4599,7 @@ namespace GGUFMeta {
 using llama_buf_map = std::unordered_map;
 
 static size_t llama_model_max_nodes(const llama_model & model) {
-    return std::max(16384, model.tensors_by_name.size()*5);
+    return std::max(8192, model.tensors_by_name.size()*5);
 }
 
 static int get_layer_id(const ggml_tensor * tensor) {