disable prefetch in standalone mode

2025-09-08 05:59:11 +00:00 · 2025-02-12 00:17:33 +04:00 · 2025-02-12 00:17:33 +04:00 · b163918b46
commit b163918b46
parent 6a50d494d2
1 changed file with 2 additions and 2 deletions
--- a/src/llama.cpp
+++ b/src/llama.cpp
@@ -18108,9 +18108,9 @@ static int llama_decode_internal(
                timer(manage_graph_tensors);
                
                int next_gf_id = (i + 1) % gf.size();
-                manage_graph_tensors(gf[next_gf_id], POSIX_MADV_WILLNEED, true);
+                manage_graph_tensors(gf[next_gf_id], POSIX_MADV_WILLNEED, n_world > 1);
                if (my_rank == 0 && (is_last_l || (next_gf_id == (int)gf.size() - 1))) {
-                    manage_graph_tensors(gf[0], POSIX_MADV_WILLNEED, true);
+                    manage_graph_tensors(gf[0], POSIX_MADV_WILLNEED, n_world > 1);
                }

                if (cparams.unload && n_world > 1) {