remove token_embd from metal mem

2025-09-10 17:34:49 +00:00 · 2025-01-23 16:58:25 +04:00 · 2025-01-23 16:58:25 +04:00 · fb05f80f89
commit fb05f80f89
parent 92f00303d5
1 changed file with 1 addition and 1 deletion
--- a/src/llama.cpp
+++ b/src/llama.cpp
@@ -5260,7 +5260,7 @@ struct llama_model_loader {
                try {
                    const char * tname = ggml_get_name(tensor);
                    if (keep_only_inp_out && !(
-                            strcmp(tname, "token_embd.weight") == 0 || 
+                            // strcmp(tname, "token_embd.weight") == 0 || // lookup table is used so we do not need to keep it in metal memory
                            strcmp(tname, "output_norm.weight") == 0 || 
                            strcmp(tname, "output.weight") == 0)) {
                        continue;