fixed segfault with all non-gguf models

2025-09-13 02:19:41 +00:00 · 2023-11-20 22:31:56 +08:00 · 2023-11-20 22:31:56 +08:00 · dc4078c039
commit dc4078c039
parent cf646fa809
8 changed files with 48 additions and 73 deletions
--- a/otherarch/gpt2_v3.cpp
+++ b/otherarch/gpt2_v3.cpp
@@ -455,7 +455,7 @@ bool gpt2_eval(


    struct ggml_context * ctx0 = ggml_init(params);
-    struct ggml_cgraph gf = {};
+    struct ggml_cgraph * gf = ggml_new_graph(ctx0);

    struct ggml_tensor * embd = ggml_new_tensor_1d(ctx0, GGML_TYPE_I32, N);
    memcpy(embd->data, embd_inp.data(), N*ggml_element_size(embd));
@@ -521,8 +521,8 @@ bool gpt2_eval(
                struct ggml_tensor * k = ggml_view_1d(ctx0, model.memory_k, N*n_embd, (ggml_element_size(model.memory_k)*n_embd)*(il*n_ctx + n_past));
                struct ggml_tensor * v = ggml_view_1d(ctx0, model.memory_v, N*n_embd, (ggml_element_size(model.memory_v)*n_embd)*(il*n_ctx + n_past));

-                ggml_build_forward_expand(&gf, ggml_cpy(ctx0, Kcur, k));
-                ggml_build_forward_expand(&gf, ggml_cpy(ctx0, Vcur, v));
+                ggml_build_forward_expand(gf, ggml_cpy(ctx0, Kcur, k));
+                ggml_build_forward_expand(gf, ggml_cpy(ctx0, Vcur, v));
            }

            // Q = Qcur.contiguous().view(n_embd/n_head, n_head, N).permute(0, 2, 1, 3)
@@ -715,8 +715,8 @@ bool gpt2_eval(
    //inpL = ggml_soft_max_inplace(ctx0, inpL);

    // run the computation
-    ggml_build_forward_expand(&gf, inpL);
-    kcpp_graph_compute_helper(&gf, n_threads);
+    ggml_build_forward_expand(gf, inpL);
+    kcpp_graph_compute_helper(gf, n_threads);

    //if (n_past%100 == 0) {
    //    ggml_graph_print   (&gf);