Merge branch 'master' into concedo_experimental

# Conflicts: # CMakeLists.txt # Makefile # README.md # ggml.c
2025-09-12 01:54:37 +00:00 · 2023-04-29 11:14:05 +08:00 · 2023-04-29 11:14:05 +08:00 · 0fc1772a8f
commit 0fc1772a8f
parent 67ee2b93a7 7fc50c051a
25 changed files with 1156 additions and 740 deletions
--- a/llama_util.h
+++ b/llama_util.h
@@ -405,4 +405,30 @@ struct llama_buffer {
        delete[] addr;
    }
 };
+
+#ifdef GGML_USE_CUBLAS
+#include "ggml-cuda.h"
+// Owning wrapper around a host buffer obtained from ggml_cuda_host_malloc()
+// and released with ggml_cuda_host_free().
+// NOTE(review): presumably this is pinned (page-locked) host memory -- confirm
+// against ggml-cuda.h.
+//
+// The buffer has exactly one owner: copying is disabled because two objects
+// sharing the same `addr` would both free it in their destructors. Ownership
+// can still be transferred explicitly with std::move.
+struct llama_ctx_buffer {
+    uint8_t * addr = NULL; // start of the allocation, NULL while empty
+    size_t size = 0;       // size in bytes requested by the last resize()
+
+    llama_ctx_buffer() = default;
+
+    // Non-copyable: a copy would lead to a double free of `addr`.
+    llama_ctx_buffer(const llama_ctx_buffer &) = delete;
+    llama_ctx_buffer & operator=(const llama_ctx_buffer &) = delete;
+
+    // Move construction steals the allocation and leaves `other` empty.
+    llama_ctx_buffer(llama_ctx_buffer && other) noexcept
+        : addr(other.addr), size(other.size) {
+        other.addr = NULL;
+        other.size = 0;
+    }
+
+    // Move assignment frees the current allocation (if any) before taking
+    // over the one held by `other`.
+    llama_ctx_buffer & operator=(llama_ctx_buffer && other) noexcept {
+        if (this != &other) {
+            release();
+            addr = other.addr;
+            size = other.size;
+            other.addr = NULL;
+            other.size = 0;
+        }
+        return *this;
+    }
+
+    // Discards the current allocation and requests a fresh one of `size`
+    // bytes. The previous contents are NOT preserved.
+    // NOTE(review): the result of ggml_cuda_host_malloc() is not checked here;
+    // if it can return NULL, `addr` is NULL while `size` still holds the
+    // requested value -- callers must be prepared for that.
+    void resize(size_t size) {
+        release();
+        addr = (uint8_t *) ggml_cuda_host_malloc(size);
+        this->size = size;
+    }
+
+    ~llama_ctx_buffer() {
+        release();
+    }
+
+private:
+    // Frees the allocation, if any, and resets the object to the empty state.
+    void release() {
+        if (addr) {
+            ggml_cuda_host_free(addr);
+            addr = NULL;
+        }
+        size = 0;
+    }
+};
+#else
+// Without cuBLAS support the context buffer is simply a llama_buffer.
+typedef llama_buffer llama_ctx_buffer;
+#endif
+
+
 #endif