From 21f0ce2502b36868d3ce3703f30b626b3d6f5b38 Mon Sep 17 00:00:00 2001
From: Concedo <39025047+LostRuins@users.noreply.github.com>
Date: Sat, 20 Jan 2024 11:30:22 +0800
Subject: [PATCH] do not use vmm for ggml v3

---
 otherarch/ggml_v3-cuda.cu | 12 ++----------
 1 file changed, 2 insertions(+), 10 deletions(-)

diff --git a/otherarch/ggml_v3-cuda.cu b/otherarch/ggml_v3-cuda.cu
index 0447499f3..90f8e8c12 100644
--- a/otherarch/ggml_v3-cuda.cu
+++ b/otherarch/ggml_v3-cuda.cu
@@ -7434,19 +7434,11 @@ static void ggml_v3_cuda_pool_free_vmm(int device, void * ptr, size_t size) {
 }
 
 static void * ggml_v3_cuda_pool_malloc(int device, size_t size, size_t * actual_size) {
-    if (g_device_caps[device].vmm) {
-        return ggml_v3_cuda_pool_malloc_vmm(device, size, actual_size);
-    } else {
-        return ggml_v3_cuda_pool_malloc_leg(device, size, actual_size);
-    }
+    return ggml_v3_cuda_pool_malloc_leg(device, size, actual_size);
 }
 
 static void ggml_v3_cuda_pool_free(int device, void * ptr, size_t size) {
-    if (g_device_caps[device].vmm) {
-        ggml_v3_cuda_pool_free_vmm(device, ptr, size);
-    } else {
-        ggml_v3_cuda_pool_free_leg(device, ptr, size);
-    }
+    ggml_v3_cuda_pool_free_leg(device, ptr, size);
 }
 #else
 #define ggml_v3_cuda_pool_malloc ggml_v3_cuda_pool_malloc_leg