From 35284bcdb5c4069001cc7c50aad75c67e37ae6a5 Mon Sep 17 00:00:00 2001 From: Concedo <39025047+LostRuins@users.noreply.github.com> Date: Tue, 13 May 2025 17:03:24 +0800 Subject: [PATCH] glm4 clamp 8 on vk --- gpttype_adapter.cpp | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/gpttype_adapter.cpp b/gpttype_adapter.cpp index 735aa59e3..705996e31 100644 --- a/gpttype_adapter.cpp +++ b/gpttype_adapter.cpp @@ -1942,8 +1942,8 @@ ModelLoadResult gpttype_load_model(const load_model_inputs inputs, FileFormat in { printf("GLM-4 is broken on larger batch sizes in Vulkan. Clamp ignored in debug.\n"); } else { - printf("GLM-4 is broken on larger batch sizes in Vulkan. Clamping ubatch size to 16.\n"); - kcpp_data->n_ubatch = 16; + printf("GLM-4 is broken on larger batch sizes in Vulkan. Clamping ubatch size to 8.\n"); + kcpp_data->n_ubatch = 8; } } #endif