fix for physical batch size

2025-09-10 17:14:36 +00:00 · 2024-03-15 16:45:20 +08:00 · 2024-03-15 16:45:20 +08:00 · 2ef03c9de6
commit 2ef03c9de6
parent 93d3871056
1 changed file with 4 additions and 0 deletions
--- a/gpttype_adapter.cpp
+++ b/gpttype_adapter.cpp
@@ -748,6 +748,10 @@ ModelLoadResult gpttype_load_model(const load_model_inputs inputs, FileFormat in
    kcpp_params->n_threads_batch = inputs.blasthreads;
    bool isGguf = (file_format == FileFormat::GGUF_GENERIC);
    kcpp_params->n_batch = GetBatchSize(inputs.blasbatchsize, in_file_format);
+    if(kcpp_params->n_batch>512)
+    {
+        kcpp_params->n_ubatch = (kcpp_params->n_batch>1024?1024:kcpp_params->n_batch);
+    }
    modelname = kcpp_params->model = inputs.model_filename;
    useSmartContext = inputs.use_smartcontext;
    useContextShift = inputs.use_contextshift;