reduce batch sizes and skip all intrinsic flags except AVX when building in compatibility mode.

2025-09-10 09:04:36 +00:00 · 2023-04-13 11:32:05 +08:00 · 2023-04-13 11:32:05 +08:00 · 5c22f7e4c4
commit 5c22f7e4c4
parent f4257a8eef
3 changed files with 9 additions and 4 deletions
--- a/gpttype_adapter.cpp
+++ b/gpttype_adapter.cpp
@@ -224,7 +224,7 @@ generation_outputs gpttype_generate(const generation_inputs inputs, generation_o
    int original_threads = params.n_threads;
    if (blasmode)
    {
-        params.n_batch = 1024;
+        params.n_batch = 512; //received reports of 1024 and above crashing on some models
        params.n_threads = 1;
    }