mirror of
https://github.com/LostRuins/koboldcpp.git
synced 2025-09-10 09:04:36 +00:00
Reduce batch sizes and skip all intrinsic flags except AVX when building in compatibility mode.
This commit is contained in:
parent
f4257a8eef
commit
5c22f7e4c4
3 changed files with 9 additions and 4 deletions
|
@ -224,7 +224,7 @@ generation_outputs gpttype_generate(const generation_inputs inputs, generation_o
|
|||
int original_threads = params.n_threads;
|
||||
if (blasmode)
|
||||
{
|
||||
params.n_batch = 1024;
|
||||
params.n_batch = 512; //received reports of 1024 and above crashing on some models
|
||||
params.n_threads = 1;
|
||||
}
|
||||
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue