reinstated the q4_3 format, for backwards compatibility.

This commit is contained in:
Concedo 2023-04-29 11:42:04 +08:00
parent 0fc1772a8f
commit bb282a4ecf
12 changed files with 364 additions and 26 deletions

View file

@@ -377,7 +377,7 @@ generation_outputs gpttype_generate(const generation_inputs inputs, generation_o
}
params.n_batch = bbs; //received reports of 1024 and above crashing on some models
-if(!ggml_cpu_has_cublas())
+if(!ggml_cpu_has_gpublas())
{
params.n_threads = 1; //do not limit here anymore.
}