trying out mmq

Merge branch 'master' into concedo_experimental

# Conflicts:
#	CMakeLists.txt
#	README.md
This commit is contained in:
Concedo 2023-07-31 22:51:15 +08:00
commit e221843147
10 changed files with 61 additions and 22 deletions

View file

@@ -466,6 +466,7 @@ ModelLoadResult gpttype_load_model(const load_model_inputs inputs, FileFormat in
llama_ctx_params.seed = -1;
llama_ctx_params.f16_kv = inputs.f16_kv;
llama_ctx_params.low_vram = inputs.low_vram;
llama_ctx_params.mul_mat_q = true;
llama_ctx_params.logits_all = false;
llama_ctx_params.use_mmap = inputs.use_mmap;
llama_ctx_params.use_mlock = inputs.use_mlock;