fixes for vulkan multigpu

This commit is contained in:
Concedo 2024-02-09 14:42:27 +08:00
parent fe424a5466
commit 992eea71d7
3 changed files with 34 additions and 18 deletions

View file

@ -961,7 +961,12 @@ ModelLoadResult gpttype_load_model(const load_model_inputs inputs, FileFormat in
}
#endif
model_params.main_gpu = cu_parseinfo_maindevice;
#if defined(GGML_USE_CUBLAS)
model_params.split_mode = llama_split_mode::LLAMA_SPLIT_ROW;
#else
model_params.split_mode = llama_split_mode::LLAMA_SPLIT_LAYER;
#endif
llama_ctx_params.n_batch = kcpp_params->n_batch;
llama_ctx_params.n_threads = kcpp_params->n_threads;