move pipeline parallelism to a --pipelineparallel launch flag

This commit is contained in:
Concedo 2025-12-11 21:03:41 +08:00
parent b7428048fc
commit fd0d0cab03
5 changed files with 20 additions and 3 deletions

View file

@@ -662,8 +662,8 @@ static bool ggml_is_view_op(enum ggml_op op) {
#endif
#ifndef GGML_SCHED_MAX_COPIES
-//kcpp reduced from 4 to 2 to try make buffer sizes smaller on multigpu
-#define GGML_SCHED_MAX_COPIES 2
+//kcpp can reduce this if you want to try make buffer sizes smaller on multigpu
+#define GGML_SCHED_MAX_COPIES 4
#endif
struct ggml_backend_sched_split {