mirror of
https://github.com/LostRuins/koboldcpp.git
synced 2026-05-10 12:11:08 +00:00
move pipeline parallelism to a --pipelineparallel launch flag
This commit is contained in:
parent
b7428048fc
commit
fd0d0cab03
5 changed files with 20 additions and 3 deletions
|
|
@@ -662,8 +662,8 @@ static bool ggml_is_view_op(enum ggml_op op) {
|
|||
#endif
|
||||
|
||||
#ifndef GGML_SCHED_MAX_COPIES
|
||||
//kcpp reduced from 4 to 2 to try make buffer sizes smaller on multigpu
|
||||
#define GGML_SCHED_MAX_COPIES 2
|
||||
//kcpp can reduce this if you want to try make buffer sizes smaller on multigpu
|
||||
#define GGML_SCHED_MAX_COPIES 4
|
||||
#endif
|
||||
|
||||
struct ggml_backend_sched_split {
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue