diff --git a/koboldcpp.py b/koboldcpp.py index fc22664f3..e3bddbb21 100755 --- a/koboldcpp.py +++ b/koboldcpp.py @@ -1632,7 +1632,7 @@ def load_model(model_filename): sclimit = (savestate_limit_default if scint<=1 else scint) savestate_limit = sclimit inputs.smartcacheslots = sclimit - inputs.pipelineparallel = args.pipelineparallel + inputs.pipelineparallel = (not args.nopipelineparallel) inputs = set_backend_props(inputs) ret = handle.load_model(inputs) return ret @@ -6442,7 +6442,7 @@ def show_gui(): args.remotetunnel = remotetunnel_var.get()==1 args.foreground = keepforeground.get()==1 args.cli = terminalonly.get()==1 - args.pipelineparallel = pipelineparallel.get()==1 + args.nopipelineparallel = pipelineparallel.get()==0 args.quiet = quietmode.get()==1 args.nocertify = nocertifymode.get()==1 args.nomodel = nomodel.get()==1 @@ -6666,7 +6666,7 @@ def show_gui(): remotetunnel_var.set(1 if "remotetunnel" in dict and dict["remotetunnel"] else 0) keepforeground.set(1 if "foreground" in dict and dict["foreground"] else 0) terminalonly.set(1 if "cli" in dict and dict["cli"] else 0) - pipelineparallel.set(1 if "pipelineparallel" in dict and dict["pipelineparallel"] else 0) + pipelineparallel.set(0 if "nopipelineparallel" in dict and dict["nopipelineparallel"] else 1) quietmode.set(1 if "quiet" in dict and dict["quiet"] else 0) nocertifymode.set(1 if "nocertify" in dict and dict["nocertify"] else 0) nomodel.set(1 if "nomodel" in dict and dict["nomodel"] else 0) @@ -8788,7 +8788,7 @@ if __name__ == '__main__': compatgroup2.add_argument("--showgui", help="Always show the GUI instead of launching the model right away when loading settings from a .kcpps file.", action='store_true') compatgroup2.add_argument("--skiplauncher", help="Doesn't display or use the GUI launcher. Overrides showgui.", action='store_true') advparser.add_argument("--singleinstance", help="Allows this KoboldCpp instance to be shut down by any new instance requesting the same port, preventing duplicate servers from clashing on a port.", action='store_true') - advparser.add_argument("--pipelineparallel", help="Enable Pipeline Parallelism for faster multigpu speeds but using more memory, only active for multigpu.", action='store_true') + advparser.add_argument("--nopipelineparallel", help="Disable Pipeline Parallelism. Pipeline Parallelism provides faster multigpu speeds but using more memory, only active for multigpu.", action='store_true') advparser.add_argument("--gendefaults", metavar=('{"parameter":"value",...}'), help="Sets extra default parameters for some fields in API requests, as a JSON string.", default="") advparser.add_argument("--gendefaultsoverwrite", help="Allow the gendefaults parameters to overwrite the original value in API payloads.", action='store_true') advparser.add_argument("--mcpfile", metavar=('[mcp json file]'), help="Specify path to mcp.json which contains the Cladue Desktop compatible MCP server config.", default="") @@ -8849,6 +8849,7 @@ if __name__ == '__main__': deprecatedgroup.add_argument("--sdconfig", help=argparse.SUPPRESS, nargs='+') compatgroup.add_argument("--noblas", help=argparse.SUPPRESS, action='store_true') compatgroup3.add_argument("--nommap","--no-mmap", help=argparse.SUPPRESS, action='store_true') + deprecatedgroup.add_argument("--pipelineparallel", help=argparse.SUPPRESS, action='store_true') #changed to nopipelineparallel deprecatedgroup.add_argument("--sdnotile", help=argparse.SUPPRESS, action='store_true') # legacy option, see sdtiledvae deprecatedgroup.add_argument("--forceversion", help=argparse.SUPPRESS, action='store_true') #no longer used deprecatedgroup.add_argument("--sdgendefaults", help=argparse.SUPPRESS, action='store_true') # legacy option, see gendefaults