diff --git a/koboldcpp.py b/koboldcpp.py index bcb6a67e0..19298bc8e 100644 --- a/koboldcpp.py +++ b/koboldcpp.py @@ -447,35 +447,29 @@ def set_backend_props(inputs): # otherwise the default will divide equally and multigpu crap will slow it down badly inputs.cublas_info = 0 + if args.usecublas: + os.environ["CUDA_DEVICE_ORDER"] = "PCI_BUS_ID" if not args.tensor_split: if (args.usecublas and "0" in args.usecublas): - os.environ["CUDA_DEVICE_ORDER"] = "PCI_BUS_ID" os.environ["CUDA_VISIBLE_DEVICES"] = "0" os.environ["HIP_VISIBLE_DEVICES"] = "0" elif (args.usecublas and "1" in args.usecublas): - os.environ["CUDA_DEVICE_ORDER"] = "PCI_BUS_ID" os.environ["CUDA_VISIBLE_DEVICES"] = "1" os.environ["HIP_VISIBLE_DEVICES"] = "1" elif (args.usecublas and "2" in args.usecublas): - os.environ["CUDA_DEVICE_ORDER"] = "PCI_BUS_ID" os.environ["CUDA_VISIBLE_DEVICES"] = "2" os.environ["HIP_VISIBLE_DEVICES"] = "2" elif (args.usecublas and "3" in args.usecublas): - os.environ["CUDA_DEVICE_ORDER"] = "PCI_BUS_ID" os.environ["CUDA_VISIBLE_DEVICES"] = "3" os.environ["HIP_VISIBLE_DEVICES"] = "3" else: if (args.usecublas and "0" in args.usecublas): - os.environ["CUDA_DEVICE_ORDER"] = "PCI_BUS_ID" inputs.cublas_info = 0 elif (args.usecublas and "1" in args.usecublas): - os.environ["CUDA_DEVICE_ORDER"] = "PCI_BUS_ID" inputs.cublas_info = 1 elif (args.usecublas and "2" in args.usecublas): - os.environ["CUDA_DEVICE_ORDER"] = "PCI_BUS_ID" inputs.cublas_info = 2 elif (args.usecublas and "3" in args.usecublas): - os.environ["CUDA_DEVICE_ORDER"] = "PCI_BUS_ID" inputs.cublas_info = 3 if args.usevulkan: #is an empty array if using vulkan without defined gpu