From 1ca666f9c11cf97f3a8a9be90ae9b476858a6519 Mon Sep 17 00:00:00 2001 From: Concedo <39025047+LostRuins@users.noreply.github.com> Date: Fri, 18 Jul 2025 01:18:28 +0800 Subject: [PATCH] allow handling multipart files up to 999 --- koboldcpp.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/koboldcpp.py b/koboldcpp.py index aab86351c..b41e10655 100644 --- a/koboldcpp.py +++ b/koboldcpp.py @@ -63,7 +63,7 @@ dry_seq_break_max = 128 extra_images_max = 4 # global vars -KcppVersion = "1.96" +KcppVersion = "1.96.1" showdebug = True kcpp_instance = None #global running instance global_memory = {"tunnel_url": "", "restart_target":"", "input_to_exit":False, "load_complete":False, "restart_override_config_target":""} @@ -1116,7 +1116,7 @@ def autoset_gpu_layers(ctxsize, sdquanted, bbs, qkv_level): #shitty algo to dete match = re.search(r'-(\d{5})-of-(\d{5})\.', fname) if match: total_parts = int(match.group(2)) - if total_parts > 1 and total_parts <= 9: + if total_parts > 1 and total_parts <= 999: if showmultigpuwarning: showmultigpuwarning = False print("Multi-Part GGUF detected. Layer estimates may not be very accurate - recommend setting layers manually.") @@ -6335,7 +6335,7 @@ def download_model_from_url(url, permitted_types=[".gguf",".safetensors", ".ggml match = re.search(r'-(\d{5})-of-(\d{5})\.', url) if match: total_parts = int(match.group(2)) - if total_parts > 1 and total_parts <= 9: + if total_parts > 1 and total_parts <= 999: current_part = 1 base_url = url for part_num in range(current_part + 1, total_parts + 1):