From 58d8635827401b7541f9be569525faa85a8962e6 Mon Sep 17 00:00:00 2001 From: Concedo <39025047+LostRuins@users.noreply.github.com> Date: Sun, 28 Dec 2025 23:15:06 +0800 Subject: [PATCH] fixed autofit --- koboldcpp.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/koboldcpp.py b/koboldcpp.py index 8148eb463..c67d9c74f 100755 --- a/koboldcpp.py +++ b/koboldcpp.py @@ -1504,7 +1504,7 @@ def load_model(model_filename): inputs.quant_k = inputs.quant_v = 0 inputs.batchsize = args.batchsize inputs.autofit = args.autofit - inputs.autofit_tax_mb = int(calulated_gpu_overhead) + inputs.autofit_tax_mb = int(calulated_gpu_overhead/(1024*1024)) inputs.gpulayers = args.gpulayers if args.overridenativecontext and args.overridenativecontext>0: inputs.overridenativecontext = args.overridenativecontext