diff --git a/koboldcpp.py b/koboldcpp.py index 00b383c9b..03ca983d4 100755 --- a/koboldcpp.py +++ b/koboldcpp.py @@ -1495,7 +1495,7 @@ def load_model(model_filename): inputs.quant_k = inputs.quant_v = 0 inputs.batchsize = args.batchsize inputs.autofit = args.autofit - inputs.autofit_tax_mb = calulated_gpu_overhead + inputs.autofit_tax_mb = int(calulated_gpu_overhead) inputs.gpulayers = args.gpulayers if args.overridenativecontext and args.overridenativecontext>0: inputs.overridenativecontext = args.overridenativecontext