mirror of
https://github.com/LostRuins/koboldcpp.git
synced 2025-09-10 17:14:36 +00:00
improve model estimation
This commit is contained in:
parent
5d7c5e9e33
commit
0954e9e476
1 changed file with 2 additions and 2 deletions
|
@ -884,9 +884,9 @@ def autoset_gpu_layers(ctxsize,sdquanted,bbs): #shitty algo to determine how man
|
|||
elif modelfile_extracted_meta[2] > 1024*1024*512: #normal sd tax
|
||||
mem -= 1024*1024*1024*(3.25 if sdquanted else 4.25)
|
||||
if modelfile_extracted_meta[3] > 1024*1024*10: #whisper tax
|
||||
mem -= 350*1024*1024
|
||||
mem -= max(350*1024*1024,modelfile_extracted_meta[3]*1.5)
|
||||
if modelfile_extracted_meta[4] > 1024*1024*10: #mmproj tax
|
||||
mem -= 350*1024*1024
|
||||
mem -= max(350*1024*1024,modelfile_extracted_meta[4]*1.5)
|
||||
if modelfile_extracted_meta[5] > 1024*1024*10: #draft model tax
|
||||
mem -= (modelfile_extracted_meta[5] * 1.5)
|
||||
if modelfile_extracted_meta[6] > 1024*1024*10: #tts model tax
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue