From 38d4d743bb10bc906f1c0673d81981ace59c597e Mon Sep 17 00:00:00 2001 From: Concedo <39025047+LostRuins@users.noreply.github.com> Date: Tue, 28 May 2024 18:25:00 +0800 Subject: [PATCH] add flash attn and quiet mode to quick launch --- koboldcpp.py | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/koboldcpp.py b/koboldcpp.py index 25182890c..4b61bad52 100644 --- a/koboldcpp.py +++ b/koboldcpp.py @@ -2076,11 +2076,13 @@ def show_new_gui(): # quick boxes - quick_boxes = {"Launch Browser": launchbrowser , "Disable MMAP":disablemmap,"Use ContextShift":contextshift,"Remote Tunnel":remotetunnel} + quick_boxes = {"Launch Browser": launchbrowser , "Disable MMAP":disablemmap,"Use ContextShift":contextshift,"Remote Tunnel":remotetunnel,"Use FlashAttention":flashattention,"Quiet Mode":quietmode} quick_boxes_desc = {"Launch Browser": "Launches your default browser after model loading is complete", "Disable MMAP":"Avoids using mmap to load models if enabled", "Use ContextShift":"Uses Context Shifting to reduce reprocessing.\nRecommended. Check the wiki for more info.", - "Remote Tunnel":"Creates a trycloudflare tunnel.\nAllows you to access koboldcpp from other devices over an internet URL."} + "Remote Tunnel":"Creates a trycloudflare tunnel.\nAllows you to access koboldcpp from other devices over an internet URL.", + "Use FlashAttention":"Enable flash attention for GGUF models.", + "Quiet Mode":"Prevents all generation related terminal output from being displayed."} for idx, name, in enumerate(quick_boxes): makecheckbox(quick_tab, name, quick_boxes[name], int(idx/2) +20, idx%2,tooltiptxt=quick_boxes_desc[name]) # context size