remove obsolete warning about flash attention on Vulkan (#1634)

Wagner Bruna 2025-07-03 05:57:03 -03:00 committed by GitHub
parent f407aa3b8a
commit bc3e4c1197


@@ -6911,8 +6911,6 @@ def kcpp_main_process(launch_args, g_memory=None, gui_launcher=False):
     if not args.blasthreads or args.blasthreads <= 0:
         args.blasthreads = args.threads
-    if args.flashattention and (args.usevulkan is not None) and args.gpulayers!=0:
-        print("\nWARNING: FlashAttention is strongly discouraged when using Vulkan GPU offload as it is extremely slow!\n")
     modelname = os.path.abspath(args.model_param)
     print(args)
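
For context, the removed guard fired only when all three settings were combined: FlashAttention enabled, a Vulkan device selected, and at least one layer offloaded. Below is a minimal, self-contained sketch of that check; the argparse definitions are assumptions for illustration (koboldcpp defines these flags in its own parser, possibly with different types and defaults), while the condition and message are taken from the diff.

import argparse

# Hypothetical flag definitions, for illustration only.
parser = argparse.ArgumentParser()
parser.add_argument("--flashattention", action="store_true")
parser.add_argument("--usevulkan", type=int, default=None)  # Vulkan device id; None means Vulkan is not used
parser.add_argument("--gpulayers", type=int, default=0)
args = parser.parse_args()

# The removed check: warn only when FlashAttention is enabled, a Vulkan
# device is selected, and at least one layer is offloaded to the GPU.
if args.flashattention and (args.usevulkan is not None) and args.gpulayers != 0:
    print("\nWARNING: FlashAttention is strongly discouraged when using Vulkan GPU offload as it is extremely slow!\n")

Per the commit title, the warning is considered obsolete, presumably because flash attention on the Vulkan backend is no longer prohibitively slow, so the guard is dropped entirely rather than reworded.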