From bc3e4c1197468103eb686aee70fcc2231cc58f2f Mon Sep 17 00:00:00 2001 From: Wagner Bruna Date: Thu, 3 Jul 2025 05:57:03 -0300 Subject: [PATCH] remove obsolete warning about flash attention on Vulkan (#1634) --- koboldcpp.py | 2 -- 1 file changed, 2 deletions(-) diff --git a/koboldcpp.py b/koboldcpp.py index dcdf05324..75e979f50 100644 --- a/koboldcpp.py +++ b/koboldcpp.py @@ -6911,8 +6911,6 @@ def kcpp_main_process(launch_args, g_memory=None, gui_launcher=False): if not args.blasthreads or args.blasthreads <= 0: args.blasthreads = args.threads - if args.flashattention and (args.usevulkan is not None) and args.gpulayers!=0: - print("\nWARNING: FlashAttention is strongly discouraged when using Vulkan GPU offload as it is extremely slow!\n") modelname = os.path.abspath(args.model_param) print(args)