diff --git a/koboldcpp.py b/koboldcpp.py index dcdf05324..75e979f50 100644 --- a/koboldcpp.py +++ b/koboldcpp.py @@ -6911,8 +6911,6 @@ def kcpp_main_process(launch_args, g_memory=None, gui_launcher=False): if not args.blasthreads or args.blasthreads <= 0: args.blasthreads = args.threads - if args.flashattention and (args.usevulkan is not None) and args.gpulayers!=0: - print("\nWARNING: FlashAttention is strongly discouraged when using Vulkan GPU offload as it is extremely slow!\n") modelname = os.path.abspath(args.model_param) print(args)