relocated shader compile warning

2026-05-08 09:59:50 +00:00 · 2025-11-15 23:17:47 +08:00 · 2025-11-15 23:17:47 +08:00 · 86f907272a
commit 86f907272a
parent ea22e04320
2 changed files with 2 additions and 1 deletion
--- a/ggml/src/ggml-cuda/ggml-cuda.cu
+++ b/ggml/src/ggml-cuda/ggml-cuda.cu
@@ -208,7 +208,7 @@ static ggml_cuda_device_info ggml_cuda_init() {
 //#else
 //    GGML_LOG_INFO("%s: GGML_CUDA_FORCE_CUBLAS: no\n", __func__);
 //#endif // GGML_CUDA_FORCE_CUBLAS
-    GGML_LOG_INFO("---\nInitializing CUDA/HIP, please wait, the following step may take a few minutes (only for first launch)...\n---\n");
+  
    GGML_LOG_INFO("%s: found %d " GGML_CUDA_NAME " devices:\n", __func__, info.device_count);

    std::vector<std::pair<int, std::string>> turing_devices_without_mma;
--- a/gpttype_adapter.cpp
+++ b/gpttype_adapter.cpp
@@ -2217,6 +2217,7 @@ ModelLoadResult gpttype_load_model(const load_model_inputs inputs, FileFormat in
            printf("CUDA: Set main device to %d\n",kcpp_parseinfo_maindevice);
        }
        printf("CUDA MMQ: %s\n",(inputs.use_mmq?"True":"False"));
+        printf("---\nInitializing CUDA/HIP, please wait, the following step may take a few minutes (only for first launch)...\n---\n");
        ggml_cuda_set_mul_mat_q(inputs.use_mmq);
        #endif
        if((file_format_meta.model_architecture == GGUFArch::ARCH_QWEN2 || file_format_meta.model_architecture == GGUFArch::ARCH_QWEN2VL) && !kcpp_data->flash_attn)