From bc2877d2fede3298c8f88cb7600b3f71ad000d14 Mon Sep 17 00:00:00 2001 From: Concedo <39025047+LostRuins@users.noreply.github.com> Date: Sun, 13 Jul 2025 23:42:59 +0800 Subject: [PATCH] test without g3n fix --- gpttype_adapter.cpp | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/gpttype_adapter.cpp b/gpttype_adapter.cpp index 68f676d43..f253e5fc2 100644 --- a/gpttype_adapter.cpp +++ b/gpttype_adapter.cpp @@ -2292,11 +2292,11 @@ ModelLoadResult gpttype_load_model(const load_model_inputs inputs, FileFormat in } //handle override tensor std::string tensoroverrides = inputs.override_tensors; - if(file_format_meta.model_architecture==GGUFArch::ARCH_GEMMA3N) - { - std::string forced = "per_layer_token_embd.weight=CPU"; //this tensor on gpu is problematic on unsloth q4_0 - tensoroverrides = (tensoroverrides=="" ? forced: (forced+","+tensoroverrides)); - } + // if(file_format_meta.model_architecture==GGUFArch::ARCH_GEMMA3N) + // { + // std::string forced = "per_layer_token_embd.weight=CPU"; //this tensor on gpu is problematic on unsloth q4_0 + // tensoroverrides = (tensoroverrides=="" ? forced: (forced+","+tensoroverrides)); + // } if(tensoroverrides!="" && ggml_backend_dev_count()>1) { printf("Handling Override Tensors for backends: ");