gemma3 template, updated lite, fixed tool calling, re-enable context shift for gemma3

This commit is contained in:
Concedo 2025-03-14 17:47:01 +08:00
parent 7dc72db9de
commit 6a1dd57435
5 changed files with 78 additions and 8 deletions

View file

@@ -2129,11 +2129,6 @@ ModelLoadResult gpttype_load_model(const load_model_inputs inputs, FileFormat in
printf("Qwen2VL detected! Mrope will be used, and context shift will be disabled!\n");
kcpp_data->use_contextshift = false;
}
if(file_format_meta.model_architecture == GGUFArch::ARCH_GEMMA3)
{
printf("Gemma3 detected! Context shift will be disabled!\n");
kcpp_data->use_contextshift = false;
}
model_params.main_gpu = cu_parseinfo_maindevice;
#if defined(GGML_USE_CUDA)