mirror of
https://github.com/LostRuins/koboldcpp.git
synced 2025-09-10 09:04:36 +00:00
Try disabling the [gMASK] prefix for GLM-4 completions
This commit is contained in:
parent
c64557a851
commit
49305942ab
2 changed files with 24 additions and 24 deletions
|
@ -3263,28 +3263,28 @@ generation_outputs gpttype_generate(const generation_inputs inputs)
|
|||
}
|
||||
|
||||
//cursed hack needed for GLM4 coherency: ensure that both the [gMASK] and <sop> tokens get injected
|
||||
if (file_format == FileFormat::GGUF_GENERIC && file_format_meta.model_architecture == GGUFArch::ARCH_GLM4) {
|
||||
std::string temp = gpttype_get_chat_template();
|
||||
if (temp.find("[gMASK]<sop>") != std::string::npos) {
|
||||
if (addedmemory == "") {
|
||||
if (kcpp_data->prompt.rfind("[gMASK]", 0) == 0) { //check startswith
|
||||
kcpp_data->prompt.erase(0, 7);
|
||||
}
|
||||
if (kcpp_data->prompt.rfind("<sop>", 0) == 0) { //check startswith
|
||||
kcpp_data->prompt.erase(0, 5);
|
||||
}
|
||||
addedmemory = "[gMASK]<sop>";
|
||||
} else {
|
||||
if (addedmemory.rfind("[gMASK]", 0) == 0) { //check startswith
|
||||
addedmemory.erase(0, 7);
|
||||
}
|
||||
if (addedmemory.rfind("<sop>", 0) == 0) { //check startswith
|
||||
addedmemory.erase(0, 5);
|
||||
}
|
||||
addedmemory = "[gMASK]<sop>" + addedmemory;
|
||||
}
|
||||
}
|
||||
}
|
||||
// if (file_format == FileFormat::GGUF_GENERIC && file_format_meta.model_architecture == GGUFArch::ARCH_GLM4) {
|
||||
// std::string temp = gpttype_get_chat_template();
|
||||
// if (temp.find("[gMASK]<sop>") != std::string::npos) {
|
||||
// if (addedmemory == "") {
|
||||
// if (kcpp_data->prompt.rfind("[gMASK]", 0) == 0) { //check startswith
|
||||
// kcpp_data->prompt.erase(0, 7);
|
||||
// }
|
||||
// if (kcpp_data->prompt.rfind("<sop>", 0) == 0) { //check startswith
|
||||
// kcpp_data->prompt.erase(0, 5);
|
||||
// }
|
||||
// addedmemory = "[gMASK]<sop>";
|
||||
// } else {
|
||||
// if (addedmemory.rfind("[gMASK]", 0) == 0) { //check startswith
|
||||
// addedmemory.erase(0, 7);
|
||||
// }
|
||||
// if (addedmemory.rfind("<sop>", 0) == 0) { //check startswith
|
||||
// addedmemory.erase(0, 5);
|
||||
// }
|
||||
// addedmemory = "[gMASK]<sop>" + addedmemory;
|
||||
// }
|
||||
// }
|
||||
// }
|
||||
|
||||
bool stream_sse = inputs.stream_sse;
|
||||
bool allow_regular_prints = (!is_quiet && debugmode!=-1);
|
||||
|
|
|
@ -4433,8 +4433,8 @@ def show_gui():
|
|||
except Exception:
|
||||
pass
|
||||
else:
|
||||
quick_gpuname_label.configure(text="")
|
||||
gpuname_label.configure(text="")
|
||||
quick_gpuname_label.configure(text="(dGPUs only, tensor split sets ratio)")
|
||||
gpuname_label.configure(text="(dGPUs only, tensor split sets ratio)")
|
||||
|
||||
gpu_choice_var.trace("w", changed_gpu_choice_var)
|
||||
gpulayers_var.trace("w", changed_gpulayers_estimate)
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue