fix gpt oss

This commit is contained in:
Concedo 2025-11-26 23:44:56 +08:00
parent 998dfcd1be
commit 5fe1d51c24
4 changed files with 5 additions and 4 deletions

View file

@ -4153,7 +4153,7 @@ Current version indicated by LITEVER below.
"name":"OpenAI Harmony Non-Thinking",
"user":"<|start|>user<|message|>",
"user_end":"<|end|>",
"assistant":"<|start|>assistant<|channel|>final<|message|>",
"assistant":"<|start|>assistant<|channel|>analysis<|message|>We can answer immediately.<|end|><|start|>assistant<|channel|>final<|message|>",
"assistant_end":"<|end|>",
"system":"<|start|>developer<|message|>",
"system_end":"<|end|>",
@ -6893,6 +6893,7 @@ Current version indicated by LITEVER below.
.replace(/\*\*\*([^\s*][\s\S]*?[^\\])\*\*\*/gm, "<b><em>$1</em></b>")
.replace(/\*\*(.)\*\*/g, "<b>$1</b>") //handle single char bold
.replace(/ \*\*(\w+(?: \w+)?)\*\* /g, " <b>$1</b> ") //hack: support 1 or 2 nested bolded words (not official)
.replace(/\*\*([^\s*][\s\S]*?[^\\])\*\*/gm, "<b>$1</b>")
.replace(/(^|[\s.,;:!?<>])\*(.)\*(?=[\s.,;:!?<>]|$)/g, "$1<em>$2</em>") //handle single char italics
.replace(/\*([^\s*][\s\S]*?[^\\])\*/gm, "<em>$1</em>")

View file

@ -588,7 +588,7 @@ void ggml_cuda_flash_attn_ext_wmma_f16(ggml_backend_cuda_context & ctx, ggml_ten
// ggml_cuda_flash_attn_ext_wmma_f16_case<256, cols_per_block, float>(ctx, dst);
// break;
default:
GGML_ABORT("fatal error");
GGML_ABORT("fatal error: case %lld", (long long) Q->ne[0]);
break;
}
}

View file

@ -218,7 +218,7 @@
"system_end": "\n\n<|end|>",
"user_start": "<|start|>user<|message|>",
"user_end": "<|end|>",
"assistant_start": "<|start|>assistant<|channel|>final<|message|>",
"assistant_start": "<|start|>assistant<|channel|>analysis<|message|>We can answer immediately.<|end|><|start|>assistant<|channel|>final<|message|>",
"assistant_end": "<|end|>"
}
}, {

View file

@ -3,6 +3,6 @@
"system_end": "<|end|>",
"user_start": "<|start|>user<|message|>",
"user_end": "<|end|>",
"assistant_start": "<|start|>assistant<|channel|>final<|message|>",
"assistant_start": "<|start|>assistant<|channel|>analysis<|message|>We can answer immediately.<|end|><|start|>assistant<|channel|>final<|message|>",
"assistant_end": "<|end|>"
}