mirror of
https://github.com/LostRuins/koboldcpp.git
synced 2025-09-11 09:34:37 +00:00
add ability to use guide tokens for TTS, ref: https://github.com/ggerganov/llama.cpp/pull/11186
This commit is contained in:
parent
bd38665e1f
commit
07173e84a0
4 changed files with 53 additions and 3 deletions
|
@@ -11122,9 +11122,9 @@ static int llama_decode_impl(
|
|||
}
|
||||
}
|
||||
|
||||
GGML_ASSERT(n_tokens_all <= cparams.n_batch);
|
||||
GGML_ASSERT_CONTINUE(n_tokens_all <= cparams.n_batch);
|
||||
|
||||
GGML_ASSERT((cparams.causal_attn || cparams.n_ubatch >= n_tokens_all) && "non-causal attention requires n_ubatch >= n_tokens");
|
||||
GGML_ASSERT_CONTINUE((cparams.causal_attn || cparams.n_ubatch >= n_tokens_all) && "non-causal attention requires n_ubatch >= n_tokens");
|
||||
|
||||
if (lctx.t_compute_start_us == 0) {
|
||||
lctx.t_compute_start_us = ggml_time_us();
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue