add ability to use guide tokens for TTS, ref: https://github.com/ggerganov/llama.cpp/pull/11186

This commit is contained in:
Concedo 2025-01-11 17:18:21 +08:00
parent bd38665e1f
commit 07173e84a0
4 changed files with 53 additions and 3 deletions

View file

@ -11122,9 +11122,9 @@ static int llama_decode_impl(
}
}
GGML_ASSERT(n_tokens_all <= cparams.n_batch);
GGML_ASSERT_CONTINUE(n_tokens_all <= cparams.n_batch);
GGML_ASSERT((cparams.causal_attn || cparams.n_ubatch >= n_tokens_all) && "non-causal attention requires n_ubatch >= n_tokens");
GGML_ASSERT_CONTINUE((cparams.causal_attn || cparams.n_ubatch >= n_tokens_all) && "non-causal attention requires n_ubatch >= n_tokens");
if (lctx.t_compute_start_us == 0) {
lctx.t_compute_start_us = ggml_time_us();