some tweaks and cleanup

This commit is contained in:
Concedo 2025-01-13 23:50:54 +08:00
parent 636beac6d2
commit e77d566268
3 changed files with 8 additions and 4 deletions

View file

@@ -11124,7 +11124,7 @@ static int llama_decode_impl(
GGML_ASSERT_CONTINUE(n_tokens_all <= cparams.n_batch);
GGML_ASSERT_CONTINUE((cparams.causal_attn || cparams.n_ubatch >= n_tokens_all) && "non-causal attention requires n_ubatch >= n_tokens");
//GGML_ASSERT_CONTINUE((cparams.causal_attn || cparams.n_ubatch >= n_tokens_all) && "non-causal attention requires n_ubatch >= n_tokens");
if (lctx.t_compute_start_us == 0) {
lctx.t_compute_start_us = ggml_time_us();