Resize the batch backend_buffer to its actual required size instead of a guessed value

This commit is contained in:
leeetao 2025-07-04 08:52:15 +00:00
parent 82787be7eb
commit da31acbe6a

View file

@@ -3052,8 +3052,7 @@ struct llama_sbatch {
 ubatch_token.resize(!has_embd ? n_ubatch : 0);
 ubatch_embd.resize(has_embd ? n_embd * n_ubatch : 0);
-// TODO: just a guess and test, need to be removed(from tao)
-ubatch_backend_embd.resize(n_embd * n_tokens * 3);
+ubatch_backend_embd.resize(n_embd * n_tokens + n_tokens);
 ubatch_out_embd.resize(n_embd * n_tokens);
 ubatch_pos.resize(n_ubatch);