mirror of
https://github.com/Lizonghang/prima.cpp.git
synced 2025-09-05 19:49:03 +00:00
Modified batch backend_buffer size to actual size
This commit is contained in:
parent
82787be7eb
commit
da31acbe6a
1 changed file with 1 addition and 2 deletions
|
@@ -3052,8 +3052,7 @@ struct llama_sbatch {
|
||||||
ubatch_token.resize(!has_embd ? n_ubatch : 0);
|
ubatch_token.resize(!has_embd ? n_ubatch : 0);
|
||||||
ubatch_embd.resize(has_embd ? n_embd * n_ubatch : 0);
|
ubatch_embd.resize(has_embd ? n_embd * n_ubatch : 0);
|
||||||
|
|
||||||
// TODO: just a guess and test, need to be removed(from tao)
|
ubatch_backend_embd.resize(n_embd * n_tokens + n_tokens);
|
||||||
ubatch_backend_embd.resize(n_embd * n_tokens * 3);
|
|
||||||
ubatch_out_embd.resize(n_embd * n_tokens);
|
ubatch_out_embd.resize(n_embd * n_tokens);
|
||||||
|
|
||||||
ubatch_pos.resize(n_ubatch);
|
ubatch_pos.resize(n_ubatch);
|
||||||
|
|
Loading…
Add table
Reference in a new issue