mirror of
https://github.com/Lizonghang/prima.cpp.git
synced 2025-09-05 19:19:02 +00:00
speculative: free sockets and send stop signal when inference ends
This commit is contained in:
parent
dc875bbef9
commit
2687ef3126
1 changed files with 2 additions and 0 deletions
|
@ -628,6 +628,8 @@ int main(int argc, char ** argv) {
|
|||
LOG_INF("target:\n\n");
|
||||
gpt_perf_print(ctx_tgt, smpl);
|
||||
|
||||
llama_free_sockets(ctx_tgt, nullptr);
|
||||
|
||||
gpt_sampler_free(smpl);
|
||||
for (int s = 0; s < n_seq_dft; ++s) {
|
||||
gpt_sampler_free(drafts[s].smpl);
|
||||
|
|
Loading…
Add table
Reference in a new issue