mirror of
https://github.com/Lizonghang/prima.cpp.git
synced 2025-09-06 06:49:02 +00:00
speculative: free sockets and send stop signal when inference ends
This commit is contained in:
parent
dc875bbef9
commit
2687ef3126
1 changed file with 2 additions and 0 deletions
|
@@ -628,6 +628,8 @@ int main(int argc, char ** argv) {
|
||||||
LOG_INF("target:\n\n");
|
LOG_INF("target:\n\n");
|
||||||
gpt_perf_print(ctx_tgt, smpl);
|
gpt_perf_print(ctx_tgt, smpl);
|
||||||
|
|
||||||
|
llama_free_sockets(ctx_tgt, nullptr);
|
||||||
|
|
||||||
gpt_sampler_free(smpl);
|
gpt_sampler_free(smpl);
|
||||||
for (int s = 0; s < n_seq_dft; ++s) {
|
for (int s = 0; s < n_seq_dft; ++s) {
|
||||||
gpt_sampler_free(drafts[s].smpl);
|
gpt_sampler_free(drafts[s].smpl);
|
||||||
|
|
Loading…
Add table
Reference in a new issue