From 2687ef3126fcb120b014b9c80e98238ebc049781 Mon Sep 17 00:00:00 2001 From: "Li, Zonghang" <870644199@qq.com> Date: Fri, 13 Jun 2025 11:25:42 +0400 Subject: [PATCH] speculative: free sockets and send stop signal when inference ends --- examples/speculative/speculative.cpp | 2 ++ 1 file changed, 2 insertions(+) diff --git a/examples/speculative/speculative.cpp b/examples/speculative/speculative.cpp index 3716579e..f4ab8262 100644 --- a/examples/speculative/speculative.cpp +++ b/examples/speculative/speculative.cpp @@ -628,6 +628,8 @@ int main(int argc, char ** argv) { LOG_INF("target:\n\n"); gpt_perf_print(ctx_tgt, smpl); + llama_free_sockets(ctx_tgt, nullptr); + gpt_sampler_free(smpl); for (int s = 0; s < n_seq_dft; ++s) { gpt_sampler_free(drafts[s].smpl);