diff --git a/examples/speculative/speculative.cpp b/examples/speculative/speculative.cpp index 3716579e..f4ab8262 100644 --- a/examples/speculative/speculative.cpp +++ b/examples/speculative/speculative.cpp @@ -628,6 +628,8 @@ int main(int argc, char ** argv) { LOG_INF("target:\n\n"); gpt_perf_print(ctx_tgt, smpl); + llama_free_sockets(ctx_tgt, nullptr); + gpt_sampler_free(smpl); for (int s = 0; s < n_seq_dft; ++s) { gpt_sampler_free(drafts[s].smpl);