Skip to content
Previous commit
Next commit
Fixed a memory leak by freeing the temporary graph during session load
  • Loading branch information
l3utterfly committed Oct 7, 2023
commit 9ee8aeccd73dbc4a000eb93c1c08eea843c752a3
4 changes: 4 additions & 0 deletions llama.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -8405,6 +8405,10 @@ size_t llama_set_state_data(struct llama_context * ctx, uint8_t * src) {
ggml_graph_compute_helper(ctx->work_buffer, gf, /*n_threads*/ 1);

ggml_free(cpy_ctx);

// free our allocated graph
free(gf);
gf = NULL;
}

ctx->kv_self.head = kv_head;
Expand Down