fixed memory leak by freeing temporary graph during session load

2023-10-08 00:36:20 +08:00 · 2023-10-08 00:36:20 +08:00 · 9ee8aeccd7
commit 9ee8aeccd7
parent 88a14fcfef
1 changed file with 4 additions and 0 deletions
--- a/llama.cpp
+++ b/llama.cpp
@@ -8405,6 +8405,10 @@ size_t llama_set_state_data(struct llama_context * ctx, uint8_t * src) {
            ggml_graph_compute_helper(ctx->work_buffer, gf, /*n_threads*/ 1);

            ggml_free(cpy_ctx);
+
+            // free our allocated graph
+            free(gf);
+            gf = NULL;
        }

        ctx->kv_self.head = kv_head;