From 1ebe20789bd6ec52672f4b1a2c1b1260ec9c342a Mon Sep 17 00:00:00 2001 From: Markus Tavenrath Date: Wed, 12 Jun 2024 13:45:41 +0200 Subject: [PATCH] Free resources except for backend. --- llama.cpp | 8 ++++++-- 1 file changed, 6 insertions(+), 2 deletions(-) diff --git a/llama.cpp b/llama.cpp index 71f5b53ba..ac4582864 100644 --- a/llama.cpp +++ b/llama.cpp @@ -3936,8 +3936,12 @@ struct llama_model_loader { } #if defined(GGML_USE_CUDA) - for (auto const& event : events) { - ggml_backend_event_synchronize(event); + for (size_t idx = 0; idx < num_buffers;++idx) { + ggml_backend_event_synchronize(events[idx]); + ggml_backend_event_free(events[idx]); + ggml_backend_buffer_free(host_buffers[idx]); + + //ggml_backend_free(backend); } #endif