llama : llama_kv_cache_clear zeroes data + fix save-load seq

ggml-ci
2024-04-25 19:37:27 +03:00 · 2024-04-25 19:37:27 +03:00 · c225609f10
commit c225609f10
parent ac1c6d91de
2 changed files with 103 additions and 46 deletions
--- a/llama.h
+++ b/llama.h
@@ -526,7 +526,7 @@ extern "C" {
    // Returns the number of used KV cells (i.e. have at least one sequence assigned to them)
    LLAMA_API int32_t llama_get_kv_cache_used_cells(const struct llama_context * ctx);

-    // Clear the KV cache
+    // Clear the KV cache - both cell info is erased and KV data is zeroed
    LLAMA_API void llama_kv_cache_clear(
            struct llama_context * ctx);