diff --git a/llama.h b/llama.h index da8f7f600..b4769ed20 100644 --- a/llama.h +++ b/llama.h @@ -96,7 +96,7 @@ extern "C" { // Sets the KV cache containing the current context for the model LLAMA_API void llama_set_kv_cache( struct llama_context * ctx, - uint8_t * kv_cache, + const uint8_t * kv_cache, size_t n_size, int n_token_count);