cuBLAS: also pin kv cache

2023-04-28 00:48:01 +02:00 · 2023-04-28 00:48:01 +02:00 · 3cf2247d37
commit 3cf2247d37
parent d5d6a8083a
1 changed file with 1 addition and 1 deletion
--- a/llama.cpp
+++ b/llama.cpp
@@ -136,7 +136,7 @@ struct llama_kv_cache {

    struct ggml_context * ctx = NULL;

-    llama_buffer buf;
+    llama_ctx_buffer buf;

    int n; // number of tokens currently in the cache