cuBLAS: also pin kv cache
This commit is contained in:
parent
d5d6a8083a
commit
3cf2247d37
1 changed file with 1 addition and 1 deletion
|
@@ -136,7 +136,7 @@ struct llama_kv_cache {
|
|||
|
||||
struct ggml_context * ctx = NULL;
|
||||
|
||||
- llama_buffer buf;
|
||||
+ llama_ctx_buffer buf;
|
||||
|
||||
int n; // number of tokens currently in the cache
|
||||
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue