llama : cont

ggml-ci
2025-01-13 14:56:52 +02:00 · 2025-01-13 14:56:52 +02:00 · e4550fbafc
commit e4550fbafc
parent f78b396ee7
19 changed files with 128 additions and 79 deletions
--- a/examples/lookup/lookup.cpp
+++ b/examples/lookup/lookup.cpp
@@ -35,6 +35,7 @@ int main(int argc, char ** argv){

    llama_model * model = llama_init.model.get();
    llama_context * ctx = llama_init.context.get();
+    llama_kv_cache * kv = llama_get_kv_cache(ctx);

    const llama_vocab * vocab = llama_model_get_vocab(model);

@@ -192,7 +193,7 @@ int main(int argc, char ** argv){

        // KV cache management
        // clean the cache of draft tokens that weren't accepted
-        llama_kv_cache_seq_rm(ctx, 0, n_past, -1);
+        llama_kv_cache_seq_rm(kv, 0, n_past, -1);

        common_batch_clear(batch_tgt);
        common_batch_add(batch_tgt, draft[0], n_past, { 0 }, true);