Be nice to CI machines by not allocating buffers

...for vocab_only=true
Stephan Walter 2023-04-01 17:00:01 +02:00
parent d0a7f742e7
commit 3ef747808a

@@ -1608,7 +1608,7 @@ struct llama_context * llama_init_from_file(
     }
 
     // reserve memory for context buffers
-    {
+    if (!params.vocab_only) {
         if (!kv_cache_init(ctx->model.hparams, ctx->model.kv_self, memory_type, ctx->model.hparams.n_ctx)) {
             fprintf(stderr, "%s: kv_cache_init() failed for self-attention cache\n", __func__);
             llama_free(ctx);
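
For reference, a minimal sketch (not part of this commit) of the usage the change targets, assuming the llama.h C API of this period (llama_context_default_params, llama_init_from_file, llama_n_vocab): with vocab_only set, only the vocabulary is loaded, and after this commit the KV cache and other context buffers are no longer allocated, keeping memory use low on CI machines.

// vocab_only_check.c -- hypothetical example, not part of this commit
#include <stdio.h>
#include "llama.h"

int main(int argc, char ** argv) {
    if (argc < 2) {
        fprintf(stderr, "usage: %s <model-path>\n", argv[0]);
        return 1;
    }

    struct llama_context_params params = llama_context_default_params();
    params.vocab_only = true; // load only the vocab; skips buffer allocation after this commit

    struct llama_context * ctx = llama_init_from_file(argv[1], params);
    if (ctx == NULL) {
        fprintf(stderr, "failed to load model\n");
        return 1;
    }

    printf("n_vocab = %d\n", llama_n_vocab(ctx));

    llama_free(ctx);
    return 0;
}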