From b698d87e9afacf7d82d6c7d5a7a961b59e206cc7 Mon Sep 17 00:00:00 2001
From: vincent
Date: Tue, 6 Feb 2024 00:41:52 +0800
Subject: [PATCH] fix bug for quantize minicpm

---
 llama.cpp | 1 +
 1 file changed, 1 insertion(+)

diff --git a/llama.cpp b/llama.cpp
index cc50ea303..f14e56bd0 100644
--- a/llama.cpp
+++ b/llama.cpp
@@ -697,6 +697,7 @@ static std::map<llm_arch, std::map<llm_tensor, std::string>> LLM_TENSOR_NAMES = {
             { LLM_TENSOR_TOKEN_EMBD, "token_embd" },
             { LLM_TENSOR_OUTPUT_NORM, "output_norm" },
+            { LLM_TENSOR_OUTPUT, "output" },
             { LLM_TENSOR_ROPE_FREQS, "rope_freqs" },
             { LLM_TENSOR_ATTN_NORM, "blk.%d.attn_norm" },
             { LLM_TENSOR_ATTN_Q, "blk.%d.attn_q" },