Merge branch 'master' into gg/llama-kv-cache

ggml-ci
2025-01-31 15:11:02 +02:00 · 2025-01-31 15:11:02 +02:00 · 5d3491e789
commit 5d3491e789
parent a40ba49fa6 5783575c9d
53 changed files with 4034 additions and 208 deletions
--- a/common/common.cpp
+++ b/common/common.cpp
@@ -12,6 +12,7 @@
 #include "json.hpp"
 #include "json-schema-to-grammar.h"
 #include "llama.h"
+#include "chat.hpp"
 #include "chat-template.hpp"

 #include <algorithm>
@@ -1774,11 +1775,13 @@ std::string common_detokenize(const struct llama_vocab * vocab, const std::vecto
 bool common_chat_verify_template(const std::string & tmpl, bool use_jinja) {
    if (use_jinja) {
        try {
-            auto chat_template = minja::chat_template(tmpl, "<s>", "</s>");
-            chat_template.apply({{
+            auto chat_template = common_chat_template(tmpl, "<s>", "</s>");
+            common_chat_inputs inputs;
+            inputs.messages = json::array({{
                {"role", "user"},
                {"content", "test"},
-            }}, json(), true);
+            }});
+            common_chat_params_init(chat_template, inputs);
            return true;
        } catch (const std::exception & e) {
            LOG_ERR("%s: failed to apply template: %s\n", __func__, e.what());
@@ -1800,7 +1803,10 @@ std::string common_chat_apply_template(
        for (const auto & msg : msgs) {
            messages.push_back({{"role", msg.role}, {"content", msg.content}});
        }
-        return tmpl.apply(messages, /* tools= */ json(), add_ass);
+        common_chat_inputs inputs;
+        inputs.messages = messages;
+        inputs.add_generation_prompt = add_ass;
+        return common_chat_params_init(tmpl, inputs).prompt;
    }

    int alloc_size = 0;
@@ -1855,10 +1861,10 @@ std::string common_chat_format_single(

 std::string common_chat_format_example(const common_chat_template & tmpl, bool use_jinja) {
    std::vector<common_chat_msg> msgs = {
-        {"system",    "You are a helpful assistant"},
-        {"user",      "Hello"},
-        {"assistant", "Hi there"},
-        {"user",      "How are you?"},
+        {"system",    "You are a helpful assistant", {}},
+        {"user",      "Hello", {}},
+        {"assistant", "Hi there", {}},
+        {"user",      "How are you?", {}},
    };
    return common_chat_apply_template(tmpl, msgs, true, use_jinja);
 }