server : clean up built-in template detection (#11026)

* server : clean up built-in template detection * fix compilation * add chat template test * fix condition
2024-12-31 15:22:01 +01:00 · 2024-12-31 15:22:01 +01:00 · 45095a61bf
commit 45095a61bf
parent 5896c65232
6 changed files with 44 additions and 27 deletions
--- a/common/common.cpp
+++ b/common/common.cpp
@ -1614,6 +1614,18 @@ std::string common_detokenize(llama_context * ctx, const std::vector<llama_token
 // Chat template utils
 //

+std::string common_get_builtin_chat_template(const struct llama_model * model) {
+    static const char * template_key = "tokenizer.chat_template";
+    // call with NULL buffer to get the total size of the string
+    int32_t res = llama_model_meta_val_str(model, template_key, NULL, 0);
+    if (res > 0) {
+        std::vector<char> model_template(res + 1, 0);
+        llama_model_meta_val_str(model, template_key, model_template.data(), model_template.size());
+        return std::string(model_template.data(), model_template.size() - 1);
+    }
+    return "";
+}
+
 bool common_chat_verify_template(const std::string & tmpl) {
    llama_chat_message chat[] = {{"user", "test"}};
    int res = llama_chat_apply_template(nullptr, tmpl.c_str(), chat, 1, true, nullptr, 0);
--- a/common/common.h
+++ b/common/common.h
@ -571,6 +571,9 @@ struct common_chat_msg {
    std::string content;
 };

+// Get the built-in chat template for the model. Return empty string if not present.
+std::string common_get_builtin_chat_template(const struct llama_model * model);
+
 // Check if the template supplied via "--chat-template" is supported or not. Returns true if it's valid
 bool common_chat_verify_template(const std::string & tmpl);