llama : Add IBM granite template (#10013)

* Add granite template to llama.cpp * Add granite template to test-chat-template.cpp * Update src/llama.cpp Co-authored-by: Xuan Son Nguyen <thichthat@gmail.com> * Update tests/test-chat-template.cpp Co-authored-by: Xuan Son Nguyen <thichthat@gmail.com> * Added proper template and expected output * Small change to \n Small change to \n * Add code space & Co-authored-by: Xuan Son Nguyen <thichthat@gmail.com> * Fix spacing * Apply suggestions from code review * Update src/llama.cpp --------- Co-authored-by: Xuan Son Nguyen <thichthat@gmail.com>
2024-10-28 10:45:33 -07:00 · 2024-10-28 10:45:33 -07:00 · 61715d5cc8
commit 61715d5cc8
parent 07028f9d74
2 changed files with 14 additions and 0 deletions
--- a/src/llama.cpp
+++ b/src/llama.cpp
@ -21706,6 +21706,16 @@ static int32_t llama_chat_apply_template_internal(
                ss << message->content << "\n\n";
            }
        }
+    } else if (tmpl == "granite" || tmpl_contains("<|start_of_role|>")) {
+        // IBM Granite template
+        for (const auto & message : chat) {
+            std::string role(message->role);
+            ss << "<|start_of_role|>" << role << "<|end_of_role|>"
+               << message->content << "<|end_of_text|>\n";
+        }
+        if (add_ass) {
+            ss << "<|start_of_role|>assistant<|end_of_role|>\n";
+        }
    } else {
        // template not supported
        return -1;