llama : better rwkv chat template and add missing inputs.use_jinja setting (#14336)

* llama-cli : add missing `inputs.use_jinja` setting

Signed-off-by: Molly Sophia <mollysophia379@gmail.com>

* llama : better legacy chat template for rwkv

Signed-off-by: Molly Sophia <mollysophia379@gmail.com>

---------

Signed-off-by: Molly Sophia <mollysophia379@gmail.com>
This commit is contained in:
Molly Sophia
2025-06-23 19:56:19 +08:00
committed by GitHub
parent defe2158dd
commit 72c6bc3f3d
2 changed files with 12 additions and 6 deletions

View File

@@ -528,12 +528,17 @@ int32_t llm_chat_apply_template(
} }
} else if (tmpl == LLM_CHAT_TEMPLATE_RWKV_WORLD) { } else if (tmpl == LLM_CHAT_TEMPLATE_RWKV_WORLD) {
// this template requires the model to have "\n\n" as EOT token // this template requires the model to have "\n\n" as EOT token
for (auto message : chat) { for (size_t i = 0; i < chat.size(); i++) {
std::string role(message->role); std::string role(chat[i]->role);
if (role == "user") { if (role == "system") {
ss << "User: " << message->content << "\n\nAssistant:"; ss << "System: " << trim(chat[i]->content) << "\n\n";
} else { } else if (role == "user") {
ss << message->content << "\n\n"; ss << "User: " << trim(chat[i]->content) << "\n\n";
if (i == chat.size() - 1) {
ss << "Assistant:";
}
} else if (role == "assistant") {
ss << "Assistant: " << trim(chat[i]->content) << "\n\n";
} }
} }
} else if (tmpl == LLM_CHAT_TEMPLATE_GRANITE) { } else if (tmpl == LLM_CHAT_TEMPLATE_GRANITE) {

View File

@@ -292,6 +292,7 @@ int main(int argc, char ** argv) {
if (!params.system_prompt.empty() || !params.prompt.empty()) { if (!params.system_prompt.empty() || !params.prompt.empty()) {
common_chat_templates_inputs inputs; common_chat_templates_inputs inputs;
inputs.use_jinja = g_params->use_jinja;
inputs.messages = chat_msgs; inputs.messages = chat_msgs;
inputs.add_generation_prompt = !params.prompt.empty(); inputs.add_generation_prompt = !params.prompt.empty();