mtmd : fix glm-edge redundant token count (#13139)

* mtmd : fix glm-edge redundant token count * fix chat template * temporarily disable GLMEdge test chat tmpl
2025-04-28 16:12:56 +02:00 · 2025-04-28 16:12:56 +02:00 · 4e87962e34
commit 4e87962e34
parent fb0471d175
3 changed files with 11 additions and 26 deletions
--- a/src/llama-chat.cpp
+++ b/src/llama-chat.cpp
@@ -447,7 +447,7 @@ int32_t llm_chat_apply_template(
        if (add_ass) {
            ss << "<|assistant|>";
        }
-    } else if (tmpl == LLM_CHAT_TEMPLATE_CHATGLM_4) {
+    } else if (tmpl == LLM_CHAT_TEMPLATE_CHATGLM_4 || tmpl == LLM_CHAT_TEMPLATE_GLMEDGE) {
        ss << "[gMASK]" << "<sop>";
        for (auto message : chat) {
            std::string role(message->role);
@@ -456,14 +456,6 @@ int32_t llm_chat_apply_template(
        if (add_ass) {
            ss << "<|assistant|>";
        }
-    } else if (tmpl == LLM_CHAT_TEMPLATE_GLMEDGE) {
-        for (auto message : chat) {
-            std::string role(message->role);
-            ss << "<|" << role << "|>" << "\n" << message->content;
-        }
-        if (add_ass) {
-            ss << "<|assistant|>";
-        }
    } else if (tmpl == LLM_CHAT_TEMPLATE_MINICPM) {
        // MiniCPM-3B-OpenHermes-2.5-v2-GGUF
        for (auto message : chat) {