llama-chat : reset glmedge chat template (#13253)

author piDack <redacted>

Fri, 2 May 2025 09:06:09 +0000 (17:06 +0800)

committer GitHub <redacted>

Fri, 2 May 2025 09:06:09 +0000 (11:06 +0200)
author piDack <redacted>
Fri, 2 May 2025 09:06:09 +0000 (17:06 +0800)
committer GitHub <redacted>
Fri, 2 May 2025 09:06:09 +0000 (11:06 +0200)
diff --git a/src/llama-chat.cpp b/src/llama-chat.cpp

index 9b566149518796eca991e982574aa7797d41c439..46d43c58ef4d468ba98d6b0548523be57e3414d6 100644 (file)
--- a/src/llama-chat.cpp
+++ b/src/llama-chat.cpp
@@ -447,7 +447,7 @@ int32_t llm_chat_apply_template(
          if (add_ass) {
              ss << "<|assistant|>";
          }
-    } else if (tmpl == LLM_CHAT_TEMPLATE_CHATGLM_4 || tmpl == LLM_CHAT_TEMPLATE_GLMEDGE) {
+    } else if (tmpl == LLM_CHAT_TEMPLATE_CHATGLM_4) {
          ss << "[gMASK]" << "<sop>";
          for (auto message : chat) {
              std::string role(message->role);
@@ -456,6 +456,14 @@ int32_t llm_chat_apply_template(
          if (add_ass) {
              ss << "<|assistant|>\n";
          }
+    } else if (tmpl == LLM_CHAT_TEMPLATE_GLMEDGE) {
+        for (auto message : chat) {
+            std::string role(message->role);
+            ss << "<|" << role << "|>" << "\n" << message->content;
+        }
+        if (add_ass) {
+            ss << "<|assistant|>";
+        }
      } else if (tmpl == LLM_CHAT_TEMPLATE_MINICPM) {
          // MiniCPM-3B-OpenHermes-2.5-v2-GGUF
          for (auto message : chat) {
diff --git a/tests/test-chat-template.cpp b/tests/test-chat-template.cpp

index d217069575cdf02bbf80ebc3509599ed057bd6fb..a0a50f9881fe0381661c1da92fbf2a3da20f8df5 100644 (file)
--- a/tests/test-chat-template.cpp
+++ b/tests/test-chat-template.cpp
@@ -187,15 +187,14 @@ int main(void) {
              /* .bos_token= */ "",
              /* .eos_token= */ "",
          },
-        // TODO @ngxson : GLMEdge produces poor result without `[gMASK]<sop>`, so we're temporarily using GLM4 template for it. We should fix this in the future.
-        // {
-        //     /* .name= */ "GLMEdge",
-        //     /* .template_str= */ "{% for item in messages %}{% if item['role'] == 'system' %}<|system|>\n{{ item['content'] }}{% elif item['role'] == 'user' %}<|user|>\n{{ item['content'] }}{% elif item['role'] == 'assistant' %}<|assistant|>\n{{ item['content'] }}{% endif %}{% endfor %}<|assistant|>",
-        //     /* .expected_output= */ "<|system|>\nYou are a helpful assistant<|user|>\nHello<|assistant|>\nHi there<|user|>\nWho are you<|assistant|>\n   I am an assistant   <|user|>\nAnother question<|assistant|>",
-        //     /* .expected_output_jinja= */ "<|system|>\nYou are a helpful assistant<|user|>\nHello<|assistant|>\nHi there<|user|>\nWho are you<|assistant|>\n   I am an assistant   <|user|>\nAnother question<|assistant|>",
-        //     /* .bos_token= */ "",
-        //     /* .eos_token= */ "",
-        // },
+        {
+            /* .name= */ "GLMEdge",
+            /* .template_str= */ "{% for item in messages %}{% if item['role'] == 'system' %}<|system|>\n{{ item['content'] }}{% elif item['role'] == 'user' %}<|user|>\n{{ item['content'] }}{% elif item['role'] == 'assistant' %}<|assistant|>\n{{ item['content'] }}{% endif %}{% endfor %}<|assistant|>",
+            /* .expected_output= */ "<|system|>\nYou are a helpful assistant<|user|>\nHello<|assistant|>\nHi there<|user|>\nWho are you<|assistant|>\n   I am an assistant   <|user|>\nAnother question<|assistant|>",
+            /* .expected_output_jinja= */ "<|system|>\nYou are a helpful assistant<|user|>\nHello<|assistant|>\nHi there<|user|>\nWho are you<|assistant|>\n   I am an assistant   <|user|>\nAnother question<|assistant|>",
+            /* .bos_token= */ "",
+            /* .eos_token= */ "",
+        },
          {
              /* .name= */ "MiniCPM-3B-OpenHermes-2.5-v2-GGUF",
              /* .template_str= */ U8C("{% for message in messages %}{% if message['role'] == 'user' %}{{'<用户>' + message['content'].strip() + '<AI>'}}{% else %}{{message['content'].strip()}}{% endif %}{% endfor %}"),
author	piDack <redacted>
	Fri, 2 May 2025 09:06:09 +0000 (17:06 +0800)
committer	GitHub <redacted>
	Fri, 2 May 2025 09:06:09 +0000 (11:06 +0200)
src/llama-chat.cpp		patch \| blob \| history
tests/test-chat-template.cpp		patch \| blob \| history