llama-chat : Add Yandex instruct model template support (#12621)

author Sergei Vorobyov <redacted>

Sun, 30 Mar 2025 18:12:03 +0000 (21:12 +0300)

committer GitHub <redacted>

Sun, 30 Mar 2025 18:12:03 +0000 (20:12 +0200)
author Sergei Vorobyov <redacted>
Sun, 30 Mar 2025 18:12:03 +0000 (21:12 +0300)
committer GitHub <redacted>
Sun, 30 Mar 2025 18:12:03 +0000 (20:12 +0200)
diff --git a/src/llama-chat.cpp b/src/llama-chat.cpp

index de44586967d7115ec7985d39d1e7a3c1a522c58d..d6d781cbaad182bb37759459054e1380c95a4697 100644 (file)
--- a/src/llama-chat.cpp
+++ b/src/llama-chat.cpp
@@ -59,6 +59,7 @@ static const std::map<std::string, llm_chat_template> LLM_CHAT_TEMPLATES = {
      { "granite",           LLM_CHAT_TEMPLATE_GRANITE           },
      { "gigachat",          LLM_CHAT_TEMPLATE_GIGACHAT          },
      { "megrez",            LLM_CHAT_TEMPLATE_MEGREZ            },
+    { "yandex",            LLM_CHAT_TEMPLATE_YANDEX            },
  };
  
  llm_chat_template llm_chat_template_from_str(const std::string & name) {
@@ -168,6 +169,8 @@ llm_chat_template llm_chat_detect_template(const std::string & tmpl) {
          return LLM_CHAT_TEMPLATE_GIGACHAT;
      } else if (tmpl_contains("<|role_start|>")) {
          return LLM_CHAT_TEMPLATE_MEGREZ;
+    } else if (tmpl_contains(" Ассистент:")) {
+        return LLM_CHAT_TEMPLATE_YANDEX;
      }
      return LLM_CHAT_TEMPLATE_UNKNOWN;
  }
@@ -567,6 +570,24 @@ int32_t llm_chat_apply_template(
          if (add_ass) {
              ss << "<|role_start|>assistant<|role_end|>";
          }
+    } else if (tmpl == LLM_CHAT_TEMPLATE_YANDEX) {
+        // Yandex template ("\n\n" is defined as EOT token)
+
+        ss << "<s>";
+
+        for (size_t i = 0; i < chat.size(); i++) {
+            std::string role(chat[i]->role);
+            if (role == "user") {
+                ss << " Пользователь: " << chat[i]->content << "\n\n";
+            } else if (role == "assistant") {
+                ss << " Ассистент: " << chat[i]->content << "\n\n";
+            }
+        }
+
+        // Add generation prompt if needed
+        if (add_ass) {
+            ss << " Ассистент:[SEP]";
+        }
      } else {
          // template not supported
          return -1;
@@ -585,4 +606,3 @@ int32_t llama_chat_builtin_templates(const char ** output, size_t len) {
      }
      return (int32_t) LLM_CHAT_TEMPLATES.size();
  }
-
diff --git a/src/llama-chat.h b/src/llama-chat.h

index 2f6a0e3e2826638be2af9c59047c4ff071741d64..bbd5a6b722a7398f394e8bcdf63da845d83d1a3d 100644 (file)
--- a/src/llama-chat.h
+++ b/src/llama-chat.h
@@ -38,6 +38,7 @@ enum llm_chat_template {
      LLM_CHAT_TEMPLATE_GRANITE,
      LLM_CHAT_TEMPLATE_GIGACHAT,
      LLM_CHAT_TEMPLATE_MEGREZ,
+    LLM_CHAT_TEMPLATE_YANDEX,
      LLM_CHAT_TEMPLATE_UNKNOWN,
  };
  
diff --git a/tests/test-chat-template.cpp b/tests/test-chat-template.cpp

index 9231c517afb0b85d0df60e3868076addd60cce64..894d83714105dc11b8432ec51b85b24849c56a89 100644 (file)
--- a/tests/test-chat-template.cpp
+++ b/tests/test-chat-template.cpp
@@ -270,6 +270,14 @@ int main(void) {
              /* .bos_token= */ "",
              /* .eos_token= */ "",
          },
+        {
+            /* .name= */ "yandex/YandexGPT-5-Lite-8B-instruct",
+            /* .template_str= */ "<s>{%- set names = {'assistant': ' Ассистент:', 'user': ' Пользователь:'} %}\n{%- set tools_prefix = 'Тебе доступны следующие функции:' %}\n{%- macro __render_tool(tool) %}\n    {%- set name = tool.function.name %}\n    {%- set description = tool.function.description|default('') %}\n    {%- set parameters = tool.function.parameters|tojson %}\n    {{- '\\n' }}function {{ '{' }}'name':'{{ name }}',\n    {%- if tool.function.description %}'description':'{{ description }}',{% endif %}\n'parameters':{{ parameters }}\n    {{- '}' }}\n{%- endmacro %}\n{%- macro __render_tools(tools) %}\n    {{- tools_prefix }}\n    {%- for tool in tools %}\n        {{- __render_tool(tool) }}\n    {%- endfor %}\n    {{- '\\n\\n' }}\n{%- endmacro %}\n{%- macro __render_tool_message(message) %}\n    {{- '\\n\\nРезультат вызова' }} {{ message.name }}: {{ message.content }} {{ '\\n\\n' }}\n{%- endmacro %}\n{%- if tools -%}\n    {{- __render_tools(tools) }}\n{%- endif -%}\n{%- macro __render_user_message(message) %}\n{{ names.user }} {{ message.content + '\\n\\n' }}\n{%- endmacro %}\n{%- macro __render_assistant_message(message) %}\n    {{- names.assistant }}\n    {%- set call = message['function_call'] %}\n    {%- if call %}\n        {{- '\\n[TOOL_CALL_START]' }}{{ call.name }}{{ '\\n' }}{{ call.arguments|tojson }}\n    {%- else %}\n        {{- ' ' + message.content + '\\n\\n' }}\n    {%- endif %}\n{%- endmacro %}\n{%- if not add_generation_prompt is defined %}\n{%- set add_generation_prompt = false %}\n{%- endif %}\n{%- for message in messages %}\n    {%- if message['role'] == 'user' %}\n        {{- __render_user_message(message) }}\n    {%- endif %}\n    {%- if message.role == 'assistant' and not loop.last %}\n        {{- __render_assistant_message(message) }}\n    {%- endif %}\n    {%- if message.role == 'tool' %}\n        {{- __render_tool_message(message) }}\n    {%- endif %}\n    {%- if loop.last %}\n        {{- ' Ассистент:[SEP]' }}\n    {%- endif %}\n{%- endfor %}\n",
+            /* .expected_output= */ "<s> Пользователь: Hello\n\n Ассистент: Hi there\n\n Пользователь: Who are you\n\n Ассистент:    I am an assistant   \n\n Пользователь: Another question\n\n Ассистент:[SEP]",
+            /* .expected_output_jinja= */ "<s> Пользователь: You are a helpful assistant\nHello\n\n Ассистент: Hi there\n\n Пользователь: Who are you\n\n Ассистент:    I am an assistant   \n\n Пользователь: Another question\n\n Ассистент:[SEP]",
+            /* .bos_token= */ "",
+            /* .eos_token= */ "",
+        },
      };
      std::vector<char> formatted_chat(1024);
      int32_t res;
author	Sergei Vorobyov <redacted>
	Sun, 30 Mar 2025 18:12:03 +0000 (21:12 +0300)
committer	GitHub <redacted>
	Sun, 30 Mar 2025 18:12:03 +0000 (20:12 +0200)
src/llama-chat.cpp		patch \| blob \| history
src/llama-chat.h		patch \| blob \| history
tests/test-chat-template.cpp		patch \| blob \| history