llama : add Orion chat template (#6066)

author Xuan Son Nguyen <redacted>

Fri, 15 Mar 2024 08:44:57 +0000 (09:44 +0100)

committer GitHub <redacted>

Fri, 15 Mar 2024 08:44:57 +0000 (10:44 +0200)
author Xuan Son Nguyen <redacted>
Fri, 15 Mar 2024 08:44:57 +0000 (09:44 +0100)
committer GitHub <redacted>
Fri, 15 Mar 2024 08:44:57 +0000 (10:44 +0200)
diff --git a/llama.cpp b/llama.cpp

index 2c384197492e87841f57408a511b6ea5902e2938..b8a8d2723ae7d526f83121ff18bc25232645187d 100644 (file)
--- a/llama.cpp
+++ b/llama.cpp
@@ -14242,6 +14242,26 @@ static int32_t llama_chat_apply_template_internal(
          if (add_ass) {
              ss << "<start_of_turn>model\n";
          }
+    } else if (tmpl == "orion" || tmpl.find("'\\n\\nAssistant: ' + eos_token") != std::string::npos) {
+        // OrionStarAI/Orion-14B-Chat
+        std::string system_prompt = "";
+        for (auto message : chat) {
+            std::string role(message->role);
+            if (role == "system") {
+                // the Orion template has no system role, so hold the system message and prepend it to the next user prompt
+                system_prompt = message->content;
+                continue;
+            } else if (role == "user") {
+                ss << "Human: ";
+                if (!system_prompt.empty()) {
+                    ss << system_prompt << "\n\n";
+                    system_prompt = "";
+                }
+                ss << message->content << "\n\nAssistant: </s>";
+            } else {
+                ss << message->content << "</s>";
+            }
+        }
      } else {
          // template not supported
          return -1;
diff --git a/tests/test-chat-template.cpp b/tests/test-chat-template.cpp

index fa2eb577b6e423c9cdb673f83babef8465a45ad5..6e9e4bd1ea2cc242b094d41a191aa639dfe0420d 100644 (file)
--- a/tests/test-chat-template.cpp
+++ b/tests/test-chat-template.cpp
@@ -31,6 +31,8 @@ int main(void) {
          "{% for message in messages %}{{bos_token + message['role'] + '\\n' + message['content'] + eos_token + '\\n'}}{% endfor %}{% if add_generation_prompt %}{{ bos_token + 'assistant\\n' }}{% endif %}",
          // google/gemma-7b-it
          "{% if messages[0]['role'] == 'system' %}{{ raise_exception('System role not supported') }}{% endif %}{% for message in messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if (message['role'] == 'assistant') %}{% set role = 'model' %}{% else %}{% set role = message['role'] %}{% endif %}{{ '<start_of_turn>' + role + '\\n' + message['content'] | trim + '<end_of_turn>\\n' }}{% endfor %}{% if add_generation_prompt %}{{'<start_of_turn>model\\n'}}{% endif %}",
+        // OrionStarAI/Orion-14B-Chat
+        "{% for message in messages %}{% if loop.first %}{{ bos_token }}{% endif %}{% if message['role'] == 'user' %}{{ 'Human: ' + message['content'] + '\\n\\nAssistant: ' + eos_token }}{% elif message['role'] == 'assistant' %}{{ message['content'] + eos_token }}{% endif %}{% endfor %}",
      };
      std::vector<std::string> expected_output = {
          // teknium/OpenHermes-2.5-Mistral-7B
@@ -45,6 +47,8 @@ int main(void) {
          "system\nYou are a helpful assistant</s>\n<s>user\nHello</s>\n<s>assistant\nHi there</s>\n<s>user\nWho are you</s>\n<s>assistant\n   I am an assistant   </s>\n<s>user\nAnother question</s>\n<s>assistant\n",
          // google/gemma-7b-it
          "<start_of_turn>user\nYou are a helpful assistant\n\nHello<end_of_turn>\n<start_of_turn>model\nHi there<end_of_turn>\n<start_of_turn>user\nWho are you<end_of_turn>\n<start_of_turn>model\nI am an assistant<end_of_turn>\n<start_of_turn>user\nAnother question<end_of_turn>\n<start_of_turn>model\n",
+        // OrionStarAI/Orion-14B-Chat
+        "Human: You are a helpful assistant\n\nHello\n\nAssistant: </s>Hi there</s>Human: Who are you\n\nAssistant: </s>   I am an assistant   </s>Human: Another question\n\nAssistant: </s>",
      };
      std::vector<char> formatted_chat(1024);
      int32_t res;
author	Xuan Son Nguyen <redacted>
	Fri, 15 Mar 2024 08:44:57 +0000 (09:44 +0100)
committer	GitHub <redacted>
	Fri, 15 Mar 2024 08:44:57 +0000 (10:44 +0200)
llama.cpp		patch \| blob \| history
tests/test-chat-template.cpp		patch \| blob \| history