gguf-py : export chat templates (#4125)
author slaren <redacted>
Sun, 19 Nov 2023 10:10:52 +0000 (11:10 +0100)
committer GitHub <redacted>
Sun, 19 Nov 2023 10:10:52 +0000 (11:10 +0100)
* gguf-py : export chat templates

* llama.cpp : escape new lines in gguf kv info prints

* gguf-py : bump version

* gguf-py : check chat_template type

* gguf-py : initialize chat_template

gguf-py/gguf/constants.py
gguf-py/gguf/gguf_writer.py
gguf-py/gguf/vocab.py
gguf-py/pyproject.toml
llama.cpp

index 7f63361bd32bc3bc1b82e4bb04b805577b1efc9c..8bd82daca38a78c902922b7c1273a10af6bca30e 100644
--- a/gguf-py/gguf/constants.py
+++ b/gguf-py/gguf/constants.py
@@ -56,20 +56,21 @@ class Keys:
         SCALING_FINETUNED    = "{arch}.rope.scaling.finetuned"
 
     class Tokenizer:
-        MODEL      = "tokenizer.ggml.model"
-        LIST       = "tokenizer.ggml.tokens"
-        TOKEN_TYPE = "tokenizer.ggml.token_type"
-        SCORES     = "tokenizer.ggml.scores"
-        MERGES     = "tokenizer.ggml.merges"
-        BOS_ID     = "tokenizer.ggml.bos_token_id"
-        EOS_ID     = "tokenizer.ggml.eos_token_id"
-        UNK_ID     = "tokenizer.ggml.unknown_token_id"
-        SEP_ID     = "tokenizer.ggml.seperator_token_id"
-        PAD_ID     = "tokenizer.ggml.padding_token_id"
-        ADD_BOS    = "tokenizer.ggml.add_bos_token"
-        ADD_EOS    = "tokenizer.ggml.add_eos_token"
-        HF_JSON    = "tokenizer.huggingface.json"
-        RWKV       = "tokenizer.rwkv.world"
+        MODEL         = "tokenizer.ggml.model"
+        LIST          = "tokenizer.ggml.tokens"
+        TOKEN_TYPE    = "tokenizer.ggml.token_type"
+        SCORES        = "tokenizer.ggml.scores"
+        MERGES        = "tokenizer.ggml.merges"
+        BOS_ID        = "tokenizer.ggml.bos_token_id"
+        EOS_ID        = "tokenizer.ggml.eos_token_id"
+        UNK_ID        = "tokenizer.ggml.unknown_token_id"
+        SEP_ID        = "tokenizer.ggml.seperator_token_id"
+        PAD_ID        = "tokenizer.ggml.padding_token_id"
+        ADD_BOS       = "tokenizer.ggml.add_bos_token"
+        ADD_EOS       = "tokenizer.ggml.add_eos_token"
+        HF_JSON       = "tokenizer.huggingface.json"
+        RWKV          = "tokenizer.rwkv.world"
+        CHAT_TEMPLATE = "tokenizer.chat_template"
 
 
 #
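For reference, the new constant resolves to the plain GGUF metadata key string, so Python callers can refer to Keys.Tokenizer.CHAT_TEMPLATE instead of hard-coding it. A minimal sketch (not part of this commit):

    from gguf.constants import Keys

    # The constant added above is just the raw GGUF metadata key.
    print(Keys.Tokenizer.CHAT_TEMPLATE)  # -> tokenizer.chat_template
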
index c3b8c588f17cdb10e3be2aafcc85af6bdbcd87fb..ab7382c44f44e651a9cd0ae3a98b1b02ab578ae0 100644
--- a/gguf-py/gguf/gguf_writer.py
+++ b/gguf-py/gguf/gguf_writer.py
@@ -399,6 +399,9 @@ class GGUFWriter:
     def add_add_eos_token(self, value: bool) -> None:
         self.add_bool(Keys.Tokenizer.ADD_EOS, value)
 
+    def add_chat_template(self, value: str) -> None:
+        self.add_string(Keys.Tokenizer.CHAT_TEMPLATE, value)
+
     def _pack(self, fmt: str, value: Any, skip_pack_prefix: bool = False) -> bytes:
         pack_prefix = ''
         if not skip_pack_prefix:
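The new setter stores the template as an ordinary string KV pair. Exercising it end to end, in the style of gguf-py's writer example, might look like this sketch (the output path and Jinja template are hypothetical placeholders, not from this commit):

    from gguf import GGUFWriter

    writer = GGUFWriter("example.gguf", "llama")
    # Hypothetical Jinja template, for illustration only.
    writer.add_chat_template(
        "{% for m in messages %}{{ m['role'] }}: {{ m['content'] }}\n{% endfor %}"
    )
    writer.write_header_to_file()
    writer.write_kv_data_to_file()
    writer.write_tensors_to_file()
    writer.close()
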
index b9f50a0afed7a0ccbe0f8ed239c5b9fee4eb008d..de3e5edb557d7b483ccb76da975a2c71e30700b9 100644
--- a/gguf-py/gguf/vocab.py
+++ b/gguf-py/gguf/vocab.py
@@ -13,6 +13,7 @@ class SpecialVocab:
     merges: list[str]
     add_special_token: dict[str, bool]
     special_token_ids: dict[str, int]
+    chat_template: str | None
 
     def __init__(
         self, path: str | os.PathLike[str], load_merges: bool = False,
@@ -24,6 +25,7 @@ class SpecialVocab:
         self.n_vocab = n_vocab
         self.load_merges = load_merges
         self.merges = []
+        self.chat_template = None
         if special_token_types is not None:
             self.special_token_types = special_token_types
         else:
@@ -67,6 +69,10 @@ class SpecialVocab:
             if not quiet:
                 print(f'gguf: Setting add_{typ}_token to {value}')
             add_handler(value)
+        if self.chat_template is not None:
+            if not quiet:
+                print(f'gguf: Setting chat_template to {self.chat_template}')
+            gw.add_chat_template(self.chat_template)
 
     def _load(self, path: Path) -> None:
         self._try_load_from_tokenizer_json(path)
@@ -132,6 +138,14 @@ class SpecialVocab:
             return True
         with open(tokenizer_config_file, encoding = 'utf-8') as f:
             tokenizer_config = json.load(f)
+        chat_template = tokenizer_config.get('chat_template')
+        if chat_template is None or isinstance(chat_template, str):
+            self.chat_template = chat_template
+        else:
+            print(
+                f'gguf: WARNING: Bad type for chat_template field in {tokenizer_config_file!r} - ignoring',
+                file = sys.stderr
+            )
         for typ in self.special_token_types:
             add_entry = tokenizer_config.get(f'add_{typ}_token')
             if isinstance(add_entry, bool):
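Taken together, the vocab changes mean converters pick the template up automatically: SpecialVocab reads chat_template from the model's tokenizer_config.json, warns and ignores it when it is not a string, and forwards it through add_chat_template() during add_to_gguf(). A sketch with a hypothetical model directory:

    from gguf import GGUFWriter
    from gguf.vocab import SpecialVocab

    writer = GGUFWriter("example.gguf", "llama")
    # "path/to/hf-model" is a placeholder for a directory containing
    # tokenizer_config.json with a string chat_template field.
    special_vocab = SpecialVocab("path/to/hf-model", load_merges=True)
    special_vocab.add_to_gguf(writer)  # emits tokenizer.chat_template
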
index 6e3f9e85549d0261e5e0756d0b2e3d299e988149..e6374bfe898a4b86a55e0a06c2e8768fdb94707d 100644
--- a/gguf-py/pyproject.toml
+++ b/gguf-py/pyproject.toml
@@ -1,6 +1,6 @@
 [tool.poetry]
 name = "gguf"
-version = "0.5.3"
+version = "0.6.0"
 description = "Read and write ML models in GGUF for GGML"
 authors = ["GGML <ggml@ggml.ai>"]
 packages = [
index 56d8e765cc11299c107b326b41412ab7d13c683c..062c9757b53981dbf11c8fd22ec26874d215a7ca 100644
--- a/llama.cpp
+++ b/llama.cpp
@@ -1871,6 +1871,7 @@ struct llama_model_loader {
                 if (value.size() > MAX_VALUE_LEN) {
                     value = format("%s...", value.substr(0, MAX_VALUE_LEN - 3).c_str());
                 }
+                replace_all(value, "\n", "\\n");
 
                 LLAMA_LOG_INFO("%s: - kv %3d: %42s %-16s = %s\n", __func__, i, name, type_name.c_str(), value.c_str());
             }
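The llama.cpp change only affects logging: a chat template usually spans several lines, which would break the aligned one-line-per-KV output, so newlines are escaped before printing. The effect of the replace_all call, illustrated here in Python rather than C++ (a sketch of the string transform, not the actual helper):

    # What the escaping does to a multi-line value before it is logged.
    value = "{% for m in messages %}\n{{ m['content'] }}\n{% endfor %}"
    print(value.replace("\n", "\\n"))
    # -> {% for m in messages %}\n{{ m['content'] }}\n{% endfor %}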