git.djapps.eu Git - pkg/ggml/sources/llama.cpp/commitdiff
convert : fix rwkv bos/eos token (#13844)
author: Sigbjørn Skjæret <redacted>
Fri, 30 May 2025 12:50:43 +0000 (14:50 +0200)
committer: GitHub <redacted>
Fri, 30 May 2025 12:50:43 +0000 (14:50 +0200)
convert_hf_to_gguf.py

index 54738b862e1fb6fff2569b550a0d39d41263d13e..ab0f0e0ea087e8776750ea1e6eeb282c6340a691 100755 (executable)
@@ -1047,6 +1047,10 @@ class TextModel(ModelBase):
         special_vocab.chat_template = "rwkv-world"
         # hack: Add '\n\n' as the EOT token to make it chat normally
         special_vocab._set_special_token("eot", 261)
+        # hack: Override these as they have already been set (incorrectly)
+        special_vocab.special_token_ids["bos"] = 0
+        special_vocab.special_token_ids["eos"] = 0
+
         special_vocab.add_to_gguf(self.gguf_writer)
 
     def _set_vocab_builtin(self, model_name: Literal["gpt-neox", "llama-spm"], vocab_size: int):