git.djapps.eu Git - pkg/ggml/sources/llama.cpp/commitdiff
gguf-py : add add_classifier_output_labels method to writer (#14031)
author Sigbjørn Skjæret <redacted>
Thu, 5 Jun 2025 15:42:31 +0000 (17:42 +0200)
committer GitHub <redacted>
Thu, 5 Jun 2025 15:42:31 +0000 (17:42 +0200)
* add add_classifier_output_labels

* use add_classifier_output_labels

convert_hf_to_gguf.py
gguf-py/gguf/gguf_writer.py

index ec3b5697d8f6f67cf5a8c9aef67a2760c9c46ee3..7b9893c8a3e10e0b99cfe175eff45425001cd402 100755 (executable)
@@ -3709,8 +3709,7 @@ class BertModel(TextModel):
         self._try_set_pooling_type()
 
         if self.cls_out_labels:
-            key_name = gguf.Keys.Classifier.OUTPUT_LABELS.format(arch = gguf.MODEL_ARCH_NAMES[self.model_arch])
-            self.gguf_writer.add_array(key_name, [v for k, v in sorted(self.cls_out_labels.items())])
+            self.gguf_writer.add_classifier_output_labels([v for k, v in sorted(self.cls_out_labels.items())])
 
     def set_vocab(self):
         tokens, toktypes, tokpre = self.get_vocab_base()
index de6e45ae827b953a06a01781d14f41db77db2a6a..adc673e38ff072dd700bb58d228dd03d6e27ef9f 100644 (file)
@@ -935,6 +935,9 @@ class GGUFWriter:
     def add_eom_token_id(self, id: int) -> None:
         self.add_uint32(Keys.Tokenizer.EOM_ID, id)
 
+    def add_classifier_output_labels(self, labels: Sequence[str]) -> None:
+        self.add_array(Keys.Classifier.OUTPUT_LABELS.format(arch=self.arch), labels)
+
     # for vision models
 
     def add_clip_has_vision_encoder(self, value: bool) -> None: