git.djapps.eu Git - pkg/ggml/sources/llama.cpp/commitdiff
py : also print the normalizers
author: Georgi Gerganov <redacted>
Wed, 8 May 2024 09:47:07 +0000 (12:47 +0300)
committer: Georgi Gerganov <redacted>
Wed, 8 May 2024 09:47:07 +0000 (12:47 +0300)
convert-hf-to-gguf-update.py

index ae901e24c9a175e16dc207eb92026c3f4091450d..a3fe67ee7de9c018169359582d7eb66abcbb6874 100755 (executable)
@@ -151,6 +151,8 @@ for model in models:
     # print the "pre_tokenizer" content from the tokenizer.json
     with open(f"models/tokenizers/{name}/tokenizer.json", "r", encoding="utf-8") as f:
         cfg = json.load(f)
+        normalizer = cfg["normalizer"]
+        logger.info("normalizer: " + json.dumps(normalizer, indent=4))
         pre_tokenizer = cfg["pre_tokenizer"]
         logger.info("pre_tokenizer: " + json.dumps(pre_tokenizer, indent=4))