summary refs log tree commit diff
diff options
context:
space:
mode:
author Georgi Gerganov <ggerganov@gmail.com> 2024-05-08 12:47:07 +0300
committer Georgi Gerganov <ggerganov@gmail.com> 2024-05-08 12:47:07 +0300
commit 7e0b6a7b3ba94ff624dc27c1e0e735fded8819b8 (patch)
tree 71fde56f4719bf795918f2179f11919dc8e2d3c0
parent acdce3cdef6fc2f0b7b5623231fd7762c0884d1c (diff)
py : also print the normalizers
-rwxr-xr-x convert-hf-to-gguf-update.py 2
1 files changed, 2 insertions, 0 deletions
diff --git a/convert-hf-to-gguf-update.py b/convert-hf-to-gguf-update.py
index ae901e24..a3fe67ee 100755
--- a/convert-hf-to-gguf-update.py
+++ b/convert-hf-to-gguf-update.py
@@ -151,6 +151,8 @@ for model in models:
# print the "pre_tokenizer" content from the tokenizer.json
with open(f"models/tokenizers/{name}/tokenizer.json", "r", encoding="utf-8") as f:
cfg = json.load(f)
+ normalizer = cfg["normalizer"]
+ logger.info("normalizer: " + json.dumps(normalizer, indent=4))
pre_tokenizer = cfg["pre_tokenizer"]
logger.info("pre_tokenizer: " + json.dumps(pre_tokenizer, indent=4))