git.djapps.eu Git - pkg/ggml/sources/whisper.cpp/commitdiff
convert : update convert-h5-to-ggml.py (#2840)
author: Anders Bjarby <redacted>
Mon, 17 Mar 2025 07:41:05 +0000 (08:41 +0100)
committer: GitHub <redacted>
Mon, 17 Mar 2025 07:41:05 +0000 (09:41 +0200)
improved handling of missing max_length

models/convert-h5-to-ggml.py

index 5474d58613ac343b40662a4e947f5560ea6cbf07..4d50af46428ef8d2fcb14455172111c0bbab4cd2 100644 (file)
@@ -85,9 +85,15 @@ encoder_added = json.load((dir_model / "added_tokens.json").open( "r", encoding=
 hparams = json.load((dir_model / "config.json").open("r", encoding="utf8"))
 
 # Add this block to handle missing 'max_length'
-if "max_length" not in hparams:
-    hparams["max_length"] = hparams.get("max_target_positions", 448)
-
+if "max_length" not in hparams or hparams["max_length"] is None:
+    hparams["max_length"] = hparams.get("max_target_positions", 448)  # Default to 448 if missing
+elif not isinstance(hparams["max_length"], int):
+    try:
+        hparams["max_length"] = int(hparams["max_length"])  # Convert if necessary
+    except ValueError:
+        print(f"Warning: Invalid max_length value '{hparams['max_length']}', using default 448.")
+        hparams["max_length"] = 448
+        
 model = WhisperForConditionalGeneration.from_pretrained(dir_model)
 
 #code.interact(local=locals())