convert.py : fix llama/llama2 conversion due to vocab_size=-1 (#5019)
author    David Sommers <redacted>
Thu, 18 Jan 2024 17:20:59 +0000 (12:20 -0500)
committer GitHub <redacted>
Thu, 18 Jan 2024 17:20:59 +0000 (19:20 +0200)
PR #4818 (merged last week) reintroduced a config check for vocab_size that was addressed in PR #4258 (merged 2023-11-30).

Without the fix, llama2 models can't be converted. The error is:

`ValueError: The model's vocab size is set to -1 in params.json. Please update it manually. Maybe 32000?`

diff --git a/convert.py b/convert.py
index e38ee5315af30ec3b21f6e83b4c809e8e3f3908b..980e6fc720aa63486390e76d68564de01a1007e2 100755
--- a/convert.py
+++ b/convert.py
@@ -348,7 +348,7 @@ class Params:
             f_rope_freq_base = 1e6
 
         return Params(
-            n_vocab=config.get("vocab_size", model["tok_embeddings.weight"].shape[0]),
+            n_vocab=model["tok_embeddings.weight"].shape[0],
             n_embd=config["dim"],
             n_layer=config["n_layers"],
             n_ctx=n_ctx,
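
For reference, a minimal sketch (not part of the patch) of why reading the vocab size from the embedding tensor sidesteps the -1 placeholder: `tok_embeddings.weight` is stored as an (n_vocab, n_embd) matrix, so its first dimension is the real vocabulary size regardless of what `params.json` reports. The standalone helper and its name `infer_n_vocab` below are hypothetical; in convert.py this logic lives inside the `Params` loader shown in the hunk above.

```python
import json
import torch  # original llama/llama2 checkpoints are PyTorch .pth files


def infer_n_vocab(params_path: str, ckpt_path: str) -> int:
    """Hypothetical helper: derive n_vocab from the token embedding tensor
    instead of trusting params.json, which ships vocab_size = -1."""
    with open(params_path) as f:
        config = json.load(f)

    model = torch.load(ckpt_path, map_location="cpu")
    # tok_embeddings.weight has shape (n_vocab, n_embd), so its first
    # dimension is the true vocabulary size even when the config says -1.
    n_vocab = model["tok_embeddings.weight"].shape[0]

    # params.json either agrees or carries the -1 placeholder.
    assert config.get("vocab_size", -1) in (-1, n_vocab)
    return n_vocab
```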