llama : print correct model type for Llama 3.2 1B and 3B

author Georgi Gerganov <redacted>

Tue, 1 Oct 2024 08:42:01 +0000 (11:42 +0300)

committer Georgi Gerganov <redacted>

Tue, 1 Oct 2024 08:42:01 +0000 (11:42 +0300)
author Georgi Gerganov <redacted>
Tue, 1 Oct 2024 08:42:01 +0000 (11:42 +0300)
committer Georgi Gerganov <redacted>
Tue, 1 Oct 2024 08:42:01 +0000 (11:42 +0300)
diff --git a/src/llama.cpp b/src/llama.cpp

index c466cd88b7c1428da7ad0df6e819209634b338f7..d1d27d21e232fe23b3b1766c4a10afa9d5618c1a 100644 (file)
--- a/src/llama.cpp
+++ b/src/llama.cpp
@@ -5502,8 +5502,10 @@ static void llm_load_hparams(
                      }
                  } else {
                      switch (hparams.n_layer) {
+                        case 16: model.type = e_model::MODEL_1B; break; // Llama 3.2 1B
                          case 22: model.type = e_model::MODEL_1B; break;
                          case 26: model.type = e_model::MODEL_3B; break;
+                        case 28: model.type = e_model::MODEL_3B; break; // Llama 3.2 3B
                          // granite uses a vocab with len 49152
                          case 32: model.type = hparams.n_vocab == 49152 ? e_model::MODEL_3B : (hparams.n_vocab < 40000 ? e_model::MODEL_7B : e_model::MODEL_8B); break;
                          case 36: model.type = e_model::MODEL_8B; break; // granite
author	Georgi Gerganov <redacted>
	Tue, 1 Oct 2024 08:42:01 +0000 (11:42 +0300)
committer	Georgi Gerganov <redacted>
	Tue, 1 Oct 2024 08:42:01 +0000 (11:42 +0300)