From: Georgi Gerganov
Date: Tue, 1 Oct 2024 08:42:01 +0000 (+0300)
Subject: llama : print correct model type for Llama 3.2 1B and 3B
X-Git-Tag: upstream/0.0.4488~632
X-Git-Url: https://git.djapps.eu/?a=commitdiff_plain;h=a90484c6d9db699bf739d0f33daf1c50cbdd45c9;p=pkg%2Fggml%2Fsources%2Fllama.cpp

llama : print correct model type for Llama 3.2 1B and 3B
---

diff --git a/src/llama.cpp b/src/llama.cpp
index c466cd88..d1d27d21 100644
--- a/src/llama.cpp
+++ b/src/llama.cpp
@@ -5502,8 +5502,10 @@ static void llm_load_hparams(
                     }
                 } else {
                     switch (hparams.n_layer) {
+                        case 16: model.type = e_model::MODEL_1B; break; // Llama 3.2 1B
                         case 22: model.type = e_model::MODEL_1B; break;
                         case 26: model.type = e_model::MODEL_3B; break;
+                        case 28: model.type = e_model::MODEL_3B; break; // Llama 3.2 3B
                         // granite uses a vocab with len 49152
                         case 32: model.type = hparams.n_vocab == 49152 ? e_model::MODEL_3B : (hparams.n_vocab < 40000 ? e_model::MODEL_7B : e_model::MODEL_8B); break;
                         case 36: model.type = e_model::MODEL_8B; break; // granite