From: Nico Bosshard Date: Mon, 12 Aug 2024 15:13:59 +0000 (+0200) Subject: llama : model-based max number of graph nodes calculation (#8970) X-Git-Tag: upstream/0.0.4488~910 X-Git-Url: https://git.djapps.eu/?a=commitdiff_plain;h=0fd93cdef5e583aa980b3c0d693c0d207f0787a7;p=pkg%2Fggml%2Fsources%2Fllama.cpp llama : model-based max number of graph nodes calculation (#8970) * llama : model-based max number of graph nodes calculation * Update src/llama.cpp --------- Co-authored-by: slaren --- diff --git a/src/llama.cpp b/src/llama.cpp index aaf8db49..7f2f0003 100644 --- a/src/llama.cpp +++ b/src/llama.cpp @@ -3575,13 +3575,8 @@ namespace GGUFMeta { using llama_buf_map = std::unordered_map<uint32_t, ggml_backend_buffer_t>; -// TODO: update when needed or think of some clever automatic way to do this -static size_t llama_model_max_nodes(const llama_model & /*model*/) { - //if (model.arch == LLM_ARCH_LLAMA && model.hparams.n_layer > ??) { // llama-3 405B - // return 32768; - //} - - return 8192; +static size_t llama_model_max_nodes(const llama_model & model) { + return std::max<size_t>(8192, model.tensors_by_name.size()*5); } struct llama_model_loader {