From: Georgi Gerganov
Date: Wed, 30 Aug 2023 10:29:40 +0000 (+0300)
Subject: convert.py : use dir name to name the llama
X-Git-Tag: gguf-v0.4.0~178
X-Git-Url: https://git.djapps.eu/?a=commitdiff_plain;h=b532a69b2fd08067f34f32f37a2fd9b37678a34a;p=pkg%2Fggml%2Fsources%2Fllama.cpp

convert.py : use dir name to name the llama
---

diff --git a/convert.py b/convert.py
index 448b6f0f..a7f4c2d7 100755
--- a/convert.py
+++ b/convert.py
@@ -811,10 +811,12 @@ class OutputFile:
 
     def add_meta_arch(self, params: Params) -> None:
         name = "LLaMA"
+
+        # TODO: better logic to determine model name
         if (params.n_ctx == 4096):
             name = "LLaMA v2"
-        if params.path_model:
-            name = str(params.path_model.parent).split('/')[-1]
+        elif params.path_model:
+            name = str(params.path_model.parent).split('/')[-1]
 
         self.gguf.add_name (name)
         self.gguf.add_context_length (params.n_ctx)
@@ -839,8 +841,7 @@ class OutputFile:
         tokens = []
         scores = []
         toktypes = []
-        # NOTE: `all_tokens` returns the the base vocabulary and added tokens
-        # TODO: add special tokens?
+        # NOTE: `all_tokens` returns the base vocabulary and added tokens
         for text, score, toktype in vocab.all_tokens():
             tokens.append(text)
             scores.append(score)