From: Galunid Date: Mon, 23 Oct 2023 15:47:03 +0000 (+0200) Subject: Fix baichuan convert script not detecting model (#3739) X-Git-Tag: upstream/0.0.4488~3072 X-Git-Url: https://git.djapps.eu/?a=commitdiff_plain;h=6336701c9378c23c85d1c0e464b663ca2bbb8e60;p=pkg%2Fggml%2Fsources%2Fllama.cpp Fix baichuan convert script not detecting model (#3739) It seems nobody objects. --- diff --git a/convert-baichuan-hf-to-gguf.py b/convert-baichuan-hf-to-gguf.py index 3b64ecb8..5ee99be7 100755 --- a/convert-baichuan-hf-to-gguf.py +++ b/convert-baichuan-hf-to-gguf.py @@ -110,7 +110,7 @@ print("gguf: loading model "+dir_model.name) with open(dir_model / "config.json", "r", encoding="utf-8") as f: hparams = json.load(f) print("hello print: ",hparams["architectures"][0]) -if hparams["architectures"][0] != "BaichuanForCausalLM": +if hparams["architectures"][0] != "BaichuanForCausalLM" and hparams["architectures"][0] != "BaiChuanForCausalLM": print("Model architecture not supported: " + hparams["architectures"][0]) sys.exit()