From: Zhang Peiyuan
Date: Wed, 27 Sep 2023 18:45:20 +0000 (+0800)
Subject: convert : remove bug in convert.py permute function (#3364)
X-Git-Tag: gguf-v0.4.0~27
X-Git-Url: https://git.djapps.eu/?a=commitdiff_plain;h=e519621010cac02c6fec0f8f3b16cda0591042c0;p=pkg%2Fggml%2Fsources%2Fllama.cpp

convert : remove bug in convert.py permute function (#3364)
---

diff --git a/convert.py b/convert.py
index 4ac5030d..8bb6c7e4 100755
--- a/convert.py
+++ b/convert.py
@@ -439,7 +439,7 @@ Vocab: TypeAlias = 'BpeVocab | SentencePieceVocab'
 def permute(weights: NDArray, n_head: int, n_head_kv: int) -> NDArray:
     #print( "permute debug " + str(weights.shape[0]) + " x " + str(weights.shape[1]) + " nhead " + str(n_head) + " nheadkv " + str(n_kv_head) )
     if n_head_kv is not None and n_head != n_head_kv:
-        n_head //= n_head_kv
+        n_head = n_head_kv
     return (weights.reshape(n_head, 2, weights.shape[0] // n_head // 2, *weights.shape[1:])
                    .swapaxes(1, 2)
                    .reshape(weights.shape))