From: Piotr Wilkin (ilintar)
Date: Wed, 21 Jan 2026 11:35:20 +0000 (+0100)
Subject: Fix GLM 4.7 Lite MoE gating func (#18980)
X-Git-Tag: upstream/0.0.8067~279
X-Git-Url: https://git.djapps.eu/?a=commitdiff_plain;h=12a4a47e6aaf691492644c39da453745aaee1672;p=pkg%2Fggml%2Fsources%2Fllama.cpp

Fix GLM 4.7 Lite MoE gating func (#18980)

* Fix GLM 4.7 MoE gating func

* Update src/models/deepseek2.cpp

Co-authored-by: Sigbjørn Skjæret

* Update src/llama-model.cpp

Co-authored-by: Xuan-Son Nguyen

---------

Co-authored-by: Sigbjørn Skjæret
Co-authored-by: Xuan-Son Nguyen
---

diff --git a/src/llama-model.cpp b/src/llama-model.cpp
index 94c47dc24..255289b7c 100644
--- a/src/llama-model.cpp
+++ b/src/llama-model.cpp
@@ -1713,7 +1713,12 @@ void llama_model::load_hparams(llama_model_loader & ml) {
                 if (hparams.expert_gating_func == LLAMA_EXPERT_GATING_FUNC_TYPE_NONE) {
                     // for compatibility with existing DeepSeek V2 and V2.5 GGUFs
                     // that have no expert_gating_func model parameter set
-                    hparams.expert_gating_func = LLAMA_EXPERT_GATING_FUNC_TYPE_SOFTMAX;
+                    if ((hparams.n_layer == 47 || hparams.n_layer == 48) && n_vocab == 154880) {
+                        // GLM 4.7 Lite
+                        hparams.expert_gating_func = LLAMA_EXPERT_GATING_FUNC_TYPE_SIGMOID;
+                    } else {
+                        hparams.expert_gating_func = LLAMA_EXPERT_GATING_FUNC_TYPE_SOFTMAX;
+                    }
                 }
 
                 if (ml.get_key(LLM_KV_ROPE_SCALING_YARN_LOG_MUL, hparams.rope_yarn_log_mul, 0.0f)) {