git.djapps.eu Git - pkg/ggml/sources/llama.cpp/commitdiff
convert : register Qwen 3.5 ForCausalLM for text only (#20119)
author Sigbjørn Skjæret <redacted>
Thu, 5 Mar 2026 09:30:02 +0000 (10:30 +0100)
committer GitHub <redacted>
Thu, 5 Mar 2026 09:30:02 +0000 (10:30 +0100)
convert_hf_to_gguf.py

index a6d259a640480b57c9e26ce4e99ff7dfdb1a7c49..083b5bca9e94b31b8b0b3caffea84f360fc65e7a 100755 (executable)
@@ -4842,12 +4842,12 @@ class _LinearAttentionVReorderBase(Qwen3NextModel):
         yield from super().modify_tensors(data_torch, name, bid)
 
 
-@ModelBase.register("Qwen3_5ForConditionalGeneration")
+@ModelBase.register("Qwen3_5ForConditionalGeneration", "Qwen3_5ForCausalLM")
 class Qwen3_5TextModel(_LinearAttentionVReorderBase):
     model_arch = gguf.MODEL_ARCH.QWEN35
 
 
-@ModelBase.register("Qwen3_5MoeForConditionalGeneration")
+@ModelBase.register("Qwen3_5MoeForConditionalGeneration", "Qwen3_5MoeForCausalLM")
 class Qwen3_5MoeTextModel(_LinearAttentionVReorderBase):
     model_arch = gguf.MODEL_ARCH.QWEN35MOE