]> git.djapps.eu Git - pkg/ggml/sources/llama.cpp/commitdiff
MODEL_TENSOR.SSM_DT_NORM was defined twice (#14991)
author: Csaba Kecskemeti <redacted>
Thu, 31 Jul 2025 14:59:49 +0000 (07:59 -0700)
committer: GitHub <redacted>
Thu, 31 Jul 2025 14:59:49 +0000 (10:59 -0400)
* MODEL_TENSOR.SSM_DT_NORM was defined twice, and the second definition overwrote the jamba model's layer name

* correct order

gguf-py/gguf/tensor_mapping.py

index 15adbfa7818455a93e67a54a6a6faed472ea4ce2..df490fc80e9b7331b6bea8523dba3d5daffe3dd5 100644 (file)
@@ -616,6 +616,7 @@ class TensorNameMap:
         ),
 
         MODEL_TENSOR.SSM_DT_NORM: (
+            "model.layers.layers.{bid}.mixer.dt_norm.weight",  # plamo2
             "model.layers.{bid}.mamba.dt_layernorm",  # jamba
         ),
 
@@ -645,10 +646,6 @@ class TensorNameMap:
             "model.layers.layers.{bid}.mixer.D",  # plamo2
         ),
 
-        MODEL_TENSOR.SSM_DT_NORM: (
-            "model.layers.layers.{bid}.mixer.dt_norm.weight",  # plamo2
-        ),
-
         MODEL_TENSOR.SSM_NORM: (
             "model.layers.{bid}.mamba.norm", # falcon-h1 granite-hybrid
             "backbone.layers.{bid}.mixer.norm",  # mamba2