Browse Source

MODEL_TENSOR.SSM_DT_NORM was defined twice (#14991)

* MODEL_TENSOR.SSM_DT_NORM was defined twice, and the second definition overwrote the jamba model's layer name

* correct order
Csaba Kecskemeti 5 months ago
parent
commit
36e5fe7bcd
1 changed file with 1 addition and 4 deletions
  1. 1 4
      gguf-py/gguf/tensor_mapping.py

+ 1 - 4
gguf-py/gguf/tensor_mapping.py

@@ -616,6 +616,7 @@ class TensorNameMap:
         ),
         ),
 
 
         MODEL_TENSOR.SSM_DT_NORM: (
         MODEL_TENSOR.SSM_DT_NORM: (
+            "model.layers.layers.{bid}.mixer.dt_norm.weight",  # plamo2
             "model.layers.{bid}.mamba.dt_layernorm",  # jamba
             "model.layers.{bid}.mamba.dt_layernorm",  # jamba
         ),
         ),
 
 
@@ -645,10 +646,6 @@ class TensorNameMap:
             "model.layers.layers.{bid}.mixer.D",  # plamo2
             "model.layers.layers.{bid}.mixer.D",  # plamo2
         ),
         ),
 
 
-        MODEL_TENSOR.SSM_DT_NORM: (
-            "model.layers.layers.{bid}.mixer.dt_norm.weight",  # plamo2
-        ),
-
         MODEL_TENSOR.SSM_NORM: (
         MODEL_TENSOR.SSM_NORM: (
             "model.layers.{bid}.mamba.norm", # falcon-h1 granite-hybrid
             "model.layers.{bid}.mamba.norm", # falcon-h1 granite-hybrid
             "backbone.layers.{bid}.mixer.norm",  # mamba2
             "backbone.layers.{bid}.mixer.norm",  # mamba2