Просмотр исходного кода

convert : correct gemma 3n conversion (#14450)

* convert : correct gemma 3n conversion

* rm redundant code
Xuan-Son Nguyen 6 месяцев назад
Родитель
Коммит
0c2ee38ab7
1 изменённый файл: 2 добавлено и 2 удалено
  1. 2 2
      gguf-py/gguf/gguf_writer.py

+ 2 - 2
gguf-py/gguf/gguf_writer.py

@@ -714,8 +714,8 @@ class GGUFWriter:
     def add_clamp_kqv(self, value: float) -> None:
         self.add_float32(Keys.Attention.CLAMP_KQV.format(arch=self.arch), value)
 
-    def add_shared_kv_layers(self, value: float) -> None:
-        self.add_float32(Keys.Attention.SHARED_KV_LAYERS.format(arch=self.arch), value)
+    def add_shared_kv_layers(self, value: int) -> None:
+        self.add_uint32(Keys.Attention.SHARED_KV_LAYERS.format(arch=self.arch), value)
 
     def add_sliding_window_pattern(self, value: Sequence[bool]) -> None:
         self.add_array(Keys.Attention.SLIDING_WINDOW_PATTERN.format(arch=self.arch), value)