git.djapps.eu Git - pkg/ggml/sources/llama.cpp/commitdiff
convert : correct gemma 3n conversion (#14450)
author: Xuan-Son Nguyen <redacted>
Thu, 3 Jul 2025 08:03:06 +0000 (10:03 +0200)
committer: GitHub <redacted>
Thu, 3 Jul 2025 08:03:06 +0000 (10:03 +0200)
* convert : correct gemma 3n conversion

* rm redundant code

gguf-py/gguf/gguf_writer.py

index 697e057c090dae9219f470f9687b80cdfcd30f0e..a7ecf3d31209f6113a581d02c24bb2c769848176 100644 (file)
@@ -714,8 +714,8 @@ class GGUFWriter:
     def add_clamp_kqv(self, value: float) -> None:
         self.add_float32(Keys.Attention.CLAMP_KQV.format(arch=self.arch), value)
 
-    def add_shared_kv_layers(self, value: float) -> None:
-        self.add_float32(Keys.Attention.SHARED_KV_LAYERS.format(arch=self.arch), value)
+    def add_shared_kv_layers(self, value: int) -> None:
+        self.add_uint32(Keys.Attention.SHARED_KV_LAYERS.format(arch=self.arch), value)
 
     def add_sliding_window_pattern(self, value: Sequence[bool]) -> None:
         self.add_array(Keys.Attention.SLIDING_WINDOW_PATTERN.format(arch=self.arch), value)