We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent a70c8a0 commit 0c2ee38 (Copy full SHA for 0c2ee38)
gguf-py/gguf/gguf_writer.py
@@ -714,8 +714,8 @@ def add_max_alibi_bias(self, bias: float) -> None:
714
def add_clamp_kqv(self, value: float) -> None:
715
self.add_float32(Keys.Attention.CLAMP_KQV.format(arch=self.arch), value)
716
717
- def add_shared_kv_layers(self, value: float) -> None:
718
- self.add_float32(Keys.Attention.SHARED_KV_LAYERS.format(arch=self.arch), value)
+ def add_shared_kv_layers(self, value: int) -> None:
+ self.add_uint32(Keys.Attention.SHARED_KV_LAYERS.format(arch=self.arch), value)
719
720
def add_sliding_window_pattern(self, value: Sequence[bool]) -> None:
721
self.add_array(Keys.Attention.SLIDING_WINDOW_PATTERN.format(arch=self.arch), value)
0 commit comments