Set rope_theta

This commit is contained in:
Tarek Dakhran 2025-12-15 14:43:03 +01:00
parent 145b6280d6
commit 4f5d5212b8
No known key found for this signature in database
GPG Key ID: AA0AF9C3E1721799
1 changed file with 1 addition and 0 deletions

View File

@@ -9567,6 +9567,7 @@ class LFM2Model(TextModel):
self.gguf_writer.add_vocab_size(self.hparams["vocab_size"]) self.gguf_writer.add_vocab_size(self.hparams["vocab_size"])
self.gguf_writer.add_shortconv_l_cache(self.hparams["conv_L_cache"]) self.gguf_writer.add_shortconv_l_cache(self.hparams["conv_L_cache"])
self.gguf_writer.add_layer_norm_rms_eps(self.hparams["norm_eps"]) self.gguf_writer.add_layer_norm_rms_eps(self.hparams["norm_eps"])
self.gguf_writer.add_rope_freq_base(self.hparams.get("rope_theta", 1000000))
self._add_feed_forward_length() self._add_feed_forward_length()
def modify_tensors(self, data_torch: Tensor, name: str, bid: int | None) -> Iterable[tuple[str, Tensor]]: def modify_tensors(self, data_torch: Tensor, name: str, bid: int | None) -> Iterable[tuple[str, Tensor]]: