diff --git a/convert_hf_to_gguf.py b/convert_hf_to_gguf.py index 3590a27eba..4061d946b0 100755 --- a/convert_hf_to_gguf.py +++ b/convert_hf_to_gguf.py @@ -7259,7 +7259,7 @@ class DeepseekV2Model(TextModel): else: # note: deepseek2 using MLA converts into MQA (ie: GQA with 1 group) self.hparams["num_key_value_heads"] = 1 - + self.hparams['rms_norm_eps'] = self.hparams.get('rms_norm_eps', 1e-6) super().set_gguf_parameters()