convert: quick fix
This commit is contained in:
parent
616f009e28
commit
e5d426be98
|
|
@ -7256,13 +7256,11 @@ class DeepseekV2Model(TextModel):
|
||||||
|
|
||||||
if is_ocr:
|
if is_ocr:
|
||||||
self.hparams['rope_theta'] = self.hparams.get('rope_theta', 10000.0)
|
self.hparams['rope_theta'] = self.hparams.get('rope_theta', 10000.0)
|
||||||
self.hparams['rms_norm_eps'] = self.hparams.get('rms_norm_eps', 1e-6)
|
|
||||||
else:
|
else:
|
||||||
# note: deepseek2 using MLA converts into MQA (ie: GQA with 1 group)
|
# note: deepseek2 using MLA converts into MQA (ie: GQA with 1 group)
|
||||||
self.hparams["num_key_value_heads"] = 1
|
self.hparams["num_key_value_heads"] = 1
|
||||||
|
|
||||||
if (rope_mscale_all := self.rope_parameters.get("mscale_all_dim")) is not None:
|
self.hparams['rms_norm_eps'] = self.hparams.get('rms_norm_eps', 1e-6)
|
||||||
self.hparams["rms_norm_eps"] = self.hparams.get("rms_norm_eps", 1e-6)
|
|
||||||
|
|
||||||
super().set_gguf_parameters()
|
super().set_gguf_parameters()
|
||||||
hparams = self.hparams
|
hparams = self.hparams
|
||||||
|
|
|
||||||
Loading…
Reference in New Issue