Fix a couple of oversights

This commit is contained in:
Aes Sedai 2026-01-28 22:24:26 -08:00
parent 042c3cb8c5
commit a4c9a08270
2 changed files with 2 additions and 2 deletions

View File

@@ -10623,7 +10623,7 @@ class MistralMoeModel(DeepseekV2Model):
self.gguf_writer.add_rope_scaling_yarn_log_mul(0.1) # mscale_all_dim * 0.1
def modify_tensors(self, data_torch: Tensor, name: str, bid: int | None):
-if name.startswith("vision_") or name.startswith("patch_merger."):
+if name.startswith("vision_") or name.startswith("patch_merger.") or "mm_projector" in name:
return
# rename certain tensors so that we can reuse DeepseekV2Model modify_tensors logic

View File

@@ -1255,7 +1255,7 @@ class TensorNameMap:
MODEL_TENSOR.V_MMPROJ: (
"multi_modal_projector.linear_{bid}",
-"mm_projector.proj.linear_{bid}",
+"mm_projector.proj.linear_{bid}", # Kimi-K2.5
"visual.merger.mlp.{bid}", # qwen2vl
"merger.mlp.{bid}",
),