add back ggml_cont for Vcur

2026-02-03 18:42:17 +08:00 · 2026-02-03 18:42:17 +08:00 · 000fded1ea
parent efaea45cb3
commit 000fded1ea
1 changed file with 1 addition and 0 deletions
--- a/src/models/kimi-linear.cpp
+++ b/src/models/kimi-linear.cpp
@@ -291,6 +291,7 @@ llm_build_kimi_linear::llm_build_kimi_linear(const llama_model & model, const ll
                    ggml_row_size(kv->type, kv_per_head),
                    ggml_row_size(kv->type, kv_per_head * n_head),
                    ggml_row_size(kv->type, n_embd_head_qk_nope));
+                Vcur = ggml_cont(ctx0, Vcur);
                cb(Vcur, "mla_V", il);

                // Concatenate k_nope + k_pe (broadcast k_pe to all heads)