From 93c17446992894a51c0ca732ef88083cbb9727de Mon Sep 17 00:00:00 2001 From: Ryan Mangeno <160974989+ryan-mangeno@users.noreply.github.com> Date: Fri, 10 Oct 2025 12:03:21 -0400 Subject: [PATCH] Update src/llama-graph.cpp MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Co-authored-by: Sigbjørn Skjæret --- src/llama-graph.cpp | 1 + 1 file changed, 1 insertion(+) diff --git a/src/llama-graph.cpp b/src/llama-graph.cpp index 3e7b0f3674..90cd885a60 100644 --- a/src/llama-graph.cpp +++ b/src/llama-graph.cpp @@ -1598,6 +1598,7 @@ ggml_tensor * llm_graph_context::build_attn( // optionally store to KV cache if (k_cur) { const auto & k_idxs = is_swa ? inp->get_k_idxs_swa() : inp->get_k_idxs(); + ggml_build_forward_expand(gf, mctx_cur->cpy_k(ctx0, k_cur, k_idxs, il)); }