Merge 2aef9767d9 into 2634ed207a

2026-02-01 12:33:06 +02:00 · 2026-02-01 12:33:06 +02:00 · fd86c1ac68
parent 2634ed207a 2aef9767d9
commit fd86c1ac68
1 changed file with 5 additions and 3 deletions
--- a/src/llama-kv-cache-iswa.cpp
+++ b/src/llama-kv-cache-iswa.cpp
@@ -107,12 +107,14 @@ void llama_kv_cache_iswa::seq_div(llama_seq_id seq_id, llama_pos p0, llama_pos p
 }

 llama_pos llama_kv_cache_iswa::seq_pos_min(llama_seq_id seq_id) const {
-    // the base cache is a superset of the SWA cache, so we can just check the SWA cache
-    return kv_swa->seq_pos_min(seq_id);
+    // base cache preserves all positions (no SWA cell reuse), making it the ground truth for position tracking
+    // SWA cache can lose older positions when cells are reused for new tokens outside the SWA window
+    return kv_base->seq_pos_min(seq_id);
 }

 llama_pos llama_kv_cache_iswa::seq_pos_max(llama_seq_id seq_id) const {
-    return kv_swa->seq_pos_max(seq_id);
+    // base cache preserves all positions (no SWA cell reuse), making it the ground truth for position tracking
+    return kv_base->seq_pos_max(seq_id);
 }

 std::map<ggml_backend_buffer_type_t, size_t> llama_kv_cache_iswa::memory_breakdown() const {