From fe00a84b4b972b3172b2c6b880954d81da532ca4 Mon Sep 17 00:00:00 2001 From: Aaron Teo Date: Wed, 18 Mar 2026 17:40:22 +0800 Subject: [PATCH] tests: enable kv_unified to prevent cuda oom error on rtx 2060 (#20645) Signed-off-by: Aaron Teo --- tests/test-backend-sampler.cpp | 1 + 1 file changed, 1 insertion(+) diff --git a/tests/test-backend-sampler.cpp b/tests/test-backend-sampler.cpp index d4cd62c71e..58361ae80a 100644 --- a/tests/test-backend-sampler.cpp +++ b/tests/test-backend-sampler.cpp @@ -89,6 +89,7 @@ struct test_context { cparams.n_batch = 512; cparams.samplers = configs.data(); cparams.n_samplers = configs.size(); + cparams.kv_unified = true; // If n_seq_max is not specified, calculate it from configs if (n_seq_max < 0) {