cont : fix reserve
This commit is contained in:
parent 8a36119407
commit 614fe5b4e4
@@ -383,6 +383,8 @@ llama_context::~llama_context() {

void llama_context::reserve() {
    LLAMA_LOG_INFO("%s: reserving ...\n", __func__);

    synchronize();

    const uint32_t n_seqs = cparams.n_seq_max;
    const uint32_t n_tokens = std::min(cparams.n_ctx, cparams.n_ubatch);
@@ -529,6 +531,10 @@ void llama_context::reserve() {
}

void llama_context::synchronize() {
    if (!sched) {
        return;
    }

    ggml_backend_sched_synchronize(sched.get());

    // FIXME: if multiple single tokens are evaluated without a synchronization,
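For reference, a minimal self-contained sketch of the pattern the two hunks apply: reserve() drains any in-flight backend work via synchronize() before recomputing reservation sizes, and synchronize() becomes a no-op when the scheduler has not been created yet. The Scheduler type, its wait() method, and the member names below are illustrative stand-ins, not the actual llama.cpp / ggml API.

    #include <algorithm>
    #include <cstdint>
    #include <cstdio>
    #include <memory>

    // Hypothetical stand-in for the backend scheduler; only illustrates the pattern.
    struct Scheduler {
        void wait() { /* block until previously queued backend work has finished */ }
    };

    struct Context {
        std::unique_ptr<Scheduler> sched;   // may still be null before initialization
        uint32_t n_ctx = 4096, n_ubatch = 512, n_seq_max = 1;

        void synchronize() {
            if (!sched) {
                return;                     // nothing to wait for yet
            }
            sched->wait();
        }

        void reserve() {
            std::printf("%s: reserving ...\n", __func__);
            synchronize();                  // drain pending work before re-reserving

            const uint32_t n_seqs   = n_seq_max;
            const uint32_t n_tokens = std::min(n_ctx, n_ubatch);
            // ... build worst-case graphs for (n_tokens, n_seqs) and reserve buffers ...
            (void) n_seqs; (void) n_tokens;
        }
    };

    int main() {
        Context ctx;
        ctx.reserve();                      // safe even though ctx.sched is still null
    }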