diff --git a/tools/server/server-context.cpp b/tools/server/server-context.cpp index a79ad3c059..8dab846960 100644 --- a/tools/server/server-context.cpp +++ b/tools/server/server-context.cpp @@ -1154,7 +1154,7 @@ private: // initialize draft batch // TODO: rework speculative decoding [TAG_SERVER_SPEC_REWORK] - if (can_speculate()) { + if (slot.can_speculate()) { llama_batch_free(slot.batch_spec); slot.batch_spec = llama_batch_init(task.params.speculative.n_max + 1, 0, 1);