cont : fix reserve

This commit is contained in:
Georgi Gerganov 2026-01-02 19:26:15 +02:00
parent bd5de6bab9
commit 4aa4588042
No known key found for this signature in database
GPG Key ID: 449E073F9DC10735
1 changed files with 6 additions and 0 deletions

View File

@ -351,6 +351,8 @@ llama_context::~llama_context() {
void llama_context::reserve() {
LLAMA_LOG_INFO("%s: reserving ...\n", __func__);
synchronize();
const uint32_t n_seqs = cparams.n_seq_max;
const uint32_t n_tokens = std::min(cparams.n_ctx, cparams.n_ubatch);
@ -497,6 +499,10 @@ void llama_context::reserve() {
}
void llama_context::synchronize() {
if (!sched) {
return;
}
ggml_backend_sched_synchronize(sched.get());
// FIXME: if multiple single tokens are evaluated without a synchronization,