cont : fix inverted flash_attn check for quantized V cache

2026-01-02 16:00:25 +02:00 · 2026-01-02 16:00:25 +02:00 · bd5de6bab9
parent d96d0417d1
commit bd5de6bab9
1 changed file with 1 addition and 1 deletion
--- a/src/llama-context.cpp
+++ b/src/llama-context.cpp
@@ -320,7 +320,7 @@ llama_context::llama_context(

        reserve();

-        if (cparams.flash_attn) {
+        if (!cparams.flash_attn) {
            if (ggml_is_quantized(params.type_v)) {
                throw std::runtime_error("quantized V cache was requested, but this requires Flash Attention");
            }