From cdb09db91e791eaef597c2fd1777d4615a6085f7 Mon Sep 17 00:00:00 2001 From: Jeff Bolz Date: Sun, 14 Dec 2025 11:15:49 -0600 Subject: [PATCH] vulkan: use 4 rows for scalar FA large tile size --- ggml/src/ggml-vulkan/ggml-vulkan.cpp | 5 ++--- 1 file changed, 2 insertions(+), 3 deletions(-) diff --git a/ggml/src/ggml-vulkan/ggml-vulkan.cpp b/ggml/src/ggml-vulkan/ggml-vulkan.cpp index 34ec09d403..d8f5e22ddc 100644 --- a/ggml/src/ggml-vulkan/ggml-vulkan.cpp +++ b/ggml/src/ggml-vulkan/ggml-vulkan.cpp @@ -2535,12 +2535,11 @@ static constexpr uint32_t flash_attention_num_small_rows = 32; static constexpr uint32_t scalar_flash_attention_num_small_rows = 1; static uint32_t get_fa_scalar_num_large_rows(uint32_t hsk, uint32_t hsv) { + GGML_UNUSED(hsk); if (hsv >= 192) { return 2; - } else if ((hsv | hsk) & 8) { - return 4; } else { - return 8; + return 4; } }