Fixed mismatch in MUL_MAT when subgroup size is 16

This was failing on MUL_MAT(type_a=q4_0,type_b=f32,m=1,n=2048,k=8192,bs=[1,1],nr=[1,1],per=[0,1,2,3],k_v=0,o=1)
This commit is contained in:
Nakasaka, Masato 2026-01-19 19:18:45 -08:00
parent 2460f5463f
commit 7e05215f9a
1 changed file with 1 addition and 1 deletion

View File

@@ -3061,7 +3061,7 @@ static void ggml_vk_load_shaders(vk_device& device) {
const uint32_t tk_m = device->coopmat_support ? device->coopmat_k : 1;
const uint32_t tk_s = device->coopmat_support ? device->coopmat_k : 1;
-const uint32_t s_warptile_wm = default_subgroup_size == 8 ? 8 : 32;
+const uint32_t s_warptile_wm = default_subgroup_size < 32 ? default_subgroup_size : 32;
l_warptile = { 128, 128, 128, 16, subgroup_size_8 * 2, 64, 2, tm_l, tn_l, tk_l, subgroup_size_8 };
m_warptile = { 128, 64, 64, 16, subgroup_size_8, 32, 2, tm_m, tn_m, tk_m, subgroup_size_8 };