Fix result mismatch in MUL_MAT when the subgroup size is 16
The following test case was failing: MUL_MAT(type_a=q4_0,type_b=f32,m=1,n=2048,k=8192,bs=[1,1],nr=[1,1],per=[0,1,2,3],k_v=0,o=1)
This commit is contained in:
parent
2460f5463f
commit
7e05215f9a
|
|
@@ -3061,7 +3061,7 @@ static void ggml_vk_load_shaders(vk_device& device) {
|
|||
const uint32_t tk_m = device->coopmat_support ? device->coopmat_k : 1;
|
||||
const uint32_t tk_s = device->coopmat_support ? device->coopmat_k : 1;
|
||||
|
||||
- const uint32_t s_warptile_wm = default_subgroup_size == 8 ? 8 : 32;
|
||||
+ const uint32_t s_warptile_wm = default_subgroup_size < 32 ? default_subgroup_size : 32;
|
||||
|
||||
l_warptile = { 128, 128, 128, 16, subgroup_size_8 * 2, 64, 2, tm_l, tn_l, tk_l, subgroup_size_8 };
|
||||
m_warptile = { 128, 64, 64, 16, subgroup_size_8, 32, 2, tm_m, tn_m, tk_m, subgroup_size_8 };
|
||||
|
|
|
|||
Loading…
Reference in New Issue