diff --git a/ggml/src/ggml-vulkan/vulkan-shaders/mul_mat_vec_iq2_xs.comp b/ggml/src/ggml-vulkan/vulkan-shaders/mul_mat_vec_iq2_xs.comp index 5fbec7d6b9..7ec2e04f58 100644 --- a/ggml/src/ggml-vulkan/vulkan-shaders/mul_mat_vec_iq2_xs.comp +++ b/ggml/src/ggml-vulkan/vulkan-shaders/mul_mat_vec_iq2_xs.comp @@ -34,15 +34,15 @@ void calc_superblock(const uint a_offset, const uint b_offset, const uint itid, const uvec2 grid_data = iq2xs_grid[qs & 511]; grid0_vals[l] = vec4(unpack8(grid_data.x)); grid1_vals[l] = vec4(unpack8(grid_data.y)); - } + } // Preload B data for all j columns (reduce repeated index calculations) [[unroll]] for (uint j = 0; j < NUM_COLS; ++j) { - FLOAT_TYPE sum = FLOAT_TYPE(0.0); + FLOAT_TYPE sum = FLOAT_TYPE(0.0); [[unroll]] for (uint l = 0; l < 2; ++l) { const uint sign = sign_vals[l]; const uint sign7 = sign7_vals[l]; const vec4 grid0 = grid0_vals[l]; - const vec4 grid1 = grid1_vals[l]; + const vec4 grid1 = grid1_vals[l]; // Precompute indices const uint b_idx = (j * p.batch_stride_b + b_offset + y_idx) / 4 + 2 * l; const vec4 b0 = vec4(data_b_v4[b_idx + 0]);