diff --git a/ggml/src/ggml-cuda/mma.cuh b/ggml/src/ggml-cuda/mma.cuh index c189ac5682..dd45d6c78f 100644 --- a/ggml/src/ggml-cuda/mma.cuh +++ b/ggml/src/ggml-cuda/mma.cuh @@ -993,17 +993,10 @@ namespace ggml_cuda_mma { using floatx4_t = __attribute__((ext_vector_type(4))) float; floatx4_t& acc_frag = reinterpret_cast(D.x[0]); #if defined(CDNA3) -#if 0 using floatx2_t = __attribute__((ext_vector_type(2))) float; const floatx2_t& a_frag = reinterpret_cast(A.x[0]); const floatx2_t& b_frag = reinterpret_cast(B.x[0]); acc_frag = __builtin_amdgcn_mfma_f32_16x16x8_xf32(a_frag, b_frag, acc_frag, 0, 0, 0); -#else -#pragma unroll - for (int i = 0; i < 2; ++i) { - acc_frag = __builtin_amdgcn_mfma_f32_16x16x4f32(A.x[i], B.x[i], acc_frag, 0, 0, 0); - } -#endif #elif defined(CDNA2) || defined(CDNA1) #pragma unroll for (int i = 0; i < 2; ++i) {