From 45024ee85acd16a34e3b57ae71b5d8664c782535 Mon Sep 17 00:00:00 2001 From: zhang hui Date: Sat, 17 Jan 2026 20:47:51 +0800 Subject: [PATCH] clean float mma --- ggml/src/ggml-cuda/mma.cuh | 8 ++------ 1 file changed, 2 insertions(+), 6 deletions(-) diff --git a/ggml/src/ggml-cuda/mma.cuh b/ggml/src/ggml-cuda/mma.cuh index cd0d6c3e2a..c189ac5682 100644 --- a/ggml/src/ggml-cuda/mma.cuh +++ b/ggml/src/ggml-cuda/mma.cuh @@ -1001,17 +1001,13 @@ namespace ggml_cuda_mma { #else #pragma unroll for (int i = 0; i < 2; ++i) { - const float& a_frag = reinterpret_cast<const float&>(A.x[i]); - const float& b_frag = reinterpret_cast<const float&>(B.x[i]); - acc_frag = __builtin_amdgcn_mfma_f32_16x16x4f32(a_frag, b_frag, acc_frag, 0, 0, 0); + acc_frag = __builtin_amdgcn_mfma_f32_16x16x4f32(A.x[i], B.x[i], acc_frag, 0, 0, 0); } #endif #elif defined(CDNA2) || defined(CDNA1) #pragma unroll for (int i = 0; i < 2; ++i) { - const float& a_frag = reinterpret_cast<const float&>(A.x[i]); - const float& b_frag = reinterpret_cast<const float&>(B.x[i]); - acc_frag = __builtin_amdgcn_mfma_f32_16x16x4f32(a_frag, b_frag, acc_frag, 0, 0, 0); + acc_frag = __builtin_amdgcn_mfma_f32_16x16x4f32(A.x[i], B.x[i], acc_frag, 0, 0, 0); } #else GGML_UNUSED_VARS(D, A, B);