fix j-major wrong ne on CDNA

This commit is contained in:
zhang hui 2025-12-16 10:01:30 +08:00
parent 6acad9c759
commit cffa070b08
1 changed file with 1 addition and 1 deletion

View File

@@ -446,7 +446,7 @@ namespace ggml_cuda_mma {
static constexpr int J = J_;
static constexpr data_layout dl = DATA_LAYOUT_J_MAJOR;
-static constexpr int ne = I * J / 32;
+static constexpr int ne = tile<I_, J_, T, DATA_LAYOUT_I_MAJOR>::ne;
T x[ne] = {0};
static constexpr __device__ bool supported() {