HIP : fix RDNA4 build (#17792)
This commit is contained in:
parent
1be97831e4
commit
6016d0bd41
|
|
@ -560,7 +560,7 @@ namespace ggml_cuda_mma {
|
||||||
xi[0] = xs[0];
|
xi[0] = xs[0];
|
||||||
xi[1] = xs[1];
|
xi[1] = xs[1];
|
||||||
#endif // defined(RDNA4)
|
#endif // defined(RDNA4)
|
||||||
}else if constexpr (I == 16 && J == 8) {
|
} else if constexpr (I == 16 && J == 8) {
|
||||||
int64_t * xi = (int64_t *) t.x;
|
int64_t * xi = (int64_t *) t.x;
|
||||||
#if defined(RDNA4)
|
#if defined(RDNA4)
|
||||||
const int64_t * xs = (int64_t *) ((const int *) xs0 + (threadIdx.x % t.I) * stride + 4 * (threadIdx.x / t.I));
|
const int64_t * xs = (int64_t *) ((const int *) xs0 + (threadIdx.x % t.I) * stride + 4 * (threadIdx.x / t.I));
|
||||||
|
|
@ -577,14 +577,13 @@ namespace ggml_cuda_mma {
|
||||||
const int64_t * xs1 = xs + 2;
|
const int64_t * xs1 = xs + 2;
|
||||||
xi[2] = xs1[0];
|
xi[2] = xs1[0];
|
||||||
xi[3] = xs1[1];
|
xi[3] = xs1[1];
|
||||||
|
#endif // defined(RDNA4)
|
||||||
}else{
|
} else {
|
||||||
NO_DEVICE_CODE;
|
NO_DEVICE_CODE;
|
||||||
}
|
}
|
||||||
} else {
|
} else {
|
||||||
NO_DEVICE_CODE;
|
NO_DEVICE_CODE;
|
||||||
}
|
}
|
||||||
#endif // defined(RDNA4)
|
|
||||||
#else
|
#else
|
||||||
#pragma unroll
|
#pragma unroll
|
||||||
for (int l = 0; l < t.ne; ++l) {
|
for (int l = 0; l < t.ne; ++l) {
|
||||||
|
|
|
||||||
Loading…
Reference in New Issue