fix softmax for iGPU (#17838)
This commit is contained in:
parent
2fbe3b7bb7
commit
2e9eab80c2
|
|
@@ -277,7 +277,7 @@ static void soft_max_f32_sycl(const float *x, const T *mask,
|
||||||
const int id = get_current_device_id();
|
const int id = get_current_device_id();
|
||||||
const size_t smpbo = ggml_sycl_info().devices[id].smpbo;
|
const size_t smpbo = ggml_sycl_info().devices[id].smpbo;
|
||||||
|
|
||||||
if (nbytes_shared <= smpbo) {
|
if (nbytes_shared <= smpbo && ncols_x <= max_block_size) {
|
||||||
launch_soft_max_kernels<32, 64, 128, 256, 512, 1024, 2048, 4096>(
|
launch_soft_max_kernels<32, 64, 128, 256, 512, 1024, 2048, 4096>(
|
||||||
x, mask, sinks, dst, params, stream, block_dims, block_nums,
|
x, mask, sinks, dst, params, stream, block_dims, block_nums,
|
||||||
nbytes_shared);
|
nbytes_shared);
|
||||||
|
|
|
||||||
Loading…
Reference in New Issue