diff --git a/ggml/src/ggml-cuda/conv2d-implicit.cu b/ggml/src/ggml-cuda/conv2d-implicit.cu index 66af15c167..93ede3efc8 100644 --- a/ggml/src/ggml-cuda/conv2d-implicit.cu +++ b/ggml/src/ggml-cuda/conv2d-implicit.cu @@ -25,7 +25,7 @@ static __global__ void reduce_f32(const float * __restrict__ x, float * __restri template + const int layout, const bool vec_load, const int ksplit, const int PAD=4> static __global__ void conv2d_implicit_kernel(const float * __restrict__ input, const T * __restrict__ kernel, float * __restrict__ output,