diff --git a/ggml/src/ggml-cuda/convert.cu b/ggml/src/ggml-cuda/convert.cu index 0887a8f9bc..d477f542ce 100644 --- a/ggml/src/ggml-cuda/convert.cu +++ b/ggml/src/ggml-cuda/convert.cu @@ -621,12 +621,12 @@ template static __global__ void dequantize_block_nvfp4( const void * __restrict__ vx, dst_t * __restrict__ yy, - const int64_t k) { + const int64_t ne) { const int64_t i = blockIdx.x; const int tid = threadIdx.x; const int64_t base = i * QK_NVFP4; - if (base >= k) { + if (base >= ne) { return; }