From 9e15d138f2003629d2319d533c7d12c54f48c061 Mon Sep 17 00:00:00 2001 From: "Vithule, Prashant" Date: Fri, 6 Feb 2026 10:04:41 +0000 Subject: [PATCH] Previously, when SVE 256 was not present, the generic function was used for the computation, which slowed performance. Added code so that the NEON code path is used when SVE 256 is not present. --- ggml/src/ggml-cpu/arch/arm/repack.cpp | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/ggml/src/ggml-cpu/arch/arm/repack.cpp b/ggml/src/ggml-cpu/arch/arm/repack.cpp index 5ec8bb657e..c6d0c5a5f6 100644 --- a/ggml/src/ggml-cpu/arch/arm/repack.cpp +++ b/ggml/src/ggml-cpu/arch/arm/repack.cpp @@ -3535,8 +3535,9 @@ void ggml_gemm_q4_K_8x8_q8_K(int n, } // for y return; } +#endif // SVE compile-time end -#elif defined(__aarch64__) && defined(__ARM_NEON) && defined(__ARM_FEATURE_MATMUL_INT8) +#if defined(__aarch64__) && defined(__ARM_NEON) && defined(__ARM_FEATURE_MATMUL_INT8) constexpr int q8_k_blocklen = 4; const uint8x16_t m4b = vdupq_n_u8(0x0f);