Added an `if` condition so that the SVE code path is used only when the vector length is 256 bits.
This commit is contained in:
parent
57b218d447
commit
6363036f2b
|
|
@ -3227,6 +3227,7 @@ void ggml_gemm_q4_K_8x8_q8_K(int n,
|
||||||
UNUSED(blocklen);
|
UNUSED(blocklen);
|
||||||
|
|
||||||
#if defined(__aarch64__) && defined(__ARM_FEATURE_SVE) && defined(__ARM_FEATURE_MATMUL_INT8)
|
#if defined(__aarch64__) && defined(__ARM_FEATURE_SVE) && defined(__ARM_FEATURE_MATMUL_INT8)
|
||||||
|
if (svcntb()*8 == 256) {
|
||||||
constexpr int q8_k_blocklen = 4;
|
constexpr int q8_k_blocklen = 4;
|
||||||
const svuint8_t m4b_1 = svdup_n_u8(0x0f);
|
const svuint8_t m4b_1 = svdup_n_u8(0x0f);
|
||||||
// 8 accumulators: 2 row pairs × 4 col pairs
|
// 8 accumulators: 2 row pairs × 4 col pairs
|
||||||
|
|
@ -3551,6 +3552,7 @@ void ggml_gemm_q4_K_8x8_q8_K(int n,
|
||||||
} // for x
|
} // for x
|
||||||
} // for y
|
} // for y
|
||||||
return;
|
return;
|
||||||
|
}
|
||||||
|
|
||||||
#elif defined(__aarch64__) && defined(__ARM_NEON) && defined(__ARM_FEATURE_MATMUL_INT8)
|
#elif defined(__aarch64__) && defined(__ARM_NEON) && defined(__ARM_FEATURE_MATMUL_INT8)
|
||||||
constexpr int q8_k_blocklen = 4;
|
constexpr int q8_k_blocklen = 4;
|
||||||
|
|
|
||||||
Loading…
Reference in New Issue