Update ggml/src/ggml-cuda/mmq.cuh
Co-authored-by: Johannes Gäßler <johannesg@5d6.de>
This commit is contained in:
parent
777f5943a4
commit
fbc4cfcdde
|
|
@@ -496,6 +496,8 @@ static __device__ __forceinline__ void vec_dot_q4_1_q8_1_dp4a(
|
||||||
|
|
||||||
constexpr int max_cpy = ggml_cuda_get_max_cpy_bytes();
|
constexpr int max_cpy = ggml_cuda_get_max_cpy_bytes();
|
||||||
constexpr int mcpy_int = max_cpy / sizeof(int);
|
constexpr int mcpy_int = max_cpy / sizeof(int);
|
||||||
|
static_assert(VDR_Q4_0_Q8_1_MMQ == 4, "bad VDR_Q4_0_Q8_1_MMQ");
|
||||||
|
|
||||||
|
|
||||||
int tmp0[4], tmp1[4];
|
int tmp0[4], tmp1[4];
|
||||||
|
|
||||||
|
|
|
||||||
Loading…
Reference in New Issue