From daacf6ca150d7a7d80e30d488e66a4e812186afa Mon Sep 17 00:00:00 2001 From: Iwan Kawrakow Date: Tue, 20 Feb 2024 09:37:42 +0200 Subject: [PATCH] It was the ggml_vdotq thing missed inside the brackets --- ggml-quants.c | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/ggml-quants.c b/ggml-quants.c index 6fb3b4c14..6336538f0 100644 --- a/ggml-quants.c +++ b/ggml-quants.c @@ -9511,8 +9511,8 @@ void ggml_vec_dot_iq4_nl_q8_0(int n, float * restrict s, size_t bs, const void * q4b.val[2] = vqtbl1q_s8(values, vandq_u8(q4bits.val[1], m4b)); q4b.val[3] = vqtbl1q_s8(values, vshrq_n_u8(q4bits.val[1], 4)); - prod_1 = ggml_vdotq_s32(vdotq_s32(vdupq_n_s32(0), q4b.val[0], q8b.val[0]), q4b.val[1], q8b.val[1]); - prod_2 = ggml_vdotq_s32(vdotq_s32(vdupq_n_s32(0), q4b.val[2], q8b.val[2]), q4b.val[3], q8b.val[3]); + prod_1 = ggml_vdotq_s32(ggml_vdotq_s32(vdupq_n_s32(0), q4b.val[0], q8b.val[0]), q4b.val[1], q8b.val[1]); + prod_2 = ggml_vdotq_s32(ggml_vdotq_s32(vdupq_n_s32(0), q4b.val[2], q8b.val[2]), q4b.val[3], q8b.val[3]); sumf += (float)x[ib+0].d * (float)y[ib+0].d * vaddvq_s32(prod_1) + (float)x[ib+1].d * (float)y[ib+1].d * vaddvq_s32(prod_2);