From ece01fc2e99570f240ecc9a65f3e4f3df216e827 Mon Sep 17 00:00:00 2001 From: Max Krasnyansky Date: Wed, 15 May 2024 09:05:07 -0700 Subject: [PATCH] matmul-int8: remove unnecessary casts in q8_0_q8_0 --- ggml-quants.c | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/ggml-quants.c b/ggml-quants.c index e9b24f5eb..f13599f6b 100644 --- a/ggml-quants.c +++ b/ggml-quants.c @@ -4852,10 +4852,10 @@ void ggml_vec_dot_q8_0_q8_0(int n, float * restrict s, size_t bs, const void * r const block_q8_0 * restrict b_x1 = &vx1[i]; const block_q8_0 * restrict b_y1 = &vy1[i]; - const int8x16_t x0_l = vld1q_s8((const int8_t*)b_x0->qs); - const int8x16_t x0_h = vld1q_s8((const int8_t*)b_x0->qs + 16); - const int8x16_t x1_l = vld1q_s8((const int8_t*)b_x1->qs); - const int8x16_t x1_h = vld1q_s8((const int8_t*)b_x1->qs + 16); + const int8x16_t x0_l = vld1q_s8(b_x0->qs); + const int8x16_t x0_h = vld1q_s8(b_x0->qs + 16); + const int8x16_t x1_l = vld1q_s8(b_x1->qs); + const int8x16_t x1_h = vld1q_s8(b_x1->qs + 16); // load y const int8x16_t y0_l = vld1q_s8(b_y0->qs);