From a8592fbc1123de3d44d164f3e2de09b86a2fe7c0 Mon Sep 17 00:00:00 2001 From: Georgi Gerganov Date: Mon, 17 Apr 2023 18:41:14 +0300 Subject: [PATCH] ggml : explicit assignment of deltas --- ggml.c | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/ggml.c b/ggml.c index 533371d13..855a835f5 100644 --- a/ggml.c +++ b/ggml.c @@ -726,8 +726,8 @@ static void quantize_row_q4_0(const float * restrict x, void * restrict vy, int const float id0 = d0 ? 1.0f/d0 : 0.0f; const float id1 = d1 ? 1.0f/d1 : 0.0f; - y[i].d0 = d0; - y[i].d1 = d1; + y[i].d0 = GGML_FP32_TO_FP16(d0); + y[i].d1 = GGML_FP32_TO_FP16(d1); for (int l = 0; l < 4; l++) { const float32x4_t v = vmulq_n_f32(srcv[l], id0);