From 80d3b39bff9cc18187972ac198c3630ad7c94f3d Mon Sep 17 00:00:00 2001 From: Aidan Date: Tue, 2 Jul 2024 10:09:20 +0100 Subject: [PATCH] Single load for half2 --- ggml/src/ggml-sycl/dequantize.hpp | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/ggml/src/ggml-sycl/dequantize.hpp b/ggml/src/ggml-sycl/dequantize.hpp index 24eb70c18..84c35d415 100644 --- a/ggml/src/ggml-sycl/dequantize.hpp +++ b/ggml/src/ggml-sycl/dequantize.hpp @@ -319,8 +319,9 @@ static void dequantize_block_q4_K(const void * __restrict__ vx, dst_t * __restri dst_t * y = yy + i*QK_K + 64*il + n*ir; - const float dall = x[i].dm[0]; - const float dmin = x[i].dm[1]; + const sycl::half2 dm = x[i].dm; + const float dall = dm[0]; + const float dmin = dm[1]; const uint8_t * q = x[i].qs + 32*il + n*ir;