From d07dc44c6320c8ee0d7f57416d7808907377119a Mon Sep 17 00:00:00 2001 From: Alan Gray Date: Thu, 10 Oct 2024 06:05:12 -0700 Subject: [PATCH] addressed comment --- ggml/src/ggml-cuda/dmmv.cu | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/ggml/src/ggml-cuda/dmmv.cu b/ggml/src/ggml-cuda/dmmv.cu index 2a9543fd1..b727d4ff0 100644 --- a/ggml/src/ggml-cuda/dmmv.cu +++ b/ggml/src/ggml-cuda/dmmv.cu @@ -419,8 +419,8 @@ static __device__ void convert_f16(const void * vx, const int64_t ib, const int // load 2 halfs into register in a single instruction const half2 x_reg = *((half2 *) &(x[ib + iqs])); // automatic half -> float type cast if dfloat == float - v.x = x_reg.x; - v.y = x_reg.y; + v.x = __low2float(x_reg); + v.y = __high2float(x_reg); } static constexpr __device__ dequantize_kernel_t get_dequantize_kernel(ggml_type type) {