From 6a8432bf436d5ab3a5214dced294c789ffa543a2 Mon Sep 17 00:00:00 2001
From: "Meng, Hengyu"
Date: Tue, 28 May 2024 20:59:44 +0800
Subject: [PATCH] Update ggml-sycl.cpp

Co-authored-by: Neo Zhang Jianyu
---
 ggml-sycl.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/ggml-sycl.cpp b/ggml-sycl.cpp
index 855015978..d1ebf26e5 100644
--- a/ggml-sycl.cpp
+++ b/ggml-sycl.cpp
@@ -15251,7 +15251,7 @@ static void ggml_sycl_mul_mat(const ggml_tensor * src0, const ggml_tensor * src1
         && src1->type == GGML_TYPE_F32 && dst->type == GGML_TYPE_F32
         && src0->ne[0] % GGML_SYCL_DMMV_X == 0 && src1->ne[1] == 1;
 
-    bool use_mul_mat_vec_q = ggml_is_quantized(src0->type)
+    bool use_mul_mat_vec_q = ggml_is_quantized(src0->type)
         && src1->type == GGML_TYPE_F32 && dst->type == GGML_TYPE_F32
         && src1->ne[1] <= MMVQ_MAX_BATCH_SIZE;
 