From 1723c147c2c1d96468014854add294f6548f9119 Mon Sep 17 00:00:00 2001 From: "Meng, Hengyu" Date: Tue, 28 May 2024 20:59:54 +0800 Subject: [PATCH] Update ggml-sycl.cpp Co-authored-by: Neo Zhang Jianyu --- ggml-sycl.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/ggml-sycl.cpp b/ggml-sycl.cpp index d1ebf26e5..2f105e300 100644 --- a/ggml-sycl.cpp +++ b/ggml-sycl.cpp @@ -15255,7 +15255,7 @@ static void ggml_sycl_mul_mat(const ggml_tensor * src0, const ggml_tensor * src1 && src1->type == GGML_TYPE_F32 && dst->type == GGML_TYPE_F32 && src1->ne[1] <= MMVQ_MAX_BATCH_SIZE; - bool use_mul_mat_q = ggml_sycl_supports_mmq(src0->type) + bool use_mul_mat_q = ggml_sycl_supports_mmq(src0->type) && src1->type == GGML_TYPE_F32 && dst->type == GGML_TYPE_F32; // mmvq and mmq need the __dp4a instruction which is available for gen12+