From 935eabd917bb480f71072de67d150e0c0ff72a63 Mon Sep 17 00:00:00 2001
From: abhilash1910
Date: Wed, 27 Mar 2024 22:56:15 -0700
Subject: [PATCH] add condition

---
 ggml-sycl.cpp | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/ggml-sycl.cpp b/ggml-sycl.cpp
index 291594459..c2fb20c17 100644
--- a/ggml-sycl.cpp
+++ b/ggml-sycl.cpp
@@ -15421,7 +15421,8 @@ static void ggml_sycl_mul_mat(const ggml_tensor * src0, const ggml_tensor * src1
                 ggml_sycl_op_mul_mat(src0, src1, dst, ggml_sycl_op_dequantize_mul_mat_vec, false);
             }
         } else {
-            bool use_mul_mat_q = min_compute_capability >= VER_4VEC && ggml_is_quantized(src0->type);
+            bool use_mul_mat_q = min_compute_capability >= VER_4VEC && ggml_is_quantized(src0->type)
+                && ggml_sycl_supports_mmq(src0->type);
 
             if (use_xmx && min_compute_capability >= VER_GEN9 && src1->ne[1] > XMX_MAX_BATCH_SIZE) {
                 use_mul_mat_q = false;