From 87e5c86686e3c87ddf26829f863a4b5f9ed7ab83 Mon Sep 17 00:00:00 2001
From: abhilash1910
Date: Fri, 15 Mar 2024 00:33:35 -0700
Subject: [PATCH] allow iq quant

---
 ggml-sycl.cpp | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/ggml-sycl.cpp b/ggml-sycl.cpp
index 31b3a3e15..15aeb993f 100644
--- a/ggml-sycl.cpp
+++ b/ggml-sycl.cpp
@@ -15498,7 +15498,7 @@ static void ggml_sycl_mul_mat(const ggml_tensor * src0, const ggml_tensor * src1
 #ifdef GGML_SYCL_FORCE_DMMV
     const bool use_mul_mat_vec_q = false;
 #else
-    const bool use_mul_mat_vec_q = min_compute_capability >= VER_4VEC && ggml_is_quantized(src0->type) && ggml_nrows(src1) == 1;
+    const bool use_mul_mat_vec_q = min_compute_capability >= VER_4VEC && ggml_is_quantized(src0->type);
 #endif // GGML_SYCL_FORCE_DMMV
 
     if (use_mul_mat_vec_q) {