diff --git a/ggml-sycl.cpp b/ggml-sycl.cpp index 31b3a3e15..15aeb993f 100644 --- a/ggml-sycl.cpp +++ b/ggml-sycl.cpp @@ -15498,7 +15498,7 @@ static void ggml_sycl_mul_mat(const ggml_tensor * src0, const ggml_tensor * src1 #ifdef GGML_SYCL_FORCE_DMMV const bool use_mul_mat_vec_q = false; #else - const bool use_mul_mat_vec_q = min_compute_capability >= VER_4VEC && ggml_is_quantized(src0->type) && ggml_nrows(src1) == 1; + const bool use_mul_mat_vec_q = min_compute_capability >= VER_4VEC && ggml_is_quantized(src0->type); #endif // GGML_SYCL_FORCE_DMMV if (use_mul_mat_vec_q) {