allow iq quant

2024-03-15 00:33:35 -07:00 · 2024-03-15 00:33:35 -07:00 · 87e5c86686
commit 87e5c86686
parent 0af3ed733f
1 changed file with 1 addition and 1 deletion
--- a/ggml-sycl.cpp
+++ b/ggml-sycl.cpp
@@ -15498,7 +15498,7 @@ static void ggml_sycl_mul_mat(const ggml_tensor * src0, const ggml_tensor * src1
 #ifdef GGML_SYCL_FORCE_DMMV
            const bool use_mul_mat_vec_q = false;
 #else
-            const bool use_mul_mat_vec_q = min_compute_capability >= VER_4VEC && ggml_is_quantized(src0->type) && ggml_nrows(src1) == 1;
+            const bool use_mul_mat_vec_q = min_compute_capability >= VER_4VEC && ggml_is_quantized(src0->type);
 #endif // GGML_SYCL_FORCE_DMMV
            if (use_mul_mat_vec_q) {