diff --git a/ggml-sycl.cpp b/ggml-sycl.cpp index caffe9b02..5c8803653 100644 --- a/ggml-sycl.cpp +++ b/ggml-sycl.cpp @@ -11946,7 +11946,8 @@ inline void ggml_sycl_op_mul_mat_vec_q( // TODO: support these quantization types GGML_ASSERT(!(src0->type == GGML_TYPE_IQ2_XXS || src0->type == GGML_TYPE_IQ2_XS || - src0->type == GGML_TYPE_IQ3_XXS)); + src0->type == GGML_TYPE_IQ3_XXS || + src0->type == GGML_TYPE_IQ1_S)); switch (src0->type) { case GGML_TYPE_Q4_0: @@ -14965,7 +14966,10 @@ static bool ggml_backend_sycl_supports_op(ggml_backend_t backend, const ggml_ten if (a->ne[3] != b->ne[3]) { return false; } - + + if (a->type == GGML_TYPE_IQ1_S) { + return false; + } if (a->type == GGML_TYPE_IQ3_XXS) { return false; }