From 3fbf0529ef6d76b68561036c6669e071d806ee9f Mon Sep 17 00:00:00 2001
From: Jared Van Bortel
Date: Thu, 25 Jan 2024 15:47:43 -0500
Subject: [PATCH] kompute : mark last few failing ops as unsupported

---
 ggml-kompute.cpp | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/ggml-kompute.cpp b/ggml-kompute.cpp
index 030cb7a23..b4781d3da 100644
--- a/ggml-kompute.cpp
+++ b/ggml-kompute.cpp
@@ -1350,7 +1350,7 @@ static bool ggml_vk_supports_op(const struct ggml_tensor * op) {
                 case GGML_TYPE_Q4_0:
                 case GGML_TYPE_Q4_1:
                 case GGML_TYPE_Q6_K:
-                    return op->ne[3] == 1;
+                    return op->ne[2] == 1 && op->ne[3] == 1;
                 default:
                     ;
             }
@@ -1361,11 +1361,12 @@ static bool ggml_vk_supports_op(const struct ggml_tensor * op) {
 
             switch (op->src[0]->type) {
                 case GGML_TYPE_F32:
+                case GGML_TYPE_Q6_K:
+                    return op->ne[3] == 1;
                 case GGML_TYPE_F16:
                 case GGML_TYPE_Q8_0:
                 case GGML_TYPE_Q4_0:
                 case GGML_TYPE_Q4_1:
-                case GGML_TYPE_Q6_K:
                     return true;
                 default:
                     ;