sched : allow ops with weights on an incompatible buffer type
This will cause the weight to be copied to a backend that supports the op, which is very costly. The weight should have been stored in a buffer of a backend that can run the op, but llama.cpp cannot do this automatically at the moment.

ggml-ci
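To avoid the copy entirely, the weight would need to be allocated in a buffer type of a backend that can run the op. Below is a minimal, hypothetical sketch of how a loader could pick such a buffer type up front; only ggml_backend_supports_op() and ggml_backend_get_default_buffer_type() are existing ggml-backend API, while the helper itself and the priority-ordered backends array are assumptions for illustration and are not part of this change.

// Hypothetical sketch, not part of this commit: pick a buffer type for a
// weight by finding the highest-priority backend that supports the op that
// will use it. ggml_backend_supports_op() and
// ggml_backend_get_default_buffer_type() are existing ggml-backend API;
// the helper and the `backends` array are assumptions for illustration.
#include "ggml.h"
#include "ggml-backend.h"

static ggml_backend_buffer_type_t pick_weight_buft_for_op(
        ggml_backend_t * backends, int n_backends, const struct ggml_tensor * op) {
    for (int i = 0; i < n_backends; i++) {
        if (ggml_backend_supports_op(backends[i], op)) {
            // this backend can run the op directly, so storing the weight in
            // its default buffer type avoids the costly copy described above
            return ggml_backend_get_default_buffer_type(backends[i]);
        }
    }
    // no backend supports the op: any placement will hit the copy fallback
    // that this commit allows instead of asserting
    return NULL;
}

The returned buffer type could then be used when allocating the model tensors, for example with ggml_backend_alloc_ctx_tensors_from_buft().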
parent ae9cd85698
commit 211fb045f1
1 changed file with 4 additions and 3 deletions
@@ -1116,9 +1116,10 @@ static int ggml_backend_sched_backend_from_buffer(ggml_backend_sched_t sched, co
         }
     }
 
-    fprintf(stderr, "%s: error: no backend supports buffer type %s used in tensor %s\n",
-        __func__, ggml_backend_buffer_name(buffer), tensor->name);
-    GGML_ASSERT(false);
+#ifndef NDEBUG
+    fprintf(stderr, "%s: warning: no backend supports op %s with a weight with buffer type %s used in tensor %s, the weight will need to be copied\n",
+        __func__, ggml_op_desc(tensor), ggml_backend_buffer_name(buffer), tensor->name);
+#endif
 
     return -1;
 }