llama : initial Mamba-2 support

2024-08-01 10:43:42 -04:00 · 2024-08-01 10:43:42 -04:00 · 1f0fea70fb
commit 1f0fea70fb
parent a1631e53f6
7 changed files with 490 additions and 82 deletions
--- a/ggml/include/ggml.h
+++ b/ggml/include/ggml.h
@@ -1787,7 +1787,8 @@ extern "C" {
            struct ggml_tensor  * dt,
            struct ggml_tensor  * A,
            struct ggml_tensor  * B,
-            struct ggml_tensor  * C);
+            struct ggml_tensor  * C,
+            struct ggml_tensor  * D);

    // partition into non-overlapping windows with padding if needed
    // example: