llama : sync gguf-llama.cpp with latest llama.cpp (#2608)

* llama : sync gguf-llama.cpp with latest llama.cpp
* minor : indentation + assert
* llama : refactor gguf_buffer and gguf_ctx_buffer
* llama : minor
2023-08-14 16:28:44 +03:00 · 2023-08-14 16:28:44 +03:00 · f00780b2ee
commit f00780b2ee
parent 6f64b6c0f8
6 changed files with 692 additions and 463 deletions
--- a/ggml-metal.m
+++ b/ggml-metal.m
@@ -224,6 +224,21 @@ void ggml_metal_free(struct ggml_metal_context * ctx) {
    free(ctx);
 }

+void * ggml_metal_host_malloc(size_t n) { // allocates n bytes aligned to the system page size; returns NULL on failure
+    void * data = NULL;
+    const int result = posix_memalign((void **) &data, getpagesize(), n); // alignment argument is getpagesize(); a non-zero result is treated as failure below
+    if (result != 0) {
+        fprintf(stderr, "%s: error: posix_memalign failed\n", __func__); // the numeric error code in result is not part of the message
+        return NULL;
+    }
+
+    return data; // NOTE(review): presumably meant to be released with ggml_metal_host_free - confirm against callers
+}
+
+void ggml_metal_host_free(void * data) { // releases data by passing it to free()
+    free(data); // NOTE(review): presumably data comes from ggml_metal_host_malloc (posix_memalign) - confirm against callers
+}
+
 void ggml_metal_set_n_cb(struct ggml_metal_context * ctx, int n_cb) { // stores n_cb in the context
    ctx->n_cb = n_cb; // written as-is, no range check here; NOTE(review): n_cb presumably is the number of command buffers - confirm
 }