Add an assert to make sure we only allocate a temp buffer for non-CPU backend tensors

Co-authored-by: Johannes Gäßler <johannesg@5d6.de>
2023-06-12 20:19:26 +08:00 · 2023-06-12 20:19:26 +08:00 · 61726bd942
commit 61726bd942
parent 34ca572e84
1 changed files with 1 additions and 0 deletions
--- a/llama.cpp
+++ b/llama.cpp
@@ -762,6 +762,7 @@ struct llama_model_loader {

            // allocate temp buffer if not using mmap
            if (!use_mmap && lt.data == NULL) {
+                GGML_ASSERT(lt.ggml_tensor->backend != GGML_BACKEND_CPU);
                lt.data = (uint8_t*)malloc(ggml_nbytes(lt.ggml_tensor));
            }