diff --git a/ggml-qnn.cpp b/ggml-qnn.cpp index b97b20245..47810c933 100644 --- a/ggml-qnn.cpp +++ b/ggml-qnn.cpp @@ -1995,7 +1995,7 @@ public: if (is_npu) { qnn_instance * instance = ctx->instance; uint8_t *qnn_buffer = static_cast(instance->alloc_rpcmem( - ggml_nbytes(tensor), 4)); // TODO: should we get the align param from device here? + ggml_nbytes(tensor), alignof(void*))); if (!qnn_buffer) { QNN_LOG_WARN("alloc rpcmem failure, %s\n", strerror(errno)); QNN_LOG_DEBUG("tensor%p name %s", _qnn_tensor, QNN_TENSOR_GET_NAME(*_qnn_tensor));