move graph map to backend object
This commit is contained in:
parent
ca0d999c2a
commit
4b2ee61f62
4 changed files with 16 additions and 22 deletions
|
@ -529,18 +529,13 @@ GGML_CALL static void ggml_backend_qnn_free(ggml_backend_t backend) {
|
|||
|
||||
auto *instance = g_qnn_mgr[ctx->device].instance;
|
||||
if (instance != nullptr) {
|
||||
// TODO: this should be done inside the destructor
|
||||
std::map<std::string,
|
||||
std::tuple<Qnn_GraphHandle_t, Qnn_Tensor_t *, Qnn_Tensor_t *,
|
||||
Qnn_Tensor_t *>>::iterator graph_it;
|
||||
for (graph_it = instance->_qnn_graph_map.begin();
|
||||
graph_it != instance->_qnn_graph_map.end(); graph_it++) {
|
||||
auto & graph_item = graph_it->second;
|
||||
Qnn_GraphHandle_t & graph_handle = std::get<0>(graph_item);
|
||||
for (const auto &graph_item: ctx->qnn_graph_map) {
|
||||
Qnn_GraphHandle_t graph_handle = std::get<0>(graph_item.second);
|
||||
GGML_UNUSED(graph_handle);
|
||||
QNN_LOG_INFO("graph type:%s", graph_it->first.c_str());
|
||||
QNN_LOG_INFO("graph type:%s", graph_item.first.c_str());
|
||||
}
|
||||
instance->_qnn_graph_map.clear();
|
||||
|
||||
ctx->qnn_graph_map.clear();
|
||||
|
||||
instance->qnn_finalize();
|
||||
delete instance;
|
||||
|
|
|
@ -57,9 +57,9 @@ static void ggml_qnn_add(ggml_backend_qnn_context *ctx, const ggml_tensor *src0,
|
|||
perf.start();
|
||||
|
||||
std::string map_entry(ggml_op_name(ggmlop));
|
||||
if (instance->_qnn_graph_map.find(map_entry) != instance->_qnn_graph_map.end()) {
|
||||
if (ctx->qnn_graph_map.find(map_entry) != ctx->qnn_graph_map.end()) {
|
||||
graph_initialized = true;
|
||||
auto &graph_item = instance->_qnn_graph_map[map_entry];
|
||||
auto &graph_item = ctx->qnn_graph_map[map_entry];
|
||||
graph_handle = std::get<0>(graph_item);
|
||||
}
|
||||
|
||||
|
@ -157,9 +157,9 @@ static void ggml_qnn_add(ggml_backend_qnn_context *ctx, const ggml_tensor *src0,
|
|||
|
||||
auto graph_item = std::make_tuple(graph_handle, tensor_input0.get_qnn_tensor(), tensor_input1.get_qnn_tensor(),
|
||||
tensor_output.get_qnn_tensor());
|
||||
instance->_qnn_graph_map[map_entry] = graph_item;
|
||||
ctx->qnn_graph_map[map_entry] = graph_item;
|
||||
} else {
|
||||
auto &graph_item = instance->_qnn_graph_map[map_entry];
|
||||
auto &graph_item = ctx->qnn_graph_map[map_entry];
|
||||
qnn::ggml_qnn_tensor_input tensor_input0(src0, std::get<1>(graph_item), ctx);
|
||||
qnn::ggml_qnn_tensor_input tensor_input1(src1, std::get<2>(graph_item), ctx);
|
||||
qnn::ggml_qnn_tensor_output tensor_output(dst, std::get<3>(graph_item), ctx);
|
||||
|
@ -226,9 +226,9 @@ static void ggml_qnn_mul_mat(ggml_backend_qnn_context *ctx, const ggml_tensor *s
|
|||
perf.start();
|
||||
|
||||
std::string map_entry = std::string(ggml_op_name(ggmlop));
|
||||
if (instance->_qnn_graph_map.find(map_entry) != instance->_qnn_graph_map.end()) {
|
||||
if (ctx->qnn_graph_map.find(map_entry) != ctx->qnn_graph_map.end()) {
|
||||
graph_initialized = true;
|
||||
auto &graph_item = instance->_qnn_graph_map[map_entry];
|
||||
auto &graph_item = ctx->qnn_graph_map[map_entry];
|
||||
graph_handle = std::get<0>(graph_item);
|
||||
}
|
||||
|
||||
|
@ -327,9 +327,9 @@ static void ggml_qnn_mul_mat(ggml_backend_qnn_context *ctx, const ggml_tensor *s
|
|||
|
||||
auto graph_item = std::make_tuple(graph_handle, tensor_input0.get_qnn_tensor(), tensor_input1.get_qnn_tensor(),
|
||||
tensor_output.get_qnn_tensor());
|
||||
instance->_qnn_graph_map[map_entry] = graph_item;
|
||||
ctx->qnn_graph_map[map_entry] = graph_item;
|
||||
} else {
|
||||
auto &graph_item = instance->_qnn_graph_map[map_entry];
|
||||
auto &graph_item = ctx->qnn_graph_map[map_entry];
|
||||
qnn::ggml_qnn_tensor_input tensor_input0(src0, std::get<1>(graph_item), ctx);
|
||||
qnn::ggml_qnn_tensor_input tensor_input1(src1, std::get<2>(graph_item), ctx);
|
||||
qnn::ggml_qnn_tensor_output tensor_output(dst, std::get<3>(graph_item), ctx);
|
||||
|
|
|
@ -1,6 +1,8 @@
|
|||
|
||||
#pragma once
|
||||
|
||||
#include <unordered_map>
|
||||
|
||||
#include "ggml.h"
|
||||
|
||||
#include "ggml-backend.h"
|
||||
|
@ -17,4 +19,5 @@ struct ggml_backend_qnn_context {
|
|||
QNN_INTERFACE_VER_TYPE raw_interface;
|
||||
QNN_SYSTEM_INTERFACE_VER_TYPE raw_system_interface;
|
||||
qnn::qcom_socinfo socinfo;
|
||||
std::unordered_map<std::string, std::tuple<Qnn_GraphHandle_t, Qnn_Tensor_t *, Qnn_Tensor_t *, Qnn_Tensor_t *>> qnn_graph_map;
|
||||
};
|
||||
|
|
|
@ -2,7 +2,6 @@
|
|||
|
||||
#include <math.h>
|
||||
|
||||
#include <map>
|
||||
#include <mutex>
|
||||
#include <string>
|
||||
#include <unordered_map>
|
||||
|
@ -705,9 +704,6 @@ public:
|
|||
|
||||
const qnn::qcom_socinfo &get_soc_info() { return _soc_info; }
|
||||
|
||||
public:
|
||||
std::map<std::string, std::tuple<Qnn_GraphHandle_t, Qnn_Tensor_t *, Qnn_Tensor_t *, Qnn_Tensor_t *>> _qnn_graph_map;
|
||||
|
||||
private:
|
||||
int load_system() {
|
||||
Qnn_ErrorHandle_t error = QNN_SUCCESS;
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue