From 1d650ce6b4d503f6d5a47a3a4c4ebe751334e934 Mon Sep 17 00:00:00 2001
From: Georgi Gerganov
Date: Tue, 23 Jan 2024 14:12:32 +0200
Subject: [PATCH] ggml : add comment

---
 ggml.c | 1 +
 1 file changed, 1 insertion(+)

diff --git a/ggml.c b/ggml.c
index dc43b0bbe..ca98fde8a 100644
--- a/ggml.c
+++ b/ggml.c
@@ -16932,6 +16932,7 @@ struct ggml_cplan ggml_graph_plan(const struct ggml_cgraph * cgraph, int n_threa
                     if (ggml_compute_forward_mul_mat_use_blas(node)) {
                         if (node->src[0]->type != GGML_TYPE_F32) {
                             // here we need memory for fully dequantized matrix from src0
+                            // take into account that src0 can be broadcasted into src1[2,3]
                             cur = ggml_type_size(GGML_TYPE_F32)
                                 * node->src[0]->ne[0]*node->src[0]->ne[1]
                                 * node->src[1]->ne[2]*node->src[1]->ne[3];