From daa87b1813dec45c36635f8358719b2d2ba83893 Mon Sep 17 00:00:00 2001
From: Kunnis <kunnis@gmail.com>
Date: Thu, 9 May 2024 22:12:20 -0500
Subject: [PATCH] adding the current_chunk

---
 ggml.c | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/ggml.c b/ggml.c
index 32eeb247f..6d368185a 100644
--- a/ggml.c
+++ b/ggml.c
@@ -1578,6 +1578,8 @@ struct ggml_compute_state_shared {
 
     ggml_abort_callback abort_callback; // abort ggml_graph_compute when true
     void* abort_callback_data;
+
+    atomic_int current_chunk; // currently processing chunk during Mat_Mul, shared between all the threads.
 };
 
 struct ggml_compute_state {
@@ -12003,6 +12005,8 @@ UseGgmlGemm1:;
         if (ith != 0) {
             return;
         }
+        //Every thread starts at ith, so the first unprocessed chunk is nth.  This save a bit of coordination right at the start.
+        atomic_store(&state->shared->current_chunk, nth);
         if (src1->type != vec_dot_type) {
             char * wdata = params->wdata;
             const size_t row_size = ggml_row_size(vec_dot_type, ne10);