norm & rms_norm can not be threaded:
after investigation rms norm for quite some time I come to the conclusion that neither norm, nor rms_norm can be threaded, because we need mean over all items, not just of the slices each thread sees.
This commit is contained in:
parent
b164343529
commit
b908007471
1 changed files with 2 additions and 2 deletions
4
ggml.c
4
ggml.c
|
@ -13288,8 +13288,8 @@ void ggml_graph_compute(struct ggml_context * ctx, struct ggml_cgraph * cgraph)
|
|||
case GGML_OP_RMS_NORM:
|
||||
case GGML_OP_RMS_NORM_BACK:
|
||||
{
|
||||
// i think this must not be threaded, because we need mean over all items, not just the slices each thread sees
|
||||
node->n_tasks = n_threads;
|
||||
// i think this cannot be threaded, because we need mean over all items, not just the slices each thread sees.
|
||||
node->n_tasks = 1;
|
||||
} break;
|
||||
case GGML_OP_MUL_MAT:
|
||||
{
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue