From df54d2f1d4a62975a6e45d52b6b32a3308625fb4 Mon Sep 17 00:00:00 2001 From: Georgi Gerganov Date: Wed, 30 Aug 2023 19:37:26 +0300 Subject: [PATCH] ggml : use less ggml_mul tasks when src0 rows are few --- ggml.c | 11 +++++++++-- 1 file changed, 9 insertions(+), 2 deletions(-) diff --git a/ggml.c b/ggml.c index 631d4b953..12e3a1f91 100644 --- a/ggml.c +++ b/ggml.c @@ -9329,11 +9329,12 @@ static void ggml_compute_forward_mul_f32( struct ggml_tensor * dst) { GGML_ASSERT(ggml_can_repeat_rows(src1, src0) && ggml_are_same_shape(src0, dst)); + const int ith = params->ith; + const int nth = params->nth; + if (params->type == GGML_TASK_INIT || params->type == GGML_TASK_FINALIZE) { return; } - const int ith = params->ith; - const int nth = params->nth; #ifdef GGML_USE_CLBLAST if (src1->backend == GGML_BACKEND_GPU) { @@ -17229,7 +17230,13 @@ struct ggml_cplan ggml_graph_plan(struct ggml_cgraph * cgraph, int n_threads) { } } break; case GGML_OP_SILU_BACK: + { + n_tasks = n_threads; + } break; case GGML_OP_MUL: + { + n_tasks = MIN(n_threads, ggml_nrows(node->src[0])); + } break; case GGML_OP_NORM: case GGML_OP_RMS_NORM: case GGML_OP_RMS_NORM_BACK: