From d347a59a5f224f6a5ab0084ec95715451972d3b0 Mon Sep 17 00:00:00 2001
From: Georgi Gerganov
Date: Sat, 7 Jan 2023 19:48:56 +0200
Subject: [PATCH] ggml : when using BLAS start only 1 CPU thread

---
 ggml.c | 1 +
 1 file changed, 1 insertion(+)

diff --git a/ggml.c b/ggml.c
index 058241e..f4c96eb 100644
--- a/ggml.c
+++ b/ggml.c
@@ -7257,6 +7257,7 @@ void ggml_graph_compute(struct ggml_context * ctx, struct ggml_cgraph * cgraph)
         node->src1->type == GGML_TYPE_F32) {
 #if defined(GGML_USE_ACCELERATE) || defined(GGML_USE_OPENBLAS)
     if (ggml_compute_forward_mul_mat_use_blas(node->src0, node->src1, node)) {
+        node->n_tasks = 1;
         cur = sizeof(float)*(node->src0->ne[0]*node->src0->ne[1]);
     } else {
         cur = sizeof(ggml_fp16_t)*ggml_nelements(node->src1);