ggml : when using BLAS start only 1 CPU thread

pull/383/head
Georgi Gerganov 1 year ago
parent 6394c906af
commit d347a59a5f
No known key found for this signature in database
GPG Key ID: 449E073F9DC10735

@@ -7257,6 +7257,7 @@ void ggml_graph_compute(struct ggml_context * ctx, struct ggml_cgraph * cgraph)
node->src1->type == GGML_TYPE_F32) {
#if defined(GGML_USE_ACCELERATE) || defined(GGML_USE_OPENBLAS)
if (ggml_compute_forward_mul_mat_use_blas(node->src0, node->src1, node)) {
node->n_tasks = 1;
cur = sizeof(float)*(node->src0->ne[0]*node->src0->ne[1]);
} else {
cur = sizeof(ggml_fp16_t)*ggml_nelements(node->src1);

Loading…
Cancel
Save