ggml : when using BLAS start only 1 CPU thread

2025-08-18 15:28:50 +02:00 · 2023-01-07 19:48:56 +02:00
parent 6394c906af
commit d347a59a5f
1 changed file with 1 addition and 0 deletions
--- a/ggml.c
+++ b/ggml.c
@@ -7257,6 +7257,7 @@ void ggml_graph_compute(struct ggml_context * ctx, struct ggml_cgraph * cgraph)
                                node->src1->type == GGML_TYPE_F32) {
 #if defined(GGML_USE_ACCELERATE) || defined(GGML_USE_OPENBLAS)
                                if (ggml_compute_forward_mul_mat_use_blas(node->src0, node->src1, node)) {
                                    node->n_tasks = 1;
                                    cur = sizeof(float)*(node->src0->ne[0]*node->src0->ne[1]);
                                } else {
                                    cur = sizeof(ggml_fp16_t)*ggml_nelements(node->src1);