threadpool: update calling thread prio and affinity only at start/resume

max-krasnyansky · max-krasnyansky · commit 693b6685f863 · 2024-08-26T13:10:11.000-07:00
This avoids repeating the thread priority and affinity syscalls on every ggml_graph_compute() call.
diff --git a/ggml/src/ggml.c b/ggml/src/ggml.c
@@ -18898,6 +18898,12 @@ static void ggml_resume_threadpool_locked(struct ggml_compute_threadpool * threa
     GGML_PRINT_DEBUG("Resuming threadpool\n");
     threadpool->pause = false;
     ggml_cond_broadcast(&threadpool->cond);
+
+    // Update main thread prio and affinity to match the threadpool settings
+    ggml_thread_apply_thread_priority(threadpool->prio);
+    if (ggml_thread_cpumask_is_valid(threadpool->workers[0].cpumask)) {
+        ggml_thread_apply_affinity(threadpool->workers[0].cpumask);
+    }
 }
 #endif
 
@@ -19324,6 +19330,14 @@ static struct ggml_compute_threadpool * ggml_create_threadpool_impl(
     }
 
     ggml_thread_cpumask_next(tpp->cpumask, workers[0].cpumask, tpp->strict_cpu, &cpumask_iter);
+
+    if (!threadpool->pause) {
+        // Update main thread prio and affinity at the start, otherwise we'll do it in resume
+        ggml_thread_apply_thread_priority(threadpool->prio);
+        if (ggml_thread_cpumask_is_valid(threadpool->workers[0].cpumask)) {
+            ggml_thread_apply_affinity(threadpool->workers[0].cpumask);
+        }
+    }
 #endif // GGML_USE_OPENMP
 
     return threadpool;
@@ -19380,12 +19394,6 @@ enum ggml_status ggml_graph_compute(struct ggml_cgraph * cgraph, struct ggml_cpl
         ggml_graph_compute_thread(&threadpool->workers[0]);
     }
 #else
-    // Update main thread prio and affinity to match the current threadpool
-    ggml_thread_apply_thread_priority(threadpool->prio);
-    if (ggml_thread_cpumask_is_valid(threadpool->workers[0].cpumask)) {
-        ggml_thread_apply_affinity(threadpool->workers[0].cpumask);
-    }
-
     // Kick all threads to start the new graph
     ggml_graph_compute_kickoff(threadpool);