benchmarks

jangorecki · jangorecki · commit ee6fb9d0f796 · 2025-10-17T09:02:44.000+02:00
diff --git a/R/utils.R b/R/utils.R
@@ -227,3 +227,13 @@ formula_vars = function(f, x) { # .formula2varlist is not API and seems to have
     attr(terms, "term.labels")
   )
 }
+
+# Benchmark helper: runs the C-level OpenMP stop-flag benchmark and returns its per-thread counters.
+#   variant: which loop variant the C code runs (1 to 5; any other value runs no loop)
+#   len:     number of loop iterations
+#   halt:    iteration at which the stop flag is raised (the C wrapper subtracts 1 before
+#            comparing it with its 0-based loop index)
+#   th:      number of threads; must be between 1 and parallel::detectCores()
+# Returns an integer vector of length th.
+omp_flags = function(variant, len, halt, th) {
+  th = as.integer(th)
+  halt = as.integer(halt)
+  len = as.integer(len)
+  variant = as.integer(variant)
+  # The C entry point reads element [0] of every argument without checking it, so each
+  # one has to be a single non-NA integer; as.integer() alone guarantees neither
+  # (zero-length input would otherwise pass the range check below vacuously).
+  stopifnot(
+    length(variant) == 1L, length(len) == 1L, length(halt) == 1L, length(th) == 1L,
+    !anyNA(c(variant, len, halt, th))
+  )
+  stopifnot(th <= parallel::detectCores(), th > 0L)
+  .Call("Cbenchmark_omp_flagR", variant, len, halt, th)
+}
diff --git a/src/data.table.h b/src/data.table.h
@@ -410,3 +410,5 @@ SEXP dt_has_zlib(void);
 SEXP startsWithAny(SEXP, SEXP, SEXP);
 SEXP convertDate(SEXP, SEXP);
 SEXP fastmean(SEXP);
+
+SEXP benchmark_omp_flagR(SEXP, SEXP, SEXP, SEXP); // omp-flags.c; arguments in order: variant, len, halt, th
diff --git a/src/init.c b/src/init.c
@@ -160,6 +160,7 @@ R_CallMethodDef callMethods[] = {
 {"CmemcpyDTadaptive", (DL_FUNC)&memcpyDTadaptive, -1},
 {"Csetgrowable", (DL_FUNC)&setgrowable, -1},
 {"Cfrolladapt", (DL_FUNC)&frolladapt, -1},
+{"Cbenchmark_omp_flagR", (DL_FUNC)&benchmark_omp_flagR, -1},
 {NULL, NULL, 0}
 };
 
diff --git a/src/omp-flags.c b/src/omp-flags.c
@@ -0,0 +1,80 @@
+#include "data.table.h"
+
+void benchmark_omp_flag(const int variant, int len, int halt, int th, int *cnt) { // benchmark: 5 ways to share a stop flag in an OpenMP loop; cnt[tid] counts the iterations thread tid did not skip
+  if (variant == 1) {
+    // variant 1: plain bool flag, no qualifier and no atomics ("as is now" -- presumably the pattern currently used elsewhere; confirm)
+    bool skip = false;
+    #pragma omp parallel for num_threads(th)
+    for (int i=0; i<len; i++) { // iterations 0..len-1 are split among the threads of the team
+      if (skip)
+        continue; // continue, not break: remaining iterations are still visited but do no work
+      int tid = omp_get_thread_num(); // index of this thread's own slot in cnt
+      cnt[tid]++; // count an iteration that was not skipped
+      if (i == halt)
+        skip = true; // whichever thread runs iteration halt raises the flag; if halt is outside 0..len-1 it is never raised
+    }
+  } else if (variant == 2) {
+    // variant 2: same loop as variant 1, but the flag is declared volatile
+    volatile bool skip = false;
+    #pragma omp parallel for num_threads(th)
+    for (int i=0; i<len; i++) {
+      if (skip)
+        continue;
+      int tid = omp_get_thread_num(); // index of this thread's own slot in cnt
+      cnt[tid]++;
+      if (i == halt)
+        skip = true;
+    }
+  } else if (variant == 3) {
+    // variant 3: volatile flag that is additionally named in an explicit shared() clause
+    volatile bool skip = false;
+    #pragma omp parallel for num_threads(th) shared(skip)
+    for (int i=0; i<len; i++) {
+      if (skip)
+        continue;
+      int tid = omp_get_thread_num(); // index of this thread's own slot in cnt
+      cnt[tid]++;
+      if (i == halt)
+        skip = true;
+    }
+  } else if (variant == 4) {
+    // variant 4: plain bool flag with explicit shared(); only the store uses omp atomic write, the check at the top of the loop stays a plain read
+    bool skip = false;
+    #pragma omp parallel for num_threads(th) shared(skip)
+    for (int i=0; i<len; i++) {
+      if (skip)
+        continue;
+      int tid = omp_get_thread_num(); // index of this thread's own slot in cnt
+      cnt[tid]++;
+      if (i == halt) {
+        #pragma omp atomic write
+        skip = true; // the atomic construct above applies to this single store
+      }
+    }
+  } else if (variant == 5) {
+    // variant 5: plain bool flag with explicit shared(); the flag is loaded with omp atomic read into a local and stored with omp atomic write
+    bool skip = false;
+    #pragma omp parallel for num_threads(th) shared(skip)
+    for (int i=0; i<len; i++) {
+      bool local_skip; // per-iteration copy of the shared flag
+      #pragma omp atomic read
+      local_skip = skip; // the atomic construct above applies to this single load
+      if (local_skip)
+          continue;
+      int tid = omp_get_thread_num(); // index of this thread's own slot in cnt
+      cnt[tid]++;
+      if (i == halt) {
+        #pragma omp atomic write
+        skip = true;
+      }
+    }
+  } // any other variant value: no loop runs and cnt is left untouched
+}
+
+// .Call entry point for the flag benchmark. Allocates one integer counter per requested
+// thread, zeroes them, runs benchmark_omp_flag() and returns the counters to R.
+// halt is lowered by one before it is handed on, so that it is matched against the
+// 0-based loop index used inside benchmark_omp_flag().
+SEXP benchmark_omp_flagR(SEXP variant, SEXP len, SEXP halt, SEXP th) {
+  const int nth = INTEGER_RO(th)[0];
+  SEXP ans = PROTECT(allocVector(INTSXP, nth));
+  int *counts = INTEGER(ans);
+  // counters start from zero because the benchmark only ever increments them
+  for (int t=0; t<nth; t++)
+    counts[t] = 0;
+  const int which = INTEGER_RO(variant)[0];
+  const int n = INTEGER_RO(len)[0];
+  const int stop = INTEGER_RO(halt)[0]-1;
+  benchmark_omp_flag(which, n, stop, nth, counts);
+  UNPROTECT(1);
+  return ans;
+}

Original file line number	Diff line number	Diff line change
`@@ -227,3 +227,13 @@ formula_vars = function(f, x) { # .formula2varlist is not API and seems to have`
`227`	`227`	`attr(terms, "term.labels")`
`228`	`228`	`)`
`229`	`229`	`}`
	`230`	`+`
	`231`	`+omp_flags = function(variant, len, halt, th) {`
	`232`	`+ th = as.integer(th)`
	`233`	`+ halt = as.integer(halt)`
	`234`	`+ len = as.integer(len)`
	`235`	`+ variant = as.integer(variant)`
	`236`	`+ stopifnot(is.integer(th))`
	`237`	`+ stopifnot(th <= parallel::detectCores(), th > 0L)`
	`238`	`+ .Call("Cbenchmark_omp_flagR", variant, len, halt, th)`
	`239`	`+}`