Kotlin
diff --git a/‎benchmarks/build.gradle‎
Lines changed: 1 addition & 1 deletion b/‎benchmarks/build.gradle‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎benchmarks/src/jmh/kotlin/benchmarks/ForkJoinBenchmark.kt‎
Lines changed: 166 additions & 0 deletions b/‎benchmarks/src/jmh/kotlin/benchmarks/ForkJoinBenchmark.kt‎
Lines changed: 166 additions & 0 deletions
diff --git a/‎benchmarks/src/jmh/kotlin/benchmarks/GuideSyncBenchmark.kt‎
Lines changed: 7 additions & 7 deletions b/‎benchmarks/src/jmh/kotlin/benchmarks/GuideSyncBenchmark.kt‎
Lines changed: 7 additions & 7 deletions
diff --git a/‎benchmarks/src/jmh/kotlin/benchmarks/LaunchBenchmark.kt‎
Lines changed: 52 additions & 0 deletions b/‎benchmarks/src/jmh/kotlin/benchmarks/LaunchBenchmark.kt‎
Lines changed: 52 additions & 0 deletions
diff --git a/‎benchmarks/src/jmh/kotlin/benchmarks/ParametrizedDispatcherBase.kt‎
Lines changed: 43 additions & 0 deletions b/‎benchmarks/src/jmh/kotlin/benchmarks/ParametrizedDispatcherBase.kt‎
Lines changed: 43 additions & 0 deletions
@@ -11,7 +11,7 @@ repositories {
 }
 
 dependencies {
-    jmh 'com.typesafe.akka:akka-actor:2.0.2'
+    jmh 'com.typesafe.akka:akka-actor_2.12:2.5.0'
     jmh project(':kotlinx-coroutines-core-common')
     jmh project(':kotlinx-coroutines-core')
     jmh project(':kotlinx-coroutines-core').sourceSets.test.output
 
@@ -0,0 +1,166 @@
+package benchmarks
+
+import benchmarks.ForkJoinBenchmark.Companion.BATCH_SIZE
+import kotlinx.coroutines.experimental.CommonPool
+import kotlinx.coroutines.experimental.Deferred
+import kotlinx.coroutines.experimental.async
+import kotlinx.coroutines.experimental.runBlocking
+import org.openjdk.jmh.annotations.*
+import java.util.concurrent.*
+import kotlin.coroutines.experimental.CoroutineContext
+
+/*
+ * Comparison of fork-join tasks using specific FJP API and classic [async] jobs.
+ * FJP job is organized in perfectly balanced binary tree, every leaf node computes
+ * FPU-heavy sum over its data and intermediate nodes sum results.
+ *
+ * Fine-grained batch size (8192 * 1024 tasks, 128 in sequential batch)
+ * ForkJoinBenchmark.asyncExperimental  avgt   10  681.512 ± 32.069  ms/op
+ * ForkJoinBenchmark.asyncFjp           avgt   10  845.386 ± 73.204  ms/op
+ * ForkJoinBenchmark.fjpRecursiveTask   avgt   10  692.120 ± 26.224  ms/op
+ * ForkJoinBenchmark.fjpTask            avgt   10  791.087 ± 66.544  ms/op
+ *
+ * Too small tasks (8192 * 1024 tasks, 128 batch, 16 in sequential batch)
+ * Benchmark                            Mode  Cnt     Score     Error  Units
+ * ForkJoinBenchmark.asyncExperimental  avgt   10  1273.271 ± 190.372  ms/op
+ * ForkJoinBenchmark.asyncFjp           avgt   10  1406.102 ± 216.793  ms/op
+ * ForkJoinBenchmark.fjpRecursiveTask   avgt   10   849.941 ± 141.254  ms/op
+ * ForkJoinBenchmark.fjpTask            avgt   10   831.554 ±  57.276  ms/op
+ */
+@Warmup(iterations = 5, time = 1, timeUnit = TimeUnit.SECONDS)
+@Measurement(iterations = 5, time = 1, timeUnit = TimeUnit.SECONDS)
+@Fork(value = 2)
+@BenchmarkMode(Mode.AverageTime)
+@OutputTimeUnit(TimeUnit.MILLISECONDS)
+@State(Scope.Benchmark)
+open class ForkJoinBenchmark : ParametrizedDispatcherBase() {
+
+    companion object {
+        /*
+         * Change task size to control global granularity of benchmark
+         * Change batch size to control affinity/work stealing/scheduling overhead effects
+         */
+        const val TASK_SIZE = 8192 * 1024
+        const val BATCH_SIZE = 32 * 8192
+    }
+
+    lateinit var coefficients: LongArray
+    override var dispatcher: String = "experimental"
+
+    @Setup
+    override fun setup() {
+        super.setup()
+        coefficients = LongArray(TASK_SIZE) { ThreadLocalRandom.current().nextLong(0, 1024 * 1024) }
+    }
+
+    @Benchmark
+    fun asyncFjp() = runBlocking {
+        startAsync(coefficients, 0, coefficients.size, CommonPool).await()
+    }
+
+    @Benchmark
+    fun asyncExperimental() = runBlocking {
+        startAsync(coefficients, 0, coefficients.size, benchmarkContext).await()
+    }
+
+    @Benchmark
+    fun fjpRecursiveTask(): Double {
+        val task = RecursiveAction(coefficients, 0, coefficients.size)
+        return ForkJoinPool.commonPool().submit(task).join()
+    }
+
+    @Benchmark
+    fun fjpTask(): Double {
+        val task = Task(coefficients, 0, coefficients.size)
+        return ForkJoinPool.commonPool().submit(task).join()
+    }
+
+    suspend fun startAsync(coefficients: LongArray, start: Int, end: Int, dispatcher: CoroutineContext): Deferred<Double> = async(dispatcher) {
+        if (end - start <= BATCH_SIZE) {
+            compute(coefficients, start, end)
+        } else {
+            val first = startAsync(coefficients, start, start + (end - start) / 2, dispatcher)
+            val second = startAsync(coefficients, start + (end - start) / 2, end, dispatcher)
+            first.await() + second.await()
+        }
+    }
+
+    class Task(val coefficients: LongArray, val start: Int, val end: Int) : RecursiveTask<Double>() {
+        override fun compute(): Double {
+            if (end - start <= BATCH_SIZE) {
+                return compute(coefficients, start, end)
+            }
+
+            val first = Task(coefficients, start, start + (end - start) / 2).fork()
+            val second = Task(coefficients, start + (end - start) / 2, end).fork()
+
+            var result = 0.0
+            result += first.join()
+            result += second.join()
+            return result
+        }
+
+        private fun compute(coefficients: LongArray, start: Int, end: Int): Double {
+            var result = 0.0
+            for (i in start until end) {
+                result += Math.sin(Math.pow(coefficients[i].toDouble(), 1.1)) + 1e-8
+            }
+
+            return result
+        }
+    }
+
+    /**
+     * [CountedCompleter]-based variant of the fork-join sum over `coefficients[start, end)`.
+     *
+     * A range of at most [BATCH_SIZE] elements is summed directly with the file-level `compute` helper.
+     * A larger range is split in half, both halves are forked as child completers of this node,
+     * and their partial sums are combined in [onCompletion].
+     *
+     * @param coefficients input data shared by the whole task tree
+     * @param start inclusive start index of the range handled by this node
+     * @param end exclusive end index of the range handled by this node
+     * @param result storage for the raw result of this node
+     * @param parent completer that is notified when this node completes, `null` for the root
+     */
+    class RecursiveAction(val coefficients: LongArray, val start: Int, val end: Int, @Volatile var result: Double = 0.0,
+                          parent: RecursiveAction? = null) : CountedCompleter<Double>(parent) {
+
+        // Forked halves of an intermediate node; both stay null for a leaf node.
+        private var first: ForkJoinTask<Double>? = null
+        private var second: ForkJoinTask<Double>? = null
+
+        override fun getRawResult(): Double {
+            return result
+        }
+
+        override fun setRawResult(t: Double) {
+            result = t
+        }
+
+        override fun compute() {
+            if (end - start <= BATCH_SIZE) {
+                rawResult = compute(coefficients, start, end)
+            } else {
+                // Two children plus the tryComplete() call below: three completion attempts in total,
+                // the last of which (in whatever order they arrive) triggers onCompletion.
+                pendingCount = 2
+                // One may fork only once here and executing second task here with looping over firstComplete to be even more efficient
+                first = RecursiveAction(coefficients, start, start + (end - start) / 2, parent = this).fork()
+                second = RecursiveAction(coefficients, start + (end - start) / 2, end, parent = this).fork()
+            }
+
+            tryComplete()
+        }
+
+        override fun onCompletion(caller: CountedCompleter<*>?) {
+            // Leaf and intermediate nodes are told apart by the presence of children, not by `caller`:
+            // when both children finish before this node's own tryComplete() runs, that call is the
+            // one that drops the pending count to zero and `caller` is this node itself. Checking
+            // `caller !== this` would then skip the summation and leave the result at its default.
+            val left = first
+            val right = second
+            if (left != null && right != null) {
+                rawResult = left.rawResult + right.rawResult
+            }
+            super.onCompletion(caller)
+        }
+    }
+}
+
+
+private fun compute(coefficients: LongArray, start: Int, end: Int): Double {
+    var result = 0.0
+    for (i in start until end) {
+        result += Math.sin(Math.pow(coefficients[i].toDouble(), 1.1)) + 1e-8
+    }
+
+    return result
+}
+
+
+fun main(args: Array<String>) {
+    // Hand-rolled test: prints the sum computed by Task and then by RecursiveAction
+    // over the same randomly filled array.
+    val arr = LongArray(BATCH_SIZE * 8) { ThreadLocalRandom.current().nextLong(0, 100) }
+
+    println(ForkJoinPool.commonPool().submit(ForkJoinBenchmark.Task(arr, 0, arr.size)).join())
+    println(ForkJoinBenchmark.RecursiveAction(arr, 0, arr.size).invoke())
+}
@@ -45,36 +45,36 @@ open class GuideSyncBenchmark {
 
     @Benchmark
     fun sync01Problem() {
-        guide.sync.example01.main(emptyArray())
+        kotlinx.coroutines.experimental.guide.sync01.main(emptyArray())
     }
 
     @Benchmark
     fun sync02Volatile() {
-        guide.sync.example02.main(emptyArray())
+        kotlinx.coroutines.experimental.guide.sync02.main(emptyArray())
     }
 
     @Benchmark
     fun sync03AtomicInt() {
-        guide.sync.example03.main(emptyArray())
+        kotlinx.coroutines.experimental.guide.sync03.main(emptyArray())
     }
 
     @Benchmark
     fun sync04ConfineFine() {
-        guide.sync.example04.main(emptyArray())
+        kotlinx.coroutines.experimental.guide.sync04.main(emptyArray())
     }
 
     @Benchmark
     fun sync05ConfineCoarse() {
-        guide.sync.example05.main(emptyArray())
+        kotlinx.coroutines.experimental.guide.sync05.main(emptyArray())
     }
 
     @Benchmark
     fun sync06Mutex() {
-        guide.sync.example06.main(emptyArray())
+        kotlinx.coroutines.experimental.guide.sync06.main(emptyArray())
     }
 
     @Benchmark
     fun sync07Actor() {
-        guide.sync.example07.main(emptyArray())
+        kotlinx.coroutines.experimental.guide.sync07.main(emptyArray())
     }
 }
@@ -0,0 +1,52 @@
+package benchmarks
+
+import kotlinx.coroutines.experimental.launch
+import org.openjdk.jmh.annotations.*
+import java.util.concurrent.CyclicBarrier
+import java.util.concurrent.TimeUnit
+
+/*
+ * Benchmark to measure scheduling overhead in comparison with FJP.
+ * LaunchBenchmark.massiveLaunch  experimental  avgt   30  328.662 ± 52.789  us/op
+ * LaunchBenchmark.massiveLaunch           fjp  avgt   30  179.762 ±  3.931  us/op
+ */
+@Warmup(iterations = 10, time = 1, timeUnit = TimeUnit.SECONDS)
+@Measurement(iterations = 10, time = 1, timeUnit = TimeUnit.SECONDS)
+@Fork(value = 2)
+@BenchmarkMode(Mode.AverageTime)
+@OutputTimeUnit(TimeUnit.MICROSECONDS)
+@State(Scope.Benchmark)
+open class LaunchBenchmark : ParametrizedDispatcherBase() {
+
+    // Dispatcher name consumed by ParametrizedDispatcherBase.setup(); JMH runs the benchmark once per listed value.
+    @Param("experimental", "fjp")
+    override var dispatcher: String = "fjp"
+
+    // Number of empty child coroutines launched by every submitter coroutine.
+    private val jobsToLaunch = 100
+    // Number of submitter coroutines started per benchmark invocation.
+    private val submitters = 4
+
+    // Trips once all submitter coroutines have reached it.
+    private val allLaunched = CyclicBarrier(submitters)
+    // Trips once all submitter coroutines and the benchmark thread (the "+ 1" party) have reached it.
+    private val stopBarrier = CyclicBarrier(submitters + 1)
+
+    /**
+     * Starts [submitters] coroutines on [benchmarkContext]. Each of them launches [jobsToLaunch] empty
+     * coroutines in its own context and joins them. The method returns after every submitter has finished.
+     *
+     * NOTE(review): the barrier waits below block the thread they run on, so this presumably needs a
+     * dispatcher with at least [submitters] worker threads to make progress; confirm for small pools.
+     */
+    @Benchmark
+    fun massiveLaunch() {
+        repeat(submitters) {
+            launch(benchmarkContext) {
+                // Wait until all submitter coroutines are running
+                allLaunched.await()
+                allLaunched.reset()
+
+                (1..jobsToLaunch).map {
+                    launch(coroutineContext) {
+                        // do nothing
+                    }
+                }.map { it.join() }
+
+                // Signal the benchmark thread that this submitter is done
+                stopBarrier.await()
+            }
+        }
+
+        // Block the benchmark thread until all submitters have joined their jobs
+        stopBarrier.await()
+        stopBarrier.reset()
+    }
+
+}
@@ -0,0 +1,43 @@
+package benchmarks
+
+import benchmarks.actors.CORES_COUNT
+import kotlinx.coroutines.experimental.CommonPool
+import kotlinx.coroutines.experimental.ThreadPoolDispatcher
+import kotlinx.coroutines.experimental.newFixedThreadPoolContext
+import kotlinx.coroutines.experimental.scheduling.*
+import org.openjdk.jmh.annotations.Param
+import org.openjdk.jmh.annotations.Setup
+import org.openjdk.jmh.annotations.TearDown
+import java.io.Closeable
+import kotlin.coroutines.experimental.CoroutineContext
+
+/**
+ * Base class to use different [CoroutineContext] in benchmarks via [Param] in inheritors.
+ * Currently allowed values are "fjp" for [CommonPool], "experimental" for [ExperimentalCoroutineDispatcher]
+ * and "ftp_n" for [ThreadPoolDispatcher] with n threads.
+ */
+abstract class ParametrizedDispatcherBase {
+
+    abstract var dispatcher: String
+    lateinit var benchmarkContext: CoroutineContext // coroutineContext clashes with scope parameter
+    var closeable: Closeable? = null
+
+    @Setup
+    open fun setup() {
+        benchmarkContext = when {
+            dispatcher == "fjp" -> CommonPool
+            dispatcher == "experimental" -> {
+                ExperimentalCoroutineDispatcher(CORES_COUNT).also { closeable = it }
+            }
+            dispatcher.startsWith("ftp") -> {
+                newFixedThreadPoolContext(dispatcher.substring(4).toInt(), dispatcher).also { closeable = it }
+            }
+            else -> error("Unexpected dispatcher: $dispatcher")
+        }
+    }
+
+    @TearDown
+    fun tearDown() {
+        closeable?.close()
+    }
+
+}
Original file line number	Diff line number	Diff line change
`@@ -11,7 +11,7 @@ repositories {`
`11`	`11`	`}`
`12`	`12`
`13`	`13`	`dependencies {`
`14`		`- jmh 'com.typesafe.akka:akka-actor:2.0.2'`
	`14`	`+ jmh 'com.typesafe.akka:akka-actor_2.12:2.5.0'`
`15`	`15`	`jmh project(':kotlinx-coroutines-core-common')`
`16`	`16`	`jmh project(':kotlinx-coroutines-core')`
`17`	`17`	`jmh project(':kotlinx-coroutines-core').sourceSets.test.output`
Original file line number	Diff line number	Diff line change
`@@ -45,36 +45,36 @@ open class GuideSyncBenchmark {`
`45`	`45`
`46`	`46`	`@Benchmark`
`47`	`47`	`fun sync01Problem() {`
`48`		`- guide.sync.example01.main(emptyArray())`
	`48`	`+ kotlinx.coroutines.experimental.guide.sync01.main(emptyArray())`
`49`	`49`	`}`
`50`	`50`
`51`	`51`	`@Benchmark`
`52`	`52`	`fun sync02Volatile() {`
`53`		`- guide.sync.example02.main(emptyArray())`
	`53`	`+ kotlinx.coroutines.experimental.guide.sync02.main(emptyArray())`
`54`	`54`	`}`
`55`	`55`
`56`	`56`	`@Benchmark`
`57`	`57`	`fun sync03AtomicInt() {`
`58`		`- guide.sync.example03.main(emptyArray())`
	`58`	`+ kotlinx.coroutines.experimental.guide.sync03.main(emptyArray())`
`59`	`59`	`}`
`60`	`60`
`61`	`61`	`@Benchmark`
`62`	`62`	`fun sync04ConfineFine() {`
`63`		`- guide.sync.example04.main(emptyArray())`
	`63`	`+ kotlinx.coroutines.experimental.guide.sync04.main(emptyArray())`
`64`	`64`	`}`
`65`	`65`
`66`	`66`	`@Benchmark`
`67`	`67`	`fun sync05ConfineCoarse() {`
`68`		`- guide.sync.example05.main(emptyArray())`
	`68`	`+ kotlinx.coroutines.experimental.guide.sync05.main(emptyArray())`
`69`	`69`	`}`
`70`	`70`
`71`	`71`	`@Benchmark`
`72`	`72`	`fun sync06Mutex() {`
`73`		`- guide.sync.example06.main(emptyArray())`
	`73`	`+ kotlinx.coroutines.experimental.guide.sync06.main(emptyArray())`
`74`	`74`	`}`
`75`	`75`
`76`	`76`	`@Benchmark`
`77`	`77`	`fun sync07Actor() {`
`78`		`- guide.sync.example07.main(emptyArray())`
	`78`	`+ kotlinx.coroutines.experimental.guide.sync07.main(emptyArray())`
`79`	`79`	`}`
`80`	`80`	`}`