Commit b5e61b1

improve_benchmark

1 parent 593b788 commit b5e61b1

File tree (5 files changed: +113, -32 lines)

- Makefile
- spark/src/test/scala/org/apache/spark/sql/benchmark/CometAggregateBenchmark.scala
- spark/src/test/scala/org/apache/spark/sql/benchmark/CometArithmeticBenchmark.scala
- spark/src/test/scala/org/apache/spark/sql/benchmark/CometBenchmarkBase.scala
- spark/src/test/scala/org/apache/spark/sql/benchmark/CometCastBenchmark.scala

Makefile

Lines changed: 30 additions & 0 deletions

@@ -105,5 +105,35 @@ release-nogit:
 	./mvnw install -Prelease -DskipTests $(PROFILES) -Dmaven.gitcommitid.skip=true
 benchmark-%: release
 	cd spark && COMET_CONF_DIR=$(shell pwd)/conf MAVEN_OPTS='-Xmx20g ${call spark_jvm_17_extra_args}' ../mvnw exec:java -Dexec.mainClass="$*" -Dexec.classpathScope="test" -Dexec.cleanupDaemonThreads="false" -Dexec.args="$(filter-out $@,$(MAKECMDGOALS))" $(PROFILES)
+
+# Discover all benchmark classes dynamically
+BENCHMARK_CLASSES := $(shell find spark/src/test/scala/org/apache/spark/sql/benchmark -name "Comet*Benchmark.scala" -type f | \
+	xargs grep -l "object.*Benchmark.*extends.*CometBenchmarkBase" | \
+	sed 's|spark/src/test/scala/||g' | \
+	sed 's|/|.|g' | \
+	sed 's|.scala||g' | \
+	sort)
+
+# Run all discovered benchmarks
+benchmark-all:
+	@echo "Discovered benchmarks:"
+	@echo "$(BENCHMARK_CLASSES)" | tr ' ' '\n'
+	@echo ""
+	@echo "Running all benchmarks (this will take a long time)..."
+	@for benchmark in $(BENCHMARK_CLASSES); do \
+		echo ""; \
+		echo "======================================"; \
+		echo "Running: $$benchmark"; \
+		echo "======================================"; \
+		SPARK_GENERATE_BENCHMARK_FILES=1 $(MAKE) benchmark-$$benchmark || echo "WARNING: $$benchmark failed"; \
+	done
+	@echo ""
+	@echo "All benchmarks completed!"
+
+# List all available benchmarks
+list-benchmarks:
+	@echo "Available benchmarks:"
+	@echo "$(BENCHMARK_CLASSES)" | tr ' ' '\n'
+
 .DEFAULT:
 	@: # ignore arguments provided to benchmarks e.g. "make benchmark-foo -- --bar", we do not want to treat "--bar" as target
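
Note: the discovery pipeline turns each matching source file into the fully qualified class name expected by the existing benchmark-% target. A minimal Scala sketch of the same rewrite (the path literal is only an example):

// Illustrative sketch of the path-to-class-name mapping done by the sed pipeline above.
object BenchmarkClassNameSketch extends App {
  val path = "spark/src/test/scala/org/apache/spark/sql/benchmark/CometAggregateBenchmark.scala"
  val fqcn = path
    .stripPrefix("spark/src/test/scala/") // sed 's|spark/src/test/scala/||g'
    .stripSuffix(".scala")                // sed 's|.scala||g'
    .replace('/', '.')                    // sed 's|/|.|g'
  println(fqcn) // org.apache.spark.sql.benchmark.CometAggregateBenchmark
}

With these targets, "make list-benchmarks" prints the discovered classes, and "make benchmark-all" invokes "make benchmark-<class>" for each of them, continuing past individual failures and exporting SPARK_GENERATE_BENCHMARK_FILES=1 so the Spark benchmark framework writes result files.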

spark/src/test/scala/org/apache/spark/sql/benchmark/CometAggregateBenchmark.scala

Lines changed: 17 additions & 19 deletions

@@ -19,8 +19,6 @@
 
 package org.apache.spark.sql.benchmark
 
-import scala.util.Try
-
 import org.apache.spark.benchmark.Benchmark
 import org.apache.spark.sql.SparkSession
 import org.apache.spark.sql.internal.SQLConf
@@ -87,7 +85,7 @@ object CometAggregateBenchmark extends CometBenchmarkBase {
         s"SQL Parquet - Spark (${aggregateFunction.toString}) ansi mode enabled : ${isAnsiMode}") {
         _ =>
           withSQLConf(SQLConf.ANSI_ENABLED.key -> isAnsiMode.toString) {
-            Try { spark.sql(query).noop() }
+            spark.sql(query).noop()
           }
       }
 
@@ -98,7 +96,7 @@ object CometAggregateBenchmark extends CometBenchmarkBase {
           CometConf.COMET_ENABLED.key -> "true",
          CometConf.COMET_EXEC_ENABLED.key -> "true",
          SQLConf.ANSI_ENABLED.key -> isAnsiMode.toString) {
-          Try { spark.sql(query).noop() }
+          spark.sql(query).noop()
        }
      }
 
@@ -137,7 +135,7 @@ object CometAggregateBenchmark extends CometBenchmarkBase {
     benchmark.addCase(
       s"SQL Parquet - Spark (${aggregateFunction.toString}) ansi mode enabled : ${isAnsiMode}") {
       _ =>
-        Try { spark.sql(query).noop() }
+        spark.sql(query).noop()
     }
   }
 
@@ -148,7 +146,7 @@ object CometAggregateBenchmark extends CometBenchmarkBase {
          CometConf.COMET_ENABLED.key -> "true",
          CometConf.COMET_EXEC_ENABLED.key -> "true",
          SQLConf.ANSI_ENABLED.key -> isAnsiMode.toString) {
-          Try { spark.sql(query).noop() }
+          spark.sql(query).noop()
        }
      }
 
@@ -185,7 +183,7 @@ object CometAggregateBenchmark extends CometBenchmarkBase {
         s"SQL Parquet - Spark (${aggregateFunction.toString}) isANSIMode: ${isAnsiMode.toString}") {
         _ =>
           withSQLConf(SQLConf.ANSI_ENABLED.key -> isAnsiMode.toString) {
-            Try { spark.sql(query).noop() }
+            spark.sql(query).noop()
           }
       }
 
@@ -197,7 +195,7 @@ object CometAggregateBenchmark extends CometBenchmarkBase {
          CometConf.COMET_EXEC_ENABLED.key -> "true",
          CometConf.COMET_ONHEAP_MEMORY_OVERHEAD.key -> "1G",
          SQLConf.ANSI_ENABLED.key -> isAnsiMode.toString) {
-          Try { spark.sql(query).noop() }
+          spark.sql(query).noop()
        }
      }
 
@@ -236,7 +234,7 @@ object CometAggregateBenchmark extends CometBenchmarkBase {
         s"SQL Parquet - Spark (${aggregateFunction.toString}) isANSIMode: ${isAnsiMode.toString}") {
         _ =>
           withSQLConf(SQLConf.ANSI_ENABLED.key -> isAnsiMode.toString) {
-            Try { spark.sql(query).noop() }
+            spark.sql(query).noop()
           }
       }
 
@@ -247,7 +245,7 @@ object CometAggregateBenchmark extends CometBenchmarkBase {
          CometConf.COMET_ENABLED.key -> "true",
          CometConf.COMET_EXEC_ENABLED.key -> "true",
          SQLConf.ANSI_ENABLED.key -> isAnsiMode.toString) {
-          Try { spark.sql(query).noop() }
+          spark.sql(query).noop()
        }
      }
 
@@ -260,36 +258,36 @@ object CometAggregateBenchmark extends CometBenchmarkBase {
     val total = 1024 * 1024 * 10
     val combinations = List(100, 1024, 1024 * 1024) // number of distinct groups
     benchmarkAggFuncs.foreach { aggFunc =>
-      Seq(true, false).foreach(k => {
-        runBenchmarkWithTable(
+      Seq(true, false).foreach(ansiMode => {
+        runBenchmarkWithSafeTable(
          s"Grouped Aggregate (single group key + single aggregate $aggFunc)",
          total) { v =>
          for (card <- combinations) {
-            singleGroupAndAggregate(v, card, aggFunc, k)
+            singleGroupAndAggregate(v, card, aggFunc, ansiMode)
          }
        }
 
-        runBenchmarkWithTable(
+        runBenchmarkWithSafeTable(
          s"Grouped Aggregate (multiple group keys + single aggregate $aggFunc)",
          total) { v =>
          for (card <- combinations) {
-            multiGroupKeys(v, card, aggFunc, k)
+            multiGroupKeys(v, card, aggFunc, ansiMode)
          }
        }
 
-        runBenchmarkWithTable(
+        runBenchmarkWithSafeTable(
          s"Grouped Aggregate (single group key + multiple aggregates $aggFunc)",
          total) { v =>
          for (card <- combinations) {
-            multiAggregates(v, card, aggFunc, k)
+            multiAggregates(v, card, aggFunc, ansiMode)
          }
        }
 
-        runBenchmarkWithTable(
+        runBenchmarkWithSafeTable(
          s"Grouped Aggregate (single group key + single aggregate $aggFunc on decimal)",
          total) { v =>
          for (card <- combinations) {
-            singleGroupAndAggregateDecimal(v, DecimalType(18, 10), card, aggFunc, k)
+            singleGroupAndAggregateDecimal(v, DecimalType(18, 10), card, aggFunc, ansiMode)
          }
        }
      })
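
Note: removing the Try wrappers changes what the benchmark cases measure. Previously, a query that threw under ANSI mode was silently swallowed, so the case timed the cost of raising an exception rather than of running the aggregate. A self-contained sketch of that distortion (the timing helper and the failure are invented for illustration):

import scala.util.Try

object TrySkewSketch extends App {
  def timeNanos(body: => Unit): Long = {
    val start = System.nanoTime()
    body
    System.nanoTime() - start
  }

  // Stand-in for an ANSI overflow thrown inside spark.sql(query).noop()
  def failingQuery(): Unit = throw new ArithmeticException("overflow")

  // The swallowed failure "finishes" almost instantly, so the recorded time is meaningless.
  println(timeNanos(Try(failingQuery())))
  // With the wrapper removed, as in this commit, the exception propagates and a broken
  // case fails loudly instead of reporting a bogus measurement.
}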

spark/src/test/scala/org/apache/spark/sql/benchmark/CometArithmeticBenchmark.scala

Lines changed: 1 addition & 1 deletion

@@ -84,7 +84,7 @@ object CometArithmeticBenchmark extends CometBenchmarkBase {
 
     Seq(true, false).foreach { useDictionary =>
       Seq(Minus, Mul).foreach { op =>
-        runBenchmarkWithTable(op.name, TOTAL, useDictionary) { v =>
+        runBenchmarkWithSafeTable(op.name, TOTAL, useDictionary) { v =>
          integerArithmeticBenchmark(v, op, useDictionary)
        }
      }
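
Note: switching to runBenchmarkWithSafeTable bounds the generated values below 10000 (or to 0-4 when dictionary encoding is exercised), so the Minus and Mul cases should no longer overflow a 32-bit integer under ANSI mode. A quick check of the worst case, assuming both operands come from the same bounded column:

object ArithmeticBoundsSketch extends App {
  val maxInput = 9999L // runBenchmarkWithSafeTable generates i % 10000
  assert(maxInput * maxInput < Int.MaxValue) // 99980001 < 2147483647
}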

spark/src/test/scala/org/apache/spark/sql/benchmark/CometBenchmarkBase.scala

Lines changed: 56 additions & 11 deletions

@@ -23,7 +23,7 @@ import java.io.File
 import java.nio.charset.StandardCharsets
 import java.util.Base64
 
-import scala.util.{Random, Try}
+import scala.util.Random
 
 import org.apache.parquet.crypto.DecryptionPropertiesFactory
 import org.apache.parquet.crypto.keytools.{KeyToolkit, PropertiesDrivenCryptoFactory}
@@ -33,7 +33,7 @@ import org.apache.spark.benchmark.Benchmark
 import org.apache.spark.sql.{DataFrame, DataFrameWriter, Row, SparkSession}
 import org.apache.spark.sql.execution.benchmark.SqlBasedBenchmark
 import org.apache.spark.sql.internal.SQLConf
-import org.apache.spark.sql.types.DecimalType
+import org.apache.spark.sql.types.{DataType, DecimalType}
 
 import org.apache.comet.CometConf
 import org.apache.comet.CometSparkSessionExtensions
@@ -88,6 +88,54 @@ trait CometBenchmarkBase extends SqlBasedBenchmark {
     }
   }
 
+  /**
+   * Creates a table with ANSI-safe values that won't overflow in arithmetic operations. Use this
+   * instead of runBenchmarkWithTable for arithmetic/aggregate benchmarks.
+   */
+  protected def runBenchmarkWithSafeTable(
+      benchmarkName: String,
+      values: Int,
+      useDictionary: Boolean = false)(f: Int => Any): Unit = {
+    withTempTable(tbl) {
+      import spark.implicits._
+      spark
+        .range(values)
+        .map(i => if (useDictionary) i % 5 else i % 10000)
+        .createOrReplaceTempView(tbl)
+      runBenchmark(benchmarkName)(f(values))
+    }
+  }
+
+  /**
+   * Generates ANSI-safe data for casting from Long to the specified target type. Returns a SQL
+   * expression that transforms the base "value" column to be within safe ranges.
+   *
+   * @param targetType
+   *   The target data type for casting
+   * @return
+   *   SQL expression to generate safe data
+   */
+  protected def generateAnsiSafeData(targetType: DataType): String = {
+    import org.apache.spark.sql.types._
+
+    // Long inputs are generated up front; this match rewrites them into the target type's safe range so the cast cannot fail in ANSI mode.
+    targetType match {
+      case ByteType => "CAST((value % 128) AS BIGINT)"
+      case ShortType => "CAST((value % 32768) AS BIGINT)"
+      case IntegerType => "CAST((value % 2147483648) AS BIGINT)"
+      case LongType => "value"
+      case FloatType => "CAST((value % 1000000) AS BIGINT)"
+      case DoubleType => "value"
+      case _: DecimalType => "CAST((value % 100000000) AS BIGINT)"
+      case StringType => "CAST(value AS STRING)"
+      case BooleanType => "CAST((value % 2) AS BIGINT)"
+      case DateType => "CAST((value % 18262) AS BIGINT)"
+      case TimestampType => "value"
+      case BinaryType => "value"
+      case _ => "value"
+    }
+  }
+
   /**
    * Runs an expression benchmark with standard cases: Spark, Comet (Scan), Comet (Scan + Exec).
    * This provides a consistent benchmark structure for expression evaluation.
@@ -143,13 +191,8 @@ trait CometBenchmarkBase extends SqlBasedBenchmark {
   }
 
   private def runSparkCommand(spark: SparkSession, query: String, isANSIMode: Boolean): Unit = {
-    if (isANSIMode) {
-      Try {
-        spark.sql(query).noop()
-      }
-    } else {
-      spark.sql(query).noop()
-    }
+    // With ANSI-safe data generation, queries should not throw exceptions
+    spark.sql(query).noop()
   }
 
   protected def prepareTable(dir: File, df: DataFrame, partition: Option[String] = None): Unit = {
@@ -244,10 +287,12 @@ trait CometBenchmarkBase extends SqlBasedBenchmark {
       useDictionary: Boolean): DataFrame = {
     import spark.implicits._
 
-    val div = if (useDictionary) 5 else values
+    // Use safe range to avoid overflow in decimal operations
+    val maxValue = 10000
+    val div = if (useDictionary) 5 else maxValue
     spark
       .range(values)
-      .map(_ % div)
+      .map(i => i % div)
       .select((($"value" - 500) / 100.0) cast decimal as Symbol("dec"))
   }
 }
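
Note: the moduli in generateAnsiSafeData keep the non-negative base column inside each target type's domain, since value % m lands in [0, m - 1] for non-negative values. A self-contained check of the integral bounds used above:

object SafeRangeSketch extends App {
  assert(128L - 1 == Byte.MaxValue)       // ByteType:    value % 128   -> [0, 127]
  assert(32768L - 1 == Short.MaxValue)    // ShortType:   value % 32768 -> [0, 32767]
  assert(2147483648L - 1 == Int.MaxValue) // IntegerType: value % 2^31  -> [0, Int.MaxValue]
  // DateType: 18262 days is roughly 50 years past the epoch, well inside the valid range.
  // DecimalType: value % 100000000 leaves at most 8 integer digits, which fits the
  // DecimalType(18, 10) used by the aggregate benchmark.
}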

spark/src/test/scala/org/apache/spark/sql/benchmark/CometCastBenchmark.scala

Lines changed: 9 additions & 1 deletion

@@ -79,7 +79,15 @@ object CometCastBenchmark extends CometBenchmarkBase {
 
     withTempPath { dir =>
       withTempTable("parquetV1Table") {
-        prepareTable(dir, spark.sql(s"SELECT value FROM $tbl"))
+        // Generate ANSI-safe data when in ANSI mode to avoid overflow exceptions.
+        // In legacy mode, use raw values to test overflow handling.
+        val dataExpr = if (isAnsiMode) {
+          generateAnsiSafeData(toDataType)
+        } else {
+          "value"
+        }
+
+        prepareTable(dir, spark.sql(s"SELECT $dataExpr as value FROM $tbl"))
 
         val functionSQL = castExprSQL(toDataType, "value")
        val query = s"SELECT $functionSQL FROM parquetV1Table"
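
Note: in ANSI mode an out-of-range cast throws instead of wrapping, which is why the input column is only rewritten when isAnsiMode is set; legacy mode keeps the raw values to exercise overflow handling. A sketch of the two query shapes this branch produces for a ByteType target (the tbl view name comes from CometBenchmarkBase, and the safe expression assumes the generateAnsiSafeData mapping above):

object CastQueryShapesSketch extends App {
  val tbl = "tbl"
  val ansiQuery = s"SELECT CAST((value % 128) AS BIGINT) as value FROM $tbl" // safe domain
  val legacyQuery = s"SELECT value as value FROM $tbl" // raw values, cast may overflow
  println(ansiQuery)
  println(legacyQuery)
}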
