Zouxxyy
diff --git a/‎scalastyle-config.xml‎
Lines changed: 2 additions & 2 deletions b/‎scalastyle-config.xml‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/rules/RuleExecutor.scala‎
Lines changed: 1 addition & 1 deletion b/‎sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/rules/RuleExecutor.scala‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎sql/core/pom.xml‎
Lines changed: 6 additions & 0 deletions b/‎sql/core/pom.xml‎
Lines changed: 6 additions & 0 deletions
diff --git a/‎sql/core/src/test/resources/learn/datasource/json.text‎
Lines changed: 2 additions & 0 deletions b/‎sql/core/src/test/resources/learn/datasource/json.text‎
Lines changed: 2 additions & 0 deletions
diff --git a/‎sql/core/src/test/resources/log4j2.properties‎
Lines changed: 2 additions & 2 deletions b/‎sql/core/src/test/resources/log4j2.properties‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎sql/core/src/test/scala/org/apache/spark/sql/learn/BaseTest.scala‎
Lines changed: 78 additions & 0 deletions b/‎sql/core/src/test/scala/org/apache/spark/sql/learn/BaseTest.scala‎
Lines changed: 78 additions & 0 deletions
diff --git a/‎sql/core/src/test/scala/org/apache/spark/sql/learn/bugfix/RDDAndDataframe.scala‎
Lines changed: 51 additions & 0 deletions b/‎sql/core/src/test/scala/org/apache/spark/sql/learn/bugfix/RDDAndDataframe.scala‎
Lines changed: 51 additions & 0 deletions
diff --git a/‎sql/core/src/test/scala/org/apache/spark/sql/learn/bugfix/WriteChar.scala‎
Lines changed: 58 additions & 0 deletions b/‎sql/core/src/test/scala/org/apache/spark/sql/learn/bugfix/WriteChar.scala‎
Lines changed: 58 additions & 0 deletions
diff --git a/‎sql/core/src/test/scala/org/apache/spark/sql/learn/datasource/DataType.scala‎
Lines changed: 103 additions & 0 deletions b/‎sql/core/src/test/scala/org/apache/spark/sql/learn/datasource/DataType.scala‎
Lines changed: 103 additions & 0 deletions
diff --git a/‎sql/core/src/test/scala/org/apache/spark/sql/learn/datasource/Filter.scala‎
Lines changed: 55 additions & 0 deletions b/‎sql/core/src/test/scala/org/apache/spark/sql/learn/datasource/Filter.scala‎
Lines changed: 55 additions & 0 deletions
@@ -71,9 +71,9 @@ This file is divided into 3 sections:
 
   <check level="error" class="org.scalastyle.scalariform.SpacesBeforePlusChecker" enabled="true"></check>
 
-  <check level="error" class="org.scalastyle.file.WhitespaceEndOfLineChecker" enabled="true"></check>
+  <check level="error" class="org.scalastyle.file.WhitespaceEndOfLineChecker" enabled="false"></check>
 
-  <check level="error" class="org.scalastyle.file.FileLineLengthChecker" enabled="true">
+  <check level="error" class="org.scalastyle.file.FileLineLengthChecker" enabled="false">
     <parameters>
       <parameter name="maxLineLength"><![CDATA[100]]></parameter>
       <parameter name="tabSize"><![CDATA[2]]></parameter>
 
@@ -285,7 +285,7 @@ abstract class RuleExecutor[TreeType <: TreeNode[_]] extends Logging {
 
       planChangeLogger.logBatch(batch.name, batchStartPlan, curPlan)
     }
-    planChangeLogger.logMetrics(RuleExecutor.getCurrentMetrics() - beforeMetrics)
+    // planChangeLogger.logMetrics(RuleExecutor.getCurrentMetrics() - beforeMetrics)
 
     curPlan
   }
 
@@ -217,6 +217,12 @@
       <artifactId>htmlunit-driver</artifactId>
       <scope>test</scope>
     </dependency>
+    <dependency>
+      <groupId>org.apache.paimon</groupId>
+      <artifactId>paimon-spark-3.5</artifactId>
+      <version>1.0.1</version>
+      <scope>test</scope>
+    </dependency>
   </dependencies>
   <build>
     <outputDirectory>target/scala-${scala.binary.version}/classes</outputDirectory>
 
@@ -0,0 +1,2 @@
+{"name":"Yin", "address":{"city":"Columbus","state":"Ohio"}}
+{"name":123456, "address":{"city":null, "state":"California", "extraMetadata":"test message"}}
@@ -25,9 +25,9 @@ appender.console.type = Console
 appender.console.name = STDOUT
 appender.console.target = SYSTEM_OUT
 appender.console.layout.type = PatternLayout
-appender.console.layout.pattern = %d{HH:mm:ss.SSS} %p %c: %maxLen{%m}{512}%n%ex{8}%n
+appender.console.layout.pattern = %d{HH:mm:ss.SSS} %p %c: %maxLen{%m}{5120}%n%ex{8}%n
 appender.console.filter.threshold.type = ThresholdFilter
-appender.console.filter.threshold.level = warn
+appender.console.filter.threshold.level = error
 
 #File Appender
 appender.file.type = File
 
@@ -0,0 +1,78 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements.  See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License.  You may obtain a copy of the License at
+ *
+ *    http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.learn
+
+import java.io.File
+
+import org.apache.spark.SparkConf
+import org.apache.spark.sql.{DataFrame, QueryTest, SparkSession}
+import org.apache.spark.sql.test.SharedSparkSession
+import org.apache.spark.util.Utils
+
+abstract class BaseTest extends QueryTest with SharedSparkSession {
+
+  val _spark: SparkSession = spark
+
+  protected lazy val tempDBDir: File = Utils.createTempDir()
+
+  protected val dbName0: String = "test"
+
+  override protected def sparkConf: SparkConf = {
+    super.sparkConf
+      .set("spark.sql.catalog.paimon", "org.apache.paimon.spark.SparkCatalog")
+      .set("spark.sql.catalog.paimon.warehouse", tempDBDir.getCanonicalPath)
+      .set("spark.sql.extensions",
+        "org.apache.paimon.spark.extensions.PaimonSparkSessionExtensions")
+      .set("spark.sql.planChangeLog.level", "error")
+      .set("spark.sql.planChangeLog.batches", "")
+      .set("spark.sql.planChangeLog.rules", "")
+//      .set("spark.default.parallelism", "4")
+      .set("spark.eventLog.enabled", "false")
+      .set("spark.eventLog.dir", "/Users/zxy/data/spark/history")
+  }
+
+  override protected def beforeAll(): Unit = {
+    super.beforeAll()
+    spark.sql(s"USE paimon")
+    spark.sql(s"CREATE DATABASE IF NOT EXISTS paimon.$dbName0")
+  }
+
+  override protected def afterAll(): Unit = {
+    try {
+      spark.sql(s"USE paimon")
+      // spark.sql(s"USE default")
+      spark.sql(s"DROP DATABASE IF EXISTS paimon.$dbName0 CASCADE")
+    } finally {
+      super.afterAll()
+    }
+  }
+
+  def printPlan(df: DataFrame): Unit = {
+    // scalastyle:off println
+    println("=== Optimized Plan ===")
+    val optimizedPlan = df.queryExecution.optimizedPlan
+    println(optimizedPlan)
+
+    println("=== Executed Plan ===")
+    val executedPlan = df.queryExecution.executedPlan
+    println(executedPlan)
+    // scalastyle:on println
+
+    df.show()
+  }
+}
@@ -0,0 +1,51 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements.  See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License.  You may obtain a copy of the License at
+ *
+ *    http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.learn.bugfix
+
+import org.apache.spark.sql.functions.col
+import org.apache.spark.sql.learn.BaseTest
+
+class RDDAndDataframe extends BaseTest {
+
+  import testImplicits._
+
+  test("RDD: test parallelize") {
+    val tuples = spark.sparkContext.parallelize(1 to 1).map(x => (x, x)).collect()
+    tuples
+  }
+
+  test("Dataframe: test repartitionByCol") {
+    withSQLConf("spark.sql.adaptive.enabled" -> "false") {
+      withSQLConf("spark.sql.shuffle.partitions" -> "40") {
+        val df = (1 to 20).toDF("id")
+        val partitions = df.rdd.getNumPartitions
+        val df2 = df.repartition(col("id"))
+        val partitions2 = df2.rdd.getNumPartitions
+        df2.collect()
+      }
+
+      withSQLConf("spark.sql.shuffle.partitions" -> "10") {
+        val df = (1 to 20).toDF("id")
+        val partitions = df.rdd.getNumPartitions
+        val df2 = df.repartition(col("id"))
+        val partitions2 = df2.rdd.getNumPartitions
+        df2.collect()
+      }
+    }
+  }
+}
@@ -0,0 +1,58 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements.  See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License.  You may obtain a copy of the License at
+ *
+ *    http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.learn.bugfix
+
+import org.apache.spark.sql.Row
+import org.apache.spark.sql.learn.BaseTest
+
+class WriteChar extends BaseTest {
+
+  test("Bug fix: test write char with parquet") {
+    sql("use spark_catalog")
+    sql(s"CREATE DATABASE test_db LOCATION '$tempDBDir'")
+    sql(s"USE test_db")
+
+    withTable("target", "source") {
+      sql(
+        s"""
+           |CREATE TABLE test_db.target (c char(6))
+           |USING parquet
+           |""".stripMargin)
+
+      sql(
+        s"""
+           |CREATE TABLE test_db.source (c char(6))
+           |USING parquet
+           |""".stripMargin)
+
+      withSQLConf("spark.sql.legacy.charVarcharAsString" -> "true") {
+        sql("INSERT INTO test_db.source VALUES ('ab')")
+      }
+
+      withSQLConf("spark.sql.readSideCharPadding" -> "false") {
+        sql(s"INSERT INTO target SELECT * FROM source")
+        checkAnswer(
+          spark.sql("SELECT c FROM source"), Row("ab"))
+        checkAnswer(
+          spark.sql("SELECT c FROM target"), Row("ab    "))
+      }
+    }
+    sql(s"DROP DATABASE test_db")
+    sql(s"USE paimon")
+  }
+}
@@ -0,0 +1,103 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements.  See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License.  You may obtain a copy of the License at
+ *
+ *    http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.learn.datasource
+
+import org.apache.spark.sql.learn.BaseTest
+
+class DataType extends BaseTest {
+
+  test("DataType: struct type") {
+    withTable("students") {
+      sql(
+        """
+          |CREATE TABLE students (
+          |    name STRING,
+          |    age INT,
+          |    courses ARRAY<STRUCT<course_name: STRING, grade: DOUBLE>>
+          |) USING paimon;
+          |""".stripMargin)
+
+      sql(
+        """
+          |INSERT INTO students VALUES
+          |('Alice', 20, ARRAY(STRUCT('Math', 85.0), STRUCT('English', 88.0))),
+          |('Bob', 22, ARRAY(STRUCT('Math', 90.0), STRUCT('Biology', 92.0))),
+          |('Cathy', 21, ARRAY(STRUCT('History', 95.0)));
+          |""".stripMargin)
+
+      sql(
+        """
+          |SELECT
+          |    name,
+          |    age,
+          |    course.course_name,
+          |    course.grade
+          |FROM
+          |    students
+          |LATERAL VIEW explode(courses) AS course;
+          |""".stripMargin).show()
+    }
+  }
+
+  test("DataType: struct type CTAS") {
+    withTable("students") {
+      sql(
+        """
+          |CREATE TABLE students AS
+          |SELECT *
+          |FROM (VALUES ('Alice', 20, ARRAY(STRUCT('Math', 85.0), STRUCT('English', 88.0))),
+          |             ('Bob', 22, ARRAY(STRUCT('Math', 90.0), STRUCT('Biology', 92.0))),
+          |             ('Cathy', 21, ARRAY(STRUCT('History', 95.0)))) ;
+          |""".stripMargin)
+
+      sql("desc table extended students").show(false)
+    }
+  }
+
+  test("DataType: struct type get") {
+    withTable("students") {
+      sql(
+        """
+          |CREATE TABLE students (
+          |    name STRING,
+          |    age INT,
+          |    course STRUCT<course_name: STRING, grade: DOUBLE>
+          |) USING paimon;
+          |""".stripMargin)
+
+      sql(
+        """
+          |INSERT INTO students VALUES
+          |('Alice', 20, STRUCT('Math', 85.0)),
+          |('Bob', 22, STRUCT('Biology', 92.0)),
+          |('Cathy', 21, STRUCT('History', 95.0));
+          |""".stripMargin)
+
+      sql(
+        """
+          |SELECT
+          |    name,
+          |    age,
+          |    course.course_name,
+          |    course.grade
+          |FROM
+          |    students;
+          |""".stripMargin).show()
+    }
+  }
+}
@@ -0,0 +1,55 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements.  See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License.  You may obtain a copy of the License at
+ *
+ *    http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.spark.sql.learn.datasource
+
+import org.apache.spark.sql.learn.BaseTest
+
+class Filter extends BaseTest {
+
+  test("Filter: test partition filter") {
+    sql("use spark_catalog")
+    sql(s"CREATE DATABASE test_db LOCATION '$tempDBDir'")
+    sql(s"USE test_db")
+
+    withTable("t") {
+      sql(
+        s"""
+           |CREATE TABLE test_db.t (id INT, p STRING)
+           |USING parquet
+           |PARTITIONED BY (p)
+           |""".stripMargin)
+      sql("INSERT INTO test_db.t VALUES (1, '1')")
+
+      printPlan(sql("SELECT * FROM test_db.t WHERE p = 1"))
+    }
+
+    withTable("t") {
+      sql(
+        s"""
+           |CREATE TABLE test_db.t (id INT, p INT)
+           |USING parquet
+           |PARTITIONED BY (p)
+           |""".stripMargin)
+      sql("INSERT INTO test_db.t VALUES (1, 1)")
+
+      printPlan(sql("SELECT * FROM test_db.t WHERE p = '1'"))
+    }
+    sql(s"DROP DATABASE test_db")
+    sql(s"USE paimon")
+  }
+}
Original file line number	Diff line number	Diff line change
`@@ -285,7 +285,7 @@ abstract class RuleExecutor[TreeType <: TreeNode[_]] extends Logging {`
`285`	`285`
`286`	`286`	`planChangeLogger.logBatch(batch.name, batchStartPlan, curPlan)`
`287`	`287`	`}`
`288`		`- planChangeLogger.logMetrics(RuleExecutor.getCurrentMetrics() - beforeMetrics)`
	`288`	`+ // planChangeLogger.logMetrics(RuleExecutor.getCurrentMetrics() - beforeMetrics)`
`289`	`289`
`290`	`290`	`curPlan`
`291`	`291`	`}`
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,2 @@`
	`1`	`+{"name":"Yin", "address":{"city":"Columbus","state":"Ohio"}}`
	`2`	`+{"name":123456, "address":{"city":null, "state":"California", "extraMetadata":"test message"}}`