
Commit edcfb7a

[spark] support write log/pk table

1 parent: 920809f

File tree

16 files changed: +1163 -8 lines

fluss-spark/fluss-spark-common/src/main/scala/org/apache/fluss/spark/SparkCatalog.scala

Lines changed: 2 additions & 1 deletion
Lines changed: 2 additions & 1 deletion

@@ -49,7 +49,8 @@ class SparkCatalog extends TableCatalog with SupportsFlussNamespaces with WithFl
 
   override def loadTable(ident: Identifier): Table = {
     try {
-      SparkTable(admin.getTableInfo(toTablePath(ident)).get())
+      val tablePath = toTablePath(ident)
+      SparkTable(tablePath, admin.getTableInfo(tablePath).get(), flussConfig)
     } catch {
       case e: ExecutionException if e.getCause.isInstanceOf[TableNotExistException] =>
         throw new NoSuchTableException(ident)

fluss-spark/fluss-spark-common/src/main/scala/org/apache/fluss/spark/SparkTable.scala

Lines changed: 19 additions & 4 deletions
@@ -17,9 +17,24 @@
 
 package org.apache.fluss.spark
 
-import org.apache.fluss.metadata.TableInfo
+import org.apache.fluss.config.{Configuration => FlussConfiguration}
+import org.apache.fluss.metadata.{TableInfo, TablePath}
 import org.apache.fluss.spark.catalog.{AbstractSparkTable, SupportsFlussPartitionManagement}
+import org.apache.fluss.spark.write.{FlussAppendWriteBuilder, FlussUpsertWriteBuilder}
 
-case class SparkTable(table: TableInfo)
-  extends AbstractSparkTable(table)
-  with SupportsFlussPartitionManagement {}
+import org.apache.spark.sql.connector.catalog.SupportsWrite
+import org.apache.spark.sql.connector.write.{LogicalWriteInfo, WriteBuilder}
+
+case class SparkTable(tablePath: TablePath, tableInfo: TableInfo, flussConfig: FlussConfiguration)
+  extends AbstractSparkTable(tableInfo)
+  with SupportsFlussPartitionManagement
+  with SupportsWrite {
+
+  override def newWriteBuilder(logicalWriteInfo: LogicalWriteInfo): WriteBuilder = {
+    if (tableInfo.getPrimaryKeys.isEmpty) {
+      new FlussAppendWriteBuilder(tablePath, logicalWriteInfo.schema(), flussConfig)
+    } else {
+      new FlussUpsertWriteBuilder(tablePath, logicalWriteInfo.schema(), flussConfig)
+    }
+  }
+}
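
For context, a minimal sketch of how this write path would be exercised from Spark SQL (not part of this commit; the catalog name "fluss", the database/table names, the option key, and the port are illustrative assumptions): a table without primary keys resolves to FlussAppendWriteBuilder, while a primary-key table resolves to FlussUpsertWriteBuilder.

import org.apache.spark.sql.SparkSession

// Hypothetical session wiring; catalog name and option key are assumptions, not from this commit.
val spark = SparkSession.builder()
  .master("local[*]")
  .config("spark.sql.catalog.fluss", "org.apache.fluss.spark.SparkCatalog")
  .config("spark.sql.catalog.fluss.bootstrap.servers", "localhost:9123") // assumed option key and port
  .getOrCreate()

// Log table (no primary key): SparkTable.newWriteBuilder returns FlussAppendWriteBuilder.
spark.sql("INSERT INTO fluss.fluss_db.access_log VALUES (1, 'GET /index.html')")

// Primary-key table: SparkTable.newWriteBuilder returns FlussUpsertWriteBuilder,
// so rows with an existing key are upserted rather than appended.
spark.sql("INSERT INTO fluss.fluss_db.user_profile VALUES (1, 'Alice')")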

fluss-spark/fluss-spark-common/src/main/scala/org/apache/fluss/spark/catalog/AbstractSparkTable.scala

Lines changed: 5 additions & 2 deletions
@@ -17,7 +17,8 @@
 
 package org.apache.fluss.spark.catalog
 
-import org.apache.fluss.metadata.TableInfo
+import org.apache.fluss.config.{Configuration => FlussConfiguration}
+import org.apache.fluss.metadata.{TableInfo, TablePath}
 import org.apache.fluss.spark.SparkConversions
 
 import org.apache.spark.sql.connector.catalog.{Table, TableCapability}
@@ -39,5 +40,7 @@ abstract class AbstractSparkTable(tableInfo: TableInfo) extends Table {
 
   override def schema(): StructType = _schema
 
-  override def capabilities(): util.Set[TableCapability] = Set.empty[TableCapability].asJava
+  override def capabilities(): util.Set[TableCapability] = {
+    Set(TableCapability.BATCH_WRITE).asJava
+  }
 }

fluss-spark/fluss-spark-common/src/main/scala/org/apache/fluss/spark/catalog/WithFlussAdmin.scala

Lines changed: 8 additions & 1 deletion
@@ -33,6 +33,7 @@ trait WithFlussAdmin extends AutoCloseable {
 
   private var _connection: Connection = _
   private var _admin: Admin = _
+  private var _flussConfig: FlussConfiguration = _
 
   // TODO: init lake spark catalog
   protected var lakeCatalog: CatalogPlugin = _
@@ -43,10 +44,16 @@ trait WithFlussAdmin extends AutoCloseable {
       entry: util.Map.Entry[String, String] => flussConfigs.put(entry.getKey, entry.getValue)
     }
 
-    _connection = ConnectionFactory.createConnection(FlussConfiguration.fromMap(flussConfigs))
+    _flussConfig = FlussConfiguration.fromMap(flussConfigs)
+    _connection = ConnectionFactory.createConnection(_flussConfig)
    _admin = _connection.getAdmin
  }
 
+  protected def flussConfig: FlussConfiguration = {
+    Preconditions.checkNotNull(_flussConfig, "Fluss Configuration is not initialized.")
+    _flussConfig
+  }
+
  protected def admin: Admin = {
    Preconditions.checkNotNull(_admin, "Fluss Admin is not initialized.")
    _admin
New file: SparkAsFlussArray.scala (package org.apache.fluss.spark.row)

Lines changed: 131 additions & 0 deletions

@@ -0,0 +1,131 @@
/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements. See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License. You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.apache.fluss.spark.row

import org.apache.fluss.row.{BinaryString, Decimal, InternalArray => FlussInternalArray, InternalRow => FlussInternalRow, TimestampLtz, TimestampNtz}

import org.apache.spark.sql.catalyst.util.{ArrayData => SparkArrayData, SparkDateTimeUtils}
import org.apache.spark.sql.types.{ArrayType => SparkArrayType, DataType => SparkDataType, StructType}

/** Wraps a Spark [[SparkArrayData]] as a Fluss [[FlussInternalArray]]. */
class SparkAsFlussArray(arrayData: SparkArrayData, elementType: SparkDataType)
  extends FlussInternalArray {

  /** Returns the number of elements in this array. */
  override def size(): Int = arrayData.numElements()

  override def toBooleanArray: Array[Boolean] = arrayData.toBooleanArray()

  override def toByteArray: Array[Byte] = arrayData.toByteArray()

  override def toShortArray: Array[Short] = arrayData.toShortArray()

  override def toIntArray: Array[Int] = arrayData.toIntArray()

  override def toLongArray: Array[Long] = arrayData.toLongArray()

  override def toFloatArray: Array[Float] = arrayData.toFloatArray()

  override def toDoubleArray: Array[Double] = arrayData.toDoubleArray()

  /** Returns true if the element is null at the given position. */
  override def isNullAt(pos: Int): Boolean = arrayData.isNullAt(pos)

  /** Returns the boolean value at the given position. */
  override def getBoolean(pos: Int): Boolean = arrayData.getBoolean(pos)

  /** Returns the byte value at the given position. */
  override def getByte(pos: Int): Byte = arrayData.getByte(pos)

  /** Returns the short value at the given position. */
  override def getShort(pos: Int): Short = arrayData.getShort(pos)

  /** Returns the integer value at the given position. */
  override def getInt(pos: Int): Int = arrayData.getInt(pos)

  /** Returns the long value at the given position. */
  override def getLong(pos: Int): Long = arrayData.getLong(pos)

  /** Returns the float value at the given position. */
  override def getFloat(pos: Int): Float = arrayData.getFloat(pos)

  /** Returns the double value at the given position. */
  override def getDouble(pos: Int): Double = arrayData.getDouble(pos)

  /** Returns the string value at the given position with fixed length. */
  override def getChar(pos: Int, length: Int): BinaryString =
    BinaryString.fromBytes(arrayData.getUTF8String(pos).getBytes)

  /** Returns the string value at the given position. */
  override def getString(pos: Int): BinaryString =
    BinaryString.fromBytes(arrayData.getUTF8String(pos).getBytes)

  /**
   * Returns the decimal value at the given position.
   *
   * <p>The precision and scale are required to determine whether the decimal value was stored in a
   * compact representation (see {@link Decimal}).
   */
  override def getDecimal(pos: Int, precision: Int, scale: Int): Decimal = {
    val sparkDecimal = arrayData.getDecimal(pos, precision, scale)
    if (sparkDecimal.precision <= org.apache.spark.sql.types.Decimal.MAX_LONG_DIGITS)
      Decimal.fromUnscaledLong(
        sparkDecimal.toUnscaledLong,
        sparkDecimal.precision,
        sparkDecimal.scale)
    else
      Decimal.fromBigDecimal(
        sparkDecimal.toJavaBigDecimal,
        sparkDecimal.precision,
        sparkDecimal.scale)
  }

  /**
   * Returns the timestamp value at the given position.
   *
   * <p>The precision is required to determine whether the timestamp value was stored in a compact
   * representation (see {@link TimestampNtz}).
   */
  override def getTimestampNtz(pos: Int, precision: Int): TimestampNtz =
    TimestampNtz.fromMillis(SparkDateTimeUtils.microsToMillis(arrayData.getLong(pos)))

  /**
   * Returns the timestamp value at the given position.
   *
   * <p>The precision is required to determine whether the timestamp value was stored in a compact
   * representation (see {@link TimestampLtz}).
   */
  override def getTimestampLtz(pos: Int, precision: Int): TimestampLtz =
    TimestampLtz.fromEpochMicros(arrayData.getLong(pos))

  /** Returns the binary value at the given position with fixed length. */
  override def getBinary(pos: Int, length: Int): Array[Byte] = arrayData.getBinary(pos)

  /** Returns the binary value at the given position. */
  override def getBytes(pos: Int): Array[Byte] = arrayData.getBinary(pos)

  /** Returns the array value at the given position. */
  override def getArray(pos: Int) = new SparkAsFlussArray(
    arrayData.getArray(pos),
    elementType.asInstanceOf[SparkArrayType].elementType)

  /** Returns the row value at the given position. */
  override def getRow(pos: Int, numFields: Int): FlussInternalRow =
    new SparkAsFlussRow(elementType.asInstanceOf[StructType])
      .replace(arrayData.getStruct(pos, numFields))
}
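
A small usage sketch (not from this commit; the values and element type are illustrative) showing how the wrapper exposes Spark array data through Fluss's InternalArray interface:

import org.apache.spark.sql.catalyst.util.ArrayData
import org.apache.spark.sql.types.IntegerType

// Build a Spark ArrayData from a plain Scala array (illustrative values).
val sparkArray = ArrayData.toArrayData(Array(1, 2, 3))

// Wrap it; the element type is only consulted when reading nested arrays or rows.
val flussArray = new SparkAsFlussArray(sparkArray, IntegerType)

flussArray.size()      // 3
flussArray.getInt(2)   // 3
flussArray.isNullAt(0) // false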
New file: SparkAsFlussRow.scala (package org.apache.fluss.spark.row)

Lines changed: 129 additions & 0 deletions

@@ -0,0 +1,129 @@
/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements. See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License. You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.apache.fluss.spark.row

import org.apache.fluss.row.{BinaryString, Decimal, InternalRow => FlussInternalRow, TimestampLtz, TimestampNtz}

import org.apache.spark.sql.catalyst.{InternalRow => SparkInternalRow}
import org.apache.spark.sql.catalyst.util.SparkDateTimeUtils
import org.apache.spark.sql.types.StructType

/** Wraps a Spark [[SparkInternalRow]] as a Fluss [[FlussInternalRow]]. */
class SparkAsFlussRow(schema: StructType) extends FlussInternalRow with Serializable {

  val fieldCount: Int = schema.length

  var row: SparkInternalRow = _

  def replace(row: SparkInternalRow): SparkAsFlussRow = {
    this.row = row
    this
  }

  /**
   * Returns the number of fields in this row.
   *
   * <p>The number does not include {@link ChangeType}. It is kept separately.
   */
  override def getFieldCount: Int = fieldCount

  /** Returns true if the element is null at the given position. */
  override def isNullAt(pos: Int): Boolean = row.isNullAt(pos)

  /** Returns the boolean value at the given position. */
  override def getBoolean(pos: Int): Boolean = row.getBoolean(pos)

  /** Returns the byte value at the given position. */
  override def getByte(pos: Int): Byte = row.getByte(pos)

  /** Returns the short value at the given position. */
  override def getShort(pos: Int): Short = row.getShort(pos)

  /** Returns the integer value at the given position. */
  override def getInt(pos: Int): Int = row.getInt(pos)

  /** Returns the long value at the given position. */
  override def getLong(pos: Int): Long = row.getLong(pos)

  /** Returns the float value at the given position. */
  override def getFloat(pos: Int): Float = row.getFloat(pos)

  /** Returns the double value at the given position. */
  override def getDouble(pos: Int): Double = row.getDouble(pos)

  /** Returns the string value at the given position with fixed length. */
  override def getChar(pos: Int, length: Int): BinaryString =
    BinaryString.fromString(row.getUTF8String(pos).toString)

  /** Returns the string value at the given position. */
  override def getString(pos: Int): BinaryString = BinaryString.fromString(row.getString(pos))

  /**
   * Returns the decimal value at the given position.
   *
   * <p>The precision and scale are required to determine whether the decimal value was stored in a
   * compact representation (see {@link Decimal}).
   */
  override def getDecimal(pos: Int, precision: Int, scale: Int): Decimal = {
    val sparkDecimal = row.getDecimal(pos, precision, scale)
    if (sparkDecimal.precision <= org.apache.spark.sql.types.Decimal.MAX_LONG_DIGITS)
      Decimal.fromUnscaledLong(
        sparkDecimal.toUnscaledLong,
        sparkDecimal.precision,
        sparkDecimal.scale)
    else
      Decimal.fromBigDecimal(
        sparkDecimal.toJavaBigDecimal,
        sparkDecimal.precision,
        sparkDecimal.scale)
  }

  /**
   * Returns the timestamp value at the given position.
   *
   * <p>The precision is required to determine whether the timestamp value was stored in a compact
   * representation (see {@link TimestampNtz}).
   */
  override def getTimestampNtz(pos: Int, precision: Int): TimestampNtz =
    TimestampNtz.fromMillis(SparkDateTimeUtils.microsToMillis(row.getLong(pos)))

  /**
   * Returns the timestamp value at the given position.
   *
   * <p>The precision is required to determine whether the timestamp value was stored in a compact
   * representation (see {@link TimestampLtz}).
   */
  override def getTimestampLtz(pos: Int, precision: Int): TimestampLtz =
    TimestampLtz.fromEpochMicros(row.getLong(pos))

  /** Returns the binary value at the given position with fixed length. */
  override def getBinary(pos: Int, length: Int): Array[Byte] = row.getBinary(pos)

  /** Returns the binary value at the given position. */
  override def getBytes(pos: Int): Array[Byte] = row.getBinary(pos)

  /** Returns the array value at the given position. */
  override def getArray(pos: Int) =
    new SparkAsFlussArray(row.getArray(pos), schema.fields(pos).dataType)

  /** Returns the row value at the given position. */
  override def getRow(pos: Int, numFields: Int): FlussInternalRow =
    new SparkAsFlussRow(schema.fields(pos).dataType.asInstanceOf[StructType])
      .replace(row.getStruct(pos, numFields))

}
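
A matching sketch for the row wrapper (illustrative only, not commit code; the schema and values are made up): the intended pattern is to allocate one SparkAsFlussRow per writer and call replace() for each incoming Spark row, avoiding a per-record allocation.

import org.apache.spark.sql.catalyst.expressions.GenericInternalRow
import org.apache.spark.sql.types.{LongType, StringType, StructField, StructType}
import org.apache.spark.unsafe.types.UTF8String

// Hypothetical schema and row, for illustration only.
val schema = StructType(Seq(StructField("id", LongType), StructField("name", StringType)))
val sparkRow = new GenericInternalRow(Array[Any](42L, UTF8String.fromString("fluss")))

// One reusable wrapper; replace() swaps in each new Spark row.
val flussRow = new SparkAsFlussRow(schema).replace(sparkRow)

flussRow.getFieldCount // 2
flussRow.getLong(0)    // 42
flussRow.getString(1)  // BinaryString "fluss"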
