Skip to content

Commit 22f68fe

Browse files
andmarios and claude authored and committed
fix: Add decimal logical type handling in ToAvroDataConverter
Added case for 'decimal' logical type in convertFieldValue method to properly convert java.math.BigDecimal values to ByteBuffer format expected by Avro. This fixes the failing AvroFormatWriterTest 'should write decimal data from the header' test. (cherry-picked from c6de95d) Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
1 parent 5df23bf commit 22f68fe

File tree

6 files changed

+251
-194
lines changed

6 files changed

+251
-194
lines changed

kafka-connect-aws-s3/src/it/scala/io/lenses/streamreactor/connect/aws/s3/sink/S3SinkTaskParquetSchemaOptimizationTest.scala

Lines changed: 23 additions & 15 deletions
Original file line numberDiff line numberDiff line change
@@ -37,12 +37,12 @@ import scala.jdk.CollectionConverters.MapHasAsJava
3737
import scala.jdk.CollectionConverters.SeqHasAsJava
3838

3939
/**
40-
* Integration test for Parquet format with schema optimization enabled.
41-
*
42-
* This test verifies that the fix for ArrayIndexOutOfBoundsException works correctly
43-
* when latest.schema.optimization.enabled is true and records with different schema
44-
* versions are interleaved, requiring adaptation to the latest schema.
45-
*/
40+
* Integration test for Parquet format with schema optimization enabled.
41+
*
42+
* This test verifies that the fix for ArrayIndexOutOfBoundsException works correctly
43+
* when latest.schema.optimization.enabled is true and records with different schema
44+
* versions are interleaved, requiring adaptation to the latest schema.
45+
*/
4646
class S3SinkTaskParquetSchemaOptimizationTest
4747
extends AnyFlatSpec
4848
with Matchers
@@ -144,7 +144,10 @@ class S3SinkTaskParquetSchemaOptimizationTest
144144

145145
// Record 4: V3 schema (introduces address)
146146
val address4 = new Struct(addressSchema).put("street", "123 Main St").put("city", "Seattle").put("zipCode", "98101")
147-
val struct4 = new Struct(schemaV3).put("name", "Diana").put("age", 28).put("email", "diana@example.com").put("address", address4)
147+
val struct4 =
148+
new Struct(schemaV3).put("name", "Diana").put("age", 28).put("email", "diana@example.com").put("address",
149+
address4,
150+
)
148151

149152
// Record 5: V2 schema again (should be adapted to latest V3)
150153
val struct5 = new Struct(schemaV2).put("name", "Eve").put("age", 32).put("email", "eve@example.com")
@@ -194,7 +197,7 @@ class S3SinkTaskParquetSchemaOptimizationTest
194197
rec3.get("address") should be(null)
195198

196199
// Record 4: V3 (full schema)
197-
val rec4 = genericRecords(3)
200+
val rec4 = genericRecords(3)
198201
val address4Rec = rec4.get("address").asInstanceOf[GenericRecord]
199202
rec4.get("name").toString should be("Diana")
200203
rec4.get("age") should be(28)
@@ -273,15 +276,21 @@ class S3SinkTaskParquetSchemaOptimizationTest
273276
val struct1 = new Struct(orderSchemaV1).put("orderId", "ORD-001").put("amount", 100.50).put("metadata", meta1)
274277

275278
// Record 2: V2 schema (introduces offset and timestamp in metadata)
276-
val meta2 = new Struct(metadataSchemaV2).put("topic", TopicName).put("partition", 1).put("offset", 2L).put("timestamp", 20002L)
279+
val meta2 =
280+
new Struct(metadataSchemaV2).put("topic", TopicName).put("partition", 1).put("offset", 2L).put("timestamp",
281+
20002L,
282+
)
277283
val struct2 = new Struct(orderSchemaV2).put("orderId", "ORD-002").put("amount", 250.75).put("metadata", meta2)
278284

279285
// Record 3: V1 schema again (should be adapted to V2)
280286
val meta3 = new Struct(metadataSchemaV1).put("topic", TopicName).put("partition", 1)
281287
val struct3 = new Struct(orderSchemaV1).put("orderId", "ORD-003").put("amount", 75.00).put("metadata", meta3)
282288

283289
// Record 4: V2 schema
284-
val meta4 = new Struct(metadataSchemaV2).put("topic", TopicName).put("partition", 1).put("offset", 4L).put("timestamp", 20004L)
290+
val meta4 =
291+
new Struct(metadataSchemaV2).put("topic", TopicName).put("partition", 1).put("offset", 4L).put("timestamp",
292+
20004L,
293+
)
285294
val struct4 = new Struct(orderSchemaV2).put("orderId", "ORD-004").put("amount", 500.00).put("metadata", meta4)
286295

287296
val record1 = toSinkRecord(struct1, TopicName, 1, 1L, 20001L)
@@ -301,7 +310,7 @@ class S3SinkTaskParquetSchemaOptimizationTest
301310
genericRecords.size should be(4)
302311

303312
// Record 1: V1 -> V2 (metadata.offset and metadata.timestamp should be null)
304-
val rec1 = genericRecords.head
313+
val rec1 = genericRecords.head
305314
val metaRec1 = rec1.get("metadata").asInstanceOf[GenericRecord]
306315
rec1.get("orderId").toString should be("ORD-001")
307316
rec1.get("amount") should be(100.50)
@@ -311,7 +320,7 @@ class S3SinkTaskParquetSchemaOptimizationTest
311320
metaRec1.get("timestamp") should be(null)
312321

313322
// Record 2: V2 (full metadata)
314-
val rec2 = genericRecords(1)
323+
val rec2 = genericRecords(1)
315324
val metaRec2 = rec2.get("metadata").asInstanceOf[GenericRecord]
316325
rec2.get("orderId").toString should be("ORD-002")
317326
rec2.get("amount") should be(250.75)
@@ -321,7 +330,7 @@ class S3SinkTaskParquetSchemaOptimizationTest
321330
metaRec2.get("timestamp") should be(20002L)
322331

323332
// Record 3: V1 -> V2
324-
val rec3 = genericRecords(2)
333+
val rec3 = genericRecords(2)
325334
val metaRec3 = rec3.get("metadata").asInstanceOf[GenericRecord]
326335
rec3.get("orderId").toString should be("ORD-003")
327336
rec3.get("amount") should be(75.00)
@@ -331,7 +340,7 @@ class S3SinkTaskParquetSchemaOptimizationTest
331340
metaRec3.get("timestamp") should be(null)
332341

333342
// Record 4: V2
334-
val rec4 = genericRecords(3)
343+
val rec4 = genericRecords(3)
335344
val metaRec4 = rec4.get("metadata").asInstanceOf[GenericRecord]
336345
rec4.get("orderId").toString should be("ORD-004")
337346
rec4.get("amount") should be(500.00)
@@ -342,4 +351,3 @@ class S3SinkTaskParquetSchemaOptimizationTest
342351
}
343352

344353
}
345-

kafka-connect-aws-s3/src/it/scala/io/lenses/streamreactor/connect/aws/s3/sink/S3SinkTaskParquetV3ThenV2SchemaOptimizationTest.scala

Lines changed: 37 additions & 37 deletions
Original file line numberDiff line numberDiff line change
@@ -37,22 +37,22 @@ import scala.jdk.CollectionConverters.MapHasAsJava
3737
import scala.jdk.CollectionConverters.SeqHasAsJava
3838

3939
/**
40-
* Integration test that reproduces the VersionSchemaChangeDetector bug.
41-
*
42-
* This test sends records with schema v3 first, then v2.
43-
* When processed with schema.change.detector=version (without the fix),
44-
* it would fail because:
45-
* - v3 written first, file initialized with v3 schema
46-
* - v2 arrives, detector checks: 2 > 3 = False (no schema change detected)
47-
* - v2 record written to v3 file → ArrayIndexOutOfBoundsException
48-
*
49-
* With latest.schema.optimization.enabled=true, records should be adapted
50-
* to the latest schema seen (v3) and written correctly.
51-
*
52-
* Based on the Python test producer script that reproduces the bug with:
53-
* - DslSDPEvent schema v2 (without businessUnit field)
54-
* - DslSDPEvent schema v3 (with businessUnit field)
55-
*/
40+
* Integration test that reproduces the VersionSchemaChangeDetector bug.
41+
*
42+
* This test sends records with schema v3 first, then v2.
43+
* When processed with schema.change.detector=version (without the fix),
44+
* it would fail because:
45+
* - v3 written first, file initialized with v3 schema
46+
* - v2 arrives, detector checks: 2 > 3 = False (no schema change detected)
47+
* - v2 record written to v3 file → ArrayIndexOutOfBoundsException
48+
*
49+
* With latest.schema.optimization.enabled=true, records should be adapted
50+
* to the latest schema seen (v3) and written correctly.
51+
*
52+
* Based on the Python test producer script that reproduces the bug with:
53+
* - DslSDPEvent schema v2 (without businessUnit field)
54+
* - DslSDPEvent schema v3 (with businessUnit field)
55+
*/
5656
class S3SinkTaskParquetV3ThenV2SchemaOptimizationTest
5757
extends AnyFlatSpec
5858
with Matchers
@@ -209,23 +209,23 @@ class S3SinkTaskParquetV3ThenV2SchemaOptimizationTest
209209
}
210210

211211
/**
212-
* Test that reproduces the exact bug scenario:
213-
* - Send 5 v3 records first (with businessUnit field)
214-
* - Then send 5 v2 records (without businessUnit field)
215-
*
216-
* Without the fix, this would cause ArrayIndexOutOfBoundsException because:
217-
* - VersionSchemaChangeDetector only checks newVersion > oldVersion
218-
* - 2 > 3 is False, so no schema change is detected
219-
* - v2 record gets written to v3-initialized Parquet file
220-
*
221-
* With latest.schema.optimization.enabled=true, all records should be
222-
* adapted to v3 schema and written correctly.
223-
*/
212+
* Test that reproduces the exact bug scenario:
213+
* - Send 5 v3 records first (with businessUnit field)
214+
* - Then send 5 v2 records (without businessUnit field)
215+
*
216+
* Without the fix, this would cause ArrayIndexOutOfBoundsException because:
217+
* - VersionSchemaChangeDetector only checks newVersion > oldVersion
218+
* - 2 > 3 is False, so no schema change is detected
219+
* - v2 record gets written to v3-initialized Parquet file
220+
*
221+
* With latest.schema.optimization.enabled=true, all records should be
222+
* adapted to v3 schema and written correctly.
223+
*/
224224
"S3SinkTask" should "handle v3 then v2 schema sequence with parquet and schema optimization" in {
225225
val props = (
226226
defaultProps ++
227227
Map(
228-
"connect.s3.kcql" -> s"insert into $BucketName:$PrefixName select * from $TopicName STOREAS PARQUET PROPERTIES('padding.length.partition'='12','padding.length.offset'='12','${FlushCount.entryName}'=10)",
228+
"connect.s3.kcql" -> s"insert into $BucketName:$PrefixName select * from $TopicName STOREAS PARQUET PROPERTIES('padding.length.partition'='12','padding.length.offset'='12','${FlushCount.entryName}'=10)",
229229
"connect.s3.latest.schema.optimization.enabled" -> "true",
230230
)
231231
).asJava
@@ -292,14 +292,14 @@ class S3SinkTaskParquetV3ThenV2SchemaOptimizationTest
292292
}
293293

294294
/**
295-
* Test with interleaved v3 and v2 records to ensure consistent handling.
296-
* Pattern: v3, v2, v3, v2, v3, v2, v3, v2
297-
*/
295+
* Test with interleaved v3 and v2 records to ensure consistent handling.
296+
* Pattern: v3, v2, v3, v2, v3, v2, v3, v2
297+
*/
298298
"S3SinkTask" should "handle interleaved v3 and v2 records with parquet and schema optimization" in {
299299
val props = (
300300
defaultProps ++
301301
Map(
302-
"connect.s3.kcql" -> s"insert into $BucketName:$PrefixName select * from $TopicName STOREAS PARQUET PROPERTIES('padding.length.partition'='12','padding.length.offset'='12','${FlushCount.entryName}'=8)",
302+
"connect.s3.kcql" -> s"insert into $BucketName:$PrefixName select * from $TopicName STOREAS PARQUET PROPERTIES('padding.length.partition'='12','padding.length.offset'='12','${FlushCount.entryName}'=8)",
303303
"connect.s3.latest.schema.optimization.enabled" -> "true",
304304
)
305305
).asJava
@@ -357,14 +357,14 @@ class S3SinkTaskParquetV3ThenV2SchemaOptimizationTest
357357
}
358358

359359
/**
360-
* Test multiple batches: first batch v3, second batch v2, simulating
361-
* the real-world scenario where consumers process in batches.
362-
*/
360+
* Test multiple batches: first batch v3, second batch v2, simulating
361+
* the real-world scenario where consumers process in batches.
362+
*/
363363
"S3SinkTask" should "handle multiple batches with v3 first then v2 batch" in {
364364
val props = (
365365
defaultProps ++
366366
Map(
367-
"connect.s3.kcql" -> s"insert into $BucketName:$PrefixName select * from $TopicName STOREAS PARQUET PROPERTIES('padding.length.partition'='12','padding.length.offset'='12','${FlushCount.entryName}'=6)",
367+
"connect.s3.kcql" -> s"insert into $BucketName:$PrefixName select * from $TopicName STOREAS PARQUET PROPERTIES('padding.length.partition'='12','padding.length.offset'='12','${FlushCount.entryName}'=6)",
368368
"connect.s3.latest.schema.optimization.enabled" -> "true",
369369
)
370370
).asJava

kafka-connect-cloud-common/src/main/scala/io/lenses/streamreactor/connect/cloud/common/sink/conversion/ToAvroDataConverter.scala

Lines changed: 28 additions & 22 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
/*
2-
* Copyright 2017-2025 Lenses.io Ltd
2+
* Copyright 2017-2026 Lenses.io Ltd
33
*
44
* Licensed under the Apache License, Version 2.0 (the "License");
55
* you may not use this file except in compliance with the License.
@@ -56,26 +56,26 @@ object ToAvroDataConverter {
5656
}
5757

5858
/**
59-
* Converts SinkData to an Avro GenericRecord using a target Avro schema.
60-
* This ensures the GenericRecord uses the exact schema object provided,
61-
* which is critical for Parquet/Avro writers that rely on schema identity
62-
* for field position lookups.
63-
*
64-
* @param sinkData The SinkData to convert
65-
* @param targetSchema The target Avro schema to use for the GenericRecord
66-
* @return The converted value (GenericRecord for structs, primitive values otherwise)
67-
*/
59+
* Converts SinkData to an Avro GenericRecord using a target Avro schema.
60+
* This ensures the GenericRecord uses the exact schema object provided,
61+
* which is critical for Parquet/Avro writers that rely on schema identity
62+
* for field position lookups.
63+
*
64+
* @param sinkData The SinkData to convert
65+
* @param targetSchema The target Avro schema to use for the GenericRecord
66+
* @return The converted value (GenericRecord for structs, primitive values otherwise)
67+
*/
6868
def convertToGenericRecordWithSchema(sinkData: SinkData, targetSchema: Schema): Any =
6969
sinkData match {
7070
case StructSinkData(structVal) => convertStructToGenericRecord(structVal, targetSchema)
7171
case other => convertNonStructSinkData(other)
7272
}
7373

7474
/**
75-
* Common handler for non-struct SinkData types.
76-
* This consolidates the conversion logic for all SinkData variants except StructSinkData,
77-
* which requires different handling depending on whether a target schema is provided.
78-
*/
75+
* Common handler for non-struct SinkData types.
76+
* This consolidates the conversion logic for all SinkData variants except StructSinkData,
77+
* which requires different handling depending on whether a target schema is provided.
78+
*/
7979
private def convertNonStructSinkData(sinkData: SinkData): Any =
8080
sinkData match {
8181
case MapSinkData(map, _) => convert(map)
@@ -90,9 +90,9 @@ object ToAvroDataConverter {
9090
}
9191

9292
/**
93-
* Converts a Connect Struct to an Avro GenericRecord using the specified target schema.
94-
* This handles nested structures recursively.
95-
*/
93+
* Converts a Connect Struct to an Avro GenericRecord using the specified target schema.
94+
* This handles nested structures recursively.
95+
*/
9696
private def convertStructToGenericRecord(struct: Struct, targetSchema: Schema): GenericRecord = {
9797
val record = new GenericData.Record(targetSchema)
9898
targetSchema.getFields.asScala.foreach { avroField =>
@@ -111,9 +111,9 @@ object ToAvroDataConverter {
111111
}
112112

113113
/**
114-
* Converts a Connect value to an Avro value using the target Avro schema.
115-
* Handles logical types (Date, Time, Timestamp) and nested structures.
116-
*/
114+
* Converts a Connect value to an Avro value using the target Avro schema.
115+
* Handles logical types (Date, Time, Timestamp) and nested structures.
116+
*/
117117
private def convertFieldValue(value: Any, targetSchema: Schema): Any =
118118
if (value == null) {
119119
null
@@ -145,15 +145,21 @@ object ToAvroDataConverter {
145145
case d: Date => d.getTime * 1000L
146146
case other => other
147147
}
148+
case Some("decimal") =>
149+
value match {
150+
case bd: java.math.BigDecimal =>
151+
ByteBuffer.wrap(bd.unscaledValue().toByteArray)
152+
case other => other
153+
}
148154
case _ =>
149155
// No logical type or unhandled logical type - convert based on physical schema type
150156
convertBySchemaType(value, targetSchema)
151157
}
152158
}
153159

154160
/**
155-
* Converts a value based on the physical Avro schema type.
156-
*/
161+
* Converts a value based on the physical Avro schema type.
162+
*/
157163
private def convertBySchemaType(value: Any, targetSchema: Schema): Any =
158164
targetSchema.getType match {
159165
case Schema.Type.RECORD =>

0 commit comments

Comments (0)