fix: issues with large Decimals and Oracle variable scale

manticore-projects · manticore-projects · commit 54543af7d8e9 · 2024-12-27T22:31:30.000+07:00
- fix large negative decimals
- add test for large negative decimals
diff --git a/src/main/java/com/manticore/jdbc/parquetwriter/JDBCParquetWriter.java b/src/main/java/com/manticore/jdbc/parquetwriter/JDBCParquetWriter.java
@@ -41,6 +41,7 @@
 import java.sql.Statement;
 import java.sql.Time;
 import java.sql.Timestamp;
+import java.util.Arrays;
 import java.util.logging.Logger;
 
 /**
@@ -293,18 +294,26 @@ public static long write(File f, String tableName, ResultSet rs,
                                 if (scale > 0 && precision <= 18) {
                                     group.add(columnName, decimal.unscaledValue().longValue());
                                 } else if (scale > 0) {
-                                    byte[] bytes =
-                                            decimal.setScale(scale, RoundingMode.HALF_EVEN)
-                                                    .unscaledValue().toByteArray();
+                                    // Rescale to the target scale; get unscaled big-endian bytes
+                                    byte[] unscaledBytes = decimal
+                                            .setScale(scale, RoundingMode.HALF_EVEN)
+                                            .unscaledValue()
+                                            .toByteArray();
+                                    int requiredBytes = 16;
 
-                                    // Ensure the byte array is padded correctly for the precision
-                                    int numBytes =
-                                            Math.max((int) Math.ceil(precision / Math.log10(2) / 8),
-                                                    bytes.length); // Calculate required bytes
-                                    byte[] paddedBytes = new byte[numBytes];
-                                    System.arraycopy(bytes, 0, paddedBytes, numBytes - bytes.length,
-                                            bytes.length);
+                                    // Ensure the byte array is padded correctly with sign extension
+                                    byte[] paddedBytes = new byte[requiredBytes];
+                                    byte signByte = (unscaledBytes[0] < 0) ? (byte) 0xFF : 0x00; // Extend
+                                                                                                 // sign
+                                                                                                 // bit
+                                    Arrays.fill(paddedBytes, 0,
+                                            requiredBytes - unscaledBytes.length, signByte);
+                                    System.arraycopy(unscaledBytes, 0, paddedBytes,
+                                            requiredBytes - unscaledBytes.length,
+                                            unscaledBytes.length);
 
+                                    // Add the binary representation of the decimal to the Parquet
+                                    // group
                                     group.add(columnName,
                                             Binary.fromConstantByteArray(paddedBytes));
                                 } else if (scale == -127) {
@@ -317,17 +326,27 @@ public static long write(File f, String tableName, ResultSet rs,
                                      */
                                     precision = 38;
                                     scale = 10;
-                                    byte[] bytes = decimal.setScale(scale, RoundingMode.HALF_EVEN)
-                                            .unscaledValue().toByteArray();
 
-                                    // Ensure the byte array is padded correctly for the precision
-                                    int numBytes =
-                                            Math.max((int) Math.ceil(precision / Math.log10(2) / 8),
-                                                    bytes.length); // Calculate required bytes
-                                    byte[] paddedBytes = new byte[numBytes];
-                                    System.arraycopy(bytes, 0, paddedBytes, numBytes - bytes.length,
-                                            bytes.length);
+                                    // Rescale to the target scale; get unscaled big-endian bytes
+                                    byte[] unscaledBytes = decimal
+                                            .setScale(scale, RoundingMode.HALF_EVEN)
+                                            .unscaledValue()
+                                            .toByteArray();
+                                    int requiredBytes = 16;
 
+                                    // Ensure the byte array is padded correctly with sign extension
+                                    byte[] paddedBytes = new byte[requiredBytes];
+                                    byte signByte = (unscaledBytes[0] < 0) ? (byte) 0xFF : 0x00; // Extend
+                                                                                                 // sign
+                                                                                                 // bit
+                                    Arrays.fill(paddedBytes, 0,
+                                            requiredBytes - unscaledBytes.length, signByte);
+                                    System.arraycopy(unscaledBytes, 0, paddedBytes,
+                                            requiredBytes - unscaledBytes.length,
+                                            unscaledBytes.length);
+
+                                    // Add the binary representation of the decimal to the Parquet
+                                    // group
                                     group.add(columnName,
                                             Binary.fromConstantByteArray(paddedBytes));
                                 } else if (precision < 5) {
diff --git a/src/test/java/com/manticore/jdbc/parquetwriter/JDBCParquetWriterTest.java b/src/test/java/com/manticore/jdbc/parquetwriter/JDBCParquetWriterTest.java
@@ -22,6 +22,7 @@
 import org.junit.jupiter.api.Test;
 
 import java.io.File;
+import java.math.BigDecimal;
 import java.sql.Connection;
 import java.sql.DriverManager;
 import java.sql.ResultSet;
@@ -90,7 +91,6 @@ void write() throws Exception {
     }
 
     @Test
-    @Disabled
     void testVBoxQuery() throws Exception {
         Properties properties = new Properties();
         properties.put("user", "SA");
@@ -117,6 +117,55 @@ void testVBoxQuery() throws Exception {
 
     }
 
+    @Test
+    void testBigDecimal() throws Exception {
+        // Round trip: H2 DECIMAL(23,5) -> Parquet file -> DuckDB must keep value and sign.
+        String tableName = "test";
+        String decimalStr = "-24999999999999.99500";
+
+        File file = File.createTempFile(tableName, ".parquet");
+        try {
+            try (Connection conn = DriverManager.getConnection("jdbc:h2:mem:test")) {
+                String[] ddlStr = {
+                        "CREATE TABLE decimal_test (\n"
+                                + "   amount                 DECIMAL(23,5)  NULL\n"
+                                + ")\n"
+                                + ";",
+                        "INSERT INTO decimal_test \n"
+                                + "VALUES (" + decimalStr + ");"
+                };
+                try (Statement st = conn.createStatement()) {
+                    for (String sqlStr : ddlStr) {
+                        st.execute(sqlStr);
+                    }
+                }
+
+                String sqlStr = "SELECT  *\n"
+                        + "FROM decimal_test";
+                try (Statement st = conn.createStatement();
+                        ResultSet rs = st.executeQuery(sqlStr)) {
+                    JDBCParquetWriter.write(file, tableName, rs);
+                }
+            }
+
+            String sqlStr = "SELECT  *\n"
+                    + "FROM '" + file.getAbsolutePath() + "';";
+            try (Connection conn = DriverManager.getConnection("jdbc:duckdb:");
+                    Statement st = conn.createStatement();
+                    ResultSet rs = st.executeQuery(sqlStr)) {
+                // Fail loudly instead of passing vacuously when no row can be read back.
+                Assertions.assertTrue(rs.next(), "no row read back from the Parquet file");
+                BigDecimal actualDecimal = rs.getBigDecimal(1);
+                Assertions.assertEquals(decimalStr, actualDecimal.toPlainString());
+            }
+        } finally {
+            // Always clean up the temp file, also when an assertion or the writer fails.
+            if (!file.delete()) {
+                file.deleteOnExit();
+            }
+        }
+    }
+
     @Test
     @Disabled
     void getParquetSchemaFromResultSet() {}