Support atomic writes with Hadoop 3.4.2+

junmuz · ymuzammil · commit 33e92df7bf06 · 2026-02-06T00:21:50.000-08:00
diff --git a/paimon-filesystems/paimon-azure-impl/src/main/java/org/apache/paimon/azure/AzureFileIO.java b/paimon-filesystems/paimon-azure-impl/src/main/java/org/apache/paimon/azure/AzureFileIO.java
@@ -20,9 +20,12 @@
 
 import org.apache.paimon.catalog.CatalogContext;
 import org.apache.paimon.fs.FileIO;
+import org.apache.paimon.fs.Path;
 import org.apache.paimon.options.Options;
 
 import org.apache.hadoop.conf.Configuration;
+import org.apache.hadoop.fs.FSDataOutputStream;
+import org.apache.hadoop.fs.FileAlreadyExistsException;
 import org.apache.hadoop.fs.FileSystem;
 import org.apache.hadoop.fs.azure.NativeAzureFileSystem;
 import org.apache.hadoop.fs.azurebfs.AzureBlobFileSystem;
@@ -32,6 +35,7 @@
 import java.io.IOException;
 import java.io.UncheckedIOException;
 import java.net.URI;
+import java.nio.charset.StandardCharsets;
 import java.util.Map;
 import java.util.Objects;
 import java.util.concurrent.ConcurrentHashMap;
@@ -66,6 +70,34 @@ public void configure(CatalogContext context) {
         this.hadoopOptions = mirrorCertainHadoopConfig(loadHadoopConfigFromContext(context));
     }
 
+    /**
+     * Tries to create {@code path} holding {@code content} (UTF-8) without overwriting.
+     * NOTE(review): atomicity depends on how the store enforces overwrite(false) - confirm.
+     *
+     * @param path the target file path
+     * @param content the content to write
+     * @return true if the write completed, false if a FileAlreadyExistsException was raised
+     * @throws IOException on any other I/O error
+     */
+    @Override
+    public boolean tryToWriteAtomic(Path path, String content) throws IOException {
+        org.apache.hadoop.fs.Path hadoopPath = path(path);
+        FileSystem fs = getFileSystem(hadoopPath);
+
+        byte[] contentBytes = content.getBytes(StandardCharsets.UTF_8);
+
+        try (FSDataOutputStream out =
+                fs.createFile(hadoopPath)
+                        .create()
+                        .overwrite(false) // Fails if file exists
+                        .build()) {
+            out.write(contentBytes);
+            return true;
+        } catch (FileAlreadyExistsException e) { // also covers exceptions thrown by close()
+            LOG.debug("Conditional write failed, file already exists: {}", path);
+            return false;
+        }
+    }
+
     // add additional config entries from the IO config to the Hadoop config
     private Options loadHadoopConfigFromContext(CatalogContext context) {
         Options hadoopConfig = new Options();
diff --git a/paimon-filesystems/paimon-azure-impl/src/main/java/org/apache/paimon/azure/HadoopCompliantFileIO.java b/paimon-filesystems/paimon-azure-impl/src/main/java/org/apache/paimon/azure/HadoopCompliantFileIO.java
@@ -102,11 +102,11 @@ public boolean rename(Path src, Path dst) throws IOException {
         return getFileSystem(hadoopSrc).rename(hadoopSrc, hadoopDst);
     }
 
-    private org.apache.hadoop.fs.Path path(Path path) {
+    protected org.apache.hadoop.fs.Path path(Path path) { // Hadoop path built from the URI
         return new org.apache.hadoop.fs.Path(path.toUri());
     }
 
-    private FileSystem getFileSystem(org.apache.hadoop.fs.Path path) throws IOException {
+    protected FileSystem getFileSystem(org.apache.hadoop.fs.Path path) throws IOException {
         if (fs == null) {
             synchronized (this) {
                 if (fs == null) {
diff --git a/paimon-filesystems/paimon-s3-impl/src/main/java/org/apache/paimon/s3/S3FileIO.java b/paimon-filesystems/paimon-s3-impl/src/main/java/org/apache/paimon/s3/S3FileIO.java
@@ -25,6 +25,8 @@
 import org.apache.paimon.options.Options;
 
 import org.apache.hadoop.conf.Configuration;
+import org.apache.hadoop.fs.FSDataOutputStream;
+import org.apache.hadoop.fs.FileAlreadyExistsException;
 import org.apache.hadoop.fs.FileSystem;
 import org.apache.hadoop.fs.s3a.S3AFileSystem;
 import org.slf4j.Logger;
@@ -33,6 +35,7 @@
 import java.io.IOException;
 import java.io.UncheckedIOException;
 import java.net.URI;
+import java.nio.charset.StandardCharsets;
 import java.util.Map;
 import java.util.Objects;
 import java.util.concurrent.ConcurrentHashMap;
@@ -85,6 +88,34 @@ public TwoPhaseOutputStream newTwoPhaseOutputStream(Path path, boolean overwrite
                 new S3MultiPartUpload(fs, fs.getConf()), hadoopPath, path);
     }
 
+    /**
+     * Tries to create {@code path} holding {@code content} (UTF-8) without overwriting.
+     * NOTE(review): atomicity depends on how S3A enforces overwrite(false) - confirm.
+     *
+     * @param path the target file path
+     * @param content the content to write
+     * @return true if the write completed, false if a FileAlreadyExistsException was raised
+     * @throws IOException on any other I/O error
+     */
+    @Override
+    public boolean tryToWriteAtomic(Path path, String content) throws IOException {
+        org.apache.hadoop.fs.Path hadoopPath = path(path);
+        FileSystem fs = getFileSystem(hadoopPath); // builder API lives on FileSystem; no cast
+
+        byte[] contentBytes = content.getBytes(StandardCharsets.UTF_8);
+
+        try (FSDataOutputStream out =
+                fs.createFile(hadoopPath)
+                        .create()
+                        .overwrite(false) // Fails if file exists; NOTE(review): confirm S3A uses If-None-Match
+                        .build()) {
+            out.write(contentBytes);
+            return true;
+        } catch (FileAlreadyExistsException e) { // also covers exceptions thrown by close()
+            LOG.debug("Conditional write failed, file already exists: {}", path);
+            return false;
+        }
+    }
+
     // add additional config entries from the IO config to the Hadoop config
     private Options loadHadoopConfigFromContext(CatalogContext context) {
         Options hadoopConfig = new Options();

Original file line number	Diff line number	Diff line change
`@@ -102,11 +102,11 @@ public boolean rename(Path src, Path dst) throws IOException {`
`102`	`102`	`return getFileSystem(hadoopSrc).rename(hadoopSrc, hadoopDst);`
`103`	`103`	`}`
`104`	`104`
`105`		`- private org.apache.hadoop.fs.Path path(Path path) {`
	`105`	`+ protected org.apache.hadoop.fs.Path path(Path path) {`
`106`	`106`	`return new org.apache.hadoop.fs.Path(path.toUri());`
`107`	`107`	`}`
`108`	`108`
`109`		`- private FileSystem getFileSystem(org.apache.hadoop.fs.Path path) throws IOException {`
	`109`	`+ protected FileSystem getFileSystem(org.apache.hadoop.fs.Path path) throws IOException {`
`110`	`110`	`if (fs == null) {`
`111`	`111`	`synchronized (this) {`
`112`	`112`	`if (fs == null) {`