Commit 546257c

local recovery via catalogsnapshot (#19841)
Signed-off-by: bharath-techie <[email protected]>
1 parent f14a910
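
The change replaces per-segment Java serialization of CatalogSnapshot with a Writeable-based encoding, persists the encoded snapshot in the Lucene commit's user data, and reads it back when a shard reopens, so searchable files can be recovered locally after a restart.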

4 files changed: +147 −9 lines changed

server/src/main/java/org/opensearch/index/engine/exec/WriterFileSet.java

Lines changed: 30 additions & 1 deletion
@@ -8,12 +8,17 @@
 
 package org.opensearch.index.engine.exec;
 
+import org.opensearch.core.common.io.stream.StreamInput;
+import org.opensearch.core.common.io.stream.StreamOutput;
+import org.opensearch.core.common.io.stream.Writeable;
+
+import java.io.IOException;
 import java.io.Serializable;
 import java.nio.file.Path;
 import java.util.HashSet;
 import java.util.Set;
 
-public class WriterFileSet implements Serializable {
+public class WriterFileSet implements Serializable, Writeable {
 
     private final String directory;
     private final long writerGeneration;
@@ -25,6 +30,30 @@ public WriterFileSet(Path directory, long writerGeneration) {
         this.directory = directory.toString();
     }
 
+    public WriterFileSet(StreamInput in) throws IOException {
+        this.directory = in.readString();
+        this.writerGeneration = in.readLong();
+
+        int fileCount = in.readVInt();
+        this.files = new HashSet<>(fileCount);
+        for (int i = 0; i < fileCount; i++) {
+            this.files.add(in.readString());
+        }
+    }
+
+    /**
+     * Serialize this WriterFileSet to StreamOutput
+     */
+    @Override
+    public void writeTo(StreamOutput out) throws IOException {
+        out.writeString(directory);
+        out.writeLong(writerGeneration);
+        out.writeVInt(files.size());
+        for (String file : files) {
+            out.writeString(file);
+        }
+    }
+
     public void add(String file) {
         this.files.add(file);
     }
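
The new Writeable support makes WriterFileSet round-trippable through OpenSearch's stream abstractions. A minimal sketch of that round trip, assuming the WriterFileSet(Path, long) constructor and add(String) shown above; the directory path and file names are illustrative:

    import org.opensearch.common.io.stream.BytesStreamOutput;
    import org.opensearch.core.common.io.stream.BytesStreamInput;
    import org.opensearch.index.engine.exec.WriterFileSet;

    import java.nio.file.Path;

    public class WriterFileSetRoundTrip {
        public static void main(String[] args) throws Exception {
            WriterFileSet original = new WriterFileSet(Path.of("/tmp/shard0/writer"), 3L);
            original.add("_0.parquet");   // illustrative file names
            original.add("_0.meta");

            try (BytesStreamOutput out = new BytesStreamOutput()) {
                original.writeTo(out);                                  // new writeTo(StreamOutput)
                byte[] bytes = out.bytes().toBytesRef().bytes;          // same pattern the commit uses
                try (BytesStreamInput in = new BytesStreamInput(bytes)) {
                    WriterFileSet restored = new WriterFileSet(in);     // new StreamInput constructor
                    // restored carries the same directory, writer generation, and file set
                }
            }
        }
    }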

server/src/main/java/org/opensearch/index/engine/exec/commit/LuceneCommitEngine.java

Lines changed: 18 additions & 3 deletions
@@ -47,12 +47,27 @@ public void addLuceneIndexes(CatalogSnapshot catalogSnapshot) {
                 throw new RuntimeException(e);
             }
         });
-        Map<String, String> userData = new HashMap<>();
-        catalogSnapshot.getSegments().forEach(segment -> userData.put(String.valueOf(segment.getGeneration()),
-            new String(SerializationUtils.serialize(segment))));
+
+        Map<String, String> userData = null;
+        try {
+            userData = catalogSnapshot.toCommitUserData();
+        } catch (IOException e) {
+            throw new RuntimeException(e);
+        }
         indexWriter.setLiveCommitData(userData.entrySet());
     }
 
+    public CatalogSnapshot readCatalogSnapshot() throws IOException {
+        if (indexWriter.getLiveCommitData().iterator().hasNext()) {
+            Map.Entry<String, String> entry = indexWriter.getLiveCommitData().iterator().next();
+            return CatalogSnapshot.fromCommitUserData(entry.getValue());
+        }
+        return null;
+    }
+    public IndexWriter getIndexWriter() {
+        return indexWriter;
+    }
+
     @Override
     public CommitPoint commit(CatalogSnapshot catalogSnapshot) {
         addLuceneIndexes(catalogSnapshot);
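
The snapshot survives restarts because IndexWriter.setLiveCommitData stores these entries in the Lucene commit's user data, and getLiveCommitData returns them once the writer is reopened on the same directory. A hypothetical recovery-time caller, using only the APIs from this diff; the data path is illustrative:

    // Reopen the committer on the shard's durable data path (illustrative location)
    Path dataPath = Path.of("/var/lib/opensearch/shard0");
    LuceneCommitEngine committer = new LuceneCommitEngine(dataPath);

    // Read back the snapshot persisted by the last commit; null on a fresh shard
    CatalogSnapshot recovered = committer.readCatalogSnapshot();
    if (recovered != null) {
        // previously committed, searchable files are available without re-indexing
    }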

server/src/main/java/org/opensearch/index/engine/exec/coord/CatalogSnapshot.java

Lines changed: 86 additions & 2 deletions
@@ -9,24 +9,32 @@
 package org.opensearch.index.engine.exec.coord;
 
 import org.opensearch.common.annotation.ExperimentalApi;
+import org.opensearch.common.io.stream.BytesStreamOutput;
 import org.opensearch.common.util.concurrent.AbstractRefCounted;
+import org.opensearch.core.common.io.stream.BytesStreamInput;
+import org.opensearch.core.common.io.stream.StreamInput;
+import org.opensearch.core.common.io.stream.StreamOutput;
+import org.opensearch.core.common.io.stream.Writeable;
 import org.opensearch.index.engine.exec.FileMetadata;
 import org.opensearch.index.engine.exec.RefreshResult;
 import org.opensearch.index.engine.exec.WriterFileSet;
 
+import java.io.IOException;
 import java.io.Serializable;
 import java.util.ArrayList;
+import java.util.Base64;
 import java.util.Collection;
 import java.util.Collections;
 import java.util.HashMap;
 import java.util.List;
 import java.util.Map;
 
 @ExperimentalApi
-public class CatalogSnapshot extends AbstractRefCounted {
+public class CatalogSnapshot extends AbstractRefCounted implements Writeable {
 
     private final long id;
     private final Map<String, Collection<WriterFileSet>> dfGroupedSearchableFiles;
+    private static final String CATALOG_SNAPSHOT_KEY = "_catalog_snapshot_";
 
     public CatalogSnapshot(RefreshResult refreshResult, long id) {
         super("catalog_snapshot");
@@ -35,6 +43,60 @@ public CatalogSnapshot(RefreshResult refreshResult, long id) {
         refreshResult.getRefreshedFiles().forEach((dataFormat, writerFiles) -> dfGroupedSearchableFiles.put(dataFormat.name(), writerFiles));
     }
 
+    public CatalogSnapshot(StreamInput in) throws IOException {
+        super("catalog_snapshot");
+        this.id = in.readLong();
+        this.dfGroupedSearchableFiles = new HashMap<>();
+
+        int mapSize = in.readVInt();
+        for (int i = 0; i < mapSize; i++) {
+            String dataFormat = in.readString();
+            int fileSetCount = in.readVInt();
+            List<WriterFileSet> fileSets = new ArrayList<>(fileSetCount);
+            for (int j = 0; j < fileSetCount; j++) {
+                fileSets.add(new WriterFileSet(in));
+            }
+            dfGroupedSearchableFiles.put(dataFormat, fileSets);
+        }
+    }
+
+    @Override
+    public void writeTo(StreamOutput out) throws IOException {
+        out.writeLong(id);
+        out.writeVInt(dfGroupedSearchableFiles.size());
+        for (Map.Entry<String, Collection<WriterFileSet>> entry : dfGroupedSearchableFiles.entrySet()) {
+            out.writeString(entry.getKey());
+            out.writeVInt(entry.getValue().size());
+            for (WriterFileSet fileSet : entry.getValue()) {
+                fileSet.writeTo(out);
+            }
+        }
+    }
+
+    public String serializeToString() throws IOException {
+        try (BytesStreamOutput out = new BytesStreamOutput()) {
+            this.writeTo(out);
+            return Base64.getEncoder().encodeToString(out.bytes().toBytesRef().bytes);
+        }
+    }
+
+    public static CatalogSnapshot deserializeFromString(String serializedData) throws IOException {
+        byte[] bytes = Base64.getDecoder().decode(serializedData);
+        try (BytesStreamInput in = new BytesStreamInput(bytes)) {
+            return new CatalogSnapshot(in);
+        }
+    }
+
+    public Map<String, String> toCommitUserData() throws IOException {
+        Map<String, String> userData = new HashMap<>();
+        userData.put(CATALOG_SNAPSHOT_KEY, serializeToString());
+        return userData;
+    }
+
+    public static CatalogSnapshot fromCommitUserData(String userData) throws IOException {
+        return deserializeFromString(userData);
+    }
+
     public Collection<WriterFileSet> getSearchableFiles(String dataFormat) {
         if (dfGroupedSearchableFiles.containsKey(dataFormat)) {
             return dfGroupedSearchableFiles.get(dataFormat);
@@ -68,7 +130,7 @@ public String toString() {
             '}';
     }
 
-    public static class Segment implements Serializable {
+    public static class Segment implements Serializable, Writeable {
 
         private final long generation;
         private final Map<String, WriterFileSet> dfGroupedSearchableFiles;
@@ -78,6 +140,28 @@ public Segment(long generation) {
             this.generation = generation;
         }
 
+        public Segment(StreamInput in) throws IOException {
+            this.generation = in.readLong();
+            this.dfGroupedSearchableFiles = new HashMap<>();
+
+            int mapSize = in.readVInt();
+            for (int i = 0; i < mapSize; i++) {
+                String dataFormat = in.readString();
+                WriterFileSet fileSet = new WriterFileSet(in);
+                dfGroupedSearchableFiles.put(dataFormat, fileSet);
+            }
+        }
+
+        @Override
+        public void writeTo(StreamOutput out) throws IOException {
+            out.writeLong(generation);
+            out.writeVInt(dfGroupedSearchableFiles.size());
+            for (Map.Entry<String, WriterFileSet> entry : dfGroupedSearchableFiles.entrySet()) {
+                out.writeString(entry.getKey());
+                entry.getValue().writeTo(out);
+            }
+        }
+
         public void addSearchableFiles(String dataFormat, WriterFileSet writerFileSetGroup) {
             dfGroupedSearchableFiles.put(dataFormat, writerFileSetGroup);
         }
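
A sketch of the commit-user-data round trip these helpers provide; obtaining a snapshot from a RefreshResult is elided since it depends on engine internals, and the key string mirrors CATALOG_SNAPSHOT_KEY above:

    CatalogSnapshot snapshot = /* produced by a refresh */;

    // Encode: writeTo -> BytesStreamOutput -> Base64, stored under "_catalog_snapshot_"
    Map<String, String> userData = snapshot.toCommitUserData();
    String encoded = userData.get("_catalog_snapshot_");

    // Decode: Base64 -> BytesStreamInput -> CatalogSnapshot(StreamInput)
    CatalogSnapshot restored = CatalogSnapshot.fromCommitUserData(encoded);

Decoding reads exactly the fields writeTo emitted, so any spare capacity in the backing array returned by toBytesRef() is simply never consumed.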

server/src/main/java/org/opensearch/index/engine/exec/coord/CompositeEngine.java

Lines changed: 13 additions & 3 deletions
@@ -8,6 +8,7 @@
 
 package org.opensearch.index.engine.exec.coord;
 
+import org.apache.commons.lang3.SerializationUtils;
 import org.apache.lucene.search.ReferenceManager;
 import org.opensearch.common.annotation.ExperimentalApi;
 import org.opensearch.index.engine.CatalogSnapshotAwareRefreshListener;
@@ -48,6 +49,7 @@
 import java.util.Collection;
 import java.util.Collections;
 import java.util.HashMap;
+import java.util.Iterator;
 import java.util.List;
 import java.util.Map;
 
@@ -67,17 +69,18 @@ public CompositeEngine(MapperService mapperService, PluginsService pluginsServic
         List<SearchEnginePlugin> searchEnginePlugins = pluginsService.filterPlugins(SearchEnginePlugin.class);
         // How to bring the Dataformat here? Currently this means only Text and LuceneFormat can be used
         this.engine = new CompositeIndexingExecutionEngine(mapperService, pluginsService, shardPath, 0);
-        Path committerPath = Files.createTempDirectory("lucene-committer-index");
-        this.compositeEngineCommitter = new LuceneCommitEngine(committerPath);
-
+        this.compositeEngineCommitter = new LuceneCommitEngine(shardPath.getDataPath());
+        this.catalogSnapshot = ((LuceneCommitEngine) this.compositeEngineCommitter).readCatalogSnapshot();
         this.mergeHandler = new ParquetMergeHandler(this, this.engine, this.engine.getDataFormat());
         mergeScheduler = new MergeScheduler(this.mergeHandler, this);
 
         // Refresh here so that catalog snapshot gets initialized
         // TODO : any better way to do this ?
         refresh("start");
+
         // TODO : how to extend this for Lucene ? where engine is a r/w engine
         // Create read specific engines for each format which is associated with shard
+
         for (SearchEnginePlugin searchEnginePlugin : searchEnginePlugins) {
             for (org.opensearch.vectorized.execution.search.DataFormat dataFormat : searchEnginePlugin.getSupportedFormats()) {
                 List<SearchExecEngine<?, ?, ?, ?>> currentSearchEngines = readEngines.getOrDefault(dataFormat, new ArrayList<>());
@@ -99,6 +102,13 @@ public CompositeEngine(MapperService mapperService, PluginsService pluginsServic
                 }
             }
         }
+        catalogSnapshotAwareRefreshListeners.forEach(ref -> {
+            try {
+                ref.afterRefresh(true, catalogSnapshot);
+            } catch (IOException e) {
+                throw new RuntimeException(e);
+            }
+        });
     }
 
     public SearchExecEngine<?, ?, ?, ?> getReadEngine(org.opensearch.vectorized.execution.search.DataFormat dataFormat) {
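
On construction the committer now opens on the shard's durable data path instead of a temp directory, recovers the previous CatalogSnapshot, and, once the read engines are wired up, replays it to every registered listener. A hypothetical listener, assuming afterRefresh(boolean, CatalogSnapshot) is the interface's only abstract method; the format name is illustrative:

    CatalogSnapshotAwareRefreshListener listener = new CatalogSnapshotAwareRefreshListener() {
        @Override
        public void afterRefresh(boolean didRefresh, CatalogSnapshot snapshot) throws IOException {
            if (snapshot != null) {
                // point this format's read engine at the recovered file sets
                Collection<WriterFileSet> files = snapshot.getSearchableFiles("parquet");
            }
        }
    };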
