apache
diff --git a/‎.github/workflows/distribution.yml‎
Lines changed: 2 additions & 0 deletions b/‎.github/workflows/distribution.yml‎
Lines changed: 2 additions & 0 deletions
diff --git a/‎.github/workflows/gradle-precommit.yml‎
Lines changed: 6 additions & 0 deletions b/‎.github/workflows/gradle-precommit.yml‎
Lines changed: 6 additions & 0 deletions
diff --git a/‎.github/workflows/hunspell.yml‎
Lines changed: 3 additions & 0 deletions b/‎.github/workflows/hunspell.yml‎
Lines changed: 3 additions & 0 deletions
diff --git a/‎gradle/ge.gradle‎
Lines changed: 41 additions & 0 deletions b/‎gradle/ge.gradle‎
Lines changed: 41 additions & 0 deletions
diff --git a/‎lucene/CHANGES.txt‎
Lines changed: 22 additions & 3 deletions b/‎lucene/CHANGES.txt‎
Lines changed: 22 additions & 3 deletions
diff --git a/‎lucene/backward-codecs/src/java/module-info.java‎
Lines changed: 5 additions & 2 deletions b/‎lucene/backward-codecs/src/java/module-info.java‎
Lines changed: 5 additions & 2 deletions
diff --git a/‎lucene/backward-codecs/src/java/org/apache/lucene/backward_codecs/lucene70/Lucene70SegmentInfoFormat.java‎
Lines changed: 1 addition & 0 deletions b/‎lucene/backward-codecs/src/java/org/apache/lucene/backward_codecs/lucene70/Lucene70SegmentInfoFormat.java‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎lucene/backward-codecs/src/java/org/apache/lucene/backward_codecs/lucene86/Lucene86SegmentInfoFormat.java‎
Lines changed: 1 addition & 0 deletions b/‎lucene/backward-codecs/src/java/org/apache/lucene/backward_codecs/lucene86/Lucene86SegmentInfoFormat.java‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎lucene/backward-codecs/src/java/org/apache/lucene/backward_codecs/lucene90/Lucene90Codec.java‎
Lines changed: 1 addition & 2 deletions b/‎lucene/backward-codecs/src/java/org/apache/lucene/backward_codecs/lucene90/Lucene90Codec.java‎
Lines changed: 1 addition & 2 deletions
diff --git a/‎lucene/backward-codecs/src/java/org/apache/lucene/backward_codecs/lucene90/Lucene90SegmentInfoFormat.java‎
Lines changed: 179 additions & 0 deletions b/‎lucene/backward-codecs/src/java/org/apache/lucene/backward_codecs/lucene90/Lucene90SegmentInfoFormat.java‎
Lines changed: 179 additions & 0 deletions
@@ -26,6 +26,8 @@ jobs:
         # we want to run the distribution tests on all major OSs, but it's occasionally too slow (or hangs or the forked process is not started at all..., not sure the cause) on windows.
         #os: [ubuntu-latest, macos-latest, windows-latest]
         os: [ubuntu-latest, macos-latest]
+    env:
+      GRADLE_ENTERPRISE_ACCESS_KEY: ${{ secrets.GE_ACCESS_TOKEN }}
 
     steps:
     - uses: actions/checkout@v3
 
@@ -27,6 +27,9 @@ jobs:
         # Test JVMs.
         java: [ '17' ]
 
+    env:
+      GRADLE_ENTERPRISE_ACCESS_KEY: ${{ secrets.GE_ACCESS_TOKEN }}
+
     steps:
     - uses: actions/checkout@v3
 
@@ -58,6 +61,9 @@ jobs:
         # Test JVMs.
         java: [ '17' ]
 
+    env:
+      GRADLE_ENTERPRISE_ACCESS_KEY: ${{ secrets.GE_ACCESS_TOKEN }}
+
     steps:
     - uses: actions/checkout@v3
 
 
@@ -15,6 +15,9 @@ jobs:
 
     runs-on: ubuntu-latest
 
+    env:
+      GRADLE_ENTERPRISE_ACCESS_KEY: ${{ secrets.GE_ACCESS_TOKEN }}
+
     steps:
     - uses: actions/checkout@v3
 
 
@@ -0,0 +1,41 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements.  See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+def isCIBuild = System.getenv().keySet().find { it ==~ /(?i)((JENKINS|HUDSON)(_\w+)?|CI)/ } != null // true if an env var is named CI, JENKINS[_x] or HUDSON[_x], any case
+
+gradleEnterprise {
+    server = "https://ge.apache.org"
+    buildScan {
+        capture { taskInputFiles = true }
+        uploadInBackground = !isCIBuild // background upload only for non-CI builds
+        publishAlways()
+        publishIfAuthenticated()
+        obfuscation {
+            ipAddresses { addresses -> addresses.collect { address -> "0.0.0.0"} } // every captured address is replaced by 0.0.0.0
+        }
+    }
+}
+
+buildCache {
+    local {
+        enabled = !isCIBuild // local build cache is switched off on CI
+    }
+
+    remote(gradleEnterprise.buildCache) {
+        enabled = false // remote cache is declared but disabled
+    }
+}
@@ -62,6 +62,9 @@ API Changes
 
 * GITHUB#12599: Add RandomAccessInput#readBytes method to the RandomAccessInput interface. (Ignacio Vera)
 
+* GITHUB#12709: Consolidate FSTStore and BytesStore in FST. Created FSTReader which contains the common methods
+  of the two. (Anh Dung Bui)
+
 New Features
 ---------------------
 
@@ -150,13 +153,18 @@ API Changes
 * GITHUB#12592: Add RandomAccessInput#length method to the RandomAccessInput interface. In addition deprecate
   ByteBuffersDataInput#size in favour of this new method. (Ignacio Vera)
 
-* GITHUB#12646: Move FST#addNode to FSTCompiler to avoid a circular dependency between FST and FSTCompiler
+* GITHUB#12646, GITHUB#12690: Move FST#addNode to FSTCompiler to avoid a circular dependency
+  between FST and FSTCompiler (Anh Dung Bui)
 
 New Features
 ---------------------
+
 * GITHUB#12548: Added similarityToQueryVector API to compute vector similarity scores
   with DoubleValuesSource. (Shubham Chaudhary)
 
+* GITHUB#12685: Lucene now records if documents have been indexed as blocks in SegmentInfo. This is recorded on a per
+  segment basis and maintained across merges. The property is exposed via LeafReaderMetadata. (Simon Willnauer)
+
 Improvements
 ---------------------
 * GITHUB#12523: TaskExecutor waits for all tasks to complete before returning when Exceptions
@@ -186,6 +194,8 @@ Improvements
 * GITHUB#12705, GITHUB#12705: Improve handling of NullPointerException and IllegalStateException
   in MMapDirectory's IndexInputs.  (Uwe Schindler, Michael Sokolov)
 
+* GITHUB#12689: TaskExecutor to cancel all tasks on exception to avoid needless computation. (Luca Cavanna)
+
 Optimizations
 ---------------------
 * GITHUB#12183: Make TermStates#build concurrent. (Shubham Chaudhary)
@@ -194,7 +204,7 @@ Optimizations
 
 * GITHUB#12382: Faster top-level conjunctions on term queries when sorting by
   descending score. (Adrien Grand)
-  
+
 * GITHUB#12591: Use stable radix sort to speed up the sorting of update terms. (Guo Feng)
 
 * GITHUB#12587: Use radix sort to speed up the sorting of terms in TermInSetQuery. (Guo Feng)
@@ -209,11 +219,18 @@ Optimizations
 
 * GITHUB#12668: ImpactsEnums now decode frequencies lazily like PostingsEnums.
   (Adrien Grand)
-  
+
 * GITHUB#12651: Use 2d array for OnHeapHnswGraph representation. (Patrick Zhai)
 
 * GITHUB#12653: Optimize computing number of levels in MultiLevelSkipListWriter#bufferSkip. (Shubham Chaudhary)
 
+* GITHUB#12589: Disjunctions now sometimes run as conjunctions when the minimum
+  competitive score requires multiple clauses to match. (Adrien Grand)
+
+* GITHUB#12710: Use Arrays#mismatch for Outputs#common operations. (Guo Feng)
+
+* GITHUB#12712: Speed up sorting postings file with an offline radix sorter in BPIndexReader. (Guo Feng)
+
 Changes in runtime behavior
 ---------------------
 
@@ -232,6 +249,8 @@ Bug Fixes
 
 * GITHUB#12642: Ensure #finish only gets called once on the base collector during drill-sideways (Greg Miller)
 
+* GITHUB#12682: Scorer should sum up scores into a double. (Shubham Chaudhary)
+
 Build
 ---------------------
 
 
@@ -34,6 +34,7 @@
   exports org.apache.lucene.backward_codecs.lucene91;
   exports org.apache.lucene.backward_codecs.lucene92;
   exports org.apache.lucene.backward_codecs.lucene94;
+  exports org.apache.lucene.backward_codecs.lucene95;
   exports org.apache.lucene.backward_codecs.packed;
   exports org.apache.lucene.backward_codecs.store;
 
@@ -46,7 +47,8 @@
       org.apache.lucene.backward_codecs.lucene90.Lucene90HnswVectorsFormat,
       org.apache.lucene.backward_codecs.lucene91.Lucene91HnswVectorsFormat,
       org.apache.lucene.backward_codecs.lucene92.Lucene92HnswVectorsFormat,
-      org.apache.lucene.backward_codecs.lucene94.Lucene94HnswVectorsFormat;
+      org.apache.lucene.backward_codecs.lucene94.Lucene94HnswVectorsFormat,
+      org.apache.lucene.backward_codecs.lucene95.Lucene95HnswVectorsFormat;
   provides org.apache.lucene.codecs.Codec with
       org.apache.lucene.backward_codecs.lucene80.Lucene80Codec,
       org.apache.lucene.backward_codecs.lucene84.Lucene84Codec,
@@ -55,5 +57,6 @@
       org.apache.lucene.backward_codecs.lucene90.Lucene90Codec,
       org.apache.lucene.backward_codecs.lucene91.Lucene91Codec,
       org.apache.lucene.backward_codecs.lucene92.Lucene92Codec,
-      org.apache.lucene.backward_codecs.lucene94.Lucene94Codec;
+      org.apache.lucene.backward_codecs.lucene94.Lucene94Codec,
+      org.apache.lucene.backward_codecs.lucene95.Lucene95Codec;
 }
@@ -307,6 +307,7 @@ private SegmentInfo parseSegmentInfo(
             segment,
             docCount,
             isCompoundFile,
+            false,
             null,
             diagnostics,
             segmentID,
 
@@ -164,6 +164,7 @@ private SegmentInfo parseSegmentInfo(
             segment,
             docCount,
             isCompoundFile,
+            false,
             null,
             diagnostics,
             segmentID,
 
@@ -36,7 +36,6 @@
 import org.apache.lucene.codecs.lucene90.Lucene90NormsFormat;
 import org.apache.lucene.codecs.lucene90.Lucene90PointsFormat;
 import org.apache.lucene.codecs.lucene90.Lucene90PostingsFormat;
-import org.apache.lucene.codecs.lucene90.Lucene90SegmentInfoFormat;
 import org.apache.lucene.codecs.lucene90.Lucene90StoredFieldsFormat;
 import org.apache.lucene.codecs.lucene90.Lucene90TermVectorsFormat;
 import org.apache.lucene.codecs.perfield.PerFieldDocValuesFormat;
@@ -143,7 +142,7 @@ public final FieldInfosFormat fieldInfosFormat() {
   }
 
   @Override
-  public final SegmentInfoFormat segmentInfoFormat() {
+  public SegmentInfoFormat segmentInfoFormat() {
     return segmentInfosFormat;
   }
 
 
@@ -0,0 +1,179 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements.  See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.lucene.backward_codecs.lucene90;
+
+import java.io.IOException;
+import java.util.Map;
+import java.util.Set;
+import org.apache.lucene.codecs.CodecUtil;
+import org.apache.lucene.codecs.SegmentInfoFormat;
+import org.apache.lucene.index.CorruptIndexException;
+import org.apache.lucene.index.IndexFileNames;
+import org.apache.lucene.index.IndexWriter;
+import org.apache.lucene.index.SegmentInfo;
+import org.apache.lucene.index.SegmentInfos;
+import org.apache.lucene.index.SortFieldProvider;
+import org.apache.lucene.search.Sort;
+import org.apache.lucene.search.SortField;
+import org.apache.lucene.store.ChecksumIndexInput;
+import org.apache.lucene.store.DataInput;
+import org.apache.lucene.store.DataOutput;
+import org.apache.lucene.store.Directory;
+import org.apache.lucene.store.IOContext;
+import org.apache.lucene.util.Version;
+
+/**
+ * Lucene 9.0 Segment info format (read-only here; {@link #write} always throws).
+ *
+ * <p>Files:
+ *
+ * <ul>
+ *   <li><code>.si</code>: Header, SegVersion, HasMinVersion, [SegMinVersion], SegSize,
+ *       IsCompoundFile, Diagnostics, Files, Attributes, IndexSort, Footer
+ * </ul>
+ *
+ * Data types:
+ *
+ * <ul>
+ *   <li>Header --&gt; {@link CodecUtil#writeIndexHeader IndexHeader}
+ *   <li>SegSize --&gt; {@link DataOutput#writeInt Int32}
+ *   <li>SegVersion, SegMinVersion --&gt; three {@link DataOutput#writeInt Int32} values each
+ *   <li>HasMinVersion --&gt; {@link DataOutput#writeByte Int8}
+ *   <li>Files --&gt; {@link DataOutput#writeSetOfStrings Set&lt;String&gt;}
+ *   <li>Diagnostics,Attributes --&gt; {@link DataOutput#writeMapOfStrings Map&lt;String,String&gt;}
+ *   <li>IsCompoundFile --&gt; {@link DataOutput#writeByte Int8}
+ *   <li>IndexSort --&gt; {@link DataOutput#writeVInt Int32} count, then {@code count} SortFields
+ *   <li>SortField --&gt; {@link DataOutput#writeString String} sort class, followed by a per-sort
+ *       bytestream (see {@link SortFieldProvider#readSortField(DataInput)})
+ *   <li>Footer --&gt; {@link CodecUtil#writeFooter CodecFooter}
+ * </ul>
+ *
+ * Field Descriptions:
+ *
+ * <ul>
+ *   <li>SegVersion is the code version that created the segment.
+ *   <li>SegMinVersion is the minimum code version that contributed documents to the segment.
+ *   <li>HasMinVersion is 1 if SegMinVersion is present, 0 if absent; anything else is corrupt.
+ *   <li>SegSize is the number of documents contained in the segment index.
+ *   <li>IsCompoundFile records whether the segment is written as a compound file or not. If this is
+ *       -1, the segment is not a compound file. If it is 1, the segment is a compound file.
+ *   <li>The Diagnostics Map is privately written by {@link IndexWriter}, as a debugging aid, for
+ *       each segment it creates. It includes metadata like the current Lucene version, OS, Java
+ *       version, why the segment was created (merge, flush, addIndexes), etc.
+ *   <li>Files is a list of files referred to by this segment.
+ * </ul>
+ *
+ * @see SegmentInfos
+ * @lucene.experimental
+ */
+public class Lucene90SegmentInfoFormat extends SegmentInfoFormat {
+
+  /** File extension used to store {@link SegmentInfo}. */
+  public static final String SI_EXTENSION = "si";
+
+  static final String CODEC_NAME = "Lucene90SegmentInfo"; // passed to checkIndexHeader in read
+  static final int VERSION_START = 0;
+  static final int VERSION_CURRENT = VERSION_START; // same as VERSION_START: a single version
+
+  /** Sole constructor. */
+  public Lucene90SegmentInfoFormat() {}
+
+  @Override
+  public SegmentInfo read(Directory dir, String segment, byte[] segmentID, IOContext context)
+      throws IOException { // header check, then body parse, then footer check
+    final String fileName = IndexFileNames.segmentFileName(segment, "", SI_EXTENSION);
+    try (ChecksumIndexInput input = dir.openChecksumInput(fileName)) {
+      Throwable priorE = null; // whatever the header check or parsing threw, if anything
+      SegmentInfo si = null;
+      try {
+        CodecUtil.checkIndexHeader(
+            input, CODEC_NAME, VERSION_START, VERSION_CURRENT, segmentID, "");
+        si = parseSegmentInfo(dir, input, segment, segmentID);
+      } catch (Throwable exception) {
+        priorE = exception; // held back so checkFooter can see it
+      } finally {
+        CodecUtil.checkFooter(input, priorE); // runs on both the success and the failure path
+      }
+      return si; // NOTE(review): null if checkFooter returns despite priorE; confirm it rethrows
+    }
+  }
+
+  private SegmentInfo parseSegmentInfo( // decodes the .si body in the order the fields are read
+      Directory dir, DataInput input, String segment, byte[] segmentID) throws IOException {
+    final Version version = Version.fromBits(input.readInt(), input.readInt(), input.readInt());
+    byte hasMinVersion = input.readByte(); // 0: no min version stored, 1: stored
+    final Version minVersion;
+    switch (hasMinVersion) {
+      case 0:
+        minVersion = null;
+        break;
+      case 1:
+        minVersion = Version.fromBits(input.readInt(), input.readInt(), input.readInt());
+        break;
+      default:
+        throw new CorruptIndexException("Illegal boolean value " + hasMinVersion, input);
+    }
+
+    final int docCount = input.readInt();
+    if (docCount < 0) {
+      throw new CorruptIndexException("invalid docCount: " + docCount, input);
+    }
+    final boolean isCompoundFile = input.readByte() == SegmentInfo.YES; // else: not compound
+
+    final Map<String, String> diagnostics = input.readMapOfStrings();
+    final Set<String> files = input.readSetOfStrings();
+    final Map<String, String> attributes = input.readMapOfStrings();
+
+    int numSortFields = input.readVInt(); // 0 means no index sort
+    Sort indexSort;
+    if (numSortFields > 0) {
+      SortField[] sortFields = new SortField[numSortFields];
+      for (int i = 0; i < numSortFields; i++) {
+        String name = input.readString(); // SortFieldProvider name
+        sortFields[i] = SortFieldProvider.forName(name).readSortField(input);
+      }
+      indexSort = new Sort(sortFields);
+    } else if (numSortFields < 0) {
+      throw new CorruptIndexException("invalid index sort field count: " + numSortFields, input);
+    } else {
+      indexSort = null;
+    }
+
+    SegmentInfo si =
+        new SegmentInfo(
+            dir,
+            version,
+            minVersion,
+            segment,
+            docCount,
+            isCompoundFile,
+            false, // presumably the "indexed as blocks" flag; never stored in this format - confirm
+            null,
+            diagnostics,
+            segmentID,
+            attributes,
+            indexSort);
+    si.setFiles(files);
+    return si;
+  }
+
+  @Override
+  public void write(Directory dir, SegmentInfo si, IOContext ioContext) throws IOException {
+    throw new UnsupportedOperationException("Old formats can't be used for writing");
+  }
+}
Original file line number	Diff line number	Diff line change
`@@ -36,7 +36,6 @@`
`36`	`36`	`import org.apache.lucene.codecs.lucene90.Lucene90NormsFormat;`
`37`	`37`	`import org.apache.lucene.codecs.lucene90.Lucene90PointsFormat;`
`38`	`38`	`import org.apache.lucene.codecs.lucene90.Lucene90PostingsFormat;`
`39`		`-import org.apache.lucene.codecs.lucene90.Lucene90SegmentInfoFormat;`
`40`	`39`	`import org.apache.lucene.codecs.lucene90.Lucene90StoredFieldsFormat;`
`41`	`40`	`import org.apache.lucene.codecs.lucene90.Lucene90TermVectorsFormat;`
`42`	`41`	`import org.apache.lucene.codecs.perfield.PerFieldDocValuesFormat;`
`@@ -143,7 +142,7 @@ public final FieldInfosFormat fieldInfosFormat() {`
`143`	`142`	`}`
`144`	`143`
`145`	`144`	`@Override`
`146`		`- public final SegmentInfoFormat segmentInfoFormat() {`
	`145`	`+ public SegmentInfoFormat segmentInfoFormat() {`
`147`	`146`	`return segmentInfosFormat;`
`148`	`147`	`}`
`149`	`148`