apache
diff --git a/lucene/codecs/src/java/org/apache/lucene/codecs/simpletext/SimpleTextVectorReader.java b/lucene/codecs/src/java/org/apache/lucene/codecs/simpletext/SimpleTextVectorReader.java
Lines changed: 5 additions & 5 deletions
diff --git a/lucene/core/src/java/org/apache/lucene/codecs/VectorFormat.java b/lucene/core/src/java/org/apache/lucene/codecs/VectorFormat.java
Lines changed: 8 additions & 1 deletion
diff --git a/lucene/core/src/java/org/apache/lucene/codecs/VectorReader.java b/lucene/core/src/java/org/apache/lucene/codecs/VectorReader.java
Lines changed: 17 additions & 0 deletions
diff --git a/lucene/core/src/java/org/apache/lucene/codecs/VectorWriter.java b/lucene/core/src/java/org/apache/lucene/codecs/VectorWriter.java
Lines changed: 0 additions & 6 deletions
diff --git a/lucene/core/src/java/org/apache/lucene/codecs/lucene90/Lucene90VectorReader.java b/lucene/core/src/java/org/apache/lucene/codecs/lucene90/Lucene90VectorReader.java
Lines changed: 65 additions & 55 deletions
diff --git a/lucene/core/src/java/org/apache/lucene/index/CodecReader.java b/lucene/core/src/java/org/apache/lucene/index/CodecReader.java
Lines changed: 14 additions & 0 deletions
diff --git a/lucene/core/src/java/org/apache/lucene/index/DocValuesLeafReader.java b/lucene/core/src/java/org/apache/lucene/index/DocValuesLeafReader.java
Lines changed: 7 additions & 0 deletions
diff --git a/lucene/core/src/java/org/apache/lucene/index/FilterLeafReader.java b/lucene/core/src/java/org/apache/lucene/index/FilterLeafReader.java
Lines changed: 7 additions & 0 deletions
diff --git a/lucene/core/src/java/org/apache/lucene/index/LeafReader.java b/lucene/core/src/java/org/apache/lucene/index/LeafReader.java
Lines changed: 20 additions & 0 deletions
diff --git a/lucene/core/src/java/org/apache/lucene/index/MergeReaderWrapper.java b/lucene/core/src/java/org/apache/lucene/index/MergeReaderWrapper.java
Lines changed: 7 additions & 0 deletions
@@ -141,6 +141,11 @@ public VectorValues getVectorValues(String field) throws IOException {
     return new SimpleTextVectorValues(fieldEntry, bytesSlice);
   }
 
+  @Override
+  public TopDocs search(String field, float[] target, int k, int fanout) throws IOException {
+    throw new UnsupportedOperationException();
+  }
+
   @Override
   public void checkIntegrity() throws IOException {
     IndexInput clone = dataIn.clone();
@@ -334,11 +339,6 @@ public float[] vectorValue(int targetOrd) throws IOException {
     public BytesRef binaryValue(int targetOrd) throws IOException {
       throw new UnsupportedOperationException();
     }
-
-    @Override
-    public TopDocs search(float[] target, int k, int fanout) throws IOException {
-      throw new UnsupportedOperationException();
-    }
   }
 
   private int readInt(IndexInput in, BytesRef field) throws IOException {
 
@@ -21,6 +21,8 @@
 import org.apache.lucene.index.SegmentReadState;
 import org.apache.lucene.index.SegmentWriteState;
 import org.apache.lucene.index.VectorValues;
+import org.apache.lucene.search.TopDocs;
+import org.apache.lucene.search.TopDocsCollector;
 
 /**
  * Encodes/decodes per-document vector and any associated indexing structures required to support
@@ -61,7 +63,12 @@ public VectorValues getVectorValues(String field) {
             }
 
             @Override
-            public void close() throws IOException {}
+            public TopDocs search(String field, float[] target, int k, int fanout) {
+              return TopDocsCollector.EMPTY_TOPDOCS;
+            }
+
+            @Override
+            public void close() {}
 
             @Override
             public long ramBytesUsed() {
 
@@ -20,6 +20,7 @@
 import java.io.Closeable;
 import java.io.IOException;
 import org.apache.lucene.index.VectorValues;
+import org.apache.lucene.search.TopDocs;
 import org.apache.lucene.util.Accountable;
 
 /** Reads vectors from an index. */
@@ -41,6 +42,22 @@ protected VectorReader() {}
   /** Returns the {@link VectorValues} for the given {@code field} */
   public abstract VectorValues getVectorValues(String field) throws IOException;
 
+  /**
+   * Return the k nearest neighbor documents as determined by comparison of their vector values for
+   * this field, to the given vector, by the field's search strategy. If the search strategy is
+   * reversed, lower values indicate nearer vectors, otherwise higher scores indicate nearer
+   * vectors. Unlike relevance scores, vector scores may be negative.
+   *
+   * @param field the vector field to search
+   * @param target the vector-valued query
+   * @param k the number of docs to return
+   * @param fanout control the accuracy/speed tradeoff - larger values give better recall at higher
+   *     cost
+   * @return the k nearest neighbor documents, along with their (searchStrategy-specific) scores.
+   */
+  public abstract TopDocs search(String field, float[] target, int k, int fanout)
+      throws IOException;
+
   /**
    * Returns an instance optimized for merging. This instance may only be consumed in the thread
    * that called {@link #getMergeInstance()}.
 
@@ -30,7 +30,6 @@
 import org.apache.lucene.index.RandomAccessVectorValues;
 import org.apache.lucene.index.RandomAccessVectorValuesProducer;
 import org.apache.lucene.index.VectorValues;
-import org.apache.lucene.search.TopDocs;
 import org.apache.lucene.util.BytesRef;
 
 /** Writes vectors to an index. */
@@ -246,11 +245,6 @@ public SearchStrategy searchStrategy() {
       return subs.get(0).values.searchStrategy();
     }
 
-    @Override
-    public TopDocs search(float[] target, int k, int fanout) throws IOException {
-      throw new UnsupportedOperationException();
-    }
-
     class MergerRandomAccess implements RandomAccessVectorValues {
 
       private final List<RandomAccessVectorValues> raSubs;
 
@@ -154,7 +154,36 @@ private void readFields(ChecksumIndexInput meta, FieldInfos infos) throws IOExce
       if (info == null) {
         throw new CorruptIndexException("Invalid field number: " + fieldNumber, meta);
       }
-      fields.put(info.name, readField(meta));
+
+      FieldEntry fieldEntry = readField(meta);
+      validateFieldEntry(info, fieldEntry);
+      fields.put(info.name, fieldEntry);
+    }
+  }
+
+  private void validateFieldEntry(FieldInfo info, FieldEntry fieldEntry) {
+    int dimension = info.getVectorDimension();
+    if (dimension != fieldEntry.dimension) {
+      throw new IllegalStateException(
+          "Inconsistent vector dimension for field=\""
+              + info.name
+              + "\"; "
+              + dimension
+              + " != "
+              + fieldEntry.dimension);
+    }
+
+    long numBytes = (long) fieldEntry.size() * dimension * Float.BYTES;
+    if (numBytes != fieldEntry.vectorDataLength) {
+      throw new IllegalStateException(
+          "Vector data length "
+              + fieldEntry.vectorDataLength
+              + " not matching size="
+              + fieldEntry.size()
+              + " * dim="
+              + dimension
+              + " * 4 = "
+              + numBytes);
     }
   }
 
@@ -199,40 +228,47 @@ public void checkIntegrity() throws IOException {
 
   @Override
   public VectorValues getVectorValues(String field) throws IOException {
-    FieldInfo info = fieldInfos.fieldInfo(field);
-    if (info == null) {
+    FieldEntry fieldEntry = fields.get(field);
+    if (fieldEntry == null || fieldEntry.dimension == 0) {
       return null;
     }
-    int dimension = info.getVectorDimension();
-    if (dimension == 0) {
-      return VectorValues.EMPTY;
-    }
+
+    return getOffHeapVectorValues(fieldEntry);
+  }
+
+  @Override
+  public TopDocs search(String field, float[] target, int k, int fanout) throws IOException {
     FieldEntry fieldEntry = fields.get(field);
-    if (fieldEntry == null) {
-      // There is a FieldInfo, but no vectors. Should we have deleted the FieldInfo?
+    if (fieldEntry == null || fieldEntry.dimension == 0) {
       return null;
     }
-    if (dimension != fieldEntry.dimension) {
-      throw new IllegalStateException(
-          "Inconsistent vector dimension for field=\""
-              + field
-              + "\"; "
-              + dimension
-              + " != "
-              + fieldEntry.dimension);
-    }
-    long numBytes = (long) fieldEntry.size() * dimension * Float.BYTES;
-    if (numBytes != fieldEntry.vectorDataLength) {
-      throw new IllegalStateException(
-          "Vector data length "
-              + fieldEntry.vectorDataLength
-              + " not matching size="
-              + fieldEntry.size()
-              + " * dim="
-              + dimension
-              + " * 4 = "
-              + numBytes);
+
+    OffHeapVectorValues vectorValues = getOffHeapVectorValues(fieldEntry);
+
+    // use a seed that is fixed for the index so we get reproducible results for the same query
+    final Random random = new Random(checksumSeed);
+    NeighborQueue results =
+        HnswGraph.search(target, k, k + fanout, vectorValues, getGraphValues(fieldEntry), random);
+    int i = 0;
+    ScoreDoc[] scoreDocs = new ScoreDoc[Math.min(results.size(), k)];
+    boolean reversed = fieldEntry.searchStrategy.reversed;
+    while (results.size() > 0) {
+      int node = results.topNode();
+      float score = results.topScore();
+      results.pop();
+      if (reversed) {
+        score = (float) Math.exp(-score / target.length);
+      }
+      scoreDocs[scoreDocs.length - ++i] = new ScoreDoc(fieldEntry.ordToDoc[node], score);
     }
+    // always report the hit count as a lower bound (>=): an exact count (==) could only be
+    // asserted when the index holds fewer than k vectors
+    return new TopDocs(
+        new TotalHits(results.visitedCount(), TotalHits.Relation.GREATER_THAN_OR_EQUAL_TO),
+        scoreDocs);
+  }
+
+  private OffHeapVectorValues getOffHeapVectorValues(FieldEntry fieldEntry) throws IOException {
     IndexInput bytesSlice =
         vectorData.slice("vector-data", fieldEntry.vectorDataOffset, fieldEntry.vectorDataLength);
     return new OffHeapVectorValues(fieldEntry, bytesSlice);
@@ -408,32 +444,6 @@ public RandomAccessVectorValues randomAccess() {
       return new OffHeapVectorValues(fieldEntry, dataIn.clone());
     }
 
-    @Override
-    public TopDocs search(float[] vector, int topK, int fanout) throws IOException {
-      // use a seed that is fixed for the index so we get reproducible results for the same query
-      final Random random = new Random(checksumSeed);
-      NeighborQueue results =
-          HnswGraph.search(
-              vector, topK, topK + fanout, randomAccess(), getGraphValues(fieldEntry), random);
-      int i = 0;
-      ScoreDoc[] scoreDocs = new ScoreDoc[Math.min(results.size(), topK)];
-      boolean reversed = searchStrategy().reversed;
-      while (results.size() > 0) {
-        int node = results.topNode();
-        float score = results.topScore();
-        results.pop();
-        if (reversed) {
-          score = (float) Math.exp(-score / vector.length);
-        }
-        scoreDocs[scoreDocs.length - ++i] = new ScoreDoc(fieldEntry.ordToDoc[node], score);
-      }
-      // always return >= the case where we can assert == is only when there are fewer than topK
-      // vectors in the index
-      return new TopDocs(
-          new TotalHits(results.visitedCount(), TotalHits.Relation.GREATER_THAN_OR_EQUAL_TO),
-          scoreDocs);
-    }
-
     @Override
     public float[] vectorValue(int targetOrd) throws IOException {
       dataIn.seek((long) targetOrd * byteSize);
 
@@ -25,6 +25,7 @@
 import org.apache.lucene.codecs.StoredFieldsReader;
 import org.apache.lucene.codecs.TermVectorsReader;
 import org.apache.lucene.codecs.VectorReader;
+import org.apache.lucene.search.TopDocs;
 
 /** LeafReader implemented by codec APIs. */
 public abstract class CodecReader extends LeafReader {
@@ -218,6 +219,19 @@ public final VectorValues getVectorValues(String field) throws IOException {
     return getVectorReader().getVectorValues(field);
   }
 
+  @Override
+  public final TopDocs searchNearestVectors(String field, float[] target, int k, int fanout)
+      throws IOException {
+    ensureOpen();
+    FieldInfo fi = getFieldInfos().fieldInfo(field);
+    if (fi == null || fi.getVectorDimension() == 0) {
+      // Field does not exist or does not index vectors
+      return null;
+    }
+
+    return getVectorReader().search(field, target, k, fanout);
+  }
+
   @Override
   protected void doClose() throws IOException {}
 
 
@@ -18,6 +18,7 @@
 package org.apache.lucene.index;
 
 import java.io.IOException;
+import org.apache.lucene.search.TopDocs;
 import org.apache.lucene.util.Bits;
 
 abstract class DocValuesLeafReader extends LeafReader {
@@ -51,6 +52,12 @@ public final VectorValues getVectorValues(String field) throws IOException {
     throw new UnsupportedOperationException();
   }
 
+  @Override
+  public TopDocs searchNearestVectors(String field, float[] target, int k, int fanout)
+      throws IOException {
+    throw new UnsupportedOperationException();
+  }
+
   @Override
   public final void checkIntegrity() throws IOException {
     throw new UnsupportedOperationException();
 
@@ -18,6 +18,7 @@
 
 import java.io.IOException;
 import java.util.Iterator;
+import org.apache.lucene.search.TopDocs;
 import org.apache.lucene.util.AttributeSource;
 import org.apache.lucene.util.Bits;
 import org.apache.lucene.util.BytesRef;
@@ -343,6 +344,12 @@ public VectorValues getVectorValues(String field) throws IOException {
     return in.getVectorValues(field);
   }
 
+  @Override
+  public TopDocs searchNearestVectors(String field, float[] target, int k, int fanout)
+      throws IOException {
+    return in.searchNearestVectors(field, target, k, fanout);
+  }
+
   @Override
   public Fields getTermVectors(int docID) throws IOException {
     ensureOpen();
 
@@ -17,6 +17,7 @@
 package org.apache.lucene.index;
 
 import java.io.IOException;
+import org.apache.lucene.search.TopDocs;
 import org.apache.lucene.util.Bits;
 
 /**
@@ -207,9 +208,28 @@ public final PostingsEnum postings(Term term) throws IOException {
   /**
    * Returns {@link VectorValues} for this field, or null if no {@link VectorValues} were indexed.
    * The returned instance should only be used by a single thread.
+   *
+   * @lucene.experimental
    */
   public abstract VectorValues getVectorValues(String field) throws IOException;
 
+  /**
+   * Return the k nearest neighbor documents as determined by comparison of their vector values for
+   * this field, to the given vector, by the field's search strategy. If the search strategy is
+   * reversed, lower values indicate nearer vectors, otherwise higher scores indicate nearer
+   * vectors. Unlike relevance scores, vector scores may be negative.
+   *
+   * @param field the vector field to search
+   * @param target the vector-valued query
+   * @param k the number of docs to return
+   * @param fanout control the accuracy/speed tradeoff - larger values give better recall at higher
+   *     cost
+   * @return the k nearest neighbor documents, along with their (searchStrategy-specific) scores.
+   * @lucene.experimental
+   */
+  public abstract TopDocs searchNearestVectors(String field, float[] target, int k, int fanout)
+      throws IOException;
+
   /**
    * Get the {@link FieldInfos} describing all fields in this reader.
    *
 
@@ -24,6 +24,7 @@
 import org.apache.lucene.codecs.NormsProducer;
 import org.apache.lucene.codecs.StoredFieldsReader;
 import org.apache.lucene.codecs.TermVectorsReader;
+import org.apache.lucene.search.TopDocs;
 import org.apache.lucene.util.Bits;
 
 /**
@@ -202,6 +203,12 @@ public VectorValues getVectorValues(String fieldName) throws IOException {
     return in.getVectorValues(fieldName);
   }
 
+  @Override
+  public TopDocs searchNearestVectors(String field, float[] target, int k, int fanout)
+      throws IOException {
+    return in.searchNearestVectors(field, target, k, fanout);
+  }
+
   @Override
   public int numDocs() {
     return in.numDocs();