Save allocation of a large array in PQVectors.encodeAndBuild (#574)

marianotepper · web-flow · commit 02fea879d63d · 2025-11-20T13:25:44.000-08:00
* Save allocation of a large array in PQVectors.encodeAndBuild
* Using IntUnaryOperator instead of int[] in version of PQVectors.encodeAndBuild with remapping
diff --git a/jvector-base/src/main/java/io/github/jbellis/jvector/quantization/PQVectors.java b/jvector-base/src/main/java/io/github/jbellis/jvector/quantization/PQVectors.java
@@ -32,6 +32,7 @@
 import java.util.Objects;
 import java.util.concurrent.ForkJoinPool;
 import java.util.concurrent.atomic.AtomicReference;
+import java.util.function.IntUnaryOperator;
 import java.util.stream.IntStream;
 
 public abstract class PQVectors implements CompressedVectors {
@@ -76,7 +77,7 @@ public static PQVectors load(RandomAccessReader in, long offset) throws IOExcept
     /**
      * Build a PQVectors instance from the given RandomAccessVectorValues. The vectors are encoded in parallel
      * and split into chunks to avoid exceeding the maximum array size.
-     *
+     * <p>
      * This is a helper method for the special case where the ordinals mapping in the graph and the RAVV/PQVectors are the same.
      *
      * @param pq           the ProductQuantization to use
@@ -86,7 +87,7 @@ public static PQVectors load(RandomAccessReader in, long offset) throws IOExcept
      * @return the PQVectors instance
      */
     public static ImmutablePQVectors encodeAndBuild(ProductQuantization pq, int vectorCount, RandomAccessVectorValues ravv, ForkJoinPool simdExecutor) {
-        return encodeAndBuild(pq, vectorCount, IntStream.range(0, vectorCount).toArray(), ravv, simdExecutor);
+        return encodeAndBuild(pq, vectorCount, IntUnaryOperator.identity(), ravv, simdExecutor);
     }
 
     /**
@@ -95,14 +96,14 @@ public static ImmutablePQVectors encodeAndBuild(ProductQuantization pq, int vect
      *
      * @param pq           the ProductQuantization to use
      * @param vectorCount  the number of vectors to encode
+     * @param ordinalsMapping the graph ordinals to RAVV mapping, the function should be defined in [0, vectorCount)
      * @param ravv         the RandomAccessVectorValues to encode
      * @param simdExecutor the ForkJoinPool to use for SIMD operations
-     * @param ordinalsMapping the graph ordinals to RAVV mapping
      * @return the PQVectors instance
      */
-    public static ImmutablePQVectors encodeAndBuild(ProductQuantization pq, int vectorCount, int[] ordinalsMapping, RandomAccessVectorValues ravv, ForkJoinPool simdExecutor) {
+    public static ImmutablePQVectors encodeAndBuild(ProductQuantization pq, int vectorCount, IntUnaryOperator ordinalsMapping, RandomAccessVectorValues ravv, ForkJoinPool simdExecutor) {
         int compressedDimension = pq.compressedVectorSize();
-        PQLayout layout = new PQLayout(vectorCount,compressedDimension);
+        PQLayout layout = new PQLayout(vectorCount, compressedDimension);
         final ByteSequence<?>[] chunks = new ByteSequence<?>[layout.totalChunks];
         for (int i = 0; i < layout.fullSizeChunks; i++) {
             chunks[i] = vectorTypeSupport.createByteSequence(layout.fullChunkBytes);
@@ -115,13 +116,13 @@ public static ImmutablePQVectors encodeAndBuild(ProductQuantization pq, int vect
         // The changes are concurrent, but because they are coordinated and do not overlap, we can use parallel streams
         // and then we are guaranteed safe publication because we join the thread after completion.
         var ravvCopy = ravv.threadLocalSupplier();
-        simdExecutor.submit(() -> IntStream.range(0, ordinalsMapping.length)
+        simdExecutor.submit(() -> IntStream.range(0, vectorCount)
                         .parallel()
                         .forEach(ordinal -> {
                             // Retrieve the slice and mutate it.
                             var localRavv = ravvCopy.get();
                             var slice = PQVectors.get(chunks, ordinal, layout.fullChunkVectors, pq.getSubspaceCount());
-                            var vector = localRavv.getVector(ordinalsMapping[ordinal]);
+                            var vector = localRavv.getVector(ordinalsMapping.applyAsInt(ordinal));
                             if (vector != null)
                                 pq.encodeTo(vector, slice);
                             else