Skip to content

Commit 7ceee5d

Browse files
authored
Put sensible bounds on quantized scores (#15411)
Loss from quantization can yield some unexpected values from the corrected dot product, sometimes producing values that are out-of-bounds. This is more likely when the inputs are "extreme" in the sense that they are very far from the segment-level centroid. Bound Euclidean distance to a non-negative value -- negative values do not make any sense. Clamp the dot product/cosine score to [-1,1], as the normalized dot product should always return values in this range. This works well enough for 4+ bit quantization, but may not work as well for 1-bit quantization since the loss is so great. Also fix testSingleVectorCase to L2-normalize all vectors for DOT_PRODUCT similarity. This is a partial fix for #15408.
1 parent efa5204 commit 7ceee5d

File tree

2 files changed

+21
-6
lines changed

2 files changed

+21
-6
lines changed

lucene/core/src/java/org/apache/lucene/codecs/lucene104/Lucene104ScalarQuantizedVectorScorer.java

Lines changed: 7 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -263,7 +263,9 @@ private static float quantizedScore(
263263
queryCorrections.additionalCorrection()
264264
+ indexCorrections.additionalCorrection()
265265
- 2 * score;
266-
return Math.max(1 / (1f + score), 0);
266+
// Ensure that 'score' (the squared euclidean distance) is non-negative. The computed value
267+
// may be negative as a result of quantization loss.
268+
return 1 / (1f + Math.max(score, 0f));
267269
} else {
268270
// For cosine and max inner product, we need to apply the additional correction, which is
269271
// assumed to be the non-centered dot-product between the vector and the centroid
@@ -274,7 +276,10 @@ private static float quantizedScore(
274276
if (similarityFunction == MAXIMUM_INNER_PRODUCT) {
275277
return VectorUtil.scaleMaxInnerProductScore(score);
276278
}
277-
return Math.max((1f + score) / 2f, 0);
279+
// Ensure that 'score' (a normalized dot product) is in [-1,1]. The computed value may be out
280+
// of bounds as a result of quantization loss.
281+
score = Math.clamp(score, -1, 1);
282+
return (1f + score) / 2f;
278283
}
279284
}
280285
}

lucene/core/src/test/org/apache/lucene/codecs/lucene104/TestLucene104HnswScalarQuantizedVectorsFormat.java

Lines changed: 14 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -47,7 +47,9 @@
4747
import org.apache.lucene.store.Directory;
4848
import org.apache.lucene.tests.index.BaseKnnVectorsFormatTestCase;
4949
import org.apache.lucene.tests.util.TestUtil;
50+
import org.apache.lucene.util.ArrayUtil;
5051
import org.apache.lucene.util.SameThreadExecutorService;
52+
import org.apache.lucene.util.VectorUtil;
5153
import org.junit.Before;
5254

5355
public class TestLucene104HnswScalarQuantizedVectorsFormat extends BaseKnnVectorsFormatTestCase {
@@ -109,7 +111,11 @@ public void testSingleVectorCase() throws Exception {
109111
try (Directory dir = newDirectory();
110112
IndexWriter w = new IndexWriter(dir, newIndexWriterConfig())) {
111113
Document doc = new Document();
112-
doc.add(new KnnFloatVectorField("f", vector, similarityFunction));
114+
float[] docVector =
115+
similarityFunction == VectorSimilarityFunction.DOT_PRODUCT
116+
? VectorUtil.l2normalize(ArrayUtil.copyArray(vector))
117+
: vector;
118+
doc.add(new KnnFloatVectorField("f", docVector, similarityFunction));
113119
w.addDocument(doc);
114120
w.commit();
115121
try (IndexReader reader = DirectoryReader.open(w)) {
@@ -118,10 +124,14 @@ public void testSingleVectorCase() throws Exception {
118124
KnnVectorValues.DocIndexIterator docIndexIterator = vectorValues.iterator();
119125
assert (vectorValues.size() == 1);
120126
while (docIndexIterator.nextDoc() != NO_MORE_DOCS) {
121-
assertArrayEquals(vector, vectorValues.vectorValue(docIndexIterator.index()), 0.00001f);
127+
assertArrayEquals(
128+
docVector, vectorValues.vectorValue(docIndexIterator.index()), 0.00001f);
122129
}
123-
float[] randomVector = randomVector(vector.length);
124-
float trueScore = similarityFunction.compare(vector, randomVector);
130+
float[] randomVector =
131+
similarityFunction == VectorSimilarityFunction.DOT_PRODUCT
132+
? randomNormalizedVector(vector.length)
133+
: randomVector(vector.length);
134+
float trueScore = similarityFunction.compare(docVector, randomVector);
125135
TopDocs td =
126136
r.searchNearestVectors(
127137
"f",

0 commit comments

Comments
 (0)