Handle multiple searchable copies in postFilterThreshold suggestion

boeker · boeker · commit d31cf09e1264 · 2026-02-23T07:25:47.000+01:00
diff --git a/vespa/evaluation/_base.py b/vespa/evaluation/_base.py
@@ -1780,6 +1780,7 @@ def __init__(
         self.queries = queries
         self.app = app
         self.verify_target_hits = verify_target_hits
+        self.searchable_copies = None
 
     def run(self):
         """
@@ -1834,6 +1835,16 @@ def extract_from_trace(obj: dict, type_name: str):
                     and blueprint["global_filter"]["calculated"]
                 ):
                     hit_ratios.append(blueprint["global_filter"]["hit_ratio"])
+                    actual_upper_limit = blueprint["global_filter"]["upper_limit"]
+                    if actual_upper_limit is not None and actual_upper_limit > 0.0:
+                        searchable_copies = round(1.0 / actual_upper_limit)
+                        if self.searchable_copies is None:
+                            self.searchable_copies = searchable_copies
+                        else:
+                            if self.searchable_copies != searchable_copies:
+                                print(
+                                    f"Searchable copies mismatch: {searchable_copies} vs. {self.searchable_copies} found earlier"
+                                )
 
                 if (
                     self.verify_target_hits is not None
@@ -1847,6 +1858,16 @@ def extract_from_trace(obj: dict, type_name: str):
 
         return all_hit_ratios
 
+    """
+    Returns number of searchable copies determined during hit-ratio computation.
+
+    Returns:
+        int: Number of searchable copies used by Vespa application.
+    """
+
+    def get_searchable_copies(self):
+        return self.searchable_copies
+
 
 class VespaNNRecallEvaluator:
     """
@@ -2151,6 +2172,8 @@ def __init__(
         self.recall_query_limit = recall_query_limit
         self.max_concurrent = max_concurrent
 
+        self.searchable_copies = None
+
     def get_bucket_interval_width(self) -> float:
         """
         Gets the width of the interval represented by a single bucket.
@@ -2299,6 +2322,7 @@ def determine_hit_ratios_and_distribute_to_buckets(
             queries, self.app, verify_target_hits=self.hits
         )
         hitratio_list = hitratio_evaluator.run()
+        self.searchable_copies = hitratio_evaluator.get_searchable_copies()
 
         for i in range(0, len(hitratio_list)):
             hitratios = hitratio_list[i]
@@ -2848,7 +2872,12 @@ def _suggest_post_filter_threshold(
                 threshold = i
                 response_time_gain = current_gain
 
-        return self.bucket_to_hitratio(threshold)
+        suggestion = self.bucket_to_hitratio(threshold)
+        if self.searchable_copies is not None:
+            suggestion = suggestion * self.searchable_copies
+            suggestion = min(suggestion, 1.0)
+
+        return suggestion
 
     def _test_filter_first_exploration(
         self, filter_first_exploration: float