atris
diff --git a/‎server/src/main/java/org/opensearch/action/search/QueryPhaseResultConsumer.java‎
Lines changed: 6 additions & 1 deletion b/‎server/src/main/java/org/opensearch/action/search/QueryPhaseResultConsumer.java‎
Lines changed: 6 additions & 1 deletion
diff --git a/‎server/src/main/java/org/opensearch/action/search/SearchProgressListener.java‎
Lines changed: 26 additions & 0 deletions b/‎server/src/main/java/org/opensearch/action/search/SearchProgressListener.java‎
Lines changed: 26 additions & 0 deletions
diff --git a/‎server/src/main/java/org/opensearch/action/search/SearchRequest.java‎
Lines changed: 32 additions & 0 deletions b/‎server/src/main/java/org/opensearch/action/search/SearchRequest.java‎
Lines changed: 32 additions & 0 deletions
diff --git a/‎server/src/main/java/org/opensearch/action/search/SearchResponse.java‎
Lines changed: 30 additions & 0 deletions b/‎server/src/main/java/org/opensearch/action/search/SearchResponse.java‎
Lines changed: 30 additions & 0 deletions
diff --git a/‎server/src/main/java/org/opensearch/action/search/StreamQueryPhaseResultConsumer.java‎
Lines changed: 125 additions & 2 deletions b/‎server/src/main/java/org/opensearch/action/search/StreamQueryPhaseResultConsumer.java‎
Lines changed: 125 additions & 2 deletions
diff --git a/‎server/src/main/java/org/opensearch/action/search/StreamSearchQueryThenFetchAsyncAction.java‎
Lines changed: 2 additions & 0 deletions b/‎server/src/main/java/org/opensearch/action/search/StreamSearchQueryThenFetchAsyncAction.java‎
Lines changed: 2 additions & 0 deletions
diff --git a/‎server/src/main/java/org/opensearch/action/search/StreamSearchTransportService.java‎
Lines changed: 18 additions & 0 deletions b/‎server/src/main/java/org/opensearch/action/search/StreamSearchTransportService.java‎
Lines changed: 18 additions & 0 deletions
@@ -235,7 +235,12 @@ private MergeResult partialReduce(
             SearchShardTarget target = result.getSearchShardTarget();
             processedShards.add(new SearchShard(target.getClusterAlias(), target.getShardId()));
         }
-        progressListener.notifyPartialReduce(processedShards, topDocsStats.getTotalHits(), newAggs, numReducePhases);
+        // For streaming search with TopDocs, use the new notification method
+        if (hasTopDocs && newTopDocs != null) {
+            progressListener.notifyPartialReduceWithTopDocs(processedShards, topDocsStats.getTotalHits(), newTopDocs, newAggs, numReducePhases);
+        } else {
+            progressListener.notifyPartialReduce(processedShards, topDocsStats.getTotalHits(), newAggs, numReducePhases);
+        }
         // we leave the results un-serialized because serializing is slow but we compute the serialized
         // size as an estimate of the memory used by the newly reduced aggregations.
         long serializedSize = hasAggs ? newAggs.getSerializedSize() : 0;
 
@@ -99,6 +99,22 @@ protected void onQueryFailure(int shardIndex, SearchShardTarget shardTarget, Exc
      * @param reducePhase The version number for this reduce.
      */
     protected void onPartialReduce(List<SearchShard> shards, TotalHits totalHits, InternalAggregations aggs, int reducePhase) {}
+    
+    /**
+     * Hook invoked when a partial reduce that also carries merged top docs has been produced.
+     * <p>
+     * The base implementation ignores {@code topDocs} and forwards the remaining arguments to
+     * {@link #onPartialReduce(List, TotalHits, InternalAggregations, int)}, so listeners that only
+     * override the original hook keep being notified.
+     *
+     * @param shards      shards that took part in this reduce
+     * @param totalHits   total number of hits in this reduce
+     * @param topDocs     partially reduced top docs; implementations should tolerate {@code null}
+     * @param aggs        partially reduced aggregations
+     * @param reducePhase version number of this reduce
+     */
+    protected void onPartialReduceWithTopDocs(
+        List<SearchShard> shards,
+        TotalHits totalHits,
+        org.apache.lucene.search.TopDocs topDocs,
+        InternalAggregations aggs,
+        int reducePhase
+    ) {
+        // Unless a subclass overrides this hook, fall back to the TopDocs-agnostic one.
+        onPartialReduce(shards, totalHits, aggs, reducePhase);
+    }
 
     /**
      * Executed once when the final reduce is created.
@@ -164,6 +180,16 @@ final void notifyPartialReduce(List<SearchShard> shards, TotalHits totalHits, In
             logger.warn(() -> new ParameterizedMessage("Failed to execute progress listener on partial reduce"), e);
         }
     }
+    
+    /**
+     * Calls {@link #onPartialReduceWithTopDocs} and logs, instead of propagating, any
+     * {@link Exception} the listener throws.
+     *
+     * @param shards      shards that took part in this reduce
+     * @param totalHits   total number of hits in this reduce
+     * @param topDocs     partially reduced top docs
+     * @param aggs        partially reduced aggregations
+     * @param reducePhase version number of this reduce
+     */
+    final void notifyPartialReduceWithTopDocs(
+        List<SearchShard> shards,
+        TotalHits totalHits,
+        org.apache.lucene.search.TopDocs topDocs,
+        InternalAggregations aggs,
+        int reducePhase
+    ) {
+        try {
+            onPartialReduceWithTopDocs(shards, totalHits, topDocs, aggs, reducePhase);
+        } catch (Exception e) {
+            // A misbehaving listener must not fail the search; record the failure and carry on.
+            logger.warn(() -> new ParameterizedMessage("Failed to execute progress listener on partial reduce with TopDocs"), e);
+        }
+    }
 
     protected final void notifyFinalReduce(List<SearchShard> shards, TotalHits totalHits, InternalAggregations aggs, int reducePhase) {
         try {
 
@@ -125,6 +125,9 @@ public class SearchRequest extends ActionRequest implements IndicesRequest.Repla
 
     private Boolean phaseTook = null;
 
+    private boolean streamingScoring = false;
+    private String streamingScoringMode = null; // Will use StreamingScoringMode.DEFAULT if null
+
     public SearchRequest() {
         this.localClusterAlias = null;
         this.absoluteStartMillis = DEFAULT_ABSOLUTE_START_MILLIS;
@@ -142,6 +145,7 @@ public SearchRequest(SearchRequest searchRequest) {
             searchRequest.absoluteStartMillis,
             searchRequest.finalReduce
         );
+        this.streamingScoring = searchRequest.streamingScoring;
+        // Copy the scoring mode as well; otherwise the copy silently loses the mode chosen on the source request.
+        this.streamingScoringMode = searchRequest.streamingScoringMode;
     }
 
     /**
@@ -656,6 +660,34 @@ public void setPhaseTook(Boolean phaseTook) {
         this.phaseTook = phaseTook;
     }
 
+    /**
+     * Turns streaming scoring on or off for this request. The flag defaults to {@code false}.
+     *
+     * @param streamingScoring {@code true} to enable streaming scoring
+     */
+    public void setStreamingScoring(boolean streamingScoring) {
+        this.streamingScoring = streamingScoring;
+    }
+
+    /**
+     * Reports whether streaming scoring has been enabled for this request.
+     *
+     * @return {@code true} if streaming scoring is enabled
+     */
+    public boolean isStreamingScoring() {
+        return this.streamingScoring;
+    }
+
+    /**
+     * Selects the streaming scoring mode by name. The value is stored as given, without validation.
+     *
+     * @param mode the mode name, or {@code null} to leave the mode unspecified
+     */
+    public void setStreamingScoringMode(String mode) {
+        this.streamingScoringMode = mode;
+    }
+
+    /**
+     * Returns the streaming scoring mode name exactly as it was set.
+     *
+     * @return the mode name, or {@code null} if none was set
+     */
+    public String getStreamingScoringMode() {
+        return this.streamingScoringMode;
+    }
+
     /**
      * Returns a threshold that enforces a pre-filter roundtrip to pre-filter search shards based on query rewriting if the number of shards
      * the search request expands to exceeds the threshold, or <code>null</code> if the threshold is unspecified.
 
@@ -102,6 +102,11 @@ public class SearchResponse extends ActionResponse implements StatusToXContentOb
     private final Clusters clusters;
     private final long tookInMillis;
     private final PhaseTook phaseTook;
+    
+    // Fields for streaming responses
+    private boolean isPartial = false;
+    private int sequenceNumber = 0;
+    private int totalPartials = 0;
 
     public SearchResponse(StreamInput in) throws IOException {
         super(in);
@@ -301,6 +306,31 @@ public ShardSearchFailure[] getShardFailures() {
     public String getScrollId() {
         return scrollId;
     }
+    
+    // ---- Streaming response accessors (plain mutable state; all default to false / 0) ----
+
+    /**
+     * @return {@code true} if this response has been flagged as a partial (streaming) response
+     */
+    public boolean isPartial() {
+        return this.isPartial;
+    }
+
+    /**
+     * @param partial {@code true} to flag this response as partial
+     */
+    public void setPartial(boolean partial) {
+        this.isPartial = partial;
+    }
+
+    /**
+     * @return the sequence number assigned to this response (presumably its position among the
+     *         partial responses of one search; confirm with the producer)
+     */
+    public int getSequenceNumber() {
+        return this.sequenceNumber;
+    }
+
+    /**
+     * @param sequenceNumber the sequence number to record; stored without validation
+     */
+    public void setSequenceNumber(int sequenceNumber) {
+        this.sequenceNumber = sequenceNumber;
+    }
+
+    /**
+     * @return the recorded number of partial responses (presumably the total for one search;
+     *         confirm with the producer)
+     */
+    public int getTotalPartials() {
+        return this.totalPartials;
+    }
+
+    /**
+     * @param totalPartials the number of partial responses to record; stored without validation
+     */
+    public void setTotalPartials(int totalPartials) {
+        this.totalPartials = totalPartials;
+    }
 
     /**
      * Returns the encoded string of the search context that the search request is used to executed
 
@@ -8,11 +8,19 @@
 
 package org.opensearch.action.search;
 
+import org.apache.logging.log4j.LogManager;
+import org.apache.logging.log4j.Logger;
 import org.opensearch.core.common.breaker.CircuitBreaker;
 import org.opensearch.core.common.io.stream.NamedWriteableRegistry;
 import org.opensearch.search.SearchPhaseResult;
 import org.opensearch.search.query.QuerySearchResult;
+import org.opensearch.search.query.HoeffdingBounds;
+import org.opensearch.search.query.StreamingScoringMode;
+import org.apache.lucene.search.TopDocs;
+import org.apache.lucene.search.ScoreDoc;
 
+import java.util.HashMap;
+import java.util.Map;
 import java.util.concurrent.Executor;
 import java.util.function.Consumer;
 
@@ -22,6 +30,13 @@
  * @opensearch.internal
  */
 public class StreamQueryPhaseResultConsumer extends QueryPhaseResultConsumer {
+    private static final Logger logger = LogManager.getLogger(StreamQueryPhaseResultConsumer.class);
+    
+    private final Map<Integer, HoeffdingBounds> shardBounds = new HashMap<>();
+    private final double confidence = 0.95; // Default confidence level
+    private int streamingEmissions = 0;
+    private int totalDocsProcessed = 0;
+    private final StreamingScoringMode scoringMode;
 
     public StreamQueryPhaseResultConsumer(
         SearchRequest request,
@@ -43,22 +58,130 @@ public StreamQueryPhaseResultConsumer(
             expectedResultSize,
             onPartialMergeFailure
         );
+        
+        // Determine scoring mode from request
+        this.scoringMode = StreamingScoringMode.fromString(request.getStreamingScoringMode());
     }
 
     /**
-     * For stream search, the minBatchReduceSize is set higher than shard number
+     * Chooses the batch reduce size from the streaming scoring mode:
+     * {@code NO_SCORING} returns 1, {@code CONFIDENCE_BASED} returns {@code minBatchReduceSize}
+     * (or twice that when the confidence is not above 0.9), {@code FULL_SCORING} returns
+     * {@link Integer#MAX_VALUE}, and any other mode keeps the previous stream-search sizing
+     * (superclass result for ten times {@code minBatchReduceSize}).
+     * <p>
+     * NOTE(review): if the superclass constructor invokes this method, {@code scoringMode} has not
+     * been assigned yet. The null guard keeps that path on the previous sizing instead of throwing,
+     * but the requested mode is then not honoured; confirm against the call site.
      *
+     * @param requestBatchedReduceSize batched reduce size from the request; only the fallback path uses it
      * @param minBatchReduceSize: pass as number of shard
+     * @return the batch reduce size for the selected mode
      */
     @Override
     int getBatchReduceSize(int requestBatchedReduceSize, int minBatchReduceSize) {
-        return super.getBatchReduceSize(requestBatchedReduceSize, minBatchReduceSize * 10);
+        if (scoringMode == null) {
+            // Switching on a null enum throws NullPointerException; keep the pre-existing sizing instead.
+            return super.getBatchReduceSize(requestBatchedReduceSize, minBatchReduceSize * 10);
+        }
+        switch (scoringMode) {
+            case NO_SCORING:
+                // Emit immediately as results arrive
+                return 1;
+
+            case CONFIDENCE_BASED:
+                // confidence is currently a fixed 0.95, so the first return is always the one taken
+                if (confidence > 0.9) {
+                    return minBatchReduceSize;
+                }
+                return minBatchReduceSize * 2;
+
+            case FULL_SCORING:
+                // Wait for all shards before reducing
+                return Integer.MAX_VALUE;
+
+            default:
+                return super.getBatchReduceSize(requestBatchedReduceSize, minBatchReduceSize * 10);
+        }
     }
 
     void consumeStreamResult(SearchPhaseResult result, Runnable next) {
         // For streaming, we skip the ArraySearchPhaseResults.consumeResult() call
         // since it doesn't support multiple results from the same shard.
         QuerySearchResult querySearchResult = result.queryResult();
+
+        // Sample scores only while the top docs are still attached to the result.
+        // hasConsumedTopDocs() == true means they were already taken, and reading them again
+        // through topDocs() is not possible, so the bounds update must be skipped in that case.
+        if (querySearchResult.hasConsumedTopDocs() == false) {
+            updateHoeffdingBounds(result.getShardIndex(), querySearchResult);
+        }
+
         pendingMerges.consume(querySearchResult, next);
     }
+    
+    /**
+     * Feeds the scores of one shard result into that shard's Hoeffding bounds tracker and updates
+     * the emission statistics.
+     * <p>
+     * This method only does bookkeeping: it touches the per-shard tracker,
+     * {@code totalDocsProcessed} and {@code streamingEmissions}. It does not itself trigger a
+     * reduce or send anything to the client.
+     * <p>
+     * NOTE(review): the tracker map and the counters are plain, unsynchronized state; confirm that
+     * results are never consumed from several threads at once.
+     *
+     * @param shardIndex  index of the shard that produced {@code queryResult}
+     * @param queryResult query result whose top docs are read through {@code topDocs()}
+     */
+    private void updateHoeffdingBounds(int shardIndex, QuerySearchResult queryResult) {
+        var topDocsAndMaxScore = queryResult.topDocs();
+        if (topDocsAndMaxScore == null || topDocsAndMaxScore.topDocs == null || topDocsAndMaxScore.topDocs.scoreDocs == null) {
+            return;
+        }
+        ScoreDoc[] scoreDocs = topDocsAndMaxScore.topDocs.scoreDocs;
+
+        // One tracker per shard, created lazily on the first result from that shard.
+        // NOTE(review): the 100.0 argument is carried over unchanged; its meaning is defined by HoeffdingBounds.
+        HoeffdingBounds bounds = shardBounds.computeIfAbsent(shardIndex, k -> new HoeffdingBounds(confidence, 100.0));
+        for (ScoreDoc scoreDoc : scoreDocs) {
+            bounds.addScore(scoreDoc.score);
+        }
+
+        // Count every document fed to a tracker, not only those that arrive on an emitting call;
+        // otherwise the reported total under-counts whenever a call does not emit.
+        totalDocsProcessed += scoreDocs.length;
+
+        if (shouldEmitStreamingResults()) {
+            streamingEmissions++;
+            // Debug rather than info: this runs once per shard result and would flood the log otherwise.
+            if (logger.isDebugEnabled()) {
+                logger.debug(
+                    "Streaming emission #{}: {} shards, {} docs, bound={}",
+                    streamingEmissions,
+                    shardBounds.size(),
+                    totalDocsProcessed,
+                    getMaxHoeffdingBound()
+                );
+            }
+        }
+    }
+    
+    /**
+     * Decides, from the scoring mode, whether the current state counts as an emission point.
+     * <ul>
+     *   <li>{@code NO_SCORING}: always {@code true}</li>
+     *   <li>{@code CONFIDENCE_BASED}: {@code true} once at least one shard is tracked and the
+     *       largest per-shard Hoeffding bound is at most 0.1</li>
+     *   <li>{@code FULL_SCORING} and any other mode: always {@code false}</li>
+     * </ul>
+     *
+     * @return {@code true} if results should be emitted now
+     */
+    private boolean shouldEmitStreamingResults() {
+        switch (scoringMode) {
+            case NO_SCORING:
+                return true;
+
+            case CONFIDENCE_BASED: {
+                if (shardBounds.isEmpty()) {
+                    // Nothing sampled yet, so there is no bound to judge.
+                    return false;
+                }
+                final double widestBound = getMaxHoeffdingBound();
+                final boolean withinThreshold = widestBound <= 0.1;
+                if (logger.isDebugEnabled()) {
+                    logger.debug("Hoeffding bound check: {}, emit={}", widestBound, withinThreshold);
+                }
+                return withinThreshold;
+            }
+
+            case FULL_SCORING:
+            default:
+                // Full scoring waits for every result; unknown modes are treated the same way.
+                return false;
+        }
+    }
+    
+    /**
+     * Returns the largest bound reported by any tracked shard.
+     *
+     * @return the maximum of {@code getBound()} over all trackers, or {@link Double#MAX_VALUE}
+     *         when no shard is tracked yet
+     */
+    private double getMaxHoeffdingBound() {
+        if (shardBounds.isEmpty()) {
+            return Double.MAX_VALUE;
+        }
+        // Fold with Math.max from negative infinity, which yields the same result as DoubleStream.max().
+        double widest = Double.NEGATIVE_INFINITY;
+        for (HoeffdingBounds tracker : shardBounds.values()) {
+            widest = Math.max(widest, tracker.getBound());
+        }
+        return widest;
+    }
+    
+    /**
+     * Returns how many streaming emissions this consumer has recorded so far; meant for monitoring.
+     *
+     * @return the current emission count
+     */
+    public int getStreamingEmissions() {
+        return this.streamingEmissions;
+    }
 }
@@ -15,6 +15,7 @@
 import org.opensearch.search.SearchPhaseResult;
 import org.opensearch.search.SearchShardTarget;
 import org.opensearch.search.internal.AliasFilter;
+import org.opensearch.search.internal.ShardSearchRequest;
 import org.opensearch.telemetry.tracing.Tracer;
 import org.opensearch.transport.Transport;
 
@@ -188,4 +189,5 @@ private void successfulStreamExecution() {
             onPhaseFailure(this, "The phase has failed", ex);
         }
     }
+    
 }
@@ -123,6 +123,24 @@ public static void registerStreamRequestHandler(StreamTransportService transport
                 ThreadPool.Names.STREAM_SEARCH
             )
         );
+
+        // Override QUERY_ACTION_NAME to enable streaming for query phase
+        transportService.registerRequestHandler(
+            QUERY_ACTION_NAME,
+            ThreadPool.Names.SAME,
+            false,
+            true,
+            AdmissionControlActionType.SEARCH,
+            ShardSearchRequest::new,
+            (request, channel, task) -> searchService.executeQueryPhase(
+                request,
+                false,
+                (SearchShardTask) task,
+                new StreamSearchChannelListener<>(channel, QUERY_ACTION_NAME, request),
+                ThreadPool.Names.STREAM_SEARCH,
+                true  // isStreamSearch = true for streaming
+            )
+        );
     }
 
     @Override
Original file line number	Diff line number	Diff line change
`@@ -15,6 +15,7 @@`
`15`	`15`	`import org.opensearch.search.SearchPhaseResult;`
`16`	`16`	`import org.opensearch.search.SearchShardTarget;`
`17`	`17`	`import org.opensearch.search.internal.AliasFilter;`
	`18`	`+import org.opensearch.search.internal.ShardSearchRequest;`
`18`	`19`	`import org.opensearch.telemetry.tracing.Tracer;`
`19`	`20`	`import org.opensearch.transport.Transport;`
`20`	`21`
`@@ -188,4 +189,5 @@ private void successfulStreamExecution() {`
`188`	`189`	`onPhaseFailure(this, "The phase has failed", ex);`
`189`	`190`	`}`
`190`	`191`	`}`
	`192`	`+`
`191`	`193`	`}`