Skip to content
Merged
Show file tree
Hide file tree
Changes from 3 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Original file line number Diff line number Diff line change
Expand Up @@ -12,7 +12,6 @@
import org.elasticsearch.compute.data.BytesRefBlock;
import org.elasticsearch.compute.data.DoubleVector;
import org.elasticsearch.compute.data.Page;
import org.elasticsearch.core.Releasables;

import java.util.HashMap;

Expand All @@ -22,7 +21,7 @@
* The new score we assign to each row is equal to {@code 1 / (rank_constant + row_number)}.
* We use the fork discriminator column to determine the {@code row_number} for each row.
*/
public class RrfScoreEvalOperator implements Operator {
public class RrfScoreEvalOperator extends AbstractPageMappingOperator {

public record Factory(int forkPosition, int scorePosition) implements OperatorFactory {
@Override
Expand All @@ -40,9 +39,6 @@ public String describe() {
private final int scorePosition;
private final int forkPosition;

private boolean finished = false;
private Page prev = null;

private HashMap<String, Integer> counters = new HashMap<>();

public RrfScoreEvalOperator(int forkPosition, int scorePosition) {
Expand All @@ -51,30 +47,7 @@ public RrfScoreEvalOperator(int forkPosition, int scorePosition) {
}

@Override
public boolean needsInput() {
return prev == null && finished == false;
}

@Override
public void addInput(Page page) {
assert prev == null : "has pending input page";
prev = page;
}

@Override
public void finish() {
finished = true;
}

@Override
public boolean isFinished() {
return finished && prev == null;
}

@Override
public Page getOutput() {
Page page = prev;

protected Page process(Page page) {
BytesRefBlock forkBlock = (BytesRefBlock) page.getBlock(forkPosition);

DoubleVector.Builder scores = forkBlock.blockFactory().newDoubleVectorBuilder(forkBlock.getPositionCount());
Expand All @@ -96,18 +69,11 @@ public Page getOutput() {
projections[i] = i == scorePosition ? page.getBlockCount() - 1 : i;
}

page = page.projectBlocks(projections);

prev = null;
return page;
return page.projectBlocks(projections);
}

@Override
public void close() {
Releasables.closeExpectNoException(() -> {
if (prev != null) {
prev.releaseBlocks();
}
});
public String toString() {
return "RrfScoreEvalOperator";
}
}
93 changes: 82 additions & 11 deletions x-pack/plugin/esql/qa/testFixtures/src/main/resources/rrf.csv-spec
Original file line number Diff line number Diff line change
Expand Up @@ -11,12 +11,14 @@ FROM employees METADATA _id, _index, _score
| FORK ( WHERE emp_no:10001 )
( WHERE emp_no:10002 )
| RRF
| EVAL _score = round(_score, 4)
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Nice trick! ❤️

| KEEP _score, _fork, emp_no
| SORT _score, _fork, emp_no
;

_score:double | _fork:keyword | emp_no:integer
0.01639344262295082 | fork1 | 10001
0.01639344262295082 | fork2 | 10002
_score:double | _fork:keyword | emp_no:integer
0.0164 | fork1 | 10001
0.0164 | fork2 | 10002
;

rrfWithMatchAndScore
Expand All @@ -25,16 +27,85 @@ required_capability: rrf
required_capability: match_operator_colon

FROM books METADATA _id, _index, _score
| FORK ( WHERE title:"Tolkien" | SORT _score DESC | LIMIT 3 )
( WHERE author:"Tolkien" | SORT _score DESC | LIMIT 3 )
| FORK ( WHERE title:"Tolkien" | SORT _score, _id DESC | LIMIT 3 )
( WHERE author:"Tolkien" | SORT _score, _id DESC | LIMIT 3 )
| RRF
| EVAL _fork = mv_sort(_fork)
| EVAL _score = round(_score, 5)
| KEEP _score, _fork, _id
;

_score:double | _fork:keyword | _id:keyword
0.03225806451612903 | [fork1, fork2] | 26
0.01639344262295082 | fork2 | 18
0.01639344262295082 | fork1 | 36
0.015873015873015872 | fork1 | 56
0.015873015873015872 | fork2 | 59
_score:double | _fork:keyword | _id:keyword
0.03279 | [fork1, fork2] | 4
0.01613 | fork1 | 56
0.01613 | fork2 | 60
0.01587 | fork2 | 1
0.01587 | fork1 | 26
;

rrfWithDisjunctionAndPostFilter
required_capability: fork
required_capability: rrf
required_capability: match_operator_colon

FROM books METADATA _id, _index, _score
| FORK ( WHERE title:"Tolkien" OR author:"Tolkien" | SORT _score, _id DESC | LIMIT 3 )
( WHERE author:"Tolkien" | SORT _score, _id DESC | LIMIT 3 )
| RRF
| EVAL _fork = mv_sort(_fork)
| EVAL _score = round(_score, 5)
| KEEP _score, _fork, _id
| WHERE _score > 0.014
;

_score:double | _fork:keyword | _id:keyword
0.03252 | [fork1, fork2] | 60
0.032 | [fork1, fork2] | 1
0.01639 | fork2 | 4
0.01587 | fork1 | 40
;

rrfWithStats
required_capability: fork
required_capability: rrf
required_capability: match_operator_colon

FROM books METADATA _id, _index, _score
| FORK ( WHERE title:"Tolkien" | SORT _score, _id DESC | LIMIT 3 )
( WHERE author:"Tolkien" | SORT _score, _id DESC | LIMIT 3 )
( WHERE author:"Ursula K. Le Guin" AND title:"short stories" | SORT _score, _id DESC | LIMIT 3)
| RRF
| STATS count_fork=COUNT(*) BY _fork
;

count_fork:long | _fork:keyword
3 | fork1
3 | fork2
1 | fork3
;

rrfWithMultipleForkBranches
required_capability: fork
required_capability: rrf
required_capability: match_operator_colon

FROM books METADATA _id, _index, _score
| FORK (WHERE author:"Keith Faulkner" AND qstr("author:Rory or author:Beverlie") | SORT _score, _id DESC | LIMIT 3)
(WHERE author:"Ursula K. Le Guin" | SORT _score, _id DESC | LIMIT 3)
(WHERE title:"Tolkien" AND author:"Tolkien" AND year > 2000 AND mv_count(author) == 1 | SORT _score, _id DESC | LIMIT 3)
(WHERE match(author, "Keith Faulkner") AND match(author, "Rory Tyger") | SORT _score, _id DESC | LIMIT 3)
| RRF
| EVAL _fork = mv_sort(_fork)
| EVAL _score = round(_score, 4)
| EVAL title = trim(substring(title, 1, 20))
| KEEP _score, author, title, _fork
;

_score:double | author:keyword | title:keyword | _fork:keyword
0.0328 | [Keith Faulkner, Rory Tyger] | Pop! Went Another Ba | [fork1, fork4]
0.0164 | J.R.R. Tolkien | Letters of J R R Tol | fork3
0.0164 | Ursula K. Le Guin | The wind's twelve qu | fork2
0.0161 | [Beverlie Manson, Keith Faulkner] | Rainbow's End: A Mag | fork1
0.0161 | Ursula K. Le Guin | The Word For World i | fork2
0.0159 | Ursula K. Le Guin | The Dispossessed | fork2
;
Original file line number Diff line number Diff line change
Expand Up @@ -16,6 +16,7 @@
import org.elasticsearch.dissect.DissectException;
import org.elasticsearch.dissect.DissectParser;
import org.elasticsearch.index.IndexMode;
import org.elasticsearch.index.mapper.IdFieldMapper;
import org.elasticsearch.transport.RemoteClusterAware;
import org.elasticsearch.xpack.esql.VerificationException;
import org.elasticsearch.xpack.esql.action.EsqlCapabilities;
Expand Down Expand Up @@ -658,10 +659,10 @@ public List<PlanFactory> visitForkSubQueries(EsqlBaseParser.ForkSubQueriesContex
// align _fork id across all fork branches
Alias alias = null;
if (firstForkNameId == null) {
alias = new Alias(source(ctx), "_fork", literal);
alias = new Alias(source(ctx), Fork.FORK_FIELD, literal);
firstForkNameId = alias.id();
} else {
alias = new Alias(source(ctx), "_fork", literal, firstForkNameId);
alias = new Alias(source(ctx), Fork.FORK_FIELD, literal, firstForkNameId);
}

var finalAlias = alias;
Expand Down Expand Up @@ -694,12 +695,12 @@ public PlanFactory visitCompositeForkSubQuery(EsqlBaseParser.CompositeForkSubQue
public PlanFactory visitRrfCommand(EsqlBaseParser.RrfCommandContext ctx) {
return input -> {
Source source = source(ctx);
Attribute scoreAttr = new UnresolvedAttribute(source, "_score");
Attribute forkAttr = new UnresolvedAttribute(source, "_fork");
Attribute idAttr = new UnresolvedAttribute(source, "_id");
Attribute indexAttr = new UnresolvedAttribute(source, "_index");
Attribute scoreAttr = new UnresolvedAttribute(source, MetadataAttribute.SCORE);
Attribute forkAttr = new UnresolvedAttribute(source, Fork.FORK_FIELD);
Attribute idAttr = new UnresolvedAttribute(source, IdFieldMapper.NAME);
Attribute indexAttr = new UnresolvedAttribute(source, MetadataAttribute.INDEX);
List<NamedExpression> aggregates = List.of(
new Alias(source, "_score", new Sum(source, scoreAttr, new Literal(source, true, DataType.BOOLEAN)))
new Alias(source, MetadataAttribute.SCORE, new Sum(source, scoreAttr, new Literal(source, true, DataType.BOOLEAN)))
);
List<Attribute> groupings = List.of(idAttr, indexAttr);

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -23,6 +23,7 @@
* {@code FORK [WHERE content:"fox" ] [WHERE content:"dog"] }
*/
public class Fork extends UnaryPlan implements SurrogateLogicalPlan {
public static final String FORK_FIELD = "_fork";

private final List<LogicalPlan> subPlans;
List<Attribute> lazyOutput;
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -8,13 +8,19 @@
package org.elasticsearch.xpack.esql.plan.logical;

import org.elasticsearch.common.io.stream.StreamOutput;
import org.elasticsearch.xpack.esql.capabilities.PostAnalysisVerificationAware;
import org.elasticsearch.xpack.esql.common.Failures;
import org.elasticsearch.xpack.esql.core.expression.Attribute;
import org.elasticsearch.xpack.esql.core.tree.NodeInfo;
import org.elasticsearch.xpack.esql.core.tree.Source;

import java.io.IOException;
import java.util.Locale;
import java.util.Objects;

public class RrfScoreEval extends UnaryPlan {
import static org.elasticsearch.xpack.esql.common.Failure.fail;

public class RrfScoreEval extends UnaryPlan implements PostAnalysisVerificationAware {
private final Attribute forkAttr;
private final Attribute scoreAttr;

Expand Down Expand Up @@ -56,4 +62,35 @@ public Attribute scoreAttribute() {
public Attribute forkAttribute() {
return forkAttr;
}

@Override
public void postAnalysisVerification(Failures failures) {
    // RRF rescoring is only meaningful directly on top of a FORK: reject any other child plan.
    if (this.child() instanceof Fork == false) {
        failures.add(
            fail(
                this,
                "Invalid use of RRF. RRF can only be used after FORK, but found {}",
                // Report only the leading keyword of the offending child command
                // (first whitespace-delimited token of its source text), upper-cased
                // with a fixed locale so the message is stable across JVM locales.
                child().sourceText().split(" ")[0].toUpperCase(Locale.ROOT)
            )
        );
    }
}

@Override
public int hashCode() {
    // Fold the parent's hash (covers the child plan) together with the two
    // attributes this node adds, keeping hashCode consistent with equals.
    return Objects.hash(super.hashCode(), scoreAttr, forkAttr);
}

@Override
public boolean equals(Object obj) {
    // Standard equality: identity fast-path, exact-class check, then field-wise
    // comparison of the child plan and the two attributes this node adds.
    if (this == obj) {
        return true;
    }
    if (obj == null || getClass() != obj.getClass()) {
        return false;
    }

    RrfScoreEval rrf = (RrfScoreEval) obj;
    // Bug fix: the fork attribute was previously compared against THIS object's
    // own forkAttribute() (trivially true), not the other instance's. Compare
    // against rrf.forkAttribute() so equals actually distinguishes nodes that
    // differ only in their fork attribute, consistent with hashCode.
    return child().equals(rrf.child()) && scoreAttr.equals(rrf.scoreAttribute()) && forkAttr.equals(rrf.forkAttribute());
}
}
Original file line number Diff line number Diff line change
Expand Up @@ -63,6 +63,7 @@
import org.elasticsearch.xpack.esql.core.expression.FieldAttribute;
import org.elasticsearch.xpack.esql.core.expression.FoldContext;
import org.elasticsearch.xpack.esql.core.expression.Literal;
import org.elasticsearch.xpack.esql.core.expression.MetadataAttribute;
import org.elasticsearch.xpack.esql.core.expression.NameId;
import org.elasticsearch.xpack.esql.core.expression.NamedExpression;
import org.elasticsearch.xpack.esql.core.expression.TypedAttribute;
Expand All @@ -76,6 +77,7 @@
import org.elasticsearch.xpack.esql.evaluator.EvalMapper;
import org.elasticsearch.xpack.esql.evaluator.command.GrokEvaluatorExtracter;
import org.elasticsearch.xpack.esql.expression.Order;
import org.elasticsearch.xpack.esql.plan.logical.Fork;
import org.elasticsearch.xpack.esql.plan.physical.AggregateExec;
import org.elasticsearch.xpack.esql.plan.physical.ChangePointExec;
import org.elasticsearch.xpack.esql.plan.physical.DissectExec;
Expand Down Expand Up @@ -282,10 +284,10 @@ private PhysicalOperation planRrfScoreEvalExec(RrfScoreEvalExec rrf, LocalExecut
int forkPosition = -1;
int pos = 0;
for (Attribute attr : rrf.child().output()) {
if (attr.name().equals("_fork")) {
if (attr.name().equals(Fork.FORK_FIELD)) {
forkPosition = pos;
}
if (attr.name().equals("_score")) {
if (attr.name().equals(MetadataAttribute.SCORE)) {
scorePosition = pos;
}

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -2938,6 +2938,22 @@ public void testRrfError() {
assertThat(e.getMessage(), containsString("Unknown column [_score]"));
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I think we should provide a better error message for missing metadata attrs- something like "_score is needed for using RRF. Please add METADATA _score to your FROM command".

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I looked into this - looks simple enough at a first glance. We can just modify this to have a custom error message when MetadataAttribute.isSupported(name) is true:

public static String errorMessage(String name, List<String> potentialMatches) {
String msg = "Unknown column [" + name + "]";
if (CollectionUtils.isEmpty(potentialMatches) == false) {
msg += ", did you mean "
+ (potentialMatches.size() == 1 ? "[" + potentialMatches.get(0) + "]" : "any of " + potentialMatches.toString())
+ "?";
}
return msg;
}

However we would return an error message like "Please add METADATA _score to your FROM command" even if you use ROW:

ROW a = 1, b = "two", c = null
| WHERE _score > 1

I know this is a very narrow corner case, but it would be an unintended behaviour.
It's not straightforward to get the context when we call UnresolvedAttribute.errorMessage whether the source command supports metadata attributes or not. So I think at most, we can look into this separately and not make the change here.

Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I think it would be OK to error with "_score is needed for using RRF. Use FROM ... METADATA _score".

We can assume that full text search needs FROM, as FTFs need an index attribute to operate on?

We can refine this in a follow up, but it will be very confusing for users to receive "unknown column _score" - being a metadata attribute means users won't understand where's that coming from without referring to docs

Copy link
Contributor Author

@ioanatia ioanatia Mar 7, 2025

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

agreed - added as a follow up in #123391

assertThat(e.getMessage(), containsString("Unknown column [_fork]"));

e = expectThrows(VerificationException.class, () -> analyze("""
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I wonder if the sequence between FORK and RRF matters? For example if the sequence of fork and RRF is reversed, do we recognized it as a valid query?

| RRF
| FORK (WHERE a:"x")
       (WHERE a:"y")

Do we allow multiple fork or RRF, like below? Do they make sense? ES|QL does not prevent multiple occurrence of the same processing commands, commands like where, eval etc. can be used multiple times in the same query, is this also true for RRF and fork?

| FORK (WHERE a:"x")
       (WHERE a:"y")
| RRF
| RRF
or
| FORK (WHERE a:"x")
       (WHERE a:"y")
| RRF
| FORK (WHERE b:"x")
       (WHERE b:"y")
| RRF

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I have put a validation for RrfScoreEval such that we only allow RRF after a FORK command.
It might seem a bit extreme, but it makes sense in practice because while we might be able to execute the following queries, they don't make a lot of sense:

| RRF
| FORK (WHERE a:"x")
       (WHERE a:"y")

or

| FORK (WHERE a:"x")
       (WHERE a:"y")
| RRF
| RRF

Another thing to note is that we currently have a restriction for FORK where it's possible to only have a single FORK command in a query, so the following is not something we can do atm:

| FORK (WHERE a:"x")
       (WHERE a:"y")
| RRF
| FORK (WHERE b:"x")
       (WHERE b:"y")
| RRF

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I did see one thing that was concerning when I tried to do:

| FORK (WHERE a:"x")
       (WHERE a:"y")
| RRF
| RRF

this would lead to an unexecutable query because when do the RRF planning this expands to:

| FORK (WHERE a:"x")
       (WHERE a:"y")
| RrfScoreEval
| Dedup
| Sort
| RrfScoreEval
| Dedup
| Sort

The first SORT does not have a LIMIT so it cannot be translated to a TOP N.
I need to think more about this, not about supporting the case where we do RRF after RRF, but how to avoid this case of having unexecutable queries - I added it as a follow in #123391

from test metadata _score, _index, _id
| eval _fork = 1
| rrf
"""));
assertThat(e.getMessage(), containsString("RRF can only be used after FORK, but found EVAL"));

e = expectThrows(VerificationException.class, () -> analyze("""
from test metadata _id, _index, _score
| fork ( where first_name:"foo" )
( where first_name:"bar" )
| rrf
| rrf
"""));
assertThat(e.getMessage(), containsString("RRF can only be used after FORK, but found RRF"));

e = expectThrows(VerificationException.class, () -> analyze("""
from test
| FORK ( WHERE emp_no == 1 )
Expand All @@ -2953,6 +2969,14 @@ public void testRrfError() {
| RRF
"""));
assertThat(e.getMessage(), containsString("Unknown column [_index]"));

e = expectThrows(VerificationException.class, () -> analyze("""
from test metadata _score, _index
| FORK ( WHERE emp_no == 1 )
( WHERE emp_no > 1 )
| RRF
"""));
assertThat(e.getMessage(), containsString("Unknown column [_id]"));
}

// TODO There's too much boilerplate involved here! We need a better way of creating FieldCapabilitiesResponses from a mapping or index.
Expand Down