elastic
diff --git a/‎x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/optimizer/rules/physical/ProjectAwayColumns.java‎
Lines changed: 3 additions & 1 deletion b/‎x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/optimizer/rules/physical/ProjectAwayColumns.java‎
Lines changed: 3 additions & 1 deletion
diff --git a/‎x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/AbstractAggregateExec.java‎
Lines changed: 183 additions & 0 deletions b/‎x-pack/plugin/esql/src/main/java/org/elasticsearch/xpack/esql/plan/physical/AbstractAggregateExec.java‎
Lines changed: 183 additions & 0 deletions
@@ -17,6 +17,8 @@
 import org.elasticsearch.xpack.esql.plan.logical.Aggregate;
 import org.elasticsearch.xpack.esql.plan.logical.Eval;
 import org.elasticsearch.xpack.esql.plan.logical.Project;
+import org.elasticsearch.xpack.esql.plan.logical.TopN;
+import org.elasticsearch.xpack.esql.plan.logical.TopNAggregate;
 import org.elasticsearch.xpack.esql.plan.physical.ExchangeExec;
 import org.elasticsearch.xpack.esql.plan.physical.FragmentExec;
 import org.elasticsearch.xpack.esql.plan.physical.MergeExec;
@@ -61,7 +63,7 @@ public PhysicalPlan apply(PhysicalPlan plan) {
                     var logicalFragment = fragmentExec.fragment();
 
                     // no need for projection when dealing with aggs
-                    if (logicalFragment instanceof Aggregate == false) {
+                    if (logicalFragment instanceof Aggregate == false && logicalFragment instanceof TopNAggregate == false) {
                         List<Attribute> output = new ArrayList<>(requiredAttrBuilder.build());
                         // if all the fields are filtered out, it's only the count that matters
                         // however until a proper fix (see https://github.com/elastic/elasticsearch/issues/98703)
 
@@ -0,0 +1,183 @@
+/*
+ * Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
+ * or more contributor license agreements. Licensed under the Elastic License
+ * 2.0; you may not use this file except in compliance with the Elastic License
+ * 2.0.
+ */
+
+package org.elasticsearch.xpack.esql.plan.physical;
+
+import org.elasticsearch.TransportVersions;
+import org.elasticsearch.common.io.stream.StreamInput;
+import org.elasticsearch.common.io.stream.StreamOutput;
+import org.elasticsearch.compute.aggregation.AggregatorMode;
+import org.elasticsearch.xpack.esql.core.expression.Attribute;
+import org.elasticsearch.xpack.esql.core.expression.AttributeSet;
+import org.elasticsearch.xpack.esql.core.expression.Expression;
+import org.elasticsearch.xpack.esql.core.expression.NamedExpression;
+import org.elasticsearch.xpack.esql.core.tree.Source;
+import org.elasticsearch.xpack.esql.expression.function.grouping.Categorize;
+import org.elasticsearch.xpack.esql.io.stream.PlanStreamInput;
+import org.elasticsearch.xpack.esql.plan.logical.Aggregate;
+
+import java.io.IOException;
+import java.util.ArrayList;
+import java.util.HashSet;
+import java.util.List;
+import java.util.Objects;
+
+/**
+ * Base class for aggregate nodes.
+ */
+public abstract class AbstractAggregateExec extends UnaryExec implements EstimatesRowSize {
+    /** Grouping expressions of this aggregation. */
+    protected final List<? extends Expression> groupings;
+    /** Aggregate expressions of this aggregation. */
+    protected final List<? extends NamedExpression> aggregates;
+    /**
+     * Attributes produced by {@link AggregatorMode#INITIAL} and {@link AggregatorMode#INTERMEDIATE} aggregations, which are
+     * likewise the attributes consumed by {@link AggregatorMode#FINAL} and {@link AggregatorMode#INTERMEDIATE} aggregations.
+     */
+    protected final List<Attribute> intermediateAttributes;
+
+    /** The aggregator mode this node runs in. */
+    protected final AggregatorMode mode;
+
+    /**
+     * Estimated number of bytes loaded per position before the stream of pages is consumed.
+     * It is (de)serialized as an optional value, so it may be {@code null}.
+     */
+    protected final Integer estimatedRowSize;
+
+    /**
+     * Creates the node from its individual components; all arguments are stored as given.
+     */
+    protected AbstractAggregateExec(
+        Source source,
+        PhysicalPlan child,
+        List<? extends Expression> groupings,
+        List<? extends NamedExpression> aggregates,
+        AggregatorMode mode,
+        List<Attribute> intermediateAttributes,
+        Integer estimatedRowSize
+    ) {
+        super(source, child);
+        this.mode = mode;
+        this.groupings = groupings;
+        this.aggregates = aggregates;
+        this.intermediateAttributes = intermediateAttributes;
+        this.estimatedRowSize = estimatedRowSize;
+    }
+
+    /**
+     * Reads the node from the wire. The fields are read in this order: source, child, groupings, aggregates, mode,
+     * intermediate attributes and the optional estimated row size.
+     */
+    protected AbstractAggregateExec(StreamInput in) throws IOException {
+        // Aggregate nodes are only deserialized for node level reduction, and that is switched off until at least 8.16.
+        // Old nodes therefore never send AggregateExecs to new nodes, so earlier transport versions need no handling here.
+        super(Source.readFrom((PlanStreamInput) in), in.readNamedWriteable(PhysicalPlan.class));
+        this.groupings = in.readNamedWriteableCollectionAsList(Expression.class);
+        this.aggregates = in.readNamedWriteableCollectionAsList(NamedExpression.class);
+        this.mode = in.readEnum(AggregatorMode.class);
+        this.intermediateAttributes = in.readNamedWriteableCollectionAsList(Attribute.class);
+        this.estimatedRowSize = in.readOptionalVInt();
+    }
+
+    /**
+     * Writes the node to the wire. {@link Source#EMPTY} is written in place of this node's own source.
+     * Targets on or after 8.16.0 receive the {@link AggregatorMode} followed by the intermediate attributes;
+     * older targets receive only the legacy {@link Mode}, which cannot represent {@link AggregatorMode#INTERMEDIATE}.
+     */
+    @Override
+    public void writeTo(StreamOutput out) throws IOException {
+        Source.EMPTY.writeTo(out);
+        out.writeNamedWriteable(child());
+        out.writeNamedWriteableCollection(groupings());
+        out.writeNamedWriteableCollection(aggregates());
+        boolean understandsAggregatorMode = out.getTransportVersion().onOrAfter(TransportVersions.V_8_16_0);
+        if (understandsAggregatorMode == false) {
+            // bwc: fall back to the legacy three-valued mode; no intermediate attributes are sent
+            out.writeEnum(Mode.fromAggregatorMode(getMode()));
+        } else {
+            out.writeEnum(getMode());
+            out.writeNamedWriteableCollection(intermediateAttributes());
+        }
+        out.writeOptionalVInt(estimatedRowSize());
+    }
+
+    /** Returns the grouping expressions. */
+    public List<? extends Expression> groupings() {
+        return groupings;
+    }
+
+    /** Returns the aggregate expressions. */
+    public List<? extends NamedExpression> aggregates() {
+        return aggregates;
+    }
+
+    /**
+     * Returns the estimated number of bytes loaded per position before the stream of pages is consumed.
+     */
+    public Integer estimatedRowSize() {
+        return estimatedRowSize;
+    }
+
+    /**
+     * Recomputes the row size estimate from the aggregates, with a lower bound of 1.
+     *
+     * @return this node if the estimate is unchanged, otherwise the result of {@link #withEstimatedSize(int)}
+     */
+    @Override
+    public PhysicalPlan estimateRowSize(State state) {
+        // Only the aggregates are added: the groupings are already contained within them.
+        state.add(false, aggregates);
+        int estimate = Math.max(state.consumeAllFields(true), 1);
+        if (Objects.equals(this.estimatedRowSize, estimate)) {
+            return this;
+        }
+        return withEstimatedSize(estimate);
+    }
+
+    /** Returns a node carrying the given estimated row size. */
+    protected abstract AbstractAggregateExec withEstimatedSize(int estimatedRowSize);
+
+    /** Returns the aggregator mode of this node. */
+    public AggregatorMode getMode() {
+        return mode;
+    }
+
+    /**
+     * Legacy mode representation, kept only for bwc when de-/serializing.
+     */
+    @Deprecated
+    private enum Mode {
+        SINGLE,
+        PARTIAL, // turns raw inputs into intermediate outputs
+        FINAL; // turns intermediate inputs into final outputs
+
+        /**
+         * Translates an {@link AggregatorMode} into its legacy counterpart.
+         *
+         * @throws UnsupportedOperationException for {@link AggregatorMode#INTERMEDIATE}, which has no legacy counterpart
+         */
+        static Mode fromAggregatorMode(AggregatorMode aggregatorMode) {
+            return switch (aggregatorMode) {
+                case SINGLE -> SINGLE;
+                case INITIAL -> PARTIAL;
+                case FINAL -> FINAL;
+                case INTERMEDIATE -> {
+                    // Returning PARTIAL would be an option if ever needed: that is how intermediate aggs used to be encoded
+                    // for data node level reduction.
+                    throw new UnsupportedOperationException("cannot turn intermediate aggregation into single, partial or final.");
+                }
+            };
+        }
+    }
+
+    /**
+     * Aggregations usually run in two steps: a partial one (e.g. locally on a data node) followed by a final one (on the
+     * coordinator node). This returns the intermediate attributes that a partial aggregation outputs and a final one consumes.
+     * C.f. {@link org.elasticsearch.xpack.esql.planner.AbstractPhysicalOperationProviders#intermediateAttributes}.
+     */
+    public List<Attribute> intermediateAttributes() {
+        return intermediateAttributes;
+    }
+
+    /**
+     * Returns the intermediate attributes when the mode's output is partial, otherwise the output derived from the aggregates.
+     */
+    @Override
+    public List<Attribute> output() {
+        if (mode.isOutputPartial()) {
+            return intermediateAttributes;
+        }
+        return Aggregate.output(aggregates);
+    }
+
+    /**
+     * Returns the intermediate attributes when the mode's input is partial; otherwise the references of the aggregates and
+     * groupings minus the {@link #ordinalAttributes()}.
+     */
+    @Override
+    protected AttributeSet computeReferences() {
+        if (mode.isInputPartial()) {
+            return AttributeSet.of(intermediateAttributes);
+        }
+        var referenced = Aggregate.computeReferences(aggregates, groupings);
+        return referenced.subtract(AttributeSet.of(ordinalAttributes()));
+    }
+
+    /** Returns the attributes that can be loaded from ordinals -- no explicit extraction is needed */
+    public List<Attribute> ordinalAttributes() {
+        List<Attribute> ordinals = new ArrayList<>(groupings.size());
+        // Ordinals only help with exactly one grouping. With several groupings the fields have to be loaded for the
+        // hash aggregator.
+        if (groupings().size() != 1) {
+            return ordinals;
+        }
+        // CATEGORIZE needs the standard hash aggregator as well.
+        if (groupings.get(0).anyMatch(expression -> expression instanceof Categorize)) {
+            return ordinals;
+        }
+        // Leaves of every aggregate that is not itself one of the groupings.
+        HashSet<Object> leaves = new HashSet<>();
+        for (NamedExpression aggregate : aggregates) {
+            if (groupings.contains(aggregate) == false) {
+                leaves.addAll(aggregate.collectLeaves());
+            }
+        }
+        // A grouping that is also a leaf of such an aggregate is excluded from the result.
+        for (Expression grouping : groupings) {
+            if (leaves.contains(grouping) == false) {
+                ordinals.add((Attribute) grouping);
+            }
+        }
+        return ordinals;
+    }
+}