[feature](Nereids): eliminate groupby (#28615)

This commit is contained in:
jakevin
2023-12-28 14:00:41 +08:00
committed by GitHub
parent bc08535285
commit f816d13c56
5 changed files with 191 additions and 1 deletions

View File

@ -55,6 +55,7 @@ import org.apache.doris.nereids.rules.rewrite.EliminateAssertNumRows;
import org.apache.doris.nereids.rules.rewrite.EliminateDedupJoinCondition;
import org.apache.doris.nereids.rules.rewrite.EliminateEmptyRelation;
import org.apache.doris.nereids.rules.rewrite.EliminateFilter;
import org.apache.doris.nereids.rules.rewrite.EliminateGroupBy;
import org.apache.doris.nereids.rules.rewrite.EliminateJoinByFK;
import org.apache.doris.nereids.rules.rewrite.EliminateJoinCondition;
import org.apache.doris.nereids.rules.rewrite.EliminateLimit;
@ -276,6 +277,10 @@ public class Rewriter extends AbstractBatchJobExecutor {
topDown(new BuildAggForUnion())
),
topic("Eliminate GroupBy",
topDown(new EliminateGroupBy())
),
topic("Eager aggregation",
topDown(
new PushDownSumThroughJoin(),

View File

@ -220,7 +220,8 @@ public class FunctionalDependencies {
.map(s -> replaceMap.getOrDefault(s, s))
.collect(Collectors.toSet());
slotSets = slotSets.stream()
.map(set -> set.stream().map(replaceMap::get).collect(ImmutableSet.toImmutableSet()))
.map(set -> set.stream().map(s -> replaceMap.getOrDefault(s, s))
.collect(ImmutableSet.toImmutableSet()))
.collect(Collectors.toSet());
}

View File

@ -207,6 +207,7 @@ public enum RuleType {
ELIMINATE_NOT_NULL(RuleTypeClass.REWRITE),
ELIMINATE_UNNECESSARY_PROJECT(RuleTypeClass.REWRITE),
ELIMINATE_OUTER_JOIN(RuleTypeClass.REWRITE),
ELIMINATE_GROUP_BY(RuleTypeClass.REWRITE),
ELIMINATE_DEDUP_JOIN_CONDITION(RuleTypeClass.REWRITE),
ELIMINATE_NULL_AWARE_LEFT_ANTI_JOIN(RuleTypeClass.REWRITE),
ELIMINATE_ASSERT_NUM_ROWS(RuleTypeClass.REWRITE),

View File

@ -0,0 +1,83 @@
// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied. See the License for the
// specific language governing permissions and limitations
// under the License.
package org.apache.doris.nereids.rules.rewrite;
import org.apache.doris.nereids.rules.Rule;
import org.apache.doris.nereids.rules.RuleType;
import org.apache.doris.nereids.trees.expressions.Alias;
import org.apache.doris.nereids.trees.expressions.IsNull;
import org.apache.doris.nereids.trees.expressions.NamedExpression;
import org.apache.doris.nereids.trees.expressions.Slot;
import org.apache.doris.nereids.trees.expressions.functions.agg.AggregateFunction;
import org.apache.doris.nereids.trees.expressions.functions.agg.Count;
import org.apache.doris.nereids.trees.expressions.functions.agg.Max;
import org.apache.doris.nereids.trees.expressions.functions.agg.Min;
import org.apache.doris.nereids.trees.expressions.functions.agg.Sum;
import org.apache.doris.nereids.trees.expressions.functions.scalar.If;
import org.apache.doris.nereids.trees.expressions.literal.Literal;
import org.apache.doris.nereids.trees.plans.Plan;
import org.apache.doris.nereids.util.PlanUtils;
import java.util.List;
import java.util.Set;
import java.util.stream.Collectors;
/**
 * Eliminate GroupBy.
 *
 * <p>Matches an aggregate that has at least one group-by key and whose keys are all plain slots.
 * If the child's functional dependencies report the key set as unique and not null, and every
 * aggregate function is a one-argument {@code sum}/{@code count}/{@code min}/{@code max} over a
 * slot, the aggregate is replaced by a projection over its child:
 * <ul>
 *   <li>{@code sum(x)}, {@code min(x)} and {@code max(x)} become {@code x};</li>
 *   <li>{@code count(x)} becomes {@code if(x is null, 0, 1)};</li>
 *   <li>every other output expression is kept unchanged.</li>
 * </ul>
 * In every other case the rule returns {@code null} and the plan is left as it is.
 */
public class EliminateGroupBy extends OneRewriteRuleFactory {
    @Override
    public Rule build() {
        return logicalAggregate()
                // allMatch() is vacuously true for an empty key list, so an aggregate without GROUP BY
                // would otherwise pass this pattern. Such an aggregate emits one row even for empty
                // input and can never be replaced by a projection, hence the explicit guard instead
                // of relying on how isUniqueAndNotNull() treats an empty set.
                .when(agg -> !agg.getGroupByExpressions().isEmpty()
                        && agg.getGroupByExpressions().stream().allMatch(expr -> expr instanceof Slot))
                .then(agg -> {
                    Set<Slot> groupby = agg.getGroupByExpressions().stream().map(e -> (Slot) e)
                            .collect(Collectors.toSet());
                    Plan child = agg.child();
                    boolean unique = child.getLogicalProperties().getFunctionalDependencies()
                            .isUniqueAndNotNull(groupby);
                    if (!unique) {
                        return null;
                    }
                    Set<AggregateFunction> aggregateFunctions = agg.getAggregateFunctions();
                    if (!aggregateFunctions.stream().allMatch(EliminateGroupBy::isSupported)) {
                        return null;
                    }
                    List<NamedExpression> newOutput = agg.getOutputExpressions().stream()
                            .map(EliminateGroupBy::rewriteOutput)
                            .collect(Collectors.toList());
                    return PlanUtils.projectOrSelf(newOutput, child);
                }).toRule(RuleType.ELIMINATE_GROUP_BY);
    }

    /** Returns true if {@code f} is a one-argument sum/count/min/max whose argument is a slot. */
    private static boolean isSupported(AggregateFunction f) {
        boolean knownFunction = f instanceof Sum || f instanceof Count || f instanceof Min || f instanceof Max;
        return knownFunction && f.arity() == 1 && f.child(0) instanceof Slot;
    }

    /**
     * Rewrites one output expression of the eliminated aggregate.
     *
     * <p>Only an alias whose direct child is an aggregate function is rewritten; anything else is
     * returned as is.
     *
     * @throws IllegalStateException if the aliased aggregate function is not sum/count/min/max
     */
    private static NamedExpression rewriteOutput(NamedExpression ne) {
        if (!(ne instanceof Alias && ne.child(0) instanceof AggregateFunction)) {
            return ne;
        }
        AggregateFunction f = (AggregateFunction) ne.child(0);
        // NOTE(review): the replacements below take their type from the argument (or from the
        // integer literals), not from the aggregate function. If the aggregate's result type differs
        // from that, the output type of this alias changes -- confirm, and add a cast if so.
        if (f instanceof Sum || f instanceof Min || f instanceof Max) {
            // Keep the original ExprId and name so references from parent plans still resolve.
            return new Alias(ne.getExprId(), f.child(0), ne.getName());
        }
        if (f instanceof Count) {
            return (NamedExpression) ne.withChildren(
                    new If(new IsNull(f.child(0)), Literal.of(0), Literal.of(1)));
        }
        throw new IllegalStateException("Unexpected aggregate function: " + f);
    }
}