[feature](Nereids): eager aggregate support mix agg function (#30400)
This commit is contained in:
@ -98,16 +98,14 @@ import org.apache.doris.nereids.rules.rewrite.PullUpProjectUnderTopN;
|
||||
import org.apache.doris.nereids.rules.rewrite.PushConjunctsIntoEsScan;
|
||||
import org.apache.doris.nereids.rules.rewrite.PushConjunctsIntoJdbcScan;
|
||||
import org.apache.doris.nereids.rules.rewrite.PushConjunctsIntoOdbcScan;
|
||||
import org.apache.doris.nereids.rules.rewrite.PushDownAggThroughJoinOneSide;
|
||||
import org.apache.doris.nereids.rules.rewrite.PushDownCountThroughJoin;
|
||||
import org.apache.doris.nereids.rules.rewrite.PushDownCountThroughJoinOneSide;
|
||||
import org.apache.doris.nereids.rules.rewrite.PushDownDistinctThroughJoin;
|
||||
import org.apache.doris.nereids.rules.rewrite.PushDownFilterThroughProject;
|
||||
import org.apache.doris.nereids.rules.rewrite.PushDownLimit;
|
||||
import org.apache.doris.nereids.rules.rewrite.PushDownLimitDistinctThroughJoin;
|
||||
import org.apache.doris.nereids.rules.rewrite.PushDownLimitDistinctThroughUnion;
|
||||
import org.apache.doris.nereids.rules.rewrite.PushDownMinMaxThroughJoin;
|
||||
import org.apache.doris.nereids.rules.rewrite.PushDownSumThroughJoin;
|
||||
import org.apache.doris.nereids.rules.rewrite.PushDownSumThroughJoinOneSide;
|
||||
import org.apache.doris.nereids.rules.rewrite.PushDownTopNDistinctThroughJoin;
|
||||
import org.apache.doris.nereids.rules.rewrite.PushDownTopNDistinctThroughUnion;
|
||||
import org.apache.doris.nereids.rules.rewrite.PushDownTopNThroughJoin;
|
||||
@ -291,13 +289,9 @@ public class Rewriter extends AbstractBatchJobExecutor {
|
||||
topic("Eager aggregation",
|
||||
topDown(
|
||||
new PushDownSumThroughJoin(),
|
||||
new PushDownMinMaxThroughJoin(),
|
||||
new PushDownAggThroughJoinOneSide(),
|
||||
new PushDownCountThroughJoin()
|
||||
),
|
||||
topDown(
|
||||
new PushDownSumThroughJoinOneSide(),
|
||||
new PushDownCountThroughJoinOneSide()
|
||||
),
|
||||
custom(RuleType.PUSH_DOWN_DISTINCT_THROUGH_JOIN, PushDownDistinctThroughJoin::new)
|
||||
),
|
||||
|
||||
|
||||
@ -167,13 +167,10 @@ public enum RuleType {
|
||||
COLUMN_PRUNING(RuleTypeClass.REWRITE),
|
||||
ELIMINATE_SORT(RuleTypeClass.REWRITE),
|
||||
|
||||
PUSH_DOWN_MIN_MAX_THROUGH_JOIN(RuleTypeClass.REWRITE),
|
||||
PUSH_DOWN_AGG_THROUGH_JOIN_ONE_SIDE(RuleTypeClass.REWRITE),
|
||||
PUSH_DOWN_SUM_THROUGH_JOIN(RuleTypeClass.REWRITE),
|
||||
PUSH_DOWN_COUNT_THROUGH_JOIN(RuleTypeClass.REWRITE),
|
||||
|
||||
PUSH_DOWN_SUM_THROUGH_JOIN_ONE_SIDE(RuleTypeClass.REWRITE),
|
||||
PUSH_DOWN_COUNT_THROUGH_JOIN_ONE_SIDE(RuleTypeClass.REWRITE),
|
||||
|
||||
TRANSPOSE_LOGICAL_SEMI_JOIN_LOGICAL_JOIN(RuleTypeClass.REWRITE),
|
||||
TRANSPOSE_LOGICAL_SEMI_JOIN_LOGICAL_JOIN_PROJECT(RuleTypeClass.REWRITE),
|
||||
LOGICAL_SEMI_JOIN_COMMUTE(RuleTypeClass.REWRITE),
|
||||
|
||||
@ -24,8 +24,10 @@ import org.apache.doris.nereids.trees.expressions.Expression;
|
||||
import org.apache.doris.nereids.trees.expressions.NamedExpression;
|
||||
import org.apache.doris.nereids.trees.expressions.Slot;
|
||||
import org.apache.doris.nereids.trees.expressions.functions.agg.AggregateFunction;
|
||||
import org.apache.doris.nereids.trees.expressions.functions.agg.Count;
|
||||
import org.apache.doris.nereids.trees.expressions.functions.agg.Max;
|
||||
import org.apache.doris.nereids.trees.expressions.functions.agg.Min;
|
||||
import org.apache.doris.nereids.trees.expressions.functions.agg.Sum;
|
||||
import org.apache.doris.nereids.trees.plans.Plan;
|
||||
import org.apache.doris.nereids.trees.plans.logical.LogicalAggregate;
|
||||
import org.apache.doris.nereids.trees.plans.logical.LogicalJoin;
|
||||
@ -46,22 +48,22 @@ import java.util.Set;
|
||||
* TODO: distinct
|
||||
* Related paper "Eager aggregation and lazy aggregation".
|
||||
* <pre>
|
||||
* aggregate: Min/Max(x)
|
||||
* aggregate: Min/Max/Sum(x)
|
||||
* |
|
||||
* join
|
||||
* | \
|
||||
* | *
|
||||
* (x)
|
||||
* ->
|
||||
* aggregate: Min/Max(min1)
|
||||
* aggregate: Min/Max/Sum(min1)
|
||||
* |
|
||||
* join
|
||||
* | \
|
||||
* | *
|
||||
* aggregate: Min/Max(x) as min1
|
||||
* aggregate: Min/Max/Sum(x) as min1
|
||||
* </pre>
|
||||
*/
|
||||
public class PushDownMinMaxThroughJoin implements RewriteRuleFactory {
|
||||
public class PushDownAggThroughJoinOneSide implements RewriteRuleFactory {
|
||||
@Override
|
||||
public List<Rule> buildRules() {
|
||||
return ImmutableList.of(
|
||||
@ -71,19 +73,20 @@ public class PushDownMinMaxThroughJoin implements RewriteRuleFactory {
|
||||
.when(agg -> {
|
||||
Set<AggregateFunction> funcs = agg.getAggregateFunctions();
|
||||
return !funcs.isEmpty() && funcs.stream()
|
||||
.allMatch(f -> (f instanceof Min || f instanceof Max) && !f.isDistinct() && f.child(
|
||||
0) instanceof Slot);
|
||||
.allMatch(f -> (f instanceof Min || f instanceof Max || f instanceof Sum
|
||||
|| (f instanceof Count && !((Count) f).isCountStar())) && !f.isDistinct()
|
||||
&& f.child(0) instanceof Slot);
|
||||
})
|
||||
.thenApply(ctx -> {
|
||||
Set<Integer> enableNereidsRules = ctx.cascadesContext.getConnectContext()
|
||||
.getSessionVariable().getEnableNereidsRules();
|
||||
if (!enableNereidsRules.contains(RuleType.PUSH_DOWN_MIN_MAX_THROUGH_JOIN.type())) {
|
||||
if (!enableNereidsRules.contains(RuleType.PUSH_DOWN_AGG_THROUGH_JOIN_ONE_SIDE.type())) {
|
||||
return null;
|
||||
}
|
||||
LogicalAggregate<LogicalJoin<Plan, Plan>> agg = ctx.root;
|
||||
return pushMinMaxSum(agg, agg.child(), ImmutableList.of());
|
||||
return pushMinMaxSumCount(agg, agg.child(), ImmutableList.of());
|
||||
})
|
||||
.toRule(RuleType.PUSH_DOWN_MIN_MAX_THROUGH_JOIN),
|
||||
.toRule(RuleType.PUSH_DOWN_AGG_THROUGH_JOIN_ONE_SIDE),
|
||||
logicalAggregate(logicalProject(innerLogicalJoin()))
|
||||
.when(agg -> agg.child().isAllSlots())
|
||||
.when(agg -> agg.child().child().getOtherJoinConjuncts().isEmpty())
|
||||
@ -91,27 +94,27 @@ public class PushDownMinMaxThroughJoin implements RewriteRuleFactory {
|
||||
.when(agg -> {
|
||||
Set<AggregateFunction> funcs = agg.getAggregateFunctions();
|
||||
return !funcs.isEmpty() && funcs.stream()
|
||||
.allMatch(
|
||||
f -> (f instanceof Min || f instanceof Max) && !f.isDistinct() && f.child(
|
||||
0) instanceof Slot);
|
||||
.allMatch(f -> (f instanceof Min || f instanceof Max || f instanceof Sum
|
||||
|| (f instanceof Count && (!((Count) f).isCountStar()))) && !f.isDistinct()
|
||||
&& f.child(0) instanceof Slot);
|
||||
})
|
||||
.thenApply(ctx -> {
|
||||
Set<Integer> enableNereidsRules = ctx.cascadesContext.getConnectContext()
|
||||
.getSessionVariable().getEnableNereidsRules();
|
||||
if (!enableNereidsRules.contains(RuleType.PUSH_DOWN_MIN_MAX_THROUGH_JOIN.type())) {
|
||||
if (!enableNereidsRules.contains(RuleType.PUSH_DOWN_AGG_THROUGH_JOIN_ONE_SIDE.type())) {
|
||||
return null;
|
||||
}
|
||||
LogicalAggregate<LogicalProject<LogicalJoin<Plan, Plan>>> agg = ctx.root;
|
||||
return pushMinMaxSum(agg, agg.child().child(), agg.child().getProjects());
|
||||
return pushMinMaxSumCount(agg, agg.child().child(), agg.child().getProjects());
|
||||
})
|
||||
.toRule(RuleType.PUSH_DOWN_MIN_MAX_THROUGH_JOIN)
|
||||
.toRule(RuleType.PUSH_DOWN_AGG_THROUGH_JOIN_ONE_SIDE)
|
||||
);
|
||||
}
|
||||
|
||||
/**
|
||||
* Push down Min/Max/Sum/Count through join.
|
||||
*/
|
||||
public static LogicalAggregate<Plan> pushMinMaxSum(LogicalAggregate<? extends Plan> agg,
|
||||
public static LogicalAggregate<Plan> pushMinMaxSumCount(LogicalAggregate<? extends Plan> agg,
|
||||
LogicalJoin<Plan, Plan> join, List<NamedExpression> projects) {
|
||||
List<Slot> leftOutput = join.left().getOutput();
|
||||
List<Slot> rightOutput = join.right().getOutput();
|
||||
@ -183,21 +186,22 @@ public class PushDownMinMaxThroughJoin implements RewriteRuleFactory {
|
||||
Preconditions.checkState(left != join.left() || right != join.right());
|
||||
Plan newJoin = join.withChildren(left, right);
|
||||
|
||||
// top agg
|
||||
// top agg TODO: AVG
|
||||
// replace
|
||||
// min(x) -> min(min#)
|
||||
// max(x) -> max(max#)
|
||||
// sum(x) -> sum(sum#)
|
||||
// count(x) -> sum(count#)
|
||||
List<NamedExpression> newOutputExprs = new ArrayList<>();
|
||||
for (NamedExpression ne : agg.getOutputExpressions()) {
|
||||
if (ne instanceof Alias && ((Alias) ne).child() instanceof AggregateFunction) {
|
||||
AggregateFunction func = (AggregateFunction) ((Alias) ne).child();
|
||||
Slot slot = (Slot) func.child(0);
|
||||
if (leftSlotToOutput.containsKey(slot)) {
|
||||
Expression newFunc = func.withChildren(leftSlotToOutput.get(slot).toSlot());
|
||||
Expression newFunc = replaceAggFunc(func, leftSlotToOutput.get(slot).toSlot());
|
||||
newOutputExprs.add((NamedExpression) ne.withChildren(newFunc));
|
||||
} else if (rightSlotToOutput.containsKey(slot)) {
|
||||
Expression newFunc = func.withChildren(rightSlotToOutput.get(slot).toSlot());
|
||||
Expression newFunc = replaceAggFunc(func, rightSlotToOutput.get(slot).toSlot());
|
||||
newOutputExprs.add((NamedExpression) ne.withChildren(newFunc));
|
||||
} else {
|
||||
throw new IllegalStateException("Slot " + slot + " not found in join output");
|
||||
@ -210,4 +214,12 @@ public class PushDownMinMaxThroughJoin implements RewriteRuleFactory {
|
||||
// TODO: column prune project
|
||||
return agg.withAggOutputChild(newOutputExprs, newJoin);
|
||||
}
|
||||
|
||||
private static Expression replaceAggFunc(AggregateFunction func, Slot inputSlot) {
|
||||
if (func instanceof Count) {
|
||||
return new Sum(inputSlot);
|
||||
} else {
|
||||
return func.withChildren(inputSlot);
|
||||
}
|
||||
}
|
||||
}
|
||||
@ -1,216 +0,0 @@
|
||||
// Licensed to the Apache Software Foundation (ASF) under one
|
||||
// or more contributor license agreements. See the NOTICE file
|
||||
// distributed with this work for additional information
|
||||
// regarding copyright ownership. The ASF licenses this file
|
||||
// to you under the Apache License, Version 2.0 (the
|
||||
// "License"); you may not use this file except in compliance
|
||||
// with the License. You may obtain a copy of the License at
|
||||
//
|
||||
// http://www.apache.org/licenses/LICENSE-2.0
|
||||
//
|
||||
// Unless required by applicable law or agreed to in writing,
|
||||
// software distributed under the License is distributed on an
|
||||
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
|
||||
// KIND, either express or implied. See the License for the
|
||||
// specific language governing permissions and limitations
|
||||
// under the License.
|
||||
|
||||
package org.apache.doris.nereids.rules.rewrite;
|
||||
|
||||
import org.apache.doris.nereids.rules.Rule;
|
||||
import org.apache.doris.nereids.rules.RuleType;
|
||||
import org.apache.doris.nereids.trees.expressions.Alias;
|
||||
import org.apache.doris.nereids.trees.expressions.Expression;
|
||||
import org.apache.doris.nereids.trees.expressions.NamedExpression;
|
||||
import org.apache.doris.nereids.trees.expressions.Slot;
|
||||
import org.apache.doris.nereids.trees.expressions.functions.agg.AggregateFunction;
|
||||
import org.apache.doris.nereids.trees.expressions.functions.agg.Count;
|
||||
import org.apache.doris.nereids.trees.expressions.functions.agg.Sum;
|
||||
import org.apache.doris.nereids.trees.plans.Plan;
|
||||
import org.apache.doris.nereids.trees.plans.logical.LogicalAggregate;
|
||||
import org.apache.doris.nereids.trees.plans.logical.LogicalJoin;
|
||||
import org.apache.doris.nereids.trees.plans.logical.LogicalProject;
|
||||
|
||||
import com.google.common.base.Preconditions;
|
||||
import com.google.common.collect.ImmutableList;
|
||||
import com.google.common.collect.ImmutableList.Builder;
|
||||
|
||||
import java.util.ArrayList;
|
||||
import java.util.HashMap;
|
||||
import java.util.HashSet;
|
||||
import java.util.List;
|
||||
import java.util.Map;
|
||||
import java.util.Set;
|
||||
|
||||
/**
|
||||
* TODO: distinct | just push one level
|
||||
* Support Pushdown Count(col).
|
||||
* Count(col) -> Sum( cnt )
|
||||
* <p>
|
||||
* Related paper "Eager aggregation and lazy aggregation".
|
||||
* <pre>
|
||||
* aggregate: count(x)
|
||||
* |
|
||||
* join
|
||||
* | \
|
||||
* | *
|
||||
* (x)
|
||||
* ->
|
||||
* aggregate: Sum( cnt )
|
||||
* |
|
||||
* join
|
||||
* | \
|
||||
* | *
|
||||
* aggregate: count(x) as cnt
|
||||
* </pre>
|
||||
* Notice: rule can't optimize condition that groupby is empty when Count(*) exists.
|
||||
*/
|
||||
public class PushDownCountThroughJoinOneSide implements RewriteRuleFactory {
|
||||
@Override
|
||||
public List<Rule> buildRules() {
|
||||
return ImmutableList.of(
|
||||
logicalAggregate(innerLogicalJoin())
|
||||
.when(agg -> agg.child().getOtherJoinConjuncts().isEmpty())
|
||||
.whenNot(agg -> agg.child().children().stream().anyMatch(p -> p instanceof LogicalAggregate))
|
||||
.when(agg -> agg.getGroupByExpressions().stream().allMatch(e -> e instanceof Slot))
|
||||
.when(agg -> {
|
||||
Set<AggregateFunction> funcs = agg.getAggregateFunctions();
|
||||
return !funcs.isEmpty() && funcs.stream()
|
||||
.allMatch(f -> f instanceof Count && !f.isDistinct()
|
||||
&& (!((Count) f).isCountStar() && f.child(0) instanceof Slot));
|
||||
})
|
||||
.thenApply(ctx -> {
|
||||
Set<Integer> enableNereidsRules = ctx.cascadesContext.getConnectContext()
|
||||
.getSessionVariable().getEnableNereidsRules();
|
||||
if (!enableNereidsRules.contains(RuleType.PUSH_DOWN_COUNT_THROUGH_JOIN_ONE_SIDE.type())) {
|
||||
return null;
|
||||
}
|
||||
LogicalAggregate<LogicalJoin<Plan, Plan>> agg = ctx.root;
|
||||
return pushCount(agg, agg.child(), ImmutableList.of());
|
||||
})
|
||||
.toRule(RuleType.PUSH_DOWN_COUNT_THROUGH_JOIN_ONE_SIDE),
|
||||
logicalAggregate(logicalProject(innerLogicalJoin()))
|
||||
.when(agg -> agg.child().isAllSlots())
|
||||
.when(agg -> agg.child().child().getOtherJoinConjuncts().isEmpty())
|
||||
.whenNot(agg -> agg.child().children().stream().anyMatch(p -> p instanceof LogicalAggregate))
|
||||
.when(agg -> agg.getGroupByExpressions().stream().allMatch(e -> e instanceof Slot))
|
||||
.when(agg -> {
|
||||
Set<AggregateFunction> funcs = agg.getAggregateFunctions();
|
||||
return !funcs.isEmpty() && funcs.stream()
|
||||
.allMatch(f -> f instanceof Count && !f.isDistinct()
|
||||
&& (!((Count) f).isCountStar() && f.child(0) instanceof Slot));
|
||||
})
|
||||
.thenApply(ctx -> {
|
||||
Set<Integer> enableNereidsRules = ctx.cascadesContext.getConnectContext()
|
||||
.getSessionVariable().getEnableNereidsRules();
|
||||
if (!enableNereidsRules.contains(RuleType.PUSH_DOWN_COUNT_THROUGH_JOIN_ONE_SIDE.type())) {
|
||||
return null;
|
||||
}
|
||||
LogicalAggregate<LogicalProject<LogicalJoin<Plan, Plan>>> agg = ctx.root;
|
||||
return pushCount(agg, agg.child().child(), agg.child().getProjects());
|
||||
})
|
||||
.toRule(RuleType.PUSH_DOWN_COUNT_THROUGH_JOIN_ONE_SIDE)
|
||||
);
|
||||
}
|
||||
|
||||
private LogicalAggregate<Plan> pushCount(LogicalAggregate<? extends Plan> agg,
|
||||
LogicalJoin<Plan, Plan> join, List<NamedExpression> projects) {
|
||||
List<Slot> leftOutput = join.left().getOutput();
|
||||
List<Slot> rightOutput = join.right().getOutput();
|
||||
|
||||
List<Count> leftCounts = new ArrayList<>();
|
||||
List<Count> rightCounts = new ArrayList<>();
|
||||
for (AggregateFunction f : agg.getAggregateFunctions()) {
|
||||
Count count = (Count) f;
|
||||
Slot slot = (Slot) count.child(0);
|
||||
if (leftOutput.contains(slot)) {
|
||||
leftCounts.add(count);
|
||||
} else if (rightOutput.contains(slot)) {
|
||||
rightCounts.add(count);
|
||||
} else {
|
||||
throw new IllegalStateException("Slot " + slot + " not found in join output");
|
||||
}
|
||||
}
|
||||
|
||||
Set<Slot> leftGroupBy = new HashSet<>();
|
||||
Set<Slot> rightGroupBy = new HashSet<>();
|
||||
for (Expression e : agg.getGroupByExpressions()) {
|
||||
Slot slot = (Slot) e;
|
||||
if (leftOutput.contains(slot)) {
|
||||
leftGroupBy.add(slot);
|
||||
} else if (rightOutput.contains(slot)) {
|
||||
rightGroupBy.add(slot);
|
||||
} else {
|
||||
return null;
|
||||
}
|
||||
}
|
||||
join.getHashJoinConjuncts().forEach(e -> e.getInputSlots().forEach(slot -> {
|
||||
if (leftOutput.contains(slot)) {
|
||||
leftGroupBy.add(slot);
|
||||
} else if (rightOutput.contains(slot)) {
|
||||
rightGroupBy.add(slot);
|
||||
} else {
|
||||
throw new IllegalStateException("Slot " + slot + " not found in join output");
|
||||
}
|
||||
}));
|
||||
|
||||
Plan left = join.left();
|
||||
Plan right = join.right();
|
||||
|
||||
Map<Slot, NamedExpression> leftCntSlotToOutput = new HashMap<>();
|
||||
Map<Slot, NamedExpression> rightCntSlotToOutput = new HashMap<>();
|
||||
|
||||
// left Count agg
|
||||
if (!leftCounts.isEmpty()) {
|
||||
Builder<NamedExpression> leftCntAggOutputBuilder = ImmutableList.<NamedExpression>builder()
|
||||
.addAll(leftGroupBy);
|
||||
leftCounts.forEach(func -> {
|
||||
Alias alias = func.alias(func.getName());
|
||||
leftCntSlotToOutput.put((Slot) func.child(0), alias);
|
||||
leftCntAggOutputBuilder.add(alias);
|
||||
});
|
||||
left = new LogicalAggregate<>(ImmutableList.copyOf(leftGroupBy), leftCntAggOutputBuilder.build(),
|
||||
join.left());
|
||||
}
|
||||
|
||||
// right Count agg
|
||||
if (!rightCounts.isEmpty()) {
|
||||
Builder<NamedExpression> rightCntAggOutputBuilder = ImmutableList.<NamedExpression>builder()
|
||||
.addAll(rightGroupBy);
|
||||
rightCounts.forEach(func -> {
|
||||
Alias alias = func.alias(func.getName());
|
||||
rightCntSlotToOutput.put((Slot) func.child(0), alias);
|
||||
rightCntAggOutputBuilder.add(alias);
|
||||
});
|
||||
|
||||
right = new LogicalAggregate<>(ImmutableList.copyOf(rightGroupBy), rightCntAggOutputBuilder.build(),
|
||||
join.right());
|
||||
}
|
||||
|
||||
Preconditions.checkState(left != join.left() || right != join.right());
|
||||
Plan newJoin = join.withChildren(left, right);
|
||||
|
||||
// top Sum agg
|
||||
// count(slot) -> sum( count(slot) as cnt )
|
||||
List<NamedExpression> newOutputExprs = new ArrayList<>();
|
||||
for (NamedExpression ne : agg.getOutputExpressions()) {
|
||||
if (ne instanceof Alias && ((Alias) ne).child() instanceof Count) {
|
||||
Count oldTopCnt = (Count) ((Alias) ne).child();
|
||||
|
||||
Slot slot = (Slot) oldTopCnt.child(0);
|
||||
if (leftCntSlotToOutput.containsKey(slot)) {
|
||||
Expression expr = new Sum(leftCntSlotToOutput.get(slot).toSlot());
|
||||
newOutputExprs.add((NamedExpression) ne.withChildren(expr));
|
||||
} else if (rightCntSlotToOutput.containsKey(slot)) {
|
||||
Expression expr = new Sum(rightCntSlotToOutput.get(slot).toSlot());
|
||||
newOutputExprs.add((NamedExpression) ne.withChildren(expr));
|
||||
} else {
|
||||
throw new IllegalStateException("Slot " + slot + " not found in join output");
|
||||
}
|
||||
} else {
|
||||
newOutputExprs.add(ne);
|
||||
}
|
||||
}
|
||||
return agg.withAggOutputChild(newOutputExprs, newJoin);
|
||||
}
|
||||
}
|
||||
@ -1,98 +0,0 @@
|
||||
// Licensed to the Apache Software Foundation (ASF) under one
|
||||
// or more contributor license agreements. See the NOTICE file
|
||||
// distributed with this work for additional information
|
||||
// regarding copyright ownership. The ASF licenses this file
|
||||
// to you under the Apache License, Version 2.0 (the
|
||||
// "License"); you may not use this file except in compliance
|
||||
// with the License. You may obtain a copy of the License at
|
||||
//
|
||||
// http://www.apache.org/licenses/LICENSE-2.0
|
||||
//
|
||||
// Unless required by applicable law or agreed to in writing,
|
||||
// software distributed under the License is distributed on an
|
||||
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
|
||||
// KIND, either express or implied. See the License for the
|
||||
// specific language governing permissions and limitations
|
||||
// under the License.
|
||||
|
||||
package org.apache.doris.nereids.rules.rewrite;
|
||||
|
||||
import org.apache.doris.nereids.rules.Rule;
|
||||
import org.apache.doris.nereids.rules.RuleType;
|
||||
import org.apache.doris.nereids.trees.expressions.Slot;
|
||||
import org.apache.doris.nereids.trees.expressions.functions.agg.AggregateFunction;
|
||||
import org.apache.doris.nereids.trees.expressions.functions.agg.Sum;
|
||||
import org.apache.doris.nereids.trees.plans.Plan;
|
||||
import org.apache.doris.nereids.trees.plans.logical.LogicalAggregate;
|
||||
import org.apache.doris.nereids.trees.plans.logical.LogicalJoin;
|
||||
import org.apache.doris.nereids.trees.plans.logical.LogicalProject;
|
||||
|
||||
import com.google.common.collect.ImmutableList;
|
||||
|
||||
import java.util.List;
|
||||
import java.util.Set;
|
||||
|
||||
/**
|
||||
* TODO: distinct
|
||||
* Related paper "Eager aggregation and lazy aggregation".
|
||||
* <pre>
|
||||
* aggregate: Sum(x)
|
||||
* |
|
||||
* join
|
||||
* | \
|
||||
* | *
|
||||
* (x)
|
||||
* ->
|
||||
* aggregate: Sum(sum1)
|
||||
* |
|
||||
* join
|
||||
* | \
|
||||
* | *
|
||||
* aggregate: Sum(x) as sum1
|
||||
* </pre>
|
||||
*/
|
||||
public class PushDownSumThroughJoinOneSide implements RewriteRuleFactory {
|
||||
@Override
|
||||
public List<Rule> buildRules() {
|
||||
return ImmutableList.of(
|
||||
logicalAggregate(innerLogicalJoin())
|
||||
.when(agg -> agg.child().getOtherJoinConjuncts().isEmpty())
|
||||
.whenNot(agg -> agg.child().children().stream().anyMatch(p -> p instanceof LogicalAggregate))
|
||||
.when(agg -> {
|
||||
Set<AggregateFunction> funcs = agg.getAggregateFunctions();
|
||||
return !funcs.isEmpty() && funcs.stream()
|
||||
.allMatch(f -> f instanceof Sum && !f.isDistinct() && f.child(0) instanceof Slot);
|
||||
})
|
||||
.thenApply(ctx -> {
|
||||
Set<Integer> enableNereidsRules = ctx.cascadesContext.getConnectContext()
|
||||
.getSessionVariable().getEnableNereidsRules();
|
||||
if (!enableNereidsRules.contains(RuleType.PUSH_DOWN_SUM_THROUGH_JOIN_ONE_SIDE.type())) {
|
||||
return null;
|
||||
}
|
||||
LogicalAggregate<LogicalJoin<Plan, Plan>> agg = ctx.root;
|
||||
return PushDownMinMaxThroughJoin.pushMinMaxSum(agg, agg.child(), ImmutableList.of());
|
||||
})
|
||||
.toRule(RuleType.PUSH_DOWN_SUM_THROUGH_JOIN),
|
||||
logicalAggregate(logicalProject(innerLogicalJoin()))
|
||||
.when(agg -> agg.child().isAllSlots())
|
||||
.when(agg -> agg.child().child().getOtherJoinConjuncts().isEmpty())
|
||||
.whenNot(agg -> agg.child().children().stream().anyMatch(p -> p instanceof LogicalAggregate))
|
||||
.when(agg -> {
|
||||
Set<AggregateFunction> funcs = agg.getAggregateFunctions();
|
||||
return !funcs.isEmpty() && funcs.stream()
|
||||
.allMatch(f -> f instanceof Sum && !f.isDistinct() && f.child(0) instanceof Slot);
|
||||
})
|
||||
.thenApply(ctx -> {
|
||||
Set<Integer> enableNereidsRules = ctx.cascadesContext.getConnectContext()
|
||||
.getSessionVariable().getEnableNereidsRules();
|
||||
if (!enableNereidsRules.contains(RuleType.PUSH_DOWN_SUM_THROUGH_JOIN_ONE_SIDE.type())) {
|
||||
return null;
|
||||
}
|
||||
LogicalAggregate<LogicalProject<LogicalJoin<Plan, Plan>>> agg = ctx.root;
|
||||
return PushDownMinMaxThroughJoin.pushMinMaxSum(agg, agg.child().child(),
|
||||
agg.child().getProjects());
|
||||
})
|
||||
.toRule(RuleType.PUSH_DOWN_SUM_THROUGH_JOIN)
|
||||
);
|
||||
}
|
||||
}
|
||||
Reference in New Issue
Block a user