[Performance](point query) Optimize partition prune for point query (#28150)

* [Performance](point query) Optimize partition prune for point query
This commit is contained in:
lihangyu
2023-12-19 11:00:13 +08:00
committed by GitHub
parent d17ac99abe
commit 88f0bee722
7 changed files with 343 additions and 1 deletions

View File

@ -28,6 +28,7 @@ import org.apache.doris.analysis.Expr;
import org.apache.doris.analysis.FunctionCallExpr;
import org.apache.doris.analysis.InPredicate;
import org.apache.doris.analysis.IntLiteral;
import org.apache.doris.analysis.LiteralExpr;
import org.apache.doris.analysis.PartitionNames;
import org.apache.doris.analysis.SlotDescriptor;
import org.apache.doris.analysis.SlotId;
@ -199,6 +200,11 @@ public class OlapScanNode extends ScanNode {
private boolean shouldColoScan = false;
// cached for prepared statement to quickly prune partition
// only used in short circuit plan at present
private final PartitionPruneV2ForShortCircuitPlan cachedPartitionPruner =
new PartitionPruneV2ForShortCircuitPlan();
// Constructs node to scan given data files of table 'tbl'.
public OlapScanNode(PlanNodeId id, TupleDescriptor desc, String planNodeName) {
super(id, desc, planNodeName, StatisticalType.OLAP_SCAN_NODE);
@ -674,8 +680,17 @@ public class OlapScanNode extends ScanNode {
} else {
keyItemMap = partitionInfo.getIdToItem(false);
}
if (partitionInfo.getType() == PartitionType.RANGE) {
if (isPointQuery() && partitionInfo.getPartitionColumns().size() == 1) {
// short circuit, a quick path to find partition
ColumnRange filterRange = columnNameToRange.get(partitionInfo.getPartitionColumns().get(0).getName());
LiteralExpr lowerBound = filterRange.getRangeSet().get().asRanges().stream()
.findFirst().get().lowerEndpoint().getValue();
LiteralExpr upperBound = filterRange.getRangeSet().get().asRanges().stream()
.findFirst().get().upperEndpoint().getValue();
cachedPartitionPruner.update(keyItemMap);
return cachedPartitionPruner.prune(lowerBound, upperBound);
}
partitionPruner = new RangePartitionPrunerV2(keyItemMap,
partitionInfo.getPartitionColumns(), columnNameToRange);
} else if (partitionInfo.getType() == PartitionType.LIST) {

View File

@ -0,0 +1,90 @@
// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied. See the License for the
// specific language governing permissions and limitations
// under the License.
package org.apache.doris.planner;
import org.apache.doris.analysis.LiteralExpr;
import org.apache.doris.catalog.Column;
import org.apache.doris.catalog.PartitionItem;
import org.apache.doris.catalog.PartitionKey;
import org.apache.doris.common.AnalysisException;
import com.google.common.collect.Range;
import org.apache.logging.log4j.LogManager;
import org.apache.logging.log4j.Logger;
import java.util.Collection;
import java.util.Map;
import java.util.Map.Entry;
/**
 * Partition pruner used by the short-circuit (point query) plan.
 *
 * <p>Keeps a {@link RangeMap} from each partition's literal range to its partition id so that
 * {@link #prune(LiteralExpr, LiteralExpr)} can look partitions up directly. The map is rebuilt
 * from the supplied partition items by {@link #update(Map)}, at most once per
 * {@link #PARTITION_RANGE_MAP_UPDATE_INTERVAL_MS}.
 *
 * <p>Only the first key of every partition bound is used, so this pruner is only meaningful for
 * tables partitioned by a single column. The generic pruning entry points inherited from
 * {@link PartitionPrunerV2Base} are not supported and throw {@link AnalysisException}.
 */
public class PartitionPruneV2ForShortCircuitPlan extends PartitionPrunerV2Base {
    private static final Logger LOG = LogManager.getLogger(PartitionPruneV2ForShortCircuitPlan.class);
    // minimum interval between two rebuilds of partitionRangeMapByLiteral
    private static final long PARTITION_RANGE_MAP_UPDATE_INTERVAL_MS = 10 * 1000L;

    // map to record literal range to find specific partition
    private RangeMap<LiteralExpr, Long> partitionRangeMapByLiteral = new RangeMap<>();
    // last timestamp partitionRangeMapByLiteral updated
    private long lastPartitionRangeMapUpdateTimestampMs = 0;

    PartitionPruneV2ForShortCircuitPlan() {
        super();
    }

    /**
     * Rebuilds the cached range map from {@code keyItemMap} if the refresh interval has elapsed
     * since the last rebuild; otherwise leaves the cache untouched.
     *
     * @param keyItemMap partition id to partition item; every item's range must have both a
     *                   lower and an upper endpoint
     * @return {@code true} if the cache was rebuilt, {@code false} if it was still fresh
     */
    public boolean update(Map<Long, PartitionItem> keyItemMap) {
        if (System.currentTimeMillis() - lastPartitionRangeMapUpdateTimestampMs
                <= PARTITION_RANGE_MAP_UPDATE_INTERVAL_MS) {
            return false;
        }
        // Build into a local map and publish it only once it is complete, so that a failure
        // half way through the rebuild never leaves a partially filled map in the field.
        RangeMap<LiteralExpr, Long> rebuiltRangeMap = new RangeMap<>();
        for (Entry<Long, PartitionItem> entry : keyItemMap.entrySet()) {
            Range<PartitionKey> range = entry.getValue().getItems();
            // only the first partition column of each bound takes part in the lookup
            LiteralExpr partitionLowerBound = (LiteralExpr) range.lowerEndpoint().getKeys().get(0);
            LiteralExpr partitionUpperBound = (LiteralExpr) range.upperEndpoint().getKeys().get(0);
            Range<LiteralExpr> partitionRange = Range.closedOpen(partitionLowerBound, partitionUpperBound);
            rebuiltRangeMap.put(partitionRange, entry.getKey());
        }
        this.partitionRangeMapByLiteral = rebuiltRangeMap;
        LOG.debug("update partitionRangeMapByLiteral");
        this.lastPartitionRangeMapUpdateTimestampMs = System.currentTimeMillis();
        return true;
    }

    /**
     * Returns the ids of all cached partitions whose range overlaps the closed interval
     * {@code [lowerBound, upperBound]}.
     *
     * @param lowerBound inclusive lower bound of the filter on the partition column
     * @param upperBound inclusive upper bound of the filter on the partition column
     * @return ids of the overlapping partitions, empty if there is none
     */
    public Collection<Long> prune(LiteralExpr lowerBound, LiteralExpr upperBound) throws AnalysisException {
        Range<LiteralExpr> filterRangeValue = Range.closed(lowerBound, upperBound);
        return partitionRangeMapByLiteral.getOverlappingRangeValues(filterRangeValue);
    }

    /** Not supported by this pruner; use {@link #prune(LiteralExpr, LiteralExpr)} instead. */
    @Override
    public Collection<Long> prune() throws AnalysisException {
        throw new AnalysisException("Not implemented");
    }

    /** Intentionally empty: this pruner keeps its own range map built by {@link #update(Map)}. */
    @Override
    void genSingleColumnRangeMap() {
    }

    /** Not supported by this pruner. */
    @Override
    FinalFilters getFinalFilters(ColumnRange columnRange,
            Column column) throws AnalysisException {
        throw new AnalysisException("Not implemented");
    }

    /** Not supported by this pruner. */
    @Override
    Collection<Long> pruneMultipleColumnPartition(Map<Column, FinalFilters> columnToFilters)
            throws AnalysisException {
        throw new AnalysisException("Not implemented");
    }
}

View File

@ -48,6 +48,13 @@ public abstract class PartitionPrunerV2Base implements PartitionPruner {
// currently only used for list partition
private Map.Entry<Long, PartitionItem> defaultPartition;
// No-arg constructor that leaves idToPartitionItem, partitionColumns and columnNameToRange null.
// Only called in PartitionPruneV2ForShortCircuitPlan constructor.
PartitionPrunerV2Base() {
    this.columnNameToRange = null;
    this.partitionColumns = null;
    this.idToPartitionItem = null;
}
public PartitionPrunerV2Base(Map<Long, PartitionItem> idToPartitionItem,
List<Column> partitionColumns,
Map<String, ColumnRange> columnNameToRange) {

View File

@ -0,0 +1,73 @@
// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied. See the License for the
// specific language governing permissions and limitations
// under the License.
package org.apache.doris.planner;
import com.google.common.collect.Range;
import java.util.ArrayList;
import java.util.List;
import java.util.Map;
import java.util.NavigableMap;
import java.util.TreeMap;
import java.util.stream.Collectors;
/**
 * A map from ranges to values whose keys are kept sorted by their lower endpoint.
 *
 * <p>Keys are compared by lower endpoint only, so putting a range whose lower endpoint equals
 * that of an existing key replaces the existing value. Every range stored in or searched for in
 * this map must have a lower endpoint; search ranges must also have an upper endpoint.
 *
 * @param <C> endpoint type of the ranges
 * @param <V> type of the mapped values
 */
public class RangeMap<C extends Comparable<C>, V> {
    private final NavigableMap<Range<C>, V> rangeMap = new TreeMap<>(new LowerEndpointOrder<C>());

    /** Associates {@code value} with {@code range}. */
    public void put(Range<C> range, V value) {
        rangeMap.put(range, value);
    }

    /**
     * Returns the values of the entries found by {@link #getOverlappingRanges(Range)},
     * in ascending order of their range's lower endpoint.
     */
    public List<V> getOverlappingRangeValues(Range<C> searchRange) {
        List<Map.Entry<Range<C>, V>> hits = getOverlappingRanges(searchRange);
        return hits.stream().map(Map.Entry::getValue).collect(Collectors.toList());
    }

    /**
     * Collects entries whose range has a non-empty intersection with {@code searchRange}.
     *
     * <p>The scan starts at the entry with the greatest lower endpoint not above the search
     * range's lower endpoint (or, if there is none, at the first entry above it) and stops at
     * the first entry whose lower endpoint lies beyond the search range's upper endpoint.
     * Entries that sort before the starting entry are never examined.
     */
    public List<Map.Entry<Range<C>, V>> getOverlappingRanges(Range<C> searchRange) {
        List<Map.Entry<Range<C>, V>> hits = new ArrayList<>();

        // Prefer the entry at or just below the search range; fall back to the one just above.
        Map.Entry<Range<C>, V> first = rangeMap.floorEntry(searchRange);
        if (first == null) {
            first = rangeMap.ceilingEntry(searchRange);
        }
        if (first == null) {
            return hits;
        }

        C searchUpper = searchRange.upperEndpoint();
        for (Map.Entry<Range<C>, V> candidate : rangeMap.tailMap(first.getKey(), true).entrySet()) {
            Range<C> candidateRange = candidate.getKey();
            if (candidateRange.lowerEndpoint().compareTo(searchUpper) > 0) {
                // every later key starts even further right, nothing more can overlap
                break;
            }
            if (overlaps(candidateRange, searchRange)) {
                hits.add(candidate);
            }
        }
        return hits;
    }

    // True when the two ranges share at least one value. isConnected must be checked first,
    // because intersection() is only defined for connected ranges.
    private static <T extends Comparable<T>> boolean overlaps(Range<T> left, Range<T> right) {
        if (!left.isConnected(right)) {
            return false;
        }
        return !left.intersection(right).isEmpty();
    }

    // Orders ranges by their lower endpoint only.
    private static class LowerEndpointOrder<C extends Comparable<C>> implements java.util.Comparator<Range<C>> {
        @Override
        public int compare(Range<C> left, Range<C> right) {
            C leftLower = left.lowerEndpoint();
            C rightLower = right.lowerEndpoint();
            return leftLower.compareTo(rightLower);
        }
    }
}

View File

@ -121,6 +121,9 @@ public class PointQueryExec implements CoordInterface {
OlapScanNode planRoot = getPlanRoot();
// compute scan range
List<TScanRangeLocations> locations = planRoot.lazyEvaluateRangeLocations();
if (planRoot.getScanTabletIds().isEmpty()) {
return;
}
Preconditions.checkState(planRoot.getScanTabletIds().size() == 1);
this.tabletID = planRoot.getScanTabletIds().get(0);
@ -167,6 +170,10 @@ public class PointQueryExec implements CoordInterface {
@Override
public RowBatch getNext() throws Exception {
setScanRangeLocations();
// No partition/tablet found, return empty row batch
if (candidateBackends == null || candidateBackends.isEmpty()) {
return new RowBatch();
}
Iterator<Backend> backendIter = candidateBackends.iterator();
RowBatch rowBatch = null;
int tryCount = 0;