NDVToHll.java
// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied. See the License for the
// specific language governing permissions and limitations
// under the License.
package org.apache.doris.rewrite.mvrewrite;
import org.apache.doris.analysis.Analyzer;
import org.apache.doris.analysis.CreateMaterializedViewStmt;
import org.apache.doris.analysis.Expr;
import org.apache.doris.analysis.FunctionCallExpr;
import org.apache.doris.analysis.SlotRef;
import org.apache.doris.analysis.TableName;
import org.apache.doris.catalog.AggregateType;
import org.apache.doris.catalog.Column;
import org.apache.doris.catalog.FunctionSet;
import org.apache.doris.catalog.OlapTable;
import org.apache.doris.catalog.TableIf;
import org.apache.doris.common.AnalysisException;
import org.apache.doris.rewrite.ExprRewriteRule;
import org.apache.doris.rewrite.ExprRewriter;
import com.google.common.base.Preconditions;
import com.google.common.collect.Lists;
import java.util.List;
/**
* For duplicate table, the ndv(k1) could be rewritten to hll_union_agg(mv_hll_union_k1) when hll
* mv exists.
* For example:
* Table: (k1 int, k2 int)
* MV: (k1 int, mv_hll_union_k2 hll hll_union)
* mv_hll_union_k2 = hll_hash(k2)
* Query: select k1, ndv(k2) from table group by k1
* or select k1, approx_count_distinct(k2) from table group by k1
* Rewritten query: select k1, hll_union_agg(mv_hll_union_k2) from table group by k1
*/
public class NDVToHll implements ExprRewriteRule {
public static final ExprRewriteRule INSTANCE = new NDVToHll();
@Override
public Expr apply(Expr expr, Analyzer analyzer, ExprRewriter.ClauseType clauseType) throws AnalysisException {
// meet condition
if (!(expr instanceof FunctionCallExpr)) {
return expr;
}
FunctionCallExpr fnExpr = (FunctionCallExpr) expr;
if (!fnExpr.getFnName().getFunction().equalsIgnoreCase("ndv")
&& !fnExpr.getFnName().getFunction().equalsIgnoreCase("approx_count_distinct")) {
return expr;
}
if (fnExpr.getChildren().size() != 1 || !(fnExpr.getChild(0) instanceof SlotRef)) {
return expr;
}
SlotRef fnChild0 = (SlotRef) fnExpr.getChild(0);
Column column = fnChild0.getColumn();
TableIf table = fnChild0.getTable();
if (column == null || table == null || !(table instanceof OlapTable)) {
return expr;
}
OlapTable olapTable = (OlapTable) table;
// check column
String queryColumnName = column.getName();
String mvColumnName = CreateMaterializedViewStmt
.mvColumnBuilder(AggregateType.HLL_UNION.name().toLowerCase(), queryColumnName);
Column mvColumn = olapTable.getVisibleColumn(mvColumnName);
if (mvColumn == null) {
return expr;
}
// rewrite expr
return rewriteExpr(fnChild0, mvColumn, analyzer);
}
private Expr rewriteExpr(SlotRef queryColumnSlotRef, Column mvColumn, Analyzer analyzer) {
Preconditions.checkNotNull(mvColumn);
Preconditions.checkNotNull(queryColumnSlotRef);
TableName tableName = queryColumnSlotRef.getTableName();
Preconditions.checkNotNull(tableName);
SlotRef mvSlotRef = new SlotRef(tableName, mvColumn.getName());
List<Expr> newFnParams = Lists.newArrayList();
newFnParams.add(mvSlotRef);
FunctionCallExpr result = new FunctionCallExpr(FunctionSet.HLL_UNION_AGG, newFnParams);
result.analyzeNoThrow(analyzer);
return result;
}
}