This is an automated email from the ASF dual-hosted git repository.
dataroaring pushed a commit to branch branch-3.0
in repository https://gitbox.apache.org/repos/asf/doris.git
The following commit(s) were added to refs/heads/branch-3.0 by this push:
new 7f62e9c6190 branch-3.0: [fix](mv) Fix use sync mv wrongly when use rbo
materialized view rewrite rule #47650 (#47834)
7f62e9c6190 is described below
commit 7f62e9c6190ec272db61110b2060db35b7d5deb4
Author: github-actions[bot]
<41898282+github-actions[bot]@users.noreply.github.com>
AuthorDate: Mon Feb 24 17:32:46 2025 +0800
branch-3.0: [fix](mv) Fix use sync mv wrongly when use rbo materialized
view rewrite rule #47650 (#47834)
Cherry-picked from #47650
Co-authored-by: seawinde <[email protected]>
---
.../mv/SelectMaterializedIndexWithAggregate.java | 16 +++++-
.../agg_use_key_direct/agg_use_key_direct.out | Bin 0 -> 210 bytes
.../agg_use_key_direct/agg_use_key_direct.groovy | 63 +++++++++++++++++++++
3 files changed, 76 insertions(+), 3 deletions(-)
diff --git
a/fe/fe-core/src/main/java/org/apache/doris/nereids/rules/rewrite/mv/SelectMaterializedIndexWithAggregate.java
b/fe/fe-core/src/main/java/org/apache/doris/nereids/rules/rewrite/mv/SelectMaterializedIndexWithAggregate.java
index fa03165b37c..42f3f8dbe40 100644
---
a/fe/fe-core/src/main/java/org/apache/doris/nereids/rules/rewrite/mv/SelectMaterializedIndexWithAggregate.java
+++
b/fe/fe-core/src/main/java/org/apache/doris/nereids/rules/rewrite/mv/SelectMaterializedIndexWithAggregate.java
@@ -42,6 +42,7 @@ import
org.apache.doris.nereids.trees.expressions.SlotNotFromChildren;
import org.apache.doris.nereids.trees.expressions.VirtualSlotReference;
import org.apache.doris.nereids.trees.expressions.WhenClause;
import
org.apache.doris.nereids.trees.expressions.functions.agg.AggregateFunction;
+import org.apache.doris.nereids.trees.expressions.functions.agg.Avg;
import org.apache.doris.nereids.trees.expressions.functions.agg.BitmapUnion;
import
org.apache.doris.nereids.trees.expressions.functions.agg.BitmapUnionCount;
import org.apache.doris.nereids.trees.expressions.functions.agg.Count;
@@ -859,7 +860,8 @@ public class SelectMaterializedIndexWithAggregate extends
AbstractSelectMaterial
matchingAggType,
normalizeName(aggFunc.child(0).toSql())));
boolean contains = containsAllColumn(aggFunc.child(0),
ctx.keyNameToColumn.keySet());
- if (contains ||
ctx.keyNameToColumn.containsKey(childNameWithFuncName)) {
+ if ((contains ||
ctx.keyNameToColumn.containsKey(childNameWithFuncName))
+ && checkWhenUseKey(aggFunc, matchingAggType)) {
if (canUseKeyColumn || ctx.isDupKeysOrMergeOnWrite ||
(!ctx.isBaseIndex() && contains)) {
return PreAggStatus.on();
} else {
@@ -943,8 +945,7 @@ public class SelectMaterializedIndexWithAggregate extends
AbstractSelectMaterial
returnExp.toSql(), matchingAggType));
}
if (ctx.keyNameToColumn.containsKey(exprName)) {
- if (matchingAggType != AggregateType.MAX &&
matchingAggType != AggregateType.MIN
- && (aggFunc instanceof Count &&
!aggFunc.isDistinct())) {
+ if (!checkWhenUseKey(aggFunc, matchingAggType)) {
return PreAggStatus.off("agg on key column should be
MAX, MIN or COUNT DISTINCT.");
}
}
@@ -981,6 +982,15 @@ public class SelectMaterializedIndexWithAggregate extends
AbstractSelectMaterial
}
}
+ // agg on key column should be MAX, MIN, COUNT DISTINCT, SUM DISTINCT, AVG
DISTINCT. return true if valid
+ private static boolean checkWhenUseKey(AggregateFunction aggFunc,
AggregateType matchingAggType) { // returns true when the aggregate is one of the forms allowed on a key column
+ return matchingAggType == AggregateType.MAX // MAX and MIN are accepted regardless of DISTINCT
+ || matchingAggType == AggregateType.MIN
+ || (aggFunc instanceof Sum && aggFunc.isDistinct()) // SUM, COUNT and AVG are accepted only with DISTINCT
+ || (aggFunc instanceof Count && aggFunc.isDistinct())
+ || (aggFunc instanceof Avg && aggFunc.isDistinct());
+ }
+
private static class CheckContext {
public final LogicalOlapScan scan;
diff --git
a/regression-test/data/mv_p0/agg_use_key_direct/agg_use_key_direct.out
b/regression-test/data/mv_p0/agg_use_key_direct/agg_use_key_direct.out
new file mode 100644
index 00000000000..92d3a082eb1
Binary files /dev/null and
b/regression-test/data/mv_p0/agg_use_key_direct/agg_use_key_direct.out differ
diff --git
a/regression-test/suites/mv_p0/agg_use_key_direct/agg_use_key_direct.groovy
b/regression-test/suites/mv_p0/agg_use_key_direct/agg_use_key_direct.groovy
new file mode 100644
index 00000000000..855ea157f88
--- /dev/null
+++ b/regression-test/suites/mv_p0/agg_use_key_direct/agg_use_key_direct.groovy
@@ -0,0 +1,63 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements. See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership. The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License. You may obtain a copy of the License at
+//
+// http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied. See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+suite ("agg_use_key_direct") { // checks which aggregates over key columns k1/k3 are rewritten to the sync MV "common_mv"
+
+ String db = context.config.getDbNameByFile(context.file)
+
+ def tblName = "agg_use_key_direct"
+
+ sql "drop table if exists ${tblName} force;"
+ sql """
+ create table ${tblName} (
+ k1 int null,
+ k2 int not null,
+ k3 bigint null,
+ k4 bigint null,
+ k5 varchar(100) null
+ )
+ duplicate key (k1, k2, k3)
+ distributed by hash(k1) buckets 3
+ properties("replication_num" = "1");
+ """
+ sql "insert into ${tblName} select e1, -4, -4, -4, 'd' from (select 1 k1)
as t lateral view explode_numbers(100) tmp1 as e1;"
+ create_sync_mv(db, tblName, "common_mv", """select k1, k3, sum(k2),
count(k4) from ${tblName} group by k1, k3;""")
+
+ if (enable_sync_mv_cost_based_rewrite()) { // when the helper returns true, switch the session variable off; presumably so the rule-based rewrite is the path under test
+ sql """set enable_sync_mv_cost_based_rewrite = false;"""
+ }
+
+ mv_rewrite_fail("""select count(k1) from agg_use_key_direct""",
"common_mv") // this and the next two: non-DISTINCT COUNT/SUM/AVG on a key column, expected (per helper name) not to use common_mv
+ mv_rewrite_fail("""select sum(k1) from agg_use_key_direct""", "common_mv")
+ mv_rewrite_fail("""select avg(k3) from agg_use_key_direct""", "common_mv")
+
+
+ mv_rewrite_success("""select count(distinct k1) from
agg_use_key_direct""", "common_mv") // from here on: DISTINCT or MAX/MIN aggregates on key columns, expected to use common_mv
+ order_qt_select_count """select count(distinct k1) from
agg_use_key_direct"""
+
+ mv_rewrite_success("""select sum(distinct k1) from agg_use_key_direct""",
"common_mv")
+ order_qt_select_sum """select sum(distinct k1) from agg_use_key_direct"""
+
+ mv_rewrite_success("""select max(distinct k3) from agg_use_key_direct""",
"common_mv")
+ order_qt_select_max """select max(distinct k3) from agg_use_key_direct"""
+
+ mv_rewrite_success("""select min(distinct k3) from agg_use_key_direct""",
"common_mv")
+ order_qt_select_min """select min(distinct k3) from agg_use_key_direct"""
+
+ mv_rewrite_success("""select avg(distinct k3) from agg_use_key_direct""",
"common_mv")
+ order_qt_select_avg """select min(distinct k3) from agg_use_key_direct""" // NOTE(review): tagged select_avg but runs min(distinct k3), so the AVG DISTINCT result is never checked; avg(distinct k3) was probably intended — changing it requires regenerating the .out file
+}
---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]