This is an automated email from the ASF dual-hosted git repository.
lzljs3620320 pushed a commit to branch master
in repository https://gitbox.apache.org/repos/asf/paimon.git
The following commit(s) were added to refs/heads/master by this push:
new 5237031406 [core][spark] Introduce lower transform (#7134)
5237031406 is described below
commit 52370314068db0eed6a8332b32bb8c326990ad32
Author: xuzifu666 <[email protected]>
AuthorDate: Tue Jan 27 19:45:33 2026 +0800
[core][spark] Introduce lower transform (#7134)
---
.../apache/paimon/predicate/LowerTransform.java | 65 ++++++++++++++++++++++
.../org/apache/paimon/predicate/Transform.java | 3 +-
.../paimon/predicate/LowerTransformTest.java | 60 ++++++++++++++++++++
.../paimon/predicate/PredicateJsonSerdeTest.java | 10 ++++
.../spark/util/SparkExpressionConverter.scala | 2 +
.../paimon/spark/sql/PaimonPushDownTestBase.scala | 30 ++++++++++
6 files changed, 169 insertions(+), 1 deletion(-)
diff --git
a/paimon-common/src/main/java/org/apache/paimon/predicate/LowerTransform.java
b/paimon-common/src/main/java/org/apache/paimon/predicate/LowerTransform.java
new file mode 100644
index 0000000000..0565cb9215
--- /dev/null
+++
b/paimon-common/src/main/java/org/apache/paimon/predicate/LowerTransform.java
@@ -0,0 +1,65 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.paimon.predicate;
+
+import org.apache.paimon.data.BinaryString;
+
+import
org.apache.paimon.shade.jackson2.com.fasterxml.jackson.annotation.JsonCreator;
+import
org.apache.paimon.shade.jackson2.com.fasterxml.jackson.annotation.JsonProperty;
+import
org.apache.paimon.shade.jackson2.com.fasterxml.jackson.databind.annotation.JsonDeserialize;
+
+import java.util.List;
+
+import static org.apache.paimon.utils.Preconditions.checkArgument;
+
+/** Lower {@link Transform}. */
+public class LowerTransform extends StringTransform {
+
+ private static final long serialVersionUID = 1L;
+
+ public static final String NAME = "LOWER";
+
+ @JsonCreator
+ public LowerTransform(
+ @JsonProperty(StringTransform.FIELD_INPUTS)
+ @JsonDeserialize(contentUsing =
StringTransform.InputDeserializer.class)
+ List<Object> inputs) {
+ super(inputs);
+ checkArgument(inputs.size() == 1);
+ }
+
+ @Override
+ public String name() {
+ return NAME;
+ }
+
+ @Override
+ public BinaryString transform(List<BinaryString> inputs) {
+ BinaryString string = inputs.get(0);
+ if (string == null) {
+ return null;
+ }
+ return string.toLowerCase();
+ }
+
+ @Override
+ public Transform copyWithNewInputs(List<Object> inputs) {
+ return new LowerTransform(inputs);
+ }
+}
diff --git
a/paimon-common/src/main/java/org/apache/paimon/predicate/Transform.java
b/paimon-common/src/main/java/org/apache/paimon/predicate/Transform.java
index 79f15699b5..199e1df170 100644
--- a/paimon-common/src/main/java/org/apache/paimon/predicate/Transform.java
+++ b/paimon-common/src/main/java/org/apache/paimon/predicate/Transform.java
@@ -37,7 +37,8 @@ import java.util.List;
@JsonSubTypes.Type(value = CastTransform.class, name = CastTransform.NAME),
@JsonSubTypes.Type(value = ConcatTransform.class, name =
ConcatTransform.NAME),
@JsonSubTypes.Type(value = ConcatWsTransform.class, name =
ConcatWsTransform.NAME),
- @JsonSubTypes.Type(value = UpperTransform.class, name =
UpperTransform.NAME)
+ @JsonSubTypes.Type(value = UpperTransform.class, name =
UpperTransform.NAME),
+ @JsonSubTypes.Type(value = LowerTransform.class, name =
LowerTransform.NAME)
})
public interface Transform extends Serializable {
diff --git
a/paimon-common/src/test/java/org/apache/paimon/predicate/LowerTransformTest.java
b/paimon-common/src/test/java/org/apache/paimon/predicate/LowerTransformTest.java
new file mode 100644
index 0000000000..a4ef62aa4b
--- /dev/null
+++
b/paimon-common/src/test/java/org/apache/paimon/predicate/LowerTransformTest.java
@@ -0,0 +1,60 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.paimon.predicate;
+
+import org.apache.paimon.data.BinaryString;
+import org.apache.paimon.data.GenericRow;
+
+import org.junit.jupiter.api.Test;
+
+import java.util.ArrayList;
+import java.util.List;
+
+import static org.assertj.core.api.Assertions.assertThat;
+import static org.assertj.core.api.Assertions.assertThatThrownBy;
+
+class LowerTransformTest {
+
+ @Test
+ public void testNullInputs() {
+ List<Object> inputs = new ArrayList<>();
+ inputs.add(null);
+ LowerTransform transform = new LowerTransform(inputs);
+ Object result = transform.transform(GenericRow.of());
+ assertThat(result).isNull();
+ }
+
+ @Test
+ public void testNormalInputs() {
+ List<Object> inputs = new ArrayList<>();
+ inputs.add(BinaryString.fromString("HELLO"));
+ LowerTransform transform = new LowerTransform(inputs);
+ Object result = transform.transform(GenericRow.of());
+ assertThat(result).isEqualTo(BinaryString.fromString("hello"));
+ }
+
+ @Test
+ public void testIllegalInputs() {
+ List<Object> inputs = new ArrayList<>();
+ inputs.add(BinaryString.fromString("HELLO"));
+ inputs.add(BinaryString.fromString("HI"));
+ assertThatThrownBy(() -> new LowerTransform(inputs))
+ .isInstanceOf(IllegalArgumentException.class);
+ }
+}
diff --git
a/paimon-common/src/test/java/org/apache/paimon/predicate/PredicateJsonSerdeTest.java
b/paimon-common/src/test/java/org/apache/paimon/predicate/PredicateJsonSerdeTest.java
index 18bbadb953..475e889c34 100644
---
a/paimon-common/src/test/java/org/apache/paimon/predicate/PredicateJsonSerdeTest.java
+++
b/paimon-common/src/test/java/org/apache/paimon/predicate/PredicateJsonSerdeTest.java
@@ -114,6 +114,16 @@ class PredicateJsonSerdeTest {
.expectJson(
"{\"kind\":\"LEAF\",\"transform\":{\"name\":\"UPPER\",\"inputs\":[{\"index\":2,\"name\":\"f2\",\"type\":\"STRING\"}]},\"function\":\"STARTS_WITH\",\"literals\":[\"ABC\"]}"),
+ // LeafPredicate - LowerTransform
+ TestSpec.forPredicate(
+ builder.startsWith(
+ new LowerTransform(
+ Collections.singletonList(
+ new FieldRef(2, "f2",
DataTypes.STRING()))),
+ BinaryString.fromString("abc")))
+ .expectJson(
+
"{\"kind\":\"LEAF\",\"transform\":{\"name\":\"LOWER\",\"inputs\":[{\"index\":2,\"name\":\"f2\",\"type\":\"STRING\"}]},\"function\":\"STARTS_WITH\",\"literals\":[\"abc\"]}"),
+
// LeafPredicate - ConcatTransform
TestSpec.forPredicate(
builder.contains(
diff --git
a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/util/SparkExpressionConverter.scala
b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/util/SparkExpressionConverter.scala
index 32409544b6..83a75c37dd 100644
---
a/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/util/SparkExpressionConverter.scala
+++
b/paimon-spark/paimon-spark-common/src/main/scala/org/apache/paimon/spark/util/SparkExpressionConverter.scala
@@ -37,6 +37,7 @@ object SparkExpressionConverter {
// Supported general scalar transform names
private val CONCAT = "CONCAT"
private val UPPER = "UPPER"
+ private val LOWER = "LOWER"
/** Convert Spark [[Expression]] to Paimon [[Transform]], return None if not
supported. */
def toPaimonTransform(exp: Expression, rowType: RowType): Option[Transform]
= {
@@ -60,6 +61,7 @@ object SparkExpressionConverter {
s.name() match {
case CONCAT => convertChildren(s.children()).map(i => new
ConcatTransform(i))
case UPPER => convertChildren(s.children()).map(i => new
UpperTransform(i))
+ case LOWER => convertChildren(s.children()).map(i => new
LowerTransform(i))
case _ => None
}
case c: Cast =>
diff --git
a/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonPushDownTestBase.scala
b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonPushDownTestBase.scala
index 715a5642d2..3902e8c4ad 100644
---
a/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonPushDownTestBase.scala
+++
b/paimon-spark/paimon-spark-ut/src/test/scala/org/apache/paimon/spark/sql/PaimonPushDownTestBase.scala
@@ -160,6 +160,36 @@ abstract class PaimonPushDownTestBase extends
PaimonSparkTestBase with AdaptiveS
}
}
+ test(s"Paimon push down: apply LOWER") {
+ // Spark supports pushing down LOWER since Spark 3.4.
+ if (gteqSpark3_4) {
+ withTable("t") {
+ sql("""
+ |CREATE TABLE t (id int, value int, dt STRING)
+ |using paimon
+ |PARTITIONED BY (dt)
+ |""".stripMargin)
+
+ sql("""
+ |INSERT INTO t values
+ |(1, 100, 'hello')
+ |""".stripMargin)
+
+ val q =
+ """
+ |SELECT * FROM t
+ |WHERE LOWER(dt) = 'hello'
+ |""".stripMargin
+ assert(!checkFilterExists(q))
+
+ checkAnswer(
+ spark.sql(q),
+ Seq(Row(1, 100, "hello"))
+ )
+ }
+ }
+ }
+
test(s"Paimon push down: apply CAST") {
if (gteqSpark3_4) {
withSparkSQLConf("spark.sql.ansi.enabled" -> "true") {