This is an automated email from the ASF dual-hosted git repository.
morrysnow pushed a commit to branch branch-3.1
in repository https://gitbox.apache.org/repos/asf/doris.git
The following commit(s) were added to refs/heads/branch-3.1 by this push:
new 38b23683c76 branch-3.1: [Feature](function) support function
array_flatten #47404 (#59319)
38b23683c76 is described below
commit 38b23683c7604705021731640836e7997dd16a97
Author: github-actions[bot]
<41898282+github-actions[bot]@users.noreply.github.com>
AuthorDate: Fri Dec 26 10:04:16 2025 +0800
branch-3.1: [Feature](function) support function array_flatten #47404
(#59319)
Cherry-picked from #47404
---------
Co-authored-by: Pxl <[email protected]>
---
.../vec/functions/array/function_array_flatten.cpp | 92 ++++++++++++++++++++++
.../functions/array/function_array_register.cpp | 3 +-
.../doris/catalog/BuiltinScalarFunctions.java | 2 +
.../expressions/functions/scalar/ArrayFlatten.java | 67 ++++++++++++++++
.../expressions/visitor/ScalarFunctionVisitor.java | 5 ++
.../nereids_function_p0/scalar_function/Array.out | 30 +++++++
.../array_functions/array_flatten.out | 6 ++
.../scalar_function/Array.groovy | 11 +++
.../array_functions/array_flatten.groovy | 46 +++++++++++
9 files changed, 261 insertions(+), 1 deletion(-)
diff --git a/be/src/vec/functions/array/function_array_flatten.cpp
b/be/src/vec/functions/array/function_array_flatten.cpp
new file mode 100644
index 00000000000..d58a76264dd
--- /dev/null
+++ b/be/src/vec/functions/array/function_array_flatten.cpp
@@ -0,0 +1,92 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements. See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership. The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License. You may obtain a copy of the License at
+//
+// http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied. See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+#include "common/status.h"
+#include "vec/aggregate_functions/aggregate_function.h"
+#include "vec/columns/column.h"
+#include "vec/columns/column_array.h"
+#include "vec/columns/column_nullable.h"
+#include "vec/common/assert_cast.h"
+#include "vec/core/block.h"
+#include "vec/core/column_numbers.h"
+#include "vec/core/column_with_type_and_name.h"
+#include "vec/core/types.h"
+#include "vec/data_types/data_type.h"
+#include "vec/data_types/data_type_array.h"
+#include "vec/functions/function.h"
+#include "vec/functions/simple_function_factory.h"
+
+namespace doris::vectorized {
+#include "common/compile_check_begin.h"
+
+/// Scalar function `array_flatten`: takes one (possibly multi-level) array argument and
+/// produces a single-level array that holds the innermost elements of each row.
+class FunctionArrayFlatten : public IFunction {
+public:
+    static constexpr auto name = "array_flatten";
+    static FunctionPtr create() { return std::make_shared<FunctionArrayFlatten>(); }
+
+    /// Get function name.
+    String get_name() const override { return name; }
+
+    /// The function takes exactly one argument.
+    size_t get_number_of_arguments() const override { return 1; }
+
+    /// Strips array layers from the argument type until a non-array type is left and
+    /// returns Array(Nullable(that type)).
+    DataTypePtr get_return_type_impl(const DataTypes& arguments) const override {
+        DataTypePtr innermost = arguments[0];
+        while (is_array(innermost)) {
+            const auto* array_type = assert_cast<const DataTypeArray*>(innermost.get());
+            innermost = remove_nullable(array_type->get_nested_type());
+        }
+        return std::make_shared<DataTypeArray>(make_nullable(innermost));
+    }
+
+    /// Builds the flattened result for `input_rows_count` rows and stores it at position
+    /// `result` of `block`.
+    ///
+    /// The input columns are only read, so they are accessed through const pointers; the
+    /// only column that is written is the freshly cloned offsets column of the result.
+    Status execute_impl(FunctionContext* context, Block& block, const ColumnNumbers& arguments,
+                        size_t result, size_t input_rows_count) const override {
+        // Expand a const column to a full column before looking at its offsets.
+        const auto src_column =
+                block.get_by_position(arguments[0]).column->convert_to_full_column_if_const();
+        // `src_column` keeps the array column alive for the raw pointers used below.
+        const auto* current_array =
+                assert_cast<const ColumnArray*>(remove_nullable(src_column).get());
+
+        // Start from a private copy of the outermost offsets; it is rewritten in place,
+        // one nesting level at a time, until it addresses the innermost data column.
+        auto result_column_offsets =
+                assert_cast<const ColumnArray::ColumnOffsets&>(current_array->get_offsets_column())
+                        .clone();
+        auto* offsets = assert_cast<ColumnArray::ColumnOffsets*>(result_column_offsets.get())
+                                ->get_data()
+                                .data();
+
+        while (current_array->get_data_ptr()->is_column_array()) {
+            const auto* inner_array = assert_cast<const ColumnArray*>(
+                    remove_nullable(current_array->get_data_ptr()).get());
+            const auto& inner_offsets = inner_array->get_offsets();
+
+            // offsets[i] is the end position of row i counted in inner arrays; map it to
+            // the end position counted in elements of those inner arrays.
+            // NOTE(review): when offsets[i] is 0 the index wraps to -1; this presumably
+            // relies on the offsets container accepting index -1 -- confirm.
+            for (size_t i = 0; i < input_rows_count; ++i) {
+                offsets[i] = inner_offsets[offsets[i] - 1];
+            }
+            current_array = inner_array;
+        }
+
+        // `current_array` is now the innermost array level; its data column is cast to
+        // ColumnNullable and cloned as the element column of the result.
+        block.replace_by_position(
+                result,
+                ColumnArray::create(
+                        assert_cast<const ColumnNullable&>(current_array->get_data()).clone(),
+                        std::move(result_column_offsets)));
+        return Status::OK();
+    }
+};
+
+/// Adds FunctionArrayFlatten to the given function factory.
+void register_function_array_flatten(SimpleFunctionFactory& factory) {
+    factory.register_function<FunctionArrayFlatten>();
+}
+
+} // namespace doris::vectorized
\ No newline at end of file
diff --git a/be/src/vec/functions/array/function_array_register.cpp
b/be/src/vec/functions/array/function_array_register.cpp
index 071c3198189..06b47d6c725 100644
--- a/be/src/vec/functions/array/function_array_register.cpp
+++ b/be/src/vec/functions/array/function_array_register.cpp
@@ -21,7 +21,7 @@
#include "vec/functions/simple_function_factory.h"
namespace doris::vectorized {
-
+void register_function_array_flatten(SimpleFunctionFactory&);
void register_function_array_shuffle(SimpleFunctionFactory&);
void register_function_array_exists(SimpleFunctionFactory&);
void register_function_array_element(SimpleFunctionFactory&);
@@ -59,6 +59,7 @@ void register_function_array_splits(SimpleFunctionFactory&);
void register_function_array_match(SimpleFunctionFactory&);
void register_function_array(SimpleFunctionFactory& factory) {
+ register_function_array_flatten(factory);
register_function_array_shuffle(factory);
register_function_array_exists(factory);
register_function_array_element(factory);
diff --git
a/fe/fe-core/src/main/java/org/apache/doris/catalog/BuiltinScalarFunctions.java
b/fe/fe-core/src/main/java/org/apache/doris/catalog/BuiltinScalarFunctions.java
index fa72b4e832c..4d6cdc8fc38 100644
---
a/fe/fe-core/src/main/java/org/apache/doris/catalog/BuiltinScalarFunctions.java
+++
b/fe/fe-core/src/main/java/org/apache/doris/catalog/BuiltinScalarFunctions.java
@@ -41,6 +41,7 @@ import
org.apache.doris.nereids.trees.expressions.functions.scalar.ArrayExists;
import org.apache.doris.nereids.trees.expressions.functions.scalar.ArrayFilter;
import org.apache.doris.nereids.trees.expressions.functions.scalar.ArrayFirst;
import
org.apache.doris.nereids.trees.expressions.functions.scalar.ArrayFirstIndex;
+import
org.apache.doris.nereids.trees.expressions.functions.scalar.ArrayFlatten;
import
org.apache.doris.nereids.trees.expressions.functions.scalar.ArrayIntersect;
import org.apache.doris.nereids.trees.expressions.functions.scalar.ArrayJoin;
import org.apache.doris.nereids.trees.expressions.functions.scalar.ArrayLast;
@@ -523,6 +524,7 @@ public class BuiltinScalarFunctions implements
FunctionHelper {
scalar(ArrayFilter.class, "array_filter"),
scalar(ArrayFirst.class, "array_first"),
scalar(ArrayFirstIndex.class, "array_first_index"),
+ scalar(ArrayFlatten.class, "array_flatten"),
scalar(ArrayIntersect.class, "array_intersect"),
scalar(ArrayJoin.class, "array_join"),
scalar(ArrayLast.class, "array_last"),
diff --git
a/fe/fe-core/src/main/java/org/apache/doris/nereids/trees/expressions/functions/scalar/ArrayFlatten.java
b/fe/fe-core/src/main/java/org/apache/doris/nereids/trees/expressions/functions/scalar/ArrayFlatten.java
new file mode 100644
index 00000000000..3f340ec01cd
--- /dev/null
+++
b/fe/fe-core/src/main/java/org/apache/doris/nereids/trees/expressions/functions/scalar/ArrayFlatten.java
@@ -0,0 +1,67 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements. See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership. The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License. You may obtain a copy of the License at
+//
+// http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied. See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+package org.apache.doris.nereids.trees.expressions.functions.scalar;
+
+import org.apache.doris.catalog.FunctionSignature;
+import org.apache.doris.nereids.trees.expressions.Expression;
+import org.apache.doris.nereids.trees.expressions.functions.CustomSignature;
+import org.apache.doris.nereids.trees.expressions.functions.PropagateNullable;
+import org.apache.doris.nereids.trees.expressions.visitor.ExpressionVisitor;
+import org.apache.doris.nereids.types.ArrayType;
+import org.apache.doris.nereids.types.DataType;
+
+import com.google.common.base.Preconditions;
+
+import java.util.List;
+
+/**
+ * ScalarFunction 'array_flatten'.
+ *
+ * <p>Takes a single argument. The signature is computed from the argument's own type:
+ * the return type is a one-level array of the innermost non-array item type.
+ */
+public class ArrayFlatten extends ScalarFunction
+        implements CustomSignature, PropagateNullable {
+
+    /**
+     * Constructor with one argument.
+     */
+    public ArrayFlatten(Expression arg) {
+        super("array_flatten", arg);
+    }
+
+    /**
+     * Unwraps every ArrayType layer of the argument type and returns a signature whose
+     * return type is an array of the remaining item type and whose only parameter is the
+     * argument type itself.
+     */
+    @Override
+    public FunctionSignature customSignature() {
+        DataType argumentType = getArgument(0).getDataType();
+        DataType itemType = argumentType;
+        while (itemType instanceof ArrayType) {
+            ArrayType arrayLayer = (ArrayType) itemType;
+            itemType = arrayLayer.getItemType();
+        }
+        return FunctionSignature.ret(ArrayType.of(itemType)).args(argumentType);
+    }
+
+    /**
+     * withChildren: requires exactly one child and builds a new ArrayFlatten from it.
+     */
+    @Override
+    public ArrayFlatten withChildren(List<Expression> children) {
+        Preconditions.checkArgument(children.size() == 1);
+        Expression onlyChild = children.get(0);
+        return new ArrayFlatten(onlyChild);
+    }
+
+    @Override
+    public <R, C> R accept(ExpressionVisitor<R, C> visitor, C context) {
+        return visitor.visitArrayFlatten(this, context);
+    }
+}
diff --git
a/fe/fe-core/src/main/java/org/apache/doris/nereids/trees/expressions/visitor/ScalarFunctionVisitor.java
b/fe/fe-core/src/main/java/org/apache/doris/nereids/trees/expressions/visitor/ScalarFunctionVisitor.java
index dd364b8be75..60e9a0dbb13 100644
---
a/fe/fe-core/src/main/java/org/apache/doris/nereids/trees/expressions/visitor/ScalarFunctionVisitor.java
+++
b/fe/fe-core/src/main/java/org/apache/doris/nereids/trees/expressions/visitor/ScalarFunctionVisitor.java
@@ -42,6 +42,7 @@ import
org.apache.doris.nereids.trees.expressions.functions.scalar.ArrayExcept;
import org.apache.doris.nereids.trees.expressions.functions.scalar.ArrayExists;
import org.apache.doris.nereids.trees.expressions.functions.scalar.ArrayFilter;
import
org.apache.doris.nereids.trees.expressions.functions.scalar.ArrayFirstIndex;
+import
org.apache.doris.nereids.trees.expressions.functions.scalar.ArrayFlatten;
import
org.apache.doris.nereids.trees.expressions.functions.scalar.ArrayIntersect;
import org.apache.doris.nereids.trees.expressions.functions.scalar.ArrayJoin;
import
org.apache.doris.nereids.trees.expressions.functions.scalar.ArrayLastIndex;
@@ -683,6 +684,10 @@ public interface ScalarFunctionVisitor<R, C> {
return visitScalarFunction(arrayShuffle, context);
}
+    // By default array_flatten is handled like any other scalar function.
+    default R visitArrayFlatten(ArrayFlatten arrayFlatten, C context) {
+        return visitScalarFunction(arrayFlatten, context);
+    }
+
default R visitArrayMap(ArrayMap arraySort, C context) {
return visitScalarFunction(arraySort, context);
}
diff --git a/regression-test/data/nereids_function_p0/scalar_function/Array.out
b/regression-test/data/nereids_function_p0/scalar_function/Array.out
index 402a92a394c..e0dbb4e83cc 100644
--- a/regression-test/data/nereids_function_p0/scalar_function/Array.out
+++ b/regression-test/data/nereids_function_p0/scalar_function/Array.out
@@ -16924,3 +16924,33 @@ false false
-- !sql --
false false
+-- !sql --
+[1, 2, 3, 4, 5]
+
+-- !sql --
+[]
+
+-- !sql --
+[1]
+
+-- !sql --
+[1, 2, 3]
+
+-- !sql --
+[1, 2, 3, 4, 5]
+
+-- !sql --
+[null, null]
+
+-- !sql --
+[1, 2, 3, 4, 5]
+
+-- !sql --
+[1, 2, 3, 4, 5]
+
+-- !sql --
+[1, 2, 3, 4, 5, 6, 7, 8, 9]
+
+-- !sql --
+[1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12]
+
diff --git
a/regression-test/data/query_p0/sql_functions/array_functions/array_flatten.out
b/regression-test/data/query_p0/sql_functions/array_functions/array_flatten.out
new file mode 100644
index 00000000000..fa71438783d
--- /dev/null
+++
b/regression-test/data/query_p0/sql_functions/array_functions/array_flatten.out
@@ -0,0 +1,6 @@
+-- This file is automatically generated. You should know what you did if you
want to edit this
+-- !test --
+1 [1, 2, 3] [1, 2, 3] [1, 2, 3] [1, 2, 3] ["a",
"b", "c"]
+2 \N \N [] \N ["b", null]
+3 [1, 2, null] [null] [null, 2] [null, null, 3] [null, "aaaab",
"ccc"]
+
diff --git
a/regression-test/suites/nereids_function_p0/scalar_function/Array.groovy
b/regression-test/suites/nereids_function_p0/scalar_function/Array.groovy
index 8211877bfe2..4eb6fbc6430 100644
--- a/regression-test/suites/nereids_function_p0/scalar_function/Array.groovy
+++ b/regression-test/suites/nereids_function_p0/scalar_function/Array.groovy
@@ -1416,4 +1416,15 @@ suite("nereids_scalar_fn_Array") {
// map_contains_value
qt_sql """ select map_contains_value(map(1,1), 257),
map_contains_value(map(1,2), 258);"""
+ qt_sql """select array_flatten([[1,2,3],[4,5]]);"""
+ qt_sql """select array_flatten([[],[]]);"""
+ qt_sql """select array_flatten([[1],[]]);"""
+ qt_sql """select array_flatten([[1,2,3],null]);"""
+ qt_sql """select array_flatten([[1,2,3],null,[4,5]]);"""
+ qt_sql """select array_flatten([null,null]);"""
+ qt_sql """select array_flatten([[1,2,3,4,5]]);"""
+ qt_sql """select array_flatten([[[1,2,3,4,5]]]);;"""
+ qt_sql """select array_flatten([ [[1,2,3,4,5]],[[6,7],[8,9]] ]);"""
+ qt_sql """select
array_flatten([[[[[[1,2,3,4,5],[6,7],[8,9],[10,11],[12]]]]]]);"""
+
}
diff --git
a/regression-test/suites/query_p0/sql_functions/array_functions/array_flatten.groovy
b/regression-test/suites/query_p0/sql_functions/array_functions/array_flatten.groovy
new file mode 100644
index 00000000000..82d4a39a565
--- /dev/null
+++
b/regression-test/suites/query_p0/sql_functions/array_functions/array_flatten.groovy
@@ -0,0 +1,46 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements. See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership. The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License. You may obtain a copy of the License at
+//
+// http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied. See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+// Regression suite for array_flatten on table columns: recreates t_array_flatten,
+// loads three rows and selects array_flatten over every array column.
+suite("array_flatten") {
+ // Start from a clean table.
+ sql """DROP TABLE IF EXISTS t_array_flatten"""
+ // Columns cover one-, two- and three-level arrays of several element types;
+ // aa3 is the only NOT NULL column.
+ sql """
+ CREATE TABLE IF NOT EXISTS t_array_flatten (
+ `k1` int(11) NULL COMMENT "",
+ `a1` array<tinyint(4)> NULL COMMENT "",
+ `aaa1` array<array<array<tinyint(4)>>> NULL COMMENT "",
+ `aa3` array<array<int(11)>> NOT NULL COMMENT "",
+ `aa5` array<array<largeint(40)>> NULL COMMENT "",
+ `aa14` array<array<string>> NULL COMMENT ""
+
+ ) ENGINE=OLAP
+ DUPLICATE KEY(`k1`)
+ DISTRIBUTED BY HASH(`k1`) BUCKETS 1
+ PROPERTIES (
+ "replication_allocation" = "tag.location.default: 1",
+ "storage_format" = "V2"
+ )
+ """
+ // Row 1: every column holds non-null values only.
+ sql """ INSERT INTO t_array_flatten VALUES(1, [1, 2,
3],[[[1]],[[2],[3]]],[[1,2],[3]],[[1,2],[3]],[['a'],['b','c']]) """
+ // Row 2: NULL columns, an empty array for aa3, and a null inner array in aa14.
+ sql """ INSERT INTO t_array_flatten VALUES(2,
null,null,[],null,[null,['b',null]]) """
+ // Row 3: empty inner arrays mixed with null elements.
+ sql """ INSERT INTO t_array_flatten VALUES(3, [1, 2,
null],[[[]],[[null],[]]],[[null,2],[]],[[null,null],[3]],[[null],['aaaab','ccc']])
"""
+
+
+
+ // Tagged query "test"; the expected rows are recorded under `-- !test --` in
+ // array_flatten.out. Ordered by k1.
+ qt_test """
+ select k1, array_flatten(a1), array_flatten(aaa1), array_flatten(aa3),
array_flatten(aa5), array_flatten(aa14) from t_array_flatten order by k1;
+ """
+}
---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]