xy720 commented on code in PR #20085:
URL: https://github.com/apache/doris/pull/20085#discussion_r1206257498
##########
be/src/vec/functions/array/function_array_intersect.cpp:
##########
@@ -79,8 +76,66 @@ struct IntersectAction {
}
};
-using FunctionArrayIntersect =
- FunctionArrayBinary<ArraySetImpl<SetOperation::INTERSECT>,
NameArrayIntersect>;
+class FunctionArrayIntersect : public IFunction {
+public:
+ static constexpr auto name = "array_intersect";
+ static FunctionPtr create() { return
std::make_shared<FunctionArrayIntersect>(); }
+
+ /// Get function name.
+ String get_name() const override { return name; }
+
+ bool is_variadic() const override { return true; }
+
+ bool use_default_implementation_for_constants() const override { return
true; }
+
+ size_t get_number_of_arguments() const override { return 0; }
+
+ DataTypePtr get_return_type_impl(const DataTypes& arguments) const
override {
+ DCHECK(arguments.size() >= 2)
+ << "function: " << get_name() << ", arguments should not less
than 2";
Review Comment:
```suggestion
<< "function: " << get_name() << ", arguments should not
larger equal than 2";
```
##########
be/src/vec/functions/array/function_array_intersect.cpp:
##########
@@ -79,8 +76,66 @@ struct IntersectAction {
}
};
-using FunctionArrayIntersect =
- FunctionArrayBinary<ArraySetImpl<SetOperation::INTERSECT>,
NameArrayIntersect>;
+class FunctionArrayIntersect : public IFunction {
+public:
+ static constexpr auto name = "array_intersect";
+ static FunctionPtr create() { return
std::make_shared<FunctionArrayIntersect>(); }
+
+ /// Get function name.
+ String get_name() const override { return name; }
+
+ bool is_variadic() const override { return true; }
+
+ bool use_default_implementation_for_constants() const override { return
true; }
+
+ size_t get_number_of_arguments() const override { return 0; }
+
+ DataTypePtr get_return_type_impl(const DataTypes& arguments) const
override {
+ DCHECK(arguments.size() >= 2)
+ << "function: " << get_name() << ", arguments should not less
than 2";
+ for (size_t i = 0; i < arguments.size(); ++i) {
+ DCHECK(is_array(arguments[i])) << i << "-th element is not array
type";
+ const auto* array_type =
check_and_get_data_type<DataTypeArray>(arguments[i].get());
Review Comment:
`is_array(arguments[i])` already checks the data type; why check it again?
##########
be/src/vec/functions/array/function_array_intersect.cpp:
##########
@@ -79,8 +76,66 @@ struct IntersectAction {
}
};
-using FunctionArrayIntersect =
- FunctionArrayBinary<ArraySetImpl<SetOperation::INTERSECT>,
NameArrayIntersect>;
+class FunctionArrayIntersect : public IFunction {
Review Comment:
How about creating a new class FunctionArrayNary, just like
FunctionArrayBinary, but one that accepts n arguments?
##########
be/src/vec/functions/array/function_array_intersect.cpp:
##########
@@ -79,8 +76,66 @@ struct IntersectAction {
}
};
-using FunctionArrayIntersect =
- FunctionArrayBinary<ArraySetImpl<SetOperation::INTERSECT>,
NameArrayIntersect>;
+class FunctionArrayIntersect : public IFunction {
+public:
+ static constexpr auto name = "array_intersect";
+ static FunctionPtr create() { return
std::make_shared<FunctionArrayIntersect>(); }
+
+ /// Get function name.
+ String get_name() const override { return name; }
+
+ bool is_variadic() const override { return true; }
+
+ bool use_default_implementation_for_constants() const override { return
true; }
+
+ size_t get_number_of_arguments() const override { return 0; }
+
+ DataTypePtr get_return_type_impl(const DataTypes& arguments) const
override {
+ DCHECK(arguments.size() >= 2)
+ << "function: " << get_name() << ", arguments should not less
than 2";
+ for (size_t i = 0; i < arguments.size(); ++i) {
+ DCHECK(is_array(arguments[i])) << i << "-th element is not array
type";
+ const auto* array_type =
check_and_get_data_type<DataTypeArray>(arguments[i].get());
+ DCHECK(array_type) << "function: " << get_name() << " " << i + 1
+ << "-th argument is not array";
+ }
+ DataTypePtr res_data_type =
+
ArraySetImpl<SetOperation::INTERSECT>::get_return_type(arguments);
+ return res_data_type;
+ }
+
+ Status execute_impl(FunctionContext* context, Block& block, const
ColumnNumbers& arguments,
+ size_t result, size_t input_rows_count) override {
+ CHECK(arguments.size() >= 2);
+ const auto& [left_column, left_const] =
+ unpack_if_const(block.get_by_position(arguments[0]).column);
+ ColumnPtr res_ptr = left_column;
+ ColumnArrayExecutionData left_data;
+ ColumnArrayExecutionData right_data;
+ for (int i = 1; i < arguments.size(); ++i) {
Review Comment:
You should move this loop into ArraySetImpl to avoid calling
`assemble_column_array` and `extract_column_array_info` too many times.
For example, here is a draft:
```
using ColumnArrayExecutionDatas = std::vector<ColumnArrayExecutionData>;
template <typename Impl, typename Name>
class FunctionArrayNary {
execute_impl(FunctionContext* context, Block& block, const ColumnNumbers&
arguments,
size_t result, size_t input_rows_count) override {
...
Columns cols(arguments.size());
std::unique_ptr<bool[]> col_const =
std::make_unique<bool[]>(arguments.size());
for (int i = 0; i < arguments.size(); ++i) {
std::tie(cols[i], col_const[i]) =
unpack_if_const(block.get_by_position(arguments[i]).column);
extract_column_array_info(*col[i], datas[i]);
}
...
Impl::execute(res_ptr, datas, col_const);
...
}
}
struct ArraySetImpl {
...
static Status execute(ColumnPtr& res_ptr, ColumnArrayExecutionDatas datas,
std::unique_ptr<bool[]> col_const) {
...
ColumnArrayMutableData dst;
dst = create_mutable_data(datas[0].nested_col);
for (int i = 1; i < datas.size(); ++i) {
if (col_const[i - 1]) {
_execute_internal<true, false, ALL_COLUMNS_SIMPLE>(dst,
dst.to_execution_data(), datas[i]);
} else if (col_const[i]) {
_execute_internal<false, true, ALL_COLUMNS_SIMPLE>(dst,
dst.to_execution_data(), datas[i]);
} else {
_execute_internal<false, false, ALL_COLUMNS_SIMPLE>(dst,
dst.to_execution_data(), datas[i]);
}
}
res_ptr = assemble_column_array(dst);
...
}
...
}
```
--
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.
To unsubscribe, e-mail: [email protected]
For queries about this service, please contact Infrastructure at:
[email protected]
---------------------------------------------------------------------
To unsubscribe, e-mail: [email protected]
For additional commands, e-mail: [email protected]