zhiqiang-hhhh commented on code in PR #32746: URL: https://github.com/apache/doris/pull/32746#discussion_r1546252400
########## be/src/vec/functions/round.h: ########## @@ -446,6 +479,179 @@ struct Dispatcher { return nullptr; } } + + // NOTE: This function is only tested for truncate + // DO NOT USE THIS METHOD FOR OTHER ROUNDING BASED FUNCTION UNTIL YOU KNOW EXACTLY WHAT YOU ARE DOING !!! + static ColumnPtr apply_vec_vec(const IColumn* col_general, const IColumn* col_scale) { + if constexpr (rounding_mode != RoundingMode::Trunc) { + throw doris::Exception(ErrorCode::INVALID_ARGUMENT, + "Using column as scale is only supported for function truncate"); + } + + const ColumnInt32& col_scale_i32 = assert_cast<const ColumnInt32&>(*col_scale); + const size_t input_row_count = col_scale_i32.size(); + for (size_t i = 0; i < input_row_count; ++i) { + const Int32 scale_arg = col_scale_i32.get_data()[i]; + if (scale_arg > std::numeric_limits<Int16>::max() || + scale_arg < std::numeric_limits<Int16>::min()) { + throw doris::Exception(ErrorCode::OUT_OF_BOUND, + "Scale argument for function is out of bound: {}", + scale_arg); + } + } + + if constexpr (IsNumber<T>) { + const auto* col = assert_cast<const ColumnVector<T>*>(col_general); + auto col_res = ColumnVector<T>::create(); + typename ColumnVector<T>::Container& vec_res = col_res->get_data(); + vec_res.resize(input_row_count); + + for (size_t i = 0; i < input_row_count; ++i) { + const Int32 scale_arg = col_scale_i32.get_data()[i]; + if (scale_arg == 0) { + size_t scale = 1; + FunctionRoundingImpl<ScaleMode::Zero>::apply(col->get_data()[i], scale, + vec_res[i]); + } else if (scale_arg > 0) { + size_t scale = int_exp10(scale_arg); + FunctionRoundingImpl<ScaleMode::Positive>::apply(col->get_data()[i], scale, + vec_res[i]); + } else { + size_t scale = int_exp10(-scale_arg); + FunctionRoundingImpl<ScaleMode::Negative>::apply(col->get_data()[i], scale, + vec_res[i]); + } + } + return col_res; + } else if constexpr (IsDecimalNumber<T>) { + const auto* decimal_col = assert_cast<const ColumnDecimal<T>*>(col_general); + + // For truncate, ALWAYS 
use SAME scale with source Decimal column + const Int32 input_scale = decimal_col->get_scale(); + auto col_res = ColumnDecimal<T>::create(input_row_count, input_scale); + + for (size_t i = 0; i < input_row_count; ++i) { + DecimalRoundingImpl<T, rounding_mode, tie_breaking_mode>::apply( + decimal_col->get_element(i).value, input_scale, + col_res->get_element(i).value, col_scale_i32.get_data()[i]); + } + + for (size_t i = 0; i < input_row_count; ++i) { + // For truncate(ColumnDecimal, ColumnInt32), we should always have same scale with source Decimal column + // So we need this check to make sure the result have correct digits count + // + // Case 0: scale_arg <= -(integer part digits count) + // do nothing, because result is 0 + // Case 1: scale_arg <= 0 && scale_arg > -(integer part digits count) + // decimal parts has been erased, so add them back by multiply 10^(scale_arg) + // Case 2: scale_arg > 0 && scale_arg < decimal part digits count + // decimal part now has scale_arg digits, so multiply 10^(input_scale - scal_arg) + // Case 3: scale_arg >= input_scale + // do nothing + const Int32 scale_arg = col_scale_i32.get_data()[i]; + if (scale_arg <= 0) { + col_res->get_element(i).value *= int_exp10(input_scale); + } else if (scale_arg > 0 && scale_arg < input_scale) { + col_res->get_element(i).value *= int_exp10(input_scale - scale_arg); + } + } + + return col_res; + } else { + LOG(FATAL) << "__builtin_unreachable"; + __builtin_unreachable(); + return nullptr; + } + } + + // NOTE: This function is only tested for truncate + // DO NOT USE THIS METHOD FOR OTHER ROUNDING BASED FUNCTION UNTIL YOU KNOW EXACTLY WHAT YOU ARE DOING !!! 
only test for truncate + static ColumnPtr apply_const_vec(const ColumnConst* const_col_general, + const IColumn* col_scale) { + if constexpr (rounding_mode != RoundingMode::Trunc) { + throw doris::Exception(ErrorCode::INVALID_ARGUMENT, + "Using column as scale is only supported for function truncate"); + } + + const ColumnInt32& col_scale_i32 = assert_cast<const ColumnInt32&>(*col_scale); + const size_t input_rows_count = col_scale->size(); + + for (size_t i = 0; i < input_rows_count; ++i) { + const Int32 scale_arg = col_scale_i32.get_data()[i]; + + if (scale_arg > std::numeric_limits<Int16>::max() || + scale_arg < std::numeric_limits<Int16>::min()) { + throw doris::Exception(ErrorCode::OUT_OF_BOUND, Review Comment: Update: actually, this loop is separate from the loop that processes the data block, so the exception will not break auto-vectorization. -- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. To unsubscribe, e-mail: commits-unsubscr...@doris.apache.org For queries about this service, please contact Infrastructure at: us...@infra.apache.org --------------------------------------------------------------------- To unsubscribe, e-mail: commits-unsubscr...@doris.apache.org For additional commands, e-mail: commits-h...@doris.apache.org