Given we no longer want vcond[u]{,_eq} and VEC_COND_EXPR or COND_EXPR with embedded GENERIC comparisons, the whole check_bool_pattern and adjust_bool_stmts machinery is dead. It has been effectively dead since r15-4713-g0942bb85fc5573, and the following patch removes it.
Bootstrapped and tested on x86_64-unknown-linux-gnu. * tree-vect-patterns.cc (check_bool_pattern): Remove. (adjust_bool_pattern_cast): Likewise. (adjust_bool_pattern): Likewise. (sort_after_uid): Likewise. (adjust_bool_stmts): Likewise. (vect_recog_bool_pattern): Remove calls to check_bool_pattern and fold as if it returns false. --- gcc/tree-vect-patterns.cc | 385 ++++---------------------------------- 1 file changed, 34 insertions(+), 351 deletions(-) diff --git a/gcc/tree-vect-patterns.cc b/gcc/tree-vect-patterns.cc index 302101fa6a0..945e7d2dc45 100644 --- a/gcc/tree-vect-patterns.cc +++ b/gcc/tree-vect-patterns.cc @@ -5360,300 +5360,6 @@ vect_recog_mod_var_pattern (vec_info *vinfo, } -/* Helper function of vect_recog_bool_pattern. Called recursively, return - true if bool VAR can and should be optimized that way. Assume it shouldn't - in case it's a result of a comparison which can be directly vectorized into - a vector comparison. Fills in STMTS with all stmts visited during the - walk. */ - -static bool -check_bool_pattern (tree var, vec_info *vinfo, hash_set<gimple *> &stmts) -{ - tree rhs1; - enum tree_code rhs_code; - - stmt_vec_info def_stmt_info = vect_get_internal_def (vinfo, var); - if (!def_stmt_info) - return false; - - gassign *def_stmt = dyn_cast <gassign *> (def_stmt_info->stmt); - if (!def_stmt) - return false; - - if (stmts.contains (def_stmt)) - return true; - - rhs1 = gimple_assign_rhs1 (def_stmt); - rhs_code = gimple_assign_rhs_code (def_stmt); - switch (rhs_code) - { - case SSA_NAME: - if (! check_bool_pattern (rhs1, vinfo, stmts)) - return false; - break; - - CASE_CONVERT: - if (!VECT_SCALAR_BOOLEAN_TYPE_P (TREE_TYPE (rhs1))) - return false; - if (! check_bool_pattern (rhs1, vinfo, stmts)) - return false; - break; - - case BIT_NOT_EXPR: - if (! check_bool_pattern (rhs1, vinfo, stmts)) - return false; - break; - - case BIT_AND_EXPR: - case BIT_IOR_EXPR: - case BIT_XOR_EXPR: - if (! check_bool_pattern (rhs1, vinfo, stmts) - || ! 
check_bool_pattern (gimple_assign_rhs2 (def_stmt), vinfo, stmts)) - return false; - break; - - default: - return false; - } - - bool res = stmts.add (def_stmt); - /* We can't end up recursing when just visiting SSA defs but not PHIs. */ - gcc_assert (!res); - - return true; -} - - -/* Helper function of adjust_bool_pattern. Add a cast to TYPE to a previous - stmt (SSA_NAME_DEF_STMT of VAR) adding a cast to STMT_INFOs - pattern sequence. */ - -static tree -adjust_bool_pattern_cast (vec_info *vinfo, - tree type, tree var, stmt_vec_info stmt_info) -{ - gimple *cast_stmt = gimple_build_assign (vect_recog_temp_ssa_var (type, NULL), - NOP_EXPR, var); - append_pattern_def_seq (vinfo, stmt_info, cast_stmt, - get_vectype_for_scalar_type (vinfo, type)); - return gimple_assign_lhs (cast_stmt); -} - -/* Helper function of vect_recog_bool_pattern. Do the actual transformations. - VAR is an SSA_NAME that should be transformed from bool to a wider integer - type, OUT_TYPE is the desired final integer type of the whole pattern. - STMT_INFO is the info of the pattern root and is where pattern stmts should - be associated with. DEFS is a map of pattern defs. 
*/ - -static void -adjust_bool_pattern (vec_info *vinfo, tree var, tree out_type, - stmt_vec_info stmt_info, hash_map <tree, tree> &defs) -{ - gimple *stmt = SSA_NAME_DEF_STMT (var); - enum tree_code rhs_code, def_rhs_code; - tree itype, cond_expr, rhs1, rhs2, irhs1, irhs2; - location_t loc; - gimple *pattern_stmt, *def_stmt; - tree trueval = NULL_TREE; - - rhs1 = gimple_assign_rhs1 (stmt); - rhs2 = gimple_assign_rhs2 (stmt); - rhs_code = gimple_assign_rhs_code (stmt); - loc = gimple_location (stmt); - switch (rhs_code) - { - case SSA_NAME: - CASE_CONVERT: - irhs1 = *defs.get (rhs1); - itype = TREE_TYPE (irhs1); - pattern_stmt - = gimple_build_assign (vect_recog_temp_ssa_var (itype, NULL), - SSA_NAME, irhs1); - break; - - case BIT_NOT_EXPR: - irhs1 = *defs.get (rhs1); - itype = TREE_TYPE (irhs1); - pattern_stmt - = gimple_build_assign (vect_recog_temp_ssa_var (itype, NULL), - BIT_XOR_EXPR, irhs1, build_int_cst (itype, 1)); - break; - - case BIT_AND_EXPR: - /* Try to optimize x = y & (a < b ? 1 : 0); into - x = (a < b ? y : 0); - - E.g. for: - bool a_b, b_b, c_b; - TYPE d_T; - - S1 a_b = x1 CMP1 y1; - S2 b_b = x2 CMP2 y2; - S3 c_b = a_b & b_b; - S4 d_T = (TYPE) c_b; - - we would normally emit: - - S1' a_T = x1 CMP1 y1 ? 1 : 0; - S2' b_T = x2 CMP2 y2 ? 1 : 0; - S3' c_T = a_T & b_T; - S4' d_T = c_T; - - but we can save one stmt by using the - result of one of the COND_EXPRs in the other COND_EXPR and leave - BIT_AND_EXPR stmt out: - - S1' a_T = x1 CMP1 y1 ? 1 : 0; - S3' c_T = x2 CMP2 y2 ? a_T : 0; - S4' f_T = c_T; - - At least when VEC_COND_EXPR is implemented using masks - cond ? 1 : 0 is as expensive as cond ? var : 0, in both cases it - computes the comparison masks and ands it, in one case with - all ones vector, in the other case with a vector register. - Don't do this for BIT_IOR_EXPR, because cond ? 1 : var; is - often more expensive. 
*/ - def_stmt = SSA_NAME_DEF_STMT (rhs2); - def_rhs_code = gimple_assign_rhs_code (def_stmt); - if (TREE_CODE_CLASS (def_rhs_code) == tcc_comparison) - { - irhs1 = *defs.get (rhs1); - tree def_rhs1 = gimple_assign_rhs1 (def_stmt); - if (TYPE_PRECISION (TREE_TYPE (irhs1)) - == GET_MODE_BITSIZE (SCALAR_TYPE_MODE (TREE_TYPE (def_rhs1)))) - { - rhs_code = def_rhs_code; - rhs1 = def_rhs1; - rhs2 = gimple_assign_rhs2 (def_stmt); - trueval = irhs1; - goto do_compare; - } - else - irhs2 = *defs.get (rhs2); - goto and_ior_xor; - } - def_stmt = SSA_NAME_DEF_STMT (rhs1); - def_rhs_code = gimple_assign_rhs_code (def_stmt); - if (TREE_CODE_CLASS (def_rhs_code) == tcc_comparison) - { - irhs2 = *defs.get (rhs2); - tree def_rhs1 = gimple_assign_rhs1 (def_stmt); - if (TYPE_PRECISION (TREE_TYPE (irhs2)) - == GET_MODE_BITSIZE (SCALAR_TYPE_MODE (TREE_TYPE (def_rhs1)))) - { - rhs_code = def_rhs_code; - rhs1 = def_rhs1; - rhs2 = gimple_assign_rhs2 (def_stmt); - trueval = irhs2; - goto do_compare; - } - else - irhs1 = *defs.get (rhs1); - goto and_ior_xor; - } - /* FALLTHRU */ - case BIT_IOR_EXPR: - case BIT_XOR_EXPR: - irhs1 = *defs.get (rhs1); - irhs2 = *defs.get (rhs2); - and_ior_xor: - if (TYPE_PRECISION (TREE_TYPE (irhs1)) - != TYPE_PRECISION (TREE_TYPE (irhs2))) - { - int prec1 = TYPE_PRECISION (TREE_TYPE (irhs1)); - int prec2 = TYPE_PRECISION (TREE_TYPE (irhs2)); - int out_prec = TYPE_PRECISION (out_type); - if (absu_hwi (out_prec - prec1) < absu_hwi (out_prec - prec2)) - irhs2 = adjust_bool_pattern_cast (vinfo, TREE_TYPE (irhs1), irhs2, - stmt_info); - else if (absu_hwi (out_prec - prec1) > absu_hwi (out_prec - prec2)) - irhs1 = adjust_bool_pattern_cast (vinfo, TREE_TYPE (irhs2), irhs1, - stmt_info); - else - { - irhs1 = adjust_bool_pattern_cast (vinfo, - out_type, irhs1, stmt_info); - irhs2 = adjust_bool_pattern_cast (vinfo, - out_type, irhs2, stmt_info); - } - } - itype = TREE_TYPE (irhs1); - pattern_stmt - = gimple_build_assign (vect_recog_temp_ssa_var (itype, NULL), - 
rhs_code, irhs1, irhs2); - break; - - default: - do_compare: - gcc_assert (TREE_CODE_CLASS (rhs_code) == tcc_comparison); - if (TREE_CODE (TREE_TYPE (rhs1)) != INTEGER_TYPE - || !TYPE_UNSIGNED (TREE_TYPE (rhs1)) - || maybe_ne (TYPE_PRECISION (TREE_TYPE (rhs1)), - GET_MODE_BITSIZE (TYPE_MODE (TREE_TYPE (rhs1))))) - { - scalar_mode mode = SCALAR_TYPE_MODE (TREE_TYPE (rhs1)); - itype - = build_nonstandard_integer_type (GET_MODE_BITSIZE (mode), 1); - } - else - itype = TREE_TYPE (rhs1); - cond_expr = build2_loc (loc, rhs_code, itype, rhs1, rhs2); - if (trueval == NULL_TREE) - trueval = build_int_cst (itype, 1); - else - gcc_checking_assert (useless_type_conversion_p (itype, - TREE_TYPE (trueval))); - pattern_stmt - = gimple_build_assign (vect_recog_temp_ssa_var (itype, NULL), - COND_EXPR, cond_expr, trueval, - build_int_cst (itype, 0)); - break; - } - - gimple_set_location (pattern_stmt, loc); - append_pattern_def_seq (vinfo, stmt_info, pattern_stmt, - get_vectype_for_scalar_type (vinfo, itype)); - defs.put (var, gimple_assign_lhs (pattern_stmt)); -} - -/* Comparison function to qsort a vector of gimple stmts after UID. */ - -static int -sort_after_uid (const void *p1, const void *p2) -{ - const gimple *stmt1 = *(const gimple * const *)p1; - const gimple *stmt2 = *(const gimple * const *)p2; - return gimple_uid (stmt1) - gimple_uid (stmt2); -} - -/* Create pattern stmts for all stmts participating in the bool pattern - specified by BOOL_STMT_SET and its root STMT_INFO with the desired type - OUT_TYPE. Return the def of the pattern root. */ - -static tree -adjust_bool_stmts (vec_info *vinfo, hash_set <gimple *> &bool_stmt_set, - tree out_type, stmt_vec_info stmt_info) -{ - /* Gather original stmts in the bool pattern in their order of appearance - in the IL. 
*/ - auto_vec<gimple *> bool_stmts (bool_stmt_set.elements ()); - for (hash_set <gimple *>::iterator i = bool_stmt_set.begin (); - i != bool_stmt_set.end (); ++i) - bool_stmts.quick_push (*i); - bool_stmts.qsort (sort_after_uid); - - /* Now process them in that order, producing pattern stmts. */ - hash_map <tree, tree> defs; - for (unsigned i = 0; i < bool_stmts.length (); ++i) - adjust_bool_pattern (vinfo, gimple_assign_lhs (bool_stmts[i]), - out_type, stmt_info, defs); - - /* Pop the last pattern seq stmt and install it as pattern root for STMT. */ - gimple *pattern_stmt - = gimple_seq_last_stmt (STMT_VINFO_PATTERN_DEF_SEQ (stmt_info)); - return gimple_assign_lhs (pattern_stmt); -} - /* Return the proper type for converting bool VAR into an integer value or NULL_TREE if no such type exists. The type is chosen so that the converted value has the @@ -5823,47 +5529,32 @@ vect_recog_bool_pattern (vec_info *vinfo, return NULL; vectype = get_vectype_for_scalar_type (vinfo, TREE_TYPE (lhs)); - if (check_bool_pattern (var, vinfo, bool_stmts)) - { - rhs = adjust_bool_stmts (vinfo, bool_stmts, - TREE_TYPE (lhs), stmt_vinfo); - lhs = vect_recog_temp_ssa_var (TREE_TYPE (lhs), NULL); - if (useless_type_conversion_p (TREE_TYPE (lhs), TREE_TYPE (rhs))) - pattern_stmt = gimple_build_assign (lhs, SSA_NAME, rhs); - else - pattern_stmt - = gimple_build_assign (lhs, NOP_EXPR, rhs); - } - else - { - tree type = integer_type_for_mask (var, vinfo); - tree cst0, cst1, tmp; + tree type = integer_type_for_mask (var, vinfo); + tree cst0, cst1, tmp; - if (!type) - return NULL; + if (!type) + return NULL; - /* We may directly use cond with narrowed type to avoid - multiple cond exprs with following result packing and - perform single cond with packed mask instead. In case - of widening we better make cond first and then extract - results. 
*/ - if (TYPE_MODE (type) == TYPE_MODE (TREE_TYPE (lhs))) - type = TREE_TYPE (lhs); + /* We may directly use cond with narrowed type to avoid multiple cond + exprs with following result packing and perform single cond with + packed mask instead. In case of widening we better make cond first + and then extract results. */ + if (TYPE_MODE (type) == TYPE_MODE (TREE_TYPE (lhs))) + type = TREE_TYPE (lhs); - cst0 = build_int_cst (type, 0); - cst1 = build_int_cst (type, 1); - tmp = vect_recog_temp_ssa_var (type, NULL); - pattern_stmt = gimple_build_assign (tmp, COND_EXPR, var, cst1, cst0); + cst0 = build_int_cst (type, 0); + cst1 = build_int_cst (type, 1); + tmp = vect_recog_temp_ssa_var (type, NULL); + pattern_stmt = gimple_build_assign (tmp, COND_EXPR, var, cst1, cst0); - if (!useless_type_conversion_p (type, TREE_TYPE (lhs))) - { - tree new_vectype = get_vectype_for_scalar_type (vinfo, type); - append_pattern_def_seq (vinfo, stmt_vinfo, - pattern_stmt, new_vectype); + if (!useless_type_conversion_p (type, TREE_TYPE (lhs))) + { + tree new_vectype = get_vectype_for_scalar_type (vinfo, type); + append_pattern_def_seq (vinfo, stmt_vinfo, + pattern_stmt, new_vectype); - lhs = vect_recog_temp_ssa_var (TREE_TYPE (lhs), NULL); - pattern_stmt = gimple_build_assign (lhs, CONVERT_EXPR, tmp); - } + lhs = vect_recog_temp_ssa_var (TREE_TYPE (lhs), NULL); + pattern_stmt = gimple_build_assign (lhs, CONVERT_EXPR, tmp); } *type_out = vectype; @@ -5892,9 +5583,7 @@ vect_recog_bool_pattern (vec_info *vinfo, return NULL; enum vect_def_type dt; - if (check_bool_pattern (var, vinfo, bool_stmts)) - var = adjust_bool_stmts (vinfo, bool_stmts, type, stmt_vinfo); - else if (integer_type_for_mask (var, vinfo)) + if (integer_type_for_mask (var, vinfo)) return NULL; else if (TREE_CODE (TREE_TYPE (var)) == BOOLEAN_TYPE && vect_is_simple_use (var, vinfo, &dt) @@ -5941,28 +5630,22 @@ vect_recog_bool_pattern (vec_info *vinfo, if (!vectype || !VECTOR_MODE_P (TYPE_MODE (vectype))) return NULL; - if 
(check_bool_pattern (var, vinfo, bool_stmts)) - rhs = adjust_bool_stmts (vinfo, bool_stmts, - TREE_TYPE (vectype), stmt_vinfo); - else - { - tree type = integer_type_for_mask (var, vinfo); - tree cst0, cst1, new_vectype; + tree type = integer_type_for_mask (var, vinfo); + tree cst0, cst1, new_vectype; - if (!type) - return NULL; + if (!type) + return NULL; - if (TYPE_MODE (type) == TYPE_MODE (TREE_TYPE (vectype))) - type = TREE_TYPE (vectype); + if (TYPE_MODE (type) == TYPE_MODE (TREE_TYPE (vectype))) + type = TREE_TYPE (vectype); - cst0 = build_int_cst (type, 0); - cst1 = build_int_cst (type, 1); - new_vectype = get_vectype_for_scalar_type (vinfo, type); + cst0 = build_int_cst (type, 0); + cst1 = build_int_cst (type, 1); + new_vectype = get_vectype_for_scalar_type (vinfo, type); - rhs = vect_recog_temp_ssa_var (type, NULL); - pattern_stmt = gimple_build_assign (rhs, COND_EXPR, var, cst1, cst0); - append_pattern_def_seq (vinfo, stmt_vinfo, pattern_stmt, new_vectype); - } + rhs = vect_recog_temp_ssa_var (type, NULL); + pattern_stmt = gimple_build_assign (rhs, COND_EXPR, var, cst1, cst0); + append_pattern_def_seq (vinfo, stmt_vinfo, pattern_stmt, new_vectype); lhs = build1 (VIEW_CONVERT_EXPR, TREE_TYPE (vectype), lhs); if (!useless_type_conversion_p (TREE_TYPE (lhs), TREE_TYPE (rhs))) -- 2.43.0