On Fri, Sep 28, 2012 at 12:42 AM, Marc Glisse <marc.gli...@inria.fr> wrote: > Hello, > > I have been experimenting with generating VEC_COND_EXPR from the front-end, > and these are just a couple things I noticed. > > 1) optabs.c requires that the first argument of vec_cond_expr be a > comparison, but verify_gimple_assign_ternary only checks is_gimple_condexpr, > like for COND_EXPR. In the long term, it seems better to also allow ssa_name > and vector_cst (thus match the is_gimple_condexpr condition), but for now I > just want to know early if I created an invalid vec_cond_expr.
optabs should be fixed instead, an is_gimple_val condition is implicitely val != 0. > 2) a little refactoring of the code to find a suitable vector type for > comparison results, and one more place where it should be used (no testcase > yet because I don't know if that path can be taken without front-end changes > first). Yes, it looks fine to me. > I did wonder, for tree-ssa-forwprop, about using directly TREE_TYPE > (cond) without truth_type_for. Yes, that should work. > Hmm, now I am wondering whether I should have waited until I had front-end > vec_cond_expr support to submit everything at once... ;) The tree.[ch] and gimple-fold.c hunks are ok if tested properly, the tree-ssa-forwprop.c idea of using TREE_TYPE (cond), too. I don't like the tree-cfg.c change, instead re-factor optabs.c to get a decomposed cond for vector_compare_rtx and appropriately "decompose" a non-comparison-class cond in expand_vec_cond_expr. If we for example have predicate = a < b; x = predicate ? d : e; y = predicate ? f : g; we ideally want to re-use the predicate computation on targets where that would be optimal (and combine should be able to recover the case where it is not). Thanks, Richard. > 2012-09-27 Marc Glisse <marc.gli...@inria.fr> > > * tree-cfg.c (verify_gimple_assign_ternary): Stricter check on > first argument of VEC_COND_EXPR. > * tree.c (truth_type_for): New function. > * tree.h (truth_type_for): Declare. > * gimple-fold.c (and_comparisons_1): Call it. > (or_comparisons_1): Likewise. > * tree-ssa-forwprop.c (forward_propagate_into_cond): Likewise. > > -- > Marc Glisse > Index: gcc/tree-ssa-forwprop.c > =================================================================== > --- gcc/tree-ssa-forwprop.c (revision 191810) > +++ gcc/tree-ssa-forwprop.c (working copy) > @@ -549,21 +549,22 @@ static bool > forward_propagate_into_cond (gimple_stmt_iterator *gsi_p) > { > gimple stmt = gsi_stmt (*gsi_p); > tree tmp = NULL_TREE; > tree cond = gimple_assign_rhs1 (stmt); > bool swap = false; > > /* We can do tree combining on SSA_NAME and comparison expressions. */ > if (COMPARISON_CLASS_P (cond)) > tmp = forward_propagate_into_comparison_1 (stmt, TREE_CODE (cond), > - boolean_type_node, > + truth_type_for > + (TREE_TYPE (cond)), > TREE_OPERAND (cond, 0), > TREE_OPERAND (cond, 1)); > else if (TREE_CODE (cond) == SSA_NAME) > { > enum tree_code code; > tree name = cond; > gimple def_stmt = get_prop_source_stmt (name, true, NULL); > if (!def_stmt || !can_propagate_from (def_stmt)) > return 0; > > Index: gcc/tree-cfg.c > =================================================================== > --- gcc/tree-cfg.c (revision 191810) > +++ gcc/tree-cfg.c (working copy) > @@ -3758,22 +3758,24 @@ verify_gimple_assign_ternary (gimple stm > tree rhs2_type = TREE_TYPE (rhs2); > tree rhs3 = gimple_assign_rhs3 (stmt); > tree rhs3_type = TREE_TYPE (rhs3); > > if (!is_gimple_reg (lhs)) > { > error ("non-register as LHS of ternary operation"); > return true; > } > > - if (((rhs_code == VEC_COND_EXPR || rhs_code == COND_EXPR) > - ? !is_gimple_condexpr (rhs1) : !is_gimple_val (rhs1)) > + if (((rhs_code == COND_EXPR) ? !is_gimple_condexpr (rhs1) > + : (rhs_code == VEC_COND_EXPR) ? (!is_gimple_condexpr (rhs1) > + || is_gimple_val (rhs1)) > + : !is_gimple_val (rhs1)) > || !is_gimple_val (rhs2) > || !is_gimple_val (rhs3)) > { > error ("invalid operands in ternary operation"); > return true; > } > > /* First handle operations that involve different types. */ > switch (rhs_code) > { > Index: gcc/gimple-fold.c > =================================================================== > --- gcc/gimple-fold.c (revision 191810) > +++ gcc/gimple-fold.c (working copy) > @@ -23,21 +23,20 @@ along with GCC; see the file COPYING3. > #include "coretypes.h" > #include "tm.h" > #include "tree.h" > #include "flags.h" > #include "function.h" > #include "dumpfile.h" > #include "tree-flow.h" > #include "tree-ssa-propagate.h" > #include "target.h" > #include "gimple-fold.h" > -#include "langhooks.h" > > /* Return true when DECL can be referenced from current unit. > FROM_DECL (if non-null) specify constructor of variable DECL was taken > from. > We can get declarations that are not possible to reference for various > reasons: > > 1) When analyzing C++ virtual tables. > C++ virtual tables do have known constructors even > when they are keyed to other compilation unit. > Those tables can contain pointers to methods and vars > @@ -1686,29 +1685,21 @@ and_var_with_comparison_1 (gimple stmt, > (OP1A CODE1 OP1B) and (OP2A CODE2 OP2B), respectively. > If this can be done without constructing an intermediate value, > return the resulting tree; otherwise NULL_TREE is returned. > This function is deliberately asymmetric as it recurses on SSA_DEFs > in the first comparison but not the second. */ > > static tree > and_comparisons_1 (enum tree_code code1, tree op1a, tree op1b, > enum tree_code code2, tree op2a, tree op2b) > { > - tree truth_type = boolean_type_node; > - if (TREE_CODE (TREE_TYPE (op1a)) == VECTOR_TYPE) > - { > - tree vec_type = TREE_TYPE (op1a); > - tree elem = lang_hooks.types.type_for_size > - (GET_MODE_BITSIZE (TYPE_MODE (TREE_TYPE (vec_type))), 0); > - truth_type = build_opaque_vector_type (elem, > - TYPE_VECTOR_SUBPARTS > (vec_type)); > - } > + tree truth_type = truth_type_for (TREE_TYPE (op1a)); > > /* First check for ((x CODE1 y) AND (x CODE2 y)). */ > if (operand_equal_p (op1a, op2a, 0) > && operand_equal_p (op1b, op2b, 0)) > { > /* Result will be either NULL_TREE, or a combined comparison. */ > tree t = combine_comparisons (UNKNOWN_LOCATION, > TRUTH_ANDIF_EXPR, code1, code2, > truth_type, op1a, op1b); > if (t) > @@ -2158,29 +2149,21 @@ or_var_with_comparison_1 (gimple stmt, > (OP1A CODE1 OP1B) and (OP2A CODE2 OP2B), respectively. > If this can be done without constructing an intermediate value, > return the resulting tree; otherwise NULL_TREE is returned. > This function is deliberately asymmetric as it recurses on SSA_DEFs > in the first comparison but not the second. */ > > static tree > or_comparisons_1 (enum tree_code code1, tree op1a, tree op1b, > enum tree_code code2, tree op2a, tree op2b) > { > - tree truth_type = boolean_type_node; > - if (TREE_CODE (TREE_TYPE (op1a)) == VECTOR_TYPE) > - { > - tree vec_type = TREE_TYPE (op1a); > - tree elem = lang_hooks.types.type_for_size > - (GET_MODE_BITSIZE (TYPE_MODE (TREE_TYPE (vec_type))), 0); > - truth_type = build_opaque_vector_type (elem, > - TYPE_VECTOR_SUBPARTS > (vec_type)); > - } > + tree truth_type = truth_type_for (TREE_TYPE (op1a)); > > /* First check for ((x CODE1 y) OR (x CODE2 y)). */ > if (operand_equal_p (op1a, op2a, 0) > && operand_equal_p (op1b, op2b, 0)) > { > /* Result will be either NULL_TREE, or a combined comparison. */ > tree t = combine_comparisons (UNKNOWN_LOCATION, > TRUTH_ORIF_EXPR, code1, code2, > truth_type, op1a, op1b); > if (t) > Index: gcc/tree.c > =================================================================== > --- gcc/tree.c (revision 191810) > +++ gcc/tree.c (working copy) > @@ -10243,20 +10243,36 @@ unsigned_type_for (tree type) > /* If TYPE is an integral or pointer type, return an integer type with > the same precision which is signed, or itself if TYPE is already a > signed integer type. */ > > tree > signed_type_for (tree type) > { > return signed_or_unsigned_type_for (0, type); > } > > +/* If TYPE is a vector type, return a signed integer vector type with the > + same width and number of subparts. Otherwise return boolean_type_node. > */ > + > +tree > +truth_type_for (tree type) > +{ > + if (TREE_CODE (type) == VECTOR_TYPE) > + { > + tree elem = lang_hooks.types.type_for_size > + (GET_MODE_BITSIZE (TYPE_MODE (TREE_TYPE (type))), 0); > + return build_opaque_vector_type (elem, TYPE_VECTOR_SUBPARTS (type)); > + } > + else > + return boolean_type_node; > +} > + > /* Returns the largest value obtainable by casting something in INNER type > to > OUTER type. */ > > tree > upper_bound_in_type (tree outer, tree inner) > { > double_int high; > unsigned int det = 0; > unsigned oprec = TYPE_PRECISION (outer); > unsigned iprec = TYPE_PRECISION (inner); > Index: gcc/tree.h > =================================================================== > --- gcc/tree.h (revision 191810) > +++ gcc/tree.h (working copy) > @@ -4762,20 +4762,21 @@ extern tree build_call_valist (tree, tre > extern tree build_call_array_loc (location_t, tree, tree, int, const tree > *); > extern tree build_call_vec (tree, tree, VEC(tree,gc) *); > > /* Construct various nodes representing data types. */ > > extern tree make_signed_type (int); > extern tree make_unsigned_type (int); > extern tree signed_or_unsigned_type_for (int, tree); > extern tree signed_type_for (tree); > extern tree unsigned_type_for (tree); > +extern tree truth_type_for (tree); > extern void initialize_sizetypes (void); > extern void fixup_unsigned_type (tree); > extern tree build_pointer_type_for_mode (tree, enum machine_mode, bool); > extern tree build_pointer_type (tree); > extern tree build_reference_type_for_mode (tree, enum machine_mode, bool); > extern tree build_reference_type (tree); > extern tree build_vector_type_for_mode (tree, enum machine_mode); > extern tree build_vector_type (tree innertype, int nunits); > extern tree build_opaque_vector_type (tree innertype, int nunits); > extern tree build_type_no_quals (tree); >