Hi,

On Thu, 15 Mar 2012, Richard Guenther wrote:

> > The type demotion is PR45397/PR47477 among other PRs. I'd just walk 
> > from the narrowing integer conversion stmts recursively through the 
> > def stmts, see if they can be narrowed, note it, and finally if 
> > everything or significant portion of the stmts can be demoted (if not 
> > all, with some narrowing integer conversion stmt inserted), do it all 
> > together.
> 
> For PROMOTE_MODE targets you'd promote but properly mask out
> constants (to make them cheaper to generate, for example).  You'd
> also take advantate of targets that can do zero/sign-extending loads
> without extra cost (ISTR that's quite important for some SPEC 2k6
> benchmark on x86_64).

gamess.  I still have an old proof of concept patch doing type promotion.  
Probably doesn't apply anymore, and it's using too broad predicates (it 
simple-mindedly extends to the largest type see in an expression tree).
But I think that basic idea of it is sound.


Ciao,
Michael.

Index: passes.c
===================================================================
--- passes.c    (revision 159226)
+++ passes.c    (working copy)
@@ -831,6 +831,7 @@ init_optimization_passes (void)
   NEXT_PASS (pass_all_optimizations);
     {
       struct opt_pass **p = &pass_all_optimizations.pass.sub;
+      extern struct gimple_opt_pass pass_bprop_extends;
       NEXT_PASS (pass_remove_cgraph_callee_edges);
       /* Initial scalar cleanups before alias computation.
         They ensure memory accesses are not indirect wherever possible.  */
@@ -838,6 +839,7 @@ init_optimization_passes (void)
       NEXT_PASS (pass_update_address_taken);
       NEXT_PASS (pass_rename_ssa_copies);
       NEXT_PASS (pass_complete_unrolli);
+      NEXT_PASS (pass_bprop_extends);
       NEXT_PASS (pass_ccp);
       NEXT_PASS (pass_forwprop);
       NEXT_PASS (pass_call_cdce);
Index: tree-ssa-ccp.c
===================================================================
--- tree-ssa-ccp.c      (revision 159226)
+++ tree-ssa-ccp.c      (working copy)
@@ -1999,3 +1999,263 @@ struct gimple_opt_pass pass_fold_builtin
     | TODO_update_ssa                  /* todo_flags_finish */
  }
 };
+
+#if 1
+static bool
+promote_through_insn_p (gimple def, tree *prhs1, tree *prhs2)
+{
+  tree lhs, rhs1, rhs2;
+  if (!is_gimple_assign (def))
+    return false;
+  lhs = gimple_assign_lhs (def);
+  rhs1 = rhs2 = NULL;
+  switch (gimple_assign_rhs_class (def))
+    {
+      case GIMPLE_SINGLE_RHS:
+       rhs1 = gimple_assign_rhs1 (def);
+       if (TREE_CODE (rhs1) != SSA_NAME)
+         return false;
+       break;
+      case GIMPLE_UNARY_RHS:
+       rhs1 = gimple_assign_rhs1 (def);
+       if (TREE_TYPE (gimple_expr_type (def)) != TREE_TYPE (rhs1))
+         return false;
+       break;
+      case GIMPLE_BINARY_RHS:
+       rhs1 = gimple_assign_rhs1 (def);
+       rhs2 = gimple_assign_rhs2 (def);
+
+       switch (gimple_assign_rhs_code (def))
+         {
+           case LSHIFT_EXPR: case RSHIFT_EXPR:
+           case LROTATE_EXPR: case RROTATE_EXPR:
+             rhs2 = NULL;
+             if (TREE_TYPE (lhs) != TREE_TYPE (rhs1))
+               return false;
+             break;
+           case PLUS_EXPR: case MINUS_EXPR:
+           case MULT_EXPR: case EXACT_DIV_EXPR:
+           case TRUNC_DIV_EXPR: case CEIL_DIV_EXPR:
+           case FLOOR_DIV_EXPR: case ROUND_DIV_EXPR:
+           case TRUNC_MOD_EXPR: case CEIL_MOD_EXPR:
+           case FLOOR_MOD_EXPR: case ROUND_MOD_EXPR:
+           case RDIV_EXPR:
+           case MIN_EXPR: case MAX_EXPR:
+           case BIT_IOR_EXPR: case BIT_XOR_EXPR: case BIT_AND_EXPR:
+             if (TREE_TYPE (lhs) != TREE_TYPE (rhs1)
+                 || TREE_TYPE (lhs) != TREE_TYPE (rhs2))
+               return false;
+             break;
+           default:
+             return false;
+         }
+       break;
+      default:
+       return false;
+    }
+  if (rhs1 && TREE_CODE (rhs1) != SSA_NAME)
+    rhs1 = NULL;
+  if (prhs1)
+    *prhs1 = rhs1;
+  if (rhs2 && TREE_CODE (rhs2) != SSA_NAME)
+    rhs2 = NULL;
+  if (prhs2)
+    *prhs2 = rhs2;
+  return true;
+}
+
+static tree
+get_extended_version (tree newtype, tree name, bool force)
+{
+  tree ret = TREE_CHAIN (name);
+  tree rhs1, rhs2;
+  gimple def;
+  /* If we already have a version of NAME, try to use it.  If it
+     doesn't match in type, fail.  */
+  if (ret)
+    {
+      if (TREE_TYPE (ret) == newtype)
+       return ret;
+      else
+       return NULL_TREE;
+    }
+  def = SSA_NAME_DEF_STMT (name);
+  /* If we can propagate through our defining insn, try to do that.  */
+  if (promote_through_insn_p (def, &rhs1, &rhs2))
+    {
+      gimple stmt;
+      tree extrhs1, extrhs2;
+      gimple_stmt_iterator gsi;
+      enum tree_code code;
+      if (rhs1)
+       {
+         extrhs1 = get_extended_version (newtype, rhs1, true);
+         if (!extrhs1)
+           /* ??? We could force here.  */
+           return NULL_TREE;
+       }
+      else
+       extrhs1 = gimple_assign_rhs1 (def);
+      if (extrhs1 && !useless_type_conversion_p (newtype, TREE_TYPE (extrhs1)))
+       {
+         gcc_assert (is_gimple_min_invariant (extrhs1));
+         extrhs1 = fold_convert (newtype, extrhs1);
+       }
+      if (rhs2)
+       {
+         extrhs2 = get_extended_version (newtype, rhs2, true);
+         if (!extrhs2)
+           return NULL_TREE;
+       }
+      else
+       extrhs2 = gimple_assign_rhs2 (def);
+      code = gimple_assign_rhs_code (def);
+      if (extrhs2
+         && code != LSHIFT_EXPR && code != RSHIFT_EXPR
+         && code != LROTATE_EXPR && code != RROTATE_EXPR
+         && !useless_type_conversion_p (newtype, TREE_TYPE (extrhs2)))
+       {
+         gcc_assert (is_gimple_min_invariant (extrhs2));
+         extrhs2 = fold_convert (newtype, extrhs2);
+       }
+      ret = create_tmp_reg (newtype, NULL);
+      add_referenced_var (ret);
+      ret = make_ssa_name (ret, NULL);
+      stmt = gimple_build_assign_with_ops (gimple_assign_rhs_code (def),
+                                          ret, extrhs1, extrhs2);
+      gsi = gsi_for_stmt (def);
+      gsi_insert_after (&gsi, stmt, GSI_NEW_STMT);
+    }
+  else if (force)
+    {
+      gimple stmt;
+      gimple_stmt_iterator gsi;
+      /* We can't propagate through our defining statement, so emit
+         a conversion explicitely.  */
+      ret = create_tmp_reg (newtype, NULL);
+      add_referenced_var (ret);
+      ret = make_ssa_name (ret, NULL);
+      stmt = gimple_build_assign_with_ops (NOP_EXPR, ret, name, NULL);
+      if (gimple_nop_p (def))
+       {
+         gsi = gsi_after_labels (single_succ (ENTRY_BLOCK_PTR));
+         gsi_insert_before (&gsi, stmt, GSI_NEW_STMT);
+       }
+      else if (gimple_code (def) == GIMPLE_PHI)
+       {
+         gsi = gsi_after_labels (gimple_bb (def));
+         gsi_insert_before (&gsi, stmt, GSI_NEW_STMT);
+       }
+      else if (!stmt_ends_bb_p (def))
+       {
+         gsi = gsi_for_stmt (def);
+         gsi_insert_after (&gsi, stmt, GSI_NEW_STMT);
+       }
+      else
+       {
+         /* XXX We could search the fallthru edge, and insert there.
+            That's correct because if this statement ends the BB it
+            must be throwing (it can't be a conditional), and hence
+            the result (which we want to extend) actually is only
+            available on the fallthru edge.  But inserting on edges
+            might create new basic blocks, and that doesn't seem 
+            worth it.  We could do that if the fallthru successor
+            has only one incoming edge.  Actually we can be sure that
+            this is the case, as NAME can't be used in a PHI node
+            (we don't call ourself on them), hence it must be used
+            in something we dominate and therefore our fallthru successor
+            must have only one incoming edge.  */
+#if 0
+         edge e;
+         edge_iterator ei;
+
+         FOR_EACH_EDGE (e, ei, gimple_bb (def)->succs)
+           if (e->flags & EDGE_FALLTHRU)
+             gsi_insert_on_edge_immediate (e, sum);
+#endif
+         return NULL_TREE;
+       }
+    }
+  TREE_CHAIN (name) = ret;
+  return ret;
+}
+
+static unsigned int
+execute_bprop_extends (void)
+{
+  unsigned int todoflags = 0;
+  size_t i;
+  /*bitmap_iterator bi;*/
+  bitmap new_extend = BITMAP_ALLOC (NULL);
+
+  /* Collect SSA names that we'd like to have in a wider type.  */
+  for (i = 0; i < num_ssa_names; i++)
+    {
+      tree lhs = ssa_name (i);
+      if (lhs)
+       {
+         gimple def = SSA_NAME_DEF_STMT (lhs);
+         tree rhs;
+         TREE_CHAIN (lhs) = NULL;
+         if (!is_gimple_assign (def)
+             || !CONVERT_EXPR_CODE_P (gimple_assign_rhs_code (def)))
+           continue;
+         rhs = gimple_assign_rhs1 (def);
+         /* We could handle int->pointer conversions with some care
+            through which insns we look through.  Don't bother for now.  */
+         if (POINTER_TYPE_P (TREE_TYPE (lhs))
+             || POINTER_TYPE_P (TREE_TYPE (rhs)))
+           continue;
+         if (TYPE_PRECISION (TREE_TYPE (lhs))
+             <= TYPE_PRECISION (TREE_TYPE (rhs)))
+           continue;
+         if (!nowrap_type_p (TREE_TYPE (rhs)))
+           continue;
+         bitmap_set_bit (new_extend, SSA_NAME_VERSION (lhs));
+       }
+    }
+
+  while (!bitmap_empty_p (new_extend))
+    {
+      tree lhs, rhs, extlhs;
+      gimple def;
+      i = bitmap_first_set_bit (new_extend);
+      bitmap_clear_bit (new_extend, i);
+      lhs = ssa_name (i);
+      gcc_assert (lhs);
+      def = SSA_NAME_DEF_STMT (lhs);
+      rhs = gimple_assign_rhs1 (def);
+      extlhs = get_extended_version (TREE_TYPE (lhs), rhs, false);
+      if (extlhs)
+       {
+         gimple_assign_set_rhs1 (def, extlhs);
+         gimple_assign_set_rhs_code (def, SSA_NAME);
+         update_stmt (def);
+       }
+    }
+
+  BITMAP_FREE (new_extend);
+  return todoflags;
+}
+
+struct gimple_opt_pass pass_bprop_extends =
+{
+ {
+  GIMPLE_PASS,
+  "bprop",                             /* name */
+  NULL,                                        /* gate */
+  execute_bprop_extends,               /* execute */
+  NULL,                                        /* sub */
+  NULL,                                        /* next */
+  0,                                   /* static_pass_number */
+  TV_NONE,                             /* tv_id */
+  PROP_cfg | PROP_ssa,                 /* properties_required */
+  0,                                   /* properties_provided */
+  0,                                   /* properties_destroyed */
+  0,                                   /* todo_flags_start */
+  TODO_dump_func
+    | TODO_verify_ssa
+    | TODO_update_ssa                  /* todo_flags_finish */
+ }
+};
+#endif

Reply via email to