Hi!

On the testcase below we ICE since my PR48343 patch.
The problem is that update_cfg_for_uncondjump delete_insns the noop move,
if the insn to be deleted is last_combined_insn (which can be both
if it is i3 or when retrying and undobuf.other_insn happens to be
last_combined_insn), next propagate_for_debug won't find the deleted
insn in the stream and thus will search through the whole rest of the
function and crash on dereferencing NULL NEXT_INSN.

The following patch fixes it, bootstrapped/regtested on x86_64-linux
and i686-linux (also with the patch attached after it), but it is
mainly for discussion what to do.

The propagate_for_debug change alone could fix it, we should never
fall through into next basic block.  We are unforuntately not deleting
just jumps (which ought to appear at the end of bbs), but also
any other noop moves, which I think is unintentional, we have
delete_noop_moves that should clean that up instead (see the second patch).
With the second patch, bootstrap succeeded even with gcc_assert (at_end);
in update_cfg_for_uncondjump, so either it is always at the end, or at
least very often, thus perhaps with the second patch being applied
in combine_instructions we could just for INSN_DELETED_P clear
last_combined_insn right away, meaning we want to propagate till end of
current bb.

2011-04-11  Jakub Jelinek  <ja...@redhat.com>

        PR rtl-optimization/48549
        * combine.c (propagate_for_debug): Also stop after BB_END of
        this_basic_block.
        (combine_instructions): If last_combined_insn has been deleted,
        set last_combined_insn to the next nondebug insn, or NULL
        if after the end of BB.
        (try_combine): Handle last_combined_insn being NULL.

        * g++.dg/opt/pr48549.C: New test.

--- gcc/combine.c.jj    2011-04-10 19:05:25.000000000 +0200
+++ gcc/combine.c       2011-04-11 09:13:04.000000000 +0200
@@ -1179,7 +1179,7 @@ combine_instructions (rtx f, unsigned in
 
   FOR_EACH_BB (this_basic_block)
     {
-      rtx last_combined_insn = NULL_RTX;
+      rtx last_combined_insn = pc_rtx;
       optimize_this_for_speed_p = optimize_bb_for_speed_p (this_basic_block);
       last_call_luid = 0;
       mem_last_set = -1;
@@ -1198,9 +1198,26 @@ combine_instructions (rtx f, unsigned in
          next = 0;
          if (NONDEBUG_INSN_P (insn))
            {
-             if (last_combined_insn == NULL_RTX
-                 || DF_INSN_LUID (last_combined_insn) < DF_INSN_LUID (insn))
+             if (last_combined_insn == pc_rtx)
                last_combined_insn = insn;
+             else if (last_combined_insn)
+               {
+                 if (INSN_DELETED_P (last_combined_insn))
+                   {
+                     while (last_combined_insn
+                            != NEXT_INSN (BB_END (this_basic_block))
+                            && (!NONDEBUG_INSN_P (last_combined_insn)
+                                || INSN_DELETED_P (last_combined_insn)))
+                       last_combined_insn = NEXT_INSN (last_combined_insn);
+                     if (last_combined_insn
+                         == NEXT_INSN (BB_END (this_basic_block)))
+                       last_combined_insn = NULL_RTX;
+                   }
+                 if (last_combined_insn
+                     && DF_INSN_LUID (last_combined_insn)
+                        <= DF_INSN_LUID (insn))
+                   last_combined_insn = insn;
+               }
 
              /* See if we know about function return values before this
                 insn based upon SUBREG flags.  */
@@ -2451,14 +2468,14 @@ propagate_for_debug_subst (rtx from, con
 static void
 propagate_for_debug (rtx insn, rtx last, rtx dest, rtx src)
 {
-  rtx next, loc;
+  rtx next, loc, end = NEXT_INSN (BB_END (this_basic_block));
 
   struct rtx_subst_pair p;
   p.to = src;
   p.adjusted = false;
 
   next = NEXT_INSN (insn);
-  while (next != last)
+  while (next != last && next != end)
     {
       insn = next;
       next = NEXT_INSN (insn);
@@ -3904,8 +3921,9 @@ try_combine (rtx i3, rtx i2, rtx i1, rtx
                    first = i3;
                    last = undobuf.other_insn;
                    gcc_assert (last);
-                   if (DF_INSN_LUID (last)
-                       < DF_INSN_LUID (last_combined_insn))
+                   if (last_combined_insn == NULL_RTX
+                       || (DF_INSN_LUID (last)
+                           < DF_INSN_LUID (last_combined_insn)))
                      last = last_combined_insn;
                  }
 
--- gcc/testsuite/g++.dg/opt/pr48549.C.jj       2011-04-11 08:35:03.000000000 
+0200
+++ gcc/testsuite/g++.dg/opt/pr48549.C  2011-04-11 08:34:19.000000000 +0200
@@ -0,0 +1,63 @@
+// PR rtl-optimization/48549
+// { dg-do compile }
+// { dg-options "-fcompare-debug -O2" }
+
+void
+foo (void *from, void *to)
+{
+  long offset = reinterpret_cast <long>(to) - reinterpret_cast <long>(from);
+  if (offset != static_cast <int>(offset))
+    *(int *) 0xC0DE = 0;
+  reinterpret_cast <int *>(from)[1] = offset;
+}
+struct A
+{
+  A () : a () {}
+  A (void *x) : a (x) {}
+  void *bar () { return a; }
+  void *a;
+};
+struct C;
+struct D;
+struct E : public A
+{
+  C m1 (int);
+  D m2 ();
+  E () {}
+  E (A x) : A (x) {}
+};
+struct C : public E
+{
+  C () {}
+  C (void *x) : E (x) {}
+};
+struct D : public E
+{
+  D (void *x) : E (x) {}
+};
+C
+E::m1 (int x)
+{
+  return (reinterpret_cast <char *>(bar ()) + x);
+}
+D
+E::m2 ()
+{
+  return reinterpret_cast <char *>(bar ());
+}
+struct B
+{
+  E a;
+  unsigned b : 16;
+  unsigned c : 1;
+};
+void
+baz (B *x)
+{
+  for (unsigned i = 0; i < 64; i++)
+    {
+      D d = x[i].a.m2 ();
+      C c = x[i].a.m1 (x[i].c);
+      foo (d.bar (), c.bar ());
+    }
+}

        Jakub
2011-04-11  Jakub Jelinek  <ja...@redhat.com>

        * combine.c (try_combine): Don't call update_cfg_for_uncondjump
        for noop non-jump moves.

--- gcc/combine.c.jj    2011-04-09 19:29:19.083421147 +0200
+++ gcc/combine.c       2011-04-11 10:27:41.769671151 +0200
@@ -4402,7 +4421,8 @@ try_combine (rtx i3, rtx i2, rtx i1, rtx
 
   /* A noop might also need cleaning up of CFG, if it comes from the
      simplification of a jump.  */
-  if (GET_CODE (newpat) == SET
+  if (JUMP_P (i3)
+      && GET_CODE (newpat) == SET
       && SET_SRC (newpat) == pc_rtx
       && SET_DEST (newpat) == pc_rtx)
     {
@@ -4411,6 +4431,7 @@ try_combine (rtx i3, rtx i2, rtx i1, rtx
     }
 
   if (undobuf.other_insn != NULL_RTX
+      && JUMP_P (undobuf.other_insn)
       && GET_CODE (PATTERN (undobuf.other_insn)) == SET
       && SET_SRC (PATTERN (undobuf.other_insn)) == pc_rtx
       && SET_DEST (PATTERN (undobuf.other_insn)) == pc_rtx)

Reply via email to