This fixes PR52028: we were not properly rewriting the virtual SSA form
in loop distribution.

Bootstrapped and tested on x86_64-unknown-linux-gnu, applied to trunk.

Richard.

2012-01-30  Richard Guenther  <rguent...@suse.de>

        PR tree-optimization/52028
        * tree-loop-distribution.c (ldist_gen): Properly update
        virtual SSA form.

        * gcc.dg/torture/pr52028.c: New testcase.
        * gfortran.dg/ldist-pr45199.f: Adjust.
        * gcc.dg/tree-ssa/ldist-16.c: Likewise.
        * gcc.dg/tree-ssa/ldist-17.c: Likewise.
        * gcc.dg/tree-ssa/ldist-pr45948.c: Likewise.

Index: gcc/tree-loop-distribution.c
===================================================================
*** gcc/tree-loop-distribution.c        (revision 183719)
--- gcc/tree-loop-distribution.c        (working copy)
*************** ldist_gen (struct loop *loop, struct gra
*** 1143,1149 ****
        goto ldist_done;
  
    rewrite_into_loop_closed_ssa (NULL, TODO_update_ssa);
!   update_ssa (TODO_update_ssa_only_virtuals | TODO_update_ssa);
  
   ldist_done:
  
--- 1143,1150 ----
        goto ldist_done;
  
    rewrite_into_loop_closed_ssa (NULL, TODO_update_ssa);
!   mark_sym_for_renaming (gimple_vop (cfun));
!   update_ssa (TODO_update_ssa_only_virtuals);
  
   ldist_done:
  
Index: gcc/testsuite/gcc.dg/torture/pr52028.c
===================================================================
*** gcc/testsuite/gcc.dg/torture/pr52028.c      (revision 0)
--- gcc/testsuite/gcc.dg/torture/pr52028.c      (revision 0)
***************
*** 0 ****
--- 1,83 ----
+ /* { dg-do run } */
+ /* { dg-require-effective-target int32plus } */
+ /* { dg-options "-ftree-loop-distribution" } */
+ 
+ #define CAST_LONG unsigned int
+ typedef struct cast_key_st
+ {
+   CAST_LONG data[32];
+ } CAST_KEY;
+ #define CAST_exp(l,A,a,n) \
+       A[n/4]=l; \
+       a[n+3]=(l    )&0xff; \
+       a[n+2]=(l>> 8)&0xff; \
+       a[n+1]=(l>>16)&0xff; \
+       a[n+0]=(l>>24)&0xff;
+ 
+ CAST_LONG CAST_S_table[1024];
+ 
+ #define S4 (CAST_S_table + 000)
+ #define S5 (CAST_S_table + 256)
+ #define S6 (CAST_S_table + 512)
+ #define S7 (CAST_S_table + 768)
+ 
+ void
+ CAST_set_key (CAST_KEY * key)
+ {
+   CAST_LONG x[16];
+   CAST_LONG z[16];
+   CAST_LONG k[32];
+   CAST_LONG X[4] = {0,0,0,0}, Z[4];
+   CAST_LONG l, *K = k;
+   int i;
+   for (i = 0; i < 16; i++)
+     x[i] = 0;
+   for (;;)
+     {
+       l = X[0] ^ S4[x[13]] ^ S5[x[15]] ^ S6[x[12]] ^ S7[x[14]] ^ S6[x[8]];
+       CAST_exp (l, Z, z, 0);
+       CAST_exp (l, Z, z, 4);
+       CAST_exp (l, Z, z, 8);
+       CAST_exp (l, Z, z, 12);
+       K[0] = S4[z[8]] ^ S5[z[9]] ^ S6[z[7]] ^ S7[z[6]] ^ S4[z[2]];
+       K[1] = S4[z[10]] ^ S5[z[11]] ^ S6[z[5]] ^ S7[z[4]] ^ S5[z[6]];
+       K[2] = S4[z[12]] ^ S5[z[13]] ^ S6[z[3]] ^ S7[z[2]] ^ S6[z[9]];
+       K[3] = S4[z[14]] ^ S5[z[15]] ^ S6[z[1]] ^ S7[z[0]] ^ S7[z[12]];
+       K[4] = S4[x[3]] ^ S5[x[2]] ^ S6[x[12]] ^ S7[x[13]] ^ S4[x[8]];
+       K[5] = S4[x[1]] ^ S5[x[0]] ^ S6[x[14]] ^ S7[x[15]] ^ S5[x[13]];
+       K[6] = S4[x[7]] ^ S5[x[6]] ^ S6[x[8]] ^ S7[x[9]] ^ S6[x[3]];
+       K[7] = S4[x[5]] ^ S5[x[4]] ^ S6[x[10]] ^ S7[x[11]] ^ S7[x[7]];
+       K[8] = S4[z[3]] ^ S5[z[2]] ^ S6[z[12]] ^ S7[z[13]] ^ S4[z[9]];
+       K[9] = S4[z[1]] ^ S5[z[0]] ^ S6[z[14]] ^ S7[z[15]] ^ S5[z[12]];
+       K[10] = S4[z[7]] ^ S5[z[6]] ^ S6[z[8]] ^ S7[z[9]] ^ S6[z[2]];
+       K[11] = S4[z[5]] ^ S5[z[4]] ^ S6[z[10]] ^ S7[z[11]] ^ S7[z[6]];
+       l = Z[2] ^ S4[z[5]] ^ S5[z[7]] ^ S6[z[4]] ^ S7[z[6]] ^ S6[z[0]];
+       CAST_exp (l, X, x, 0);
+       K[12] = S4[x[8]] ^ S5[x[9]] ^ S6[x[7]] ^ S7[x[6]] ^ S4[x[3]];
+       K[13] = S4[x[10]] ^ S5[x[11]] ^ S6[x[5]] ^ S7[x[4]] ^ S5[x[7]];
+       K[14] = S4[x[12]] ^ S5[x[13]] ^ S6[x[3]] ^ S7[x[2]] ^ S6[x[8]];
+       K[15] = S4[x[14]] ^ S5[x[15]] ^ S6[x[1]] ^ S7[x[0]] ^ S7[x[13]];
+       if (K != k)
+       break;
+       K += 16;
+     }
+   for (i = 0; i < 16; i++)
+     {
+       key->data[i * 2] = k[i];
+       key->data[i * 2 + 1] = ((k[i + 16]) + 16) & 0x1f;
+     }
+ }
+ 
+ int
+ main ()
+ {
+   CAST_KEY ref = { {0x0069B3F8, 0x00000013, 0x000AEFF8, 0x00000013, 0x004AD0E0, 0x0000001B, 0x00818F18, 0x00000018, 0x008FF000, 0x0000001B, 0x002D1C00, 0x0000001B, 0x00EA2800, 0x00000010, 0x00C73400, 0x00000010, 0x004BF8E0, 0x0000001B, 0x00B3D718, 0x00000018, 0x00B0EBF8, 0x00000013, 0x003247F8, 0x00000013, 0x00C5BA20, 0x00000010, 0x002D1C00, 0x00000010, 0x0060822B, 0x00000008, 0x0096236B, 0x0000001B} };
+   CAST_KEY key;
+   unsigned i;
+   for (i = 1; i < 1024; i++)
+     CAST_S_table[i] = (CAST_S_table[i-1] * 7 + 3) & 0xFFFFFF;
+   CAST_set_key (&key);
+   if (__builtin_memcmp(&ref, &key, sizeof(ref)))
+     __builtin_abort();
+   return 0;
+ }
Index: gcc/testsuite/gfortran.dg/ldist-pr45199.f
===================================================================
*** gcc/testsuite/gfortran.dg/ldist-pr45199.f   (revision 183719)
--- gcc/testsuite/gfortran.dg/ldist-pr45199.f   (working copy)
***************
*** 23,27 ****
  ! GCC should apply memset zero loop distribution and it should not ICE.
  
  ! { dg-final { scan-tree-dump "distributed: split to 9 loops" "ldist" } }
! ! { dg-final { scan-tree-dump-times "__builtin_memset" 18 "ldist" } }
  ! { dg-final { cleanup-tree-dump "ldist" } }
--- 23,27 ----
  ! GCC should apply memset zero loop distribution and it should not ICE.
  
  ! { dg-final { scan-tree-dump "distributed: split to 9 loops" "ldist" } }
! ! { dg-final { scan-tree-dump-times "generated memset zero" 9 "ldist" } }
  ! { dg-final { cleanup-tree-dump "ldist" } }
Index: gcc/testsuite/gcc.dg/tree-ssa/ldist-16.c
===================================================================
*** gcc/testsuite/gcc.dg/tree-ssa/ldist-16.c    (revision 183719)
--- gcc/testsuite/gcc.dg/tree-ssa/ldist-16.c    (working copy)
*************** void foo (int n)
*** 17,21 ****
  /* We should apply loop distribution and generate a memset (0).  */
  
  /* { dg-final { scan-tree-dump "distributed: split to 2" "ldist" } } */
! /* { dg-final { scan-tree-dump-times "__builtin_memset" 2 "ldist" } } */
  /* { dg-final { cleanup-tree-dump "ldist" } } */
--- 17,21 ----
  /* We should apply loop distribution and generate a memset (0).  */
  
  /* { dg-final { scan-tree-dump "distributed: split to 2" "ldist" } } */
! /* { dg-final { scan-tree-dump-times "generated memset zero" 1 "ldist" } } */
  /* { dg-final { cleanup-tree-dump "ldist" } } */
Index: gcc/testsuite/gcc.dg/tree-ssa/ldist-17.c
===================================================================
*** gcc/testsuite/gcc.dg/tree-ssa/ldist-17.c    (revision 183719)
--- gcc/testsuite/gcc.dg/tree-ssa/ldist-17.c    (working copy)
*************** mad_synth_mute (struct mad_synth *synth)
*** 46,50 ****
  }
  
  /* { dg-final { scan-tree-dump "distributed: split to 4" "ldist" } } */
! /* { dg-final { scan-tree-dump-times "__builtin_memset" 8 "ldist" } } */
  /* { dg-final { cleanup-tree-dump "ldist" } } */
--- 46,50 ----
  }
  
  /* { dg-final { scan-tree-dump "distributed: split to 4" "ldist" } } */
! /* { dg-final { scan-tree-dump-times "generated memset zero" 4 "ldist" } } */
  /* { dg-final { cleanup-tree-dump "ldist" } } */
Index: gcc/testsuite/gcc.dg/tree-ssa/ldist-pr45948.c
===================================================================
*** gcc/testsuite/gcc.dg/tree-ssa/ldist-pr45948.c       (revision 183719)
--- gcc/testsuite/gcc.dg/tree-ssa/ldist-pr45948.c       (working copy)
*************** foo (int i, int n)
*** 19,23 ****
  /* We should apply loop distribution and generate 2 memset (0).  */
  
  /* { dg-final { scan-tree-dump "distributed: split to 2" "ldist" } } */
! /* { dg-final { scan-tree-dump-times "__builtin_memset" 4 "ldist" } } */
  /* { dg-final { cleanup-tree-dump "ldist" } } */
--- 19,23 ----
  /* We should apply loop distribution and generate 2 memset (0).  */
  
  /* { dg-final { scan-tree-dump "distributed: split to 2" "ldist" } } */
! /* { dg-final { scan-tree-dump-times "generated memset zero" 2 "ldist" } } */
  /* { dg-final { cleanup-tree-dump "ldist" } } */

Reply via email to