On Wed, 18 Sep 2019, Kito Cheng wrote:

> Hi Jakub, Richard:
> 
> This commit is fixing wrong code gen for RISC-V, does it OK to
> backport to GCC 9 branch?

Since it is target specific and for non-primary/secondary targets
it's the RISC-V maintainers call whether to allow backporting this.
Generally wrong-code issues can be backported even if they are not
regressions if the chance they introduce other issues is low.

Richard.

> On Fri, Sep 6, 2019 at 4:34 AM Jim Wilson <j...@sifive.com> wrote:
> >
> > Shifting by more than the size of a SUBREG_REG doesn't work, so we either
> > need to disable splits if an input is paradoxical, or else we need to
> > generate a clean temporary for intermediate results.
> >
> > This was tested with rv32i/newlib and rv64gc/linux cross builds and checks.
> > There were no regressions.  The new pr91635.c testcase works with the patch
> > and fails without it.  Also, code size for libc and libstdc++ was checked
> > and is smaller or equal sized with the patch, ignoring alignment padding.
> > The shift-shift-4.c testcase gives better code size with this patch.
> > The shift-shift-5.c testcase gave worse code size with a draft version
> > of this patch and is OK with the final version of this patch.
> >
> > Jakub wrote the first version of this patch, so gets primary credit for it.
> >
> > Committed.
> >
> > Jim
> >
> >         gcc/
> >         PR target/91635
> >         * config/riscv/riscv.md (zero_extendsidi2, zero_extendhi<GPR:mode>2,
> >         extend<SHORT:mode><SUPERQI:mode>2): Don't split if
> >         paradoxical_subreg_p (operands[0]).
> >         (*lshrsi3_zero_extend_3+1, *lshrsi3_zero_extend_3+2): Add clobber 
> > and
> >         use as intermediate value.
> >
> >         gcc/testsuite/
> >         PR target/91635
> >         * gcc.c-torture/execute/pr91635.c: New test.
> >         * gcc.target/riscv/shift-shift-4.c: New test.
> >         * gcc.target/riscv/shift-shift-5.c: New test.
> > ---
> >  gcc/config/riscv/riscv.md                     | 30 +++++++---
> >  gcc/testsuite/gcc.c-torture/execute/pr91635.c | 57 +++++++++++++++++++
> >  .../gcc.target/riscv/shift-shift-4.c          | 13 +++++
> >  .../gcc.target/riscv/shift-shift-5.c          | 16 ++++++
> >  4 files changed, 107 insertions(+), 9 deletions(-)
> >  create mode 100644 gcc/testsuite/gcc.c-torture/execute/pr91635.c
> >  create mode 100644 gcc/testsuite/gcc.target/riscv/shift-shift-4.c
> >  create mode 100644 gcc/testsuite/gcc.target/riscv/shift-shift-5.c
> >
> > diff --git a/gcc/config/riscv/riscv.md b/gcc/config/riscv/riscv.md
> > index 78260fcf6fd..744a027a1b7 100644
> > --- a/gcc/config/riscv/riscv.md
> > +++ b/gcc/config/riscv/riscv.md
> > @@ -1051,7 +1051,9 @@
> >    "@
> >     #
> >     lwu\t%0,%1"
> > -  "&& reload_completed && REG_P (operands[1])"
> > +  "&& reload_completed
> > +   && REG_P (operands[1])
> > +   && !paradoxical_subreg_p (operands[0])"
> >    [(set (match_dup 0)
> >         (ashift:DI (match_dup 1) (const_int 32)))
> >     (set (match_dup 0)
> > @@ -1068,7 +1070,9 @@
> >    "@
> >     #
> >     lhu\t%0,%1"
> > -  "&& reload_completed && REG_P (operands[1])"
> > +  "&& reload_completed
> > +   && REG_P (operands[1])
> > +   && !paradoxical_subreg_p (operands[0])"
> >    [(set (match_dup 0)
> >         (ashift:GPR (match_dup 1) (match_dup 2)))
> >     (set (match_dup 0)
> > @@ -1117,7 +1121,9 @@
> >    "@
> >     #
> >     l<SHORT:size>\t%0,%1"
> > -  "&& reload_completed && REG_P (operands[1])"
> > +  "&& reload_completed
> > +   && REG_P (operands[1])
> > +   && !paradoxical_subreg_p (operands[0])"
> >    [(set (match_dup 0) (ashift:SI (match_dup 1) (match_dup 2)))
> >     (set (match_dup 0) (ashiftrt:SI (match_dup 0) (match_dup 2)))]
> >  {
> > @@ -1766,15 +1772,20 @@
> >  ;; Handle AND with 2^N-1 for N from 12 to XLEN.  This can be split into
> >  ;; two logical shifts.  Otherwise it requires 3 instructions: lui,
> >  ;; xor/addi/srli, and.
> > +
> > +;; Generating a temporary for the shift output gives better combiner 
> > results;
> > +;; and also fixes a problem where op0 could be a paradoxical reg and 
> > shifting
> > +;; by amounts larger than the size of the SUBREG_REG doesn't work.
> >  (define_split
> >    [(set (match_operand:GPR 0 "register_operand")
> >         (and:GPR (match_operand:GPR 1 "register_operand")
> > -                (match_operand:GPR 2 "p2m1_shift_operand")))]
> > +                (match_operand:GPR 2 "p2m1_shift_operand")))
> > +   (clobber (match_operand:GPR 3 "register_operand"))]
> >    ""
> > - [(set (match_dup 0)
> > + [(set (match_dup 3)
> >         (ashift:GPR (match_dup 1) (match_dup 2)))
> >    (set (match_dup 0)
> > -       (lshiftrt:GPR (match_dup 0) (match_dup 2)))]
> > +       (lshiftrt:GPR (match_dup 3) (match_dup 2)))]
> >  {
> >    /* Op2 is a VOIDmode constant, so get the mode size from op1.  */
> >    operands[2] = GEN_INT (GET_MODE_BITSIZE (GET_MODE (operands[1]))
> > @@ -1786,12 +1797,13 @@
> >  (define_split
> >    [(set (match_operand:DI 0 "register_operand")
> >         (and:DI (match_operand:DI 1 "register_operand")
> > -               (match_operand:DI 2 "high_mask_shift_operand")))]
> > +               (match_operand:DI 2 "high_mask_shift_operand")))
> > +   (clobber (match_operand:DI 3 "register_operand"))]
> >    "TARGET_64BIT"
> > -  [(set (match_dup 0)
> > +  [(set (match_dup 3)
> >         (lshiftrt:DI (match_dup 1) (match_dup 2)))
> >     (set (match_dup 0)
> > -       (ashift:DI (match_dup 0) (match_dup 2)))]
> > +       (ashift:DI (match_dup 3) (match_dup 2)))]
> >  {
> >    operands[2] = GEN_INT (ctz_hwi (INTVAL (operands[2])));
> >  })
> > diff --git a/gcc/testsuite/gcc.c-torture/execute/pr91635.c 
> > b/gcc/testsuite/gcc.c-torture/execute/pr91635.c
> > new file mode 100644
> > index 00000000000..878a491fc36
> > --- /dev/null
> > +++ b/gcc/testsuite/gcc.c-torture/execute/pr91635.c
> > @@ -0,0 +1,57 @@
> > +/* PR target/91635 */
> > +
> > +#if __CHAR_BIT__ == 8 && __SIZEOF_SHORT__ == 2 \
> > +    && __SIZEOF_INT__ == 4 && __SIZEOF_LONG_LONG__ == 8
> > +unsigned short b, c;
> > +int u, v, w, x;
> > +
> > +__attribute__ ((noipa)) int
> > +foo (unsigned short c)
> > +{
> > +  c <<= __builtin_add_overflow (-c, -1, &b);
> > +  c >>= 1;
> > +  return c;
> > +}
> > +
> > +__attribute__ ((noipa)) int
> > +bar (unsigned short b)
> > +{
> > +  b <<= -14 & 15;
> > +  b = b >> -~1;
> > +  return b;
> > +}
> > +
> > +__attribute__ ((noipa)) int
> > +baz (unsigned short e)
> > +{
> > +  e <<= 1;
> > +  e >>= __builtin_add_overflow (8719476735, u, &v);
> > +  return e;
> > +}
> > +
> > +__attribute__ ((noipa)) int
> > +qux (unsigned int e)
> > +{
> > +  c = ~1;
> > +  c *= e;
> > +  c = c >> (-15 & 5);
> > +  return c + w + x;
> > +}
> > +#endif
> > +
> > +int
> > +main ()
> > +{
> > +#if __CHAR_BIT__ == 8 && __SIZEOF_SHORT__ == 2 \
> > +    && __SIZEOF_INT__ == 4 && __SIZEOF_LONG_LONG__ == 8
> > +  if (foo (0xffff) != 0x7fff)
> > +    __builtin_abort ();
> > +  if (bar (5) != 5)
> > +    __builtin_abort ();
> > +  if (baz (~0) != 0x7fff)
> > +    __builtin_abort ();
> > +  if (qux (2) != 0x7ffe)
> > +    __builtin_abort ();
> > +#endif
> > +  return 0;
> > +}
> > diff --git a/gcc/testsuite/gcc.target/riscv/shift-shift-4.c 
> > b/gcc/testsuite/gcc.target/riscv/shift-shift-4.c
> > new file mode 100644
> > index 00000000000..72a45ee87ae
> > --- /dev/null
> > +++ b/gcc/testsuite/gcc.target/riscv/shift-shift-4.c
> > @@ -0,0 +1,13 @@
> > +/* { dg-do compile } */
> > +/* { dg-options "-march=rv32i -mabi=ilp32 -O2" } */
> > +
> > +/* One zero-extend shift can be eliminated by modifying the constant in the
> > +   greater than test.  Started working after modifying the splitter
> > +   lshrsi3_zero_extend_3+1 to use a temporary reg for the first split 
> > dest.  */
> > +int
> > +sub (int i)
> > +{
> > +  i &= 0x7fffffff;
> > +  return i > 0x7f800000;
> > +}
> > +/* { dg-final { scan-assembler-not "srli" } } */
> > diff --git a/gcc/testsuite/gcc.target/riscv/shift-shift-5.c 
> > b/gcc/testsuite/gcc.target/riscv/shift-shift-5.c
> > new file mode 100644
> > index 00000000000..5b2ae89a471
> > --- /dev/null
> > +++ b/gcc/testsuite/gcc.target/riscv/shift-shift-5.c
> > @@ -0,0 +1,16 @@
> > +/* { dg-do compile } */
> > +/* { dg-options "-march=rv64gc -mabi=lp64d -O2" } */
> > +
> > +/* Fails if lshrsi3_zero_extend_3+1 uses a temp reg which has no REG_DEST
> > +   note.  */
> > +unsigned long
> > +sub (long l)
> > +{
> > +  union u {
> > +    struct s { int a : 19; unsigned int b : 13; int x; } s;
> > +    long l;
> > +  } u;
> > +  u.l = l;
> > +  return u.s.b;
> > +}
> > +/* { dg-final { scan-assembler "srliw" } } */
> > --
> > 2.17.1
> >
> 

-- 
Richard Biener <rguent...@suse.de>
SUSE Software Solutions Germany GmbH, Maxfeldstrasse 5, 90409 Nuernberg,
Germany; GF: Felix Imendörffer; HRB 247165 (AG München)

Reply via email to