Committed, thanks Juzhe.

On 2023/10/31 11:43, juzhe.zh...@rivai.ai wrote:
LGTM.

------------------------------------------------------------------------
juzhe.zh...@rivai.ai

    *From:* Lehua Ding <mailto:lehua.d...@rivai.ai>
    *Date:* 2023-10-31 11:39
    *To:* gcc-patches <mailto:gcc-patches@gcc.gnu.org>
    *CC:* juzhe.zhong <mailto:juzhe.zh...@rivai.ai>; kito.cheng
    <mailto:kito.ch...@gmail.com>; rdapp.gcc
    <mailto:rdapp....@gmail.com>; palmer <mailto:pal...@rivosinc.com>;
    jeffreyalaw <mailto:jeffreya...@gmail.com>; lehua.ding
    <mailto:lehua.d...@rivai.ai>
    *Subject:* [PATCH] RISC-V: Add the missed combine of [u]int64 ->
    _Float16 and vcond
    Hi,
    This patch let the INT64 to FP16 convert split to two small converts
    (INT64 -> FP32 and FP32 -> FP16) when expanding instead of dealy the
    split to split1 pass. This change could make it possible to combine
    the FP32 to FP16 and vcond patterns and so we don't need to add an
    combine pattern for INT64 to FP16 and vcond patterns.
    Consider this code:
       void
       foo (_Float16 *__restrict r, int64_t *__restrict a, _FLoat16
    *__restrict b,
            int64_t *__restrict pred, int n)
       {
         for (int i = 0; i < n; i += 1)
           {
             r[i] = pred[i] ? (_Float16) a[i] : b[i];
           }
       }
    Before this patch:
       ...
       vfncvt.f.f.w    v2,v2
       vmerge.vvm      v1,v1,v2,v0
       vse16.v v1,0(a0)
       ...
    After this patch:
       ...
       vfncvt.f.f.w    v1,v2,v0.t
       vse16.v v1,0(a0)
       ...
    gcc/ChangeLog:
    * config/riscv/autovec.md (<float_cvt><mode><vnnconvert>2):
    Change to define_expand.
    gcc/testsuite/ChangeLog:
    * gcc.target/riscv/rvv/autovec/cond/cond_convert_int2float-rv32-1.c:
    Add vfncvt.f.f.w assert.
    * gcc.target/riscv/rvv/autovec/cond/cond_convert_int2float-rv32-2.c:
    Ditto.
    * gcc.target/riscv/rvv/autovec/cond/cond_convert_int2float-rv64-1.c:
    Ditto.
    * gcc.target/riscv/rvv/autovec/cond/cond_convert_int2float-rv64-2.c:
    Ditto.
    ---
    gcc/config/riscv/autovec.md                                  | 5 +----
    .../riscv/rvv/autovec/cond/cond_convert_int2float-rv32-1.c   | 2 ++
    .../riscv/rvv/autovec/cond/cond_convert_int2float-rv32-2.c   | 2 ++
    .../riscv/rvv/autovec/cond/cond_convert_int2float-rv64-1.c   | 2 ++
    .../riscv/rvv/autovec/cond/cond_convert_int2float-rv64-2.c   | 2 ++
    5 files changed, 9 insertions(+), 4 deletions(-)
    diff --git a/gcc/config/riscv/autovec.md b/gcc/config/riscv/autovec.md
    index 5f49d73be44..bfd45dd76ff 100644
    --- a/gcc/config/riscv/autovec.md
    +++ b/gcc/config/riscv/autovec.md
    @@ -977,14 +977,11 @@
    ;; This operation can be performed in the loop vectorizer but
    unfortunately
    ;; not applicable for now. We can remove this pattern after loop
    vectorizer
    ;; is able to take care of INT64 to FP16 conversion.
    -(define_insn_and_split "<float_cvt><mode><vnnconvert>2"
    +(define_expand "<float_cvt><mode><vnnconvert>2"
        [(set (match_operand:<VNNCONVERT>  0 "register_operand")
    (any_float:<VNNCONVERT>
       (match_operand:VWWCONVERTI 1 "register_operand")))]
        "TARGET_VECTOR && TARGET_ZVFH && can_create_pseudo_p () &&
    !flag_trapping_math"
    -  "#"
    -  "&& 1"
    -  [(const_int 0)]
        {
          rtx single = gen_reg_rtx (<VNCONVERT>mode); /* Get vector SF
    mode.  */
    diff --git
    
a/gcc/testsuite/gcc.target/riscv/rvv/autovec/cond/cond_convert_int2float-rv32-1.c
 
b/gcc/testsuite/gcc.target/riscv/rvv/autovec/cond/cond_convert_int2float-rv32-1.c
    index f5d3bb4c789..030c8fe33ce 100644
    ---
    
a/gcc/testsuite/gcc.target/riscv/rvv/autovec/cond/cond_convert_int2float-rv32-1.c
    +++
    
b/gcc/testsuite/gcc.target/riscv/rvv/autovec/cond/cond_convert_int2float-rv32-1.c
    @@ -12,4 +12,6 @@
    /* { dg-final { scan-assembler-times
    {\tvfncvt\.f\.xu\.w\tv[0-9]+,v[0-9]+,v0\.t} 2 } } */
    /* { dg-final { scan-assembler-times
    {\tvfncvt\.f\.x\.w\tv[0-9]+,v[0-9]+,v0\.t} 2 } } */
    +/* { dg-final { scan-assembler-times
    {\tvfncvt\.f\.f\.w\tv[0-9]+,v[0-9]+,v0\.t} 2 } } */
    +
    /* { dg-final { scan-assembler
    {\tvsetvli\t[a-z0-9]+,[a-z0-9]+,e[0-9]+,m[f0-9]+,t[au],mu} } } */
    diff --git
    
a/gcc/testsuite/gcc.target/riscv/rvv/autovec/cond/cond_convert_int2float-rv32-2.c
 
b/gcc/testsuite/gcc.target/riscv/rvv/autovec/cond/cond_convert_int2float-rv32-2.c
    index f5d3bb4c789..030c8fe33ce 100644
    ---
    
a/gcc/testsuite/gcc.target/riscv/rvv/autovec/cond/cond_convert_int2float-rv32-2.c
    +++
    
b/gcc/testsuite/gcc.target/riscv/rvv/autovec/cond/cond_convert_int2float-rv32-2.c
    @@ -12,4 +12,6 @@
    /* { dg-final { scan-assembler-times
    {\tvfncvt\.f\.xu\.w\tv[0-9]+,v[0-9]+,v0\.t} 2 } } */
    /* { dg-final { scan-assembler-times
    {\tvfncvt\.f\.x\.w\tv[0-9]+,v[0-9]+,v0\.t} 2 } } */
    +/* { dg-final { scan-assembler-times
    {\tvfncvt\.f\.f\.w\tv[0-9]+,v[0-9]+,v0\.t} 2 } } */
    +
    /* { dg-final { scan-assembler
    {\tvsetvli\t[a-z0-9]+,[a-z0-9]+,e[0-9]+,m[f0-9]+,t[au],mu} } } */
    diff --git
    
a/gcc/testsuite/gcc.target/riscv/rvv/autovec/cond/cond_convert_int2float-rv64-1.c
 
b/gcc/testsuite/gcc.target/riscv/rvv/autovec/cond/cond_convert_int2float-rv64-1.c
    index 5ebed2f7fdc..d6298f5351a 100644
    ---
    
a/gcc/testsuite/gcc.target/riscv/rvv/autovec/cond/cond_convert_int2float-rv64-1.c
    +++
    
b/gcc/testsuite/gcc.target/riscv/rvv/autovec/cond/cond_convert_int2float-rv64-1.c
    @@ -12,4 +12,6 @@
    /* { dg-final { scan-assembler-times
    {\tvfncvt\.f\.xu\.w\tv[0-9]+,v[0-9]+,v0\.t} 2 } } */
    /* { dg-final { scan-assembler-times
    {\tvfncvt\.f\.x\.w\tv[0-9]+,v[0-9]+,v0\.t} 2 } } */
    +/* { dg-final { scan-assembler-times
    {\tvfncvt\.f\.f\.w\tv[0-9]+,v[0-9]+,v0\.t} 2 } } */
    +
    /* { dg-final { scan-assembler
    {\tvsetvli\t[a-z0-9]+,[a-z0-9]+,e[0-9]+,m[f0-9]+,t[au],mu} } } */
    diff --git
    
a/gcc/testsuite/gcc.target/riscv/rvv/autovec/cond/cond_convert_int2float-rv64-2.c
 
b/gcc/testsuite/gcc.target/riscv/rvv/autovec/cond/cond_convert_int2float-rv64-2.c
    index 097e377f107..23ad5f2b579 100644
    ---
    
a/gcc/testsuite/gcc.target/riscv/rvv/autovec/cond/cond_convert_int2float-rv64-2.c
    +++
    
b/gcc/testsuite/gcc.target/riscv/rvv/autovec/cond/cond_convert_int2float-rv64-2.c
    @@ -12,4 +12,6 @@
    /* { dg-final { scan-assembler-times
    {\tvfncvt\.f\.xu\.w\tv[0-9]+,v[0-9]+,v0\.t} 2 } } */
    /* { dg-final { scan-assembler-times
    {\tvfncvt\.f\.x\.w\tv[0-9]+,v[0-9]+,v0\.t} 2 } } */
    +/* { dg-final { scan-assembler-times
    {\tvfncvt\.f\.f\.w\tv[0-9]+,v[0-9]+,v0\.t} 2 } } */
    +
    /* { dg-final { scan-assembler
    {\tvsetvli\t[a-z0-9]+,[a-z0-9]+,e[0-9]+,m[f0-9]+,t[au],mu} } } */
-- 2.36.3


--
Best,
Lehua (RiVAI)
lehua.d...@rivai.ai

Reply via email to