Support INT <-> FP VLS auto-vectorization patterns. Regression passed. Committed.
gcc/ChangeLog: * config/riscv/autovec.md: Extend VLS modes. * config/riscv/vector-iterators.md: Ditto. * config/riscv/vector.md: Ditto. gcc/testsuite/ChangeLog: * gcc.target/riscv/rvv/autovec/vls/convert-1.c: New test. * gcc.target/riscv/rvv/autovec/vls/convert-10.c: New test. * gcc.target/riscv/rvv/autovec/vls/convert-11.c: New test. * gcc.target/riscv/rvv/autovec/vls/convert-12.c: New test. * gcc.target/riscv/rvv/autovec/vls/convert-2.c: New test. * gcc.target/riscv/rvv/autovec/vls/convert-3.c: New test. * gcc.target/riscv/rvv/autovec/vls/convert-4.c: New test. * gcc.target/riscv/rvv/autovec/vls/convert-5.c: New test. * gcc.target/riscv/rvv/autovec/vls/convert-6.c: New test. * gcc.target/riscv/rvv/autovec/vls/convert-7.c: New test. * gcc.target/riscv/rvv/autovec/vls/convert-8.c: New test. * gcc.target/riscv/rvv/autovec/vls/convert-9.c: New test. --- gcc/config/riscv/autovec.md | 12 +- gcc/config/riscv/vector-iterators.md | 202 ++++++++++++++++++ gcc/config/riscv/vector.md | 20 +- .../riscv/rvv/autovec/vls/convert-1.c | 74 +++++++ .../riscv/rvv/autovec/vls/convert-10.c | 80 +++++++ .../riscv/rvv/autovec/vls/convert-11.c | 54 +++++ .../riscv/rvv/autovec/vls/convert-12.c | 36 ++++ .../riscv/rvv/autovec/vls/convert-2.c | 74 +++++++ .../riscv/rvv/autovec/vls/convert-3.c | 58 +++++ .../riscv/rvv/autovec/vls/convert-4.c | 36 ++++ .../riscv/rvv/autovec/vls/convert-5.c | 80 +++++++ .../riscv/rvv/autovec/vls/convert-6.c | 55 +++++ .../riscv/rvv/autovec/vls/convert-7.c | 37 ++++ .../riscv/rvv/autovec/vls/convert-8.c | 58 +++++ .../riscv/rvv/autovec/vls/convert-9.c | 22 ++ 15 files changed, 882 insertions(+), 16 deletions(-) create mode 100644 gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-1.c create mode 100644 gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-10.c create mode 100644 gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-11.c create mode 100644 gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-12.c create mode 100644 gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-2.c create mode 100644 gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-3.c create mode 100644 gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-4.c create mode 100644 gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-5.c create mode 100644 gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-6.c create mode 100644 gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-7.c create mode 100644 gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-8.c create mode 100644 gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-9.c diff --git a/gcc/config/riscv/autovec.md b/gcc/config/riscv/autovec.md index 75ed7ae4f2e..55c0a04df3b 100644 --- a/gcc/config/riscv/autovec.md +++ b/gcc/config/riscv/autovec.md @@ -847,7 +847,7 @@ (define_insn_and_split "<optab><mode><vconvert>2" [(set (match_operand:<VCONVERT> 0 "register_operand") (any_fix:<VCONVERT> - (match_operand:VF 1 "register_operand")))] + (match_operand:V_VLSF 1 "register_operand")))] "TARGET_VECTOR && can_create_pseudo_p ()" "#" "&& 1" @@ -868,8 +868,8 @@ ;; ------------------------------------------------------------------------- (define_insn_and_split "<float_cvt><vconvert><mode>2" - [(set (match_operand:VF 0 "register_operand") - (any_float:VF + [(set (match_operand:V_VLSF 0 "register_operand") + (any_float:V_VLSF (match_operand:<VCONVERT> 1 "register_operand")))] "TARGET_VECTOR && can_create_pseudo_p ()" "#" @@ -916,8 +916,8 @@ ;; - vfwcvt.f.x.v ;; ------------------------------------------------------------------------- (define_insn_and_split "<float_cvt><vnconvert><mode>2" - [(set (match_operand:VF 0 "register_operand") - (any_float:VF + [(set (match_operand:V_VLSF 0 "register_operand") + (any_float:V_VLSF (match_operand:<VNCONVERT> 1 "register_operand")))] "TARGET_VECTOR && can_create_pseudo_p ()" "#" @@ -940,7 +940,7 @@ (define_insn_and_split "<optab><mode><vnconvert>2" [(set (match_operand:<VNCONVERT> 0 "register_operand") (any_fix:<VNCONVERT> - (match_operand:VF 1 "register_operand")))] + (match_operand:V_VLSF 1 "register_operand")))] "TARGET_VECTOR && can_create_pseudo_p ()" "#" "&& 1" diff --git a/gcc/config/riscv/vector-iterators.md b/gcc/config/riscv/vector-iterators.md index 053d84c0c7d..19f3ec3ef74 100644 --- a/gcc/config/riscv/vector-iterators.md +++ b/gcc/config/riscv/vector-iterators.md @@ -1037,6 +1037,28 @@ (RVVM4DI "TARGET_VECTOR_ELEN_64 && TARGET_VECTOR_ELEN_FP_32") (RVVM2DI "TARGET_VECTOR_ELEN_64 && TARGET_VECTOR_ELEN_FP_32") (RVVM1DI "TARGET_VECTOR_ELEN_64 && TARGET_VECTOR_ELEN_FP_32") + + (V1SI "TARGET_VECTOR_VLS && TARGET_ZVFH") + (V2SI "TARGET_VECTOR_VLS && TARGET_ZVFH") + (V4SI "TARGET_VECTOR_VLS && TARGET_ZVFH") + (V8SI "TARGET_VECTOR_VLS && TARGET_ZVFH") + (V16SI "TARGET_VECTOR_VLS && TARGET_ZVFH && TARGET_MIN_VLEN >= 64") + (V32SI "TARGET_VECTOR_VLS && TARGET_ZVFH && TARGET_MIN_VLEN >= 128") + (V64SI "TARGET_VECTOR_VLS && TARGET_ZVFH && TARGET_MIN_VLEN >= 256") + (V128SI "TARGET_VECTOR_VLS && TARGET_ZVFH && TARGET_MIN_VLEN >= 512") + (V256SI "TARGET_VECTOR_VLS && TARGET_ZVFH && TARGET_MIN_VLEN >= 1024") + (V512SI "TARGET_VECTOR_VLS && TARGET_ZVFH && TARGET_MIN_VLEN >= 2048") + (V1024SI "TARGET_VECTOR_VLS && TARGET_ZVFH && TARGET_MIN_VLEN >= 4096") + (V1DI "TARGET_VECTOR_VLS && TARGET_VECTOR_ELEN_64 && TARGET_VECTOR_ELEN_FP_32") + (V2DI "TARGET_VECTOR_VLS && TARGET_VECTOR_ELEN_64 && TARGET_VECTOR_ELEN_FP_32") + (V4DI "TARGET_VECTOR_VLS && TARGET_VECTOR_ELEN_64 && TARGET_VECTOR_ELEN_FP_32") + (V8DI "TARGET_VECTOR_VLS && TARGET_VECTOR_ELEN_64 && TARGET_VECTOR_ELEN_FP_32 && TARGET_MIN_VLEN >= 64") + (V16DI "TARGET_VECTOR_VLS && TARGET_VECTOR_ELEN_64 && TARGET_VECTOR_ELEN_FP_32 && TARGET_MIN_VLEN >= 128") + (V32DI "TARGET_VECTOR_VLS && TARGET_VECTOR_ELEN_64 && TARGET_VECTOR_ELEN_FP_32 && TARGET_MIN_VLEN >= 256") + (V64DI "TARGET_VECTOR_VLS && TARGET_VECTOR_ELEN_64 && TARGET_VECTOR_ELEN_FP_32 && TARGET_MIN_VLEN >= 512") + (V128DI "TARGET_VECTOR_VLS && TARGET_VECTOR_ELEN_64 && TARGET_VECTOR_ELEN_FP_32 && TARGET_MIN_VLEN >= 1024") + (V256DI "TARGET_VECTOR_VLS && TARGET_VECTOR_ELEN_64 && TARGET_VECTOR_ELEN_FP_32 && TARGET_MIN_VLEN >= 2048") + (V512DI "TARGET_VECTOR_VLS && TARGET_VECTOR_ELEN_64 && TARGET_VECTOR_ELEN_FP_32 && TARGET_MIN_VLEN >= 4096") ]) (define_mode_iterator VQEXTI [ @@ -2635,12 +2657,80 @@ (RVVM8HF "RVVM8HI") (RVVM4HF "RVVM4HI") (RVVM2HF "RVVM2HI") (RVVM1HF "RVVM1HI") (RVVMF2HF "RVVMF2HI") (RVVMF4HF "RVVMF4HI") (RVVM8SF "RVVM8SI") (RVVM4SF "RVVM4SI") (RVVM2SF "RVVM2SI") (RVVM1SF "RVVM1SI") (RVVMF2SF "RVVMF2SI") (RVVM8DF "RVVM8DI") (RVVM4DF "RVVM4DI") (RVVM2DF "RVVM2DI") (RVVM1DF "RVVM1DI") + + (V1HF "V1HI") + (V2HF "V2HI") + (V4HF "V4HI") + (V8HF "V8HI") + (V16HF "V16HI") + (V32HF "V32HI") + (V64HF "V64HI") + (V128HF "V128HI") + (V256HF "V256HI") + (V512HF "V512HI") + (V1024HF "V1024HI") + (V2048HF "V2048HI") + (V1SF "V1SI") + (V2SF "V2SI") + (V4SF "V4SI") + (V8SF "V8SI") + (V16SF "V16SI") + (V32SF "V32SI") + (V64SF "V64SI") + (V128SF "V128SI") + (V256SF "V256SI") + (V512SF "V512SI") + (V1024SF "V1024SI") + (V1DF "V1DI") + (V2DF "V2DI") + (V4DF "V4DI") + (V8DF "V8DI") + (V16DF "V16DI") + (V32DF "V32DI") + (V64DF "V64DI") + (V128DF "V128DI") + (V256DF "V256DI") + (V512DF "V512DI") ]) (define_mode_attr vconvert [ (RVVM8HF "rvvm8hi") (RVVM4HF "rvvm4hi") (RVVM2HF "rvvm2hi") (RVVM1HF "rvvm1hi") (RVVMF2HF "rvvmf2hi") (RVVMF4HF "rvvmf4hi") (RVVM8SF "rvvm8si") (RVVM4SF "rvvm4si") (RVVM2SF "rvvm2si") (RVVM1SF "rvvm1si") (RVVMF2SF "rvvmf2si") (RVVM8DF "rvvm8di") (RVVM4DF "rvvm4di") (RVVM2DF "rvvm2di") (RVVM1DF "rvvm1di") + + (V1HF "v1hi") + (V2HF "v2hi") + (V4HF "v4hi") + (V8HF "v8hi") + (V16HF "v16hi") + (V32HF "v32hi") + (V64HF "v64hi") + (V128HF "v128hi") + (V256HF "v256hi") + (V512HF "v512hi") + (V1024HF "v1024hi") + (V2048HF "v2048hi") + (V1SF "v1si") + (V2SF "v2si") + (V4SF "v4si") + (V8SF "v8si") + (V16SF "v16si") + (V32SF "v32si") + (V64SF "v64si") + (V128SF "v128si") + (V256SF "v256si") + (V512SF "v512si") + (V1024SF "v1024si") + (V1DF "v1di") + (V2DF "v2di") + (V4DF "v4di") + (V8DF "v8di") + (V16DF "v16di") + (V32DF "v32di") + (V64DF "v64di") + (V128DF "v128di") + (V256DF "v256di") + (V512DF "v512di") ]) (define_mode_attr VNCONVERT [ @@ -2651,6 +2741,62 @@ (RVVM8DI "RVVM4SF") (RVVM4DI "RVVM2SF") (RVVM2DI "RVVM1SF") (RVVM1DI "RVVMF2SF") (RVVM8DF "RVVM4SI") (RVVM4DF "RVVM2SI") (RVVM2DF "RVVM1SI") (RVVM1DF "RVVMF2SI") + + (V1SI "V1HF") + (V2SI "V2HF") + (V4SI "V4HF") + (V8SI "V8HF") + (V16SI "V16HF") + (V32SI "V32HF") + (V64SI "V64HF") + (V128SI "V128HF") + (V256SI "V256HF") + (V512SI "V512HF") + (V1024SI "V1024HF") + (V1DI "V1SF") + (V2DI "V2SF") + (V4DI "V4SF") + (V8DI "V8SF") + (V16DI "V16SF") + (V32DI "V32SF") + (V64DI "V64SF") + (V128DI "V128SF") + (V256DI "V256SF") + (V512DI "V512SF") + + (V1HF "V1QI") + (V2HF "V2QI") + (V4HF "V4QI") + (V8HF "V8QI") + (V16HF "V16QI") + (V32HF "V32QI") + (V64HF "V64QI") + (V128HF "V128QI") + (V256HF "V256QI") + (V512HF "V512QI") + (V1024HF "V1024QI") + (V2048HF "V2048QI") + (V1SF "V1HI") + (V2SF "V2HI") + (V4SF "V4HI") + (V8SF "V8HI") + (V16SF "V16HI") + (V32SF "V32HI") + (V64SF "V64HI") + (V128SF "V128HI") + (V256SF "V256HI") + (V512SF "V512HI") + (V1024SF "V1024HI") + (V1DF "V1SI") + (V2DF "V2SI") + (V4DF "V4SI") + (V8DF "V8SI") + (V16DF "V16SI") + (V32DF "V32SI") + (V64DF "V64SI") + (V128DF "V128SI") + (V256DF "V256SI") + (V512DF "V512SI") ]) (define_mode_attr vnconvert [ @@ -2661,6 +2807,62 @@ (RVVM8DI "rvvm4sf") (RVVM4DI "rvvm2sf") (RVVM2DI "rvvm1sf") (RVVM1DI "rvvmf2sf") (RVVM8DF "rvvm4si") (RVVM4DF "rvvm2si") (RVVM2DF "rvvm1si") (RVVM1DF "rvvmf2si") + + (V1SI "v1hf") + (V2SI "v2hf") + (V4SI "v4hf") + (V8SI "v8hf") + (V16SI "v16hf") + (V32SI "v32hf") + (V64SI "v64hf") + (V128SI "v128hf") + (V256SI "v256hf") + (V512SI "v512hf") + (V1024SI "v1024hf") + (V1DI "v1sf") + (V2DI "v2sf") + (V4DI "v4sf") + (V8DI "v8sf") + (V16DI "v16sf") + (V32DI "v32sf") + (V64DI "v64sf") + (V128DI "v128sf") + (V256DI "v256sf") + (V512DI "v512sf") + + (V1HF "v1qi") + (V2HF "v2qi") + (V4HF "v4qi") + (V8HF "v8qi") + (V16HF "v16qi") + (V32HF "v32qi") + (V64HF "v64qi") + (V128HF "v128qi") + (V256HF "v256qi") + (V512HF "v512qi") + (V1024HF "v1024qi") + (V2048HF "v2048qi") + (V1SF "v1hi") + (V2SF "v2hi") + (V4SF "v4hi") + (V8SF "v8hi") + (V16SF "v16hi") + (V32SF "v32hi") + (V64SF "v64hi") + (V128SF "v128hi") + (V256SF "v256hi") + (V512SF "v512hi") + (V1024SF "v1024hi") + (V1DF "v1si") + (V2DF "v2si") + (V4DF "v4si") + (V8DF "v8si") + (V16DF "v16si") + (V32DF "v32si") + (V64DF "v64si") + (V128DF "v128si") + (V256DF "v256si") + (V512DF "v512si") ]) (define_mode_attr VDEMOTE [ diff --git a/gcc/config/riscv/vector.md b/gcc/config/riscv/vector.md index f66ffebba24..79c4a4bda53 100644 --- a/gcc/config/riscv/vector.md +++ b/gcc/config/riscv/vector.md @@ -7451,7 +7451,7 @@ (reg:SI VL_REGNUM) (reg:SI VTYPE_REGNUM)] UNSPEC_VPREDICATE) (any_fix:<VCONVERT> - (match_operand:VF 3 "register_operand" " vr, vr, vr, vr")) + (match_operand:V_VLSF 3 "register_operand" " vr, vr, vr, vr")) (match_operand:<VCONVERT> 2 "vector_merge_operand" " vu, 0, vu, 0")))] "TARGET_VECTOR" "vfcvt.rtz.x<u>.f.v\t%0,%3%p1" @@ -7459,8 +7459,8 @@ (set_attr "mode" "<MODE>")]) (define_insn "@pred_<float_cvt><mode>" - [(set (match_operand:VF 0 "register_operand" "=vd, vd, vr, vr") - (if_then_else:VF + [(set (match_operand:V_VLSF 0 "register_operand" "=vd, vd, vr, vr") + (if_then_else:V_VLSF (unspec:<VM> [(match_operand:<VM> 1 "vector_mask_operand" " vm, vm,Wc1,Wc1") (match_operand 4 "vector_length_operand" " rK, rK, rK, rK") @@ -7471,9 +7471,9 @@ (reg:SI VL_REGNUM) (reg:SI VTYPE_REGNUM) (reg:SI FRM_REGNUM)] UNSPEC_VPREDICATE) - (any_float:VF + (any_float:V_VLSF (match_operand:<VCONVERT> 3 "register_operand" " vr, vr, vr, vr")) - (match_operand:VF 2 "vector_merge_operand" " vu, 0, vu, 0")))] + (match_operand:V_VLSF 2 "vector_merge_operand" " vu, 0, vu, 0")))] "TARGET_VECTOR" "vfcvt.f.x<u>.v\t%0,%3%p1" [(set_attr "type" "vfcvtitof") @@ -7531,8 +7531,8 @@ (set_attr "mode" "<VNCONVERT>")]) (define_insn "@pred_widen_<float_cvt><mode>" - [(set (match_operand:VF 0 "register_operand" "=&vr, &vr") - (if_then_else:VF + [(set (match_operand:V_VLSF 0 "register_operand" "=&vr, &vr") + (if_then_else:V_VLSF (unspec:<VM> [(match_operand:<VM> 1 "vector_mask_operand" "vmWc1,vmWc1") (match_operand 4 "vector_length_operand" " rK, rK") @@ -7541,9 +7541,9 @@ (match_operand 7 "const_int_operand" " i, i") (reg:SI VL_REGNUM) (reg:SI VTYPE_REGNUM)] UNSPEC_VPREDICATE) - (any_float:VF + (any_float:V_VLSF (match_operand:<VNCONVERT> 3 "register_operand" " vr, vr")) - (match_operand:VF 2 "vector_merge_operand" " vu, 0")))] + (match_operand:V_VLSF 2 "vector_merge_operand" " vu, 0")))] "TARGET_VECTOR" "vfwcvt.f.x<u>.v\t%0,%3%p1" [(set_attr "type" "vfwcvtitof") @@ -7610,7 +7610,7 @@ (reg:SI VL_REGNUM) (reg:SI VTYPE_REGNUM)] UNSPEC_VPREDICATE) (any_fix:<VNCONVERT> - (match_operand:VF 3 "register_operand" " 0, 0, 0, 0, vr, vr")) + (match_operand:V_VLSF 3 "register_operand" " 0, 0, 0, 0, vr, vr")) (match_operand:<VNCONVERT> 2 "vector_merge_operand" " vu, 0, vu, 0, vu, 0")))] "TARGET_VECTOR" "vfncvt.rtz.x<u>.f.w\t%0,%3%p1" diff --git a/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-1.c b/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-1.c new file mode 100644 index 00000000000..ca04f7f382e --- /dev/null +++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-1.c @@ -0,0 +1,74 @@ +/* { dg-do compile } */ +/* { dg-options "-march=rv64gcv_zvfh_zvl4096b -mabi=lp64d -O3 --param=riscv-autovec-lmul=m8 -fdump-tree-optimized" } */ + +#include "def.h" + +DEF_CONVERT (fcvt, _Float16, int16_t, 4) +DEF_CONVERT (fcvt, _Float16, int16_t, 16) +DEF_CONVERT (fcvt, _Float16, int16_t, 32) +DEF_CONVERT (fcvt, _Float16, int16_t, 64) +DEF_CONVERT (fcvt, _Float16, int16_t, 128) +DEF_CONVERT (fcvt, _Float16, int16_t, 256) +DEF_CONVERT (fcvt, _Float16, int16_t, 512) +DEF_CONVERT (fcvt, _Float16, int16_t, 1024) +DEF_CONVERT (fcvt, _Float16, int16_t, 2048) + +DEF_CONVERT (fcvt, float, int32_t, 4) +DEF_CONVERT (fcvt, float, int32_t, 16) +DEF_CONVERT (fcvt, float, int32_t, 32) +DEF_CONVERT (fcvt, float, int32_t, 64) +DEF_CONVERT (fcvt, float, int32_t, 128) +DEF_CONVERT (fcvt, float, int32_t, 256) +DEF_CONVERT (fcvt, float, int32_t, 512) +DEF_CONVERT (fcvt, float, int32_t, 1024) + +DEF_CONVERT (fcvt, double, int64_t, 4) +DEF_CONVERT (fcvt, double, int64_t, 16) +DEF_CONVERT (fcvt, double, int64_t, 32) +DEF_CONVERT (fcvt, double, int64_t, 64) +DEF_CONVERT (fcvt, double, int64_t, 128) +DEF_CONVERT (fcvt, double, int64_t, 256) +DEF_CONVERT (fcvt, double, int64_t, 512) + +DEF_CONVERT (fcvt, _Float16, uint16_t, 4) +DEF_CONVERT (fcvt, _Float16, uint16_t, 16) +DEF_CONVERT (fcvt, _Float16, uint16_t, 32) +DEF_CONVERT (fcvt, _Float16, uint16_t, 64) +DEF_CONVERT (fcvt, _Float16, uint16_t, 128) +DEF_CONVERT (fcvt, _Float16, uint16_t, 256) +DEF_CONVERT (fcvt, _Float16, uint16_t, 512) +DEF_CONVERT (fcvt, _Float16, uint16_t, 1024) +DEF_CONVERT (fcvt, _Float16, uint16_t, 2048) + +DEF_CONVERT (fcvt, float, uint32_t, 4) +DEF_CONVERT (fcvt, float, uint32_t, 16) +DEF_CONVERT (fcvt, float, uint32_t, 32) +DEF_CONVERT (fcvt, float, uint32_t, 64) +DEF_CONVERT (fcvt, float, uint32_t, 128) +DEF_CONVERT (fcvt, float, uint32_t, 256) +DEF_CONVERT (fcvt, float, uint32_t, 512) +DEF_CONVERT (fcvt, float, uint32_t, 1024) + +DEF_CONVERT (fcvt, double, uint64_t, 4) +DEF_CONVERT (fcvt, double, uint64_t, 16) +DEF_CONVERT (fcvt, double, uint64_t, 32) +DEF_CONVERT (fcvt, double, uint64_t, 64) +DEF_CONVERT (fcvt, double, uint64_t, 128) +DEF_CONVERT (fcvt, double, uint64_t, 256) +DEF_CONVERT (fcvt, double, uint64_t, 512) + +/* { dg-final { scan-assembler-times {vfcvt\.rtz\.x\.f\.v} 24 } } */ +/* { dg-final { scan-assembler-times {vfcvt\.rtz\.xu\.f\.v} 24 } } */ +/* { dg-final { scan-assembler-not {csrr} } } */ +/* { dg-final { scan-tree-dump-not "1,1" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "2,2" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "4,4" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "16,16" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "32,32" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "64,64" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "128,128" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "256,256" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "512,512" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "1024,1024" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "2048,2048" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "4096,4096" "optimized" } } */ diff --git a/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-10.c b/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-10.c new file mode 100644 index 00000000000..95d04cd814c --- /dev/null +++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-10.c @@ -0,0 +1,80 @@ +/* { dg-do compile } */ +/* { dg-options "-march=rv64gcv_zvfh_zvl4096b -mabi=lp64d -O3 --param=riscv-autovec-lmul=m8 -fdump-tree-optimized" } */ + +#include "def.h" + +DEF_CONVERT (fncvt, _Float16, int8_t, 4) +DEF_CONVERT (fncvt, _Float16, int8_t, 16) +DEF_CONVERT (fncvt, _Float16, int8_t, 32) +DEF_CONVERT (fncvt, _Float16, int8_t, 64) +DEF_CONVERT (fncvt, _Float16, int8_t, 128) +DEF_CONVERT (fncvt, _Float16, int8_t, 256) +DEF_CONVERT (fncvt, _Float16, int8_t, 512) +DEF_CONVERT (fncvt, _Float16, int8_t, 1024) +DEF_CONVERT (fncvt, _Float16, int8_t, 2048) +DEF_CONVERT (fncvt, _Float16, int8_t, 4096) + +DEF_CONVERT (fncvt, _Float16, uint8_t, 4) +DEF_CONVERT (fncvt, _Float16, uint8_t, 16) +DEF_CONVERT (fncvt, _Float16, uint8_t, 32) +DEF_CONVERT (fncvt, _Float16, uint8_t, 64) +DEF_CONVERT (fncvt, _Float16, uint8_t, 128) +DEF_CONVERT (fncvt, _Float16, uint8_t, 256) +DEF_CONVERT (fncvt, _Float16, uint8_t, 512) +DEF_CONVERT (fncvt, _Float16, uint8_t, 1024) +DEF_CONVERT (fncvt, _Float16, uint8_t, 2048) +DEF_CONVERT (fncvt, _Float16, uint8_t, 4096) + +DEF_CONVERT (fncvt, float, int16_t, 4) +DEF_CONVERT (fncvt, float, int16_t, 16) +DEF_CONVERT (fncvt, float, int16_t, 32) +DEF_CONVERT (fncvt, float, int16_t, 64) +DEF_CONVERT (fncvt, float, int16_t, 128) +DEF_CONVERT (fncvt, float, int16_t, 256) +DEF_CONVERT (fncvt, float, int16_t, 512) +DEF_CONVERT (fncvt, float, int16_t, 1024) +DEF_CONVERT (fncvt, float, int16_t, 2048) + +DEF_CONVERT (fncvt, float, uint16_t, 4) +DEF_CONVERT (fncvt, float, uint16_t, 16) +DEF_CONVERT (fncvt, float, uint16_t, 32) +DEF_CONVERT (fncvt, float, uint16_t, 64) +DEF_CONVERT (fncvt, float, uint16_t, 128) +DEF_CONVERT (fncvt, float, uint16_t, 256) +DEF_CONVERT (fncvt, float, uint16_t, 512) +DEF_CONVERT (fncvt, float, uint16_t, 1024) +DEF_CONVERT (fncvt, float, uint16_t, 2048) + +DEF_CONVERT (fncvt, double, int32_t, 4) +DEF_CONVERT (fncvt, double, int32_t, 16) +DEF_CONVERT (fncvt, double, int32_t, 32) +DEF_CONVERT (fncvt, double, int32_t, 64) +DEF_CONVERT (fncvt, double, int32_t, 128) +DEF_CONVERT (fncvt, double, int32_t, 256) +DEF_CONVERT (fncvt, double, int32_t, 512) +DEF_CONVERT (fncvt, double, int32_t, 1024) + +DEF_CONVERT (fncvt, double, uint32_t, 4) +DEF_CONVERT (fncvt, double, uint32_t, 16) +DEF_CONVERT (fncvt, double, uint32_t, 32) +DEF_CONVERT (fncvt, double, uint32_t, 64) +DEF_CONVERT (fncvt, double, uint32_t, 128) +DEF_CONVERT (fncvt, double, uint32_t, 256) +DEF_CONVERT (fncvt, double, uint32_t, 512) +DEF_CONVERT (fncvt, double, uint32_t, 1024) + +/* { dg-final { scan-assembler-times {vfncvt\.rtz\.x\.f\.w} 30 } } */ +/* { dg-final { scan-assembler-times {vfncvt\.rtz\.xu\.f\.w} 30 } } */ +/* { dg-final { scan-assembler-not {csrr} } } */ +/* { dg-final { scan-tree-dump-not "1,1" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "2,2" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "4,4" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "16,16" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "32,32" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "64,64" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "128,128" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "256,256" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "512,512" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "1024,1024" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "2048,2048" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "4096,4096" "optimized" } } */ diff --git a/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-11.c b/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-11.c new file mode 100644 index 00000000000..853acb3226b --- /dev/null +++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-11.c @@ -0,0 +1,54 @@ +/* { dg-do compile } */ +/* { dg-options "-march=rv64gcv_zvfh_zvl4096b -mabi=lp64d -O3 --param=riscv-autovec-lmul=m8 -fno-trapping-math -fdump-tree-optimized" } */ + +#include "def.h" + +DEF_CONVERT (fncvt, float, int8_t, 4) +DEF_CONVERT (fncvt, float, int8_t, 16) +DEF_CONVERT (fncvt, float, int8_t, 32) +DEF_CONVERT (fncvt, float, int8_t, 64) +DEF_CONVERT (fncvt, float, int8_t, 128) +DEF_CONVERT (fncvt, float, int8_t, 256) +DEF_CONVERT (fncvt, float, int8_t, 512) +DEF_CONVERT (fncvt, float, int8_t, 1024) + +DEF_CONVERT (fncvt, float, uint8_t, 4) +DEF_CONVERT (fncvt, float, uint8_t, 16) +DEF_CONVERT (fncvt, float, uint8_t, 32) +DEF_CONVERT (fncvt, float, uint8_t, 64) +DEF_CONVERT (fncvt, float, uint8_t, 128) +DEF_CONVERT (fncvt, float, uint8_t, 256) +DEF_CONVERT (fncvt, float, uint8_t, 512) +DEF_CONVERT (fncvt, float, uint8_t, 1024) + +DEF_CONVERT (fncvt, double, int16_t, 4) +DEF_CONVERT (fncvt, double, int16_t, 16) +DEF_CONVERT (fncvt, double, int16_t, 32) +DEF_CONVERT (fncvt, double, int16_t, 64) +DEF_CONVERT (fncvt, double, int16_t, 128) +DEF_CONVERT (fncvt, double, int16_t, 256) +DEF_CONVERT (fncvt, double, int16_t, 512) + +DEF_CONVERT (fncvt, double, uint16_t, 4) +DEF_CONVERT (fncvt, double, uint16_t, 16) +DEF_CONVERT (fncvt, double, uint16_t, 32) +DEF_CONVERT (fncvt, double, uint16_t, 64) +DEF_CONVERT (fncvt, double, uint16_t, 128) +DEF_CONVERT (fncvt, double, uint16_t, 256) +DEF_CONVERT (fncvt, double, uint16_t, 512) + +/* { dg-final { scan-assembler-times {vfncvt\.rtz\.x\.f.w} 30 } } */ +/* { dg-final { scan-assembler-times {vncvt\.x\.x\.w} 30 } } */ +/* { dg-final { scan-assembler-not {csrr} } } */ +/* { dg-final { scan-tree-dump-not "1,1" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "2,2" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "4,4" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "16,16" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "32,32" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "64,64" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "128,128" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "256,256" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "512,512" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "1024,1024" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "2048,2048" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "4096,4096" "optimized" } } */ diff --git a/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-12.c b/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-12.c new file mode 100644 index 00000000000..8fdfa447585 --- /dev/null +++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-12.c @@ -0,0 +1,36 @@ +/* { dg-do compile } */ +/* { dg-options "-march=rv64gcv_zvfh_zvl4096b -mabi=lp64d -O3 --param=riscv-autovec-lmul=m8 -fno-trapping-math -fdump-tree-optimized" } */ + +#include "def.h" + +DEF_CONVERT (fncvt, double, int8_t, 4) +DEF_CONVERT (fncvt, double, int8_t, 16) +DEF_CONVERT (fncvt, double, int8_t, 32) +DEF_CONVERT (fncvt, double, int8_t, 64) +DEF_CONVERT (fncvt, double, int8_t, 128) +DEF_CONVERT (fncvt, double, int8_t, 256) +DEF_CONVERT (fncvt, double, int8_t, 512) + +DEF_CONVERT (fncvt, double, uint8_t, 4) +DEF_CONVERT (fncvt, double, uint8_t, 16) +DEF_CONVERT (fncvt, double, uint8_t, 32) +DEF_CONVERT (fncvt, double, uint8_t, 64) +DEF_CONVERT (fncvt, double, uint8_t, 128) +DEF_CONVERT (fncvt, double, uint8_t, 256) +DEF_CONVERT (fncvt, double, uint8_t, 512) + +/* { dg-final { scan-assembler-times {vfncvt\.rtz\.x\.f.w} 14 } } */ +/* { dg-final { scan-assembler-times {vncvt\.x\.x\.w} 28 } } */ +/* { dg-final { scan-assembler-not {csrr} } } */ +/* { dg-final { scan-tree-dump-not "1,1" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "2,2" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "4,4" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "16,16" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "32,32" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "64,64" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "128,128" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "256,256" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "512,512" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "1024,1024" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "2048,2048" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "4096,4096" "optimized" } } */ diff --git a/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-2.c b/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-2.c new file mode 100644 index 00000000000..4b6a168625c --- /dev/null +++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-2.c @@ -0,0 +1,74 @@ +/* { dg-do compile } */ +/* { dg-options "-march=rv64gcv_zvfh_zvl4096b -mabi=lp64d -O3 --param=riscv-autovec-lmul=m8 -fdump-tree-optimized" } */ + +#include "def.h" + +DEF_CONVERT (fcvt, int16_t, _Float16, 4) +DEF_CONVERT (fcvt, int16_t, _Float16, 16) +DEF_CONVERT (fcvt, int16_t, _Float16, 32) +DEF_CONVERT (fcvt, int16_t, _Float16, 64) +DEF_CONVERT (fcvt, int16_t, _Float16, 128) +DEF_CONVERT (fcvt, int16_t, _Float16, 256) +DEF_CONVERT (fcvt, int16_t, _Float16, 512) +DEF_CONVERT (fcvt, int16_t, _Float16, 1024) +DEF_CONVERT (fcvt, int16_t, _Float16, 2048) + +DEF_CONVERT (fcvt, int32_t, float, 4) +DEF_CONVERT (fcvt, int32_t, float, 16) +DEF_CONVERT (fcvt, int32_t, float, 32) +DEF_CONVERT (fcvt, int32_t, float, 64) +DEF_CONVERT (fcvt, int32_t, float, 128) +DEF_CONVERT (fcvt, int32_t, float, 256) +DEF_CONVERT (fcvt, int32_t, float, 512) +DEF_CONVERT (fcvt, int32_t, float, 1024) + +DEF_CONVERT (fcvt, int64_t, double, 4) +DEF_CONVERT (fcvt, int64_t, double, 16) +DEF_CONVERT (fcvt, int64_t, double, 32) +DEF_CONVERT (fcvt, int64_t, double, 64) +DEF_CONVERT (fcvt, int64_t, double, 128) +DEF_CONVERT (fcvt, int64_t, double, 256) +DEF_CONVERT (fcvt, int64_t, double, 512) + +DEF_CONVERT (fcvt, uint16_t, _Float16, 4) +DEF_CONVERT (fcvt, uint16_t, _Float16, 16) +DEF_CONVERT (fcvt, uint16_t, _Float16, 32) +DEF_CONVERT (fcvt, uint16_t, _Float16, 64) +DEF_CONVERT (fcvt, uint16_t, _Float16, 128) +DEF_CONVERT (fcvt, uint16_t, _Float16, 256) +DEF_CONVERT (fcvt, uint16_t, _Float16, 512) +DEF_CONVERT (fcvt, uint16_t, _Float16, 1024) +DEF_CONVERT (fcvt, uint16_t, _Float16, 2048) + +DEF_CONVERT (fcvt, uint32_t, float, 4) +DEF_CONVERT (fcvt, uint32_t, float, 16) +DEF_CONVERT (fcvt, uint32_t, float, 32) +DEF_CONVERT (fcvt, uint32_t, float, 64) +DEF_CONVERT (fcvt, uint32_t, float, 128) +DEF_CONVERT (fcvt, uint32_t, float, 256) +DEF_CONVERT (fcvt, uint32_t, float, 512) +DEF_CONVERT (fcvt, uint32_t, float, 1024) + +DEF_CONVERT (fcvt, uint64_t, double, 4) +DEF_CONVERT (fcvt, uint64_t, double, 16) +DEF_CONVERT (fcvt, uint64_t, double, 32) +DEF_CONVERT (fcvt, uint64_t, double, 64) +DEF_CONVERT (fcvt, uint64_t, double, 128) +DEF_CONVERT (fcvt, uint64_t, double, 256) +DEF_CONVERT (fcvt, uint64_t, double, 512) + +/* { dg-final { scan-assembler-times {vfcvt\.f\.x\.v} 24 } } */ +/* { dg-final { scan-assembler-times {vfcvt\.f\.xu\.v} 24 } } */ +/* { dg-final { scan-assembler-not {csrr} } } */ +/* { dg-final { scan-tree-dump-not "1,1" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "2,2" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "4,4" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "16,16" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "32,32" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "64,64" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "128,128" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "256,256" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "512,512" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "1024,1024" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "2048,2048" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "4096,4096" "optimized" } } */ diff --git a/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-3.c b/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-3.c new file mode 100644 index 00000000000..6d74bdd35d4 --- /dev/null +++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-3.c @@ -0,0 +1,58 @@ +/* { dg-do compile } */ +/* { dg-options "-march=rv64gcv_zvfh_zvl4096b -mabi=lp64d -O3 --param=riscv-autovec-lmul=m8 -fdump-tree-optimized" } */ + +#include "def.h" + +DEF_CONVERT (fwcvt, _Float16, int32_t, 4) +DEF_CONVERT (fwcvt, _Float16, int32_t, 16) +DEF_CONVERT (fwcvt, _Float16, int32_t, 32) +DEF_CONVERT (fwcvt, _Float16, int32_t, 64) +DEF_CONVERT (fwcvt, _Float16, int32_t, 128) +DEF_CONVERT (fwcvt, _Float16, int32_t, 256) +DEF_CONVERT (fwcvt, _Float16, int32_t, 512) +DEF_CONVERT (fwcvt, _Float16, int32_t, 1024) +DEF_CONVERT (fwcvt, _Float16, int32_t, 2048) + +DEF_CONVERT (fwcvt, _Float16, uint32_t, 4) +DEF_CONVERT (fwcvt, _Float16, uint32_t, 16) +DEF_CONVERT (fwcvt, _Float16, uint32_t, 32) +DEF_CONVERT (fwcvt, _Float16, uint32_t, 64) +DEF_CONVERT (fwcvt, _Float16, uint32_t, 128) +DEF_CONVERT (fwcvt, _Float16, uint32_t, 256) +DEF_CONVERT (fwcvt, _Float16, uint32_t, 512) +DEF_CONVERT (fwcvt, _Float16, uint32_t, 1024) +DEF_CONVERT (fwcvt, _Float16, uint32_t, 2048) + +DEF_CONVERT (fwcvt, float, int64_t, 4) +DEF_CONVERT (fwcvt, float, int64_t, 16) +DEF_CONVERT (fwcvt, float, int64_t, 32) +DEF_CONVERT (fwcvt, float, int64_t, 64) +DEF_CONVERT (fwcvt, float, int64_t, 128) +DEF_CONVERT (fwcvt, float, int64_t, 256) +DEF_CONVERT (fwcvt, float, int64_t, 512) +DEF_CONVERT (fwcvt, float, int64_t, 1024) + +DEF_CONVERT (fwcvt, float, uint64_t, 4) +DEF_CONVERT (fwcvt, float, uint64_t, 16) +DEF_CONVERT (fwcvt, float, uint64_t, 32) +DEF_CONVERT (fwcvt, float, uint64_t, 64) +DEF_CONVERT (fwcvt, float, uint64_t, 128) +DEF_CONVERT (fwcvt, float, uint64_t, 256) +DEF_CONVERT (fwcvt, float, uint64_t, 512) +DEF_CONVERT (fwcvt, float, uint64_t, 1024) + +/* { dg-final { scan-assembler-times {vfwcvt\.rtz\.x\.f\.v} 19 } } */ +/* { dg-final { scan-assembler-times {vfwcvt\.rtz\.xu\.f\.v} 19 } } */ +/* { dg-final { scan-assembler-not {csrr} } } */ +/* { dg-final { scan-tree-dump-not "1,1" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "2,2" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "4,4" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "16,16" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "32,32" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "64,64" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "128,128" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "256,256" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "512,512" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "1024,1024" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "2048,2048" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "4096,4096" "optimized" } } */ diff --git a/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-4.c b/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-4.c new file mode 100644 index 00000000000..8ef991de44c --- /dev/null +++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-4.c @@ -0,0 +1,36 @@ +/* { dg-do compile } */ +/* { dg-options "-march=rv64gcv_zvfh_zvl4096b -mabi=lp64d -O3 --param=riscv-autovec-lmul=m8 -fno-trapping-math -fdump-tree-optimized" } */ + +#include "def.h" + +DEF_CONVERT (fwcvt, _Float16, int64_t, 4) +DEF_CONVERT (fwcvt, _Float16, int64_t, 16) +DEF_CONVERT (fwcvt, _Float16, int64_t, 32) +DEF_CONVERT (fwcvt, _Float16, int64_t, 64) +DEF_CONVERT (fwcvt, _Float16, int64_t, 128) +DEF_CONVERT (fwcvt, _Float16, int64_t, 256) +DEF_CONVERT (fwcvt, _Float16, int64_t, 512) + +DEF_CONVERT (fwcvt, _Float16, uint64_t, 4) +DEF_CONVERT (fwcvt, _Float16, uint64_t, 16) +DEF_CONVERT (fwcvt, _Float16, uint64_t, 32) +DEF_CONVERT (fwcvt, _Float16, uint64_t, 64) +DEF_CONVERT (fwcvt, _Float16, uint64_t, 128) +DEF_CONVERT (fwcvt, _Float16, uint64_t, 256) +DEF_CONVERT (fwcvt, _Float16, uint64_t, 512) + +/* { dg-final { scan-assembler-times {vfwcvt\.rtz\.x\.f\.v} 14 } } */ +/* { dg-final { scan-assembler-times {vsext\.vf2} 14 } } */ +/* { dg-final { scan-assembler-not {csrr} } } */ +/* { dg-final { scan-tree-dump-not "1,1" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "2,2" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "4,4" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "16,16" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "32,32" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "64,64" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "128,128" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "256,256" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "512,512" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "1024,1024" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "2048,2048" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "4096,4096" "optimized" } } */ diff --git a/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-5.c b/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-5.c new file mode 100644 index 00000000000..09a44de616a --- /dev/null +++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-5.c @@ -0,0 +1,80 @@ +/* { dg-do compile } */ +/* { dg-options "-march=rv64gcv_zvfh_zvl4096b -mabi=lp64d -O3 --param=riscv-autovec-lmul=m8 -fdump-tree-optimized" } */ + +#include "def.h" + +DEF_CONVERT (fwcvt, int8_t, _Float16, 4) +DEF_CONVERT (fwcvt, int8_t, _Float16, 16) +DEF_CONVERT (fwcvt, int8_t, _Float16, 32) +DEF_CONVERT (fwcvt, int8_t, _Float16, 64) +DEF_CONVERT (fwcvt, int8_t, _Float16, 128) +DEF_CONVERT (fwcvt, int8_t, _Float16, 256) +DEF_CONVERT (fwcvt, int8_t, _Float16, 512) +DEF_CONVERT (fwcvt, int8_t, _Float16, 1024) +DEF_CONVERT (fwcvt, int8_t, _Float16, 2048) +DEF_CONVERT (fwcvt, int8_t, _Float16, 4096) + +DEF_CONVERT (fwcvt, uint8_t, _Float16, 4) +DEF_CONVERT (fwcvt, uint8_t, _Float16, 16) +DEF_CONVERT (fwcvt, uint8_t, _Float16, 32) +DEF_CONVERT (fwcvt, uint8_t, _Float16, 64) +DEF_CONVERT (fwcvt, uint8_t, _Float16, 128) +DEF_CONVERT (fwcvt, uint8_t, _Float16, 256) +DEF_CONVERT (fwcvt, uint8_t, _Float16, 512) +DEF_CONVERT (fwcvt, uint8_t, _Float16, 1024) +DEF_CONVERT (fwcvt, uint8_t, _Float16, 2048) +DEF_CONVERT (fwcvt, uint8_t, _Float16, 4096) + +DEF_CONVERT (fwcvt, int16_t, float, 4) +DEF_CONVERT (fwcvt, int16_t, float, 16) +DEF_CONVERT (fwcvt, int16_t, float, 32) +DEF_CONVERT (fwcvt, int16_t, float, 64) +DEF_CONVERT (fwcvt, int16_t, float, 128) +DEF_CONVERT (fwcvt, int16_t, float, 256) +DEF_CONVERT (fwcvt, int16_t, float, 512) +DEF_CONVERT (fwcvt, int16_t, float, 1024) +DEF_CONVERT (fwcvt, int16_t, float, 2048) + +DEF_CONVERT (fwcvt, uint16_t, float, 4) +DEF_CONVERT (fwcvt, uint16_t, float, 16) +DEF_CONVERT (fwcvt, uint16_t, float, 32) +DEF_CONVERT (fwcvt, uint16_t, float, 64) +DEF_CONVERT (fwcvt, uint16_t, float, 128) +DEF_CONVERT (fwcvt, uint16_t, float, 256) +DEF_CONVERT (fwcvt, uint16_t, float, 512) +DEF_CONVERT (fwcvt, uint16_t, float, 1024) +DEF_CONVERT (fwcvt, uint16_t, float, 2048) + +DEF_CONVERT (fwcvt, int32_t, double, 4) +DEF_CONVERT (fwcvt, int32_t, double, 16) +DEF_CONVERT (fwcvt, int32_t, double, 32) +DEF_CONVERT (fwcvt, int32_t, double, 64) +DEF_CONVERT (fwcvt, int32_t, double, 128) +DEF_CONVERT (fwcvt, int32_t, double, 256) +DEF_CONVERT (fwcvt, int32_t, double, 512) +DEF_CONVERT (fwcvt, int32_t, double, 1024) + +DEF_CONVERT (fwcvt, uint32_t, double, 4) +DEF_CONVERT (fwcvt, uint32_t, double, 16) +DEF_CONVERT (fwcvt, uint32_t, double, 32) +DEF_CONVERT (fwcvt, uint32_t, double, 64) +DEF_CONVERT (fwcvt, uint32_t, double, 128) +DEF_CONVERT (fwcvt, uint32_t, double, 256) +DEF_CONVERT (fwcvt, uint32_t, double, 512) +DEF_CONVERT (fwcvt, uint32_t, double, 1024) + +/* { dg-final { scan-assembler-times {vfwcvt\.f\.x\.v} 30 } } */ +/* { dg-final { scan-assembler-times {vfwcvt\.f\.xu\.v} 30 } } */ +/* { dg-final { scan-assembler-not {csrr} } } */ +/* { dg-final { scan-tree-dump-not "1,1" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "2,2" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "4,4" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "16,16" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "32,32" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "64,64" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "128,128" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "256,256" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "512,512" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "1024,1024" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "2048,2048" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "4096,4096" "optimized" } } */ diff --git a/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-6.c b/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-6.c new file mode 100644 index 00000000000..2948dde0d0b --- /dev/null +++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-6.c @@ -0,0 +1,55 @@ +/* { dg-do compile } */ +/* { dg-options "-march=rv64gcv_zvfh_zvl4096b -mabi=lp64d -O3 --param=riscv-autovec-lmul=m8 -fno-trapping-math -fdump-tree-optimized" } */ + +#include "def.h" + +DEF_CONVERT (fwcvt, int8_t, float, 4) +DEF_CONVERT (fwcvt, int8_t, float, 16) +DEF_CONVERT (fwcvt, int8_t, float, 32) +DEF_CONVERT (fwcvt, int8_t, float, 64) +DEF_CONVERT (fwcvt, int8_t, float, 128) +DEF_CONVERT (fwcvt, int8_t, float, 256) +DEF_CONVERT (fwcvt, int8_t, float, 512) +DEF_CONVERT (fwcvt, int8_t, float, 1024) + +DEF_CONVERT (fwcvt, uint8_t, float, 4) +DEF_CONVERT (fwcvt, uint8_t, float, 16) +DEF_CONVERT (fwcvt, uint8_t, float, 32) +DEF_CONVERT (fwcvt, uint8_t, float, 64) +DEF_CONVERT (fwcvt, uint8_t, float, 128) +DEF_CONVERT (fwcvt, uint8_t, float, 256) +DEF_CONVERT (fwcvt, uint8_t, float, 512) +DEF_CONVERT (fwcvt, uint8_t, float, 1024) + +DEF_CONVERT (fwcvt, int16_t, double, 4) +DEF_CONVERT (fwcvt, int16_t, double, 16) +DEF_CONVERT (fwcvt, int16_t, double, 32) +DEF_CONVERT (fwcvt, int16_t, double, 64) +DEF_CONVERT (fwcvt, int16_t, double, 128) +DEF_CONVERT (fwcvt, int16_t, double, 256) +DEF_CONVERT (fwcvt, int16_t, double, 512) + +DEF_CONVERT (fwcvt, uint16_t, double, 4) +DEF_CONVERT (fwcvt, uint16_t, double, 16) +DEF_CONVERT (fwcvt, uint16_t, double, 32) +DEF_CONVERT (fwcvt, uint16_t, double, 64) +DEF_CONVERT (fwcvt, uint16_t, double, 128) +DEF_CONVERT (fwcvt, uint16_t, double, 256) +DEF_CONVERT (fwcvt, uint16_t, double, 512) + +/* { dg-final { scan-assembler-times {vfwcvt\.f\.x\.v} 30 } } */ +/* { dg-final { scan-assembler-times {vsext\.vf2} 15 } } */ +/* { dg-final { scan-assembler-times {vzext\.vf2} 15 } } */ +/* { dg-final { scan-assembler-not {csrr} } } */ +/* { dg-final { scan-tree-dump-not "1,1" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "2,2" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "4,4" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "16,16" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "32,32" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "64,64" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "128,128" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "256,256" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "512,512" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "1024,1024" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "2048,2048" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "4096,4096" "optimized" } } */ diff --git a/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-7.c b/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-7.c new file mode 100644 index 00000000000..ea39012b95a --- /dev/null +++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-7.c @@ -0,0 +1,37 @@ +/* { dg-do compile } */ +/* { dg-options "-march=rv64gcv_zvfh_zvl4096b -mabi=lp64d -O3 --param=riscv-autovec-lmul=m8 -fdump-tree-optimized" } */ + +#include "def.h" + +DEF_CONVERT (fwcvt, int8_t, double, 4) +DEF_CONVERT (fwcvt, int8_t, double, 16) +DEF_CONVERT (fwcvt, int8_t, double, 32) +DEF_CONVERT (fwcvt, int8_t, double, 64) +DEF_CONVERT (fwcvt, int8_t, double, 128) +DEF_CONVERT (fwcvt, int8_t, double, 256) +DEF_CONVERT (fwcvt, int8_t, double, 512) + +DEF_CONVERT (fwcvt, uint8_t, double, 4) +DEF_CONVERT (fwcvt, uint8_t, double, 16) +DEF_CONVERT (fwcvt, uint8_t, double, 32) +DEF_CONVERT (fwcvt, uint8_t, double, 64) +DEF_CONVERT (fwcvt, uint8_t, double, 128) +DEF_CONVERT (fwcvt, uint8_t, double, 256) +DEF_CONVERT (fwcvt, uint8_t, double, 512) + +/* { dg-final { scan-assembler-times {vfwcvt\.f\.x\.v} 14 } } */ +/* { dg-final { scan-assembler-times {vsext\.vf4} 7 } } */ +/* { dg-final { scan-assembler-times {vzext\.vf4} 7 } } */ +/* { dg-final { scan-assembler-not {csrr} } } */ +/* { dg-final { scan-tree-dump-not "1,1" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "2,2" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "4,4" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "16,16" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "32,32" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "64,64" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "128,128" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "256,256" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "512,512" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "1024,1024" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "2048,2048" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "4096,4096" "optimized" } } */ diff --git a/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-8.c b/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-8.c new file mode 100644 index 00000000000..59f36f582f6 --- /dev/null +++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-8.c @@ -0,0 +1,58 @@ +/* { dg-do compile } */ +/* { dg-options "-march=rv64gcv_zvfh_zvl4096b -mabi=lp64d -O3 --param=riscv-autovec-lmul=m8 -fdump-tree-optimized" } */ + +#include "def.h" + +DEF_CONVERT (fncvt, int32_t, _Float16, 4) +DEF_CONVERT (fncvt, int32_t, _Float16, 16) +DEF_CONVERT (fncvt, int32_t, _Float16, 32) +DEF_CONVERT (fncvt, int32_t, _Float16, 64) +DEF_CONVERT (fncvt, int32_t, _Float16, 128) +DEF_CONVERT (fncvt, int32_t, _Float16, 256) +DEF_CONVERT (fncvt, int32_t, _Float16, 512) +DEF_CONVERT (fncvt, int32_t, _Float16, 1024) +DEF_CONVERT (fncvt, int32_t, _Float16, 2048) + +DEF_CONVERT (fncvt, uint32_t, _Float16, 4) +DEF_CONVERT (fncvt, uint32_t, _Float16, 16) +DEF_CONVERT (fncvt, uint32_t, _Float16, 32) +DEF_CONVERT (fncvt, uint32_t, _Float16, 64) +DEF_CONVERT (fncvt, uint32_t, _Float16, 128) +DEF_CONVERT (fncvt, uint32_t, _Float16, 256) +DEF_CONVERT (fncvt, uint32_t, _Float16, 512) +DEF_CONVERT (fncvt, uint32_t, _Float16, 1024) +DEF_CONVERT (fncvt, uint32_t, _Float16, 2048) + +DEF_CONVERT (fncvt, int64_t, float, 4) +DEF_CONVERT (fncvt, int64_t, float, 16) +DEF_CONVERT (fncvt, int64_t, float, 32) +DEF_CONVERT (fncvt, int64_t, float, 64) +DEF_CONVERT (fncvt, int64_t, float, 128) +DEF_CONVERT (fncvt, int64_t, float, 256) +DEF_CONVERT (fncvt, int64_t, float, 512) +DEF_CONVERT (fncvt, int64_t, float, 1024) + +DEF_CONVERT (fncvt, uint64_t, float, 4) +DEF_CONVERT (fncvt, uint64_t, float, 16) +DEF_CONVERT (fncvt, uint64_t, float, 32) +DEF_CONVERT (fncvt, uint64_t, float, 64) +DEF_CONVERT (fncvt, uint64_t, float, 128) +DEF_CONVERT (fncvt, uint64_t, float, 256) +DEF_CONVERT (fncvt, uint64_t, float, 512) +DEF_CONVERT (fncvt, uint64_t, float, 1024) + +/* { dg-final { scan-assembler-times {vfncvt\.f\.x\.w} 19 } } */ +/* { dg-final { scan-assembler-times {vfncvt\.f\.xu\.w} 19 } } */ +/* { dg-final { scan-assembler-not {csrr} } } */ +/* { dg-final { scan-tree-dump-not "1,1" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "2,2" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "4,4" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "16,16" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "32,32" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "64,64" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "128,128" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "256,256" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "512,512" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "1024,1024" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "2048,2048" "optimized" } } */ +/* { dg-final { scan-tree-dump-not "4096,4096" "optimized" } } */ diff --git a/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-9.c b/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-9.c new file mode 100644 index 00000000000..3546ddc4554 --- /dev/null +++ b/gcc/testsuite/gcc.target/riscv/rvv/autovec/vls/convert-9.c @@ -0,0 +1,22 @@ +/* { dg-do compile } */ +/* { dg-options "-march=rv64gcv_zvfh_zvl4096b -mabi=lp64d -O3 --param=riscv-autovec-lmul=m8 -fno-trapping-math -fdump-tree-optimized" } */ + +#include "def.h" + +DEF_CONVERT (fncvt, int64_t, _Float16, 4) +DEF_CONVERT (fncvt, int64_t, _Float16, 16) +DEF_CONVERT (fncvt, int64_t, _Float16, 32) +DEF_CONVERT (fncvt, int64_t, _Float16, 64) +DEF_CONVERT (fncvt, int64_t, _Float16, 128) +DEF_CONVERT (fncvt, int64_t, _Float16, 256) +DEF_CONVERT (fncvt, int64_t, _Float16, 512) + +DEF_CONVERT (fncvt, uint64_t, _Float16, 4) +DEF_CONVERT (fncvt, uint64_t, _Float16, 16) +DEF_CONVERT (fncvt, uint64_t, _Float16, 32) +DEF_CONVERT (fncvt, uint64_t, _Float16, 64) +DEF_CONVERT (fncvt, uint64_t, _Float16, 128) +DEF_CONVERT (fncvt, uint64_t, _Float16, 256) +DEF_CONVERT (fncvt, uint64_t, _Float16, 512) + +/* TODO: Currently, we can't vectorize this case. */ -- 2.36.3