On 20/03/2025 16:15, Christophe Lyon wrote: > r14-7202-gc8ec3e1327cb1e added vld1xN and vst1xN intrinsics and some > tests on arm, but didn't enable some existing tests. > > Since these tests are shared with aarch64, this patch removes the > 'dg-skip-if "unimplemented" { arm*-*-* }' directives and relies on the > advsimd-intrinsics.exp driver to define the appropriate flags and > dg-do-what action. (A previous patch removed 'dg-do run', and this > patch removes 'dg-options "-O3"' which would override the options > computed by the test driver) > > float16 intrinsics require the neon-fp16 FPU, which is possibly > enabled by advsimd-intrinsics.exp, so we include them unconditionally > on aarch64 or if fp16 is enabled on arm. > > poly64 intrinsics would require crypto-neon-fp-armv8: the patch > enables the corresponding tests on aarch64 only, since for arm they > are already covered by other tests in gcc.target/arm/simd/. For some > reason, poly64 tests where missing from x2 and x3 tests, so the patch > adds them as needed. > > Tested on aarch64-linux-gnu (no change), arm-linux-gnueabihf (the > additional tests are executed) and various flavors of arm-none-eabi > (the additional tests are compiled-only on M-profile, executed on > A-profile). > > gcc/testsuite/ > PR target/71233 > * gcc.target/aarch64/advsimd-intrinsics/vld1x2.c: Enable on arm. > * gcc.target/aarch64/advsimd-intrinsics/vld1x3.c: Likewise. > * gcc.target/aarch64/advsimd-intrinsics/vld1x4.c: Likewise. > * gcc.target/aarch64/advsimd-intrinsics/vst1x2.c: Likewise. > * gcc.target/aarch64/advsimd-intrinsics/vst1x3.c: Likewise. > * gcc.target/aarch64/advsimd-intrinsics/vst1x4.c: Likewise.
OK. R. > --- > .../aarch64/advsimd-intrinsics/vld1x2.c | 22 +++++++++++------ > .../aarch64/advsimd-intrinsics/vld1x3.c | 22 +++++++++++------ > .../aarch64/advsimd-intrinsics/vld1x4.c | 24 ++++++++++++------- > .../aarch64/advsimd-intrinsics/vst1x2.c | 22 +++++++++++------ > .../aarch64/advsimd-intrinsics/vst1x3.c | 22 +++++++++++------ > .../aarch64/advsimd-intrinsics/vst1x4.c | 24 ++++++++++++------- > 6 files changed, 90 insertions(+), 46 deletions(-) > > diff --git a/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vld1x2.c > b/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vld1x2.c > index 0892ce79118..a653296b766 100644 > --- a/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vld1x2.c > +++ b/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vld1x2.c > @@ -1,7 +1,3 @@ > -/* We haven't implemented these intrinsics for arm yet. */ > -/* { dg-skip-if "unimplemented" { arm*-*-* } } */ > -/* { dg-options "-O3" } */ > - > #include <arm_neon.h> > #include "arm-neon-ref.h" > > @@ -39,7 +35,6 @@ VARIANT (int32, 2, _s32) \ > VARIANT (int64, 1, _s64) \ > VARIANT (poly8, 8, _p8) \ > VARIANT (poly16, 4, _p16) \ > -VARIANT (float16, 4, _f16) \ > VARIANT (float32, 2, _f32) \ > VARIANT (uint8, 16, q_u8) \ > VARIANT (uint16, 8, q_u16) \ > @@ -51,17 +46,30 @@ VARIANT (int32, 4, q_s32) \ > VARIANT (int64, 2, q_s64) \ > VARIANT (poly8, 16, q_p8) \ > VARIANT (poly16, 8, q_p16) \ > -VARIANT (float16, 8, q_f16) \ > VARIANT (float32, 4, q_f32) > > +#if defined (__ARM_FP16_FORMAT_IEEE) \ > + || defined (__ARM_FP16_FORMAT_ALTERNATIVE) \ > + || defined (__aarch64__) > +#define VARIANTS_F16(VARIANT) \ > + VARIANT (float16, 4, _f16) \ > + VARIANT (float16, 8, q_f16) > +#else > +#define VARIANTS_F16(VARIANTS_F16) > +#endif > + > #ifdef __aarch64__ > #define VARIANTS(VARIANT) VARIANTS_1(VARIANT) \ > +VARIANTS_F16(VARIANT) \ > +VARIANT (poly64, 1, _p64) \ > +VARIANT (poly64, 2, q_p64) \ > VARIANT (mfloat8, 8, _mf8) \ > VARIANT (mfloat8, 16, q_mf8) \ > VARIANT (float64, 1, _f64) \ > VARIANT (float64, 2, q_f64) > #else > -#define VARIANTS(VARIANT) VARIANTS_1(VARIANT) > +#define VARIANTS(VARIANT) VARIANTS_1(VARIANT) \ > +VARIANTS_F16(VARIANT) > #endif > > /* Tests of vld1_x2 and vld1q_x2. */ > diff --git a/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vld1x3.c > b/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vld1x3.c > index 9465e4aabb6..832ee7538f6 100644 > --- a/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vld1x3.c > +++ b/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vld1x3.c > @@ -1,7 +1,3 @@ > -/* We haven't implemented these intrinsics for arm yet. */ > -/* { dg-skip-if "unimplemented" { arm*-*-* } } */ > -/* { dg-options "-O3" } */ > - > #include <arm_neon.h> > #include "arm-neon-ref.h" > > @@ -40,7 +36,6 @@ VARIANT (int32, 2, _s32) \ > VARIANT (int64, 1, _s64) \ > VARIANT (poly8, 8, _p8) \ > VARIANT (poly16, 4, _p16) \ > -VARIANT (float16, 4, _f16) \ > VARIANT (float32, 2, _f32) \ > VARIANT (uint8, 16, q_u8) \ > VARIANT (uint16, 8, q_u16) \ > @@ -52,17 +47,30 @@ VARIANT (int32, 4, q_s32) \ > VARIANT (int64, 2, q_s64) \ > VARIANT (poly8, 16, q_p8) \ > VARIANT (poly16, 8, q_p16) \ > -VARIANT (float16, 8, q_f16) \ > VARIANT (float32, 4, q_f32) > > +#if defined (__ARM_FP16_FORMAT_IEEE) \ > + || defined (__ARM_FP16_FORMAT_ALTERNATIVE) \ > + || defined (__aarch64__) > +#define VARIANTS_F16(VARIANT) \ > + VARIANT (float16, 4, _f16) \ > + VARIANT (float16, 8, q_f16) > +#else > +#define VARIANTS_F16(VARIANTS_F16) > +#endif > + > #ifdef __aarch64__ > #define VARIANTS(VARIANT) VARIANTS_1(VARIANT) \ > +VARIANTS_F16(VARIANT) \ > +VARIANT (poly64, 1, _p64) \ > +VARIANT (poly64, 2, q_p64) \ > VARIANT (mfloat8, 8, _mf8) \ > VARIANT (mfloat8, 16, q_mf8) \ > VARIANT (float64, 1, _f64) \ > VARIANT (float64, 2, q_f64) > #else > -#define VARIANTS(VARIANT) VARIANTS_1(VARIANT) > +#define VARIANTS(VARIANT) VARIANTS_1(VARIANT) \ > +VARIANTS_F16(VARIANT) > #endif > > > diff --git a/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vld1x4.c > b/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vld1x4.c > index a1461fd1af5..e5f55f0b730 100644 > --- a/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vld1x4.c > +++ b/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vld1x4.c > @@ -1,7 +1,3 @@ > -/* We haven't implemented these intrinsics for arm yet. */ > -/* { dg-skip-if "unimplemented" { arm*-*-* } } */ > -/* { dg-options "-O3" } */ > - > #include <stdbool.h> > #include <arm_neon.h> > #include "arm-neon-ref.h" > @@ -42,8 +38,6 @@ VARIANT (int32, 2, _s32) \ > VARIANT (int64, 1, _s64) \ > VARIANT (poly8, 8, _p8) \ > VARIANT (poly16, 4, _p16) \ > -VARIANT (poly64, 1, _p64) \ > -VARIANT (float16, 4, _f16) \ > VARIANT (float32, 2, _f32) \ > VARIANT (uint8, 16, q_u8) \ > VARIANT (uint16, 8, q_u16) \ > @@ -55,18 +49,30 @@ VARIANT (int32, 4, q_s32) \ > VARIANT (int64, 2, q_s64) \ > VARIANT (poly8, 16, q_p8) \ > VARIANT (poly16, 8, q_p16) \ > -VARIANT (poly64, 2, q_p64) \ > -VARIANT (float16, 8, q_f16) \ > VARIANT (float32, 4, q_f32) > > +#if defined (__ARM_FP16_FORMAT_IEEE) \ > + || defined (__ARM_FP16_FORMAT_ALTERNATIVE) \ > + || defined (__aarch64__) > +#define VARIANTS_F16(VARIANT) \ > + VARIANT (float16, 4, _f16) \ > + VARIANT (float16, 8, q_f16) > +#else > +#define VARIANTS_F16(VARIANTS_F16) > +#endif > + > #ifdef __aarch64__ > #define VARIANTS(VARIANT) VARIANTS_1(VARIANT) \ > +VARIANTS_F16(VARIANT) \ > +VARIANT (poly64, 1, _p64) \ > +VARIANT (poly64, 2, q_p64) \ > VARIANT (mfloat8, 8, _mf8) \ > VARIANT (mfloat8, 16, q_mf8) \ > VARIANT (float64, 1, _f64) \ > VARIANT (float64, 2, q_f64) > #else > -#define VARIANTS(VARIANT) VARIANTS_1(VARIANT) > +#define VARIANTS(VARIANT) VARIANTS_1(VARIANT) \ > +VARIANTS_F16(VARIANT) > #endif > > /* Tests of vld1_x4 and vld1q_x4. */ > diff --git a/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vst1x2.c > b/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vst1x2.c > index 3cf5eb3bd7e..8399290c55f 100644 > --- a/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vst1x2.c > +++ b/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vst1x2.c > @@ -1,7 +1,3 @@ > -/* We haven't implemented these intrinsics for arm yet. */ > -/* { dg-skip-if "unimplemented" { arm*-*-* } } */ > -/* { dg-options "-O3" } */ > - > #include <arm_neon.h> > #include "arm-neon-ref.h" > > @@ -39,7 +35,6 @@ VARIANT (int32, 2, _s32) \ > VARIANT (int64, 1, _s64) \ > VARIANT (poly8, 8, _p8) \ > VARIANT (poly16, 4, _p16) \ > -VARIANT (float16, 4, _f16) \ > VARIANT (float32, 2, _f32) \ > VARIANT (uint8, 16, q_u8) \ > VARIANT (uint16, 8, q_u16) \ > @@ -51,17 +46,30 @@ VARIANT (int32, 4, q_s32) \ > VARIANT (int64, 2, q_s64) \ > VARIANT (poly8, 16, q_p8) \ > VARIANT (poly16, 8, q_p16) \ > -VARIANT (float16, 8, q_f16) \ > VARIANT (float32, 4, q_f32) > > +#if defined (__ARM_FP16_FORMAT_IEEE) \ > + || defined (__ARM_FP16_FORMAT_ALTERNATIVE) \ > + || defined (__aarch64__) > +#define VARIANTS_F16(VARIANT) \ > + VARIANT (float16, 4, _f16) \ > + VARIANT (float16, 8, q_f16) > +#else > +#define VARIANTS_F16(VARIANTS_F16) > +#endif > + > #ifdef __aarch64__ > #define VARIANTS(VARIANT) VARIANTS_1(VARIANT) \ > +VARIANTS_F16(VARIANT) \ > +VARIANT (poly64, 1, _p64) \ > +VARIANT (poly64, 2, q_p64) \ > VARIANT (mfloat8, 8, _mf8) \ > VARIANT (mfloat8, 16, q_mf8) \ > VARIANT (float64, 1, _f64) \ > VARIANT (float64, 2, q_f64) > #else > -#define VARIANTS(VARIANT) VARIANTS_1(VARIANT) > +#define VARIANTS(VARIANT) VARIANTS_1(VARIANT) \ > +VARIANTS_F16(VARIANT) > #endif > > /* Tests of vst1_x2 and vst1q_x2. */ > diff --git a/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vst1x3.c > b/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vst1x3.c > index c05f8e73e64..e7d9e022bba 100644 > --- a/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vst1x3.c > +++ b/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vst1x3.c > @@ -1,7 +1,3 @@ > -/* We haven't implemented these intrinsics for arm yet. */ > -/* { dg-skip-if "unimplemented" { arm*-*-* } } */ > -/* { dg-options "-O3" } */ > - > #include <arm_neon.h> > #include "arm-neon-ref.h" > > @@ -40,7 +36,6 @@ VARIANT (int32, 2, _s32) \ > VARIANT (int64, 1, _s64) \ > VARIANT (poly8, 8, _p8) \ > VARIANT (poly16, 4, _p16) \ > -VARIANT (float16, 4, _f16) \ > VARIANT (float32, 2, _f32) \ > VARIANT (uint8, 16, q_u8) \ > VARIANT (uint16, 8, q_u16) \ > @@ -52,17 +47,30 @@ VARIANT (int32, 4, q_s32) \ > VARIANT (int64, 2, q_s64) \ > VARIANT (poly8, 16, q_p8) \ > VARIANT (poly16, 8, q_p16) \ > -VARIANT (float16, 8, q_f16) \ > VARIANT (float32, 4, q_f32) > > +#if defined (__ARM_FP16_FORMAT_IEEE) \ > + || defined (__ARM_FP16_FORMAT_ALTERNATIVE) \ > + || defined (__aarch64__) > +#define VARIANTS_F16(VARIANT) \ > + VARIANT (float16, 4, _f16) \ > + VARIANT (float16, 8, q_f16) > +#else > +#define VARIANTS_F16(VARIANTS_F16) > +#endif > + > #ifdef __aarch64__ > #define VARIANTS(VARIANT) VARIANTS_1(VARIANT) \ > +VARIANTS_F16(VARIANT) \ > +VARIANT (poly64, 1, _p64) \ > +VARIANT (poly64, 2, q_p64) \ > VARIANT (mfloat8, 8, _mf8) \ > VARIANT (mfloat8, 16, q_mf8) \ > VARIANT (float64, 1, _f64) \ > VARIANT (float64, 2, q_f64) > #else > -#define VARIANTS(VARIANT) VARIANTS_1(VARIANT) > +#define VARIANTS(VARIANT) VARIANTS_1(VARIANT) \ > +VARIANTS_F16(VARIANT) > #endif > > /* Tests of vst1_x3 and vst1q_x3. */ > diff --git a/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vst1x4.c > b/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vst1x4.c > index a9867c312cf..83b0567963c 100644 > --- a/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vst1x4.c > +++ b/gcc/testsuite/gcc.target/aarch64/advsimd-intrinsics/vst1x4.c > @@ -1,7 +1,3 @@ > -/* We haven't implemented these intrinsics for arm yet. */ > -/* { dg-skip-if "unimplemented" { arm*-*-* } } */ > -/* { dg-options "-O3" } */ > - > #include <arm_neon.h> > #include "arm-neon-ref.h" > > @@ -41,8 +37,6 @@ VARIANT (int32, 2, _s32) \ > VARIANT (int64, 1, _s64) \ > VARIANT (poly8, 8, _p8) \ > VARIANT (poly16, 4, _p16) \ > -VARIANT (poly64, 1, _p64) \ > -VARIANT (float16, 4, _f16) \ > VARIANT (float32, 2, _f32) \ > VARIANT (uint8, 16, q_u8) \ > VARIANT (uint16, 8, q_u16) \ > @@ -54,18 +48,30 @@ VARIANT (int32, 4, q_s32) \ > VARIANT (int64, 2, q_s64) \ > VARIANT (poly8, 16, q_p8) \ > VARIANT (poly16, 8, q_p16) \ > -VARIANT (poly64, 2, q_p64) \ > -VARIANT (float16, 8, q_f16) \ > VARIANT (float32, 4, q_f32) > > +#if defined (__ARM_FP16_FORMAT_IEEE) \ > + || defined (__ARM_FP16_FORMAT_ALTERNATIVE) \ > + || defined (__aarch64__) > +#define VARIANTS_F16(VARIANT) \ > + VARIANT (float16, 4, _f16) \ > + VARIANT (float16, 8, q_f16) > +#else > +#define VARIANTS_F16(VARIANTS_F16) > +#endif > + > #ifdef __aarch64__ > #define VARIANTS(VARIANT) VARIANTS_1(VARIANT) \ > +VARIANTS_F16(VARIANT) \ > +VARIANT (poly64, 1, _p64) \ > +VARIANT (poly64, 2, q_p64) \ > VARIANT (mfloat8, 8, _mf8) \ > VARIANT (mfloat8, 16, q_mf8) \ > VARIANT (float64, 1, _f64) \ > VARIANT (float64, 2, q_f64) > #else > -#define VARIANTS(VARIANT) VARIANTS_1(VARIANT) > +#define VARIANTS(VARIANT) VARIANTS_1(VARIANT) \ > +VARIANTS_F16(VARIANT) > #endif > > /* Tests of vst1_x4 and vst1q_x4. */