Hi Carl, on 2024/8/8 01:15, Carl Love wrote: > > GCC maintainers: > > The following patch adds missing test cases for the overloaded vec_perm > built-in. It also fixes and issue with printing the 128-bit values in the > DEBUG section that was noticed when adding the additional test cases. > > The patch has been tested on Power 10 LE and BE with no regressions. > > Please let me know if it is acceptable for mainline. Thanks. > > Carl > > ------------------------------------------------------------- > > rs6000, add testcases to the overloaded vec_perm built-in > > The overloaded vec_perm built-in supports permuting signed and unsigned > vectors of char, bool char, short int, short bool, int, bool, > long long int, long long bool, int128, float and double. However, not all > of the supported arguments are included in the test cases. This patch adds > the missing test cases. > > Additionally, in the 128-bit debug print statements the expected result and > the result need to be cast to unsigned long long to print correctly. The > patch makes this additional change to the print statements. > > gcc/ChangeLog: > * doc/extend.texi: Fix spelling mistake in description of the > vec_sel built-in. > Add documentation of the 128-bit vec_perm instance. > > gcc/testsuite/ChangeLog: > * gcc.target/powerpc/vsx-builtin-3.c: Add vec_perm test cases for > arguments of type vector signed long long int, long long bool, > bool, bool short, bool char and pixel, > vector unsigned long long int, unsigned int, unsigned short int, > unsigned char. > Cast arguments for debug prints to unsigned long long. > * gcc.target/powerpc/builtins-4-int128-runnable.c: Add vec_perm > test cases for signed and unsigned int128 arguments.
Nit: Some changelog lines have unnecessary newlines and spaces. > --- > gcc/doc/extend.texi | 12 +- > .../powerpc/builtins-4-int128-runnable.c | 108 +++++++++++++++--- > .../gcc.target/powerpc/vsx-builtin-3.c | 18 +++ > 3 files changed, 121 insertions(+), 17 deletions(-) > > diff --git a/gcc/doc/extend.texi b/gcc/doc/extend.texi > index 48b27ff9f39..bf6f4094040 100644 > --- a/gcc/doc/extend.texi > +++ b/gcc/doc/extend.texi > @@ -21553,9 +21553,19 @@ vector bool __int128 vec_sel (vector bool __int128, > vector bool __int128, vector unsigned __int128); > @end smallexample > > -The instance is an extension of the exiting overloaded built-in > @code{vec_sel} > +The instance is an extension of the existing overloaded built-in > @code{vec_sel} > that is documented in the PVIPR. Good catch! > > +@smallexample > +vector signed __int128 vec_perm (vector signed __int128, > + vector signed __int128); > +vector unsigned __int128 vec_perm (vector unsigned __int128, > + vector unsigned __int128); > +@end smallexample > + > +The 128-bit integer arguments for the @code{vec_perm} built-in are in > addition > +to the instances that are documented in the PVIPR. Nit: Maybe just copy the above wording for @code{vec_sel} but replaced with @code{vec_perm} to keep them consistent. > + > @node Basic PowerPC Built-in Functions Available on ISA 2.06 > @subsubsection Basic PowerPC Built-in Functions Available on ISA 2.06 > > diff --git a/gcc/testsuite/gcc.target/powerpc/builtins-4-int128-runnable.c > b/gcc/testsuite/gcc.target/powerpc/builtins-4-int128-runnable.c > index 62c11132cf3..c61b0ecb854 100644 > --- a/gcc/testsuite/gcc.target/powerpc/builtins-4-int128-runnable.c > +++ b/gcc/testsuite/gcc.target/powerpc/builtins-4-int128-runnable.c > @@ -18,6 +18,16 @@ int main() { > __uint128_t data_u128[100]; > __int128_t data_128[100]; > > +#ifdef __BIG_ENDIAN__ > + vector unsigned char vuc = {0xC, 0xD, 0xE, 0xF, 0x8, 0x9, 0xA, 0xB, > + 0x1C, 0x1D, 0x1E, 0x1F, 0x18, 0x19, 0x1A, > 0x1B}; > +#else > + vector unsigned char vuc = {0x4, 0x5, 0x6, 0x7, 0x0, 0x1, 0x2, 0x3, > + 0x14, 0x15, 0x16, 0x17, 0x10, 0x11, 0x12, 0x13}; > +#endif > + > + vector __int128_t vec_128_arg1, vec_128_arg2; > + vector __uint128_t vec_u128_arg1, vec_u128_arg2; > vector __int128_t vec_128_expected1, vec_128_result1; > vector __uint128_t vec_u128_expected1, vec_u128_result1; > signed long long zero = (signed long long) 0; > @@ -37,11 +47,13 @@ int main() { > { > #ifdef DEBUG > printf("Error: vec_xl(), vec_128_result1[0] = %lld %llu; ", > - vec_128_result1[0] >> 64, > - vec_128_result1[0] & (__int128_t)0xFFFFFFFFFFFFFFFF); > + (unsigned long long)(vec_128_result1[0] >> 64), > + (unsigned long long)(vec_128_result1[0] > + & (__int128_t)0xFFFFFFFFFFFFFFFF)); > printf("vec_128_expected1[0] = %lld %llu\n", > - vec_128_expected1[0] >> 64, > - vec_128_expected1[0] & (__int128_t)0xFFFFFFFFFFFFFFFF); > + (unsigned long long)(vec_128_expected1[0] >> 64), > + (unsigned long long)(vec_128_expected1[0] > + & (__int128_t)0xFFFFFFFFFFFFFFFF)); > #else > abort (); > #endif > @@ -53,11 +65,13 @@ int main() { > { > #ifdef DEBUG > printf("Error: vec_xl(), vec_u128_result1[0] = %lld; ", > - vec_u128_result1[0] >> 64, > - vec_u128_result1[0] & (__int128_t)0xFFFFFFFFFFFFFFFF); > + (unsigned long long)(vec_u128_result1[0] >> 64), > + (unsigned long long)(vec_u128_result1[0] > + & (__int128_t)0xFFFFFFFFFFFFFFFF)); > printf("vec_u128_expected1[0] = %lld\n", > - vec_u128_expected1[0] >> 64, > - vec_u128_expected1[0] & (__int128_t)0xFFFFFFFFFFFFFFFF); > + (unsigned long long)(vec_u128_expected1[0] >> 64), > + (unsigned long long)(vec_u128_expected1[0] > + & (__int128_t)0xFFFFFFFFFFFFFFFF)); > #else > abort (); > #endif > @@ -76,11 +90,12 @@ int main() { > { > #ifdef DEBUG > printf("Error: vec_xl_be(), vec_128_result1[0] = %llu %llu;", > - vec_128_result1[0] >> 64, > - vec_128_result1[0] & 0xFFFFFFFFFFFFFFFF); > + (unsigned long long)(vec_128_result1[0] >> 64), > + (unsigned long long)(vec_128_result1[0] & 0xFFFFFFFFFFFFFFFF)); > printf(" vec_128_expected1[0] = %llu %llu\n", > - vec_128_expected1[0] >> 64, > - vec_128_expected1[0] & 0xFFFFFFFFFFFFFFFF); > + (unsigned long long)(vec_128_expected1[0] >> 64), > + (unsigned long long)(vec_128_expected1[0] > + & 0xFFFFFFFFFFFFFFFF)); > #else > abort (); > #endif > @@ -98,11 +113,72 @@ int main() { > { > #ifdef DEBUG > printf("Error: vec_xl_be(), vec_u128_result1[0] = %llu %llu;", > - vec_u128_result1[0] >> 64, > - vec_u128_result1[0] & 0xFFFFFFFFFFFFFFFF); > + (unsigned long long)(vec_u128_result1[0] >> 64), > + (unsigned long long)(vec_u128_result1[0] & 0xFFFFFFFFFFFFFFFF)); > + printf(" vec_u128_expected1[0] = %llu %llu\n", > + (unsigned long long)(vec_u128_expected1[0] >> 64), > + (unsigned long long)(vec_u128_expected1[0] > + & 0xFFFFFFFFFFFFFFFF)); > +#else > + abort (); > +#endif > + } > + > + /* vec_perm() tests */ > + vec_128_arg1 = (vector __int128_t){ (__uint128_t)0x1122334455667788ULL }; > + vec_128_arg2 = (vector __int128_t){ (__uint128_t)0xAAABBBCCCDDDEEEF }; > + > +#ifdef __BIG_ENDIAN__ > + vec_128_expected1[0] = 0x5566778811223344ULL; > + vec_128_expected1[0] = (vec_128_expected1[0] << 64) | > + 0xcdddeeefaaabbbccULL; > +#else > + vec_128_expected1[0] = 0xcdddeeefaaabbbccULL; > + vec_128_expected1[0] = (vec_128_expected1[0] << 64) | > + 0x5566778811223344ULL; > +#endif > + > + vec_128_result1 = vec_perm (vec_128_arg1, vec_128_arg2, vuc); > + > + if (vec_128_expected1[0] != vec_128_result1[0]) > + { > +#ifdef DEBUG > + printf("Error: vec_perm(), vec_128_result1[0] = %llu %llu;", > + (unsigned long long)(vec_128_result1[0] >> 64), > + (unsigned long long)(vec_128_result1[0] & 0xFFFFFFFFFFFFFFFF)); > + printf(" vec_128_expected1[0] = %llu %llu\n", > + (unsigned long long)(vec_128_expected1[0] >> 64), > + (unsigned long long)(vec_128_expected1[0] > + & 0xFFFFFFFFFFFFFFFF)); > +#else > + abort (); > +#endif > + } > + vec_u128_arg1 = (vector __uint128_t){ (__uint128_t)0x1122334455667788ULL }; > + vec_u128_arg2 = (vector __uint128_t){ (__uint128_t)0xAAABBBCCCDDDEEEF }; > + > +#ifdef __BIG_ENDIAN__ > + vec_u128_expected1[0] = 0x5566778811223344ULL; > + vec_u128_expected1[0] = (vec_u128_expected1[0] << 64) | > + 0xcdddeeefaaabbbccULL; > +#else > + vec_u128_expected1[0] = 0xcdddeeefaaabbbccULL; > + vec_u128_expected1[0] = (vec_u128_expected1[0] << 64) | > + 0x5566778811223344ULL; > +#endif > + > + vec_u128_result1 = vec_perm (vec_u128_arg1, vec_u128_arg2, vuc); > + > + if (vec_u128_expected1[0] != vec_u128_result1[0]) > + { > +#ifdef DEBUG > + printf("Error: vec_perm(), vec_u128_result1[0] = %llu %llu;", > + (unsigned long long)(vec_u128_result1[0] >> 64), > + (unsigned long long)(vec_u128_result1[0] & 0xFFFFFFFFFFFFFFFF)); > printf(" vec_u128_expected1[0] = %llu %llu\n", > - vec_u128_expected1[0] >> 64, > - vec_u128_expected1[0] & 0xFFFFFFFFFFFFFFFF); > + (unsigned long long)(vec_u128_expected1[0] >> 64), > + (unsigned long long)(vec_u128_expected1[0] > + & 0xFFFFFFFFFFFFFFFF)); > #else > abort (); > #endif > diff --git a/gcc/testsuite/gcc.target/powerpc/vsx-builtin-3.c > b/gcc/testsuite/gcc.target/powerpc/vsx-builtin-3.c > index 67c93be1469..b3b76be34b9 100644 > --- a/gcc/testsuite/gcc.target/powerpc/vsx-builtin-3.c > +++ b/gcc/testsuite/gcc.target/powerpc/vsx-builtin-3.c > @@ -39,10 +39,17 @@ > > #include <altivec.h> > > +extern __vector long long int sll[][4]; There is a "extern __vector long long sll[][4]" below. > +extern __vector long long bool bll[][4]; > extern __vector int si[][4]; > +extern __vector bool int bi[][4]; Similar, having "... __vector __bool int bi[][4]" below. > extern __vector short ss[][4]; > +extern __vector bool short bs[][4]; Similar, having "... __vector __bool short bs[][4]" below. > extern __vector signed char sc[][4]; > +extern __vector bool char bc[][4]; Ditto. > +extern __vector pixel p[][4]; Similar, having "... __vector __pixel p[][4]" below. > extern __vector float f[][4]; > +extern __vector unsigned long long int ull[][4]; As above, I think we only need "bll" and "ull" here. BR, Kewen > extern __vector unsigned int ui[][4]; > extern __vector unsigned short us[][4]; > extern __vector unsigned char uc[][4]; > @@ -88,12 +95,23 @@ int do_perm(void) > { > int i = 0; > > + sll[i][0] = vec_perm (sll[i][1], sll[i][2], uc[i][3]); i++; > + bll[i][0] = vec_perm (bll[i][1], bll[i][2], uc[i][3]); i++; > si[i][0] = vec_perm (si[i][1], si[i][2], uc[i][3]); i++; > + bi[i][0] = vec_perm (bi[i][1], bi[i][2], uc[i][3]); i++; > ss[i][0] = vec_perm (ss[i][1], ss[i][2], uc[i][3]); i++; > + bs[i][0] = vec_perm (bs[i][1], bs[i][2], uc[i][3]); i++; > sc[i][0] = vec_perm (sc[i][1], sc[i][2], uc[i][3]); i++; > + bc[i][0] = vec_perm (bc[i][1], bc[i][2], uc[i][3]); i++; > + p[i][0] = vec_perm (p[i][1], p[i][2], uc[i][3]); i++; > f[i][0] = vec_perm (f[i][1], f[i][2], uc[i][3]); i++; > d[i][0] = vec_perm (d[i][1], d[i][2], uc[i][3]); i++; > > + ull[i][0] = vec_perm (ull[i][1], ull[i][2], uc[i][3]); i++; > + ui[i][0] = vec_perm (ui[i][1], ui[i][2], uc[i][3]); i++; > + us[i][0] = vec_perm (us[i][1], us[i][2], uc[i][3]); i++; > + uc[i][0] = vec_perm (uc[i][1], uc[i][2], uc[i][3]); i++; > + > si[i][0] = vec_perm (si[i][1], si[i][2], uc[i][3]); i++; > ss[i][0] = vec_perm (ss[i][1], ss[i][2], uc[i][3]); i++; > sc[i][0] = vec_perm (sc[i][1], sc[i][2], uc[i][3]); i++;