Hi,
on 2024/5/30 00:10, Carl Love wrote:
> This was patch 10 from the previous series. The patch was updated to
> address feedback comments.
>
> Carl
> ---------------------------------------------------
>
> rs6000, extend vec_xxpermdi built-in for __int128 args
>
> Add new signed and unsigned overloaded instances for vec_xxpermdi
>
> __int128 vec_xxpermdi (__int128, __int128, const int);
> __uint128 vec_xxpermdi (__uint128, __uint128, const int);
>
> Update the documentation to include a reference to the new built-in
> instances.
>
> Add test cases for the new overloaded instances.
>
> gcc/ChangeLog:
> * config/rs6000/rs6000-overload.def (vec_xxpermdi): Add new
> overloaded built-in instances.
> * doc/extend.texi: Add documentation for new overloaded built-in
> instances.
>
> gcc/testsuite/ChangeLog:
> * gcc.target/powerpc/vec_perm-runnable-i128.c: New test file.
> ---
> gcc/config/rs6000/rs6000-overload.def | 4 +
> gcc/doc/extend.texi | 2 +
> .../powerpc/vec_perm-runnable-i128.c | 229 ++++++++++++++++++
> 3 files changed, 235 insertions(+)
> create mode 100644 gcc/testsuite/gcc.target/powerpc/vec_perm-runnable-i128.c
>
> diff --git a/gcc/config/rs6000/rs6000-overload.def
> b/gcc/config/rs6000/rs6000-overload.def
> index a210c5ad10d..45000f161e4 100644
> --- a/gcc/config/rs6000/rs6000-overload.def
> +++ b/gcc/config/rs6000/rs6000-overload.def
> @@ -4932,6 +4932,10 @@
> XXPERMDI_4SF XXPERMDI_VF
> vd __builtin_vsx_xxpermdi (vd, vd, const int);
> XXPERMDI_2DF XXPERMDI_VD
> + vsq __builtin_vsx_xxpermdi (vsq, vsq, const int);
> + XXPERMDI_1TI XXPERMDI_1TI
> + vuq __builtin_vsx_xxpermdi (vuq, vuq, const int);
> + XXPERMDI_1TI XXPERMDI_1TUI
Nits:
- Move them before "vf __builtin_vsx_xxpermdi (vf, vf, const int);" so
they are close to instances for other integral types.
- To follow the existing naming convention, the _{SQ,UQ} suffixes are better:
vsq __builtin_vsx_xxpermdi (vsq, vsq, const int);
XXPERMDI_1TI XXPERMDI_1SQ
vuq __builtin_vsx_xxpermdi (vuq, vuq, const int);
XXPERMDI_1TI XXPERMDI_1UQ
>
> [VEC_XXSLDWI, vec_xxsldwi, __builtin_vsx_xxsldwi]
> vsc __builtin_vsx_xxsldwi (vsc, vsc, const int);
> diff --git a/gcc/doc/extend.texi b/gcc/doc/extend.texi
> index 0756230b19e..edfef1bdab7 100644
> --- a/gcc/doc/extend.texi
> +++ b/gcc/doc/extend.texi
> @@ -22555,6 +22555,8 @@ void vec_vsx_st (vector bool char, int, signed char
> *);
> vector double vec_xxpermdi (vector double, vector double, const int);
> vector float vec_xxpermdi (vector float, vector float, const int);
> vector long long vec_xxpermdi (vector long long, vector long long, const
> int);
> +vector __int128 vec_xxpermdi (vector __int128, vector __int128, const int);
> +vector __int128 vec_xxpermdi (vector __uint128, vector __uint128, const int);
Nit: These two lines split up the long long and unsigned long long lines; can
you move them one line upward? Also, using the explicit "signed" and "unsigned"
would be better than "__{u,}int128".
> vector unsigned long long vec_xxpermdi (vector unsigned long long,
> vector unsigned long long, const
> int);
> vector int vec_xxpermdi (vector int, vector int, const int);
> diff --git a/gcc/testsuite/gcc.target/powerpc/vec_perm-runnable-i128.c
> b/gcc/testsuite/gcc.target/powerpc/vec_perm-runnable-i128.c
> new file mode 100644
> index 00000000000..2d5dce09404
> --- /dev/null
> +++ b/gcc/testsuite/gcc.target/powerpc/vec_perm-runnable-i128.c
> @@ -0,0 +1,229 @@
> +/* { dg-do run } */
> +/* { dg-require-effective-target vmx_hw } */
> +/* { dg-options "-save-temps" } */
Nit: The dg-options line isn't needed, as the test doesn't check the assembly output.
BR,
Kewen
> +
> +#include <altivec.h>
> +
> +#define DEBUG 0
> +
> +#if DEBUG
> +#include <stdio.h>
> +void print_i128 (unsigned __int128 val)
> +{
> + printf(" 0x%016llx%016llx",
> + (unsigned long long)(val >> 64),
> + (unsigned long long)(val & 0xFFFFFFFFFFFFFFFF));
> +}
> +#endif
> +
> +extern void abort (void);
> +
> +union convert_union {
> + vector signed __int128 s128;
> + vector unsigned __int128 u128;
> + char val[16];
> +} convert;
> +
> +int check_u128_result(vector unsigned __int128 vresult_u128,
> + vector unsigned __int128 expected_vresult_u128)
> +{
> + /* Use a for loop to check each byte manually so the test case will
> + run with ISA 2.06.
> +
> + Return 1 if they match, 0 otherwise. */
> +
> + int i;
> +
> + union convert_union result;
> + union convert_union expected;
> +
> + result.u128 = vresult_u128;
> + expected.u128 = expected_vresult_u128;
> +
> + /* Check if each byte of the result and expected match. */
> + for (i = 0; i < 16; i++)
> + {
> + if (result.val[i] != expected.val[i])
> + return 0;
> + }
> + return 1;
> +}
> +
> +int check_s128_result(vector signed __int128 vresult_s128,
> + vector signed __int128 expected_vresult_s128)
> +{
> + /* Convert the arguments to unsigned, then check equality. */
> + union convert_union result;
> + union convert_union expected;
> +
> + result.s128 = vresult_s128;
> + expected.s128 = expected_vresult_s128;
> +
> + return check_u128_result (result.u128, expected.u128);
> +}
> +
> +
> +int
> +main (int argc, char *argv [])
> +{
> + int i;
> +
> + vector signed __int128 src_va_s128;
> + vector signed __int128 src_vb_s128;
> + vector signed __int128 vresult_s128;
> + vector signed __int128 expected_vresult_s128;
> +
> + vector unsigned __int128 src_va_u128;
> + vector unsigned __int128 src_vb_u128;
> + vector unsigned __int128 src_vc_u128;
> + vector unsigned __int128 vresult_u128;
> + vector unsigned __int128 expected_vresult_u128;
> +
> + src_va_s128 = (vector signed __int128) {0x123456789ABCDEF0};
> + src_va_s128 = src_va_s128 << 64;
> + src_va_s128 |= (vector signed __int128) {0x22446688AACCEE00};
> + src_vb_s128 = (vector signed __int128) {0xFEDCBA9876543210};
> + src_vb_s128 = src_vb_s128 << 64;
> + src_vb_s128 |= (vector signed __int128) {0x3333333333333333};
> +
> + src_va_u128 = (vector unsigned __int128) {0x13579ACE02468BDF};
> + src_va_u128 = src_va_u128 << 64;
> + src_va_u128 |= (vector unsigned __int128) {0x1133557799BBDD00};
> + src_vb_u128 = (vector unsigned __int128) {0xA987654FEDCB3210};
> + src_vb_u128 = src_vb_u128 << 64;
> + src_vb_u128 |= (vector unsigned __int128) {0x5555555555555555};
> +
> +
> + /* Signed 128-bit arguments. */
> + vresult_s128 = vec_xxpermdi (src_va_s128, src_vb_s128, 0x1);
> +
> +#if __BYTE_ORDER__ == __ORDER_BIG_ENDIAN__
> + /* BE expected results */
> + expected_vresult_s128 = (vector signed __int128) {0x123456789ABCDEF0};
> + expected_vresult_s128 = expected_vresult_s128 << 64;
> + expected_vresult_s128 |= (vector signed __int128) {0x3333333333333333};
> +#else
> + /* LE expected results */
> + expected_vresult_s128 = (vector signed __int128) {0xFEDCBA9876543210};
> + expected_vresult_s128 = expected_vresult_s128 << 64;
> + expected_vresult_s128 |= (vector signed __int128) {0x22446688AACCEE00};
> +#endif
> +
> + if (!check_s128_result (vresult_s128, expected_vresult_s128))
> +#if DEBUG
> + {
> + printf ("ERROR, vec_xxpermdi (src_va_s128, src_vb_s128, 0x1) result does not match expected output.\n");
> + printf (" src_va_s128: ");
> + print_i128 ((unsigned __int128) src_va_s128);
> + printf ("\n src_vb_s128: ");
> + print_i128 ((unsigned __int128) src_vb_s128);
> + printf ("\n Result: ");
> + print_i128 ((unsigned __int128) vresult_s128);
> + printf ("\n Expected result: ");
> + print_i128 ((unsigned __int128) expected_vresult_s128);
> + printf ("\n");
> + }
> +#else
> + abort ();
> +#endif
> +
> + vresult_s128 = vec_xxpermdi (src_va_s128, src_vb_s128, 0x2);
> +
> +#if __BYTE_ORDER__ == __ORDER_BIG_ENDIAN__
> + /* BE expected results */
> + expected_vresult_s128 = (vector signed __int128) {0x22446688AACCEE00};
> + expected_vresult_s128 = expected_vresult_s128 << 64;
> + expected_vresult_s128 |= (vector signed __int128) {0xFEDCBA9876543210};
> +#else
> + /* LE expected results */
> + expected_vresult_s128 = (vector signed __int128) {0x3333333333333333};
> + expected_vresult_s128 = expected_vresult_s128 << 64;
> + expected_vresult_s128 |= (vector signed __int128) {0x123456789ABCDEF0};
> +#endif
> +
> + if (!check_s128_result (vresult_s128, expected_vresult_s128))
> +#if DEBUG
> + {
> + printf ("ERROR, vec_xxpermdi (src_va_s128, src_vb_s128, 0x2) result does not match expected output.\n");
> + printf (" src_va_s128: ");
> + print_i128 ((unsigned __int128) src_va_s128);
> + printf ("\n src_vb_s128: ");
> + print_i128 ((unsigned __int128) src_vb_s128);
> + printf ("\n Result: ");
> + print_i128 ((unsigned __int128) vresult_s128);
> + printf ("\n Expected result: ");
> + print_i128 ((unsigned __int128) expected_vresult_s128);
> + printf ("\n");
> + }
> +#else
> + abort ();
> +#endif
> +
> + /* Unsigned arguments. */
> + vresult_u128 = vec_xxpermdi (src_va_u128, src_vb_u128, 0x1);
> +
> + #if __BYTE_ORDER__ == __ORDER_BIG_ENDIAN__
> + /* BE expected results */
> + expected_vresult_u128 = (vector unsigned __int128) {0x13579ACE02468BDF};
> + expected_vresult_u128 = expected_vresult_u128 << 64;
> + expected_vresult_u128 |= (vector unsigned __int128) {0x5555555555555555};
> +#else
> + /* LE expected results */
> + expected_vresult_u128 = (vector unsigned __int128) {0xA987654FEDCB3210};
> + expected_vresult_u128 = expected_vresult_u128 << 64;
> + expected_vresult_u128 |= (vector unsigned __int128) {0x1133557799BBDD00};
> +#endif
> +
> + if (!check_u128_result (vresult_u128, expected_vresult_u128))
> +#if DEBUG
> + {
> + printf ("ERROR, vec_xxpermdi (src_va_u128, src_vb_u128, 0x1) result does not match expected output.\n");
> + printf (" src_va_s128: ");
> + print_i128 ((unsigned __int128) src_va_s128);
> + printf ("\n src_vb_s128: ");
> + print_i128 ((unsigned __int128) src_vb_s128);
> + printf ("\n Result: ");
> + print_i128 ((unsigned __int128) vresult_u128);
> + printf ("\n Expected result: ");
> + print_i128 ((unsigned __int128) expected_vresult_u128);
> + printf ("\n");
> + }
> +#else
> + abort ();
> +#endif
> +
> + /* Unsigned arguments. */
> + vresult_u128 = vec_xxpermdi (src_va_u128, src_vb_u128, 0x2);
> +
> +#if __BYTE_ORDER__ == __ORDER_BIG_ENDIAN__
> + /* BE expected results */
> + expected_vresult_u128 = (vector unsigned __int128) {0x1133557799BBDD00};
> + expected_vresult_u128 = expected_vresult_u128 << 64;
> + expected_vresult_u128 |= (vector unsigned __int128) {0xA987654FEDCB3210};
> +#else
> + /* LE expected results */
> + expected_vresult_u128 = (vector unsigned __int128) {0x5555555555555555};
> + expected_vresult_u128 = expected_vresult_u128 << 64;
> + expected_vresult_u128 |= (vector unsigned __int128) {0x13579ACE02468BDF};
> +#endif
> +
> + if (!check_u128_result (vresult_u128, expected_vresult_u128))
> +#if DEBUG
> + {
> + printf ("ERROR, vec_xxpermdi (src_va_u128, src_vb_u128, 0x2) result does not match expected output.\n");
> + printf (" src_va_s128: ");
> + print_i128 ((unsigned __int128) src_va_s128);
> + printf ("\n src_vb_s128: ");
> + print_i128 ((unsigned __int128) src_vb_s128);
> + printf ("\n Result: ");
> + print_i128 ((unsigned __int128) vresult_u128);
> + printf ("\n Expected result: ");
> + print_i128 ((unsigned __int128) expected_vresult_u128);
> + printf ("\n");
> + }
> +#else
> + abort ();
> +#endif
> +
> + return 0;
> +}