On 02/12/2024 21:21, Christophe Lyon wrote:
> If the target does not support floating-point, we register FP vector
> types as 'void' (see register_vector_type).
>
> The leads to warnings about 'pure attribute on function returning
> void' when we declare the various load intrinsics because their
> call_properties say CP_READ_MEMORY (thus giving them the 'pure'
> attribute), but their return type is void.
>
> To avoid such warnings, declare floating-point scalar and vector types
> even if the target does not have an FPU.
>
> In arm-mve-builtins.cc (register_builtin_types, register_vector_type,
> register_builtin_tuple_types), this means simply removing the early
> exits. However, for this to work, we need to update
> arm_vector_mode_supported_p, so that vector floating-point types are
> always defined, and __fp16 must always be registered by
> arm_init_fp16_builtins (as it is the base type for vectors of
> float16_t. Another side effect is that the declaration of float16_t
> and float32_t typedefs is now unconditional
>
> The two new tests verify that:
> - we emit an error if the code tries to use a floating-point
> intrinsics and the target does not have the floating-point extension
> - we emit the expected code when activating the floating-point
> expected via a pragma
>
> gcc/ChangeLog:
>
> PR target/117814
> * config/arm/arm-builtins.cc (arm_init_fp16_builtins): Always
> register __fp16 type.
> * config/arm/arm-mve-builtins.cc (register_vector_type): Remove
> special handling when TARGET_HAVE_MVE_FLOAT is false.
> (register_builtin_tuple_types): Likewise.
> * config/arm/arm.cc (arm_vector_mode_supported_p): Accept
> floating-point vector modes even if TARGET_HAVE_MVE_FLOAT is
> false.
> * config/arm/arm_mve_types.h (float16_t, float32_t): Define
> unconditionally.
>
> gcc/testsuite/ChangeLog:
>
> PR target/117814
> * gcc.target/arm/mve/intrinsics/pr117814-2.c: New test.
> * gcc.target/arm/mve/intrinsics/pr117814.c: New test.
The manual says:
@opindex mfp16-format
@item -mfp16-format=@var{name}
Specify the format of the @code{__fp16} half-precision floating-point type.
Permissible names are @samp{none}, @samp{ieee}, and @samp{alternative};
the default is @samp{none}, in which case the @code{__fp16} type is not
defined. @xref{Half-Precision}, for more information.
So I think, as stands, this is incompatible with your patch. However, I think
this is something we should perhaps fix by changing that default now. The
minimum architecture we now support is v4, so we always have ldrh, making
/* __fp16 support currently assumes the core has ldrh. */
if (!arm_arch4 && arm_fp16_format != ARM_FP16_FORMAT_NONE)
sorry ("%<__fp16%> and no ldrh");
redundant.
That does mean that some people will need to explicitly use -mfp16-format=none
if they want their code to be portable to both ABI variants, but I think that's
very much a niche case.
I'd be content if it were necessary for arm_mve.h to be declared incompatible
with -mfp16-format being set to none (or even alternative) provided this is
documented.
R.
> ---
> gcc/config/arm/arm-builtins.cc | 5 ++--
> gcc/config/arm/arm-mve-builtins.cc | 24 ++--------------
> gcc/config/arm/arm.cc | 6 +---
> gcc/config/arm/arm_mve_types.h | 2 --
> .../arm/mve/intrinsics/pr117814-2.c | 28 +++++++++++++++++++
> .../gcc.target/arm/mve/intrinsics/pr117814.c | 19 +++++++++++++
> 6 files changed, 52 insertions(+), 32 deletions(-)
> create mode 100644 gcc/testsuite/gcc.target/arm/mve/intrinsics/pr117814-2.c
> create mode 100644 gcc/testsuite/gcc.target/arm/mve/intrinsics/pr117814.c
>
> diff --git a/gcc/config/arm/arm-builtins.cc b/gcc/config/arm/arm-builtins.cc
> index 01bdbbf943d..71b78fee55b 100644
> --- a/gcc/config/arm/arm-builtins.cc
> +++ b/gcc/config/arm/arm-builtins.cc
> @@ -2443,9 +2443,8 @@ arm_init_fp16_builtins (void)
> arm_fp16_type_node = make_node (REAL_TYPE);
> TYPE_PRECISION (arm_fp16_type_node) = GET_MODE_PRECISION (HFmode);
> layout_type (arm_fp16_type_node);
> - if (arm_fp16_format)
> - (*lang_hooks.types.register_builtin_type) (arm_fp16_type_node,
> - "__fp16");
> + (*lang_hooks.types.register_builtin_type) (arm_fp16_type_node,
> + "__fp16");
> }
>
> void
> diff --git a/gcc/config/arm/arm-mve-builtins.cc
> b/gcc/config/arm/arm-mve-builtins.cc
> index 30b103ec086..25c1b442a28 100644
> --- a/gcc/config/arm/arm-mve-builtins.cc
> +++ b/gcc/config/arm/arm-mve-builtins.cc
> @@ -410,8 +410,6 @@ register_builtin_types ()
> #include "arm-mve-builtins.def"
> for (unsigned int i = 0; i < NUM_VECTOR_TYPES; ++i)
> {
> - if (vector_types[i].requires_float && !TARGET_HAVE_MVE_FLOAT)
> - continue;
> tree eltype = scalar_types[i];
> tree vectype;
> if (eltype == boolean_type_node)
> @@ -433,18 +431,6 @@ register_builtin_types ()
> static void
> register_vector_type (vector_type_index type)
> {
> -
> - /* If the target does not have the mve.fp extension, but the type requires
> - it, then it needs to be assigned a non-dummy type so that functions
> - with those types in their signature can be registered. This allows for
> - diagnostics about the missing extension, rather than about a missing
> - function definition. */
> - if (vector_types[type].requires_float && !TARGET_HAVE_MVE_FLOAT)
> - {
> - acle_vector_types[0][type] = void_type_node;
> - return;
> - }
> -
> tree vectype = abi_vector_types[type];
> tree id = get_identifier (vector_types[type].acle_name);
> tree decl = build_decl (input_location, TYPE_DECL, id, vectype);
> @@ -512,17 +498,11 @@ register_builtin_tuple_types (vector_type_index type)
> {
> const vector_type_info* info = &vector_types[type];
>
> - /* If the target does not have the mve.fp extension, but the type requires
> - it, then it needs to be assigned a non-dummy type so that functions
> - with those types in their signature can be registered. This allows for
> - diagnostics about the missing extension, rather than about a missing
> - function definition. */
> - if (scalar_types[type] == boolean_type_node
> - || (info->requires_float && !TARGET_HAVE_MVE_FLOAT))
> + if (scalar_types[type] == boolean_type_node)
> {
> for (unsigned int num_vectors = 2; num_vectors <= 4; num_vectors += 2)
> acle_vector_types[num_vectors - 1][type] = void_type_node;
> - return;
> + return;
> }
>
> const char *vector_type_name = info->acle_name;
> diff --git a/gcc/config/arm/arm.cc b/gcc/config/arm/arm.cc
> index 04028dbc3c3..500c8fdefc3 100644
> --- a/gcc/config/arm/arm.cc
> +++ b/gcc/config/arm/arm.cc
> @@ -29791,11 +29791,7 @@ arm_vector_mode_supported_p (machine_mode mode)
> return true;
>
> if (TARGET_HAVE_MVE
> - && (VALID_MVE_SI_MODE (mode) || VALID_MVE_PRED_MODE (mode)))
> - return true;
> -
> - if (TARGET_HAVE_MVE_FLOAT
> - && (mode == V2DFmode || mode == V4SFmode || mode == V8HFmode))
> + && (VALID_MVE_MODE (mode) || VALID_MVE_PRED_MODE (mode)))
> return true;
>
> return false;
> diff --git a/gcc/config/arm/arm_mve_types.h b/gcc/config/arm/arm_mve_types.h
> index f549f881b49..003e7e51d96 100644
> --- a/gcc/config/arm/arm_mve_types.h
> +++ b/gcc/config/arm/arm_mve_types.h
> @@ -22,10 +22,8 @@
> #ifndef _GCC_ARM_MVE_TYPES_H
> #define _GCC_ARM_MVE_TYPES_H
>
> -#if (__ARM_FEATURE_MVE & 2) /* MVE Floating point. */
> typedef __fp16 float16_t;
> typedef float float32_t;
> -#endif
>
> #pragma GCC arm "arm_mve_types.h"
>
> diff --git a/gcc/testsuite/gcc.target/arm/mve/intrinsics/pr117814-2.c
> b/gcc/testsuite/gcc.target/arm/mve/intrinsics/pr117814-2.c
> new file mode 100644
> index 00000000000..ca8d414ef92
> --- /dev/null
> +++ b/gcc/testsuite/gcc.target/arm/mve/intrinsics/pr117814-2.c
> @@ -0,0 +1,28 @@
> +/* { dg-require-effective-target arm_v8_1m_mve_ok } */
> +/* { dg-add-options arm_v8_1m_mve } */
> +/* { dg-additional-options "-O2" } */
> +/* { dg-final { check-function-bodies "**" "" } } */
> +
> +#include "arm_mve.h"
> +
> +#ifdef __cplusplus
> +extern "C" {
> +#endif
> +
> +#pragma GCC target ("arch=armv8.1-m.main+mve.fp")
> +
> +/*
> +**foo1:
> +** ...
> +** vldrh.16 q[0-9]+, \[(?:ip|fp|r[0-9]+)\](?: @.*|)
> +** ...
> +*/
> +float16x8_t
> +foo1 (float16_t const *base)
> +{
> + return vld1q_f16 (base);
> +}
> +
> +#ifdef __cplusplus
> +}
> +#endif
> diff --git a/gcc/testsuite/gcc.target/arm/mve/intrinsics/pr117814.c
> b/gcc/testsuite/gcc.target/arm/mve/intrinsics/pr117814.c
> new file mode 100644
> index 00000000000..5038bcb3dba
> --- /dev/null
> +++ b/gcc/testsuite/gcc.target/arm/mve/intrinsics/pr117814.c
> @@ -0,0 +1,19 @@
> +/* { dg-require-effective-target arm_v8_1m_mve_ok } */
> +/* { dg-add-options arm_v8_1m_mve } */
> +/* { dg-additional-options "-O2" } */
> +
> +#include "arm_mve.h"
> +
> +#ifdef __cplusplus
> +extern "C" {
> +#endif
> +
> +float16x8_t
> +foo (float16_t const *base)
> +{
> + return vld1q_f16 (base); /* { dg-error {ACLE function 'vld1q_f16' requires
> ISA extension 'mve.fp'} } */
> +}
> +
> +#ifdef __cplusplus
> +}
> +#endif