On Wed, 5 Mar 2025 at 12:59, Richard Earnshaw <[email protected]> wrote:
>
> The header file arm_neon.h provides the Advanced SIMD intrinsics that
> are available on armv7 or later A & R profile cores. However, they
> are not compatible with M-profile and we also need to ensure that the
> FP instructions are enabled (with -mfloat-abi=softfp/hard). That
> leads to some complicated checking as arm_neon.h includes stdint.h
> and, at least on linux, that can require that the appropriate ABI
> bits/ headers are also installed.
>
> This patch adds a new check to target-supports.exp to establish the
> minimal set of option overrides needed to enable use of this header in
> a test.
>
> gcc/testsuite:
> * lib/target-supports.exp
> (check_effective_target_arm_neon_h_ok_nocache): New function.
> (check_effective_target_arm_neon_h_ok): Likewise.
> (add_options_for_arm_neon_h): Likewise.
> (check_effective_target_arm_libc_fp_abi_ok_nocache): Allow any
> Arm target, not just arm32.
> * gcc.target/arm/attr-neon-builtin-fail.c: Use it.
> * gcc.target/arm/attr-neon-builtin-fail2.c: Likewise.
> * gcc.target/arm/attr-neon-fp16.c: Likewise.
> * gcc.target/arm/attr-neon2.c: Likewise.
> ---
>
> I'm going to wait 24 hrs before committing this as I'd like to see the
> results of the CI first.
>
I've manually started precommit tests which are not executed by
default (targeting arm-none-eabi with runtest flags overridden), and
results look good:
* NO CHANGE (except for line number change in attr-neon-builtin-fail.c):
v7a_softfp_eabi -marm/-march=armv7-a/-mfpu=vfpv3-d16/-mfloat-abi=softfp
thumb_m33_hard
-mthumb/-march=armv8-m.main+dsp+fp/-mtune=cortex-m33/-mfloat-abi=hard/-mfpu=auto
* UNSUPPORTED -> PASS:
gcc:gcc.target/arm/arm.exp=gcc.target/arm/attr-neon-builtin-fail.c
gcc:gcc.target/arm/arm.exp=gcc.target/arm/attr-neon-fp16.c
gcc:gcc.target/arm/arm.exp=gcc.target/arm/attr-neon2.c
default flags ""
thumb_m3_softfp
-mthumb/-march=armv7-m/-mtune=cortex-m3/-mfloat-abi=softfp/-mfpu=auto
thumb_m7_hard
-mthumb/-march=armv7e-m+fp.dp/-mtune=cortex-m7/-mfloat-abi=hard/-mfpu=auto
thumb_v8a_hard -mthumb/-march=armv8-a+simd/-mfpu=auto/-mfloat-abi=hard
* UNSUPPORTED -> PASS:
gcc:gcc.target/arm/arm.exp=gcc.target/arm/attr-neon-builtin-fail.c
gcc:gcc.target/arm/arm.exp=gcc.target/arm/attr-neon-builtin-fail2.c
gcc:gcc.target/arm/arm.exp=gcc.target/arm/attr-neon-fp16.c
gcc:gcc.target/arm/arm.exp=gcc.target/arm/attr-neon2.c
gcc:gcc.target/arm/arm.exp=gcc.target/arm/pr68620.c
thumb_m0_soft
-mthumb/-march=armv6s-m/-mtune=cortex-m0/-mfloat-abi=soft/-mfpu=auto
thumb_m23_soft
-mthumb/-march=armv8-m.base/-mtune=cortex-m23/-mfloat-abi=soft/-mfpu=auto
* FAIL / UNRESOLVED -> PASS:
gcc:gcc.target/arm/arm.exp=gcc.target/arm/attr-neon-builtin-fail.c
(test for excess errors)
gcc:gcc.target/arm/arm.exp=gcc.target/arm/attr-neon-builtin-fail.c
(test for warnings, line 14)
gcc:gcc.target/arm/arm.exp=gcc.target/arm/attr-neon-builtin-fail.c
at line 17 (test for errors, line )
gcc:gcc.target/arm/arm.exp=gcc.target/arm/attr-neon-builtin-fail2.c
(test for errors, line 13)
gcc:gcc.target/arm/arm.exp=gcc.target/arm/attr-neon-builtin-fail2.c
(test for excess errors)
gcc:gcc.target/arm/arm.exp=gcc.target/arm/attr-neon-fp16.c (test
for excess errors)
gcc:gcc.target/arm/arm.exp=gcc.target/arm/attr-neon2.c (test for
excess errors)
gcc:gcc.target/arm/arm.exp=gcc.target/arm/attr-neon2.c
check-function-bodies my
gcc:gcc.target/arm/arm.exp=gcc.target/arm/attr-neon2.c
check-function-bodies my1
gcc:gcc.target/arm/arm.exp=gcc.target/arm/attr-neon2.c
scan-assembler .fpu\\s+neon\n
gcc:gcc.target/arm/arm.exp=gcc.target/arm/attr-neon2.c
scan-assembler .fpu\\s+vfp\n
thumb_m55_hard
-mthumb/-march=armv8.1-m.main+mve.fp+fp.dp/-mtune=cortex-m55/-mfloat-abi=hard/-mfpu=auto
so we actually get more coverage, which is nice, thanks!
> R.
>
> .../gcc.target/arm/attr-neon-builtin-fail.c | 6 +--
> .../gcc.target/arm/attr-neon-builtin-fail2.c | 5 +-
> gcc/testsuite/gcc.target/arm/attr-neon-fp16.c | 4 +-
> gcc/testsuite/gcc.target/arm/attr-neon2.c | 5 +-
> gcc/testsuite/lib/target-supports.exp | 53 ++++++++++++++++++-
> 5 files changed, 60 insertions(+), 13 deletions(-)
>
> diff --git a/gcc/testsuite/gcc.target/arm/attr-neon-builtin-fail.c
> b/gcc/testsuite/gcc.target/arm/attr-neon-builtin-fail.c
> index fb6e0b9cd66..645d708f005 100644
> --- a/gcc/testsuite/gcc.target/arm/attr-neon-builtin-fail.c
> +++ b/gcc/testsuite/gcc.target/arm/attr-neon-builtin-fail.c
> @@ -1,9 +1,8 @@
> /* Check that calling a neon builtin from a function compiled with vfp
> fails. */
> /* { dg-do compile } */
> -/* { dg-require-effective-target arm_fp_ok } */
> -/* { dg-require-effective-target arm_neon_ok } */
> +/* { dg-require-effective-target arm_neon_h_ok } */
> /* { dg-options "-O2" } */
> -/* { dg-add-options arm_fp } */
> +/* { dg-add-options arm_neon_h } */
>
> #include <arm_neon.h>
>
> @@ -15,4 +14,3 @@ foo (uint8x16_t *p)
> }
>
> /* { dg-error "inlining failed in call to 'always_inline'" "" { target *-*-*
> } 0 } */
> -
> diff --git a/gcc/testsuite/gcc.target/arm/attr-neon-builtin-fail2.c
> b/gcc/testsuite/gcc.target/arm/attr-neon-builtin-fail2.c
> index 9cb5a2ebb90..ed0c4634b77 100644
> --- a/gcc/testsuite/gcc.target/arm/attr-neon-builtin-fail2.c
> +++ b/gcc/testsuite/gcc.target/arm/attr-neon-builtin-fail2.c
> @@ -1,8 +1,8 @@
> /* Check that calling a neon builtin from a function compiled with vfp
> fails. */
> /* { dg-do compile } */
> -/* { dg-require-effective-target arm_vfp_ok } */
> +/* { dg-require-effective-target arm_neon_h_ok } */
> /* { dg-options "-O2" } */
> -/* { dg-add-options arm_vfp } */
> +/* { dg-add-options arm_neon_h } */
>
> extern __simd64_int8_t a, b;
>
> @@ -13,4 +13,3 @@ foo (__simd128_int16_t *p)
> *p = (__simd128_int16_t)__builtin_neon_vaddlsv8qi (a, b); /* { dg-error
> "You must enable NEON instructions .*" } */
>
> }
> -
> diff --git a/gcc/testsuite/gcc.target/arm/attr-neon-fp16.c
> b/gcc/testsuite/gcc.target/arm/attr-neon-fp16.c
> index d7b75645bc4..a5982604f9e 100644
> --- a/gcc/testsuite/gcc.target/arm/attr-neon-fp16.c
> +++ b/gcc/testsuite/gcc.target/arm/attr-neon-fp16.c
> @@ -1,8 +1,8 @@
> /* { dg-do compile } */
> /* { dg-skip-if "-mpure-code supports M-profile only and without Neon" {
> *-*-* } { "-mpure-code" } } */
> -/* { dg-require-effective-target arm_fp_ok } */
> +/* { dg-require-effective-target arm_neon_h_ok } */
> /* { dg-options "-mfp16-format=ieee" } */
> -/* { dg-add-options arm_fp } */
> +/* { dg-add-options arm_neon_h } */
>
> #include "arm_neon.h"
>
> diff --git a/gcc/testsuite/gcc.target/arm/attr-neon2.c
> b/gcc/testsuite/gcc.target/arm/attr-neon2.c
> index a7a72dac379..c0f7667c2dc 100644
> --- a/gcc/testsuite/gcc.target/arm/attr-neon2.c
> +++ b/gcc/testsuite/gcc.target/arm/attr-neon2.c
> @@ -1,8 +1,7 @@
> /* { dg-do compile } */
> -/* { dg-require-effective-target arm_neon_ok } */
> -/* { dg-require-effective-target arm_fp_ok } */
> +/* { dg-require-effective-target arm_neon_h_ok } */
> /* { dg-options "-Ofast" } */
> -/* { dg-add-options arm_fp } */
> +/* { dg-add-options arm_neon_h } */
>
> /* Reset fpu to a value compatible with the next pragmas. */
> #pragma GCC target ("fpu=vfp")
> diff --git a/gcc/testsuite/lib/target-supports.exp
> b/gcc/testsuite/lib/target-supports.exp
> index d02d1fa9bec..ca0bd1bc8a2 100644
> --- a/gcc/testsuite/lib/target-supports.exp
> +++ b/gcc/testsuite/lib/target-supports.exp
> @@ -5127,7 +5127,7 @@ proc add_options_for_arm_fp { flags } {
> proc check_effective_target_arm_libc_fp_abi_ok_nocache { } {
> global et_arm_libc_fp_abi_flags
> set et_arm_libc_fp_abi_flags ""
> - if { [check_effective_target_arm32] } {
> + if { [istarget arm*-*-*] } {
> foreach flags {"-mfloat-abi=hard" "-mfloat-abi=softfp"} {
> if { [check_no_compiler_messages_nocache arm_libc_fp_abi_ok
> object {
> #include <stdint.h>
> @@ -5155,6 +5155,57 @@ proc add_options_for_arm_libc_fp_abi { flags } {
> return "$flags $et_arm_libc_fp_abi_flags"
> }
>
> +# Try to find the minimal set of flags needed to make the header file
> +# arm_neon.h compatible with this compilation. The is complicated due
> +# to the fact that this header doesn't work properly on m-profile cores
> +# and also won't work correctly if the wrong floating-point ABI is used
> +# on the platfrom (since arm_neon.h can include stdint.h, which on Linux
typo "platform"
> +# will pull in stub headers that aren't installed).
> +# Note: This will not necessarily enable Neon instructions, just provide
> +# something where the header will not cause errors.
> +
> +proc check_effective_target_arm_neon_h_ok_nocache { } {
> + # none-arm or thumb1 cannot support neon, so there's no point in
I'm not sure what "none-arm" means here? "not arm" ?
Thanks,
Christophe
> + # looking further.
> + if { [istarget arm*-*-*] } {
> + global et_arm_neon_h_flags
> + set base_flags [add_options_for_arm_libc_fp_abi ""]
> + foreach flags {"" "-mfpu=auto" "-marm" "-marm -mfpu=auto" \
> + "-mcpu=unset -march=armv7-a+fp -mfpu=auto" } {
> + if { [check_no_compiler_messages_nocache arm_neon_h_ok assembly {
> + #if __ARM_ARCH < 5
> + #error architecture too low for FP
> + #endif
> + #if __ARM_ARCH < 7
> + #if !defined(__arm__) || (defined(__thumb__) &&
> !defined(__thumb2__))
> + #error incompatible arch or mode
> + #endif
> + #endif
> + #if __ARM_ARCH_PROFILE == 'M'
> + #error incompatible profile
> + #endif
> + } "$base_flags $flags" ] } {
> + set et_arm_neon_h_flags "$base_flags $flags"
> + return 1
> + }
> + }
> + }
> + return 0
> +}
> +
> +proc check_effective_target_arm_neon_h_ok { } {
> + return [check_cached_effective_target arm_neon_h_ok \
> + check_effective_target_arm_neon_h_ok_nocache]
> +}
> +
> +proc add_options_for_arm_neon_h { flags } {
> + if { ! [check_effective_target_arm_neon_h_ok] } {
> + return "$flags"
> + }
> + global et_arm_neon_h_flags
> + return "$flags $et_arm_neon_h_flags"
> +}
> +
> # Return 1 if this is an ARM target defining __ARM_FP with
> # double-precision support. We may need -mfloat-abi=softfp or
> # equivalent options. Some multilibs may be incompatible with these
> --
> 2.34.1
>