ACLE has added intrinsics to bridge between SVE and Neon.
The NEON_SVE Bridge adds intrinsics that allow conversions between NEON and
SVE vectors.
This patch adds support to GCC for the following 3 intrinsics:
svset_neonq, svget_neonq and svdup_neonq
gcc/ChangeLog:
* config.gcc: Adds new header to config.
* config/aarch64/aarch64-builtins.cc (GTY): Externs aarch64_simd_types.
* config/aarch64/aarch64-c.cc (aarch64_pragma_aarch64):
Defines pragma for arm_neon_sve_bridge.h.
* config/aarch64/aarch64-protos.h: New function.
* config/aarch64/aarch64-sve-builtins-base.h: New intrinsics.
* config/aarch64/aarch64-sve-builtins-base.cc
(class svget_neonq_impl): New intrinsic implementation.
(class svset_neonq_impl): Likewise.
(class svdup_neonq_impl): Likewise.
(NEON_SVE_BRIDGE_FUNCTION): New intrinsics.
* config/aarch64/aarch64-sve-builtins-functions.h
(NEON_SVE_BRIDGE_FUNCTION): Defines macro for NEON_SVE_BRIDGE
functions.
* config/aarch64/aarch64-sve-builtins-shapes.h: New shapes.
* config/aarch64/aarch64-sve-builtins-shapes.cc
(parse_neon_type): Parser for NEON types.
(parse_element_type): Add NEON element types.
(parse_type): Likewise.
(NEON_SVE_BRIDGE_SHAPE): Defines macro for NEON_SVE_BRIDGE shapes.
(struct get_neonq_def): Defines function shape for get_neonq.
(struct set_neonq_def): Defines function shape for set_neonq.
(struct dup_neonq_def): Defines function shape for dup_neonq.
* config/aarch64/aarch64-sve-builtins.cc (DEF_NEON_SVE_FUNCTION):
Defines
macro for NEON_SVE_BRIDGE functions.
(handle_arm_neon_sve_bridge_h): Handles #pragma arm_neon_sve_bridge.h.
* config/aarch64/aarch64-builtins.h: New header file to extern neon
types.
* config/aarch64/aarch64-neon-sve-bridge-builtins.def: New intrinsics
function def file.
* config/aarch64/arm_neon_sve_bridge.h: New header file.
gcc/testsuite/ChangeLog:
* gcc.c-torture/execute/neon-sve-bridge.c: New test.
#############################################################################
diff --git a/gcc/config.gcc b/gcc/config.gcc
index
d88071773c9e1280cc5f38e36e09573214323b48..ca55992200dbe58782c3dbf66906339de021ba6b
100644
--- a/gcc/config.gcc
+++ b/gcc/config.gcc
@@ -334,7 +334,7 @@ m32c*-*-*)
;;
aarch64*-*-*)
cpu_type=aarch64
- extra_headers="arm_fp16.h arm_neon.h arm_bf16.h arm_acle.h arm_sve.h"
+ extra_headers="arm_fp16.h arm_neon.h arm_bf16.h arm_acle.h arm_sve.h
arm_neon_sve_bridge.h"
c_target_objs="aarch64-c.o"
cxx_target_objs="aarch64-c.o"
d_target_objs="aarch64-d.o"
diff --git a/gcc/config/aarch64/aarch64-builtins.h
b/gcc/config/aarch64/aarch64-builtins.h
new file mode 100644
index
0000000000000000000000000000000000000000..eebde448f92c230c8f88b4da1ca8ebd9670b1536
--- /dev/null
+++ b/gcc/config/aarch64/aarch64-builtins.h
@@ -0,0 +1,86 @@
+/* Builtins' description for AArch64 SIMD architecture.
+ Copyright (C) 2023 Free Software Foundation, Inc.
+ This file is part of GCC.
+ GCC is free software; you can redistribute it and/or modify it
+ under the terms of the GNU General Public License as published by
+ the Free Software Foundation; either version 3, or (at your option)
+ any later version.
+ GCC is distributed in the hope that it will be useful, but
+ WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ General Public License for more details.
+ You should have received a copy of the GNU General Public License
+ along with GCC; see the file COPYING3. If not see
+ <http://www.gnu.org/licenses/>. */
+#ifndef GCC_AARCH64_BUILTINS_H
+#define GCC_AARCH64_BUILTINS_H
+#include "tree.h"
+enum aarch64_type_qualifiers
+{
+ /* T foo. */
+ qualifier_none = 0x0,
+ /* unsigned T foo. */
+ qualifier_unsigned = 0x1, /* 1 << 0 */
+ /* const T foo. */
+ qualifier_const = 0x2, /* 1 << 1 */
+ /* T *foo. */
+ qualifier_pointer = 0x4, /* 1 << 2 */
+ /* Used when expanding arguments if an operand could
+ be an immediate. */
+ qualifier_immediate = 0x8, /* 1 << 3 */
+ qualifier_maybe_immediate = 0x10, /* 1 << 4 */
+ /* void foo (...). */
+ qualifier_void = 0x20, /* 1 << 5 */
+ /* 1 << 6 is now unused */
+ /* Some builtins should use the T_*mode* encoded in a simd_builtin_datum
+ rather than using the type of the operand. */
+ qualifier_map_mode = 0x80, /* 1 << 7 */
+ /* qualifier_pointer | qualifier_map_mode */
+ qualifier_pointer_map_mode = 0x84,
+ /* qualifier_const | qualifier_pointer | qualifier_map_mode */
+ qualifier_const_pointer_map_mode = 0x86,
+ /* Polynomial types. */
+ qualifier_poly = 0x100,
+ /* Lane indices - must be in range, and flipped for bigendian. */
+ qualifier_lane_index = 0x200,
+ /* Lane indices for single lane structure loads and stores. */
+ qualifier_struct_load_store_lane_index = 0x400,
+ /* Lane indices selected in pairs. - must be in range, and flipped for
+ bigendian. */
+ qualifier_lane_pair_index = 0x800,
+ /* Lane indices selected in quadtuplets. - must be in range, and
flipped for
+ bigendian. */
+ qualifier_lane_quadtup_index = 0x1000,
+};
+#define ENTRY(E, M, Q, G) E,
+enum aarch64_simd_type
+{
+#include "aarch64-simd-builtin-types.def"
+ ARM_NEON_H_TYPES_LAST
+};
+#undef ENTRY
+struct GTY(()) aarch64_simd_type_info
+{
+ enum aarch64_simd_type type;
+ /* Internal type name. */
+ const char *name;
+ /* Internal type name(mangled). The mangled names conform to the
+ AAPCS64 (see "Procedure Call Standard for the ARM 64-bit
Architecture",
+ Appendix A). To qualify for emission with the mangled names
defined in
+ that document, a vector type must not only be of the correct mode
but also
+ be of the correct internal AdvSIMD vector type (e.g. __Int8x8_t);
these
+ types are registered by aarch64_init_simd_builtin_types (). In other
+ words, vector types defined in other ways e.g. via vector_size
attribute
+ will get default mangled names. */
+ const char *mangle;
+ /* Internal type. */
+ tree itype;
+ /* Element type. */
+ tree eltype;
+ /* Machine mode the internal type maps to. */
+ enum machine_mode mode;
+ /* Qualifiers. */
+ enum aarch64_type_qualifiers q;
+};
+extern aarch64_simd_type_info aarch64_simd_types[];
+#endif
\ No newline at end of file
diff --git a/gcc/config/aarch64/aarch64-builtins.cc
b/gcc/config/aarch64/aarch64-builtins.cc
index
04f59fd9a54306d6422b03e32dce79bc00aed4f8..6a3aca6420624ad5ea93d64d7ed580791d65d4e4
100644
--- a/gcc/config/aarch64/aarch64-builtins.cc
+++ b/gcc/config/aarch64/aarch64-builtins.cc
@@ -923,7 +923,7 @@ struct GTY(()) aarch64_simd_type_info
#define ENTRY(E, M, Q, G) \
{E, "__" #E, #G "__" #E, NULL_TREE, NULL_TREE, E_##M##mode,
qualifier_##Q},
-static GTY(()) struct aarch64_simd_type_info aarch64_simd_types [] = {
+extern GTY(()) struct aarch64_simd_type_info aarch64_simd_types [] = {
#include "aarch64-simd-builtin-types.def"
};
#undef ENTRY
diff --git a/gcc/config/aarch64/aarch64-c.cc
b/gcc/config/aarch64/aarch64-c.cc
index
578ec6f45b06347d90f951b37064006786baf10f..ada8b81a7bef6c2e58b07324a7bfc38eecb651da
100644
--- a/gcc/config/aarch64/aarch64-c.cc
+++ b/gcc/config/aarch64/aarch64-c.cc
@@ -294,6 +294,8 @@ aarch64_pragma_aarch64 (cpp_reader *)
handle_arm_neon_h ();
else if (strcmp (name, "arm_acle.h") == 0)
handle_arm_acle_h ();
+ else if (strcmp (name, "arm_neon_sve_bridge.h") == 0)
+ aarch64_sve::handle_arm_neon_sve_bridge_h ();
else
error ("unknown %<#pragma GCC aarch64%> option %qs", name);
}
diff --git a/gcc/config/aarch64/aarch64-neon-sve-bridge-builtins.def
b/gcc/config/aarch64/aarch64-neon-sve-bridge-builtins.def
new file mode 100644
index
0000000000000000000000000000000000000000..0c3cf233c9382b2f7420379054a53fa846d46c8c
--- /dev/null
+++ b/gcc/config/aarch64/aarch64-neon-sve-bridge-builtins.def
@@ -0,0 +1,28 @@
+/* Builtin lists for AArch64 NEON-SVE-Bridge
+ Copyright (C) 2023 Free Software Foundation, Inc.
+
+ This file is part of GCC.
+
+ GCC is free software; you can redistribute it and/or modify it
+ under the terms of the GNU General Public License as published by
+ the Free Software Foundation; either version 3, or (at your option)
+ any later version.
+
+ GCC is distributed in the hope that it will be useful, but
+ WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ General Public License for more details.
+
+ You should have received a copy of the GNU General Public License
+ along with GCC; see the file COPYING3. If not see
+ <http://www.gnu.org/licenses/>. */
+
+#ifndef DEF_NEON_SVE_FUNCTION
+#define DEF_NEON_SVE_FUNCTION(A, B, C, D)
+#endif
+
+DEF_NEON_SVE_FUNCTION (svset_neonq, set_neonq, all_data, none)
+DEF_NEON_SVE_FUNCTION (svget_neonq, get_neonq, all_data, none)
+DEF_NEON_SVE_FUNCTION (svdup_neonq, dup_neonq, all_data, none)
+
+#undef DEF_NEON_SVE_FUNCTION
\ No newline at end of file
diff --git a/gcc/config/aarch64/aarch64-protos.h
b/gcc/config/aarch64/aarch64-protos.h
index
70303d6fd953e0c397b9138ede8858c2db2e53db..c5e4e20e73cedb363d867a73869c0659ed9b237d
100644
--- a/gcc/config/aarch64/aarch64-protos.h
+++ b/gcc/config/aarch64/aarch64-protos.h
@@ -987,6 +987,7 @@ void handle_arm_neon_h (void);
namespace aarch64_sve {
void init_builtins ();
void handle_arm_sve_h ();
+ void handle_arm_neon_sve_bridge_h ();
tree builtin_decl (unsigned, bool);
bool builtin_type_p (const_tree);
bool builtin_type_p (const_tree, unsigned int *, unsigned int *);
diff --git a/gcc/config/aarch64/aarch64-sve-builtins-base.h
b/gcc/config/aarch64/aarch64-sve-builtins-base.h
index
d300e3a85d00b58ad790851a81d43af709b66bce..df75e4c1ecf81f3ddfa256edbcf8637d092fcfde
100644
--- a/gcc/config/aarch64/aarch64-sve-builtins-base.h
+++ b/gcc/config/aarch64/aarch64-sve-builtins-base.h
@@ -299,6 +299,12 @@ namespace aarch64_sve
extern const function_base *const svzip2;
extern const function_base *const svzip2q;
}
+ namespace neon_sve_bridge_functions
+ {
+ extern const function_base *const svset_neonq;
+ extern const function_base *const svget_neonq;
+ extern const function_base *const svdup_neonq;
+ }
}
#endif
diff --git a/gcc/config/aarch64/aarch64-sve-builtins-base.cc
b/gcc/config/aarch64/aarch64-sve-builtins-base.cc
index
9010ecca6da23c107f5ded9ab3cfa678e308daf9..0acc3acf7d34b54af8679dc36effb85f7b557543
100644
--- a/gcc/config/aarch64/aarch64-sve-builtins-base.cc
+++ b/gcc/config/aarch64/aarch64-sve-builtins-base.cc
@@ -44,6 +44,7 @@
#include "aarch64-sve-builtins-shapes.h"
#include "aarch64-sve-builtins-base.h"
#include "aarch64-sve-builtins-functions.h"
+#include "aarch64-builtins.h"
#include "ssa.h"
#include "gimple-fold.h"
@@ -1064,6 +1065,99 @@ public:
}
};
+class svget_neonq_impl : public function_base
+{
+public:
+  gimple *
+  fold (gimple_folder &f) const override
+  {
+    /* Reinterpret the low 128 bits of the SVE argument as the NEON
+       result type.  NOTE(review): bit offset 0 assumes little-endian
+       lane ordering; confirm the big-endian case.  */
+    tree rhs_tuple = gimple_call_arg (f.call, 0);
+    tree rhs_vector = build3 (BIT_FIELD_REF, TREE_TYPE (f.lhs),
+			      rhs_tuple, bitsize_int (128), bitsize_int (0));
+    return gimple_build_assign (f.lhs, rhs_vector);
+  }
+  rtx
+  expand (function_expander &e) const override
+  {
+    /* svget_neonq takes a single argument, so there is no e.args[1]
+       to index with (that code was copied from the tuple-based svget).
+       The NEON result is always the low 128 bits of the SVE input,
+       i.e. byte offset 0.  */
+    return simplify_gen_subreg (e.vector_mode (0), e.args[0],
+				GET_MODE (e.args[0]), 0);
+  }
+};
+
+class svset_neonq_impl : public function_base
+{
+public:
+  gimple *
+  fold (gimple_folder &f) const override
+  {
+    /* Copy the SVE input to the result, then overwrite its low
+       128 bits with the NEON input.  */
+    tree rhs_tuple = gimple_call_arg (f.call, 0);
+    tree rhs_vector = gimple_call_arg (f.call, 1);
+    gassign *copy = gimple_build_assign (unshare_expr (f.lhs), rhs_tuple);
+    tree lhs_vector = build3 (BIT_INSERT_EXPR, TREE_TYPE (rhs_vector),
+			      f.lhs, rhs_vector, bitsize_int (0));
+    gassign *update = gimple_build_assign (f.lhs, lhs_vector);
+    gsi_insert_after (f.gsi, update, GSI_SAME_STMT);
+    return copy;
+  }
+  rtx
+  expand (function_expander &e) const override
+  {
+    /* svset_neonq has exactly two arguments: the SVE vector (args[0])
+       and the NEON vector (args[1]).  The previous code read an index
+       from e.args[1] and the vector from e.args[2] -- copied from the
+       tuple-based svset -- but neither exists here; the NEON vector
+       always replaces the low 128 bits (byte offset 0).  Return the
+       full SVE result rather than the 128-bit subreg.  */
+    rtx rhs_tuple = e.args[0];
+    rtx rhs_vector = e.args[1];
+    rtx lhs_tuple = e.get_nonoverlapping_reg_target ();
+    emit_move_insn (lhs_tuple, rhs_tuple);
+    rtx lhs_vector = simplify_gen_subreg (GET_MODE (rhs_vector),
+					  lhs_tuple, GET_MODE (lhs_tuple), 0);
+    emit_move_insn (lhs_vector, rhs_vector);
+    return lhs_tuple;
+  }
+};
+
+class svdup_neonq_impl : public function_base
+{
+public:
+  gimple *
+  fold (gimple_folder &f) const override
+  {
+    /* Build a VEC_PERM_EXPR whose indices 0..n-1 repeat across the
+       whole SVE vector, duplicating the NEON input to fill it.  */
+    tree rhs_vector = gimple_call_arg (f.call, 0);
+    unsigned HOST_WIDE_INT neon_nelts;
+    TYPE_VECTOR_SUBPARTS (TREE_TYPE (rhs_vector)).is_constant (&neon_nelts);
+    poly_uint64 sve_nelts = TYPE_VECTOR_SUBPARTS (TREE_TYPE (f.lhs));
+    vec_perm_builder builder (sve_nelts, neon_nelts, 1);
+    for (unsigned int i = 0; i < neon_nelts; i++)
+      builder.quick_push (i);
+    vec_perm_indices indices (builder, 1, neon_nelts);
+    tree perm_type = build_vector_type (ssizetype, sve_nelts);
+    return gimple_build_assign (f.lhs, VEC_PERM_EXPR,
+				rhs_vector, rhs_vector,
+				vec_perm_indices_to_tree (perm_type, indices));
+  }
+  rtx
+  expand (function_expander &e) const override
+  {
+    /* NOTE(review): this expansion path mirrors the predicated svdup
+       lane selection, but svdup_neonq has no predicate or fallback
+       operand; confirm that use_vcond_mask_insn's operand layout is
+       correct for this intrinsic.  */
+    insn_code icode;
+    machine_mode mode = e.vector_mode (0);
+    if (valid_for_const_vector_p (GET_MODE_INNER (mode), e.args.last ()))
+      /* Duplicate the constant to fill a vector.  The pattern optimizes
+	 various cases involving constant operands, falling back to SEL
+	 if necessary.  */
+      icode = code_for_vcond_mask (mode, mode);
+    else
+      /* Use the pattern for selecting between a duplicated scalar
+	 variable and a vector fallback.  */
+      icode = code_for_aarch64_sel_dup (mode);
+    return e.use_vcond_mask_insn (icode);
+  }
+};
+
class svindex_impl : public function_base
{
public:
@@ -3028,5 +3122,8 @@ FUNCTION (svzip1q, unspec_based_function,
(UNSPEC_ZIP1Q, UNSPEC_ZIP1Q,
FUNCTION (svzip2, svzip_impl, (1))
FUNCTION (svzip2q, unspec_based_function, (UNSPEC_ZIP2Q, UNSPEC_ZIP2Q,
UNSPEC_ZIP2Q))
+NEON_SVE_BRIDGE_FUNCTION (svget_neonq, svget_neonq_impl,)
+NEON_SVE_BRIDGE_FUNCTION (svset_neonq, svset_neonq_impl,)
+NEON_SVE_BRIDGE_FUNCTION (svdup_neonq, svdup_neonq_impl,)
} /* end namespace aarch64_sve */
diff --git a/gcc/config/aarch64/aarch64-sve-builtins-functions.h
b/gcc/config/aarch64/aarch64-sve-builtins-functions.h
index
2729877d914414eff33182e03ab1dfc94a3515fa..bfb7fea674a905a2eb99f2bac7cbcb72af681b52
100644
--- a/gcc/config/aarch64/aarch64-sve-builtins-functions.h
+++ b/gcc/config/aarch64/aarch64-sve-builtins-functions.h
@@ -622,4 +622,8 @@ public:
namespace { static CONSTEXPR const CLASS NAME##_obj ARGS; } \
namespace functions { const function_base *const NAME = &NAME##_obj; }
+#define NEON_SVE_BRIDGE_FUNCTION(NAME, CLASS, ARGS) \
+ namespace { static CONSTEXPR const CLASS NAME##_obj ARGS; } \
+ namespace neon_sve_bridge_functions { const function_base *const NAME
= &NAME##_obj; }
+
#endif
diff --git a/gcc/config/aarch64/aarch64-sve-builtins-shapes.h
b/gcc/config/aarch64/aarch64-sve-builtins-shapes.h
index
7483c1d04b8e463e607e8e65aa94233460f77648..30c0bf8503622b0320a334b79c328233248122a4
100644
--- a/gcc/config/aarch64/aarch64-sve-builtins-shapes.h
+++ b/gcc/config/aarch64/aarch64-sve-builtins-shapes.h
@@ -186,6 +186,13 @@ namespace aarch64_sve
extern const function_shape *const unary_uint;
extern const function_shape *const unary_widen;
}
+
+ namespace neon_sve_bridge_shapes
+ {
+ extern const function_shape *const get_neonq;
+ extern const function_shape *const set_neonq;
+ extern const function_shape *const dup_neonq;
+ }
}
#endif
diff --git a/gcc/config/aarch64/aarch64-sve-builtins-shapes.cc
b/gcc/config/aarch64/aarch64-sve-builtins-shapes.cc
index
af816c4c9e705d9cc4bce5cc50481cb27e6a03a7..46e65cc78b3cf7bb70344a856c8fdb481534f46c
100644
--- a/gcc/config/aarch64/aarch64-sve-builtins-shapes.cc
+++ b/gcc/config/aarch64/aarch64-sve-builtins-shapes.cc
@@ -29,6 +29,7 @@
#include "optabs.h"
#include "aarch64-sve-builtins.h"
#include "aarch64-sve-builtins-shapes.h"
+#include "aarch64-builtins.h"
/* In the comments below, _t0 represents the first type suffix and _t1
represents the second. Square brackets enclose characters that are
@@ -145,6 +146,76 @@ parse_element_type (const function_instance
&instance, const char *&format)
gcc_unreachable ();
}
+int
+parse_neon_type (type_suffix_index suffix, int ch)
+{
+ if (ch == 'Q')
+ {
+ switch (suffix)
+ {
+ case TYPE_SUFFIX_s8:
+ return Int8x16_t;
+ case TYPE_SUFFIX_s16:
+ return Int16x8_t;
+ case TYPE_SUFFIX_s32:
+ return Int32x4_t;
+ case TYPE_SUFFIX_s64:
+ return Int64x2_t;
+ case TYPE_SUFFIX_u8:
+ return Uint8x16_t;
+ case TYPE_SUFFIX_u16:
+ return Uint16x8_t;
+ case TYPE_SUFFIX_u32:
+ return Uint32x4_t;
+ case TYPE_SUFFIX_u64:
+ return Uint64x2_t;
+ case TYPE_SUFFIX_f16:
+ return Float16x8_t;
+ case TYPE_SUFFIX_f32:
+ return Float32x4_t;
+ case TYPE_SUFFIX_f64:
+ return Float64x2_t;
+ case TYPE_SUFFIX_bf16:
+ return Bfloat16x8_t;
+ default:
+ gcc_unreachable ();
+ }
+ }
+ if (ch == 'D')
+ {
+ switch (suffix)
+ {
+ case TYPE_SUFFIX_s8:
+ return Int8x8_t;
+ case TYPE_SUFFIX_s16:
+ return Int16x4_t;
+ case TYPE_SUFFIX_s32:
+ return Int32x2_t;
+ case TYPE_SUFFIX_s64:
+ return Int64x1_t;
+ case TYPE_SUFFIX_u8:
+ return Uint8x8_t;
+ case TYPE_SUFFIX_u16:
+ return Uint16x4_t;
+ case TYPE_SUFFIX_u32:
+ return Uint32x2_t;
+ case TYPE_SUFFIX_u64:
+ return Uint64x1_t;
+ case TYPE_SUFFIX_f16:
+ return Float16x4_t;
+ case TYPE_SUFFIX_f32:
+ return Float32x2_t;
+ case TYPE_SUFFIX_f64:
+ return Float64x1_t;
+ case TYPE_SUFFIX_bf16:
+ return Bfloat16x4_t;
+ default:
+ gcc_unreachable ();
+ }
+ }
+ gcc_unreachable ();
+}
+
/* Read and return a type from FORMAT for function INSTANCE. Advance
FORMAT beyond the type string. The format is:
@@ -158,6 +229,8 @@ parse_element_type (const function_instance
&instance, const char *&format)
s<elt> - a scalar type with the given element suffix
t<elt> - a vector or tuple type with given element suffix [*1]
v<elt> - a vector with the given element suffix
+ D<elt> - a 64 bit neon vector
+ Q<elt> - a 128 bit neon vector
where <elt> has the format described above parse_element_type
@@ -224,6 +297,13 @@ parse_type (const function_instance &instance,
const char *&format)
return acle_vector_types[0][type_suffixes[suffix].vector_type];
}
+ if (ch == 'Q' || ch == 'D')
+ {
+ type_suffix_index suffix = parse_element_type (instance, format);
+ int neon_index = parse_neon_type (suffix, ch);
+ return aarch64_simd_types[neon_index].itype;
+ }
+
gcc_unreachable ();
}
@@ -450,6 +530,12 @@ long_type_suffix (function_resolver &r,
type_suffix_index type)
static CONSTEXPR const NAME##_def NAME##_obj; \
namespace shapes { const function_shape *const NAME = &NAME##_obj; }
+/* Declare the function neon_sve_bridge_shape NAME, pointing it to an
instance
+ of class <NAME>_def. */
+#define NEON_SVE_BRIDGE_SHAPE(NAME) \
+ static CONSTEXPR const NAME##_def NAME##_obj; \
+ namespace neon_sve_bridge_shapes { const function_shape *const NAME =
&NAME##_obj; }
+
/* Base class for functions that are not overloaded. */
struct nonoverloaded_base : public function_shape
{
@@ -1917,6 +2003,72 @@ struct get_def : public overloaded_base<0>
};
SHAPE (get)
+/* <t0>xN_t svfoo[_t0](sv<t0>_t). */
+struct get_neonq_def : public overloaded_base<0>
+{
+ void
+ build (function_builder &b, const function_group_info &group) const
override
+ {
+ b.add_overloaded_functions (group, MODE_none);
+ build_all (b, "Q0,v0", group, MODE_none);
+ }
+ tree
+ resolve (function_resolver &r) const override
+ {
+ unsigned int i, nargs;
+ type_suffix_index type;
+ if (!r.check_gp_argument (1, i, nargs)
+ || (type = r.infer_tuple_type (i)) == NUM_TYPE_SUFFIXES)
+ return error_mark_node;
+ return r.resolve_to (r.mode_suffix_id, type);
+ }
+};
+NEON_SVE_BRIDGE_SHAPE (get_neonq)
+
+/* sv<t0>_t svfoo[_t0](sv<t0>_t, <t0>xN_t). */
+struct set_neonq_def : public overloaded_base<0>
+{
+  void
+  build (function_builder &b, const function_group_info &group) const override
+  {
+    b.add_overloaded_functions (group, MODE_none);
+    build_all (b, "v0,v0,Q0", group, MODE_none);
+  }
+  tree
+  resolve (function_resolver &r) const override
+  {
+    unsigned int i, nargs;
+    type_suffix_index type;
+    /* svset_neonq takes two arguments (the SVE vector and the NEON
+       vector); the previous code only required one, so calls with the
+       correct arity would be rejected inconsistently.  */
+    if (!r.check_gp_argument (2, i, nargs)
+	|| (type = r.infer_tuple_type (i)) == NUM_TYPE_SUFFIXES)
+      return error_mark_node;
+    return r.resolve_to (r.mode_suffix_id, type);
+  }
+};
+NEON_SVE_BRIDGE_SHAPE (set_neonq)
+
+/* sv<t0>_t svfoo[_t0](<t0>xN_t). */
+struct dup_neonq_def : public overloaded_base<0>
+{
+ void
+ build (function_builder &b, const function_group_info &group) const
override
+ {
+ b.add_overloaded_functions (group, MODE_none);
+ build_all (b, "v0,Q0", group, MODE_none);
+ }
+ tree
+ resolve (function_resolver &r) const override
+ {
+ unsigned int i, nargs;
+ type_suffix_index type;
+ if (!r.check_gp_argument (1, i, nargs)
+ || (type = r.infer_tuple_type (i)) == NUM_TYPE_SUFFIXES)
+ return error_mark_node;
+ return r.resolve_to (r.mode_suffix_id, type);
+ }
+};
+NEON_SVE_BRIDGE_SHAPE (dup_neonq)
+
/* sv<t0>_t svfoo[_t0](sv<t0>_t, uint64_t)
<t0>_t svfoo[_n_t0](<t0>_t, uint64_t)
diff --git a/gcc/config/aarch64/aarch64-sve-builtins.cc
b/gcc/config/aarch64/aarch64-sve-builtins.cc
index
161a14edde7c9fb1b13b146cf50463e2d78db264..c994c83c5777e500ab2cf76ee2ed29dcebca074f
100644
--- a/gcc/config/aarch64/aarch64-sve-builtins.cc
+++ b/gcc/config/aarch64/aarch64-sve-builtins.cc
@@ -529,6 +529,13 @@ static CONSTEXPR const function_group_info
function_groups[] = {
#include "aarch64-sve-builtins.def"
};
+/* A list of all NEON-SVE-Bridge ACLE functions. */
+static CONSTEXPR const function_group_info neon_sve_function_groups[] = {
+#define DEF_NEON_SVE_FUNCTION(NAME, SHAPE, TYPES, PREDS) \
+ { #NAME, &neon_sve_bridge_functions::NAME,
&neon_sve_bridge_shapes::SHAPE, types_##TYPES, preds_##PREDS },
+#include "aarch64-neon-sve-bridge-builtins.def"
+};
+
/* The scalar type associated with each vector type. */
extern GTY(()) tree scalar_types[NUM_VECTOR_TYPES];
tree scalar_types[NUM_VECTOR_TYPES];
@@ -3560,6 +3567,20 @@ handle_arm_sve_h ()
builder.register_function_group (function_groups[i]);
}
+/* Implement #pragma GCC aarch64 "arm_neon_sve_bridge.h".  */
+void
+handle_arm_neon_sve_bridge_h ()
+{
+  sve_switcher sve;
+
+  /* Define the functions.  arm_neon_sve_bridge.h includes arm_sve.h,
+     so handle_arm_sve_h has normally already created the function
+     table; unconditionally reallocating it here would leak the old
+     table and orphan the SVE registrations, so only allocate it when
+     it does not yet exist.  */
+  if (!function_table)
+    function_table = new hash_table<registered_function_hasher> (1023);
+  function_builder builder;
+  for (unsigned int i = 0; i < ARRAY_SIZE (neon_sve_function_groups); ++i)
+    builder.register_function_group (neon_sve_function_groups[i]);
+}
+
/* Return the function decl with SVE function subcode CODE, or
error_mark_node
if no such function exists. */
tree
diff --git a/gcc/config/aarch64/arm_neon_sve_bridge.h
b/gcc/config/aarch64/arm_neon_sve_bridge.h
new file mode 100644
index
0000000000000000000000000000000000000000..8f526eae86b94f615d22fe8de52583bb403e102e
--- /dev/null
+++ b/gcc/config/aarch64/arm_neon_sve_bridge.h
@@ -0,0 +1,38 @@
+/* AArch64 NEON-SVE Bridge intrinsics include file.
+ Copyright (C) 2023 Free Software Foundation, Inc.
+
+ This file is part of GCC.
+
+ GCC is free software; you can redistribute it and/or modify it
+ under the terms of the GNU General Public License as published
+ by the Free Software Foundation; either version 3, or (at your
+ option) any later version.
+
+ GCC is distributed in the hope that it will be useful, but WITHOUT
+ ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
+ or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public
+ License for more details.
+
+ Under Section 7 of GPL version 3, you are granted additional
+ permissions described in the GCC Runtime Library Exception, version
+ 3.1, as published by the Free Software Foundation.
+
+ You should have received a copy of the GNU General Public License and
+ a copy of the GCC Runtime Library Exception along with this program;
+ see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
+ <http://www.gnu.org/licenses/>. */
+
+#ifndef _ARM_NEON_SVE_BRIDGE_H_
+#define _ARM_NEON_SVE_BRIDGE_H_
+
+#include <arm_neon.h>
+#include <arm_sve.h>
+
+/* NOTE: This implementation of arm_neon_sve_bridge.h is intentionally
short. It does
+ not define the types and intrinsic functions directly in C and C++
+ code, but instead uses the following pragma to tell GCC to insert the
+ necessary type and function definitions itself. The net effect is the
+ same, and the file is a complete implementation of
arm_neon_sve_bridge.h. */
+#pragma GCC aarch64 "arm_neon_sve_bridge.h"
+
+#endif
\ No newline at end of file
diff --git a/gcc/testsuite/gcc.c-torture/execute/neon-sve-bridge.c
b/gcc/testsuite/gcc.c-torture/execute/neon-sve-bridge.c
new file mode 100644
index
0000000000000000000000000000000000000000..45dbcf97a647f0842693dbe47eedb4264e7b61fd
--- /dev/null
+++ b/gcc/testsuite/gcc.c-torture/execute/neon-sve-bridge.c
@@ -0,0 +1,55 @@
+// { dg-options "-march=armv8.2-a+sve" }
+// { dg-do run { target aarch64_sve_hw } }
+
+#include <arm_neon_sve_bridge.h>
+
+extern void abort (void);
+
+int
+svget_neonq_test ()
+{
+ int64_t val1 = 987654321;
+ svint64_t sveInput = svdup_n_s64(val1);
+ int64x2_t neonReturn = svget_neonq_s64 (sveInput);
+ int64_t val1Return = vgetq_lane_s64(neonReturn, 1);
+ if (val1 == val1Return)
+ return 0;
+ return 1;
+}
+
+int
+svset_neonq_test ()
+{
+  int64_t val2 = 123456789;
+  int64x2_t NeonInput = vdupq_n_s64 (val2);
+  /* Initialize the SVE input: the previous code passed an
+     uninitialized vector to svset_neonq_s64, which is undefined
+     behavior even though only its low 128 bits are overwritten
+     for 128-bit vector lengths.  */
+  svint64_t sveReturn = svdup_n_s64 (0);
+  sveReturn = svset_neonq_s64 (sveReturn, NeonInput);
+  /* With an all-true predicate, svlasta returns element 0, which
+     svset_neonq has just replaced with val2.  */
+  int64_t val2Return = svlasta_s64 (svptrue_b64 (), sveReturn);
+  if (val2 == val2Return)
+    return 0;
+  return 1;
+}
+
+int
+svdup_neonq_test ()
+{
+ uint32_t val2 = 123456789;
+ uint32x4_t NeonInput = vdupq_n_u32(val2);
+ svuint32_t sveReturn = svdup_neonq_u32 (NeonInput);
+ uint32_t val2Return = svlastb_u32(svptrue_b32(), sveReturn);
+ if (val2 == val2Return)
+ return 0;
+ return 1;
+}
+
+int
+main ()
+{
+ if (svget_neonq_test() == 1)
+ abort ();
+ if (svset_neonq_test() == 1)
+ abort ();
+ if (svdup_neonq_test() == 1)
+ abort ();
+ return 0;
+}
\ No newline at end of file