/* ACLE support for AArch64 SVE (function_base classes)
   Copyright (C) 2018-2022 Free Software Foundation, Inc.

   This file is part of GCC.

   GCC is free software; you can redistribute it and/or modify it
   under the terms of the GNU General Public License as published by
   the Free Software Foundation; either version 3, or (at your option)
   any later version.

   GCC is distributed in the hope that it will be useful, but
   WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
   General Public License for more details.

   You should have received a copy of the GNU General Public License
   along with GCC; see the file COPYING3.  If not see
   <http://www.gnu.org/licenses/>.  */

#ifndef GCC_AARCH64_SVE_BUILTINS_FUNCTIONS_H
#define GCC_AARCH64_SVE_BUILTINS_FUNCTIONS_H

namespace aarch64_sve {

/* Wrap T, which is derived from function_base, and indicate that the
   function never has side effects.  It is only necessary to use this
   wrapper on functions that might have floating-point suffixes, since
   otherwise we assume by default that the function has no side effects.  */
template<typename T>
class quiet : public T
{
public:
  CONSTEXPR quiet () : T () {}

  /* Unfortunately we can't use parameter packs yet.  */
  template<typename T1>
  CONSTEXPR quiet (const T1 &t1) : T (t1) {}

  template<typename T1, typename T2>
  CONSTEXPR quiet (const T1 &t1, const T2 &t2) : T (t1, t2) {}

  template<typename T1, typename T2, typename T3>
  CONSTEXPR quiet (const T1 &t1, const T2 &t2, const T3 &t3)
    : T (t1, t2, t3) {}

  unsigned int
  call_properties (const function_instance &) const OVERRIDE
  {
    return 0;
  }
};

/* A function_base that sometimes or always operates on tuples of
   vectors.  */
class multi_vector_function : public function_base
{
public:
  CONSTEXPR multi_vector_function (unsigned int vectors_per_tuple)
    : m_vectors_per_tuple (vectors_per_tuple) {}

  unsigned int
  vectors_per_tuple () const OVERRIDE
  {
    return m_vectors_per_tuple;
  }

  /* The number of vectors in a tuple, or 1 if the function only operates
     on single vectors.  */
  unsigned int m_vectors_per_tuple;
};
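
/* For illustration: implementations opt in by inheriting through the
   quiet<> wrapper rather than from function_base directly, as the
   permute class later in this file does:

     class permute : public quiet<function_base> { ... };

   The forwarding constructors above pass up to three constructor
   arguments through to T.  */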

/* A function_base that loads or stores contiguous memory elements
   without extending or truncating them.  */
class full_width_access : public multi_vector_function
{
public:
  CONSTEXPR full_width_access (unsigned int vectors_per_tuple = 1)
    : multi_vector_function (vectors_per_tuple) {}

  tree
  memory_scalar_type (const function_instance &fi) const OVERRIDE
  {
    return fi.scalar_type (0);
  }

  machine_mode
  memory_vector_mode (const function_instance &fi) const OVERRIDE
  {
    machine_mode mode = fi.vector_mode (0);
    if (m_vectors_per_tuple != 1)
      mode = targetm.array_mode (mode, m_vectors_per_tuple).require ();
    return mode;
  }
};

/* A function_base that loads elements from memory and extends them
   to a wider element.  The memory element type is a fixed part of
   the function base name.  */
class extending_load : public function_base
{
public:
  CONSTEXPR extending_load (type_suffix_index memory_type)
    : m_memory_type (memory_type) {}

  unsigned int
  call_properties (const function_instance &) const OVERRIDE
  {
    return CP_READ_MEMORY;
  }

  tree
  memory_scalar_type (const function_instance &) const OVERRIDE
  {
    return scalar_types[type_suffixes[m_memory_type].vector_type];
  }

  machine_mode
  memory_vector_mode (const function_instance &fi) const OVERRIDE
  {
    machine_mode mem_mode = type_suffixes[m_memory_type].vector_mode;
    machine_mode reg_mode = fi.vector_mode (0);
    return aarch64_sve_data_mode (GET_MODE_INNER (mem_mode),
                                  GET_MODE_NUNITS (reg_mode)).require ();
  }

  /* Return the rtx code associated with the kind of extension that
     the load performs.  */
  rtx_code
  extend_rtx_code () const
  {
    return (type_suffixes[m_memory_type].unsigned_p
            ? ZERO_EXTEND : SIGN_EXTEND);
  }

  /* The type of the memory elements.  This is part of the function base
     name rather than a true type suffix.  */
  type_suffix_index m_memory_type;
};
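
/* Sketch of a definition using extending_load (hypothetical name; the
   real svld1sb implementation goes through a derived class in
   aarch64-sve-builtins-base.cc):

     FUNCTION (svld1sb_example, extending_load, (TYPE_SUFFIX_s8))

   The memory elements are signed bytes, so extend_rtx_code () returns
   SIGN_EXTEND and each element is widened to the register element size
   given by type suffix 0.  The FUNCTION macro is defined at the end of
   this file.  */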

/* A function_base that truncates vector elements and stores them to memory.
   The memory element width is a fixed part of the function base name.  */
class truncating_store : public function_base
{
public:
  CONSTEXPR truncating_store (scalar_int_mode to_mode) : m_to_mode (to_mode) {}

  unsigned int
  call_properties (const function_instance &) const OVERRIDE
  {
    return CP_WRITE_MEMORY;
  }

  tree
  memory_scalar_type (const function_instance &fi) const OVERRIDE
  {
    /* In truncating stores, the signedness of the memory element is defined
       to be the same as the signedness of the vector element.  The signedness
       doesn't make any difference to the behavior of the function.  */
    type_class_index tclass = fi.type_suffix (0).tclass;
    unsigned int element_bits = GET_MODE_BITSIZE (m_to_mode);
    type_suffix_index suffix = find_type_suffix (tclass, element_bits);
    return scalar_types[type_suffixes[suffix].vector_type];
  }

  machine_mode
  memory_vector_mode (const function_instance &fi) const OVERRIDE
  {
    poly_uint64 nunits = GET_MODE_NUNITS (fi.vector_mode (0));
    return aarch64_sve_data_mode (m_to_mode, nunits).require ();
  }

  /* The mode of a single memory element.  */
  scalar_int_mode m_to_mode;
};

/* An incomplete function_base for functions that have an associated rtx code.
   It simply records information about the mapping for derived classes
   to use.  */
class rtx_code_function_base : public function_base
{
public:
  CONSTEXPR rtx_code_function_base (rtx_code code_for_sint,
                                    rtx_code code_for_uint,
                                    int unspec_for_fp = -1)
    : m_code_for_sint (code_for_sint), m_code_for_uint (code_for_uint),
      m_unspec_for_fp (unspec_for_fp) {}

  /* The rtx code to use for signed and unsigned integers respectively.
     Can be UNKNOWN for functions that don't have integer forms.  */
  rtx_code m_code_for_sint;
  rtx_code m_code_for_uint;

  /* The UNSPEC_COND_* to use for floating-point operations.  Can be -1
     for functions that only operate on integers.  */
  int m_unspec_for_fp;
};

/* A function_base for functions that have an associated rtx code.
   It supports all forms of predication except PRED_implicit.  */
class rtx_code_function : public rtx_code_function_base
{
public:
  CONSTEXPR rtx_code_function (rtx_code code_for_sint, rtx_code code_for_uint,
                               int unspec_for_fp = -1)
    : rtx_code_function_base (code_for_sint, code_for_uint, unspec_for_fp) {}

  rtx
  expand (function_expander &e) const OVERRIDE
  {
    return e.map_to_rtx_codes (m_code_for_sint, m_code_for_uint,
                               m_unspec_for_fp);
  }
};
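
/* Sketch of a definition using rtx_code_function (hypothetical name,
   following the svadd pattern; the unspec constant comes from the main
   AArch64 backend):

     FUNCTION (svadd_example, rtx_code_function,
               (PLUS, PLUS, UNSPEC_COND_FADD))

   PLUS covers both the signed and unsigned integer suffixes, while
   floating-point suffixes expand through the predicated
   UNSPEC_COND_FADD patterns.  */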

/* Like rtx_code_function, but for functions that take what is normally
   the final argument first.  One use of this class is to handle binary
   reversed operations; another is to handle MLA-style operations that
   are normally expressed in GCC as MAD-style operations.  */
class rtx_code_function_rotated : public rtx_code_function_base
{
public:
  CONSTEXPR rtx_code_function_rotated (rtx_code code_for_sint,
                                       rtx_code code_for_uint,
                                       int unspec_for_fp = -1)
    : rtx_code_function_base (code_for_sint, code_for_uint, unspec_for_fp) {}

  rtx
  expand (function_expander &e) const OVERRIDE
  {
    /* Rotate the inputs into their normal order, but continue to make _m
       functions merge with what was originally the first vector argument.  */
    unsigned int nargs = e.args.length ();
    e.rotate_inputs_left (e.pred != PRED_none ? 1 : 0, nargs);
    return e.map_to_rtx_codes (m_code_for_sint, m_code_for_uint,
                               m_unspec_for_fp, nargs - 1);
  }
};

/* An incomplete function_base for functions that have an associated
   unspec code, with separate codes for signed integers, unsigned
   integers and floating-point values.  The class simply records
   information about the mapping for derived classes to use.  */
class unspec_based_function_base : public function_base
{
public:
  CONSTEXPR unspec_based_function_base (int unspec_for_sint,
                                        int unspec_for_uint,
                                        int unspec_for_fp)
    : m_unspec_for_sint (unspec_for_sint),
      m_unspec_for_uint (unspec_for_uint),
      m_unspec_for_fp (unspec_for_fp)
  {}

  /* Return the unspec code to use for INSTANCE, based on type suffix 0.  */
  int
  unspec_for (const function_instance &instance) const
  {
    return (!instance.type_suffix (0).integer_p ? m_unspec_for_fp
            : instance.type_suffix (0).unsigned_p ? m_unspec_for_uint
            : m_unspec_for_sint);
  }

  /* The unspec code associated with signed-integer, unsigned-integer
     and floating-point operations respectively.  */
  int m_unspec_for_sint;
  int m_unspec_for_uint;
  int m_unspec_for_fp;
};

/* A function_base for functions that have an associated unspec code.
   It supports all forms of predication except PRED_implicit.  */
class unspec_based_function : public unspec_based_function_base
{
public:
  CONSTEXPR unspec_based_function (int unspec_for_sint, int unspec_for_uint,
                                   int unspec_for_fp)
    : unspec_based_function_base (unspec_for_sint, unspec_for_uint,
                                  unspec_for_fp)
  {}

  rtx
  expand (function_expander &e) const OVERRIDE
  {
    return e.map_to_unspecs (m_unspec_for_sint, m_unspec_for_uint,
                             m_unspec_for_fp);
  }
};
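
/* Illustration of the rotation above (hypothetical name, following the
   ACLE "reversed subtraction" functions such as svsubr): for

     svsubr_example_m (pg, a, b)   ->   b - a

   the arguments arrive with a first, are rotated into GCC's normal
   (b - a) operand order, and nargs - 1 is passed on so that _m
   predication still merges with the original first vector argument,
   a.  */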

/* Like unspec_based_function, but for functions that take what is normally
   the final argument first.  One use of this class is to handle binary
   reversed operations; another is to handle MLA-style operations that
   are normally expressed in GCC as MAD-style operations.  */
class unspec_based_function_rotated : public unspec_based_function_base
{
public:
  CONSTEXPR unspec_based_function_rotated (int unspec_for_sint,
                                           int unspec_for_uint,
                                           int unspec_for_fp)
    : unspec_based_function_base (unspec_for_sint, unspec_for_uint,
                                  unspec_for_fp)
  {}

  rtx
  expand (function_expander &e) const OVERRIDE
  {
    /* Rotate the inputs into their normal order, but continue to make _m
       functions merge with what was originally the first vector argument.  */
    unsigned int nargs = e.args.length ();
    e.rotate_inputs_left (e.pred != PRED_none ? 1 : 0, nargs);
    return e.map_to_unspecs (m_unspec_for_sint, m_unspec_for_uint,
                             m_unspec_for_fp, nargs - 1);
  }
};

/* Like unspec_based_function, but map the function directly to
   CODE (UNSPEC, M) instead of using the generic predication-based
   expansion, where M is the vector mode associated with type suffix 0.
   This is useful if the unspec doesn't describe the full operation or
   if the usual predication rules don't apply for some reason.  */
template<insn_code (*CODE) (int, machine_mode)>
class unspec_based_function_exact_insn : public unspec_based_function_base
{
public:
  CONSTEXPR unspec_based_function_exact_insn (int unspec_for_sint,
                                              int unspec_for_uint,
                                              int unspec_for_fp)
    : unspec_based_function_base (unspec_for_sint, unspec_for_uint,
                                  unspec_for_fp)
  {}

  rtx
  expand (function_expander &e) const OVERRIDE
  {
    return e.use_exact_insn (CODE (unspec_for (e), e.vector_mode (0)));
  }
};

/* A function that performs an unspec and then adds it to another value.  */
typedef unspec_based_function_exact_insn<code_for_aarch64_sve_add>
  unspec_based_add_function;
typedef unspec_based_function_exact_insn<code_for_aarch64_sve_add_lane>
  unspec_based_add_lane_function;

/* Generic unspec-based _lane function.  */
typedef unspec_based_function_exact_insn<code_for_aarch64_sve_lane>
  unspec_based_lane_function;

/* A function that uses aarch64_pred* patterns regardless of the
   predication type.  */
typedef unspec_based_function_exact_insn<code_for_aarch64_pred>
  unspec_based_pred_function;

/* Like unspec_based_add_function and unspec_based_add_lane_function,
   but using saturating addition.  */
typedef unspec_based_function_exact_insn<code_for_aarch64_sve_qadd>
  unspec_based_qadd_function;
typedef unspec_based_function_exact_insn<code_for_aarch64_sve_qadd_lane>
  unspec_based_qadd_lane_function;

/* Like unspec_based_sub_function and unspec_based_sub_lane_function,
   but using saturating subtraction.  */
typedef unspec_based_function_exact_insn<code_for_aarch64_sve_qsub>
  unspec_based_qsub_function;
typedef unspec_based_function_exact_insn<code_for_aarch64_sve_qsub_lane>
  unspec_based_qsub_lane_function;

/* A function that performs an unspec and then subtracts it from
   another value.  */
typedef unspec_based_function_exact_insn<code_for_aarch64_sve_sub>
  unspec_based_sub_function;
typedef unspec_based_function_exact_insn<code_for_aarch64_sve_sub_lane>
  unspec_based_sub_lane_function;
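
/* Sketch of how the typedefs above are used (hypothetical name,
   following the SVE2 svqdmlalb pattern):

     FUNCTION (svqdmlalb_example, unspec_based_qadd_function,
               (UNSPEC_SQDMULLB, -1, -1))

   Here the unspec describes only the saturating doubling multiply-long;
   the qadd template argument supplies the final saturating addition,
   and the -1s indicate that there are no unsigned or floating-point
   forms.  */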

/* A function that acts like unspec_based_function_exact_insn<INT_CODE>
   when operating on integers, but that expands to an (fma ...)-style
   aarch64_sve* operation when applied to floats.  */
template<insn_code (*INT_CODE) (int, machine_mode)>
class unspec_based_fused_function : public unspec_based_function_base
{
public:
  CONSTEXPR unspec_based_fused_function (int unspec_for_sint,
                                         int unspec_for_uint,
                                         int unspec_for_fp)
    : unspec_based_function_base (unspec_for_sint, unspec_for_uint,
                                  unspec_for_fp)
  {}

  rtx
  expand (function_expander &e) const OVERRIDE
  {
    int unspec = unspec_for (e);
    insn_code icode;
    if (e.type_suffix (0).float_p)
      {
	/* Put the operands in the normal (fma ...) order, with the accumulator
	   last.  This fits naturally since that's also the unprinted operand
	   in the asm output.  */
	e.rotate_inputs_left (0, e.pred != PRED_none ? 4 : 3);
	icode = code_for_aarch64_sve (unspec, e.vector_mode (0));
      }
    else
      icode = INT_CODE (unspec, e.vector_mode (0));
    return e.use_exact_insn (icode);
  }
};
typedef unspec_based_fused_function<code_for_aarch64_sve_add>
  unspec_based_mla_function;
typedef unspec_based_fused_function<code_for_aarch64_sve_sub>
  unspec_based_mls_function;

/* Like unspec_based_fused_function, but for _lane functions.  */
template<insn_code (*INT_CODE) (int, machine_mode)>
class unspec_based_fused_lane_function : public unspec_based_function_base
{
public:
  CONSTEXPR unspec_based_fused_lane_function (int unspec_for_sint,
                                              int unspec_for_uint,
                                              int unspec_for_fp)
    : unspec_based_function_base (unspec_for_sint, unspec_for_uint,
                                  unspec_for_fp)
  {}

  rtx
  expand (function_expander &e) const OVERRIDE
  {
    int unspec = unspec_for (e);
    insn_code icode;
    if (e.type_suffix (0).float_p)
      {
	/* Put the operands in the normal (fma ...) order, with the accumulator
	   last.  This fits naturally since that's also the unprinted operand
	   in the asm output.  */
	e.rotate_inputs_left (0, e.pred != PRED_none ? 5 : 4);
	icode = code_for_aarch64_lane (unspec, e.vector_mode (0));
      }
    else
      icode = INT_CODE (unspec, e.vector_mode (0));
    return e.use_exact_insn (icode);
  }
};
typedef unspec_based_fused_lane_function<code_for_aarch64_sve_add_lane>
  unspec_based_mla_lane_function;
typedef unspec_based_fused_lane_function<code_for_aarch64_sve_sub_lane>
  unspec_based_mls_lane_function;
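
/* Sketch (hypothetical name, following the SVE2 svmlalb pattern):

     FUNCTION (svmlalb_example, unspec_based_mla_function,
               (UNSPEC_SMULLB, UNSPEC_UMULLB, UNSPEC_FMLALB))

   Integer suffixes expand to the widening multiply described by the
   unspec followed by an addition, while the floating-point suffix maps
   directly to the fused UNSPEC_FMLALB pattern.  */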

/* A function_base that uses CODE_FOR_MODE (M) to get the associated
   instruction code, where M is the vector mode associated with type
   suffix N.  */
template<insn_code (*CODE_FOR_MODE) (machine_mode), unsigned int N>
class code_for_mode_function : public function_base
{
public:
  rtx
  expand (function_expander &e) const OVERRIDE
  {
    return e.use_exact_insn (CODE_FOR_MODE (e.vector_mode (N)));
  }
};

/* A function that uses code_for_<PATTERN> (M), where M is the vector
   mode associated with the first type suffix.  */
#define CODE_FOR_MODE0(PATTERN) code_for_mode_function<code_for_##PATTERN, 0>

/* Likewise for the second type suffix.  */
#define CODE_FOR_MODE1(PATTERN) code_for_mode_function<code_for_##PATTERN, 1>

/* Like CODE_FOR_MODE0, but the function doesn't raise exceptions when
   operating on floating-point data.  */
#define QUIET_CODE_FOR_MODE0(PATTERN) \
  quiet< code_for_mode_function<code_for_##PATTERN, 0> >

/* A function_base for functions that always expand to a fixed insn pattern,
   regardless of what the suffixes are.  */
class fixed_insn_function : public function_base
{
public:
  CONSTEXPR fixed_insn_function (insn_code code) : m_code (code) {}

  rtx
  expand (function_expander &e) const OVERRIDE
  {
    return e.use_exact_insn (m_code);
  }

  /* The instruction to use.  */
  insn_code m_code;
};

/* A function_base for functions that permute their arguments.  */
class permute : public quiet<function_base>
{
public:
  /* Fold a unary or binary permute with the permute vector given by
     BUILDER.  */
  gimple *
  fold_permute (const gimple_folder &f, const vec_perm_builder &builder) const
  {
    /* Punt for now on _b16 and wider; we'd need more complex evpc logic
       to rerecognize the result.  */
    if (f.type_suffix (0).bool_p && f.type_suffix (0).element_bits > 8)
      return NULL;

    unsigned int nargs = gimple_call_num_args (f.call);
    poly_uint64 nelts = TYPE_VECTOR_SUBPARTS (TREE_TYPE (f.lhs));
    vec_perm_indices indices (builder, nargs, nelts);
    tree perm_type = build_vector_type (ssizetype, nelts);
    return gimple_build_assign (f.lhs, VEC_PERM_EXPR,
                                gimple_call_arg (f.call, 0),
                                gimple_call_arg (f.call, nargs - 1),
                                vec_perm_indices_to_tree (perm_type, indices));
  }
};

/* A function_base for functions that permute two vectors using a fixed
   choice of indices.  */
class binary_permute : public permute
{
public:
  CONSTEXPR binary_permute (int unspec) : m_unspec (unspec) {}

  rtx
  expand (function_expander &e) const OVERRIDE
  {
    insn_code icode = code_for_aarch64_sve (m_unspec, e.vector_mode (0));
    return e.use_exact_insn (icode);
  }

  /* The unspec code associated with the operation.  */
  int m_unspec;
};
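
/* Sketch (hypothetical name, following the svzip1 pattern): a fixed
   interleave of two vectors can be registered as:

     FUNCTION (svzip1_example, binary_permute, (UNSPEC_ZIP1))

   A derived class would typically also override fold () and use
   fold_permute above to fold the call to a VEC_PERM_EXPR at the
   gimple level.  */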

/* A function_base for functions that reduce a vector to a scalar.  */
class reduction : public function_base
{
public:
  CONSTEXPR reduction (int unspec)
    : m_unspec_for_sint (unspec),
      m_unspec_for_uint (unspec),
      m_unspec_for_fp (unspec)
  {}

  CONSTEXPR reduction (int unspec_for_sint, int unspec_for_uint,
                       int unspec_for_fp)
    : m_unspec_for_sint (unspec_for_sint),
      m_unspec_for_uint (unspec_for_uint),
      m_unspec_for_fp (unspec_for_fp)
  {}

  rtx
  expand (function_expander &e) const OVERRIDE
  {
    machine_mode mode = e.vector_mode (0);
    int unspec = (!e.type_suffix (0).integer_p ? m_unspec_for_fp
                  : e.type_suffix (0).unsigned_p ? m_unspec_for_uint
                  : m_unspec_for_sint);
    /* There's no distinction between SADDV and UADDV for 64-bit elements;
       the signed versions only exist for narrower elements.  */
    if (GET_MODE_UNIT_BITSIZE (mode) == 64 && unspec == UNSPEC_SADDV)
      unspec = UNSPEC_UADDV;
    return e.use_exact_insn (code_for_aarch64_pred_reduc (unspec, mode));
  }

  /* The unspec code associated with signed-integer, unsigned-integer
     and floating-point operations respectively.  */
  int m_unspec_for_sint;
  int m_unspec_for_uint;
  int m_unspec_for_fp;
};

/* A function_base for functions that shift narrower-than-64-bit values
   by 64-bit amounts.  */
class shift_wide : public function_base
{
public:
  CONSTEXPR shift_wide (rtx_code code, int wide_unspec)
    : m_code (code), m_wide_unspec (wide_unspec) {}

  rtx
  expand (function_expander &e) const OVERRIDE
  {
    machine_mode mode = e.vector_mode (0);
    machine_mode elem_mode = GET_MODE_INNER (mode);

    /* If the argument is a constant that the normal shifts can handle
       directly, use them instead.  */
    rtx shift = unwrap_const_vec_duplicate (e.args.last ());
    if (aarch64_simd_shift_imm_p (shift, elem_mode, m_code == ASHIFT))
      {
	e.args.last () = shift;
	return e.map_to_rtx_codes (m_code, m_code, -1);
      }

    if (e.pred == PRED_x)
      return e.use_unpred_insn (code_for_aarch64_sve (m_wide_unspec, mode));

    return e.use_cond_insn (code_for_cond (m_wide_unspec, mode));
  }

  /* The rtx code associated with a "normal" shift.  */
  rtx_code m_code;

  /* The unspec code associated with the wide shift.  */
  int m_wide_unspec;
};
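
/* Sketch (hypothetical name, following the svmaxv pattern): a maximum
   reduction selects its unspec by type class and signedness:

     FUNCTION (svmaxv_example, reduction,
               (UNSPEC_SMAXV, UNSPEC_UMAXV, UNSPEC_FMAXV))

   The single-argument constructor serves operations such as the
   bitwise reductions, where the same unspec is used for every type
   suffix.  */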

/* A function_base for unary functions that count bits.  */
class unary_count : public quiet<function_base>
{
public:
  CONSTEXPR unary_count (rtx_code code) : m_code (code) {}

  rtx
  expand (function_expander &e) const OVERRIDE
  {
    /* The md patterns treat the operand as an integer.  */
    machine_mode mode = aarch64_sve_int_mode (e.vector_mode (0));
    e.args.last () = gen_lowpart (mode, e.args.last ());

    if (e.pred == PRED_x)
      return e.use_pred_x_insn (code_for_aarch64_pred (m_code, mode));

    return e.use_cond_insn (code_for_cond (m_code, mode));
  }

  /* The rtx code associated with the operation.  */
  rtx_code m_code;
};

/* A function_base for svwhile* functions.  */
class while_comparison : public function_base
{
public:
  CONSTEXPR while_comparison (int unspec_for_sint, int unspec_for_uint)
    : m_unspec_for_sint (unspec_for_sint),
      m_unspec_for_uint (unspec_for_uint)
  {}

  rtx
  expand (function_expander &e) const OVERRIDE
  {
    /* Suffix 0 determines the predicate mode, suffix 1 determines the
       scalar mode and signedness.  */
    int unspec = (e.type_suffix (1).unsigned_p
                  ? m_unspec_for_uint
                  : m_unspec_for_sint);
    machine_mode pred_mode = e.vector_mode (0);
    scalar_mode reg_mode = GET_MODE_INNER (e.vector_mode (1));
    return e.use_exact_insn (code_for_while (unspec, reg_mode, pred_mode));
  }

  /* The unspec codes associated with signed and unsigned operations
     respectively.  */
  int m_unspec_for_sint;
  int m_unspec_for_uint;
};

}

/* Declare the global function base NAME, creating it from an instance
   of class CLASS with constructor arguments ARGS.  */
#define FUNCTION(NAME, CLASS, ARGS) \
  namespace { static CONSTEXPR const CLASS NAME##_obj ARGS; } \
  namespace functions { const function_base *const NAME = &NAME##_obj; }

#endif