Add ACLE support for the SVE AES2 multi-vector AES indexed
instructions and the 128-bit PMULL/PMLAL pair forms.
This adds builtin shapes and expanders for svaese_lane, svaesd_lane,
svaesemc_lane, svaesdimc_lane, svpmull_pair and svpmlal_pair, together
with the corresponding RTL patterns and tests. Also add preprocessor
feature macros for SVE AES2 and SSVE AES.
gcc/
* config/aarch64/aarch64-c.cc (aarch64_update_cpp_builtins): Define
__ARM_FEATURE_SVE_AES2 and __ARM_FEATURE_SSVE_AES.
* config/aarch64/aarch64-sve-builtins-functions.h
(unspec_based_aes_lane_function): New typedef.
(unspec_based_aes_lane_mc_function): Likewise.
* config/aarch64/aarch64-sve-builtins-shapes.cc
(binary_tuple_uint64_n_def): New shape.
(ternary_tuple_uint64_n_def): Likewise.
(binary_aes_lane_def): Likewise.
* config/aarch64/aarch64-sve-builtins-shapes.h: Declare new shapes.
* config/aarch64/aarch64-sve-builtins-sve2.cc: Add new function
entries.
* config/aarch64/aarch64-sve-builtins-sve2.def: Add new ACLE
builtin definitions.
* config/aarch64/aarch64-sve-builtins-sve2.h: Declare new functions.
* config/aarch64/aarch64-sve2.md: Add PMULL/PMLAL pair and AES
indexed multi-vector patterns.
* config/aarch64/aarch64.h (TARGET_SVE_AES2): Define.
* config/aarch64/aarch64.md (UNSPEC_SSVE_LANE_SELECT): New unspec.
* config/aarch64/iterators.md: Add iterators and attrs for new
patterns.
* config/aarch64/predicates.md (const_0_to_3_operand): New predicate.
gcc/testsuite/
* gcc.target/aarch64/pragma_cpp_predefs_5.c: Test new feature macros.
* gcc.target/aarch64/sve/acle/asm/test_sve_acle.h
(TEST_XN_INDEXED): New macro.
* gcc.target/aarch64/sve2/acle/asm/aesd_lane_u8.c: New test.
* gcc.target/aarch64/sve2/acle/asm/aesdimc_lane_u8.c: New test.
* gcc.target/aarch64/sve2/acle/asm/aese_lane_u8.c: New test.
* gcc.target/aarch64/sve2/acle/asm/aesemc_lane_u8.c: New test.
* gcc.target/aarch64/sve2/acle/asm/pmlal_pair_u64.c: New test.
* gcc.target/aarch64/sve2/acle/asm/pmull_pair_u64.c: New test.
* lib/target-supports.exp: Add sve-aes2 assembler probe.
---
gcc/config/aarch64/aarch64-c.cc | 4 +
.../aarch64/aarch64-sve-builtins-functions.h | 5 +
.../aarch64/aarch64-sve-builtins-shapes.cc | 143 ++++++++++++++++++
.../aarch64/aarch64-sve-builtins-shapes.h | 3 +
.../aarch64/aarch64-sve-builtins-sve2.cc | 6 +
.../aarch64/aarch64-sve-builtins-sve2.def | 10 ++
.../aarch64/aarch64-sve-builtins-sve2.h | 6 +
gcc/config/aarch64/aarch64-sve2.md | 86 +++++++++++
gcc/config/aarch64/aarch64.h | 2 +
gcc/config/aarch64/aarch64.md | 3 +
gcc/config/aarch64/iterators.md | 14 ++
gcc/config/aarch64/predicates.md | 4 +
.../gcc.target/aarch64/pragma_cpp_predefs_5.c | 22 +++
.../aarch64/sve/acle/asm/test_sve_acle.h | 16 ++
.../aarch64/sve2/acle/asm/aesd_lane_u8.c | 67 ++++++++
.../aarch64/sve2/acle/asm/aesdimc_lane_u8.c | 67 ++++++++
.../aarch64/sve2/acle/asm/aese_lane_u8.c | 67 ++++++++
.../aarch64/sve2/acle/asm/aesemc_lane_u8.c | 67 ++++++++
.../aarch64/sve2/acle/asm/pmlal_pair_u64.c | 69 +++++++++
.../aarch64/sve2/acle/asm/pmull_pair_u64.c | 45 ++++++
gcc/testsuite/lib/target-supports.exp | 4 +-
21 files changed, 708 insertions(+), 2 deletions(-)
create mode 100644
gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/aesd_lane_u8.c
create mode 100644
gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/aesdimc_lane_u8.c
create mode 100644
gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/aese_lane_u8.c
create mode 100644
gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/aesemc_lane_u8.c
create mode 100644
gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/pmlal_pair_u64.c
create mode 100644
gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/pmull_pair_u64.c
diff --git a/gcc/config/aarch64/aarch64-c.cc b/gcc/config/aarch64/aarch64-c.cc
index 4d83d5f0184..86ba2214e88 100644
--- a/gcc/config/aarch64/aarch64-c.cc
+++ b/gcc/config/aarch64/aarch64-c.cc
@@ -228,6 +228,10 @@ aarch64_update_cpp_builtins (cpp_reader *pfile)
aarch64_def_or_undef (AARCH64_HAVE_ISA (SVE2), "__ARM_FEATURE_SVE2", pfile);
aarch64_def_or_undef (AARCH64_HAVE_ISA (SVE2) && AARCH64_HAVE_ISA (SVE_AES),
"__ARM_FEATURE_SVE2_AES", pfile);
+ aarch64_def_or_undef (AARCH64_HAVE_ISA (SVE_AES2), "__ARM_FEATURE_SVE_AES2",
+ pfile);
+ aarch64_def_or_undef (AARCH64_HAVE_ISA (SSVE_AES), "__ARM_FEATURE_SSVE_AES",
+ pfile);
aarch64_def_or_undef (AARCH64_HAVE_ISA (SVE_BITPERM)
&& AARCH64_HAVE_ISA (SVE2),
"__ARM_FEATURE_SVE2_BITPERM", pfile);
diff --git a/gcc/config/aarch64/aarch64-sve-builtins-functions.h
b/gcc/config/aarch64/aarch64-sve-builtins-functions.h
index 8fd7a8fef52..7a62c05e08b 100644
--- a/gcc/config/aarch64/aarch64-sve-builtins-functions.h
+++ b/gcc/config/aarch64/aarch64-sve-builtins-functions.h
@@ -397,6 +397,11 @@ typedef
unspec_based_function_exact_insn<code_for_aarch64_sve_sub>
typedef unspec_based_function_exact_insn<code_for_aarch64_sve_sub_lane>
unspec_based_sub_lane_function;
+typedef unspec_based_function_exact_insn<code_for_aarch64_sve2_aes_lane>
+ unspec_based_aes_lane_function;
+typedef unspec_based_function_exact_insn<code_for_aarch64_sve2_aes_lane_mc>
+ unspec_based_aes_lane_mc_function;
+
/* A function that has conditional and unconditional forms, with both
forms being associated with a single unspec each. */
class cond_or_uncond_unspec_function : public function_base
diff --git a/gcc/config/aarch64/aarch64-sve-builtins-shapes.cc
b/gcc/config/aarch64/aarch64-sve-builtins-shapes.cc
index 8611f20f6e8..08f8d6b4ad5 100644
--- a/gcc/config/aarch64/aarch64-sve-builtins-shapes.cc
+++ b/gcc/config/aarch64/aarch64-sve-builtins-shapes.cc
@@ -1502,6 +1502,149 @@ struct binary_int_opt_single_n_def : public
overloaded_base<0>
};
SHAPE (binary_int_opt_single_n)
+/* sv<t0>x<g>_t svfoo[_t0_g](sv<t0>_t, sv<t0>_t)
+ sv<t0>x<g>_t svfoo[_n_t0_g](sv<t0>_t, <t0>_t). */
+struct binary_tuple_uint64_n_def : public overloaded_base<0>
+{
+ bool explicit_group_suffix_p () const override { return false; }
+
+ void
+ build (function_builder &b, const function_group_info &group) const override
+ {
+ b.add_overloaded_functions (group, MODE_none);
+ build_all (b, "t0,v0,v0", group, MODE_none);
+ build_all (b, "t0,v0,s0", group, MODE_n);
+ }
+
+ tree
+ resolve (function_resolver &r) const override
+ {
+ if (!r.check_num_arguments (2))
+ return error_mark_node;
+
+ if (!r.require_vector_type (0, VECTOR_TYPE_svuint64_t))
+ return error_mark_node;
+
+ mode_suffix_index mode;
+ if (r.scalar_argument_p (1))
+ {
+ if (!r.require_scalar_type (1, "uint64_t"))
+ return error_mark_node;
+ mode = MODE_n;
+ }
+ else
+ {
+ if (!r.require_vector_type (1, VECTOR_TYPE_svuint64_t))
+ return error_mark_node;
+ mode = MODE_none;
+ }
+
+ return r.resolve_to (mode, { TYPE_SUFFIX_u64, 2 });
+ }
+};
+SHAPE (binary_tuple_uint64_n)
+
+/* sv<t0>x<g>_t svfoo[_t0_g](sv<t0>x<g>_t, sv<t0>_t, sv<t0>_t)
+ sv<t0>x<g>_t svfoo[_n_t0_g](sv<t0>x<g>_t, sv<t0>_t, <t0>_t). */
+struct ternary_tuple_uint64_n_def : public overloaded_base<0>
+{
+ bool explicit_group_suffix_p () const override { return false; }
+
+ void
+ build (function_builder &b, const function_group_info &group) const override
+ {
+ b.add_overloaded_functions (group, MODE_none);
+ build_all (b, "t0,t0,v0,v0", group, MODE_none);
+ build_all (b, "t0,t0,v0,s0", group, MODE_n);
+ }
+
+ tree
+ resolve (function_resolver &r) const override
+ {
+ if (!r.check_num_arguments (3))
+ return error_mark_node;
+
+ sve_type type = r.infer_sve_type (0);
+ if (!type)
+ return error_mark_node;
+
+ if (type.num_vectors != 2)
+ {
+ r.report_incorrect_num_vectors (0, type, 2);
+ return error_mark_node;
+ }
+
+ if (!r.require_vector_type (1, VECTOR_TYPE_svuint64_t))
+ return error_mark_node;
+
+ mode_suffix_index mode;
+ if (r.scalar_argument_p (2))
+ {
+ if (!r.require_scalar_type (2, "uint64_t"))
+ return error_mark_node;
+ mode = MODE_n;
+ }
+ else
+ {
+ if (!r.require_vector_type (2, VECTOR_TYPE_svuint64_t))
+ return error_mark_node;
+ mode = MODE_none;
+ }
+
+ return r.resolve_to (mode, type);
+ }
+};
+SHAPE (ternary_tuple_uint64_n)
+
+/* svuint8x2_t svaes<...>_lane[_u8_x2] (svuint8x2_t zdn, svuint8_t zm, uint64_t
+ index);
+ and
+ svuint8x4_t svaes<...>_lane[_u8_x4] (svuint8x4_t zdn, svuint8_t zm, uint64_t
+ index);
+ When index is in range[0-3]
+*/
+struct binary_aes_lane_def : public overloaded_base<0>
+{
+ bool explicit_group_suffix_p () const override { return false; }
+
+ void
+ build (function_builder &b, const function_group_info &group) const override
+ {
+ b.add_overloaded_functions (group, MODE_none);
+ build_all (b, "t0,t0,v0,su64", group, MODE_none);
+ }
+
+ tree
+ resolve (function_resolver &r) const override
+ {
+ if (!r.check_num_arguments (3))
+ return error_mark_node;
+
+ sve_type type = r.infer_sve_type (0);
+ if (!type)
+ return error_mark_node;
+
+ if (type.num_vectors != 2 && type.num_vectors != 4)
+ return error_mark_node;
+
+ if (!r.require_vector_type (1, VECTOR_TYPE_svuint8_t))
+ return error_mark_node;
+
+ if (!r.require_integer_immediate (2))
+ return error_mark_node;
+
+ return r.resolve_to (MODE_none, type);
+ }
+
+ bool
+ check (function_checker &c) const override
+ {
+ return c.require_immediate_lane_index (2, 0, 4);
+ }
+};
+SHAPE (binary_aes_lane)
+
+
/* sv<t0>_t svfoo_<t0>(sv<t0>_t, sv<t0>_t, uint64_t)
where the final argument is an integer constant expression in the
diff --git a/gcc/config/aarch64/aarch64-sve-builtins-shapes.h
b/gcc/config/aarch64/aarch64-sve-builtins-shapes.h
index b2c927542a8..df85f0688c5 100644
--- a/gcc/config/aarch64/aarch64-sve-builtins-shapes.h
+++ b/gcc/config/aarch64/aarch64-sve-builtins-shapes.h
@@ -85,6 +85,7 @@ namespace aarch64_sve
extern const function_shape *const binary_int_opt_single_n;
extern const function_shape *const binary_lane;
extern const function_shape *const binary_long_lane;
+ extern const function_shape *const binary_aes_lane;
extern const function_shape *const binary_long_opt_n;
extern const function_shape *const binary_n;
extern const function_shape *const binary_narrowb_opt_n;
@@ -95,6 +96,7 @@ namespace aarch64_sve
extern const function_shape *const binary_rotate;
extern const function_shape *const binary_scalar;
extern const function_shape *const binary_single;
+ extern const function_shape *const binary_tuple_uint64_n;
extern const function_shape *const binary_to_uint;
extern const function_shape *const binary_uint;
extern const function_shape *const binary_uint_n;
@@ -237,6 +239,7 @@ namespace aarch64_sve
extern const function_shape *const ternary_uintq_intq;
extern const function_shape *const ternary_uintq_intq_lane;
extern const function_shape *const ternary_uintq_intq_opt_n;
+ extern const function_shape *const ternary_tuple_uint64_n;
extern const function_shape *const tmad;
extern const function_shape *const unary;
extern const function_shape *const unary_convert;
diff --git a/gcc/config/aarch64/aarch64-sve-builtins-sve2.cc
b/gcc/config/aarch64/aarch64-sve-builtins-sve2.cc
index 5ea08056ae3..ee67d15e51a 100644
--- a/gcc/config/aarch64/aarch64-sve-builtins-sve2.cc
+++ b/gcc/config/aarch64/aarch64-sve-builtins-sve2.cc
@@ -1045,6 +1045,10 @@ FUNCTION (svaesd, fixed_insn_function,
(CODE_FOR_aarch64_sve2_aesd))
FUNCTION (svaese, fixed_insn_function, (CODE_FOR_aarch64_sve2_aese))
FUNCTION (svaesimc, fixed_insn_function, (CODE_FOR_aarch64_sve2_aesimc))
FUNCTION (svaesmc, fixed_insn_function, (CODE_FOR_aarch64_sve2_aesmc))
+FUNCTION (svaese_lane, unspec_based_aes_lane_function, (-1, UNSPEC_AESE, -1))
+FUNCTION (svaesd_lane, unspec_based_aes_lane_function, (-1, UNSPEC_AESD, -1))
+FUNCTION (svaesemc_lane, unspec_based_aes_lane_mc_function, (-1, UNSPEC_AESE,
-1))
+FUNCTION (svaesdimc_lane, unspec_based_aes_lane_mc_function, (-1, UNSPEC_AESD,
-1))
FUNCTION (svamax, faminmaximpl, (UNSPEC_COND_FAMAX, UNSPEC_FAMAX))
FUNCTION (svamin, faminmaximpl, (UNSPEC_COND_FAMIN, UNSPEC_FAMIN))
FUNCTION (svandqv, reduction, (UNSPEC_ANDQV, UNSPEC_ANDQV, -1))
@@ -1172,6 +1176,8 @@ FUNCTION (svpmullb, unspec_based_function, (-1,
UNSPEC_PMULLB, -1))
FUNCTION (svpmullb_pair, unspec_based_function, (-1, UNSPEC_PMULLB_PAIR, -1))
FUNCTION (svpmullt, unspec_based_function, (-1, UNSPEC_PMULLT, -1))
FUNCTION (svpmullt_pair, unspec_based_function, (-1, UNSPEC_PMULLT_PAIR, -1))
+FUNCTION (svpmull_pair, fixed_insn_function, (CODE_FOR_aarch64_sve_pmull_pair))
+FUNCTION (svpmlal_pair, fixed_insn_function, (CODE_FOR_aarch64_sve_pmlal_pair))
FUNCTION (svpsel_lane, svpsel_lane_impl,)
FUNCTION (svqabs, rtx_code_function, (SS_ABS, UNKNOWN, UNKNOWN))
FUNCTION (svqcadd, svqcadd_impl,)
diff --git a/gcc/config/aarch64/aarch64-sve-builtins-sve2.def
b/gcc/config/aarch64/aarch64-sve-builtins-sve2.def
index 16524cfedab..cf7fd6e5e17 100644
--- a/gcc/config/aarch64/aarch64-sve-builtins-sve2.def
+++ b/gcc/config/aarch64/aarch64-sve-builtins-sve2.def
@@ -206,6 +206,16 @@ DEF_SVE_FUNCTION (svpmullb_pair, binary_opt_n, d_unsigned,
none)
DEF_SVE_FUNCTION (svpmullt_pair, binary_opt_n, d_unsigned, none)
#undef REQUIRED_EXTENSIONS
+#define REQUIRED_EXTENSIONS streaming_compatible (AARCH64_FL_SVE_AES2, \
+ AARCH64_FL_SSVE_AES)
+DEF_SVE_FUNCTION_GS (svaese_lane, binary_aes_lane, b_unsigned, x24, none)
+DEF_SVE_FUNCTION_GS (svaesd_lane, binary_aes_lane, b_unsigned, x24, none)
+DEF_SVE_FUNCTION_GS (svaesemc_lane, binary_aes_lane, b_unsigned, x24, none)
+DEF_SVE_FUNCTION_GS (svaesdimc_lane, binary_aes_lane, b_unsigned, x24, none)
+DEF_SVE_FUNCTION_GS (svpmull_pair, binary_tuple_uint64_n, d_unsigned, x2, none)
+DEF_SVE_FUNCTION_GS (svpmlal_pair, ternary_tuple_uint64_n, d_unsigned, x2,
none)
+#undef REQUIRED_EXTENSIONS
+
#define REQUIRED_EXTENSIONS streaming_compatible (AARCH64_FL_SVE2 \
| AARCH64_FL_SVE_BITPERM, \
AARCH64_FL_SSVE_BITPERM)
diff --git a/gcc/config/aarch64/aarch64-sve-builtins-sve2.h
b/gcc/config/aarch64/aarch64-sve-builtins-sve2.h
index b2f2698b880..48f2e80baae 100644
--- a/gcc/config/aarch64/aarch64-sve-builtins-sve2.h
+++ b/gcc/config/aarch64/aarch64-sve-builtins-sve2.h
@@ -45,6 +45,10 @@ namespace aarch64_sve
extern const function_base *const svaese;
extern const function_base *const svaesimc;
extern const function_base *const svaesmc;
+ extern const function_base *const svaese_lane;
+ extern const function_base *const svaesd_lane;
+ extern const function_base *const svaesemc_lane;
+ extern const function_base *const svaesdimc_lane;
extern const function_base *const svandqv;
extern const function_base *const svbcax;
extern const function_base *const svbdep;
@@ -143,6 +147,8 @@ namespace aarch64_sve
extern const function_base *const svpmullb_pair;
extern const function_base *const svpmullt;
extern const function_base *const svpmullt_pair;
+ extern const function_base *const svpmull_pair;
+ extern const function_base *const svpmlal_pair;
extern const function_base *const svpsel_lane;
extern const function_base *const svqabs;
extern const function_base *const svqcadd;
diff --git a/gcc/config/aarch64/aarch64-sve2.md
b/gcc/config/aarch64/aarch64-sve2.md
index 4bf9710519f..ca3400ecefc 100644
--- a/gcc/config/aarch64/aarch64-sve2.md
+++ b/gcc/config/aarch64/aarch64-sve2.md
@@ -4100,6 +4100,43 @@ (define_insn "@aarch64_sve_<optab><mode>"
[(set_attr "sve_type" "sve_int_pmul")]
)
+;; Polynomial multiply corresponding D elements and return the widened Q
+;; results as a pair of consecutive destination vectors.
+;; PMULL { <Zd1>.Q-<Zd2>.Q }, <Zn>.D, <Zm>.D
+;; <Zd1> must be a multiple of 2 (0, 2, ..., 30)
+;; <Zd2> must be must be Zdn1 + 1
+;; <Zn> (0-31) scalable vector
+;; <Zm> (0-31) scalable vector -or- an uint64 (broadcast to a vector)
+(define_insn "aarch64_sve_pmull_pair"
+ [(set (match_operand:VNx4DI 0 "aligned_register_operand" "=Uw2")
+ (unspec:VNx4DI
+ [(match_operand:VNx2DI 1 "register_operand" "w")
+ (match_operand:VNx2DI 2 "register_operand" "w")]
+ UNSPEC_PMULL_PAIR))]
+ "TARGET_SVE_AES2"
+ "pmull\t{%S0.q - %T0.q}, %1.d, %2.d"
+ [(set_attr "sve_type" "sve_int_pmul")]
+)
+
+;; Polynomial multiply corresponding D elements and XOR-accumulate the widened
+;; Q results into a pair of consecutive destination vectors.
+;; PMLAL { <Zda1>.Q-<Zda2>.Q }, <Zn>.D, <Zm>.D
+;; <Zda1> must be a multiple of 2 (0, 2, ..., 30)
+;; <Zda2> must be must be Zdn1 + 1
+;; <Zn> (0-31) scalable vector
+;; <Zm> (0-31) scalable vector -or- an uint64 (broadcast to a vector)
+(define_insn "aarch64_sve_pmlal_pair"
+ [(set (match_operand:VNx4DI 0 "aligned_register_operand" "=Uw2")
+ (unspec:VNx4DI
+ [(match_operand:VNx4DI 1 "aligned_register_operand" "0")
+ (match_operand:VNx2DI 2 "register_operand" "w")
+ (match_operand:VNx2DI 3 "register_operand" "w")]
+ UNSPEC_PMLAL_PAIR))]
+ "TARGET_SVE_AES2"
+ "pmlal\t{%S0.q - %T0.q}, %2.d, %3.d"
+ [(set_attr "sve_type" "sve_int_pmul")]
+)
+
;; =========================================================================
;; == Comparisons and selects
;; =========================================================================
@@ -4705,6 +4742,10 @@ (define_insn "@aarch64_sve_luti<LUTI_BITS><mode>"
;; - AESE
;; - AESIMC
;; - AESMC
+;; - AESD (indexed, two registers and four registers)
+;; - AESE (indexed, two registers and four registers)
+;; - AESEMC (indexed, two registers and four registers)
+;; - AESDIMC (indexed, two registers and four registers)
;; -------------------------------------------------------------------------
;; AESD and AESE.
@@ -4766,6 +4807,51 @@ (define_insn "*aarch64_sve2_aesd_fused"
(set_attr "length" "8")]
)
+;; AESE and AESD, indexed, two registers and four registers.
+;; AES<E/D> { <Zdn1>.B-<Zdn(2/4)>.B }, { <Zdn1>.B-<Zdn(2/4)>.B },
<Zm>.Q[<index>]
+;; <Zdn1> must be a multiple of 2 (0, 2, ..., 30) or 4 (0, 4, ..., 28)
+;; <Zdn4> must be must be Zdn1 + 1 or Zdn1 + 3
+;; <Zm> (0-31)
+;; <Index> (0-3)
+
+(define_insn "@aarch64_sve2_aes<aes_op>_lane<mode>"
+ [(set (match_operand:SVE_QIx24 0 "aligned_register_operand"
"=Uw<vector_count>")
+ (unspec:SVE_QIx24
+ [(xor:SVE_QIx24
+ (match_operand:SVE_QIx24 1 "aligned_register_operand" "0")
+ (unspec:SVE_QIx24
+ [(match_operand:VNx16QI 2 "register_operand" "w")
+ (match_operand:SI 3 "const_0_to_3_operand")]
+ UNSPEC_SSVE_LANE_SELECT))]
+ CRYPTO_AES))]
+ "TARGET_SVE_AES2"
+ "aes<aes_op>\t%0, %0, %2.q[%3]"
+ [(set_attr "type" "crypto_aese")]
+)
+
+;; AESEMC and AESDIMC, indexed, two registers and four registers.
+;; AESEMC/AESDIMC { <Zdn1>.B-<Zdn (2/4)>.B }, { <Zdn1>.B-<Zdn (2/4)>.B },
<Zm>.Q[<index>]
+;; <Zdn1> must be a multiple of 2 (0, 2, ..., 30)
+;; <Zdn2> must be Zdn1 + 1 or Zdn1 + 3
+;; <Zm> (0-31)
+
+(define_insn "@aarch64_sve2_aes<CRYPTO_AES>_lane_mc<mode>"
+ [(set (match_operand:SVE_QIx24 0 "aligned_register_operand"
"=Uw<vector_count>")
+ (unspec:SVE_QIx24
+ [(unspec:SVE_QIx24
+ [(xor:SVE_QIx24
+ (match_operand:SVE_QIx24 1 "aligned_register_operand" "0")
+ (unspec:SVE_QIx24
+ [(match_operand:VNx16QI 2 "register_operand" "w")
+ (match_operand:SI 3 "const_0_to_3_operand")]
+ UNSPEC_SSVE_LANE_SELECT))]
+ CRYPTO_AES)]
+ <aesemc_outer_unspec>))]
+ "TARGET_SVE_AES2"
+ "aes<aesemc_op>\t%0, %0, %2.q[%3]"
+ [(set_attr "type" "crypto_aesmc")]
+)
+
;; -------------------------------------------------------------------------
;; ---- Optional SHA-3 extensions
;; -------------------------------------------------------------------------
diff --git a/gcc/config/aarch64/aarch64.h b/gcc/config/aarch64/aarch64.h
index 83cbe46fed8..c0a8ab0bd00 100644
--- a/gcc/config/aarch64/aarch64.h
+++ b/gcc/config/aarch64/aarch64.h
@@ -300,6 +300,8 @@ For:
&& (AARCH64_HAVE_ISA (SSVE_AES) \
|| TARGET_NON_STREAMING))
+#define TARGET_SVE_AES2 (TARGET_SVE_AES && AARCH64_HAVE_ISA (SVE_AES2))
+
/* SVE BITPERM instructions, enabled through +sve-bitperm+sve2 for
non-streaming
and +ssve-bitperm for streaming. */
#define TARGET_SVE_BITPERM (AARCH64_HAVE_ISA (SVE_BITPERM) \
diff --git a/gcc/config/aarch64/aarch64.md b/gcc/config/aarch64/aarch64.md
index d8c8c73a632..841c563da21 100644
--- a/gcc/config/aarch64/aarch64.md
+++ b/gcc/config/aarch64/aarch64.md
@@ -397,6 +397,9 @@ (define_c_enum "unspec" [
;; Represents an SVE-style lane index, in which the indexing applies
;; within the containing 128-bit block.
UNSPEC_SVE_LANE_SELECT
+ ;; Represents an SVE-style lane index, in which the indexing applies
+ ;; within the containing 512-bit block.
+ UNSPEC_SSVE_LANE_SELECT
UNSPEC_SVE_CNT_PAT
UNSPEC_SVE_PREFETCH
UNSPEC_SVE_PREFETCH_GATHER
diff --git a/gcc/config/aarch64/iterators.md b/gcc/config/aarch64/iterators.md
index f65d85be1f5..92ca35b1ba7 100644
--- a/gcc/config/aarch64/iterators.md
+++ b/gcc/config/aarch64/iterators.md
@@ -708,6 +708,9 @@ (define_mode_iterator SVE_SI [VNx2SI VNx4SI])
(define_mode_iterator SVE_DIx24 [VNx4DI VNx8DI])
+;; SVE integer vector modes with 2 and 4 vectors of 8-bit elements.
+(define_mode_iterator SVE_QIx24 [VNx32QI VNx64QI])
+
;; SVE modes with 2 or 4 elements.
(define_mode_iterator SVE_24 [VNx2QI VNx2HI VNx2HF VNx2BF VNx2SI VNx2SF
VNx2DI VNx2DF
@@ -889,6 +892,8 @@ (define_c_enum "unspec"
UNSPEC_SQDMULH ; Used in aarch64-simd.md.
UNSPEC_SQRDMULH ; Used in aarch64-simd.md.
UNSPEC_PMUL ; Used in aarch64-simd.md.
+ UNSPEC_PMULL_PAIR ; Used in aarch64-sve2.md.
+ UNSPEC_PMLAL_PAIR ; Used in aarch64-sve2.md.
UNSPEC_FMULX ; Used in aarch64-simd.md.
UNSPEC_USQADD ; Used in aarch64-simd.md.
UNSPEC_SUQADD ; Used in aarch64-simd.md.
@@ -940,6 +945,8 @@ (define_c_enum "unspec"
UNSPEC_AESD ; Used in aarch64-simd.md.
UNSPEC_AESMC ; Used in aarch64-simd.md.
UNSPEC_AESIMC ; Used in aarch64-simd.md.
+ UNSPEC_AESEMC ; Used in aarch64-sve2.md.
+ UNSPEC_AESDIMC ; Used in aarch64-sve2.md.
UNSPEC_SHA1C ; Used in aarch64-simd.md.
UNSPEC_SHA1M ; Used in aarch64-simd.md.
UNSPEC_SHA1P ; Used in aarch64-simd.md.
@@ -3678,6 +3685,13 @@ (define_int_iterator CRC [UNSPEC_CRC32B UNSPEC_CRC32H
UNSPEC_CRC32W
(define_int_iterator CRYPTO_AES [UNSPEC_AESE UNSPEC_AESD])
(define_int_iterator CRYPTO_AESMC [UNSPEC_AESMC UNSPEC_AESIMC])
+(define_int_attr aesemc_op [(UNSPEC_AESE "emc") (UNSPEC_AESD "dimc")])
+(define_int_attr aesemc_outer_unspec [(UNSPEC_AESE "UNSPEC_AESMC")
+ (UNSPEC_AESD "UNSPEC_AESIMC")])
+
+(define_int_attr crypto_aesemc_op [(UNSPEC_AESE "emc") (UNSPEC_AESD "dimc")])
+(define_int_attr crypto_aesemc_outer_unspec [(UNSPEC_AESE "UNSPEC_AESMC")
+ (UNSPEC_AESD "UNSPEC_AESIMC")])
(define_int_iterator CRYPTO_SHA1 [UNSPEC_SHA1C UNSPEC_SHA1M UNSPEC_SHA1P])
diff --git a/gcc/config/aarch64/predicates.md b/gcc/config/aarch64/predicates.md
index f02486c2d9a..e2911a0bccd 100644
--- a/gcc/config/aarch64/predicates.md
+++ b/gcc/config/aarch64/predicates.md
@@ -50,6 +50,10 @@ (define_predicate "const0_to_1_operand"
(and (match_code "const_int")
(match_test "IN_RANGE (INTVAL (op), 0, 1)")))
+(define_predicate "const_0_to_3_operand"
+ (and (match_code "const_int")
+ (match_test "IN_RANGE (INTVAL (op), 0, 3)")))
+
(define_predicate "const_0_to_7_operand"
(and (match_code "const_int")
(match_test "IN_RANGE (INTVAL (op), 0, 7)")))
diff --git a/gcc/testsuite/gcc.target/aarch64/pragma_cpp_predefs_5.c
b/gcc/testsuite/gcc.target/aarch64/pragma_cpp_predefs_5.c
index bb83ab434b5..0bec72d70a2 100644
--- a/gcc/testsuite/gcc.target/aarch64/pragma_cpp_predefs_5.c
+++ b/gcc/testsuite/gcc.target/aarch64/pragma_cpp_predefs_5.c
@@ -41,6 +41,14 @@
#error "__ARM_FEATURE_SVE2_SHA3 is defined but should not be!"
#endif
+#ifdef __ARM_FEATURE_SSVE_AES
+#error "__ARM_FEATURE_SSVE_AES is defined but should not be!"
+#endif
+
+#ifdef __ARM_FEATURE_SVE_AES2
+#error "__ARM_FEATURE_SVE_AES2 is defined but should not be!"
+#endif
+
#pragma GCC pop_options
#pragma GCC push_options
@@ -225,6 +233,20 @@
#endif
#pragma GCC pop_options
+#pragma GCC push_options
+#pragma GCC target "arch=armv8-a+ssve-aes"
+#ifndef __ARM_FEATURE_SSVE_AES
+#error "__ARM_FEATURE_SSVE_AES is not defined but should be!"
+#endif
+#pragma GCC pop_options
+
+#pragma GCC push_options
+#pragma GCC target "arch=armv8-a+sve-aes2"
+#ifndef __ARM_FEATURE_SVE_AES2
+#error "__ARM_FEATURE_SVE_AES2 is not defined but should be!"
+#endif
+#pragma GCC pop_options
+
int
foo (int a)
{
diff --git a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/test_sve_acle.h
b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/test_sve_acle.h
index aeb58ead0dd..cecd1c154b9 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/test_sve_acle.h
+++ b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/test_sve_acle.h
@@ -687,6 +687,22 @@
__asm volatile ("" :: "w" (RES)); \
}
+#define TEST_XN_INDEXED(NAME, TTYPE, VTYPE, CODE1, CODE2) \
+ PROTO (NAME, TTYPE, (TTYPE t, VTYPE v)) \
+ { \
+ register TTYPE z0 __asm ("z0"); \
+ register TTYPE z1 __asm ("z1"); \
+ register TTYPE z2 __asm ("z2"); \
+ register TTYPE z3 __asm ("z3"); \
+ register VTYPE z4 __asm ("z4"); \
+ register VTYPE z5 __asm ("z5"); \
+ register VTYPE z6 __asm ("z6"); \
+ register VTYPE z7 __asm ("z7"); \
+ INVOKE (CODE1, CODE2); \
+ __asm volatile ("" :: "w" (t)); \
+ return t; \
+ }
+
#define TEST_DUAL_XN(NAME, TTYPE1, TTYPE2, RES, CODE1, CODE2) \
PROTO (NAME, void, ()) \
{ \
diff --git a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/aesd_lane_u8.c
b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/aesd_lane_u8.c
new file mode 100644
index 00000000000..6d6bd63effa
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/aesd_lane_u8.c
@@ -0,0 +1,67 @@
+/* { dg-do assemble { target { aarch64_asm_ssve-aes_ok &&
aarch64_asm_sve-aes2_ok } } } */
+/* { dg-do compile { target { ! { aarch64_asm_ssve-aes_ok &&
aarch64_asm_sve-aes2_ok } } } } */
+/* { dg-final { check-function-bodies "**" "" "-DCHECK_ASM" } } */
+
+#include "test_sve_acle.h"
+
+#pragma GCC target "+sve-aes2+ssve-aes"
+
+/*
+** test_aesd_lane_u8_x2:
+** aesd[[:space:]]+{z0.b - z1.b}, {z0.b - z1.b}, z2.q\[0\]
+** ret
+*/
+TEST_XN_INDEXED (test_aesd_lane_u8_x2, svuint8x2_t, svuint8_t,
+ t = svaesd_lane_u8_x2 (t, v, 0),
+ t = svaesd_lane (t, v, 0))
+
+/*
+** test_aesd_lane_u8_x4:
+** aesd[[:space:]]+{z0.b - z3.b}, {z0.b - z3.b}, z4.q\[0\]
+** ret
+*/
+TEST_XN_INDEXED (test_aesd_lane_u8_x4, svuint8x4_t, svuint8_t,
+ t = svaesd_lane_u8_x4 (t, v, 0),
+ t = svaesd_lane (t, v, 0))
+
+/*
+** test_aesd_lane_u8_x2_regs:
+** aesd[[:space:]]+{z0.b - z1.b}, {z0.b - z1.b}, z4.q\[0\]
+** ret
+*/
+TEST_XN_INDEXED (test_aesd_lane_u8_x2_regs, svuint8x2_t, svuint8_t,
+ t = svaesd_lane_u8_x2 (z0, z4, 0),
+ t = svaesd_lane (z0, z4, 0))
+
+/*
+** test_aesd_lane_u8_x4_regs:
+** aesd[[:space:]]+{z0.b - z3.b}, {z0.b - z3.b}, z4.q\[0\]
+** ret
+*/
+TEST_XN_INDEXED (test_aesd_lane_u8_x4_regs, svuint8x4_t, svuint8_t,
+ t = svaesd_lane_u8_x4 (z0, z4, 0),
+ t = svaesd_lane (z0, z4, 0))
+
+/*
+** test_aesd_lane_u8_x2_regs_mov:
+** mov[[:space:]]+z0.d, z3.d
+** mov[[:space:]]+z1.d, z4.d
+** aesd[[:space:]]+{z0.b - z1.b}, {z0.b - z1.b}, z4.q\[0\]
+** ret
+*/
+TEST_XN_INDEXED (test_aesd_lane_u8_x2_regs_mov, svuint8x2_t, svuint8_t,
+ t = svaesd_lane_u8_x2 (z3, z4, 0),
+ t = svaesd_lane (z3, z4, 0))
+
+/*
+** test_aesd_lane_u8_x4_regs_mov:
+** mov[[:space:]]+z0.d, z3.d
+** mov[[:space:]]+z1.d, z4.d
+** mov[[:space:]]+z2.d, z5.d
+** mov[[:space:]]+z3.d, z6.d
+** aesd[[:space:]]+{z0.b - z3.b}, {z0.b - z3.b}, z4.q\[0\]
+** ret
+*/
+TEST_XN_INDEXED (test_aesd_lane_u8_x4_regs_mov, svuint8x4_t, svuint8_t,
+ t = svaesd_lane_u8_x4 (z3, z4, 0),
+ t = svaesd_lane (z3, z4, 0))
diff --git a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/aesdimc_lane_u8.c
b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/aesdimc_lane_u8.c
new file mode 100644
index 00000000000..d7863c5f45e
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/aesdimc_lane_u8.c
@@ -0,0 +1,67 @@
+/* { dg-do assemble { target { aarch64_asm_ssve-aes_ok &&
aarch64_asm_sve-aes2_ok } } } */
+/* { dg-do compile { target { ! { aarch64_asm_ssve-aes_ok &&
aarch64_asm_sve-aes2_ok } } } } */
+/* { dg-final { check-function-bodies "**" "" "-DCHECK_ASM" } } */
+
+#include "test_sve_acle.h"
+
+#pragma GCC target "+sve-aes2+ssve-aes"
+
+/*
+** test_aesdimc_lane_u8_x2:
+** aesdimc[[:space:]]+{z0.b - z1.b}, {z0.b - z1.b}, z2.q\[0\]
+** ret
+*/
+TEST_XN_INDEXED (test_aesdimc_lane_u8_x2, svuint8x2_t, svuint8_t,
+ t = svaesdimc_lane_u8_x2 (t, v, 0),
+ t = svaesdimc_lane (t, v, 0))
+
+/*
+** test_aesdimc_lane_u8_x4:
+** aesdimc[[:space:]]+{z0.b - z3.b}, {z0.b - z3.b}, z4.q\[0\]
+** ret
+*/
+TEST_XN_INDEXED (test_aesdimc_lane_u8_x4, svuint8x4_t, svuint8_t,
+ t = svaesdimc_lane_u8_x4 (t, v, 0),
+ t = svaesdimc_lane (t, v, 0))
+
+/*
+** test_aesdimc_lane_u8_x2_regs:
+** aesdimc[[:space:]]+{z0.b - z1.b}, {z0.b - z1.b}, z4.q\[0\]
+** ret
+*/
+TEST_XN_INDEXED (test_aesdimc_lane_u8_x2_regs, svuint8x2_t, svuint8_t,
+ t = svaesdimc_lane_u8_x2 (z0, z4, 0),
+ t = svaesdimc_lane (z0, z4, 0))
+
+/*
+** test_aesdimc_lane_u8_x4_regs:
+** aesdimc[[:space:]]+{z0.b - z3.b}, {z0.b - z3.b}, z4.q\[0\]
+** ret
+*/
+TEST_XN_INDEXED (test_aesdimc_lane_u8_x4_regs, svuint8x4_t, svuint8_t,
+ t = svaesdimc_lane_u8_x4 (z0, z4, 0),
+ t = svaesdimc_lane (z0, z4, 0))
+
+/*
+** test_aesdimc_lane_u8_x2_regs_mov:
+** mov[[:space:]]+z0.d, z3.d
+** mov[[:space:]]+z1.d, z4.d
+** aesdimc[[:space:]]+{z0.b - z1.b}, {z0.b - z1.b}, z4.q\[0\]
+** ret
+*/
+TEST_XN_INDEXED (test_aesdimc_lane_u8_x2_regs_mov, svuint8x2_t, svuint8_t,
+ t = svaesdimc_lane_u8_x2 (z3, z4, 0),
+ t = svaesdimc_lane (z3, z4, 0))
+
+/*
+** test_aesdimc_lane_u8_x4_regs_mov:
+** mov[[:space:]]+z0.d, z3.d
+** mov[[:space:]]+z1.d, z4.d
+** mov[[:space:]]+z2.d, z5.d
+** mov[[:space:]]+z3.d, z6.d
+** aesdimc[[:space:]]+{z0.b - z3.b}, {z0.b - z3.b}, z4.q\[0\]
+** ret
+*/
+TEST_XN_INDEXED (test_aesdimc_lane_u8_x4_regs_mov, svuint8x4_t, svuint8_t,
+ t = svaesdimc_lane_u8_x4 (z3, z4, 0),
+ t = svaesdimc_lane (z3, z4, 0))
diff --git a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/aese_lane_u8.c
b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/aese_lane_u8.c
new file mode 100644
index 00000000000..aa826f360a4
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/aese_lane_u8.c
@@ -0,0 +1,67 @@
+/* { dg-do assemble { target { aarch64_asm_ssve-aes_ok &&
aarch64_asm_sve-aes2_ok } } } */
+/* { dg-do compile { target { ! { aarch64_asm_ssve-aes_ok &&
aarch64_asm_sve-aes2_ok } } } } */
+/* { dg-final { check-function-bodies "**" "" "-DCHECK_ASM" } } */
+
+#include "test_sve_acle.h"
+
+#pragma GCC target "+sve-aes2+ssve-aes"
+
+/*
+** test_aese_lane_u8_x2:
+** aese[[:space:]]+{z0.b - z1.b}, {z0.b - z1.b}, z2.q\[0\]
+** ret
+*/
+TEST_XN_INDEXED (test_aese_lane_u8_x2, svuint8x2_t, svuint8_t,
+ t = svaese_lane_u8_x2 (t, v, 0),
+ t = svaese_lane (t, v, 0))
+
+/*
+** test_aese_lane_u8_x4:
+** aese[[:space:]]+{z0.b - z3.b}, {z0.b - z3.b}, z4.q\[0\]
+** ret
+*/
+TEST_XN_INDEXED (test_aese_lane_u8_x4, svuint8x4_t, svuint8_t,
+ t = svaese_lane_u8_x4 (t, v, 0),
+ t = svaese_lane (t, v, 0))
+
+/*
+** test_aese_lane_u8_x2_regs:
+** aese[[:space:]]+{z0.b - z1.b}, {z0.b - z1.b}, z4.q\[0\]
+** ret
+*/
+TEST_XN_INDEXED (test_aese_lane_u8_x2_regs, svuint8x2_t, svuint8_t,
+ t = svaese_lane_u8_x2 (z0, z4, 0),
+ t = svaese_lane (z0, z4, 0))
+
+/*
+** test_aese_lane_u8_x4_regs:
+** aese[[:space:]]+{z0.b - z3.b}, {z0.b - z3.b}, z4.q\[0\]
+** ret
+*/
+TEST_XN_INDEXED (test_aese_lane_u8_x4_regs, svuint8x4_t, svuint8_t,
+ t = svaese_lane_u8_x4 (z0, z4, 0),
+ t = svaese_lane (z0, z4, 0))
+
+/*
+** test_aese_lane_u8_x2_regs_mov:
+** mov[[:space:]]+z0.d, z3.d
+** mov[[:space:]]+z1.d, z4.d
+** aese[[:space:]]+{z0.b - z1.b}, {z0.b - z1.b}, z4.q\[0\]
+** ret
+*/
+TEST_XN_INDEXED (test_aese_lane_u8_x2_regs_mov, svuint8x2_t, svuint8_t,
+ t = svaese_lane_u8_x2 (z3, z4, 0),
+ t = svaese_lane (z3, z4, 0))
+
+/*
+** test_aese_lane_u8_x4_regs_mov:
+** mov[[:space:]]+z0.d, z3.d
+** mov[[:space:]]+z1.d, z4.d
+** mov[[:space:]]+z2.d, z5.d
+** mov[[:space:]]+z3.d, z6.d
+** aese[[:space:]]+{z0.b - z3.b}, {z0.b - z3.b}, z4.q\[0\]
+** ret
+*/
+TEST_XN_INDEXED (test_aese_lane_u8_x4_regs_mov, svuint8x4_t, svuint8_t,
+ t = svaese_lane_u8_x4 (z3, z4, 0),
+ t = svaese_lane (z3, z4, 0))
diff --git a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/aesemc_lane_u8.c
b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/aesemc_lane_u8.c
new file mode 100644
index 00000000000..04530a285b5
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/aesemc_lane_u8.c
@@ -0,0 +1,67 @@
+/* { dg-do assemble { target { aarch64_asm_ssve-aes_ok &&
aarch64_asm_sve-aes2_ok } } } */
+/* { dg-do compile { target { ! { aarch64_asm_ssve-aes_ok &&
aarch64_asm_sve-aes2_ok } } } } */
+/* { dg-final { check-function-bodies "**" "" "-DCHECK_ASM" } } */
+
+#include "test_sve_acle.h"
+
+#pragma GCC target "+sve-aes2+ssve-aes"
+
+/*
+** test_aesemc_lane_u8_x2:
+** aesemc[[:space:]]+{z0.b - z1.b}, {z0.b - z1.b}, z2.q\[0\]
+** ret
+*/
+TEST_XN_INDEXED (test_aesemc_lane_u8_x2, svuint8x2_t, svuint8_t,
+ t = svaesemc_lane_u8_x2 (t, v, 0),
+ t = svaesemc_lane (t, v, 0))
+
+/*
+** test_aesemc_lane_u8_x4:
+** aesemc[[:space:]]+{z0.b - z3.b}, {z0.b - z3.b}, z4.q\[0\]
+** ret
+*/
+TEST_XN_INDEXED (test_aesemc_lane_u8_x4, svuint8x4_t, svuint8_t,
+ t = svaesemc_lane_u8_x4 (t, v, 0),
+ t = svaesemc_lane (t, v, 0))
+
+/*
+** test_aesemc_lane_u8_x2_regs:
+** aesemc[[:space:]]+{z0.b - z1.b}, {z0.b - z1.b}, z4.q\[0\]
+** ret
+*/
+TEST_XN_INDEXED (test_aesemc_lane_u8_x2_regs, svuint8x2_t, svuint8_t,
+ t = svaesemc_lane_u8_x2 (z0, z4, 0),
+ t = svaesemc_lane (z0, z4, 0))
+
+/*
+** test_aesemc_lane_u8_x4_regs:
+** aesemc[[:space:]]+{z0.b - z3.b}, {z0.b - z3.b}, z4.q\[0\]
+** ret
+*/
+TEST_XN_INDEXED (test_aesemc_lane_u8_x4_regs, svuint8x4_t, svuint8_t,
+ t = svaesemc_lane_u8_x4 (z0, z4, 0),
+ t = svaesemc_lane (z0, z4, 0))
+
+/*
+** test_aesemc_lane_u8_x2_regs_mov:
+** mov[[:space:]]+z0.d, z3.d
+** mov[[:space:]]+z1.d, z4.d
+** aesemc[[:space:]]+{z0.b - z1.b}, {z0.b - z1.b}, z4.q\[0\]
+** ret
+*/
+TEST_XN_INDEXED (test_aesemc_lane_u8_x2_regs_mov, svuint8x2_t, svuint8_t,
+ t = svaesemc_lane_u8_x2 (z3, z4, 0),
+ t = svaesemc_lane (z3, z4, 0))
+
+/*
+** test_aesemc_lane_u8_x4_regs_mov:
+** mov[[:space:]]+z0.d, z3.d
+** mov[[:space:]]+z1.d, z4.d
+** mov[[:space:]]+z2.d, z5.d
+** mov[[:space:]]+z3.d, z6.d
+** aesemc[[:space:]]+{z0.b - z3.b}, {z0.b - z3.b}, z4.q\[0\]
+** ret
+*/
+TEST_XN_INDEXED (test_aesemc_lane_u8_x4_regs_mov, svuint8x4_t, svuint8_t,
+ t = svaesemc_lane_u8_x4 (z3, z4, 0),
+ t = svaesemc_lane (z3, z4, 0))
diff --git a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/pmlal_pair_u64.c
b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/pmlal_pair_u64.c
new file mode 100644
index 00000000000..1e0acb259db
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/pmlal_pair_u64.c
@@ -0,0 +1,69 @@
+/* { dg-do assemble { target { aarch64_asm_ssve-aes_ok &&
aarch64_asm_sve-aes2_ok } } } */
+/* { dg-do compile { target { ! { aarch64_asm_ssve-aes_ok &&
aarch64_asm_sve-aes2_ok } } } } */
+/* { dg-final { check-function-bodies "**" "" "-DCHECK_ASM" } } */
+
+#include "test_sve_acle.h"
+
+#pragma GCC target "+sve-aes2+ssve-aes"
+
+/*
+**test_pmlal_pair_u64:
+** pmlal[[:space:]]+{z0.q - z1.q}, z2.d, z2.d
+** ret
+*/
+TEST_XN_INDEXED(test_pmlal_pair_u64, svuint64x2_t, svuint64_t,
+ t = svpmlal_pair_u64_x2(t, v, v),
+ t = svpmlal_pair(t, v, v))
+
+/*
+**test_pmlal_pair_n_u64_regs:
+** pmlal[[:space:]]+{z0.q - z1.q}, z4.d, z5.d
+** ret
+*/
+TEST_XN_INDEXED(test_pmlal_pair_n_u64_regs, svuint64x2_t, svuint64_t,
+ t = svpmlal_pair_u64_x2(z0, z4, z5),
+ t = svpmlal_pair(z0, z4, z5))
+
+/*
+**test_pmlal_pair_n_u64_regs_imm:
+** movi[[:space:]]+d[0-9]{1,2}, #0
+** pmlal[[:space:]]+{z0.q - z1.q}, z4.d, z[0-9]{1,2}\.d
+** ret
+*/
+TEST_XN_INDEXED(test_pmlal_pair_n_u64_regs_imm, svuint64x2_t, svuint64_t,
+ t = svpmlal_pair_n_u64_x2(z0, z4, 0x0),
+ t = svpmlal_pair(z0, z4, 0x0))
+
+/*
+**test_pmlal_pair_n_u64_regs_imm_1:
+** mov[[:space:]]+z[0-9]{1,2}\.d, #65535
+** pmlal[[:space:]]+{z0.q - z1.q}, z4.d, z[0-9]{1,2}\.d
+** ret
+*/
+TEST_XN_INDEXED(test_pmlal_pair_n_u64_regs_imm_1, svuint64x2_t, svuint64_t,
+ t = svpmlal_pair_n_u64_x2(z0, z4, 0xFFFF),
+ t = svpmlal_pair(z0, z4, 0xFFFF))
+
+/*
+**test_pmlal_pair_n_u64_regs_mov:
+** mov[[:space:]]+z0.d, z3.d
+** mov[[:space:]]+z1.d, z4.d
+** movi[[:space:]]+d[0-9]{1,2}, #0
+** pmlal[[:space:]]+{z0.q - z1.q}, z4.d, z[0-9]{1,2}\.d
+** ret
+*/
+TEST_XN_INDEXED(test_pmlal_pair_n_u64_regs_mov, svuint64x2_t, svuint64_t,
+ t = svpmlal_pair_n_u64_x2(z3, z4, 0x0),
+ t = svpmlal_pair(z3, z4, 0x0))
+
+/*
+**test_pmlal_pair_n_u64_regs_mov_1:
+** mov[[:space:]]+z0.d, z3.d
+** mov[[:space:]]+z1.d, z4.d
+** mov[[:space:]]+z[0-9]{1,2}\.d, #65535
+** pmlal[[:space:]]+{z0.q - z1.q}, z4.d, z[0-9]{1,2}\.d
+** ret
+*/
+TEST_XN_INDEXED(test_pmlal_pair_n_u64_regs_mov_1, svuint64x2_t, svuint64_t,
+ t = svpmlal_pair_n_u64_x2(z3, z4, 0xFFFF),
+ t = svpmlal_pair(z3, z4, 0xFFFF))
diff --git a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/pmull_pair_u64.c
b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/pmull_pair_u64.c
new file mode 100644
index 00000000000..79e45cc9319
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/pmull_pair_u64.c
@@ -0,0 +1,45 @@
+/* { dg-do assemble { target { aarch64_asm_ssve-aes_ok &&
aarch64_asm_sve-aes2_ok } } } */
+/* { dg-do compile { target { ! { aarch64_asm_ssve-aes_ok &&
aarch64_asm_sve-aes2_ok } } } } */
+/* { dg-final { check-function-bodies "**" "" "-DCHECK_ASM" } } */
+
+#include "test_sve_acle.h"
+
+#pragma GCC target "+sve-aes2+ssve-aes"
+
+/*
+**test_pmull_pair_u64:
+** pmull[[:space:]]+{z0.q - z1.q}, z2.d, z2.d
+** ret
+*/
+TEST_XN_INDEXED(test_pmull_pair_u64, svuint64x2_t, svuint64_t,
+ t = svpmull_pair_u64_x2(v, v),
+ t = svpmull_pair(v, v))
+
+/*
+**test_pmull_pair_n_u64:
+** movi[[:space:]]+d([0-9]{1,2}), #0
+** pmull[[:space:]]+{z0.q - z1.q}, z2.d, z\1.d
+** ret
+*/
+TEST_XN_INDEXED(test_pmull_pair_n_u64, svuint64x2_t, svuint64_t,
+ t = svpmull_pair_n_u64_x2(v, 0x0),
+ t = svpmull_pair(v, 0x0))
+
+/*
+**test_pmull_pair_u64_regs:
+** pmull[[:space:]]+{z0.q - z1.q}, z4.d, z5.d
+** ret
+*/
+TEST_XN_INDEXED(test_pmull_pair_u64_regs, svuint64x2_t, svuint64_t,
+ t = svpmull_pair_u64_x2(z4, z5),
+ t = svpmull_pair(z4, z5))
+
+/*
+**test_pmull_pair_n_u64_regs:
+** movi[[:space:]]+d([0-9]{1,2}), #0
+** pmull[[:space:]]+{z0.q - z1.q}, z4.d, z\1.d
+** ret
+*/
+TEST_XN_INDEXED(test_pmull_pair_n_u64_regs, svuint64x2_t, svuint64_t,
+ t = svpmull_pair_n_u64_x2(z4, 0x0),
+ t = svpmull_pair(z4, 0x0))
diff --git a/gcc/testsuite/lib/target-supports.exp
b/gcc/testsuite/lib/target-supports.exp
index fdde04a73e4..fcccf49f1ba 100644
--- a/gcc/testsuite/lib/target-supports.exp
+++ b/gcc/testsuite/lib/target-supports.exp
@@ -12901,8 +12901,8 @@ proc
check_effective_target_aarch64_gas_has_build_attributes { } {
set exts {
"bf16" "cmpbr" "crc" "crypto" "dotprod" "f32mm" "f64mm" "faminmax"
"fp" "fp8" "fp8dot2" "fp8dot4" "fp8fma" "i8mm" "ls64" "lse" "lut"
- "sb" "simd" "sve-b16b16" "sve" "sve2" "sve-sm4" "sve-aes" "sve-bitperm"
- "sve-sha3" "f8f16mm" "f8f32mm" "sve-f16f32mm"
+ "sb" "simd" "sve-b16b16" "sve" "sve2" "sve-sm4" "sve-aes" "sve-aes2"
+ "sve-bitperm" "sve-sha3" "f8f16mm" "f8f32mm" "sve-f16f32mm"
"sme-f8f16" "sme-f8f32"
"sme-b16b16" "sme-f16f16" "sme-i16i64" "sme" "sme2" "sme2p1" "sme2p2"
"ssve-fp8dot2" "ssve-fp8dot4" "ssve-fp8fma" "sve-bfscale" "sme-lutv2"
--
2.43.0