aboutsummaryrefslogtreecommitdiff
path: root/gcc
diff options
context:
space:
mode:
authorSoumya AR <soumyaa@nvidia.com>2024-09-10 14:18:44 +0530
committerKyrylo Tkachov <ktkachov@nvidia.com>2024-09-16 16:53:45 +0200
commit4af196b2ebd662c5183f1998b0184985e85479b2 (patch)
treee478bf17bff134be70537e9c69516d852d4790a4 /gcc
parentf6e629a7134c6b83be4542b8cd26b7c4483d17f4 (diff)
downloadgcc-4af196b2ebd662c5183f1998b0184985e85479b2.zip
gcc-4af196b2ebd662c5183f1998b0184985e85479b2.tar.gz
gcc-4af196b2ebd662c5183f1998b0184985e85479b2.tar.bz2
aarch64: Emit ADD X, Y, Y instead of SHL X, Y, #1 for SVE instructions.
On Neoverse V2, SVE ADD instructions have a throughput of 4, while shift instructions like SHL have a throughput of 2. We can lean on that to emit code like: add z31.b, z31.b, z31.b instead of: lsl z31.b, z31.b, #1 The implementation of this change for SVE vectors is similar to a prior patch <https://gcc.gnu.org/pipermail/gcc-patches/2024-August/659958.html> that adds the above functionality for Neon vectors. Here, the machine descriptor pattern is split up to separately accommodate left and right shifts, so we can specifically emit an add for all left shifts by 1. The patch was bootstrapped and regtested on aarch64-linux-gnu, no regression. OK for mainline? Signed-off-by: Soumya AR <soumyaa@nvidia.com> gcc/ChangeLog: * config/aarch64/aarch64-sve.md (*post_ra_v<optab><mode>3): Split pattern to accomodate left and right shifts separately. (*post_ra_v_ashl<mode>3): Matches left shifts with additional constraint to check for shifts by 1. (*post_ra_v_<optab><mode>3): Matches right shifts. gcc/testsuite/ChangeLog: * gcc.target/aarch64/sve/acle/asm/lsl_s16.c: Updated instances of lsl-1 with corresponding add. * gcc.target/aarch64/sve/acle/asm/lsl_s32.c: Likewise. * gcc.target/aarch64/sve/acle/asm/lsl_s64.c: Likewise. * gcc.target/aarch64/sve/acle/asm/lsl_s8.c: Likewise. * gcc.target/aarch64/sve/acle/asm/lsl_u16.c: Likewise. * gcc.target/aarch64/sve/acle/asm/lsl_u32.c: Likewise. * gcc.target/aarch64/sve/acle/asm/lsl_u64.c: Likewise. * gcc.target/aarch64/sve/acle/asm/lsl_u8.c: Likewise. * gcc.target/aarch64/sve/acle/asm/lsl_wide_s16.c: Likewise. * gcc.target/aarch64/sve/acle/asm/lsl_wide_s32.c: Likewise. * gcc.target/aarch64/sve/acle/asm/lsl_wide_s8.c: Likewise. * gcc.target/aarch64/sve/acle/asm/lsl_wide_u16.c: Likewise. * gcc.target/aarch64/sve/acle/asm/lsl_wide_u32.c: Likewise. * gcc.target/aarch64/sve/acle/asm/lsl_wide_u8.c: Likewise. * gcc.target/aarch64/sve/adr_1.c: Likewise. * gcc.target/aarch64/sve/adr_6.c: Likewise. * gcc.target/aarch64/sve/cond_mla_7.c: Likewise. * gcc.target/aarch64/sve/cond_mla_8.c: Likewise. * gcc.target/aarch64/sve/shift_2.c: Likewise. * gcc.target/aarch64/sve2/acle/asm/ldnt1sh_gather_s64.c: Likewise. * gcc.target/aarch64/sve2/acle/asm/ldnt1sh_gather_u64.c: Likewise. * gcc.target/aarch64/sve2/acle/asm/ldnt1uh_gather_s64.c: Likewise. * gcc.target/aarch64/sve2/acle/asm/ldnt1uh_gather_u64.c: Likewise. * gcc.target/aarch64/sve2/acle/asm/rshl_s16.c: Likewise. * gcc.target/aarch64/sve2/acle/asm/rshl_s32.c: Likewise. * gcc.target/aarch64/sve2/acle/asm/rshl_s64.c: Likewise. * gcc.target/aarch64/sve2/acle/asm/rshl_s8.c: Likewise. * gcc.target/aarch64/sve2/acle/asm/rshl_u16.c: Likewise. * gcc.target/aarch64/sve2/acle/asm/rshl_u32.c: Likewise. * gcc.target/aarch64/sve2/acle/asm/rshl_u64.c: Likewise. * gcc.target/aarch64/sve2/acle/asm/rshl_u8.c: Likewise. * gcc.target/aarch64/sve2/acle/asm/stnt1h_scatter_s64.c: Likewise. * gcc.target/aarch64/sve2/acle/asm/stnt1h_scatter_u64.c: Likewise. * gcc.target/aarch64/sve/sve_shl_add.c: New test.
Diffstat (limited to 'gcc')
-rw-r--r--gcc/config/aarch64/aarch64-sve.md18
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_s16.c4
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_s32.c4
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_s64.c4
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_s8.c4
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_u16.c4
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_u32.c4
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_u64.c4
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_u8.c4
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_wide_s16.c4
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_wide_s32.c4
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_wide_s8.c4
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_wide_u16.c4
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_wide_u32.c4
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_wide_u8.c4
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve/adr_1.c6
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve/adr_6.c4
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve/cond_mla_7.c8
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve/cond_mla_8.c8
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve/shift_2.c6
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve/sve_shl_add.c45
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/ldnt1sh_gather_s64.c12
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/ldnt1sh_gather_u64.c12
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/ldnt1uh_gather_s64.c12
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/ldnt1uh_gather_u64.c12
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_s16.c4
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_s32.c4
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_s64.c4
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_s8.c4
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_u16.c4
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_u32.c4
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_u64.c4
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_u8.c4
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/stnt1h_scatter_s64.c8
-rw-r--r--gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/stnt1h_scatter_u64.c8
35 files changed, 151 insertions, 96 deletions
diff --git a/gcc/config/aarch64/aarch64-sve.md b/gcc/config/aarch64/aarch64-sve.md
index a5cd42b..bfa2884 100644
--- a/gcc/config/aarch64/aarch64-sve.md
+++ b/gcc/config/aarch64/aarch64-sve.md
@@ -4816,11 +4816,23 @@
;; Unpredicated shift operations by a constant (post-RA only).
;; These are generated by splitting a predicated instruction whose
;; predicate is unused.
-(define_insn "*post_ra_v<optab><mode>3"
+(define_insn "*post_ra_v_ashl<mode>3"
+ [(set (match_operand:SVE_I 0 "register_operand")
+ (ashift:SVE_I
+ (match_operand:SVE_I 1 "register_operand")
+ (match_operand:SVE_I 2 "aarch64_simd_lshift_imm")))]
+ "TARGET_SVE && reload_completed"
+ {@ [ cons: =0 , 1 , 2 ]
+ [ w , w , vs1 ] add\t%0.<Vetype>, %1.<Vetype>, %1.<Vetype>
+ [ w , w , Dl ] lsl\t%0.<Vetype>, %1.<Vetype>, #%2
+ }
+)
+
+(define_insn "*post_ra_v_<optab><mode>3"
[(set (match_operand:SVE_I 0 "register_operand" "=w")
- (ASHIFT:SVE_I
+ (SHIFTRT:SVE_I
(match_operand:SVE_I 1 "register_operand" "w")
- (match_operand:SVE_I 2 "aarch64_simd_<lr>shift_imm")))]
+ (match_operand:SVE_I 2 "aarch64_simd_rshift_imm")))]
"TARGET_SVE && reload_completed"
"<shift>\t%0.<Vetype>, %1.<Vetype>, #%2"
)
diff --git a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_s16.c b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_s16.c
index d5c5fd5..710d6f6 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_s16.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_s16.c
@@ -296,7 +296,7 @@ TEST_UNIFORM_ZX (lsl_w0_s16_x_untied, svint16_t, uint16_t,
/*
** lsl_1_s16_x_tied1:
-** lsl z0\.h, z0\.h, #1
+** add z0\.h, z0\.h, z0\.h
** ret
*/
TEST_UNIFORM_Z (lsl_1_s16_x_tied1, svint16_t,
@@ -305,7 +305,7 @@ TEST_UNIFORM_Z (lsl_1_s16_x_tied1, svint16_t,
/*
** lsl_1_s16_x_untied:
-** lsl z0\.h, z1\.h, #1
+** add z0\.h, z1\.h, z1\.h
** ret
*/
TEST_UNIFORM_Z (lsl_1_s16_x_untied, svint16_t,
diff --git a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_s32.c b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_s32.c
index b5df8a84..5ae79ac 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_s32.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_s32.c
@@ -296,7 +296,7 @@ TEST_UNIFORM_ZX (lsl_w0_s32_x_untied, svint32_t, uint32_t,
/*
** lsl_1_s32_x_tied1:
-** lsl z0\.s, z0\.s, #1
+** add z0\.s, z0\.s, z0\.s
** ret
*/
TEST_UNIFORM_Z (lsl_1_s32_x_tied1, svint32_t,
@@ -305,7 +305,7 @@ TEST_UNIFORM_Z (lsl_1_s32_x_tied1, svint32_t,
/*
** lsl_1_s32_x_untied:
-** lsl z0\.s, z1\.s, #1
+** add z0\.s, z1\.s, z1\.s
** ret
*/
TEST_UNIFORM_Z (lsl_1_s32_x_untied, svint32_t,
diff --git a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_s64.c b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_s64.c
index 850a798..fd930da 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_s64.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_s64.c
@@ -296,7 +296,7 @@ TEST_UNIFORM_ZX (lsl_x0_s64_x_untied, svint64_t, uint64_t,
/*
** lsl_1_s64_x_tied1:
-** lsl z0\.d, z0\.d, #1
+** add z0\.d, z0\.d, z0\.d
** ret
*/
TEST_UNIFORM_Z (lsl_1_s64_x_tied1, svint64_t,
@@ -305,7 +305,7 @@ TEST_UNIFORM_Z (lsl_1_s64_x_tied1, svint64_t,
/*
** lsl_1_s64_x_untied:
-** lsl z0\.d, z1\.d, #1
+** add z0\.d, z1\.d, z1\.d
** ret
*/
TEST_UNIFORM_Z (lsl_1_s64_x_untied, svint64_t,
diff --git a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_s8.c b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_s8.c
index d877659..e417fb9 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_s8.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_s8.c
@@ -296,7 +296,7 @@ TEST_UNIFORM_ZX (lsl_w0_s8_x_untied, svint8_t, uint8_t,
/*
** lsl_1_s8_x_tied1:
-** lsl z0\.b, z0\.b, #1
+** add z0\.b, z0\.b, z0\.b
** ret
*/
TEST_UNIFORM_Z (lsl_1_s8_x_tied1, svint8_t,
@@ -305,7 +305,7 @@ TEST_UNIFORM_Z (lsl_1_s8_x_tied1, svint8_t,
/*
** lsl_1_s8_x_untied:
-** lsl z0\.b, z1\.b, #1
+** add z0\.b, z1\.b, z1\.b
** ret
*/
TEST_UNIFORM_Z (lsl_1_s8_x_untied, svint8_t,
diff --git a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_u16.c b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_u16.c
index 068e49b..8050fe2 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_u16.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_u16.c
@@ -296,7 +296,7 @@ TEST_UNIFORM_ZX (lsl_w0_u16_x_untied, svuint16_t, uint16_t,
/*
** lsl_1_u16_x_tied1:
-** lsl z0\.h, z0\.h, #1
+** add z0\.h, z0\.h, z0\.h
** ret
*/
TEST_UNIFORM_Z (lsl_1_u16_x_tied1, svuint16_t,
@@ -305,7 +305,7 @@ TEST_UNIFORM_Z (lsl_1_u16_x_tied1, svuint16_t,
/*
** lsl_1_u16_x_untied:
-** lsl z0\.h, z1\.h, #1
+** add z0\.h, z1\.h, z1\.h
** ret
*/
TEST_UNIFORM_Z (lsl_1_u16_x_untied, svuint16_t,
diff --git a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_u32.c b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_u32.c
index 9c2be1d..30968be 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_u32.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_u32.c
@@ -296,7 +296,7 @@ TEST_UNIFORM_ZX (lsl_w0_u32_x_untied, svuint32_t, uint32_t,
/*
** lsl_1_u32_x_tied1:
-** lsl z0\.s, z0\.s, #1
+** add z0\.s, z0\.s, z0\.s
** ret
*/
TEST_UNIFORM_Z (lsl_1_u32_x_tied1, svuint32_t,
@@ -305,7 +305,7 @@ TEST_UNIFORM_Z (lsl_1_u32_x_tied1, svuint32_t,
/*
** lsl_1_u32_x_untied:
-** lsl z0\.s, z1\.s, #1
+** add z0\.s, z1\.s, z1\.s
** ret
*/
TEST_UNIFORM_Z (lsl_1_u32_x_untied, svuint32_t,
diff --git a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_u64.c b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_u64.c
index 0c1e473..2fb97ac 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_u64.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_u64.c
@@ -296,7 +296,7 @@ TEST_UNIFORM_ZX (lsl_x0_u64_x_untied, svuint64_t, uint64_t,
/*
** lsl_1_u64_x_tied1:
-** lsl z0\.d, z0\.d, #1
+** add z0\.d, z0\.d, z0\.d
** ret
*/
TEST_UNIFORM_Z (lsl_1_u64_x_tied1, svuint64_t,
@@ -305,7 +305,7 @@ TEST_UNIFORM_Z (lsl_1_u64_x_tied1, svuint64_t,
/*
** lsl_1_u64_x_untied:
-** lsl z0\.d, z1\.d, #1
+** add z0\.d, z1\.d, z1\.d
** ret
*/
TEST_UNIFORM_Z (lsl_1_u64_x_untied, svuint64_t,
diff --git a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_u8.c b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_u8.c
index 59d386c..636679a 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_u8.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_u8.c
@@ -296,7 +296,7 @@ TEST_UNIFORM_ZX (lsl_w0_u8_x_untied, svuint8_t, uint8_t,
/*
** lsl_1_u8_x_tied1:
-** lsl z0\.b, z0\.b, #1
+** add z0\.b, z0\.b, z0\.b
** ret
*/
TEST_UNIFORM_Z (lsl_1_u8_x_tied1, svuint8_t,
@@ -305,7 +305,7 @@ TEST_UNIFORM_Z (lsl_1_u8_x_tied1, svuint8_t,
/*
** lsl_1_u8_x_untied:
-** lsl z0\.b, z1\.b, #1
+** add z0\.b, z1\.b, z1\.b
** ret
*/
TEST_UNIFORM_Z (lsl_1_u8_x_untied, svuint8_t,
diff --git a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_wide_s16.c b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_wide_s16.c
index 7244f64..67b652d 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_wide_s16.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_wide_s16.c
@@ -276,7 +276,7 @@ TEST_UNIFORM_ZX (lsl_wide_x0_s16_x_untied, svint16_t, uint64_t,
/*
** lsl_wide_1_s16_x_tied1:
-** lsl z0\.h, z0\.h, #1
+** add z0\.h, z0\.h, z0\.h
** ret
*/
TEST_UNIFORM_Z (lsl_wide_1_s16_x_tied1, svint16_t,
@@ -285,7 +285,7 @@ TEST_UNIFORM_Z (lsl_wide_1_s16_x_tied1, svint16_t,
/*
** lsl_wide_1_s16_x_untied:
-** lsl z0\.h, z1\.h, #1
+** add z0\.h, z1\.h, z1\.h
** ret
*/
TEST_UNIFORM_Z (lsl_wide_1_s16_x_untied, svint16_t,
diff --git a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_wide_s32.c b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_wide_s32.c
index 04333ce..7782681 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_wide_s32.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_wide_s32.c
@@ -276,7 +276,7 @@ TEST_UNIFORM_ZX (lsl_wide_x0_s32_x_untied, svint32_t, uint64_t,
/*
** lsl_wide_1_s32_x_tied1:
-** lsl z0\.s, z0\.s, #1
+** add z0\.s, z0\.s, z0\.s
** ret
*/
TEST_UNIFORM_Z (lsl_wide_1_s32_x_tied1, svint32_t,
@@ -285,7 +285,7 @@ TEST_UNIFORM_Z (lsl_wide_1_s32_x_tied1, svint32_t,
/*
** lsl_wide_1_s32_x_untied:
-** lsl z0\.s, z1\.s, #1
+** add z0\.s, z1\.s, z1\.s
** ret
*/
TEST_UNIFORM_Z (lsl_wide_1_s32_x_untied, svint32_t,
diff --git a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_wide_s8.c b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_wide_s8.c
index 5847db7..d14e314 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_wide_s8.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_wide_s8.c
@@ -276,7 +276,7 @@ TEST_UNIFORM_ZX (lsl_wide_x0_s8_x_untied, svint8_t, uint64_t,
/*
** lsl_wide_1_s8_x_tied1:
-** lsl z0\.b, z0\.b, #1
+** add z0\.b, z0\.b, z0\.b
** ret
*/
TEST_UNIFORM_Z (lsl_wide_1_s8_x_tied1, svint8_t,
@@ -285,7 +285,7 @@ TEST_UNIFORM_Z (lsl_wide_1_s8_x_tied1, svint8_t,
/*
** lsl_wide_1_s8_x_untied:
-** lsl z0\.b, z1\.b, #1
+** add z0\.b, z1\.b, z1\.b
** ret
*/
TEST_UNIFORM_Z (lsl_wide_1_s8_x_untied, svint8_t,
diff --git a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_wide_u16.c b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_wide_u16.c
index 2c047b7..154f7bd 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_wide_u16.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_wide_u16.c
@@ -276,7 +276,7 @@ TEST_UNIFORM_ZX (lsl_wide_x0_u16_x_untied, svuint16_t, uint64_t,
/*
** lsl_wide_1_u16_x_tied1:
-** lsl z0\.h, z0\.h, #1
+** add z0\.h, z0\.h, z0\.h
** ret
*/
TEST_UNIFORM_Z (lsl_wide_1_u16_x_tied1, svuint16_t,
@@ -285,7 +285,7 @@ TEST_UNIFORM_Z (lsl_wide_1_u16_x_tied1, svuint16_t,
/*
** lsl_wide_1_u16_x_untied:
-** lsl z0\.h, z1\.h, #1
+** add z0\.h, z1\.h, z1\.h
** ret
*/
TEST_UNIFORM_Z (lsl_wide_1_u16_x_untied, svuint16_t,
diff --git a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_wide_u32.c b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_wide_u32.c
index 1e14963..d059d68 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_wide_u32.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_wide_u32.c
@@ -276,7 +276,7 @@ TEST_UNIFORM_ZX (lsl_wide_x0_u32_x_untied, svuint32_t, uint64_t,
/*
** lsl_wide_1_u32_x_tied1:
-** lsl z0\.s, z0\.s, #1
+** add z0\.s, z0\.s, z0\.s
** ret
*/
TEST_UNIFORM_Z (lsl_wide_1_u32_x_tied1, svuint32_t,
@@ -285,7 +285,7 @@ TEST_UNIFORM_Z (lsl_wide_1_u32_x_tied1, svuint32_t,
/*
** lsl_wide_1_u32_x_untied:
-** lsl z0\.s, z1\.s, #1
+** add z0\.s, z1\.s, z1\.s
** ret
*/
TEST_UNIFORM_Z (lsl_wide_1_u32_x_untied, svuint32_t,
diff --git a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_wide_u8.c b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_wide_u8.c
index 55f2721..503e101 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_wide_u8.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve/acle/asm/lsl_wide_u8.c
@@ -276,7 +276,7 @@ TEST_UNIFORM_ZX (lsl_wide_x0_u8_x_untied, svuint8_t, uint64_t,
/*
** lsl_wide_1_u8_x_tied1:
-** lsl z0\.b, z0\.b, #1
+** add z0\.b, z0\.b, z0\.b
** ret
*/
TEST_UNIFORM_Z (lsl_wide_1_u8_x_tied1, svuint8_t,
@@ -285,7 +285,7 @@ TEST_UNIFORM_Z (lsl_wide_1_u8_x_tied1, svuint8_t,
/*
** lsl_wide_1_u8_x_untied:
-** lsl z0\.b, z1\.b, #1
+** add z0\.b, z1\.b, z1\.b
** ret
*/
TEST_UNIFORM_Z (lsl_wide_1_u8_x_untied, svuint8_t,
diff --git a/gcc/testsuite/gcc.target/aarch64/sve/adr_1.c b/gcc/testsuite/gcc.target/aarch64/sve/adr_1.c
index ff47768..9eaa0d1 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve/adr_1.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve/adr_1.c
@@ -29,12 +29,10 @@
TEST_ALL (LOOP)
-/* { dg-final { scan-assembler-times {\tadd\tz[0-9]+\.b,} 2 } } */
-/* { dg-final { scan-assembler-times {\tlsl\tz[0-9]+\.b,} 2 } } */
+/* { dg-final { scan-assembler-times {\tadd\tz[0-9]+\.b,} 4 } } */
/* { dg-final { scan-assembler-not {\tadr\tz[0-9]+\.b,} } } */
-/* { dg-final { scan-assembler-times {\tadd\tz[0-9]+\.h,} 2 } } */
-/* { dg-final { scan-assembler-times {\tlsl\tz[0-9]+\.h,} 2 } } */
+/* { dg-final { scan-assembler-times {\tadd\tz[0-9]+\.h,} 4 } } */
/* { dg-final { scan-assembler-not {\tadr\tz[0-9]+\.h,} } } */
/* { dg-final { scan-assembler-not {\tadd\tz[0-9]+\.s,} } } */
diff --git a/gcc/testsuite/gcc.target/aarch64/sve/adr_6.c b/gcc/testsuite/gcc.target/aarch64/sve/adr_6.c
index 1f92749..13e2264 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve/adr_6.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve/adr_6.c
@@ -31,8 +31,8 @@ TEST_TYPE (uint16_t, 128)
TEST_TYPE (int32_t, 128)
TEST_TYPE (uint32_t, 128)
-/* { dg-final { scan-assembler-times {\tadd\tz[0-9]+\.b,} 6 } } */
-/* { dg-final { scan-assembler-times {\tlsl\tz[0-9]+\.b,} 6 } } */
+/* { dg-final { scan-assembler-times {\tadd\tz[0-9]+\.b,} 8 } } */
+/* { dg-final { scan-assembler-times {\tlsl\tz[0-9]+\.b,} 4 } } */
/* { dg-final { scan-assembler-times {\tadr\tz[0-9]+\.s, \[z[0-9]+\.s, z[0-9]+\.s, lsl #?1\]\n} 4 } } */
/* { dg-final { scan-assembler-times {\tadr\tz[0-9]+\.s, \[z[0-9]+\.s, z[0-9]+\.s, lsl #?2\]\n} 4 } } */
diff --git a/gcc/testsuite/gcc.target/aarch64/sve/cond_mla_7.c b/gcc/testsuite/gcc.target/aarch64/sve/cond_mla_7.c
index 5561f42..e11a455 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve/cond_mla_7.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve/cond_mla_7.c
@@ -31,19 +31,19 @@
TEST_ALL (DEF_LOOP)
-/* { dg-final { scan-assembler-times {\tlsl\tz[0-9]+\.b, z[0-9]+\.b, #1\n} 2 } } */
+/* { dg-final { scan-assembler-times {\tadd\tz[0-9]+\.b, z[0-9]+\.b, z[0-9]+\.b\n} 2 } } */
/* { dg-final { scan-assembler-times {\tlsl\tz[0-9]+\.b, z[0-9]+\.b, #2\n} 2 } } */
/* { dg-final { scan-assembler-times {\tlsl\tz[0-9]+\.b, z[0-9]+\.b, #7\n} 2 } } */
-/* { dg-final { scan-assembler-times {\tlsl\tz[0-9]+\.h, z[0-9]+\.h, #1\n} 2 } } */
+/* { dg-final { scan-assembler-times {\tadd\tz[0-9]+\.h, z[0-9]+\.h, z[0-9]+\.h\n} 2 } } */
/* { dg-final { scan-assembler-times {\tlsl\tz[0-9]+\.h, z[0-9]+\.h, #2\n} 2 } } */
/* { dg-final { scan-assembler-times {\tlsl\tz[0-9]+\.h, z[0-9]+\.h, #15\n} 2 } } */
-/* { dg-final { scan-assembler-times {\tlsl\tz[0-9]+\.s, z[0-9]+\.s, #1\n} 2 } } */
+/* { dg-final { scan-assembler-times {\tadd\tz[0-9]+\.s, z[0-9]+\.s, z[0-9]+\.s\n} 2 } } */
/* { dg-final { scan-assembler-times {\tlsl\tz[0-9]+\.s, z[0-9]+\.s, #2\n} 2 } } */
/* { dg-final { scan-assembler-times {\tlsl\tz[0-9]+\.s, z[0-9]+\.s, #31\n} 2 } } */
-/* { dg-final { scan-assembler-times {\tlsl\tz[0-9]+\.d, z[0-9]+\.d, #1\n} 2 } } */
+/* { dg-final { scan-assembler-times {\tadd\tz[0-9]+\.d, z[0-9]+\.d, z[0-9]+\.d\n} 2 } } */
/* { dg-final { scan-assembler-times {\tlsl\tz[0-9]+\.d, z[0-9]+\.d, #2\n} 2 } } */
/* { dg-final { scan-assembler-times {\tlsl\tz[0-9]+\.d, z[0-9]+\.d, #63\n} 2 } } */
diff --git a/gcc/testsuite/gcc.target/aarch64/sve/cond_mla_8.c b/gcc/testsuite/gcc.target/aarch64/sve/cond_mla_8.c
index d554927..7db3f62 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve/cond_mla_8.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve/cond_mla_8.c
@@ -31,19 +31,19 @@
TEST_ALL (DEF_LOOP)
-/* { dg-final { scan-assembler-times {\tlsl\tz[0-9]+\.b, z[0-9]+\.b, #1\n} 2 } } */
+/* { dg-final { scan-assembler-times {\tadd\tz[0-9]+\.b, z[0-9]+\.b, z[0-9]+\.b\n} 2 } } */
/* { dg-final { scan-assembler-times {\tlsl\tz[0-9]+\.b, z[0-9]+\.b, #2\n} 2 } } */
/* { dg-final { scan-assembler-times {\tlsl\tz[0-9]+\.b, z[0-9]+\.b, #7\n} 2 } } */
-/* { dg-final { scan-assembler-times {\tlsl\tz[0-9]+\.h, z[0-9]+\.h, #1\n} 2 } } */
+/* { dg-final { scan-assembler-times {\tadd\tz[0-9]+\.h, z[0-9]+\.h, z[0-9]+\.h\n} 2 } } */
/* { dg-final { scan-assembler-times {\tlsl\tz[0-9]+\.h, z[0-9]+\.h, #2\n} 2 } } */
/* { dg-final { scan-assembler-times {\tlsl\tz[0-9]+\.h, z[0-9]+\.h, #15\n} 2 } } */
-/* { dg-final { scan-assembler-times {\tlsl\tz[0-9]+\.s, z[0-9]+\.s, #1\n} 2 } } */
+/* { dg-final { scan-assembler-times {\tadd\tz[0-9]+\.s, z[0-9]+\.s, z[0-9]+\.s\n} 2 } } */
/* { dg-final { scan-assembler-times {\tlsl\tz[0-9]+\.s, z[0-9]+\.s, #2\n} 2 } } */
/* { dg-final { scan-assembler-times {\tlsl\tz[0-9]+\.s, z[0-9]+\.s, #31\n} 2 } } */
-/* { dg-final { scan-assembler-times {\tlsl\tz[0-9]+\.d, z[0-9]+\.d, #1\n} 2 } } */
+/* { dg-final { scan-assembler-times {\tadd\tz[0-9]+\.d, z[0-9]+\.d, z[0-9]+\.d\n} 2 } } */
/* { dg-final { scan-assembler-times {\tlsl\tz[0-9]+\.d, z[0-9]+\.d, #2\n} 2 } } */
/* { dg-final { scan-assembler-times {\tlsl\tz[0-9]+\.d, z[0-9]+\.d, #63\n} 2 } } */
diff --git a/gcc/testsuite/gcc.target/aarch64/sve/shift_2.c b/gcc/testsuite/gcc.target/aarch64/sve/shift_2.c
index b7462c4..c1eadf0 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve/shift_2.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve/shift_2.c
@@ -44,9 +44,9 @@ TEST_TYPE (uint32_t, 128, 31)
/* { dg-final { scan-assembler-times {\tasr\tz[0-9]+\.h, p[0-7]/m, z[0-9]+\.h, z[0-9]+\.h\n} 2 } } */
/* { dg-final { scan-assembler-times {\tasr\tz[0-9]+\.s, p[0-7]/m, z[0-9]+\.s, z[0-9]+\.s\n} 1 } } */
-/* { dg-final { scan-assembler-times {\tlsl\tz[0-9]+\.b, z[0-9]+\.b, #1\n} 6 } } */
-/* { dg-final { scan-assembler-times {\tlsl\tz[0-9]+\.h, z[0-9]+\.h, #1\n} 4 } } */
-/* { dg-final { scan-assembler-times {\tlsl\tz[0-9]+\.s, z[0-9]+\.s, #1\n} 2 } } */
+/* { dg-final { scan-assembler-times {\tadd\tz[0-9]+\.b, z[0-9]+\.b, z[0-9]+\.b\n} 6 } } */
+/* { dg-final { scan-assembler-times {\tadd\tz[0-9]+\.h, z[0-9]+\.h, z[0-9]+\.h\n} 4 } } */
+/* { dg-final { scan-assembler-times {\tadd\tz[0-9]+\.s, z[0-9]+\.s, z[0-9]+\.s\n} 2 } } */
/* { dg-final { scan-assembler-times {\tlsr\tz[0-9]+\.b, z[0-9]+\.b, #1\n} 3 } } */
/* { dg-final { scan-assembler-times {\tlsr\tz[0-9]+\.h, z[0-9]+\.h, #1\n} 2 } } */
diff --git a/gcc/testsuite/gcc.target/aarch64/sve/sve_shl_add.c b/gcc/testsuite/gcc.target/aarch64/sve/sve_shl_add.c
new file mode 100644
index 0000000..6b370af
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/sve/sve_shl_add.c
@@ -0,0 +1,45 @@
+/* { dg-do compile } */
+/* { dg-additional-options "-O3" } */
+/* { dg-final { check-function-bodies "**" "" "" } } */
+
+#define FUNC(NAME, OPERATION, IMMEDIATE) \
+void NAME(int n) { \
+ for (int i = 0; i < n; i++) \
+ out[i] = in[i] OPERATION IMMEDIATE; \
+} \
+
+#define N 1024
+
+int out[N], in[N];
+
+/*
+** foo:
+** ...
+** add z[0-9]+.s, z[0-9]+.s, z[0-9]+.s
+** ...
+*/
+FUNC(foo, <<, 1)
+
+/*
+** foo2:
+** ...
+** lsl z[0-9]+.s, z[0-9]+.s, #15
+** ...
+*/
+FUNC(foo2, <<, 15)
+
+/*
+** foo3:
+** ...
+** asr z[0-9]+.s, z[0-9]+.s, #1
+** ...
+*/
+FUNC(foo3, >>, 1)
+
+/*
+** foo4:
+** ...
+** asr z[0-9]+.s, z[0-9]+.s, #10
+** ...
+*/
+FUNC(foo4, >>, 10)
diff --git a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/ldnt1sh_gather_s64.c b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/ldnt1sh_gather_s64.c
index 4ea3335..4093990 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/ldnt1sh_gather_s64.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/ldnt1sh_gather_s64.c
@@ -204,7 +204,7 @@ TEST_LOAD_GATHER_SZ (ldnt1sh_gather_untied_s64_u64offset, svint64_t, int16_t, sv
/*
** ldnt1sh_gather_x0_s64_s64index:
-** lsl (z[0-9]+\.d), z0\.d, #1
+** add (z[0-9]+\.d), z0\.d, z0\.d
** ldnt1sh z0\.d, p0/z, \[\1, x0\]
** ret
*/
@@ -214,7 +214,7 @@ TEST_LOAD_GATHER_SZ (ldnt1sh_gather_x0_s64_s64index, svint64_t, int16_t, svint64
/*
** ldnt1sh_gather_tied1_s64_s64index:
-** lsl (z[0-9]+\.d), z0\.d, #1
+** add (z[0-9]+\.d), z0\.d, z0\.d
** ldnt1sh z0\.d, p0/z, \[\1, x0\]
** ret
*/
@@ -224,7 +224,7 @@ TEST_LOAD_GATHER_SZ (ldnt1sh_gather_tied1_s64_s64index, svint64_t, int16_t, svin
/*
** ldnt1sh_gather_untied_s64_s64index:
-** lsl (z[0-9]+\.d), z1\.d, #1
+** add (z[0-9]+\.d), z1\.d, z1\.d
** ldnt1sh z0\.d, p0/z, \[\1, x0\]
** ret
*/
@@ -234,7 +234,7 @@ TEST_LOAD_GATHER_SZ (ldnt1sh_gather_untied_s64_s64index, svint64_t, int16_t, svi
/*
** ldnt1sh_gather_x0_s64_u64index:
-** lsl (z[0-9]+\.d), z0\.d, #1
+** add (z[0-9]+\.d), z0\.d, z0\.d
** ldnt1sh z0\.d, p0/z, \[\1, x0\]
** ret
*/
@@ -244,7 +244,7 @@ TEST_LOAD_GATHER_SZ (ldnt1sh_gather_x0_s64_u64index, svint64_t, int16_t, svuint6
/*
** ldnt1sh_gather_tied1_s64_u64index:
-** lsl (z[0-9]+\.d), z0\.d, #1
+** add (z[0-9]+\.d), z0\.d, z0\.d
** ldnt1sh z0\.d, p0/z, \[\1, x0\]
** ret
*/
@@ -254,7 +254,7 @@ TEST_LOAD_GATHER_SZ (ldnt1sh_gather_tied1_s64_u64index, svint64_t, int16_t, svui
/*
** ldnt1sh_gather_untied_s64_u64index:
-** lsl (z[0-9]+\.d), z1\.d, #1
+** add (z[0-9]+\.d), z1\.d, z1\.d
** ldnt1sh z0\.d, p0/z, \[\1, x0\]
** ret
*/
diff --git a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/ldnt1sh_gather_u64.c b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/ldnt1sh_gather_u64.c
index 18c8ca4..afc920e 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/ldnt1sh_gather_u64.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/ldnt1sh_gather_u64.c
@@ -204,7 +204,7 @@ TEST_LOAD_GATHER_SZ (ldnt1sh_gather_untied_u64_u64offset, svuint64_t, int16_t, s
/*
** ldnt1sh_gather_x0_u64_s64index:
-** lsl (z[0-9]+\.d), z0\.d, #1
+** add (z[0-9]+\.d), z0\.d, z0\.d
** ldnt1sh z0\.d, p0/z, \[\1, x0\]
** ret
*/
@@ -214,7 +214,7 @@ TEST_LOAD_GATHER_SZ (ldnt1sh_gather_x0_u64_s64index, svuint64_t, int16_t, svint6
/*
** ldnt1sh_gather_tied1_u64_s64index:
-** lsl (z[0-9]+\.d), z0\.d, #1
+** add (z[0-9]+\.d), z0\.d, z0\.d
** ldnt1sh z0\.d, p0/z, \[\1, x0\]
** ret
*/
@@ -224,7 +224,7 @@ TEST_LOAD_GATHER_SZ (ldnt1sh_gather_tied1_u64_s64index, svuint64_t, int16_t, svi
/*
** ldnt1sh_gather_untied_u64_s64index:
-** lsl (z[0-9]+\.d), z1\.d, #1
+** add (z[0-9]+\.d), z1\.d, z1\.d
** ldnt1sh z0\.d, p0/z, \[\1, x0\]
** ret
*/
@@ -234,7 +234,7 @@ TEST_LOAD_GATHER_SZ (ldnt1sh_gather_untied_u64_s64index, svuint64_t, int16_t, sv
/*
** ldnt1sh_gather_x0_u64_u64index:
-** lsl (z[0-9]+\.d), z0\.d, #1
+** add (z[0-9]+\.d), z0\.d, z0\.d
** ldnt1sh z0\.d, p0/z, \[\1, x0\]
** ret
*/
@@ -244,7 +244,7 @@ TEST_LOAD_GATHER_SZ (ldnt1sh_gather_x0_u64_u64index, svuint64_t, int16_t, svuint
/*
** ldnt1sh_gather_tied1_u64_u64index:
-** lsl (z[0-9]+\.d), z0\.d, #1
+** add (z[0-9]+\.d), z0\.d, z0\.d
** ldnt1sh z0\.d, p0/z, \[\1, x0\]
** ret
*/
@@ -254,7 +254,7 @@ TEST_LOAD_GATHER_SZ (ldnt1sh_gather_tied1_u64_u64index, svuint64_t, int16_t, svu
/*
** ldnt1sh_gather_untied_u64_u64index:
-** lsl (z[0-9]+\.d), z1\.d, #1
+** add (z[0-9]+\.d), z1\.d, z1\.d
** ldnt1sh z0\.d, p0/z, \[\1, x0\]
** ret
*/
diff --git a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/ldnt1uh_gather_s64.c b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/ldnt1uh_gather_s64.c
index be2e6d1..a468508 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/ldnt1uh_gather_s64.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/ldnt1uh_gather_s64.c
@@ -204,7 +204,7 @@ TEST_LOAD_GATHER_SZ (ldnt1uh_gather_untied_s64_u64offset, svint64_t, uint16_t, s
/*
** ldnt1uh_gather_x0_s64_s64index:
-** lsl (z[0-9]+\.d), z0\.d, #1
+** add (z[0-9]+\.d), z0\.d, z0\.d
** ldnt1h z0\.d, p0/z, \[\1, x0\]
** ret
*/
@@ -214,7 +214,7 @@ TEST_LOAD_GATHER_SZ (ldnt1uh_gather_x0_s64_s64index, svint64_t, uint16_t, svint6
/*
** ldnt1uh_gather_tied1_s64_s64index:
-** lsl (z[0-9]+\.d), z0\.d, #1
+** add (z[0-9]+\.d), z0\.d, z0\.d
** ldnt1h z0\.d, p0/z, \[\1, x0\]
** ret
*/
@@ -224,7 +224,7 @@ TEST_LOAD_GATHER_SZ (ldnt1uh_gather_tied1_s64_s64index, svint64_t, uint16_t, svi
/*
** ldnt1uh_gather_untied_s64_s64index:
-** lsl (z[0-9]+\.d), z1\.d, #1
+** add (z[0-9]+\.d), z1\.d, z1\.d
** ldnt1h z0\.d, p0/z, \[\1, x0\]
** ret
*/
@@ -234,7 +234,7 @@ TEST_LOAD_GATHER_SZ (ldnt1uh_gather_untied_s64_s64index, svint64_t, uint16_t, sv
/*
** ldnt1uh_gather_x0_s64_u64index:
-** lsl (z[0-9]+\.d), z0\.d, #1
+** add (z[0-9]+\.d), z0\.d, z0\.d
** ldnt1h z0\.d, p0/z, \[\1, x0\]
** ret
*/
@@ -244,7 +244,7 @@ TEST_LOAD_GATHER_SZ (ldnt1uh_gather_x0_s64_u64index, svint64_t, uint16_t, svuint
/*
** ldnt1uh_gather_tied1_s64_u64index:
-** lsl (z[0-9]+\.d), z0\.d, #1
+** add (z[0-9]+\.d), z0\.d, z0\.d
** ldnt1h z0\.d, p0/z, \[\1, x0\]
** ret
*/
@@ -254,7 +254,7 @@ TEST_LOAD_GATHER_SZ (ldnt1uh_gather_tied1_s64_u64index, svint64_t, uint16_t, svu
/*
** ldnt1uh_gather_untied_s64_u64index:
-** lsl (z[0-9]+\.d), z1\.d, #1
+** add (z[0-9]+\.d), z1\.d, z1\.d
** ldnt1h z0\.d, p0/z, \[\1, x0\]
** ret
*/
diff --git a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/ldnt1uh_gather_u64.c b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/ldnt1uh_gather_u64.c
index e3bc104..ffcbf1f 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/ldnt1uh_gather_u64.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/ldnt1uh_gather_u64.c
@@ -204,7 +204,7 @@ TEST_LOAD_GATHER_SZ (ldnt1uh_gather_untied_u64_u64offset, svuint64_t, uint16_t,
/*
** ldnt1uh_gather_x0_u64_s64index:
-** lsl (z[0-9]+\.d), z0\.d, #1
+** add (z[0-9]+\.d), z0\.d, z0\.d
** ldnt1h z0\.d, p0/z, \[\1, x0\]
** ret
*/
@@ -214,7 +214,7 @@ TEST_LOAD_GATHER_SZ (ldnt1uh_gather_x0_u64_s64index, svuint64_t, uint16_t, svint
/*
** ldnt1uh_gather_tied1_u64_s64index:
-** lsl (z[0-9]+\.d), z0\.d, #1
+** add (z[0-9]+\.d), z0\.d, z0\.d
** ldnt1h z0\.d, p0/z, \[\1, x0\]
** ret
*/
@@ -224,7 +224,7 @@ TEST_LOAD_GATHER_SZ (ldnt1uh_gather_tied1_u64_s64index, svuint64_t, uint16_t, sv
/*
** ldnt1uh_gather_untied_u64_s64index:
-** lsl (z[0-9]+\.d), z1\.d, #1
+** add (z[0-9]+\.d), z1\.d, z1\.d
** ldnt1h z0\.d, p0/z, \[\1, x0\]
** ret
*/
@@ -234,7 +234,7 @@ TEST_LOAD_GATHER_SZ (ldnt1uh_gather_untied_u64_s64index, svuint64_t, uint16_t, s
/*
** ldnt1uh_gather_x0_u64_u64index:
-** lsl (z[0-9]+\.d), z0\.d, #1
+** add (z[0-9]+\.d), z0\.d, z0\.d
** ldnt1h z0\.d, p0/z, \[\1, x0\]
** ret
*/
@@ -244,7 +244,7 @@ TEST_LOAD_GATHER_SZ (ldnt1uh_gather_x0_u64_u64index, svuint64_t, uint16_t, svuin
/*
** ldnt1uh_gather_tied1_u64_u64index:
-** lsl (z[0-9]+\.d), z0\.d, #1
+** add (z[0-9]+\.d), z0\.d, z0\.d
** ldnt1h z0\.d, p0/z, \[\1, x0\]
** ret
*/
@@ -254,7 +254,7 @@ TEST_LOAD_GATHER_SZ (ldnt1uh_gather_tied1_u64_u64index, svuint64_t, uint16_t, sv
/*
** ldnt1uh_gather_untied_u64_u64index:
-** lsl (z[0-9]+\.d), z1\.d, #1
+** add (z[0-9]+\.d), z1\.d, z1\.d
** ldnt1h z0\.d, p0/z, \[\1, x0\]
** ret
*/
diff --git a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_s16.c b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_s16.c
index 103af35..6bd88dc 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_s16.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_s16.c
@@ -361,7 +361,7 @@ TEST_UNIFORM_Z (rshl_m1_s16_x_untied, svint16_t,
/*
** rshl_1_s16_x_tied1:
-** lsl z0\.h, z0\.h, #1
+** add z0\.h, z0\.h, z0\.h
** ret
*/
TEST_UNIFORM_Z (rshl_1_s16_x_tied1, svint16_t,
@@ -370,7 +370,7 @@ TEST_UNIFORM_Z (rshl_1_s16_x_tied1, svint16_t,
/*
** rshl_1_s16_x_untied:
-** lsl z0\.h, z1\.h, #1
+** add z0\.h, z1\.h, z1\.h
** ret
*/
TEST_UNIFORM_Z (rshl_1_s16_x_untied, svint16_t,
diff --git a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_s32.c b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_s32.c
index 542c857..450a45b 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_s32.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_s32.c
@@ -361,7 +361,7 @@ TEST_UNIFORM_Z (rshl_m1_s32_x_untied, svint32_t,
/*
** rshl_1_s32_x_tied1:
-** lsl z0\.s, z0\.s, #1
+** add z0\.s, z0\.s, z0\.s
** ret
*/
TEST_UNIFORM_Z (rshl_1_s32_x_tied1, svint32_t,
@@ -370,7 +370,7 @@ TEST_UNIFORM_Z (rshl_1_s32_x_tied1, svint32_t,
/*
** rshl_1_s32_x_untied:
-** lsl z0\.s, z1\.s, #1
+** add z0\.s, z1\.s, z1\.s
** ret
*/
TEST_UNIFORM_Z (rshl_1_s32_x_untied, svint32_t,
diff --git a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_s64.c b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_s64.c
index b85fbb5..3e54707 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_s64.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_s64.c
@@ -361,7 +361,7 @@ TEST_UNIFORM_Z (rshl_m1_s64_x_untied, svint64_t,
/*
** rshl_1_s64_x_tied1:
-** lsl z0\.d, z0\.d, #1
+** add z0\.d, z0\.d, z0\.d
** ret
*/
TEST_UNIFORM_Z (rshl_1_s64_x_tied1, svint64_t,
@@ -370,7 +370,7 @@ TEST_UNIFORM_Z (rshl_1_s64_x_tied1, svint64_t,
/*
** rshl_1_s64_x_untied:
-** lsl z0\.d, z1\.d, #1
+** add z0\.d, z1\.d, z1\.d
** ret
*/
TEST_UNIFORM_Z (rshl_1_s64_x_untied, svint64_t,
diff --git a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_s8.c b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_s8.c
index f33102c..7ba2d7c 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_s8.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_s8.c
@@ -361,7 +361,7 @@ TEST_UNIFORM_Z (rshl_m1_s8_x_untied, svint8_t,
/*
** rshl_1_s8_x_tied1:
-** lsl z0\.b, z0\.b, #1
+** add z0\.b, z0\.b, z0\.b
** ret
*/
TEST_UNIFORM_Z (rshl_1_s8_x_tied1, svint8_t,
@@ -370,7 +370,7 @@ TEST_UNIFORM_Z (rshl_1_s8_x_tied1, svint8_t,
/*
** rshl_1_s8_x_untied:
-** lsl z0\.b, z1\.b, #1
+** add z0\.b, z1\.b, z1\.b
** ret
*/
TEST_UNIFORM_Z (rshl_1_s8_x_untied, svint8_t,
diff --git a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_u16.c b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_u16.c
index 3b7abfe..2b01b9f 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_u16.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_u16.c
@@ -361,7 +361,7 @@ TEST_UNIFORM_Z (rshl_m1_u16_x_untied, svuint16_t,
/*
** rshl_1_u16_x_tied1:
-** lsl z0\.h, z0\.h, #1
+** add z0\.h, z0\.h, z0\.h
** ret
*/
TEST_UNIFORM_Z (rshl_1_u16_x_tied1, svuint16_t,
@@ -370,7 +370,7 @@ TEST_UNIFORM_Z (rshl_1_u16_x_tied1, svuint16_t,
/*
** rshl_1_u16_x_untied:
-** lsl z0\.h, z1\.h, #1
+** add z0\.h, z1\.h, z1\.h
** ret
*/
TEST_UNIFORM_Z (rshl_1_u16_x_untied, svuint16_t,
diff --git a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_u32.c b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_u32.c
index ed86ae0..c659987 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_u32.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_u32.c
@@ -361,7 +361,7 @@ TEST_UNIFORM_Z (rshl_m1_u32_x_untied, svuint32_t,
/*
** rshl_1_u32_x_tied1:
-** lsl z0\.s, z0\.s, #1
+** add z0\.s, z0\.s, z0\.s
** ret
*/
TEST_UNIFORM_Z (rshl_1_u32_x_tied1, svuint32_t,
@@ -370,7 +370,7 @@ TEST_UNIFORM_Z (rshl_1_u32_x_tied1, svuint32_t,
/*
** rshl_1_u32_x_untied:
-** lsl z0\.s, z1\.s, #1
+** add z0\.s, z1\.s, z1\.s
** ret
*/
TEST_UNIFORM_Z (rshl_1_u32_x_untied, svuint32_t,
diff --git a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_u64.c b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_u64.c
index cd92206..23b4930 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_u64.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_u64.c
@@ -361,7 +361,7 @@ TEST_UNIFORM_Z (rshl_m1_u64_x_untied, svuint64_t,
/*
** rshl_1_u64_x_tied1:
-** lsl z0\.d, z0\.d, #1
+** add z0\.d, z0\.d, z0\.d
** ret
*/
TEST_UNIFORM_Z (rshl_1_u64_x_tied1, svuint64_t,
@@ -370,7 +370,7 @@ TEST_UNIFORM_Z (rshl_1_u64_x_tied1, svuint64_t,
/*
** rshl_1_u64_x_untied:
-** lsl z0\.d, z1\.d, #1
+** add z0\.d, z1\.d, z1\.d
** ret
*/
TEST_UNIFORM_Z (rshl_1_u64_x_untied, svuint64_t,
diff --git a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_u8.c b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_u8.c
index 4cc0036..39507b1 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_u8.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/rshl_u8.c
@@ -361,7 +361,7 @@ TEST_UNIFORM_Z (rshl_m1_u8_x_untied, svuint8_t,
/*
** rshl_1_u8_x_tied1:
-** lsl z0\.b, z0\.b, #1
+** add z0\.b, z0\.b, z0\.b
** ret
*/
TEST_UNIFORM_Z (rshl_1_u8_x_tied1, svuint8_t,
@@ -370,7 +370,7 @@ TEST_UNIFORM_Z (rshl_1_u8_x_tied1, svuint8_t,
/*
** rshl_1_u8_x_untied:
-** lsl z0\.b, z1\.b, #1
+** add z0\.b, z1\.b, z1\.b
** ret
*/
TEST_UNIFORM_Z (rshl_1_u8_x_untied, svuint8_t,
diff --git a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/stnt1h_scatter_s64.c b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/stnt1h_scatter_s64.c
index 006e0e2..07f9c08 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/stnt1h_scatter_s64.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/stnt1h_scatter_s64.c
@@ -177,7 +177,7 @@ TEST_STORE_SCATTER_SZ (stnt1h_scatter_s64_u64offset, svint64_t, int16_t, svuint6
/*
** stnt1h_scatter_x0_s64_s64index:
-** lsl (z[0-9]+\.d), z1\.d, #1
+** add (z[0-9]+\.d), z1\.d, z1\.d
** stnt1h z0\.d, p0, \[\1, x0\]
** ret
*/
@@ -187,7 +187,7 @@ TEST_STORE_SCATTER_SZ (stnt1h_scatter_x0_s64_s64index, svint64_t, int16_t, svint
/*
** stnt1h_scatter_s64_s64index:
-** lsl (z[0-9]+\.d), z1\.d, #1
+** add (z[0-9]+\.d), z1\.d, z1\.d
** stnt1h z0\.d, p0, \[\1, x0\]
** ret
*/
@@ -197,7 +197,7 @@ TEST_STORE_SCATTER_SZ (stnt1h_scatter_s64_s64index, svint64_t, int16_t, svint64_
/*
** stnt1h_scatter_x0_s64_u64index:
-** lsl (z[0-9]+\.d), z1\.d, #1
+** add (z[0-9]+\.d), z1\.d, z1\.d
** stnt1h z0\.d, p0, \[\1, x0\]
** ret
*/
@@ -207,7 +207,7 @@ TEST_STORE_SCATTER_SZ (stnt1h_scatter_x0_s64_u64index, svint64_t, int16_t, svuin
/*
** stnt1h_scatter_s64_u64index:
-** lsl (z[0-9]+\.d), z1\.d, #1
+** add (z[0-9]+\.d), z1\.d, z1\.d
** stnt1h z0\.d, p0, \[\1, x0\]
** ret
*/
diff --git a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/stnt1h_scatter_u64.c b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/stnt1h_scatter_u64.c
index 972ee36..792e10c 100644
--- a/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/stnt1h_scatter_u64.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve2/acle/asm/stnt1h_scatter_u64.c
@@ -177,7 +177,7 @@ TEST_STORE_SCATTER_SZ (stnt1h_scatter_u64_u64offset, svuint64_t, uint16_t, svuin
/*
** stnt1h_scatter_x0_u64_s64index:
-** lsl (z[0-9]+\.d), z1\.d, #1
+** add (z[0-9]+\.d), z1\.d, z1\.d
** stnt1h z0\.d, p0, \[\1, x0\]
** ret
*/
@@ -187,7 +187,7 @@ TEST_STORE_SCATTER_SZ (stnt1h_scatter_x0_u64_s64index, svuint64_t, uint16_t, svi
/*
** stnt1h_scatter_u64_s64index:
-** lsl (z[0-9]+\.d), z1\.d, #1
+** add (z[0-9]+\.d), z1\.d, z1\.d
** stnt1h z0\.d, p0, \[\1, x0\]
** ret
*/
@@ -197,7 +197,7 @@ TEST_STORE_SCATTER_SZ (stnt1h_scatter_u64_s64index, svuint64_t, uint16_t, svint6
/*
** stnt1h_scatter_x0_u64_u64index:
-** lsl (z[0-9]+\.d), z1\.d, #1
+** add (z[0-9]+\.d), z1\.d, z1\.d
** stnt1h z0\.d, p0, \[\1, x0\]
** ret
*/
@@ -207,7 +207,7 @@ TEST_STORE_SCATTER_SZ (stnt1h_scatter_x0_u64_u64index, svuint64_t, uint16_t, svu
/*
** stnt1h_scatter_u64_u64index:
-** lsl (z[0-9]+\.d), z1\.d, #1
+** add (z[0-9]+\.d), z1\.d, z1\.d
** stnt1h z0\.d, p0, \[\1, x0\]
** ret
*/