aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorKyrylo Tkachov <kyrylo.tkachov@arm.com>2023-05-10 12:04:47 +0100
committerKyrylo Tkachov <kyrylo.tkachov@arm.com>2023-05-10 12:04:47 +0100
commit5a7dda68000dcbe6c54735313521228812b10893 (patch)
treeddf2fc4f2a738d953a5bc03871793cec26ca1d8b
parent3ed5677bb61b334a2d01c769859cdd3279e12a07 (diff)
downloadgcc-5a7dda68000dcbe6c54735313521228812b10893.zip
gcc-5a7dda68000dcbe6c54735313521228812b10893.tar.gz
gcc-5a7dda68000dcbe6c54735313521228812b10893.tar.bz2
aarch64: Simplify sqmovun expander
This patch is a no-op as it removes the explicit vec-concat-zero patterns in favour of vczle/vczbe. This allows us to delete the explicit expander too. Tests are added to ensure the optimisation required still triggers. Bootstrapped and tested on aarch64-none-linux-gnu and aarch64_be-none-elf. gcc/ChangeLog: * config/aarch64/aarch64-simd.md (aarch64_sqmovun<mode>_insn_le): Delete. (aarch64_sqmovun<mode>_insn_be): Delete. (aarch64_sqmovun<mode><vczle><vczbe>): New define_insn. (aarch64_sqmovun<mode>): Delete expander. gcc/testsuite/ChangeLog: * gcc.target/aarch64/simd/pr99195_4.c: Add tests for sqmovun.
-rw-r--r--gcc/config/aarch64/aarch64-simd.md45
-rw-r--r--gcc/testsuite/gcc.target/aarch64/simd/pr99195_4.c8
2 files changed, 13 insertions, 40 deletions
diff --git a/gcc/config/aarch64/aarch64-simd.md b/gcc/config/aarch64/aarch64-simd.md
index 500d92c..bfc98a8 100644
--- a/gcc/config/aarch64/aarch64-simd.md
+++ b/gcc/config/aarch64/aarch64-simd.md
@@ -5327,50 +5327,15 @@
[(set_attr "type" "neon_sat_shift_imm_narrow_q")]
)
-(define_insn "aarch64_sqmovun<mode>_insn_le"
- [(set (match_operand:<VNARROWQ2> 0 "register_operand" "=w")
- (vec_concat:<VNARROWQ2>
- (unspec:<VNARROWQ> [(match_operand:VQN 1 "register_operand" "w")]
- UNSPEC_SQXTUN)
- (match_operand:<VNARROWQ> 2 "aarch64_simd_or_scalar_imm_zero")))]
- "TARGET_SIMD && !BYTES_BIG_ENDIAN"
- "sqxtun\\t%<vn2>0<Vmntype>, %<v>1<Vmtype>"
- [(set_attr "type" "neon_sat_shift_imm_narrow_q")]
-)
-
-(define_insn "aarch64_sqmovun<mode>_insn_be"
- [(set (match_operand:<VNARROWQ2> 0 "register_operand" "=w")
- (vec_concat:<VNARROWQ2>
- (match_operand:<VNARROWQ> 2 "aarch64_simd_or_scalar_imm_zero")
- (unspec:<VNARROWQ> [(match_operand:VQN 1 "register_operand" "w")]
- UNSPEC_SQXTUN)))]
- "TARGET_SIMD && BYTES_BIG_ENDIAN"
+(define_insn "aarch64_sqmovun<mode><vczle><vczbe>"
+ [(set (match_operand:<VNARROWQ> 0 "register_operand" "=w")
+ (unspec:<VNARROWQ> [(match_operand:VQN 1 "register_operand" "w")]
+ UNSPEC_SQXTUN))]
+ "TARGET_SIMD"
"sqxtun\\t%<vn2>0<Vmntype>, %<v>1<Vmtype>"
[(set_attr "type" "neon_sat_shift_imm_narrow_q")]
)
-(define_expand "aarch64_sqmovun<mode>"
- [(set (match_operand:<VNARROWQ> 0 "register_operand")
- (unspec:<VNARROWQ> [(match_operand:VQN 1 "register_operand")]
- UNSPEC_SQXTUN))]
- "TARGET_SIMD"
- {
- rtx tmp = gen_reg_rtx (<VNARROWQ2>mode);
- if (BYTES_BIG_ENDIAN)
- emit_insn (gen_aarch64_sqmovun<mode>_insn_be (tmp, operands[1],
- CONST0_RTX (<VNARROWQ>mode)));
- else
- emit_insn (gen_aarch64_sqmovun<mode>_insn_le (tmp, operands[1],
- CONST0_RTX (<VNARROWQ>mode)));
-
- /* The intrinsic expects a narrow result, so emit a subreg that will get
- optimized away as appropriate. */
- emit_move_insn (operands[0], lowpart_subreg (<VNARROWQ>mode, tmp,
- <VNARROWQ2>mode));
- DONE;
- }
-)
-
(define_insn "aarch64_sqxtun2<mode>_le"
[(set (match_operand:<VNARROWQ2> 0 "register_operand" "=w")
(vec_concat:<VNARROWQ2>
diff --git a/gcc/testsuite/gcc.target/aarch64/simd/pr99195_4.c b/gcc/testsuite/gcc.target/aarch64/simd/pr99195_4.c
index 6127cb2..8faf569 100644
--- a/gcc/testsuite/gcc.target/aarch64/simd/pr99195_4.c
+++ b/gcc/testsuite/gcc.target/aarch64/simd/pr99195_4.c
@@ -50,6 +50,14 @@ MYOP (uint32x4_t, uint64x2_t, uint32x2_t, OP, u64, u32) \
FUNC (movn)
FUNC (qmovn)
+#undef FUNC
+#define FUNC(OP) \
+MYOP (uint8x16_t, int16x8_t, uint8x8_t, OP, s16, u8) \
+MYOP (uint16x8_t, int32x4_t, uint16x4_t, OP, s32, u16) \
+MYOP (uint32x4_t, int64x2_t, uint32x2_t, OP, s64, u32) \
+
+FUNC (qmovun)
+
/* { dg-final { scan-assembler-not {\tfmov\t} } } */
/* { dg-final { scan-assembler-not {\tmov\t} } } */