From 9798ba2c6b4cccb17277a9d5fc04d285bf48f742 Mon Sep 17 00:00:00 2001 From: Tamar Christina Date: Fri, 7 Mar 2025 13:32:11 +0000 Subject: aarch64: add support for partial modes to last extractions [PR118464] The last extraction instructions work full both full and partial SVE vectors, however we currrently only define them for FULL vectors. Early break code for VLA now however requires partial vector support, which relies on extract_last support. I have not added any new testcases as they overlap with the existing Early break tests which now fail without this. gcc/ChangeLog: PR tree-optimization/118464 PR tree-optimization/116855 * config/aarch64/aarch64-sve.md (@extract__, @fold_extract__, @aarch64_fold_extract_vector__): Change SVE_FULL to SVE_ALL. * config/aarch64/iterators.md (vccore): Add more partial types. --- gcc/config/aarch64/aarch64-sve.md | 24 ++++++++++++------------ gcc/config/aarch64/iterators.md | 6 +++++- 2 files changed, 17 insertions(+), 13 deletions(-) (limited to 'gcc') diff --git a/gcc/config/aarch64/aarch64-sve.md b/gcc/config/aarch64/aarch64-sve.md index a93bc46..3dbd659 100644 --- a/gcc/config/aarch64/aarch64-sve.md +++ b/gcc/config/aarch64/aarch64-sve.md @@ -3107,12 +3107,12 @@ [(set (match_operand: 0 "register_operand") (unspec: [(match_operand: 1 "register_operand") - (match_operand:SVE_FULL 2 "register_operand")] + (match_operand:SVE_ALL 2 "register_operand")] LAST))] "TARGET_SVE" {@ [ cons: =0 , 1 , 2 ] - [ ?r , Upl , w ] last\t%0, %1, %2. - [ w , Upl , w ] last\t%0, %1, %2. + [ ?r , Upl , w ] last\t%0, %1, %2. + [ w , Upl , w ] last\t%0, %1, %2. } ) @@ -8899,26 +8899,26 @@ (unspec: [(match_operand: 1 "register_operand") (match_operand: 2 "register_operand") - (match_operand:SVE_FULL 3 "register_operand")] + (match_operand:SVE_ALL 3 "register_operand")] CLAST))] "TARGET_SVE" {@ [ cons: =0 , 1 , 2 , 3 ] - [ ?r , 0 , Upl , w ] clast\t%0, %2, %0, %3. - [ w , 0 , Upl , w ] clast\t%0, %2, %0, %3. + [ ?r , 0 , Upl , w ] clast\t%0, %2, %0, %3. + [ w , 0 , Upl , w ] clast\t%0, %2, %0, %3. } ) (define_insn "@aarch64_fold_extract_vector__" - [(set (match_operand:SVE_FULL 0 "register_operand") - (unspec:SVE_FULL - [(match_operand:SVE_FULL 1 "register_operand") + [(set (match_operand:SVE_ALL 0 "register_operand") + (unspec:SVE_ALL + [(match_operand:SVE_ALL 1 "register_operand") (match_operand: 2 "register_operand") - (match_operand:SVE_FULL 3 "register_operand")] + (match_operand:SVE_ALL 3 "register_operand")] CLAST))] "TARGET_SVE" {@ [ cons: =0 , 1 , 2 , 3 ] - [ w , 0 , Upl , w ] clast\t%0., %2, %0., %3. - [ ?&w , w , Upl , w ] movprfx\t%0, %1\;clast\t%0., %2, %0., %3. + [ w , 0 , Upl , w ] clast\t%0., %2, %0., %3. + [ ?&w , w , Upl , w ] movprfx\t%0, %1\;clast\t%0., %2, %0., %3. } ) diff --git a/gcc/config/aarch64/iterators.md b/gcc/config/aarch64/iterators.md index 5bfd6e7..146453b 100644 --- a/gcc/config/aarch64/iterators.md +++ b/gcc/config/aarch64/iterators.md @@ -2025,8 +2025,12 @@ ;; Like vwcore, but for the container mode rather than the element mode. (define_mode_attr vccore [(VNx16QI "w") (VNx8QI "w") (VNx4QI "w") (VNx2QI "x") (VNx8HI "w") (VNx4HI "w") (VNx2HI "x") + (VNx8HF "w") (VNx4HF "w") (VNx2HF "x") + (VNx8BF "w") (VNx4BF "w") (VNx2BF "x") (VNx4SI "w") (VNx2SI "x") - (VNx2DI "x")]) + (VNx4SF "w") (VNx2SF "x") + (VNx2DI "x") + (VNx2DF "x")]) ;; Double vector types for ALLX. (define_mode_attr Vallxd [(QI "8b") (HI "4h") (SI "2s")]) -- cgit v1.1