diff options
author | Richard Sandiford <richard.sandiford@arm.com> | 2019-12-10 16:32:40 +0000 |
---|---|---|
committer | Richard Sandiford <rsandifo@gcc.gnu.org> | 2019-12-10 16:32:40 +0000 |
commit | 30f8bf3d6c072a8fce14e8a003dff485a9068a97 (patch) | |
tree | 3c677c1d911f9af6a7ecf2f90f1d00705af35e7c /gcc | |
parent | 393283b8efaba009ce57a78fa658f55fbf262551 (diff) | |
download | gcc-30f8bf3d6c072a8fce14e8a003dff485a9068a97.zip gcc-30f8bf3d6c072a8fce14e8a003dff485a9068a97.tar.gz gcc-30f8bf3d6c072a8fce14e8a003dff485a9068a97.tar.bz2 |
[AArch64] Fix INDEX patterns for partial VNx2 modes
The INDEX patterns handle partial modes by choosing the container
size rather than the element size, so that the number of lanes
(and thus number of additions) matches the mode. This means that
all VNx4 modes use .s and all VNx2 modes use .d, etc.
When adding this, I'd forgotten that the choice between Wn and Xn
registers would need to be updated to use the container size too.
For partial VNx2s, we were using .d containers with Wn rather than
Xn source registers.
2019-12-10 Richard Sandiford <richard.sandiford@arm.com>
gcc/
* config/aarch64/iterators.md (vccore): New iterator.
* config/aarch64/aarch64-sve.md (vec_series<mode>): Use it instead
of vwcore.
(*vec_series<mode>_plus): Likewise.
gcc/testsuite/
* gcc.target/aarch64/sve/mixed_size_6.c: New test.
From-SVN: r279173
Diffstat (limited to 'gcc')
-rw-r--r-- | gcc/ChangeLog | 7 | ||||
-rw-r--r-- | gcc/config/aarch64/aarch64-sve.md | 8 | ||||
-rw-r--r-- | gcc/config/aarch64/iterators.md | 6 | ||||
-rw-r--r-- | gcc/testsuite/ChangeLog | 4 | ||||
-rw-r--r-- | gcc/testsuite/gcc.target/aarch64/sve/mixed_size_6.c | 47 |
5 files changed, 68 insertions, 4 deletions
diff --git a/gcc/ChangeLog b/gcc/ChangeLog index f559d3a..577acb1 100644 --- a/gcc/ChangeLog +++ b/gcc/ChangeLog @@ -1,3 +1,10 @@ +2019-12-10 Richard Sandiford <richard.sandiford@arm.com> + + * config/aarch64/iterators.md (vccore): New iterator. + * config/aarch64/aarch64-sve.md (vec_series<mode>): Use it instead + of vwcore. + (*vec_series<mode>_plus): Likewise. + 2019-12-10 Frederik Harwath <frederik@codesourcery.com> * omp-low.c (scan_omp_for): Use clause location in warning. diff --git a/gcc/config/aarch64/aarch64-sve.md b/gcc/config/aarch64/aarch64-sve.md index 4427609..1d9cdad 100644 --- a/gcc/config/aarch64/aarch64-sve.md +++ b/gcc/config/aarch64/aarch64-sve.md @@ -2541,9 +2541,9 @@ (match_operand:<VEL> 2 "aarch64_sve_index_operand" "r, Usi, r")))] "TARGET_SVE" "@ - index\t%0.<Vctype>, #%1, %<vwcore>2 - index\t%0.<Vctype>, %<vwcore>1, #%2 - index\t%0.<Vctype>, %<vwcore>1, %<vwcore>2" + index\t%0.<Vctype>, #%1, %<vccore>2 + index\t%0.<Vctype>, %<vccore>1, #%2 + index\t%0.<Vctype>, %<vccore>1, %<vccore>2" ) ;; Optimize {x, x, x, x, ...} + {0, n, 2*n, 3*n, ...} if n is in range @@ -2557,7 +2557,7 @@ "TARGET_SVE && aarch64_check_zero_based_sve_index_immediate (operands[2])" { operands[2] = aarch64_check_zero_based_sve_index_immediate (operands[2]); - return "index\t%0.<Vctype>, %<vwcore>1, #%2"; + return "index\t%0.<Vctype>, %<vccore>1, #%2"; } ) diff --git a/gcc/config/aarch64/iterators.md b/gcc/config/aarch64/iterators.md index 83a0d15..1ca5ed1 100644 --- a/gcc/config/aarch64/iterators.md +++ b/gcc/config/aarch64/iterators.md @@ -1093,6 +1093,12 @@ (VNx2DI "x") (VNx2DF "x")]) +;; Like vwcore, but for the container mode rather than the element mode. +(define_mode_attr vccore [(VNx16QI "w") (VNx8QI "w") (VNx4QI "w") (VNx2QI "x") + (VNx8HI "w") (VNx4HI "w") (VNx2HI "x") + (VNx4SI "w") (VNx2SI "x") + (VNx2DI "x")]) + ;; Double vector types for ALLX. (define_mode_attr Vallxd [(QI "8b") (HI "4h") (SI "2s")]) diff --git a/gcc/testsuite/ChangeLog b/gcc/testsuite/ChangeLog index e2454a6..c1f22f2 100644 --- a/gcc/testsuite/ChangeLog +++ b/gcc/testsuite/ChangeLog @@ -1,3 +1,7 @@ +2019-12-10 Richard Sandiford <richard.sandiford@arm.com> + + * gcc.target/aarch64/sve/mixed_size_6.c: New test. + 2019-12-10 Frederik Harwath <frederik@codesourcery.com> * c-c++-common/goacc/clause-locations.c: New test. diff --git a/gcc/testsuite/gcc.target/aarch64/sve/mixed_size_6.c b/gcc/testsuite/gcc.target/aarch64/sve/mixed_size_6.c new file mode 100644 index 0000000..837edec --- /dev/null +++ b/gcc/testsuite/gcc.target/aarch64/sve/mixed_size_6.c @@ -0,0 +1,47 @@ +/* { dg-options "-O3 -msve-vector-bits=256" } */ + +#include <stdint.h> + +void +f1 (uint64_t *restrict ptr1, uint8_t *restrict ptr2, uint8_t start) +{ +#pragma GCC unroll 0 + for (int i = 0; i < 4; ++i) + { + ptr1[i] = 10; + ptr2[i] = start; + start += 1; + } +} + +void +f2 (uint64_t *restrict ptr1, uint16_t *restrict ptr2, uint16_t start) +{ +#pragma GCC unroll 0 + for (int i = 0; i < 4; ++i) + { + ptr1[i] = 10; + ptr2[i] = start; + start += 2; + } +} + +void +f3 (uint64_t *restrict ptr1, uint32_t *restrict ptr2, uint32_t start) +{ +#pragma GCC unroll 0 + for (int i = 0; i < 4; ++i) + { + ptr1[i] = 10; + ptr2[i] = start; + start += 4; + } +} + +/* { dg-final { scan-assembler {\tindex\tz[0-9]+\.d, x[0-9]+, #1\n} } } */ +/* { dg-final { scan-assembler {\tindex\tz[0-9]+\.d, x[0-9]+, #1\n} } } */ +/* { dg-final { scan-assembler {\tindex\tz[0-9]+\.d, x[0-9]+, #4\n} } } */ + +/* { dg-final { scan-assembler-not {\tindex\tz[0-9]+\.d, w[0-9]+, #1\n} } } */ +/* { dg-final { scan-assembler-not {\tindex\tz[0-9]+\.d, w[0-9]+, #1\n} } } */ +/* { dg-final { scan-assembler-not {\tindex\tz[0-9]+\.d, w[0-9]+, #4\n} } } */ |