diff options
author | Jakub Jelinek <jakub@redhat.com> | 2015-11-24 11:45:52 +0100 |
---|---|---|
committer | Jakub Jelinek <jakub@gcc.gnu.org> | 2015-11-24 11:45:52 +0100 |
commit | 3788cfb513d19a9b36311b1317aff2141a2c6a65 (patch) | |
tree | 64cec4dd60c911068b6646624ee5ba614d073759 /gcc | |
parent | 3de2a40ecdfa37efa403d4b46ef116225acb0dc0 (diff) | |
download | gcc-3788cfb513d19a9b36311b1317aff2141a2c6a65.zip gcc-3788cfb513d19a9b36311b1317aff2141a2c6a65.tar.gz gcc-3788cfb513d19a9b36311b1317aff2141a2c6a65.tar.bz2 |
re PR target/68483 (gcc 5.2: suboptimal code compared to 4.9)
PR target/68483
* tree-vect-generic.c (lower_vec_perm): If VEC_PERM_EXPR
is valid vec_shr pattern, don't lower it even if can_vec_perm_p
returns false.
* optabs.c (shift_amt_for_vec_perm_mask): Return NULL_RTX
whenever first is nelt or above. Don't mask expected with
2 * nelt - 1.
* gcc.target/i386/pr68483-1.c: New test.
* gcc.target/i386/pr68483-2.c: New test.
From-SVN: r230797
Diffstat (limited to 'gcc')
-rw-r--r-- | gcc/ChangeLog | 10 | ||||
-rw-r--r-- | gcc/optabs.c | 4 | ||||
-rw-r--r-- | gcc/testsuite/ChangeLog | 6 | ||||
-rw-r--r-- | gcc/testsuite/gcc.target/i386/pr68483-1.c | 22 | ||||
-rw-r--r-- | gcc/testsuite/gcc.target/i386/pr68483-2.c | 15 | ||||
-rw-r--r-- | gcc/tree-vect-generic.c | 24 |
6 files changed, 79 insertions, 2 deletions
diff --git a/gcc/ChangeLog b/gcc/ChangeLog index d8a5872..d91c929 100644 --- a/gcc/ChangeLog +++ b/gcc/ChangeLog @@ -1,3 +1,13 @@ +2015-11-24 Jakub Jelinek <jakub@redhat.com> + + PR target/68483 + * tree-vect-generic.c (lower_vec_perm): If VEC_PERM_EXPR + is valid vec_shr pattern, don't lower it even if can_vec_perm_p + returns false. + * optabs.c (shift_amt_for_vec_perm_mask): Return NULL_RTX + whenever first is nelt or above. Don't mask expected with + 2 * nelt - 1. + 2015-11-24 Ilya Enkovich <enkovich.gnu@gmail.com> PR c/68337 diff --git a/gcc/optabs.c b/gcc/optabs.c index 5545302..40ef582 100644 --- a/gcc/optabs.c +++ b/gcc/optabs.c @@ -5232,12 +5232,12 @@ shift_amt_for_vec_perm_mask (rtx sel) return NULL_RTX; first = INTVAL (CONST_VECTOR_ELT (sel, 0)); - if (first >= 2*nelt) + if (first >= nelt) return NULL_RTX; for (i = 1; i < nelt; i++) { int idx = INTVAL (CONST_VECTOR_ELT (sel, i)); - unsigned int expected = (i + first) & (2 * nelt - 1); + unsigned int expected = i + first; /* Indices into the second vector are all equivalent. */ if (idx < 0 || (MIN (nelt, (unsigned) idx) != MIN (nelt, expected))) return NULL_RTX; diff --git a/gcc/testsuite/ChangeLog b/gcc/testsuite/ChangeLog index 6c98a6f..3c3e3cd 100644 --- a/gcc/testsuite/ChangeLog +++ b/gcc/testsuite/ChangeLog @@ -1,3 +1,9 @@ +2015-11-24 Jakub Jelinek <jakub@redhat.com> + + PR target/68483 + * gcc.target/i386/pr68483-1.c: New test. + * gcc.target/i386/pr68483-2.c: New test. + 2015-11-24 Ilya Enkovich <enkovich.gnu@gmail.com> PR c/68337 diff --git a/gcc/testsuite/gcc.target/i386/pr68483-1.c b/gcc/testsuite/gcc.target/i386/pr68483-1.c new file mode 100644 index 0000000..29787e9 --- /dev/null +++ b/gcc/testsuite/gcc.target/i386/pr68483-1.c @@ -0,0 +1,22 @@ +/* PR target/68483 */ +/* { dg-do compile } */ +/* { dg-options "-O2 -ftree-vectorize -msse2 -mno-sse3" } */ + +void +test (int *input, int *out, unsigned x1, unsigned x2) +{ + unsigned i, j; + unsigned end = x1; + + for (i = j = 0; i < 1000; i++) + { + int sum = 0; + end += x2; + for (; j < end; j++) + sum += input[j]; + out[i] = sum; + } +} + +/* { dg-final { scan-assembler "psrldq\[^\n\r]*(8,|, 8)" { target ia32 } } } */ +/* { dg-final { scan-assembler "psrldq\[^\n\r]*(4,|, 4)" { target ia32 } } } */ diff --git a/gcc/testsuite/gcc.target/i386/pr68483-2.c b/gcc/testsuite/gcc.target/i386/pr68483-2.c new file mode 100644 index 0000000..394dc1b --- /dev/null +++ b/gcc/testsuite/gcc.target/i386/pr68483-2.c @@ -0,0 +1,15 @@ +/* PR target/68483 */ +/* { dg-do compile } */ +/* { dg-options "-O2 -msse2 -mno-sse3" } */ + +typedef int V __attribute__((vector_size (16))); + +void +foo (V *a, V *b) +{ + V c = { 0, 0, 0, 0 }; + V d = { 1, 2, 3, 4 }; + *a = __builtin_shuffle (*b, c, d); +} + +/* { dg-final { scan-assembler "psrldq\[^\n\r]*(4,|, 4)" } } */ diff --git a/gcc/tree-vect-generic.c b/gcc/tree-vect-generic.c index af1af17..2c7adf7 100644 --- a/gcc/tree-vect-generic.c +++ b/gcc/tree-vect-generic.c @@ -1272,6 +1272,30 @@ lower_vec_perm (gimple_stmt_iterator *gsi) update_stmt (stmt); return; } + /* Also detect vec_shr pattern - VEC_PERM_EXPR with zero + vector as VEC1 and a right element shift MASK. */ + if (optab_handler (vec_shr_optab, TYPE_MODE (vect_type)) + != CODE_FOR_nothing + && TREE_CODE (vec1) == VECTOR_CST + && initializer_zerop (vec1) + && sel_int[0] + && sel_int[0] < elements) + { + for (i = 1; i < elements; ++i) + { + unsigned int expected = i + sel_int[0]; + /* Indices into the second vector are all equivalent. */ + if (MIN (elements, (unsigned) sel_int[i]) + != MIN (elements, expected)) + break; + } + if (i == elements) + { + gimple_assign_set_rhs3 (stmt, mask); + update_stmt (stmt); + return; + } + } } else if (can_vec_perm_p (TYPE_MODE (vect_type), true, NULL)) return; |