aboutsummaryrefslogtreecommitdiff
path: root/gcc
diff options
context:
space:
mode:
authorliuhongt <hongtao.liu@intel.com>2022-09-20 13:22:28 +0800
committerliuhongt <hongtao.liu@intel.com>2022-09-21 15:47:40 +0800
commiteddbb81f1254f025d6f1b6b8e7554aa9a3830302 (patch)
treeea3ffbd47d9f494816bfbd1d28f317216bd5f5d3 /gcc
parent9c23fe08c1fcee524503b24e15321b20df136f6c (diff)
downloadgcc-eddbb81f1254f025d6f1b6b8e7554aa9a3830302.zip
gcc-eddbb81f1254f025d6f1b6b8e7554aa9a3830302.tar.gz
gcc-eddbb81f1254f025d6f1b6b8e7554aa9a3830302.tar.bz2
Don't check can_vec_perm_const_p for nonlinear iv_init when it's constant.
When init_expr is INTEGER_CST or REAL_CST, can_vec_perm_const_p is not necessary since there's no real vec_perm needed, but vect_gen_perm_mask_checked will gcc_assert (can_vec_perm_const_p). So it's better to use vect_gen_perm_mask_any in vect_create_nonlinear_iv_init. gcc/ChangeLog: PR tree-optimization/106963 * tree-vect-loop.cc (vect_create_nonlinear_iv_init): Use vect_gen_perm_mask_any instead of vect_gen_perm_mask_checked. gcc/testsuite/ChangeLog: * gcc.target/i386/pr106963.c: New test.
Diffstat (limited to 'gcc')
-rw-r--r--gcc/testsuite/gcc.target/i386/pr106963.c14
-rw-r--r--gcc/tree-vect-loop.cc5
2 files changed, 18 insertions, 1 deletions
diff --git a/gcc/testsuite/gcc.target/i386/pr106963.c b/gcc/testsuite/gcc.target/i386/pr106963.c
new file mode 100644
index 0000000..9f2d20e
--- /dev/null
+++ b/gcc/testsuite/gcc.target/i386/pr106963.c
@@ -0,0 +1,14 @@
+/* { dg-do compile } */
+/* { dg-options "-O2 -mavx -mno-avx2" } */
+
+void
+foo_neg_const (int *a) /* Store b into a[0..999], negating b after each store.  */
+{
+ int i, b = 1; /* b starts as the constant 1.  */
+
+ for (i = 0; i < 1000; i++)
+ {
+ a[i] = b;
+ b = -b; /* Sign flips every iteration: 1, -1, 1, ...  */
+ }
+}
diff --git a/gcc/tree-vect-loop.cc b/gcc/tree-vect-loop.cc
index 9c434b6..aabdc6f 100644
--- a/gcc/tree-vect-loop.cc
+++ b/gcc/tree-vect-loop.cc
@@ -8356,8 +8356,11 @@ vect_create_nonlinear_iv_init (gimple_seq* stmts, tree init_expr,
sel[2 * i + 1] = i + nunits;
}
vec_perm_indices indices (sel, 2, nunits);
+ /* Don't use vect_gen_perm_mask_checked since can_vec_perm_const_p may
+ fail when vec_init is const vector. In that situation vec_perm is not
+ really needed. */
tree perm_mask_even
- = vect_gen_perm_mask_checked (vectype, indices);
+ = vect_gen_perm_mask_any (vectype, indices);
vec_init = gimple_build (stmts, VEC_PERM_EXPR,
vectype,
vec_init, vec_neg,