aboutsummaryrefslogtreecommitdiff
path: root/gcc
diff options
context:
space:
mode:
author Richard Sandiford <richard.sandiford@arm.com> 2021-12-17 14:18:39 +0000
committer Richard Sandiford <richard.sandiford@arm.com> 2021-12-17 14:18:39 +0000
commit e781cb93d7d908f1f4f1611d0034eccbd1478e91 (patch)
tree c4fe0953ca4dfa108c4b825fb73123b11e88ce85 /gcc
parent 7dca2ad64910ba4aeae8e1f373f4d4796702b42b (diff)
download gcc-e781cb93d7d908f1f4f1611d0034eccbd1478e91.zip
gcc-e781cb93d7d908f1f4f1611d0034eccbd1478e91.tar.gz
gcc-e781cb93d7d908f1f4f1611d0034eccbd1478e91.tar.bz2
vect: Fix multi-vector SLP gather loads [PR103744]
This PR shows that I didn't properly test the multi-vector case when
adding support for SLP gather loads.  The patch fixes that case using
the same approach as we do for non-SLP cases: keep the scalar base the
same, but iterate through the (also multi-vector) vector offsets.
"vec_num * j + i" is already used elsewhere as a way of handling both
the multi-vector SLP case and the multi-vector non-SLP case.

gcc/
	PR tree-optimization/103744
	* tree-vect-stmts.c (vectorizable_load): Handle multi-vector
	SLP gather loads.

gcc/testsuite/
	PR tree-optimization/103744
	* gcc.dg/vect/pr103744-1.c: New test.
	* gcc.dg/vect/pr103744-2.c: Likewise.
Diffstat (limited to 'gcc')
-rw-r--r-- gcc/testsuite/gcc.dg/vect/pr103744-1.c 20
-rw-r--r-- gcc/testsuite/gcc.dg/vect/pr103744-2.c 31
-rw-r--r-- gcc/tree-vect-stmts.c 6
3 files changed, 55 insertions, 2 deletions
diff --git a/gcc/testsuite/gcc.dg/vect/pr103744-1.c b/gcc/testsuite/gcc.dg/vect/pr103744-1.c
new file mode 100644
index 0000000..1bc81e2
--- /dev/null
+++ b/gcc/testsuite/gcc.dg/vect/pr103744-1.c
@@ -0,0 +1,20 @@
+/* { dg-do compile } */
+
+int r;
+
+void
+foo (short int *s, short int *d1, short int *d2, int z)
+{
+ int *a;
+
+ while (z < 1)
+ {
+ int i;
+
+ i = *s++ - (*d1++ + *d2++);
+ r += a[i];
+ i = *s++ - (*d1++ + *d2++);
+ r += a[i];
+ ++z;
+ }
+}
diff --git a/gcc/testsuite/gcc.dg/vect/pr103744-2.c b/gcc/testsuite/gcc.dg/vect/pr103744-2.c
new file mode 100644
index 0000000..52307ab
--- /dev/null
+++ b/gcc/testsuite/gcc.dg/vect/pr103744-2.c
@@ -0,0 +1,31 @@
+/* { dg-do compile } */
+
+int
+f1 (int *restrict x, unsigned short *restrict y)
+{
+ int res = 0;
+ for (int i = 0; i < 100; i += 2)
+ {
+ unsigned short i1 = y[i + 0] + 1;
+ unsigned short i2 = y[i + 1] + 2;
+ res += x[i1];
+ res += x[i2];
+ }
+ return res;
+}
+
+void
+f2 (int *restrict x, unsigned short *restrict y)
+{
+ int res1 = 0;
+ int res2 = 0;
+ for (int i = 0; i < 100; i += 2)
+ {
+ unsigned short i1 = y[i + 0] + 1;
+ unsigned short i2 = y[i + 1] + 2;
+ res1 += x[i1];
+ res2 += x[i2];
+ }
+ x[0] = res1;
+ x[1] = res2;
+}
diff --git a/gcc/tree-vect-stmts.c b/gcc/tree-vect-stmts.c
index ad90cdb..c842d50 100644
--- a/gcc/tree-vect-stmts.c
+++ b/gcc/tree-vect-stmts.c
@@ -9249,6 +9249,8 @@ vectorizable_load (vec_info *vinfo,
group_size = vec_num = 1;
group_gap_adj = 0;
ref_type = reference_alias_ptr_type (DR_REF (first_dr_info->dr));
+ if (slp)
+ vec_num = SLP_TREE_NUMBER_OF_VEC_STMTS (slp_node);
}
gcc_assert (alignment_support_scheme);
@@ -9594,7 +9596,7 @@ vectorizable_load (vec_info *vinfo,
final_mask = prepare_vec_mask (loop_vinfo, mask_vectype,
final_mask, vec_mask, gsi);
- if (i > 0)
+ if (i > 0 && !STMT_VINFO_GATHER_SCATTER_P (stmt_info))
dataref_ptr = bump_vector_ptr (vinfo, dataref_ptr, ptr_incr,
gsi, stmt_info, bump);
@@ -9611,7 +9613,7 @@ vectorizable_load (vec_info *vinfo,
&& gs_info.ifn != IFN_LAST)
{
if (STMT_VINFO_GATHER_SCATTER_P (stmt_info))
- vec_offset = vec_offsets[j];
+ vec_offset = vec_offsets[vec_num * j + i];
tree zero = build_zero_cst (vectype);
tree scale = size_int (gs_info.scale);
gcall *call;