diff options
author | Richard Biener <rguenther@suse.de> | 2023-06-28 10:16:57 +0200 |
---|---|---|
committer | Richard Biener <rguenther@suse.de> | 2023-06-28 11:09:53 +0200 |
commit | 51c8cbc6bba387f953d9be48c4a4c8b657dd54a5 (patch) | |
tree | 2d3495b8ed7b8570a6b85c769c47add0a9e2471e /gcc | |
parent | 1554ab958afd4f4a94f776f3a7a03b40918bf424 (diff) | |
download | gcc-51c8cbc6bba387f953d9be48c4a4c8b657dd54a5.zip gcc-51c8cbc6bba387f953d9be48c4a4c8b657dd54a5.tar.gz gcc-51c8cbc6bba387f953d9be48c4a4c8b657dd54a5.tar.bz2 |
tree-optimization/110443 - prevent SLP splat of gathers
The following prevents non-grouped load SLP in case the element
to splat is from a gather operation. While it should be possible
to support this it is not similar to the single element interleaving
case I was trying to mimic here.
PR tree-optimization/110443
* tree-vect-slp.cc (vect_build_slp_tree_1): Reject non-grouped
gather loads.
* gcc.dg/torture/pr110443.c: New testcase.
Diffstat (limited to 'gcc')
-rw-r--r-- | gcc/testsuite/gcc.dg/torture/pr110443.c | 21 | ||||
-rw-r--r-- | gcc/tree-vect-slp.cc | 3 |
2 files changed, 23 insertions, 1 deletions
diff --git a/gcc/testsuite/gcc.dg/torture/pr110443.c b/gcc/testsuite/gcc.dg/torture/pr110443.c new file mode 100644 index 0000000..61cf705 --- /dev/null +++ b/gcc/testsuite/gcc.dg/torture/pr110443.c @@ -0,0 +1,21 @@ +/* { dg-do compile } */ + +typedef struct { + float real; + float imag; +} complex_t; +extern unsigned char fftorder[]; +float *a52_imdct_256_data; +int a52_imdct_256_i, a52_imdct_256_k; +float a52_imdct_256_b_r; +void a52_imdct_256() +{ + complex_t buf1[64]; + a52_imdct_256_i = 0; + for (; a52_imdct_256_i < 64; a52_imdct_256_i++) { + a52_imdct_256_k = fftorder[a52_imdct_256_i]; + buf1[a52_imdct_256_i].real = buf1[a52_imdct_256_i].imag = + a52_imdct_256_data[a52_imdct_256_k]; + } + a52_imdct_256_b_r = buf1[0].real * buf1[0].imag; +} diff --git a/gcc/tree-vect-slp.cc b/gcc/tree-vect-slp.cc index 8cb1ac1..355d078 100644 --- a/gcc/tree-vect-slp.cc +++ b/gcc/tree-vect-slp.cc @@ -1291,7 +1291,8 @@ vect_build_slp_tree_1 (vec_info *vinfo, unsigned char *swap, vectorization. For loop vectorization we can handle splats the same we handle single element interleaving. */ && (is_a <bb_vec_info> (vinfo) - || stmt_info != first_stmt_info)) + || stmt_info != first_stmt_info + || STMT_VINFO_GATHER_SCATTER_P (stmt_info))) { /* Not grouped load. */ if (dump_enabled_p ()) |