aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorRichard Biener <rguenther@suse.de>2025-02-07 08:46:31 +0100
committerRichard Biener <rguenth@gcc.gnu.org>2025-02-07 13:39:58 +0100
commit4931a637479aba35e35c50a86f58ecd6262bc487 (patch)
treeda27a0927dcfccf0714efcdf50180df2163d8e0c
parent6aa3329b3430c6362ddf51e403d147e0b10d7401 (diff)
downloadgcc-4931a637479aba35e35c50a86f58ecd6262bc487.zip
gcc-4931a637479aba35e35c50a86f58ecd6262bc487.tar.gz
gcc-4931a637479aba35e35c50a86f58ecd6262bc487.tar.bz2
tree-optimization/115538 - possible wrong-code with SLP conversion
The following fixes a latent issue where we use ranges to verify correctness of a vector conversion optimization. We rely on ranges from 'op0' which for SLP is extracted from the representative stmt which does not necessarily correspond to any actual scalar operation. We also do not verify the range of all scalar lanes in the SLP operand match. The following rectifies this, restricting the support to single-lane SLP nodes at this point - on branches we'd simply not perform this optimization with SLP. PR tree-optimization/115538 * tree-vectorizer.h (vect_get_slp_scalar_def): Declare. * tree-vect-slp.cc (vect_get_slp_scalar_def): New helper. * tree-vect-generic.cc (expand_vector_conversion): Adjust. * tree-vect-stmts.cc (vectorizable_conversion): For SLP correctly look at ranges of the scalar defs of the SLP operand. (supportable_indirect_convert_operation): Likewise.
-rw-r--r--gcc/tree-vect-generic.cc6
-rw-r--r--gcc/tree-vect-slp.cc19
-rw-r--r--gcc/tree-vect-stmts.cc38
-rw-r--r--gcc/tree-vectorizer.h4
4 files changed, 52 insertions, 15 deletions
diff --git a/gcc/tree-vect-generic.cc b/gcc/tree-vect-generic.cc
index c2f7a29..173ebd9 100644
--- a/gcc/tree-vect-generic.cc
+++ b/gcc/tree-vect-generic.cc
@@ -1755,10 +1755,8 @@ expand_vector_conversion (gimple_stmt_iterator *gsi)
modifier = WIDEN;
auto_vec<std::pair<tree, tree_code> > converts;
- if (supportable_indirect_convert_operation (code,
- ret_type, arg_type,
- converts,
- arg))
+ if (supportable_indirect_convert_operation (code, ret_type, arg_type,
+ converts))
{
new_rhs = arg;
for (unsigned int i = 0; i < converts.length () - 1; i++)
diff --git a/gcc/tree-vect-slp.cc b/gcc/tree-vect-slp.cc
index ac17330..8ed746e 100644
--- a/gcc/tree-vect-slp.cc
+++ b/gcc/tree-vect-slp.cc
@@ -10199,6 +10199,25 @@ vect_create_constant_vectors (vec_info *vinfo, slp_tree op_node)
SLP_TREE_VEC_DEFS (op_node).quick_push (vop);
}
+/* Get the scalar definition of the Nth lane from SLP_NODE or NULL_TREE
+ if there is no definition for it in the scalar IL or it is not known. */
+
+tree
+vect_get_slp_scalar_def (slp_tree slp_node, unsigned n)
+{
+ if (SLP_TREE_DEF_TYPE (slp_node) == vect_internal_def)
+ {
+ if (!SLP_TREE_SCALAR_STMTS (slp_node).exists ())
+ return NULL_TREE;
+ stmt_vec_info def = SLP_TREE_SCALAR_STMTS (slp_node)[n];
+ if (!def)
+ return NULL_TREE;
+ return gimple_get_lhs (STMT_VINFO_STMT (def));
+ }
+ else
+ return SLP_TREE_SCALAR_OPS (slp_node)[n];
+}
+
/* Get the Ith vectorized definition from SLP_NODE. */
tree
diff --git a/gcc/tree-vect-stmts.cc b/gcc/tree-vect-stmts.cc
index 1b639ae..6bbb16b 100644
--- a/gcc/tree-vect-stmts.cc
+++ b/gcc/tree-vect-stmts.cc
@@ -5610,10 +5610,8 @@ vectorizable_conversion (vec_info *vinfo,
return false;
gcc_assert (code.is_tree_code ());
if (supportable_indirect_convert_operation (code,
- vectype_out,
- vectype_in,
- converts,
- op0))
+ vectype_out, vectype_in,
+ converts, op0, slp_op0))
{
gcc_assert (converts.length () <= 2);
if (converts.length () == 1)
@@ -5750,7 +5748,16 @@ vectorizable_conversion (vec_info *vinfo,
else if (code == FLOAT_EXPR)
{
wide_int op_min_value, op_max_value;
- if (!vect_get_range_info (op0, &op_min_value, &op_max_value))
+ if (slp_node)
+ {
+ tree def;
+ /* ??? Merge ranges in case of more than one lane. */
+ if (SLP_TREE_LANES (slp_op0) != 1
+ || !(def = vect_get_slp_scalar_def (slp_op0, 0))
+ || !vect_get_range_info (def, &op_min_value, &op_max_value))
+ goto unsupported;
+ }
+ else if (!vect_get_range_info (op0, &op_min_value, &op_max_value))
goto unsupported;
cvt_type
@@ -15197,7 +15204,7 @@ supportable_indirect_convert_operation (code_helper code,
tree vectype_out,
tree vectype_in,
vec<std::pair<tree, tree_code> > &converts,
- tree op0)
+ tree op0, slp_tree slp_op0)
{
bool found_mode = false;
scalar_mode lhs_mode = GET_MODE_INNER (TYPE_MODE (vectype_out));
@@ -15269,10 +15276,21 @@ supportable_indirect_convert_operation (code_helper code,
In the future, if it is supported, changes may need to be made
to this part, such as checking the RANGE of each element
in the vector. */
- if (TREE_CODE (op0) != SSA_NAME
- || !SSA_NAME_RANGE_INFO (op0)
- || !vect_get_range_info (op0, &op_min_value,
- &op_max_value))
+ if (slp_op0)
+ {
+ tree def;
+ /* ??? Merge ranges in case of more than one lane. */
+ if (SLP_TREE_LANES (slp_op0) != 1
+ || !(def = vect_get_slp_scalar_def (slp_op0, 0))
+ || !vect_get_range_info (def,
+ &op_min_value, &op_max_value))
+ break;
+ }
+ else if (!op0
+ || TREE_CODE (op0) != SSA_NAME
+ || !SSA_NAME_RANGE_INFO (op0)
+ || !vect_get_range_info (op0, &op_min_value,
+ &op_max_value))
break;
if (cvt_type == NULL_TREE
diff --git a/gcc/tree-vectorizer.h b/gcc/tree-vectorizer.h
index 44d3a1d..b0cb081 100644
--- a/gcc/tree-vectorizer.h
+++ b/gcc/tree-vectorizer.h
@@ -2345,7 +2345,8 @@ extern bool supportable_narrowing_operation (code_helper, tree, tree,
extern bool supportable_indirect_convert_operation (code_helper,
tree, tree,
vec<std::pair<tree, tree_code> > &,
- tree = NULL_TREE);
+ tree = NULL_TREE,
+ slp_tree = NULL);
extern int compare_step_with_zero (vec_info *, stmt_vec_info);
extern unsigned record_stmt_cost (stmt_vector_for_cost *, int,
@@ -2598,6 +2599,7 @@ extern bool vect_make_slp_decision (loop_vec_info);
extern void vect_detect_hybrid_slp (loop_vec_info);
extern void vect_optimize_slp (vec_info *);
extern void vect_gather_slp_loads (vec_info *);
+extern tree vect_get_slp_scalar_def (slp_tree, unsigned);
extern void vect_get_slp_defs (slp_tree, vec<tree> *);
extern void vect_get_slp_defs (vec_info *, slp_tree, vec<vec<tree> > *,
unsigned n = -1U);