diff options
author | Richard Biener <rguenther@suse.de> | 2024-03-05 15:28:58 +0100 |
---|---|---|
committer | Richard Biener <rguenther@suse.de> | 2024-06-06 08:55:56 +0200 |
commit | 2ee41ef76a99ef5a8b62b351e2c01dad93f51b18 (patch) | |
tree | ac33e2cdc48cf43b7d00b94861121ddfe66527b2 /gcc/tree-vect-loop.cc | |
parent | 202a9c8fe7db9dd94e5a77f42e54ef3d966f88e8 (diff) | |
download | gcc-2ee41ef76a99ef5a8b62b351e2c01dad93f51b18.zip gcc-2ee41ef76a99ef5a8b62b351e2c01dad93f51b18.tar.gz gcc-2ee41ef76a99ef5a8b62b351e2c01dad93f51b18.tar.bz2 |
Add double reduction support for SLP vectorization
The following makes double reduction vectorization work when
using (single-lane) SLP vectorization.
* tree-vect-loop.cc (vect_analyze_scalar_cycles_1): Queue
double reductions in LOOP_VINFO_REDUCTIONS.
(vect_create_epilog_for_reduction): Remove asserts disabling
SLP for double reductions.
(vectorizable_reduction): Analyze SLP double reductions
only once and start off the correct places.
* tree-vect-slp.cc (vect_get_and_check_slp_defs): Allow
vect_double_reduction_def.
(vect_build_slp_tree_2): Fix condition for the ignored
reduction initial values.
* tree-vect-stmts.cc (vect_analyze_stmt): Allow
vect_double_reduction_def.
Diffstat (limited to 'gcc/tree-vect-loop.cc')
-rw-r--r-- | gcc/tree-vect-loop.cc | 35 |
1 files changed, 25 insertions, 10 deletions
diff --git a/gcc/tree-vect-loop.cc b/gcc/tree-vect-loop.cc index ccd6ace..b9e8e9b 100644 --- a/gcc/tree-vect-loop.cc +++ b/gcc/tree-vect-loop.cc @@ -685,6 +685,8 @@ vect_analyze_scalar_cycles_1 (loop_vec_info loop_vinfo, class loop *loop, STMT_VINFO_DEF_TYPE (stmt_vinfo) = vect_double_reduction_def; STMT_VINFO_DEF_TYPE (reduc_stmt_info) = vect_double_reduction_def; + /* Make it accessible for SLP vectorization. */ + LOOP_VINFO_REDUCTIONS (loop_vinfo).safe_push (reduc_stmt_info); } else { @@ -5975,7 +5977,6 @@ vect_create_epilog_for_reduction (loop_vec_info loop_vinfo, stmt_vec_info rdef_info = stmt_info; if (STMT_VINFO_DEF_TYPE (stmt_info) == vect_double_reduction_def) { - gcc_assert (!slp_node); double_reduc = true; stmt_info = loop_vinfo->lookup_def (gimple_phi_arg_def (stmt_info->stmt, 0)); @@ -6020,7 +6021,7 @@ vect_create_epilog_for_reduction (loop_vec_info loop_vinfo, { outer_loop = loop; loop = loop->inner; - gcc_assert (!slp_node && double_reduc); + gcc_assert (double_reduc); } vectype = STMT_VINFO_REDUC_VECTYPE (reduc_info); @@ -6035,7 +6036,7 @@ vect_create_epilog_for_reduction (loop_vec_info loop_vinfo, for induc_val, use initial_def. */ if (STMT_VINFO_REDUC_TYPE (reduc_info) == INTEGER_INDUC_COND_REDUCTION) induc_val = STMT_VINFO_VEC_INDUC_COND_INITIAL_VAL (reduc_info); - /* ??? Coverage for double_reduc and 'else' isn't clear. */ + /* ??? Coverage for 'else' isn't clear. */ } else { @@ -7605,15 +7606,16 @@ vectorizable_reduction (loop_vec_info loop_vinfo, STMT_VINFO_TYPE (stmt_info) = reduc_vec_info_type; return true; } - if (slp_node) - { - slp_node_instance->reduc_phis = slp_node; - /* ??? We're leaving slp_node to point to the PHIs, we only - need it to get at the number of vector stmts which wasn't - yet initialized for the instance root. */ - } if (STMT_VINFO_DEF_TYPE (stmt_info) == vect_double_reduction_def) { + if (gimple_bb (stmt_info->stmt) != loop->header) + { + /* For SLP we arrive here for both the inner loop LC PHI and + the outer loop PHI. The latter is what we want to analyze + the reduction with. */ + gcc_assert (slp_node); + return true; + } use_operand_p use_p; gimple *use_stmt; bool res = single_imm_use (gimple_phi_result (stmt_info->stmt), @@ -7622,6 +7624,14 @@ vectorizable_reduction (loop_vec_info loop_vinfo, phi_info = loop_vinfo->lookup_stmt (use_stmt); } + if (slp_node) + { + slp_node_instance->reduc_phis = slp_node; + /* ??? We're leaving slp_node to point to the PHIs, we only + need it to get at the number of vector stmts which wasn't + yet initialized for the instance root. */ + } + /* PHIs should not participate in patterns. */ gcc_assert (!STMT_VINFO_RELATED_STMT (phi_info)); gphi *reduc_def_phi = as_a <gphi *> (phi_info->stmt); @@ -7637,6 +7647,11 @@ vectorizable_reduction (loop_vec_info loop_vinfo, bool only_slp_reduc_chain = true; stmt_info = NULL; slp_tree slp_for_stmt_info = slp_node ? slp_node_instance->root : NULL; + /* For double-reductions we start SLP analysis at the inner loop LC PHI + which is the def of the outer loop live stmt. */ + if (STMT_VINFO_DEF_TYPE (reduc_info) == vect_double_reduction_def + && slp_node) + slp_for_stmt_info = SLP_TREE_CHILDREN (slp_for_stmt_info)[0]; while (reduc_def != PHI_RESULT (reduc_def_phi)) { stmt_vec_info def = loop_vinfo->lookup_def (reduc_def); |