aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorRichard Biener <rguenther@suse.de>2021-01-11 11:47:46 +0100
committerRichard Biener <rguenther@suse.de>2021-01-11 12:50:59 +0100
commit04bff1bbfc11a974342c0eb0c0d65d902e36e82e (patch)
treee5e388be69a634533336b93b76bd982451162442
parent928e96bbe98bafff18f11a7351cf89592967b061 (diff)
downloadgcc-04bff1bbfc11a974342c0eb0c0d65d902e36e82e.zip
gcc-04bff1bbfc11a974342c0eb0c0d65d902e36e82e.tar.gz
gcc-04bff1bbfc11a974342c0eb0c0d65d902e36e82e.tar.bz2
tree-optimization/98526 - fix vectorizer reduction cost
This fixes a double-counting in the reduction cost when vectorizing the reduction through the regular vectorizable_* functions. 2021-01-11 Richard Biener <rguenther@suse.de> PR tree-optimization/98526 * tree-vect-loop.c (vect_model_reduction_cost): Remove costing of the actual reduction op for the regular case. (vectorizable_reduction): Cost the stmts vect_transform_reduction produces here.
-rw-r--r--gcc/tree-vect-loop.c17
1 files changed, 11 insertions, 6 deletions
diff --git a/gcc/tree-vect-loop.c b/gcc/tree-vect-loop.c
index 965cc16..acfd195 100644
--- a/gcc/tree-vect-loop.c
+++ b/gcc/tree-vect-loop.c
@@ -4452,8 +4452,8 @@ have_whole_vector_shift (machine_mode mode)
/* Function vect_model_reduction_cost.
Models cost for a reduction operation, including the vector ops
- generated within the strip-mine loop, the initial definition before
- the loop, and the epilogue code that must be generated. */
+ generated within the strip-mine loop in some cases, the initial
+ definition before the loop, and the epilogue code that must be generated. */
static void
vect_model_reduction_cost (loop_vec_info loop_vinfo,
@@ -4516,10 +4516,6 @@ vect_model_reduction_cost (loop_vec_info loop_vinfo,
prologue_cost += record_stmt_cost (cost_vec, prologue_stmts,
scalar_to_vec, stmt_info, 0,
vect_prologue);
-
- /* Cost of reduction op inside loop. */
- inside_cost = record_stmt_cost (cost_vec, ncopies, vector_stmt,
- stmt_info, 0, vect_body);
}
/* Determine cost of epilogue code.
@@ -7268,6 +7264,15 @@ vectorizable_reduction (loop_vec_info loop_vinfo,
vect_model_reduction_cost (loop_vinfo, stmt_info, reduc_fn,
reduction_type, ncopies, cost_vec);
+ /* Cost the reduction op inside the loop if transformed via
+ vect_transform_reduction. Otherwise this is costed by the
+ separate vectorizable_* routines. */
+ if (single_defuse_cycle
+ || code == DOT_PROD_EXPR
+ || code == WIDEN_SUM_EXPR
+ || code == SAD_EXPR)
+ record_stmt_cost (cost_vec, ncopies, vector_stmt, stmt_info, 0, vect_body);
+
if (dump_enabled_p ()
&& reduction_type == FOLD_LEFT_REDUCTION)
dump_printf_loc (MSG_NOTE, vect_location,