aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorRichard Biener <rguenther@suse.de>2023-08-24 10:30:12 +0200
committerRichard Biener <rguenther@suse.de>2023-08-24 11:35:15 +0200
commite80f7c13f64e10c6a3354c5d6b42da60b21ed0b8 (patch)
tree4f43152b353354d1c421f575a3eaed91c4a132bf
parentaa81e80a5ae663f169496c580ba30ae281c83940 (diff)
downloadgcc-e80f7c13f64e10c6a3354c5d6b42da60b21ed0b8.zip
gcc-e80f7c13f64e10c6a3354c5d6b42da60b21ed0b8.tar.gz
gcc-e80f7c13f64e10c6a3354c5d6b42da60b21ed0b8.tar.bz2
tree-optimization/111125 - properly cost BB reduction remain stmt handling
We assume that all root stmts which compose the total reduction chain are vectorized but fail to account for the cost of adding back the scalar defs we are not vectorizing. The following rectifies this, fixing the gcc.dg/tree-ssa/slsr-11.c FAIL on aarch64. PR tree-optimization/111125 * tree-vect-slp.cc (vectorizable_bb_reduc_epilogue): Account for the remain_defs processing.
-rw-r--r--gcc/tree-vect-slp.cc5
1 files changed, 5 insertions, 0 deletions
diff --git a/gcc/tree-vect-slp.cc b/gcc/tree-vect-slp.cc
index b5f9333..0bcc530 100644
--- a/gcc/tree-vect-slp.cc
+++ b/gcc/tree-vect-slp.cc
@@ -6406,6 +6406,11 @@ vectorizable_bb_reduc_epilogue (slp_instance instance,
vectype, 0, vect_body);
record_stmt_cost (cost_vec, 1, vec_to_scalar, instance->root_stmts[0],
vectype, 0, vect_body);
+
+ /* Since we replace all stmts of a possibly longer scalar reduction
+ chain account for the extra scalar stmts for that. */
+ record_stmt_cost (cost_vec, instance->remain_defs.length (), scalar_stmt,
+ instance->root_stmts[0], 0, vect_body);
return true;
}