aboutsummaryrefslogtreecommitdiff
path: root/gcc/tree-vect-loop.c
diff options
context:
space:
mode:
author: Richard Biener <rguenther@suse.de> 2021-08-23 13:37:41 +0200
committer: Richard Biener <rguenther@suse.de> 2021-08-23 14:28:54 +0200
commit: 12dc8ab983db039a570e3798b468498e2230c7d9 (patch)
tree: ecac15d26a768770a2701fee977df8001a7d55aa /gcc/tree-vect-loop.c
parent: 537878152ded8b7d271333b803b36c27a9aea8d2 (diff)
download: gcc-12dc8ab983db039a570e3798b468498e2230c7d9.zip
gcc-12dc8ab983db039a570e3798b468498e2230c7d9.tar.gz
gcc-12dc8ab983db039a570e3798b468498e2230c7d9.tar.bz2
Fix scalar costing issue introduced by PR84512 fix.
This fixes double-scaling of the inner loop scalar cost caused by
routing the scalar costs through the add_stmt_cost hook and using
vect_body as the location.  The issue makes almost every outer loop
vectorization profitable.

2021-08-23  Richard Biener  <rguenther@suse.de>

	* tree-vect-loop.c (vect_compute_single_scalar_iteration_cost):
	Properly scale the inner loop cost only once.
Diffstat (limited to 'gcc/tree-vect-loop.c')
-rw-r--r-- gcc/tree-vect-loop.c | 12
1 file changed, 8 insertions, 4 deletions
diff --git a/gcc/tree-vect-loop.c b/gcc/tree-vect-loop.c
index 995d143..c521b43a 100644
--- a/gcc/tree-vect-loop.c
+++ b/gcc/tree-vect-loop.c
@@ -1284,6 +1284,8 @@ vect_compute_single_scalar_iteration_cost (loop_vec_info loop_vinfo)
else
kind = scalar_stmt;
+ /* We are using vect_prologue here to avoid scaling twice
+ by the inner loop factor. */
record_stmt_cost (&LOOP_VINFO_SCALAR_ITERATION_COST (loop_vinfo),
factor, kind, stmt_info, 0, vect_prologue);
}
@@ -1297,11 +1299,13 @@ vect_compute_single_scalar_iteration_cost (loop_vec_info loop_vinfo)
j, si)
(void) add_stmt_cost (loop_vinfo, target_cost_data, si->count,
si->kind, si->stmt_info, si->vectype,
- si->misalign, vect_body);
- unsigned dummy, body_cost = 0;
- finish_cost (target_cost_data, &dummy, &body_cost, &dummy);
+ si->misalign, si->where);
+ unsigned prologue_cost = 0, body_cost = 0, epilogue_cost = 0;
+ finish_cost (target_cost_data, &prologue_cost, &body_cost,
+ &epilogue_cost);
destroy_cost_data (target_cost_data);
- LOOP_VINFO_SINGLE_SCALAR_ITERATION_COST (loop_vinfo) = body_cost;
+ LOOP_VINFO_SINGLE_SCALAR_ITERATION_COST (loop_vinfo)
+ = prologue_cost + body_cost + epilogue_cost;
}