aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorHonza <jh@ryzen4.suse.cz>2023-07-28 19:39:19 +0200
committerHonza <jh@ryzen4.suse.cz>2023-07-28 19:39:19 +0200
commit88618fa0211d77d91b70f7af9b02e08a34b57912 (patch)
treecfd1053672c124cdf0613e618201b8f1a3f65280
parentfdbb0863b6111ad3f45b79f47ebfe471555b2c4a (diff)
downloadgcc-88618fa0211d77d91b70f7af9b02e08a34b57912.zip
gcc-88618fa0211d77d91b70f7af9b02e08a34b57912.tar.gz
gcc-88618fa0211d77d91b70f7af9b02e08a34b57912.tar.bz2
Cleanup profile updating code in unrolling and splitting
I have noticed that for all these three cases I need same update of loop exit probability. While my earlier patch unified it for unrollers, this patch makes it more general and also simplifies tree-ssa-loop-split.cc. I also refactored the code, since with all the special cases for corrupted profile it gets relatively long. I now also handle multiple loop exits in RTL unroller. Bootstrapped/regtested x86_64-linux, comitted. gcc/ChangeLog: * cfgloopmanip.cc (loop_count_in): Break out from ... (loop_exit_for_scaling): Break out from ... (update_loop_exit_probability_scale_dom_bbs): Break out from ...; add more sanity check and debug info. (scale_loop_profile): ... here. (create_empty_loop_on_edge): Fix whitespac. * cfgloopmanip.h (update_loop_exit_probability_scale_dom_bbs): Declare. * loop-unroll.cc (unroll_loop_constant_iterations): Use update_loop_exit_probability_scale_dom_bbs. * tree-ssa-loop-manip.cc (update_exit_probability_after_unrolling): Remove. (tree_transform_and_unroll_loop): Use update_loop_exit_probability_scale_dom_bbs. * tree-ssa-loop-split.cc (split_loop): Use update_loop_exit_probability_scale_dom_bbs.
-rw-r--r--gcc/cfgloopmanip.cc276
-rw-r--r--gcc/cfgloopmanip.h3
-rw-r--r--gcc/loop-unroll.cc8
-rw-r--r--gcc/tree-ssa-loop-manip.cc30
-rw-r--r--gcc/tree-ssa-loop-split.cc45
5 files changed, 199 insertions, 163 deletions
diff --git a/gcc/cfgloopmanip.cc b/gcc/cfgloopmanip.cc
index c3d292d..fe452ec 100644
--- a/gcc/cfgloopmanip.cc
+++ b/gcc/cfgloopmanip.cc
@@ -525,6 +525,184 @@ scale_dominated_blocks_in_loop (class loop *loop, basic_block bb,
}
}
+/* Compute how many times loop is entered. */
+
+profile_count
+loop_count_in (class loop *loop)
+{
+ /* Compute number of invocations of the loop. */
+ profile_count count_in = profile_count::zero ();
+ edge e;
+ edge_iterator ei;
+ bool found_latch = false;
+
+ if (loops_state_satisfies_p (LOOPS_MAY_HAVE_MULTIPLE_LATCHES))
+ FOR_EACH_EDGE (e, ei, loop->header->preds)
+ if (!flow_bb_inside_loop_p (loop, e->src))
+ count_in += e->count ();
+ else
+ found_latch = true;
+ else
+ FOR_EACH_EDGE (e, ei, loop->header->preds)
+ if (e->src != loop->latch)
+ count_in += e->count ();
+ else
+ found_latch = true;
+ gcc_checking_assert (found_latch);
+ return count_in;
+}
+
+/* Return exit that suitable for update when loop iterations
+ changed. */
+
+static edge
+loop_exit_for_scaling (class loop *loop)
+{
+ edge exit_edge = single_exit (loop);
+ if (!exit_edge)
+ {
+ auto_vec<edge> exits = get_loop_exit_edges (loop);
+ exit_edge = single_likely_exit (loop, exits);
+ }
+ return exit_edge;
+}
+
+/* Assume that loop's entry count and profile up to a given EXIT_EDGE is
+ consistent. Update exit probability so loop exists with PROFILE_COUNT
+ and rescale profile of basic blocks inside loop dominated by EXIT_EDGE->src.
+
+ This is useful after number of iteraitons of loop has changed.
+ If EXIT_EDGE is NULL, the function will try to identify suitable exit.
+ If DESIRED_COUNT is NULL, loop entry count will be used.
+ In consistent profile usually loop exists as many times as it is entred.
+
+ Return updated exit if successfull and NULL otherwise. */
+
+edge
+update_loop_exit_probability_scale_dom_bbs (class loop *loop,
+ edge exit_edge,
+ profile_count desired_count)
+{
+ if (!exit_edge)
+ exit_edge = loop_exit_for_scaling (loop);
+ if (!exit_edge)
+ {
+ if (dump_file && (dump_flags & TDF_DETAILS))
+ {
+ fprintf (dump_file, ";; Not updating exit probability of loop %i;"
+ " it has no single exit\n",
+ loop->num);
+ }
+ return NULL;
+ }
+ /* If exit is inside another loop, adjusting its probability will also
+ adjust number of the inner loop iterations. Just do noting for now. */
+ if (!just_once_each_iteration_p (loop, exit_edge->src))
+ {
+ if (dump_file && (dump_flags & TDF_DETAILS))
+ {
+ fprintf (dump_file, ";; Not updating exit probability of loop %i;"
+ " exit is inside inner loop\n",
+ loop->num);
+ }
+ return NULL;
+ }
+ /* Normal loops exit as many times as they are entered. */
+ if (!desired_count.initialized_p ())
+ desired_count = loop_count_in (loop);
+ /* See if everything is already perfect. */
+ if (desired_count == exit_edge->count ())
+ return exit_edge;
+ profile_count old_exit_count = exit_edge->count ();
+ /* See if update is possible.
+ Avoid turning probability to 0 or 1 just trying to reach impossible
+ value.
+
+ Natural profile update after some loop will happily scale header count to
+ be less than count of entering the loop. This is bad idea and they should
+ special case maybe_flat_loop_profile.
+
+ It may also happen that the source basic block of the exit edge is
+ inside in-loop condition:
+
+ +-> header
+ | |
+ | B1
+ | / \
+ | | B2--exit_edge-->
+ | \ /
+ | B3
+ +__/
+
+ If B2 count is smaller than desired exit edge count
+ the profile was inconsistent with the newly discovered upper bound.
+ Probablity of edge B1->B2 is too low. We do not attempt to fix
+ that (as it is hard in general). */
+ if (desired_count > exit_edge->src->count
+ && exit_edge->src->count.differs_from_p (desired_count))
+ {
+ if (dump_file)
+ {
+ fprintf (dump_file, ";; Source bb of loop %i has count ",
+ loop->num);
+ exit_edge->src->count.dump (dump_file, cfun);
+ fprintf (dump_file,
+ " which is smaller then desired count of exitting loop ");
+ desired_count.dump (dump_file, cfun);
+ fprintf (dump_file, ". Profile update is impossible.\n");
+ }
+ /* Drop quality of probability since we know it likely
+ bad. */
+ exit_edge->probability = exit_edge->probability.guessed ();
+ return NULL;
+ }
+ if (!exit_edge->src->count.nonzero_p ())
+ {
+ if (dump_file)
+ {
+ fprintf (dump_file, ";; Not updating exit edge probability"
+ " in loop %i since profile is zero ",
+ loop->num);
+ }
+ return NULL;
+ }
+ set_edge_probability_and_rescale_others
+ (exit_edge, desired_count.probability_in (exit_edge->src->count));
+ /* Rescale the remaining edge probabilities and see if there is only
+ one. */
+ edge other_edge = NULL;
+ bool found = false;
+ edge e;
+ edge_iterator ei;
+ FOR_EACH_EDGE (e, ei, exit_edge->src->succs)
+ if (!(e->flags & EDGE_FAKE)
+ && !loop_exit_edge_p (loop, e))
+ {
+ if (found)
+ {
+ other_edge = NULL;
+ break;
+ }
+ other_edge = e;
+ found = true;
+ }
+ /* If there is only loop latch after other edge,
+ update its profile. This is tiny bit more precise
+ than scaling. */
+ if (other_edge && other_edge->dest == loop->latch)
+ {
+ if (single_pred_p (loop->latch))
+ loop->latch->count = loop->latch->count
+ + old_exit_count - exit_edge->count ();
+ }
+ else
+ /* If there are multple blocks, just scale. */
+ scale_dominated_blocks_in_loop (loop, exit_edge->src,
+ exit_edge->src->count - exit_edge->count (),
+ exit_edge->src->count - old_exit_count);
+ return exit_edge;
+}
+
/* Scale profile in LOOP by P.
If ITERATION_BOUND is not -1, scale even further if loop is predicted
to iterate too many times.
@@ -571,17 +749,7 @@ scale_loop_profile (class loop *loop, profile_probability p,
if (iterations <= iteration_bound)
return;
- /* Compute number of invocations of the loop. */
- profile_count count_in = profile_count::zero ();
- edge e;
- edge_iterator ei;
- bool found_latch = false;
- FOR_EACH_EDGE (e, ei, loop->header->preds)
- if (e->src != loop->latch)
- count_in += e->count ();
- else
- found_latch = true;
- gcc_checking_assert (found_latch);
+ profile_count count_in = loop_count_in (loop);
/* Now scale the loop body so header count is
count_in * (iteration_bound + 1) */
@@ -596,8 +764,7 @@ scale_loop_profile (class loop *loop, profile_probability p,
(int)iteration_bound);
}
/* Finally attempt to fix exit edge probability. */
- auto_vec<edge> exits = get_loop_exit_edges (loop);
- edge exit_edge = single_likely_exit (loop, exits);
+ edge exit_edge = loop_exit_for_scaling (loop);
/* In a consistent profile unadjusted_exit_count should be same as count_in,
however to preserve as much of the original info, avoid recomputing
@@ -606,85 +773,8 @@ scale_loop_profile (class loop *loop, profile_probability p,
if (exit_edge)
unadjusted_exit_count = exit_edge->count ();
scale_loop_frequencies (loop, scale_prob);
-
- if (exit_edge && exit_edge->src->loop_father != loop)
- {
- if (dump_file && (dump_flags & TDF_DETAILS))
- fprintf (dump_file,
- ";; Loop exit is in inner loop;"
- " will leave exit probabilities inconsistent\n");
- }
- else if (exit_edge)
- {
- profile_count old_exit_count = exit_edge->count ();
- profile_probability new_probability;
- if (iteration_bound > 0)
- {
- /* It may happen that the source basic block of the exit edge is
- inside in-loop condition:
-
- +-> header
- | |
- | B1
- | / \
- | | B2--exit_edge-->
- | \ /
- | B3
- +__/
-
- If B2 count is smaller than desired exit edge count
- the profile was inconsistent with the newly discovered upper bound.
- Probablity of edge B1->B2 is too low. We do not attempt to fix
- that (as it is hard in general) but we want to avoid dropping
- count of edge B2->B3 to zero may confuse later optimizations. */
- if (unadjusted_exit_count.apply_scale (7, 8) > exit_edge->src->count)
- {
- if (dump_file && (dump_flags & TDF_DETAILS))
- fprintf (dump_file,
- ";; Source basic block of loop exit count is too small;"
- " will leave exit probabilities inconsistent\n");
- exit_edge->probability = exit_edge->probability.guessed ();
- return;
- }
- new_probability
- = unadjusted_exit_count.probability_in (exit_edge->src->count);
- }
- else
- new_probability = profile_probability::always ();
- set_edge_probability_and_rescale_others (exit_edge, new_probability);
- profile_count new_exit_count = exit_edge->count ();
-
- /* Rescale the remaining edge probabilities and see if there is only
- one. */
- edge other_edge = NULL;
- bool found = false;
- FOR_EACH_EDGE (e, ei, exit_edge->src->succs)
- if (!(e->flags & EDGE_FAKE)
- && !loop_exit_edge_p (loop, e))
- {
- if (found)
- {
- other_edge = NULL;
- break;
- }
- other_edge = e;
- found = true;
- }
- /* If there is only loop latch after other edge,
- update its profile. */
- if (other_edge && other_edge->dest == loop->latch)
- loop->latch->count -= new_exit_count - old_exit_count;
- else
- scale_dominated_blocks_in_loop (loop, exit_edge->src,
- exit_edge->src->count - new_exit_count,
- exit_edge->src->count - old_exit_count);
- }
- else if (dump_file && (dump_flags & TDF_DETAILS))
- {
- fprintf (dump_file,
- ";; Loop has mulitple exits;"
- " will leave exit probabilities inconsistent\n");
- }
+ update_loop_exit_probability_scale_dom_bbs (loop, exit_edge,
+ unadjusted_exit_count);
}
/* Recompute dominance information for basic blocks outside LOOP. */
@@ -924,7 +1014,7 @@ create_empty_loop_on_edge (edge entry_edge,
have no successor, which caller is expected to fix somehow.
If this may cause the information about irreducible regions to become
- invalid, IRRED_INVALIDATED is set to true.
+ invalid, IRRED_INVALIDATED is set to true.
LOOP_CLOSED_SSA_INVALIDATED, if non-NULL, is a bitmap where we store
basic blocks that had non-trivial update on their loop_father.*/
diff --git a/gcc/cfgloopmanip.h b/gcc/cfgloopmanip.h
index dab7b31..2dda504 100644
--- a/gcc/cfgloopmanip.h
+++ b/gcc/cfgloopmanip.h
@@ -68,6 +68,9 @@ class loop * loop_version (class loop *, void *,
void adjust_loop_info_after_peeling (class loop *loop, int npeel, bool precise);
void scale_dominated_blocks_in_loop (class loop *loop, basic_block bb,
profile_count num, profile_count den);
+edge update_loop_exit_probability_scale_dom_bbs
+ (class loop *loop, edge exit_edge = NULL,
+ profile_count desired_count = profile_count::uninitialized ());
void update_exit_probability_after_unrolling (class loop *loop, edge new_exit);
#endif /* GCC_CFGLOOPMANIP_H */
diff --git a/gcc/loop-unroll.cc b/gcc/loop-unroll.cc
index bbfa6cc..1df8e6c 100644
--- a/gcc/loop-unroll.cc
+++ b/gcc/loop-unroll.cc
@@ -488,6 +488,7 @@ unroll_loop_constant_iterations (class loop *loop)
struct opt_info *opt_info = NULL;
bool ok;
bool flat = maybe_flat_loop_profile (loop);
+ profile_count orig_exit_count = desc->out_edge->count ();
niter = desc->niter;
@@ -608,9 +609,10 @@ unroll_loop_constant_iterations (class loop *loop)
| (flat ? DLTHE_FLAG_FLAT_PROFILE : 0));
gcc_assert (ok);
- edge new_exit = single_dom_exit (loop);
- if (new_exit)
- update_exit_probability_after_unrolling (loop, new_exit);
+ edge exit = update_loop_exit_probability_scale_dom_bbs
+ (loop, desc->out_edge, orig_exit_count);
+ if (exit)
+ update_br_prob_note (exit->src);
if (opt_info)
{
diff --git a/gcc/tree-ssa-loop-manip.cc b/gcc/tree-ssa-loop-manip.cc
index e58892e..e743691 100644
--- a/gcc/tree-ssa-loop-manip.cc
+++ b/gcc/tree-ssa-loop-manip.cc
@@ -1040,29 +1040,6 @@ determine_exit_conditions (class loop *loop, class tree_niter_desc *desc,
*exit_bound = bound;
}
-/* Updat NEW_EXIT probability after loop has been unrolled. */
-
-void
-update_exit_probability_after_unrolling (class loop *loop, edge new_exit)
-{
- /* gimple_duplicate_loop_body_to_header_edge depending on
- DLTHE_FLAG_UPDATE_FREQ either keeps original frequency of the loop header
- or scales it down accordingly.
- However exit edge probability is kept as original. Fix it if needed
- and compensate. */
- profile_probability new_prob
- = loop_preheader_edge
- (loop)->count ().probability_in (new_exit->src->count);
- if (!(new_prob == new_exit->probability))
- {
- profile_count old_count = new_exit->src->count - new_exit->count ();
- set_edge_probability_and_rescale_others (new_exit, new_prob);
- profile_count new_count = new_exit->src->count - new_exit->count ();
- scale_dominated_blocks_in_loop (loop, new_exit->src,
- new_count, old_count);
- }
-}
-
/* Unroll LOOP FACTOR times. LOOP is known to have a single exit edge
whose source block dominates the latch. DESC describes the number of
iterations of LOOP.
@@ -1289,7 +1266,12 @@ tree_transform_and_unroll_loop (class loop *loop, unsigned factor,
update_ssa (TODO_update_ssa);
new_exit = single_dom_exit (loop);
- update_exit_probability_after_unrolling (loop, new_exit);
+ /* gimple_duplicate_loop_body_to_header_edge depending on
+ DLTHE_FLAG_UPDATE_FREQ either keeps original frequency of the loop header
+ or scales it down accordingly.
+ However exit edge probability is kept as original. Fix it if needed
+ and compensate. */
+ update_loop_exit_probability_scale_dom_bbs (loop, new_exit);
if (!single_loop_p)
{
/* Finally create the new counter for number of iterations and add
diff --git a/gcc/tree-ssa-loop-split.cc b/gcc/tree-ssa-loop-split.cc
index 641346c..923e49e 100644
--- a/gcc/tree-ssa-loop-split.cc
+++ b/gcc/tree-ssa-loop-split.cc
@@ -610,7 +610,6 @@ split_loop (class loop *loop1)
for (i = 0; i < loop1->num_nodes; i++)
if ((guard_iv = split_at_bb_p (loop1, bbs[i], &border, &iv, &guard_code)))
{
- profile_count entry_count = loop_preheader_edge (loop1)->count ();
/* Handling opposite steps is not implemented yet. Neither
is handling different step sizes. */
if ((tree_int_cst_sign_bit (iv.step)
@@ -692,48 +691,8 @@ split_loop (class loop *loop1)
= loop1_prob.invert ();
fix_loop_bb_probability (loop1, loop2, true_edge, false_edge);
-
- /* Fix loop's exit probability after scaling. */
-
- if (entry_count.initialized_p () && entry_count.nonzero_p ())
- {
- edge exit_to_latch1;
- if (EDGE_SUCC (exit1->src, 0) == exit1)
- exit_to_latch1 = EDGE_SUCC (exit1->src, 1);
- else
- exit_to_latch1 = EDGE_SUCC (exit1->src, 0);
- if (exit1->src->count.nonzero_p ())
- {
- /* First loop is entered loop1_prob * entry_count times
- and it needs to exit the same number of times. */
- exit1->probability
- = entry_count.apply_probability
- (loop1_prob).probability_in (exit1->src->count);
- exit_to_latch1->probability = exit1->probability.invert ();
- scale_dominated_blocks_in_loop (loop1, exit1->src,
- exit_to_latch1->count (),
- exit_to_latch1->dest->count);
- }
-
- edge exit_to_latch2, exit2 = single_exit (loop2);
- if (EDGE_SUCC (exit2->src, 0) == exit2)
- exit_to_latch2 = EDGE_SUCC (exit2->src, 1);
- else
- exit_to_latch2 = EDGE_SUCC (exit2->src, 0);
- if (exit2->src->count.nonzero_p ())
- {
- /* Second loop is entered very_likely * entry_count times
- and it needs to exit the same number of times. */
- exit2->probability
- = entry_count.apply_probability
- (profile_probability::very_likely ())
- .probability_in (exit2->src->count);
- exit_to_latch2->probability = exit2->probability.invert ();
- scale_dominated_blocks_in_loop (loop2, exit2->src,
- exit_to_latch2->count (),
- exit_to_latch2->dest->count);
- }
- }
+ update_loop_exit_probability_scale_dom_bbs (loop1);
+ update_loop_exit_probability_scale_dom_bbs (loop2);
edge new_e = connect_loops (loop1, loop2);
connect_loop_phis (loop1, loop2, new_e);