// Implementation of basic-block-related functions for RTL SSA -*- C++ -*-
// Copyright (C) 2020-2024 Free Software Foundation, Inc.
//
// This file is part of GCC.
//
// GCC is free software; you can redistribute it and/or modify it under
// the terms of the GNU General Public License as published by the Free
// Software Foundation; either version 3, or (at your option) any later
// version.
//
// GCC is distributed in the hope that it will be useful, but WITHOUT ANY
// WARRANTY; without even the implied warranty of MERCHANTABILITY or
// FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
// for more details.
//
// You should have received a copy of the GNU General Public License
// along with GCC; see the file COPYING3. If not see
// <http://www.gnu.org/licenses/>.
#define INCLUDE_ALGORITHM
#define INCLUDE_FUNCTIONAL
#define INCLUDE_MEMORY
#define INCLUDE_ARRAY
#include "config.h"
#include "system.h"
#include "coretypes.h"
#include "backend.h"
#include "rtl.h"
#include "df.h"
#include "rtl-ssa.h"
#include "rtl-ssa/internals.h"
#include "rtl-ssa/internals.inl"
#include "cfganal.h"
#include "cfgrtl.h"
#include "predict.h"
#include "domwalk.h"
using namespace rtl_ssa;
// Prepare to build information for a function in which all register numbers
// are less than NUM_REGS and all basic block indices are less than
// NUM_BB_INDICES.
//
// The body grows each per-register and per-block array to its final
// length so that later code can index the arrays directly.
function_info::build_info::build_info (unsigned int num_regs,
unsigned int num_bb_indices)
: current_bb (nullptr),
current_ebb (nullptr),
last_access (num_regs + 1),
ebb_live_in_for_debug (nullptr),
potential_phi_regs (num_regs),
bb_phis (num_bb_indices),
bb_mem_live_out (num_bb_indices),
bb_to_rpo (num_bb_indices),
exit_block_dominator (nullptr)
{
// LAST_ACCESS gets NUM_REGS + 1 cleared entries, i.e. one more entry
// than there are registers. NOTE(review): end_block indexes it with
// REGNO + 1, so entry 0 is presumably reserved for memory -- confirm.
last_access.safe_grow_cleared (num_regs + 1);
// Start with no registers marked as potential phi registers.
bitmap_clear (potential_phi_regs);
// These arrays shouldn't need to be initialized, since we'll always
// write to an entry before reading from it. But poison the contents
// when checking, just to make sure we don't accidentally use an
// uninitialized value.
bb_phis.quick_grow_cleared (num_bb_indices);
bb_mem_live_out.quick_grow (num_bb_indices);
bb_to_rpo.quick_grow (num_bb_indices);
if (flag_checking)
{
// Can't do this for bb_phis because it has a constructor.
memset (bb_mem_live_out.address (), 0xaf,
num_bb_indices * sizeof (bb_mem_live_out[0]));
memset (bb_to_rpo.address (), 0xaf,
num_bb_indices * sizeof (bb_to_rpo[0]));
}
// Start off with an empty set of phi nodes for each block.
// The destructor releases these bitmaps again.
for (bb_phi_info &info : bb_phis)
bitmap_initialize (&info.regs, &bitmap_default_obstack);
}
// Release the per-block phi register bitmaps that the constructor
// initialized.
function_info::build_info::~build_info ()
{
  for (unsigned int i = 0; i < bb_phis.length (); ++i)
    bitmap_release (&bb_phis[i].regs);
}
// A dom_walker for populating the basic blocks. The walk covers all
// blocks (ALL_BLOCKS) of the dominator tree (CDI_DOMINATORS). Each block
// is passed to function_info::start_block before its dominator children
// are walked and to function_info::end_block afterwards.
class function_info::bb_walker : public dom_walker
{
public:
// Create a walker that adds blocks to the given function_info, using the
// given build_info as the build state.
bb_walker (function_info *, build_info &);
// Start processing a block. Always returns null.
edge before_dom_children (basic_block) final override;
// Finish processing a block. If the block is m_exit_block_dominator,
// process the exit block first.
void after_dom_children (basic_block) final override;
private:
// Information about the function we're building.
function_info *m_function;
build_info &m_bi;
// We should treat the exit block as being the last child of this one.
// See the comment in the constructor for more information.
basic_block m_exit_block_dominator;
};
// Set up a walk over all blocks in FUNCTION's dominator tree, using BI as
// the build state. BI.bb_to_rpo is passed on to the dom_walker base class.
function_info::bb_walker::bb_walker (function_info *function, build_info &bi)
  : dom_walker (CDI_DOMINATORS, ALL_BLOCKS, bi.bb_to_rpo.address ()),
    m_function (function),
    m_bi (bi),
    m_exit_block_dominator (bi.exit_block_dominator)
{
  // BI records no dominator for the exit block when that block is
  // unreachable. Attach it to the entry block in that case, so that
  // it is processed last.
  if (m_exit_block_dominator == nullptr)
    m_exit_block_dominator = ENTRY_BLOCK_PTR_FOR_FN (function->m_fn);
}
// Called before the dominator children of BB are walked. Start adding
// BB to the SSA information. Always returns null.
edge
function_info::bb_walker::before_dom_children (basic_block bb)
{
  bb_info *info = m_function->bb (bb);
  m_function->start_block (m_bi, info);
  return nullptr;
}
// Called after the dominator children of BB have been walked. Finish BB,
// first processing the exit block if BB is the block that the exit block
// is attached to.
void
function_info::bb_walker::after_dom_children (basic_block bb)
{
  if (bb == m_exit_block_dominator)
    {
      // Treat the exit block as the final child of BB: start it and
      // finish it before BB itself is finished.
      basic_block exit_bb = EXIT_BLOCK_PTR_FOR_FN (m_function->m_fn);
      before_dom_children (exit_bb);
      after_dom_children (exit_bb);
    }
  bb_info *info = m_function->bb (bb);
  m_function->end_block (m_bi, info);
}
// Print "bb" followed by the block's index to PP. If the block has an
// EBB, follow this with a space and the EBB's identifier in brackets.
// See also the comment above the declaration.
void
bb_info::print_identifier (pretty_printer *pp) const
{
  char buffer[3 * sizeof (index ()) + 3];
  snprintf (buffer, sizeof (buffer), "bb%d", index ());
  pp_string (pp, buffer);

  ebb_info *ebb = this->ebb ();
  if (!ebb)
    return;

  pp_space (pp);
  pp_left_bracket (pp);
  ebb->print_identifier (pp);
  pp_right_bracket (pp);
}
// Print a multi-line description of the block to PP: its identifier,
// its head instruction, its real instructions and its end instruction.
// See also the comment above the declaration.
void
bb_info::print_full (pretty_printer *pp) const
{
  pp_string (pp, "basic block ");
  print_identifier (pp);
  pp_colon (pp);

  // Print LABEL on one line and INSN on the next, each indented by a
  // further two columns. Undo both indentation steps afterwards.
  auto print_boundary = [pp](const char *label, const insn_info *insn)
    {
      pp_newline_and_indent (pp, 2);
      pp_string (pp, label);
      pp_newline_and_indent (pp, 2);
      if (!insn)
        pp_string (pp, "");
      else
        pp_insn (pp, insn);
      pp_indentation (pp) -= 4;
    };

  print_boundary ("head:", head_insn ());

  pp_newline (pp);
  pp_newline_and_indent (pp, 2);
  pp_string (pp, "contents:");
  if (!head_insn ())
    {
      // The block has no head instruction yet.
      pp_newline_and_indent (pp, 2);
      pp_string (pp, "");
      pp_indentation (pp) -= 2;
    }
  else if (auto insns = real_insns ())
    {
      // Emit an extra newline between consecutive instructions.
      bool need_separator = false;
      for (const insn_info *insn : insns)
        {
          if (need_separator)
            pp_newline (pp);
          need_separator = true;
          pp_newline_and_indent (pp, 2);
          pp_insn (pp, insn);
          pp_indentation (pp) -= 2;
        }
    }
  else
    {
      pp_newline_and_indent (pp, 2);
      pp_string (pp, "none");
      pp_indentation (pp) -= 2;
    }
  pp_indentation (pp) -= 2;

  pp_newline (pp);
  print_boundary ("end:", end_insn ());
}
// Print "call clobbers for ABI " to PP, followed by the identifier of the
// ABI if one is recorded. See also the comment above the declaration.
void
ebb_call_clobbers_info::print_summary (pretty_printer *pp) const
{
  pp_string (pp, "call clobbers for ABI ");
  if (!m_abi)
    {
      pp_string (pp, "");
      return;
    }
  pp_decimal_int (pp, m_abi->id ());
}
// Print the summary line to PP, followed by the notes reachable from
// root (), with each note shown as the identifier and location of its
// instruction. See also the comment above the declaration.
void
ebb_call_clobbers_info::print_full (pretty_printer *pp) const
{
  print_summary (pp);
  pp_colon (pp);
  pp_newline_and_indent (pp, 2);

  // Print the instruction associated with a single note.
  auto print_note = [](pretty_printer *pp,
                       const insn_call_clobbers_note *note)
    {
      insn_info *insn = note->insn ();
      if (!insn)
        {
          pp_string (pp, "");
          return;
        }
      insn->print_identifier_and_location (pp);
    };
  print (pp, root (), print_note);
  pp_indentation (pp) -= 2;
}
// Print "ebb" followed by the index of the EBB's first block to PP.
// See also the comment above the declaration.
void
ebb_info::print_identifier (pretty_printer *pp) const
{
  // The constructor populates first_bb, so it should never be null here.
  auto first_index = first_bb ()->index ();
  char buffer[3 * sizeof (first_index) + 4];
  snprintf (buffer, sizeof (buffer), "ebb%d", first_index);
  pp_string (pp, buffer);
}
// Print a multi-line description of the EBB to PP: its identifier, its
// phi instruction and phi nodes, each of its basic blocks and each of its
// call-clobber records. See also the comment above the declaration.
void
ebb_info::print_full (pretty_printer *pp) const
{
  pp_string (pp, "extended basic block ");
  print_identifier (pp);
  pp_colon (pp);

  pp_newline_and_indent (pp, 2);
  insn_info *phi_insn = this->phi_insn ();
  if (!phi_insn)
    pp_string (pp, "no phi insn");
  else
    {
      phi_insn->print_identifier_and_location (pp);
      pp_colon (pp);
      if (auto phis = this->phis ())
        {
          // Emit an extra newline between consecutive phi nodes.
          bool need_separator = false;
          for (const phi_info *phi : phis)
            {
              if (need_separator)
                pp_newline (pp);
              need_separator = true;
              pp_newline_and_indent (pp, 2);
              pp_access (pp, phi, PP_ACCESS_SETTER);
              pp_indentation (pp) -= 2;
            }
        }
      else
        {
          pp_newline_and_indent (pp, 2);
          pp_string (pp, "no phi nodes");
          pp_indentation (pp) -= 2;
        }
    }
  pp_indentation (pp) -= 2;

  // Describe each basic block in the EBB.
  for (const bb_info *bb : bbs ())
    {
      pp_newline (pp);
      pp_newline_and_indent (pp, 2);
      pp_bb (pp, bb);
      pp_indentation (pp) -= 2;
    }

  // Describe each set of call clobbers.
  for (ebb_call_clobbers_info *ecc : call_clobbers ())
    {
      pp_newline (pp);
      pp_newline_and_indent (pp, 2);
      pp_ebb_call_clobbers (pp, ecc);
      pp_indentation (pp) -= 2;
    }
}
// Add a dummy use to mark that DEF is live out of BB's EBB at the end of BB.
void
function_info::add_live_out_use (bb_info *bb, set_info *def)
{
  // Nothing is needed if DEF is an artificial definition at the end of BB.
  // In that case the definition is rooted at the end of the block and a
  // use immediately after it would gain nothing. Adding such a use would
  // also require a new instruction that comes after bb->end_insn ().
  if (def->insn () == bb->end_insn ())
    return;

  // An existing artificial use at the end of the block already makes DEF
  // live at the appropriate point.
  use_info *last_use = def->last_nondebug_insn_use ();
  if (last_use && last_use->insn () == bb->end_insn ())
    return;

  // There is currently no need for a backward link from the end
  // instruction to the list of live-out uses. Such a list would be
  // expensive to update if it used the usual insn_info access arrays.
  use_info *live_out_use = allocate (bb->end_insn (), def->resource (), def);
  live_out_use->set_is_live_out_use (true);
  add_use (live_out_use);
}
// Return true if every use of DEF that is not in a debug instruction is
// a live-out use.
static bool
all_uses_are_live_out_uses (set_info *def)
{
  for (use_info *use : def->all_uses ())
    {
      // Debug uses and live-out uses don't count against DEF.
      if (use->is_in_debug_insn () || use->is_live_out_use ())
        continue;
      return false;
    }
  return true;
}
// SET, if nonnull, is a definition of something that is live out from BB.
// Return the live-out value itself.
set_info *
function_info::live_out_value (bb_info *bb, set_info *set)
{
  // Only degenerate phis need special handling.
  auto *phi = safe_dyn_cast (set);
  if (!phi || !phi->is_degenerate ())
    return set;

  // Degenerate phis only exist to provide a definition for uses in the
  // same EBB, so the live-out value is the same as the live-in value.
  set = phi->input_value (0);

  // Drop the phi if it turned out to be useless. This mostly helps for
  // memory, since we don't know ahead of time whether a block will use
  // memory or not.
  if (bb == bb->ebb ()->last_bb () && all_uses_are_live_out_uses (phi))
    replace_phi (phi, set);

  return set;
}
// Add PHI to EBB and enter it into the function's hash table. PHI becomes
// the first phi in EBB's list, ahead of any phis that are already there.
void
function_info::append_phi (ebb_info *ebb, phi_info *phi)
{
  phi_info *old_first = ebb->first_phi ();
  if (old_first != nullptr)
    old_first->set_prev_phi (phi);
  phi->set_next_phi (old_first);
  ebb->set_first_phi (phi);
  add_def (phi);
}
// Remove PHI from its current position in the SSA graph: unlink it from
// its EBB's list of phis, remove it as a definition and clear its links.
void
function_info::remove_phi (phi_info *phi)
{
  phi_info *following = phi->next_phi ();
  phi_info *preceding = phi->prev_phi ();

  if (following != nullptr)
    following->set_prev_phi (preceding);

  // A phi with no predecessor is the first phi in its EBB.
  if (preceding == nullptr)
    phi->ebb ()->set_first_phi (following);
  else
    preceding->set_next_phi (following);

  remove_def (phi);
  phi->clear_phi_links ();
}
// Remove PHI from the SSA graph and free its memory. PHI must not have
// any uses. The phi is placed on the m_free_phis list rather than being
// released.
void
function_info::delete_phi (phi_info *phi)
{
  gcc_assert (!phi->has_any_uses ());

  // Remove the phi's own input uses.
  for (use_info *input_use : phi->inputs ())
    remove_use (input_use);

  remove_phi (phi);

  // Push the phi onto the head of the free list.
  phi->set_next_phi (m_free_phis);
  m_free_phis = phi;
}
// If possible, remove PHI and replace all uses with NEW_VALUE.
//
// PHI cannot be removed if NEW_VALUE is nonnull and PHI has a nondebug
// instruction use that is not a live-out use. In that case PHI is kept
// as a degenerate phi whose input is NEW_VALUE, and only the uses of PHI
// by other phis are redirected to NEW_VALUE. Otherwise live-out uses are
// removed, every other use is redirected to NEW_VALUE, and PHI is deleted.
void
function_info::replace_phi (phi_info *phi, set_info *new_value)
{
// Move USE from its current definition to NEW_VALUE.
auto update_use = [&](use_info *use)
{
remove_use (use);
use->set_def (new_value);
add_use (use);
};
if (new_value)
for (use_info *use : phi->nondebug_insn_uses ())
if (!use->is_live_out_use ())
{
// We need to keep the phi around for its local uses.
// Turn it into a degenerate phi, if it isn't already.
//
// Note that this USE is the phi's first input and shadows the loop
// variable. Both paths below return, so the loop never continues
// past the first use that reaches this point.
use_info *use = phi->input_use (0);
if (use->def () != new_value)
update_use (use);
if (phi->is_degenerate ())
return;
phi->make_degenerate (use);
// Redirect all phi users to NEW_VALUE.
while (use_info *phi_use = phi->last_phi_use ())
update_use (phi_use);
return;
}
// Replace the uses. We can discard uses that only existed for the
// sake of marking live-out values, since the resource is now transparent
// in the phi's EBB.
//
// Each iteration takes the last use off PHI's list, so the loop ends
// once PHI has no uses left, as delete_phi requires.
while (use_info *use = phi->last_use ())
if (use->is_live_out_use ())
remove_use (use);
else
update_use (use);
delete_phi (phi);
}
// Create and return a phi node for EBB. RESOURCE is the resource that
// the phi node sets (and thus that all the inputs set too). NUM_INPUTS
// is the number of inputs, which is 1 for a degenerate phi. INPUTS[I]
// is a set_info that gives the value of input I, or null if the value
// is either unknown or uninitialized. If NUM_INPUTS > 1, this array
// is allocated on the main obstack and can be reused for the use array.
//
// On return, each entry of INPUTS has been overwritten with the use_info
// created for that input.
//
// Add the created phi node to its basic block and enter it into the
// function's hash table.
phi_info *
function_info::create_phi (ebb_info *ebb, resource_info resource,
access_info **inputs, unsigned int num_inputs)
{
// Reuse a phi from the free list if there is one, reinitializing it in
// place but keeping its existing uid. Otherwise allocate a new phi and
// give it the next unused uid.
phi_info *phi = m_free_phis;
if (phi)
{
m_free_phis = phi->next_phi ();
*phi = phi_info (ebb->phi_insn (), resource, phi->uid ());
}
else
{
phi = allocate (ebb->phi_insn (), resource, m_next_phi_uid);
m_next_phi_uid += 1;
}
// Convert the array of set_infos into an array of use_infos. Also work
// out what mode the phi should have.
machine_mode new_mode = resource.mode;
for (unsigned int i = 0; i < num_inputs; ++i)
{
auto *input = safe_as_a (inputs[i]);
auto *use = allocate (phi, resource, input);
add_use (use);
inputs[i] = use;
// Null inputs have no mode to contribute.
if (input)
new_mode = combine_modes (new_mode, input->mode ());
}
phi->set_inputs (use_array (inputs, num_inputs));
phi->set_mode (new_mode);
append_phi (ebb, phi);
return phi;
}
// Create and return a degenerate phi for EBB whose input comes from DEF.
// This is used in cases where DEF is known to be available on entry to
// EBB but was not previously used within it. If DEF is for a register,
// there are two cases:
//
// (1) DEF was already live on entry to EBB but was previously transparent
// within it.
//
// (2) DEF was not previously live on entry to EBB and is being made live
// by this update.
//
// At the moment, this function only handles the case in which EBB has a
// single predecessor block and DEF is defined in that block's EBB.
//
// If EBB already has a phi for DEF's resource, return that phi instead of
// creating a new one. For registers, the function also updates the DF_LR
// live-in and live-out sets and adds any live-out uses that are needed.
phi_info *
function_info::create_degenerate_phi (ebb_info *ebb, set_info *def)
{
  // Allow the function to be called twice in succession for the same def.
  def_lookup dl = find_def (def->resource (), ebb->phi_insn ());
  if (set_info *set = dl.matching_set ())
    return as_a (set);

  access_info *input = def;
  phi_info *phi = create_phi (ebb, def->resource (), &input, 1);
  if (def->is_reg ())
    {
      unsigned int regno = def->regno ();

      // Find the single predecessor mentioned above.
      basic_block pred_cfg_bb = single_pred (ebb->first_bb ()->cfg_bb ());
      bb_info *pred_bb = this->bb (pred_cfg_bb);

      // bitmap_set_bit returns true if the bit changed, i.e. if the
      // register was not in the set beforehand. A true result here
      // therefore corresponds to case (2) above and a false result to
      // case (1).
      if (bitmap_set_bit (DF_LR_IN (ebb->first_bb ()->cfg_bb ()), regno))
        {
          // The register was not previously live on entry to EBB and
          // might not have been live on exit from PRED_BB either.
          if (bitmap_set_bit (DF_LR_OUT (pred_cfg_bb), regno))
            add_live_out_use (pred_bb, def);
        }
      else
        {
          // The register was previously live in to EBB. Add live-out uses
          // at the appropriate points: stop at the first block that
          // contains the next definition of the register, or in which
          // the register is not live out.
          insn_info *next_insn = nullptr;
          if (def_info *next_def = phi->next_def ())
            next_insn = next_def->insn ();
          for (bb_info *bb : ebb->bbs ())
            {
              if ((next_insn && *next_insn <= *bb->end_insn ())
                  || !bitmap_bit_p (DF_LR_OUT (bb->cfg_bb ()), regno))
                break;
              add_live_out_use (bb, def);
            }
        }
    }
  return phi;
}
// Create a bb_info for CFG_BB, given that no such structure currently
// exists. Record the new structure in m_bbs, indexed by CFG_BB's index,
// and return it.
bb_info *
function_info::create_bb_info (basic_block cfg_bb)
{
  bb_info *new_bb = allocate (cfg_bb);
  auto index = cfg_bb->index;
  gcc_checking_assert (!m_bbs[index]);
  m_bbs[index] = new_bb;
  return new_bb;
}
// Add BB to the end of the list of blocks, making it the first block too
// if the list was previously empty.
void
function_info::append_bb (bb_info *bb)
{
  bb_info *old_last = m_last_bb;
  if (!old_last)
    m_first_bb = bb;
  else
    old_last->set_next_bb (bb);
  bb->set_prev_bb (old_last);
  m_last_bb = bb;
}
// Calculate BI.potential_phi_regs and BI.potential_phi_regs_for_debug.
// The latter is only updated if the function may have debug instructions.
void
function_info::calculate_potential_phi_regs (build_info &bi)
{
  const bool have_debug_insns = MAY_HAVE_DEBUG_INSNS;
  auto *entry_lr = DF_LR_BB_INFO (ENTRY_BLOCK_PTR_FOR_FN (m_fn));
  for (unsigned int regno = 0; regno < m_num_regs; ++regno)
    {
      // Exclude registers that have a single definition that dominates
      // all uses. If the definition does not dominate all uses, the
      // register will be exposed upwards to the entry block but will not
      // be defined by the entry block. Registers outside the range
      // covered by DF_REG_SIZE are always included.
      bool is_candidate = (regno >= DF_REG_SIZE (DF)
                           || DF_REG_DEF_COUNT (regno) > 1
                           || (!bitmap_bit_p (&entry_lr->def, regno)
                               && bitmap_bit_p (&entry_lr->out, regno)));
      if (!is_candidate)
        continue;

      bitmap_set_bit (bi.potential_phi_regs, regno);
      if (have_debug_insns)
        bitmap_set_bit (bi.potential_phi_regs_for_debug, regno);
    }
}
// Called while building SSA form using BI. Decide where phi nodes
// should be placed for each register and initialize BI.bb_phis accordingly.
//
// On return, each BI.bb_phis entry for an existing block has its set of
// phi registers, its phi and predecessor counts, and (if the product of
// the counts is nonzero) a zero-initialized array of phi inputs allocated
// on m_temp_obstack.
void
function_info::place_phis (build_info &bi)
{
unsigned int num_bb_indices = last_basic_block_for_fn (m_fn);
// Calculate dominance frontiers.
auto_vec frontiers;
frontiers.safe_grow_cleared (num_bb_indices);
for (unsigned int i = 0; i < num_bb_indices; ++i)
bitmap_initialize (&frontiers[i], &bitmap_default_obstack);
compute_dominance_frontiers (frontiers.address ());
// The normal dominance information doesn't calculate dominators for
// the exit block, so we don't get dominance frontiers for them either.
// Calculate them by hand.
//
// For each predecessor of the exit block, walk up the dominator tree
// until reaching BI.exit_block_dominator, adding the exit block to the
// frontier of every block visited on the way.
for (edge e : EXIT_BLOCK_PTR_FOR_FN (m_fn)->preds)
{
basic_block bb = e->src;
while (bb != bi.exit_block_dominator)
{
bitmap_set_bit (&frontiers[bb->index], EXIT_BLOCK);
bb = get_immediate_dominator (CDI_DOMINATORS, bb);
}
}
// In extreme cases, the number of live-in registers can be much
// greater than the number of phi nodes needed in a block (see PR98863).
// Try to reduce the number of operations involving live-in sets by using
// UNFILTERED as a staging area: registers in UNFILTERED need phi nodes if
// they are live on entry to the corresponding block, but do not need
// phi nodes otherwise.
auto_vec unfiltered;
unfiltered.safe_grow_cleared (num_bb_indices);
for (unsigned int i = 0; i < num_bb_indices; ++i)
bitmap_initialize (&unfiltered[i], &bitmap_default_obstack);
// If block B1 defines R and if B2 is in the dominance frontier of B1,
// queue a possible phi node for R in B2.
auto_bitmap worklist;
for (unsigned int b1 = 0; b1 < num_bb_indices; ++b1)
{
// Only access DF information for blocks that are known to exist.
if (bitmap_empty_p (&frontiers[b1]))
continue;
// Defs in B1 that are possibly in LR_IN in the dominance frontier
// blocks.
auto_bitmap b1_def;
bitmap_and (b1_def, &DF_LR_BB_INFO (BASIC_BLOCK_FOR_FN (m_fn, b1))->def,
DF_LR_OUT (BASIC_BLOCK_FOR_FN (m_fn, b1)));
bitmap_iterator bmi;
unsigned int b2;
EXECUTE_IF_SET_IN_BITMAP (&frontiers[b1], 0, b2, bmi)
if (bitmap_ior_into (&unfiltered[b2], b1_def)
&& !bitmap_empty_p (&frontiers[b2]))
// Propagate the (potential) new phi node definitions in B2.
bitmap_set_bit (worklist, b2);
}
// Iterate to a fixed point: a block is requeued whenever its UNFILTERED
// set gains registers and it has a nonempty dominance frontier.
while (!bitmap_empty_p (worklist))
{
unsigned int b1 = bitmap_first_set_bit (worklist);
bitmap_clear_bit (worklist, b1);
// Restrict the phi nodes to registers that are live on entry to
// the block.
bitmap b1_in = DF_LR_IN (BASIC_BLOCK_FOR_FN (m_fn, b1));
bitmap b1_phis = &bi.bb_phis[b1].regs;
// Nothing more to propagate if B1's set of phis didn't change.
if (!bitmap_ior_and_into (b1_phis, &unfiltered[b1], b1_in))
continue;
// If block B1 has a phi node for R and if B2 is in the dominance
// frontier of B1, queue a possible phi node for R in B2.
bitmap_iterator bmi;
unsigned int b2;
EXECUTE_IF_SET_IN_BITMAP (&frontiers[b1], 0, b2, bmi)
if (bitmap_ior_into (&unfiltered[b2], b1_phis)
&& !bitmap_empty_p (&frontiers[b2]))
bitmap_set_bit (worklist, b2);
}
basic_block cfg_bb;
FOR_ALL_BB_FN (cfg_bb, m_fn)
{
// Calculate the set of phi nodes for blocks that don't have any
// dominance frontiers. We only need to do this once per block.
// (Such blocks are never added to the worklist above.)
unsigned int i = cfg_bb->index;
bb_phi_info &phis = bi.bb_phis[i];
if (bitmap_empty_p (&frontiers[i]))
bitmap_and (&phis.regs, &unfiltered[i], DF_LR_IN (cfg_bb));
// Create an array that contains all phi inputs for this block.
// See the comment above the member variables for more information.
phis.num_phis = bitmap_count_bits (&phis.regs);
phis.num_preds = EDGE_COUNT (cfg_bb->preds);
unsigned int num_inputs = phis.num_phis * phis.num_preds;
if (num_inputs != 0)
{
phis.inputs = XOBNEWVEC (&m_temp_obstack, set_info *, num_inputs);
memset (phis.inputs, 0, num_inputs * sizeof (phis.inputs[0]));
}
}
// Free the temporary bitmaps.
for (unsigned int i = 0; i < num_bb_indices; ++i)
{
bitmap_release (&frontiers[i]);
bitmap_release (&unfiltered[i]);
}
}
// Called while building SSA form using BI, with BI.current_bb being
// the entry block.
//
// Create the entry block instructions and their definitions. Only the
// end instruction is useful: it carries definitions for the values that
// are live on entry to the function. A head instruction is created too,
// since that seems simpler than forcing all users of the block
// information to treat the entry block as a special case.
void
function_info::add_entry_block_defs (build_info &bi)
{
  bb_info *entry_bb = bi.current_bb;
  auto *entry_lr = DF_LR_BB_INFO (entry_bb->cfg_bb ());

  entry_bb->set_head_insn (append_artificial_insn (entry_bb));
  insn_info *end_insn = append_artificial_insn (entry_bb);
  entry_bb->set_end_insn (end_insn);

  start_insn_accesses ();

  // Deriving the liveness information from LR means that upwards exposed
  // registers get an entry block definition. Such registers are sometimes
  // genuinely uninitialized. However, some targets also create a pseudo
  // PIC base register and only initialize it later. Handling that case
  // correctly seems more important than optimizing uninitialized uses.
  unsigned int regno;
  bitmap_iterator iter;
  EXECUTE_IF_SET_IN_BITMAP (&entry_lr->out, 0, regno, iter)
    {
      auto *reg_def = allocate (end_insn, full_register (regno));
      append_def (reg_def);
      m_temp_defs.safe_push (reg_def);
      bi.record_reg_def (reg_def);
    }

  // Add a definition for the state of memory on entry to the function.
  auto *mem_def = allocate (end_insn, memory);
  append_def (mem_def);
  m_temp_defs.safe_push (mem_def);
  bi.record_mem_def (mem_def);

  finish_insn_accesses (end_insn);
}
// Lazily calculate the value of BI.ebb_live_in_for_debug for BI.current_ebb.
// The result is the set of potential debug phi registers that are live on
// entry to the EBB's first block. It is stored in
// BI.tmp_ebb_live_in_for_debug, which must be empty on entry.
void
function_info::calculate_ebb_live_in_for_debug (build_info &bi)
{
  gcc_checking_assert (bitmap_empty_p (bi.tmp_ebb_live_in_for_debug));
  basic_block first_cfg_bb = bi.current_ebb->first_bb ()->cfg_bb ();
  bi.ebb_live_in_for_debug = bi.tmp_ebb_live_in_for_debug;
  bitmap_and (bi.ebb_live_in_for_debug, bi.potential_phi_regs_for_debug,
              DF_LR_IN (first_cfg_bb));
  bitmap_tree_view (bi.ebb_live_in_for_debug);
}
// Called while building SSA form using BI. Create phi nodes for the
// current EBB.
//
// One register phi is created for each register in the first block's
// BI.bb_phis entry, with all inputs initially null. A memory phi is
// always created as well. m_temp_defs is used as scratch space for the
// memory inputs and is emptied again before returning.
void
function_info::add_phi_nodes (build_info &bi)
{
ebb_info *ebb = bi.current_ebb;
basic_block cfg_bb = ebb->first_bb ()->cfg_bb ();
// Create the register phis for this EBB.
bb_phi_info &phis = bi.bb_phis[cfg_bb->index];
unsigned int num_preds = phis.num_preds;
unsigned int regno;
bitmap_iterator in_bi;
EXECUTE_IF_SET_IN_BITMAP (&phis.regs, 0, regno, in_bi)
{
gcc_checking_assert (bitmap_bit_p (bi.potential_phi_regs, regno));
// Create an array of phi inputs, to be filled in later.
auto *inputs = XOBNEWVEC (&m_obstack, access_info *, num_preds);
memset (inputs, 0, sizeof (access_info *) * num_preds);
// Later code works out the correct mode of the phi. Use BLKmode
// as a placeholder for now.
phi_info *phi = create_phi (ebb, { E_BLKmode, regno },
inputs, num_preds);
bi.record_reg_def (phi);
}
// The registers defined so far in this EBB are exactly the phi registers.
bitmap_copy (bi.ebb_def_regs, &phis.regs);
// Collect the live-in memory definitions and record whether they're
// all the same.
m_temp_defs.reserve (num_preds);
set_info *mem_value = nullptr;
bool mem_phi_is_degenerate = true;
edge e;
edge_iterator ei;
FOR_EACH_EDGE (e, ei, cfg_bb->preds)
{
bb_info *pred_bb = this->bb (e->src);
if (pred_bb && pred_bb->head_insn ())
{
mem_value = bi.bb_mem_live_out[pred_bb->index ()];
m_temp_defs.quick_push (mem_value);
if (mem_value != m_temp_defs[0])
mem_phi_is_degenerate = false;
}
else
{
// The predecessor has no bb_info or no head insn yet, so its
// live-out memory value is not available here. NOTE(review):
// presumably this is a predecessor that has not been processed
// yet, with populate_phi_inputs filling in the input later.
m_temp_defs.quick_push (nullptr);
mem_phi_is_degenerate = false;
}
}
// Create a phi for memory, on the assumption that something in the
// EBB will need it.
if (mem_phi_is_degenerate)
{
access_info *input[] = { mem_value };
mem_value = create_phi (ebb, memory, input, 1);
}
else
{
// Copy the collected inputs to the main obstack, so that create_phi
// can reuse the array for the phi's uses.
obstack_grow (&m_obstack, m_temp_defs.address (),
num_preds * sizeof (access_info *));
auto *inputs = static_cast (obstack_finish (&m_obstack));
mem_value = create_phi (ebb, memory, inputs, num_preds);
}
bi.record_mem_def (mem_value);
m_temp_defs.truncate (0);
}
// Called while building SSA form using BI.
//
// If FLAGS is DF_REF_AT_TOP, create the head insn for BI.current_bb
// and populate its uses and definitions. If FLAGS is 0, do the same
// for the end insn.
void
function_info::add_artificial_accesses (build_info &bi, df_ref_flags flags)
{
bb_info *bb = bi.current_bb;
basic_block cfg_bb = bb->cfg_bb ();
auto *lr_info = DF_LR_BB_INFO (cfg_bb);
df_ref ref;
insn_info *insn;
if (flags == DF_REF_AT_TOP)
{
// The head insn is associated with the block's bb_note, except in
// the exit block, where the insn is created without one.
if (cfg_bb->index == EXIT_BLOCK)
insn = append_artificial_insn (bb);
else
insn = append_artificial_insn (bb, bb_note (cfg_bb));
bb->set_head_insn (insn);
}
else
{
insn = append_artificial_insn (bb);
bb->set_end_insn (insn);
}
start_insn_accesses ();
// ADDED_REGS records the hard registers that are given an artificial
// use here, so that the global register loop below doesn't add a
// second use of the same register.
HARD_REG_SET added_regs = {};
FOR_EACH_ARTIFICIAL_USE (ref, cfg_bb->index)
if ((DF_REF_FLAGS (ref) & DF_REF_AT_TOP) == flags)
{
unsigned int regno = DF_REF_REGNO (ref);
machine_mode mode = GET_MODE (DF_REF_REAL_REG (ref));
if (HARD_REGISTER_NUM_P (regno))
SET_HARD_REG_BIT (added_regs, regno);
// A definition must be available.
gcc_checking_assert (bitmap_bit_p (&lr_info->in, regno)
|| (flags != DF_REF_AT_TOP
&& bitmap_bit_p (&lr_info->def, regno)));
m_temp_uses.safe_push (create_reg_use (bi, insn, { mode, regno }));
}
// Ensure that global registers and memory are live at the end of any
// block that has no successors, such as the exit block and non-local gotos.
// Global registers have to be singled out because they are not part of
// the DF artificial use list (they are instead treated as used within
// every block).
if (flags == 0 && EDGE_COUNT (cfg_bb->succs) == 0)
{
for (unsigned int i = 0; i < FIRST_PSEUDO_REGISTER; ++i)
if (global_regs[i] && !TEST_HARD_REG_BIT (added_regs, i))
{
auto mode = reg_raw_mode[i];
m_temp_uses.safe_push (create_reg_use (bi, insn, { mode, i }));
}
auto *use = allocate (insn, memory, bi.current_mem_value ());
add_use (use);
m_temp_uses.safe_push (use);
}
FOR_EACH_ARTIFICIAL_DEF (ref, cfg_bb->index)
if ((DF_REF_FLAGS (ref) & DF_REF_AT_TOP) == flags)
{
unsigned int regno = DF_REF_REGNO (ref);
machine_mode mode = GET_MODE (DF_REF_REAL_REG (ref));
resource_info resource { mode, regno };
// We rely on the def set being correct.
gcc_checking_assert (bitmap_bit_p (&lr_info->def, regno));
// If the value isn't used later in the block and isn't live
// on exit, we could instead represent the definition as a
// clobber_info. However, that case should be relatively
// rare and set_info is in any case more compact than clobber_info.
set_info *def = allocate (insn, resource);
append_def (def);
m_temp_defs.safe_push (def);
bi.record_reg_def (def);
}
// Model the effect of a memory clobber on an incoming edge by adding
// a fake definition of memory at the start of the block. We don't need
// to add a use of the phi node because memory is implicitly always live.
if (flags == DF_REF_AT_TOP && has_abnormal_call_or_eh_pred_edge_p (cfg_bb))
{
set_info *def = allocate (insn, memory);
append_def (def);
m_temp_defs.safe_push (def);
bi.record_mem_def (def);
}
finish_insn_accesses (insn);
}
// Called while building SSA form using BI. Create insn_infos for all
// relevant instructions in BI.current_bb, i.e. for those that satisfy
// INSN_P.
void
function_info::add_block_contents (build_info &bi)
{
  basic_block cfg_bb = bi.current_bb->cfg_bb ();
  rtx_insn *rtl;
  FOR_BB_INSNS (cfg_bb, rtl)
    {
      if (!INSN_P (rtl))
        continue;
      add_insn_to_block (bi, rtl);
    }
}
// Called while building SSA form using BI. Record live-out register values
// in the phi inputs of successor blocks and create live-out uses where
// appropriate. Record the live-out memory value in BI.bb_mem_live_out.
void
function_info::record_block_live_out (build_info &bi)
{
bb_info *bb = bi.current_bb;
ebb_info *ebb = bi.current_ebb;
basic_block cfg_bb = bb->cfg_bb ();
// Record the live-out register values in the phi inputs of
// successor blocks.
//
// The inputs for a destination block are grouped by incoming edge:
// the inputs for edge E start at index E->dest_idx * num_phis and
// follow the order of the registers in the block's phi bitmap.
edge e;
edge_iterator ei;
FOR_EACH_EDGE (e, ei, cfg_bb->succs)
{
bb_phi_info &phis = bi.bb_phis[e->dest->index];
unsigned int input_i = e->dest_idx * phis.num_phis;
unsigned int regno;
bitmap_iterator out_bi;
EXECUTE_IF_SET_IN_BITMAP (&phis.regs, 0, regno, out_bi)
{
phis.inputs[input_i]
= live_out_value (bb, bi.current_reg_value (regno));
input_i += 1;
}
}
// Add the set of registers that were defined in this BB to the set
// of potentially-live registers defined in the EBB.
bitmap_ior_into (bi.ebb_def_regs, &DF_LR_BB_INFO (cfg_bb)->def);
// Iterate through the registers in LIVE_OUT and see whether we need
// to add a live-out use for them. Only registers that are also in
// BI.ebb_def_regs are considered, and a use is only added if the
// live-out value is defined in the current EBB.
auto record_live_out_regs = [&](bitmap live_out)
{
unsigned int regno;
bitmap_iterator out_bi;
EXECUTE_IF_AND_IN_BITMAP (bi.ebb_def_regs, live_out, 0, regno, out_bi)
{
set_info *value = live_out_value (bb, bi.current_reg_value (regno));
if (value && value->ebb () == ebb)
add_live_out_use (bb, value);
}
};
if (bb == ebb->last_bb ())
// All live-out registers might need live-out uses.
record_live_out_regs (DF_LR_OUT (cfg_bb));
else
// Registers might need live-out uses if they are live on entry
// to a successor block in a different EBB. An edge back to the
// first block of the current EBB is treated in the same way.
FOR_EACH_EDGE (e, ei, cfg_bb->succs)
{
bb_info *dest_bb = this->bb (e->dest);
if (dest_bb->ebb () != ebb || dest_bb == ebb->first_bb ())
record_live_out_regs (DF_LR_IN (e->dest));
}
// Record the live-out memory value.
bi.bb_mem_live_out[cfg_bb->index]
= live_out_value (bb, bi.current_mem_value ());
}
// Add BB and its contents to the SSA information. BI is the build state;
// on return BI.current_bb is BB and BI.current_ebb is BB's EBB.
//
// Each call pushes one entry onto BI.old_def_stack_limit, which the
// matching call to end_block pops again.
void
function_info::start_block (build_info &bi, bb_info *bb)
{
ebb_info *ebb = bb->ebb ();
// We (need to) add all blocks from one EBB before moving on to the next.
bi.current_bb = bb;
if (bb == ebb->first_bb ())
bi.current_ebb = ebb;
else
gcc_assert (bi.current_ebb == ebb);
// Record the start of this block's definitions in the definitions stack.
bi.old_def_stack_limit.safe_push (bi.def_stack.length ());
// Add the block itself.
append_bb (bb);
// If the block starts an EBB, create the phi insn. This insn should exist
// for all EBBs, even if they don't (yet) need phis.
if (bb == ebb->first_bb ())
ebb->set_phi_insn (append_artificial_insn (bb));
// The entry block only has the definitions of the values that are live
// on entry to the function.
if (bb->index () == ENTRY_BLOCK)
{
add_entry_block_defs (bi);
record_block_live_out (bi);
return;
}
if (EDGE_COUNT (bb->cfg_bb ()->preds) == 0)
{
// Leave unreachable blocks empty, since there is no useful
// liveness information for them, and anything they do will
// be wasted work. In a cleaned-up cfg, the only unreachable
// block we should see is the exit block of a noreturn function.
bb->set_head_insn (append_artificial_insn (bb));
bb->set_end_insn (append_artificial_insn (bb));
return;
}
// If the block starts an EBB, create the phi nodes.
if (bb == ebb->first_bb ())
add_phi_nodes (bi);
// Process the contents of the block: the head insn, the real
// instructions (which the exit block doesn't have) and the end insn.
add_artificial_accesses (bi, DF_REF_AT_TOP);
if (bb->index () != EXIT_BLOCK)
add_block_contents (bi);
add_artificial_accesses (bi, df_ref_flags ());
record_block_live_out (bi);
// If we needed to calculate a live-in set for debug purposes,
// reset it to null at the end of the EBB. Convert the underlying
// bitmap to an empty list view, ready for the next calculation.
if (bi.ebb_live_in_for_debug && bb == ebb->last_bb ())
{
bitmap_clear (bi.tmp_ebb_live_in_for_debug);
bitmap_list_view (bi.tmp_ebb_live_in_for_debug);
bi.ebb_live_in_for_debug = nullptr;
}
}
// Finish adding BB and the blocks that it dominates to the SSA information.
void
function_info::end_block (build_info &bi, bb_info *bb)
{
  // Unwind the definition stack to the length that it had when BB was
  // started, restoring the register last_access entries on the way.
  const unsigned int saved_limit = bi.old_def_stack_limit.pop ();
  while (bi.def_stack.length () > saved_limit)
    {
      def_info *entry = bi.def_stack.pop ();

      // An entry that belongs to BB was pushed because it was the first
      // dominating definition, so the previous value was null. Any other
      // entry is itself the previous dominating definition.
      def_info *previous = (entry->bb () == bb ? nullptr : entry);
      bi.last_access[entry->regno () + 1] = previous;
    }
}
// Finish setting up the phi nodes for each block, now that we've added
// the contents of all blocks.
//
// Register phi inputs are taken from the BI.bb_phis input arrays.
// Memory phi inputs that are still null are taken from
// BI.bb_mem_live_out.
void
function_info::populate_phi_inputs (build_info &bi)
{
// Reused for each EBB, to avoid repeated allocation.
auto_vec sorted_phis;
for (ebb_info *ebb : ebbs ())
{
if (!ebb->first_phi ())
continue;
// Get a sorted array of EBB's phi nodes.
basic_block cfg_bb = ebb->first_bb ()->cfg_bb ();
bb_phi_info &phis = bi.bb_phis[cfg_bb->index];
sorted_phis.truncate (0);
for (phi_info *phi : ebb->phis ())
sorted_phis.safe_push (phi);
std::sort (sorted_phis.address (),
sorted_phis.address () + sorted_phis.length (),
compare_access_infos);
// Set the inputs of the non-degenerate register phis. All inputs
// for one edge come before all inputs for the next edge.
//
// INPUTS advances by one entry per register, so that
// inputs[input_i * phis.num_phis] is the current register's input
// for predecessor INPUT_I.
set_info **inputs = phis.inputs;
unsigned int phi_i = 0;
bitmap_iterator bmi;
unsigned int regno;
EXECUTE_IF_SET_IN_BITMAP (&phis.regs, 0, regno, bmi)
{
// Skip intervening degenerate phis.
while (sorted_phis[phi_i]->regno () < regno)
phi_i += 1;
phi_info *phi = sorted_phis[phi_i];
gcc_assert (phi->regno () == regno);
for (unsigned int input_i = 0; input_i < phis.num_preds; ++input_i)
if (set_info *input = inputs[input_i * phis.num_phis])
{
// The phi was created with null inputs, so the use should
// not have a definition yet.
use_info *use = phi->input_use (input_i);
gcc_assert (!use->def ());
use->set_def (input);
add_use (use);
}
phi_i += 1;
inputs += 1;
}
// Fill in the backedge inputs to any memory phi.
// NOTE(review): this relies on a memory phi, if present, being the
// last entry after sorting with compare_access_infos -- confirm.
phi_info *mem_phi = sorted_phis.last ();
if (mem_phi->is_mem () && !mem_phi->is_degenerate ())
{
edge e;
edge_iterator ei;
FOR_EACH_EDGE (e, ei, cfg_bb->preds)
{
use_info *use = mem_phi->input_use (e->dest_idx);
// Only inputs that are still null need to be filled in.
if (!use->def ())
{
use->set_def (bi.bb_mem_live_out[e->src->index]);
add_use (use);
}
}
}
}
}
// Choose between two viable candidate edges for continuing an EBB.
// Return true if NEW_EDGE is the better choice and false if OLD_EDGE
// should be kept.  The relation is not a total ordering.
static bool
better_ebb_edge_p (edge new_edge, edge old_edge)
{
  const auto &new_prob = new_edge->probability;
  const auto &old_prob = old_edge->probability;

  // If both probabilities are known and they differ, the likelier
  // edge wins.
  const bool both_known = (new_prob.initialized_p ()
                           && old_prob.initialized_p ());
  if (both_known && !(old_prob == new_prob))
    return old_prob < new_prob;

  // Otherwise the only reason to switch is that NEW_EDGE is a fallthru
  // edge.  In every other case (OLD_EDGE is the fallthru edge, or neither
  // edge is) we stick with OLD_EDGE.
  return (new_edge->flags & EDGE_FALLTHRU) != 0;
}
// Given that an EBB currently ends with BB, return the block that should
// come next in the EBB, or null if the EBB has to stop at BB.
static basic_block
choose_next_block_in_ebb (basic_block bb)
{
  // An EBB that starts with the entry block and carries on into later
  // blocks would be valid, but not very useful.  Keeping the entry block
  // on its own means that uses of arguments consistently occur through
  // phi nodes, instead of the arguments sometimes appearing to come from
  // an EBB-local definition.
  if (bb->index == ENTRY_BLOCK)
    return nullptr;

  const bool for_speed = optimize_bb_for_speed_p (bb);
  edge chosen = nullptr;
  for (edge candidate : bb->succs)
    {
      // Complex edges are never followed.
      if (candidate->flags & EDGE_COMPLEX)
        continue;

      // The destination must be a block other than the exit block,
      // and CANDIDATE must be its only incoming edge.
      basic_block dest = candidate->dest;
      if (dest->index == EXIT_BLOCK || !single_pred_p (dest))
        continue;

      // Don't mix blocks optimized for speed with blocks optimized
      // for size.
      if (optimize_bb_for_speed_p (dest) != for_speed)
        continue;

      // Take the first viable edge, then only switch for a better one.
      if (!chosen || better_ebb_edge_p (candidate, chosen))
        chosen = candidate;
    }

  if (!chosen)
    return nullptr;
  return chosen->dest;
}
// Partition the function into extended basic blocks.  Create the
// associated ebb_infos and bb_infos, but don't add the bb_infos
// to the function list yet.
//
// As a side-effect, record in BI.bb_to_rpo the position of each block
// in the order in which the blocks were assigned to EBBs.
void
function_info::create_ebbs (build_info &bi)
{
  // Compute the starting reverse postorder.  We tweak this later to try
  // to get better EBB assignments.
  auto *postorder = new int[n_basic_blocks_for_fn (m_fn)];
  unsigned int postorder_num
    = pre_and_rev_post_order_compute (nullptr, postorder, true);
  gcc_assert (int (postorder_num) <= n_basic_blocks_for_fn (m_fn));

  // Iterate over the blocks in reverse postorder.  In cases where
  // multiple possible orders exist, prefer orders that chain blocks
  // together into EBBs.  If multiple possible EBBs exist, try to pick
  // the ones that are most likely to be profitable.
  //
  // BBS collects the blocks of the EBB that is currently being formed
  // and is emptied again once the EBB has been created.  The element
  // type has to be spelled out; the inline capacity just avoids a heap
  // allocation for short EBBs.
  auto_vec<bb_info *, 16> bbs;
  unsigned int next_bb_index = 0;
  for (unsigned int i = 0; i < postorder_num; ++i)
    // Only start an EBB at a block that has no entry in m_bbs yet.
    // NOTE(review): presumably create_bb_info fills in m_bbs, so that
    // blocks chained into an earlier EBB are skipped here -- confirm.
    if (!m_bbs[postorder[i]])
      {
        // Choose and create the blocks that should form the next EBB.
        basic_block cfg_bb = BASIC_BLOCK_FOR_FN (m_fn, postorder[i]);
        do
          {
            // Record the chosen block order in a new RPO.
            bi.bb_to_rpo[cfg_bb->index] = next_bb_index++;
            bbs.safe_push (create_bb_info (cfg_bb));
            cfg_bb = choose_next_block_in_ebb (cfg_bb);
          }
        while (cfg_bb);

        // Create the EBB itself, spanning the first and last chosen
        // blocks, and point each of its blocks back at it.  The type
        // to allocate must be given explicitly.
        auto *ebb = allocate<ebb_info> (bbs[0], bbs.last ());
        for (bb_info *bb : bbs)
          bb->set_ebb (ebb);
        bbs.truncate (0);
      }

  delete[] postorder;
}
// Partition the function's blocks into EBBs and build SSA form for all
// EBBs in the function.
void
function_info::process_all_blocks ()
{
auto temps = temp_watermark ();
unsigned int num_bb_indices = last_basic_block_for_fn (m_fn);
build_info bi (m_num_regs, num_bb_indices);
// ??? There is no dominance information associated with the exit block,
// so work out its immediate dominator using predecessor blocks.
for (edge e : EXIT_BLOCK_PTR_FOR_FN (m_fn)->preds)
if (bi.exit_block_dominator)
bi.exit_block_dominator
= nearest_common_dominator (CDI_DOMINATORS,
bi.exit_block_dominator, e->src);
else
bi.exit_block_dominator = e->src;
calculate_potential_phi_regs (bi);
create_ebbs (bi);
place_phis (bi);
bb_walker (this, bi).walk (ENTRY_BLOCK_PTR_FOR_FN (m_fn));
populate_phi_inputs (bi);
if (flag_checking)
{
// The definition stack should be empty and all register definitions
// should be back in their original undefined state.
gcc_assert (bi.def_stack.is_empty ()
&& bi.old_def_stack_limit.is_empty ());
for (unsigned int regno = 0; regno < m_num_regs; ++regno)
gcc_assert (!bi.last_access[regno + 1]);
}
}
// Print a description of CALL_CLOBBERS to PP.  CALL_CLOBBERS can be null,
// in which case print the marker "<null>" rather than nothing at all,
// so that a dump of a null pointer is distinguishable from an empty
// description.
void
rtl_ssa::pp_ebb_call_clobbers (pretty_printer *pp,
                               const ebb_call_clobbers_info *call_clobbers)
{
  if (!call_clobbers)
    pp_string (pp, "<null>");
  else
    call_clobbers->print_full (pp);
}
// Print a description of BB to PP.  BB can be null, in which case print
// the marker "<null>" rather than nothing at all, so that a dump of a
// null pointer is distinguishable from an empty description.
void
rtl_ssa::pp_bb (pretty_printer *pp, const bb_info *bb)
{
  if (!bb)
    pp_string (pp, "<null>");
  else
    bb->print_full (pp);
}
// Print a description of EBB to PP.  EBB can be null, in which case print
// the marker "<null>" rather than nothing at all, so that a dump of a
// null pointer is distinguishable from an empty description.
void
rtl_ssa::pp_ebb (pretty_printer *pp, const ebb_info *ebb)
{
  if (!ebb)
    pp_string (pp, "<null>");
  else
    ebb->print_full (pp);
}
// Print a description of CALL_CLOBBERS to FILE.
void
dump (FILE *file, const ebb_call_clobbers_info *call_clobbers)
{
dump_using (file, pp_ebb_call_clobbers, call_clobbers);
}
// Print a description of BB to FILE.
void
dump (FILE *file, const bb_info *bb)
{
dump_using (file, pp_bb, bb);
}
// Print a description of EBB to FILE.
void
dump (FILE *file, const ebb_info *ebb)
{
dump_using (file, pp_ebb, ebb);
}
// Entry points for use from a debugger.  Each one sends the output of
// the corresponding dump routine to stderr.
void
debug (const ebb_call_clobbers_info *x)
{
  dump (stderr, x);
}

void
debug (const bb_info *x)
{
  dump (stderr, x);
}

void
debug (const ebb_info *x)
{
  dump (stderr, x);
}