/* Search for references that a functions loads or stores.
Copyright (C) 2020-2021 Free Software Foundation, Inc.
Contributed by David Cepelik and Jan Hubicka
This file is part of GCC.
GCC is free software; you can redistribute it and/or modify it under
the terms of the GNU General Public License as published by the Free
Software Foundation; either version 3, or (at your option) any later
version.
GCC is distributed in the hope that it will be useful, but WITHOUT ANY
WARRANTY; without even the implied warranty of MERCHANTABILITY or
FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
for more details.
You should have received a copy of the GNU General Public License
along with GCC; see the file COPYING3. If not see
. */
/* Mod/ref pass records summary about loads and stores performed by the
function. This is later used by alias analysis to disambiguate memory
accesses across function calls.
This file contains a tree pass and an IPA pass. Both performs the same
analysis however tree pass is executed during early and late optimization
passes to propagate info downwards in the compilation order. IPA pass
propagates across the callgraph and is able to handle recursion and works on
whole program during link-time analysis.
LTO mode differs from the local mode by not recording alias sets but types
that are translated to alias sets later. This is necessary in order stream
the information because the alias sets are rebuild at stream-in time and may
not correspond to ones seen during analysis. For this reason part of
analysis is duplicated.
The following information is computed
1) load/store access tree described in ipa-modref-tree.h
This is used by tree-ssa-alias to disambiguate load/stores
2) EAF flags used by points-to analysis (in tree-ssa-structlias).
and defined in tree-core.h.
and stored to optimization_summaries.
There are multiple summaries computed and used during the propagation:
- summaries holds summaries from analysis to IPA propagation
time.
- summaries_lto is same as summaries but holds them in a format
that can be streamed (as described above).
- fnspec_summary holds fnspec strings for call. This is
necessary because gimple_call_fnspec performs additional
analysis except for looking callee fndecl.
- escape_summary holds escape points for given call edge.
That is a vector recording what function parmaeters
may escape to a function call (and with what parameter index). */
#include "config.h"
#include "system.h"
#include "coretypes.h"
#include "backend.h"
#include "tree.h"
#include "gimple.h"
#include "alloc-pool.h"
#include "tree-pass.h"
#include "gimple-iterator.h"
#include "tree-dfa.h"
#include "cgraph.h"
#include "ipa-utils.h"
#include "symbol-summary.h"
#include "gimple-pretty-print.h"
#include "gimple-walk.h"
#include "print-tree.h"
#include "tree-streamer.h"
#include "alias.h"
#include "calls.h"
#include "ipa-modref-tree.h"
#include "ipa-modref.h"
#include "value-range.h"
#include "ipa-prop.h"
#include "ipa-fnsummary.h"
#include "attr-fnspec.h"
#include "symtab-clones.h"
#include "gimple-ssa.h"
#include "tree-phinodes.h"
#include "tree-ssa-operands.h"
#include "ssa-iterators.h"
#include "stringpool.h"
#include "tree-ssanames.h"
namespace {
/* We record fnspec specifiers for call edges since they depends on actual
gimple statements. */
class fnspec_summary
{
public:
char *fnspec;
fnspec_summary ()
: fnspec (NULL)
{
}
~fnspec_summary ()
{
free (fnspec);
}
};
/* Summary holding fnspec string for a given call. */
class fnspec_summaries_t : public call_summary
{
public:
fnspec_summaries_t (symbol_table *symtab)
: call_summary (symtab) {}
/* Hook that is called by summary when an edge is duplicated. */
virtual void duplicate (cgraph_edge *,
cgraph_edge *,
fnspec_summary *src,
fnspec_summary *dst)
{
dst->fnspec = xstrdup (src->fnspec);
}
};
static fnspec_summaries_t *fnspec_summaries = NULL;
/* Escape summary holds a vector of param indexes that escape to
a given call. */
struct escape_entry
{
/* Parameter that escapes at a given call. */
unsigned int parm_index;
/* Argument it escapes to. */
unsigned int arg;
/* Minimal flags known about the argument. */
eaf_flags_t min_flags;
/* Does it escape directly or indirectly? */
bool direct;
};
/* Dump EAF flags. */
static void
dump_eaf_flags (FILE *out, int flags, bool newline = true)
{
if (flags & EAF_DIRECT)
fprintf (out, " direct");
if (flags & EAF_NOCLOBBER)
fprintf (out, " noclobber");
if (flags & EAF_NOESCAPE)
fprintf (out, " noescape");
if (flags & EAF_NODIRECTESCAPE)
fprintf (out, " nodirectescape");
if (flags & EAF_UNUSED)
fprintf (out, " unused");
if (flags & EAF_NOT_RETURNED)
fprintf (out, " not_returned");
if (flags & EAF_NOREAD)
fprintf (out, " noread");
if (newline)
fprintf (out, "\n");
}
struct escape_summary
{
auto_vec esc;
void dump (FILE *out)
{
for (unsigned int i = 0; i < esc.length (); i++)
{
fprintf (out, " parm %i arg %i %s min:",
esc[i].parm_index,
esc[i].arg,
esc[i].direct ? "(direct)" : "(indirect)");
dump_eaf_flags (out, esc[i].min_flags, false);
}
fprintf (out, "\n");
}
};
class escape_summaries_t : public call_summary
{
public:
escape_summaries_t (symbol_table *symtab)
: call_summary (symtab) {}
/* Hook that is called by summary when an edge is duplicated. */
virtual void duplicate (cgraph_edge *,
cgraph_edge *,
escape_summary *src,
escape_summary *dst)
{
dst->esc = src->esc.copy ();
}
};
static escape_summaries_t *escape_summaries = NULL;
} /* ANON namespace: GTY annotated summaries can not be anonymous. */
/* Class (from which there is one global instance) that holds modref summaries
for all analyzed functions. */
class GTY((user)) modref_summaries
: public fast_function_summary
{
public:
modref_summaries (symbol_table *symtab)
: fast_function_summary (symtab) {}
virtual void insert (cgraph_node *, modref_summary *state);
virtual void duplicate (cgraph_node *src_node,
cgraph_node *dst_node,
modref_summary *src_data,
modref_summary *dst_data);
static modref_summaries *create_ggc (symbol_table *symtab)
{
return new (ggc_alloc_no_dtor ())
modref_summaries (symtab);
}
};
class modref_summary_lto;
/* Class (from which there is one global instance) that holds modref summaries
for all analyzed functions. */
class GTY((user)) modref_summaries_lto
: public fast_function_summary
{
public:
modref_summaries_lto (symbol_table *symtab)
: fast_function_summary (symtab),
propagated (false) {}
virtual void insert (cgraph_node *, modref_summary_lto *state);
virtual void duplicate (cgraph_node *src_node,
cgraph_node *dst_node,
modref_summary_lto *src_data,
modref_summary_lto *dst_data);
static modref_summaries_lto *create_ggc (symbol_table *symtab)
{
return new (ggc_alloc_no_dtor ())
modref_summaries_lto (symtab);
}
bool propagated;
};
/* Global variable holding all modref summaries
(from analysis to IPA propagation time). */
static GTY(()) fast_function_summary
*summaries;
/* Global variable holding all modref optimization summaries
(from IPA propagation time or used by local optimization pass). */
static GTY(()) fast_function_summary
*optimization_summaries;
/* LTO summaries hold info from analysis to LTO streaming or from LTO
stream-in through propagation to LTO stream-out. */
static GTY(()) fast_function_summary
*summaries_lto;
/* Summary for a single function which this pass produces. */
modref_summary::modref_summary ()
: loads (NULL), stores (NULL), writes_errno (NULL)
{
}
modref_summary::~modref_summary ()
{
if (loads)
ggc_delete (loads);
if (stores)
ggc_delete (stores);
}
/* All flags that are implied by the ECF_CONST functions. */
const int implicit_const_eaf_flags = EAF_DIRECT | EAF_NOCLOBBER | EAF_NOESCAPE
| EAF_NODIRECTESCAPE | EAF_NOREAD;
/* All flags that are implied by the ECF_PURE function. */
const int implicit_pure_eaf_flags = EAF_NOCLOBBER | EAF_NOESCAPE
| EAF_NODIRECTESCAPE;
/* All flags implied when we know we can ignore stores (i.e. when handling
call to noreturn). */
const int ignore_stores_eaf_flags = EAF_DIRECT | EAF_NOCLOBBER | EAF_NOESCAPE
| EAF_NODIRECTESCAPE;
/* Remove all flags from EAF_FLAGS that are implied by ECF_FLAGS and not
useful to track. If returns_void is true moreover clear
EAF_NOT_RETURNED. */
static int
remove_useless_eaf_flags (int eaf_flags, int ecf_flags, bool returns_void)
{
if (ecf_flags & ECF_NOVOPS)
return 0;
if (ecf_flags & ECF_CONST)
eaf_flags &= ~implicit_const_eaf_flags;
else if (ecf_flags & ECF_PURE)
eaf_flags &= ~implicit_pure_eaf_flags;
else if ((ecf_flags & ECF_NORETURN) || returns_void)
eaf_flags &= ~EAF_NOT_RETURNED;
/* Only NOCLOBBER or DIRECT flags alone are not useful (see comments
in tree-ssa-alias.c). Give up earlier. */
if ((eaf_flags & ~(EAF_DIRECT | EAF_NOCLOBBER)) == 0)
return 0;
return eaf_flags;
}
/* Return true if FLAGS holds some useful information. */
static bool
eaf_flags_useful_p (vec &flags, int ecf_flags)
{
for (unsigned i = 0; i < flags.length (); i++)
if (remove_useless_eaf_flags (flags[i], ecf_flags, false))
return true;
return false;
}
/* Return true if summary is potentially useful for optimization.
If CHECK_FLAGS is false assume that arg_flags are useful. */
bool
modref_summary::useful_p (int ecf_flags, bool check_flags)
{
if (ecf_flags & ECF_NOVOPS)
return false;
if (arg_flags.length () && !check_flags)
return true;
if (check_flags && eaf_flags_useful_p (arg_flags, ecf_flags))
return true;
arg_flags.release ();
if (ecf_flags & ECF_CONST)
return false;
if (loads && !loads->every_base)
return true;
if (ecf_flags & ECF_PURE)
return false;
return stores && !stores->every_base;
}
/* Single function summary used for LTO. */
typedef modref_tree modref_records_lto;
struct GTY(()) modref_summary_lto
{
/* Load and stores in functions using types rather then alias sets.
This is necessary to make the information streamable for LTO but is also
more verbose and thus more likely to hit the limits. */
modref_records_lto *loads;
modref_records_lto *stores;
auto_vec GTY((skip)) arg_flags;
bool writes_errno;
modref_summary_lto ();
~modref_summary_lto ();
void dump (FILE *);
bool useful_p (int ecf_flags, bool check_flags = true);
};
/* Summary for a single function which this pass produces. */
modref_summary_lto::modref_summary_lto ()
: loads (NULL), stores (NULL), writes_errno (NULL)
{
}
modref_summary_lto::~modref_summary_lto ()
{
if (loads)
ggc_delete (loads);
if (stores)
ggc_delete (stores);
}
/* Return true if lto summary is potentially useful for optimization.
If CHECK_FLAGS is false assume that arg_flags are useful. */
bool
modref_summary_lto::useful_p (int ecf_flags, bool check_flags)
{
if (ecf_flags & ECF_NOVOPS)
return false;
if (arg_flags.length () && !check_flags)
return true;
if (check_flags && eaf_flags_useful_p (arg_flags, ecf_flags))
return true;
arg_flags.release ();
if (ecf_flags & ECF_CONST)
return false;
if (loads && !loads->every_base)
return true;
if (ecf_flags & ECF_PURE)
return false;
return stores && !stores->every_base;
}
/* Dump A to OUT. */
static void
dump_access (modref_access_node *a, FILE *out)
{
fprintf (out, " access:");
if (a->parm_index != -1)
{
fprintf (out, " Parm %i", a->parm_index);
if (a->parm_offset_known)
{
fprintf (out, " param offset:");
print_dec ((poly_int64_pod)a->parm_offset, out, SIGNED);
}
}
if (a->range_info_useful_p ())
{
fprintf (out, " offset:");
print_dec ((poly_int64_pod)a->offset, out, SIGNED);
fprintf (out, " size:");
print_dec ((poly_int64_pod)a->size, out, SIGNED);
fprintf (out, " max_size:");
print_dec ((poly_int64_pod)a->max_size, out, SIGNED);
if (a->adjustments)
fprintf (out, " adjusted %i times", a->adjustments);
}
fprintf (out, "\n");
}
/* Dump records TT to OUT. */
static void
dump_records (modref_records *tt, FILE *out)
{
fprintf (out, " Limits: %i bases, %i refs\n",
(int)tt->max_bases, (int)tt->max_refs);
if (tt->every_base)
{
fprintf (out, " Every base\n");
return;
}
size_t i;
modref_base_node *n;
FOR_EACH_VEC_SAFE_ELT (tt->bases, i, n)
{
fprintf (out, " Base %i: alias set %i\n", (int)i, n->base);
if (n->every_ref)
{
fprintf (out, " Every ref\n");
continue;
}
size_t j;
modref_ref_node *r;
FOR_EACH_VEC_SAFE_ELT (n->refs, j, r)
{
fprintf (out, " Ref %i: alias set %i\n", (int)j, r->ref);
if (r->every_access)
{
fprintf (out, " Every access\n");
continue;
}
size_t k;
modref_access_node *a;
FOR_EACH_VEC_SAFE_ELT (r->accesses, k, a)
dump_access (a, out);
}
}
}
/* Dump records TT to OUT. */
static void
dump_lto_records (modref_records_lto *tt, FILE *out)
{
fprintf (out, " Limits: %i bases, %i refs\n",
(int)tt->max_bases, (int)tt->max_refs);
if (tt->every_base)
{
fprintf (out, " Every base\n");
return;
}
size_t i;
modref_base_node *n;
FOR_EACH_VEC_SAFE_ELT (tt->bases, i, n)
{
fprintf (out, " Base %i:", (int)i);
print_generic_expr (dump_file, n->base);
fprintf (out, " (alias set %i)\n",
n->base ? get_alias_set (n->base) : 0);
if (n->every_ref)
{
fprintf (out, " Every ref\n");
continue;
}
size_t j;
modref_ref_node *r;
FOR_EACH_VEC_SAFE_ELT (n->refs, j, r)
{
fprintf (out, " Ref %i:", (int)j);
print_generic_expr (dump_file, r->ref);
fprintf (out, " (alias set %i)\n",
r->ref ? get_alias_set (r->ref) : 0);
if (r->every_access)
{
fprintf (out, " Every access\n");
continue;
}
size_t k;
modref_access_node *a;
FOR_EACH_VEC_SAFE_ELT (r->accesses, k, a)
dump_access (a, out);
}
}
}
/* Dump all escape points of NODE to OUT. */
static void
dump_modref_edge_summaries (FILE *out, cgraph_node *node, int depth)
{
int i = 0;
if (!escape_summaries)
return;
for (cgraph_edge *e = node->indirect_calls; e; e = e->next_callee)
{
class escape_summary *sum = escape_summaries->get (e);
if (sum)
{
fprintf (out, "%*sIndirect call %i in %s escapes:",
depth, "", i, node->dump_name ());
sum->dump (out);
}
i++;
}
for (cgraph_edge *e = node->callees; e; e = e->next_callee)
{
if (!e->inline_failed)
dump_modref_edge_summaries (out, e->callee, depth + 1);
class escape_summary *sum = escape_summaries->get (e);
if (sum)
{
fprintf (out, "%*sCall %s->%s escapes:", depth, "",
node->dump_name (), e->callee->dump_name ());
sum->dump (out);
}
class fnspec_summary *fsum = fnspec_summaries->get (e);
if (fsum)
{
fprintf (out, "%*sCall %s->%s fnspec: %s\n", depth, "",
node->dump_name (), e->callee->dump_name (),
fsum->fnspec);
}
}
}
/* Remove all call edge summaries associated with NODE. */
static void
remove_modref_edge_summaries (cgraph_node *node)
{
if (!escape_summaries)
return;
for (cgraph_edge *e = node->indirect_calls; e; e = e->next_callee)
escape_summaries->remove (e);
for (cgraph_edge *e = node->callees; e; e = e->next_callee)
{
if (!e->inline_failed)
remove_modref_edge_summaries (e->callee);
escape_summaries->remove (e);
fnspec_summaries->remove (e);
}
}
/* Dump summary. */
void
modref_summary::dump (FILE *out)
{
if (loads)
{
fprintf (out, " loads:\n");
dump_records (loads, out);
}
if (stores)
{
fprintf (out, " stores:\n");
dump_records (stores, out);
}
if (writes_errno)
fprintf (out, " Writes errno\n");
if (arg_flags.length ())
{
for (unsigned int i = 0; i < arg_flags.length (); i++)
if (arg_flags[i])
{
fprintf (out, " parm %i flags:", i);
dump_eaf_flags (out, arg_flags[i]);
}
}
}
/* Dump summary. */
void
modref_summary_lto::dump (FILE *out)
{
fprintf (out, " loads:\n");
dump_lto_records (loads, out);
fprintf (out, " stores:\n");
dump_lto_records (stores, out);
if (writes_errno)
fprintf (out, " Writes errno\n");
if (arg_flags.length ())
{
for (unsigned int i = 0; i < arg_flags.length (); i++)
if (arg_flags[i])
{
fprintf (out, " parm %i flags:", i);
dump_eaf_flags (out, arg_flags[i]);
}
}
}
/* Get function summary for FUNC if it exists, return NULL otherwise. */
modref_summary *
get_modref_function_summary (cgraph_node *func)
{
/* Avoid creation of the summary too early (e.g. when front-end calls us). */
if (!optimization_summaries)
return NULL;
/* A single function body may be represented by multiple symbols with
different visibility. For example, if FUNC is an interposable alias,
we don't want to return anything, even if we have summary for the target
function. */
enum availability avail;
func = func->function_or_virtual_thunk_symbol
(&avail, current_function_decl ?
cgraph_node::get (current_function_decl) : NULL);
if (avail <= AVAIL_INTERPOSABLE)
return NULL;
modref_summary *r = optimization_summaries->get (func);
return r;
}
/* Construct modref_access_node from REF. */
static modref_access_node
get_access (ao_ref *ref)
{
tree base;
base = ao_ref_base (ref);
modref_access_node a = {ref->offset, ref->size, ref->max_size,
0, -1, false, 0};
if (TREE_CODE (base) == MEM_REF || TREE_CODE (base) == TARGET_MEM_REF)
{
tree memref = base;
base = TREE_OPERAND (base, 0);
if (TREE_CODE (base) == SSA_NAME
&& SSA_NAME_IS_DEFAULT_DEF (base)
&& TREE_CODE (SSA_NAME_VAR (base)) == PARM_DECL)
{
a.parm_index = 0;
for (tree t = DECL_ARGUMENTS (current_function_decl);
t != SSA_NAME_VAR (base); t = DECL_CHAIN (t))
{
if (!t)
{
a.parm_index = -1;
break;
}
a.parm_index++;
}
if (TREE_CODE (memref) == MEM_REF)
{
a.parm_offset_known
= wi::to_poly_wide (TREE_OPERAND
(memref, 1)).to_shwi (&a.parm_offset);
}
else
a.parm_offset_known = false;
}
else
a.parm_index = -1;
}
else
a.parm_index = -1;
return a;
}
/* Record access into the modref_records data structure. */
static void
record_access (modref_records *tt, ao_ref *ref)
{
alias_set_type base_set = !flag_strict_aliasing ? 0
: ao_ref_base_alias_set (ref);
alias_set_type ref_set = !flag_strict_aliasing ? 0
: (ao_ref_alias_set (ref));
modref_access_node a = get_access (ref);
if (dump_file)
{
fprintf (dump_file, " - Recording base_set=%i ref_set=%i parm=%i\n",
base_set, ref_set, a.parm_index);
}
tt->insert (base_set, ref_set, a, false);
}
/* IPA version of record_access_tree. */
static void
record_access_lto (modref_records_lto *tt, ao_ref *ref)
{
/* get_alias_set sometimes use different type to compute the alias set
than TREE_TYPE (base). Do same adjustments. */
tree base_type = NULL_TREE, ref_type = NULL_TREE;
if (flag_strict_aliasing)
{
tree base;
base = ref->ref;
while (handled_component_p (base))
base = TREE_OPERAND (base, 0);
base_type = reference_alias_ptr_type_1 (&base);
if (!base_type)
base_type = TREE_TYPE (base);
else
base_type = TYPE_REF_CAN_ALIAS_ALL (base_type)
? NULL_TREE : TREE_TYPE (base_type);
tree ref_expr = ref->ref;
ref_type = reference_alias_ptr_type_1 (&ref_expr);
if (!ref_type)
ref_type = TREE_TYPE (ref_expr);
else
ref_type = TYPE_REF_CAN_ALIAS_ALL (ref_type)
? NULL_TREE : TREE_TYPE (ref_type);
/* Sanity check that we are in sync with what get_alias_set does. */
gcc_checking_assert ((!base_type && !ao_ref_base_alias_set (ref))
|| get_alias_set (base_type)
== ao_ref_base_alias_set (ref));
gcc_checking_assert ((!ref_type && !ao_ref_alias_set (ref))
|| get_alias_set (ref_type)
== ao_ref_alias_set (ref));
/* Do not bother to record types that have no meaningful alias set.
Also skip variably modified types since these go to local streams. */
if (base_type && (!get_alias_set (base_type)
|| variably_modified_type_p (base_type, NULL_TREE)))
base_type = NULL_TREE;
if (ref_type && (!get_alias_set (ref_type)
|| variably_modified_type_p (ref_type, NULL_TREE)))
ref_type = NULL_TREE;
}
modref_access_node a = get_access (ref);
if (dump_file)
{
fprintf (dump_file, " - Recording base type:");
print_generic_expr (dump_file, base_type);
fprintf (dump_file, " (alias set %i) ref type:",
base_type ? get_alias_set (base_type) : 0);
print_generic_expr (dump_file, ref_type);
fprintf (dump_file, " (alias set %i) parm:%i\n",
ref_type ? get_alias_set (ref_type) : 0,
a.parm_index);
}
tt->insert (base_type, ref_type, a, false);
}
/* Returns true if and only if we should store the access to EXPR.
Some accesses, e.g. loads from automatic variables, are not interesting. */
static bool
record_access_p (tree expr)
{
if (refs_local_or_readonly_memory_p (expr))
{
if (dump_file)
fprintf (dump_file, " - Read-only or local, ignoring.\n");
return false;
}
return true;
}
/* Return true if ECF flags says that return value can be ignored. */
static bool
ignore_retval_p (tree caller, int flags)
{
if ((flags & (ECF_NORETURN | ECF_NOTHROW)) == (ECF_NORETURN | ECF_NOTHROW)
|| (!opt_for_fn (caller, flag_exceptions) && (flags & ECF_NORETURN)))
return true;
return false;
}
/* Return true if ECF flags says that stores can be ignored. */
static bool
ignore_stores_p (tree caller, int flags)
{
if (flags & (ECF_PURE | ECF_CONST | ECF_NOVOPS))
return true;
if ((flags & (ECF_NORETURN | ECF_NOTHROW)) == (ECF_NORETURN | ECF_NOTHROW)
|| (!opt_for_fn (caller, flag_exceptions) && (flags & ECF_NORETURN)))
return true;
return false;
}
/* Determine parm_map for argument I of STMT. */
modref_parm_map
parm_map_for_arg (gimple *stmt, int i)
{
tree op = gimple_call_arg (stmt, i);
bool offset_known;
poly_int64 offset;
struct modref_parm_map parm_map;
parm_map.parm_offset_known = false;
parm_map.parm_offset = 0;
offset_known = unadjusted_ptr_and_unit_offset (op, &op, &offset);
if (TREE_CODE (op) == SSA_NAME
&& SSA_NAME_IS_DEFAULT_DEF (op)
&& TREE_CODE (SSA_NAME_VAR (op)) == PARM_DECL)
{
int index = 0;
for (tree t = DECL_ARGUMENTS (current_function_decl);
t != SSA_NAME_VAR (op); t = DECL_CHAIN (t))
{
if (!t)
{
index = -1;
break;
}
index++;
}
parm_map.parm_index = index;
parm_map.parm_offset_known = offset_known;
parm_map.parm_offset = offset;
}
else if (points_to_local_or_readonly_memory_p (op))
parm_map.parm_index = -2;
else
parm_map.parm_index = -1;
return parm_map;
}
/* Merge side effects of call STMT to function with CALLEE_SUMMARY
int CUR_SUMMARY. Return true if something changed.
If IGNORE_STORES is true, do not merge stores.
If RECORD_ADJUSTMENTS is true cap number of adjustments to
a given access to make dataflow finite. */
bool
merge_call_side_effects (modref_summary *cur_summary,
gimple *stmt, modref_summary *callee_summary,
bool ignore_stores, cgraph_node *callee_node,
bool record_adjustments)
{
auto_vec parm_map;
bool changed = false;
/* We can not safely optimize based on summary of callee if it does
not always bind to current def: it is possible that memory load
was optimized out earlier which may not happen in the interposed
variant. */
if (!callee_node->binds_to_current_def_p ())
{
if (dump_file)
fprintf (dump_file, " - May be interposed: collapsing loads.\n");
cur_summary->loads->collapse ();
}
if (dump_file)
fprintf (dump_file, " - Merging side effects of %s with parm map:",
callee_node->dump_name ());
parm_map.safe_grow_cleared (gimple_call_num_args (stmt), true);
for (unsigned i = 0; i < gimple_call_num_args (stmt); i++)
{
parm_map[i] = parm_map_for_arg (stmt, i);
if (dump_file)
{
fprintf (dump_file, " %i", parm_map[i].parm_index);
if (parm_map[i].parm_offset_known)
{
fprintf (dump_file, " offset:");
print_dec ((poly_int64_pod)parm_map[i].parm_offset,
dump_file, SIGNED);
}
}
}
if (dump_file)
fprintf (dump_file, "\n");
/* Merge with callee's summary. */
changed |= cur_summary->loads->merge (callee_summary->loads, &parm_map,
record_adjustments);
if (!ignore_stores)
{
changed |= cur_summary->stores->merge (callee_summary->stores,
&parm_map,
record_adjustments);
if (!cur_summary->writes_errno
&& callee_summary->writes_errno)
{
cur_summary->writes_errno = true;
changed = true;
}
}
return changed;
}
/* Return access mode for argument I of call STMT with FNSPEC. */
static modref_access_node
get_access_for_fnspec (gcall *call, attr_fnspec &fnspec,
unsigned int i, modref_parm_map &map)
{
tree size = NULL_TREE;
unsigned int size_arg;
if (!fnspec.arg_specified_p (i))
;
else if (fnspec.arg_max_access_size_given_by_arg_p (i, &size_arg))
size = gimple_call_arg (call, size_arg);
else if (fnspec.arg_access_size_given_by_type_p (i))
{
tree callee = gimple_call_fndecl (call);
tree t = TYPE_ARG_TYPES (TREE_TYPE (callee));
for (unsigned int p = 0; p < i; p++)
t = TREE_CHAIN (t);
size = TYPE_SIZE_UNIT (TREE_TYPE (TREE_VALUE (t)));
}
modref_access_node a = {0, -1, -1,
map.parm_offset, map.parm_index,
map.parm_offset_known, 0};
poly_int64 size_hwi;
if (size
&& poly_int_tree_p (size, &size_hwi)
&& coeffs_in_range_p (size_hwi, 0,
HOST_WIDE_INT_MAX / BITS_PER_UNIT))
{
a.size = -1;
a.max_size = size_hwi << LOG2_BITS_PER_UNIT;
}
return a;
}
/* Collapse loads and return true if something changed. */
static bool
collapse_loads (modref_summary *cur_summary,
modref_summary_lto *cur_summary_lto)
{
bool changed = false;
if (cur_summary && !cur_summary->loads->every_base)
{
cur_summary->loads->collapse ();
changed = true;
}
if (cur_summary_lto
&& !cur_summary_lto->loads->every_base)
{
cur_summary_lto->loads->collapse ();
changed = true;
}
return changed;
}
/* Collapse loads and return true if something changed. */
static bool
collapse_stores (modref_summary *cur_summary,
modref_summary_lto *cur_summary_lto)
{
bool changed = false;
if (cur_summary && !cur_summary->stores->every_base)
{
cur_summary->stores->collapse ();
changed = true;
}
if (cur_summary_lto
&& !cur_summary_lto->stores->every_base)
{
cur_summary_lto->stores->collapse ();
changed = true;
}
return changed;
}
/* Apply side effects of call STMT to CUR_SUMMARY using FNSPEC.
If IGNORE_STORES is true ignore them.
Return false if no useful summary can be produced. */
static bool
process_fnspec (modref_summary *cur_summary,
modref_summary_lto *cur_summary_lto,
gcall *call, bool ignore_stores)
{
attr_fnspec fnspec = gimple_call_fnspec (call);
if (!fnspec.known_p ())
{
if (dump_file && gimple_call_builtin_p (call, BUILT_IN_NORMAL))
fprintf (dump_file, " Builtin with no fnspec: %s\n",
IDENTIFIER_POINTER (DECL_NAME (gimple_call_fndecl (call))));
if (ignore_stores)
{
collapse_loads (cur_summary, cur_summary_lto);
return true;
}
return false;
}
if (fnspec.global_memory_read_p ())
collapse_loads (cur_summary, cur_summary_lto);
else
{
for (unsigned int i = 0; i < gimple_call_num_args (call); i++)
if (!POINTER_TYPE_P (TREE_TYPE (gimple_call_arg (call, i))))
;
else if (!fnspec.arg_specified_p (i)
|| fnspec.arg_maybe_read_p (i))
{
modref_parm_map map = parm_map_for_arg (call, i);
if (map.parm_index == -2)
continue;
if (map.parm_index == -1)
{
collapse_loads (cur_summary, cur_summary_lto);
break;
}
if (cur_summary)
cur_summary->loads->insert (0, 0,
get_access_for_fnspec (call,
fnspec, i,
map),
false);
if (cur_summary_lto)
cur_summary_lto->loads->insert (0, 0,
get_access_for_fnspec (call,
fnspec, i,
map),
false);
}
}
if (ignore_stores)
return true;
if (fnspec.global_memory_written_p ())
collapse_stores (cur_summary, cur_summary_lto);
else
{
for (unsigned int i = 0; i < gimple_call_num_args (call); i++)
if (!POINTER_TYPE_P (TREE_TYPE (gimple_call_arg (call, i))))
;
else if (!fnspec.arg_specified_p (i)
|| fnspec.arg_maybe_written_p (i))
{
modref_parm_map map = parm_map_for_arg (call, i);
if (map.parm_index == -2)
continue;
if (map.parm_index == -1)
{
collapse_stores (cur_summary, cur_summary_lto);
break;
}
if (cur_summary)
cur_summary->stores->insert (0, 0,
get_access_for_fnspec (call,
fnspec, i,
map),
false);
if (cur_summary_lto)
cur_summary_lto->stores->insert (0, 0,
get_access_for_fnspec (call,
fnspec, i,
map),
false);
}
if (fnspec.errno_maybe_written_p () && flag_errno_math)
{
if (cur_summary)
cur_summary->writes_errno = true;
if (cur_summary_lto)
cur_summary_lto->writes_errno = true;
}
}
return true;
}
/* Analyze function call STMT in function F.
Remember recursive calls in RECURSIVE_CALLS. */
static bool
analyze_call (modref_summary *cur_summary, modref_summary_lto *cur_summary_lto,
gcall *stmt, vec *recursive_calls)
{
/* Check flags on the function call. In certain cases, analysis can be
simplified. */
int flags = gimple_call_flags (stmt);
if (flags & (ECF_CONST | ECF_NOVOPS))
{
if (dump_file)
fprintf (dump_file,
" - ECF_CONST | ECF_NOVOPS, ignoring all stores and all loads "
"except for args.\n");
return true;
}
/* Pure functions do not affect global memory. Stores by functions which are
noreturn and do not throw can safely be ignored. */
bool ignore_stores = ignore_stores_p (current_function_decl, flags);
/* Next, we try to get the callee's function declaration. The goal is to
merge their summary with ours. */
tree callee = gimple_call_fndecl (stmt);
/* Check if this is an indirect call. */
if (!callee)
{
if (dump_file)
fprintf (dump_file, gimple_call_internal_p (stmt)
? " - Internal call" : " - Indirect call.\n");
return process_fnspec (cur_summary, cur_summary_lto, stmt, ignore_stores);
}
/* We only need to handle internal calls in IPA mode. */
gcc_checking_assert (!cur_summary_lto);
struct cgraph_node *callee_node = cgraph_node::get_create (callee);
/* If this is a recursive call, the target summary is the same as ours, so
there's nothing to do. */
if (recursive_call_p (current_function_decl, callee))
{
recursive_calls->safe_push (stmt);
if (dump_file)
fprintf (dump_file, " - Skipping recursive call.\n");
return true;
}
gcc_assert (callee_node != NULL);
/* Get the function symbol and its availability. */
enum availability avail;
callee_node = callee_node->function_symbol (&avail);
if (avail <= AVAIL_INTERPOSABLE)
{
if (dump_file)
fprintf (dump_file, " - Function availability <= AVAIL_INTERPOSABLE.\n");
return process_fnspec (cur_summary, cur_summary_lto, stmt, ignore_stores);
}
/* Get callee's modref summary. As above, if there's no summary, we either
have to give up or, if stores are ignored, we can just purge loads. */
modref_summary *callee_summary = optimization_summaries->get (callee_node);
if (!callee_summary)
{
if (dump_file)
fprintf (dump_file, " - No modref summary available for callee.\n");
return process_fnspec (cur_summary, cur_summary_lto, stmt, ignore_stores);
}
merge_call_side_effects (cur_summary, stmt, callee_summary, ignore_stores,
callee_node, false);
return true;
}
/* Support analysis in non-lto and lto mode in parallel. */
struct summary_ptrs
{
struct modref_summary *nolto;
struct modref_summary_lto *lto;
};
/* Helper for analyze_stmt. */
static bool
analyze_load (gimple *, tree, tree op, void *data)
{
modref_summary *summary = ((summary_ptrs *)data)->nolto;
modref_summary_lto *summary_lto = ((summary_ptrs *)data)->lto;
if (dump_file)
{
fprintf (dump_file, " - Analyzing load: ");
print_generic_expr (dump_file, op);
fprintf (dump_file, "\n");
}
if (!record_access_p (op))
return false;
ao_ref r;
ao_ref_init (&r, op);
if (summary)
record_access (summary->loads, &r);
if (summary_lto)
record_access_lto (summary_lto->loads, &r);
return false;
}
/* Helper for analyze_stmt. */
static bool
analyze_store (gimple *, tree, tree op, void *data)
{
modref_summary *summary = ((summary_ptrs *)data)->nolto;
modref_summary_lto *summary_lto = ((summary_ptrs *)data)->lto;
if (dump_file)
{
fprintf (dump_file, " - Analyzing store: ");
print_generic_expr (dump_file, op);
fprintf (dump_file, "\n");
}
if (!record_access_p (op))
return false;
ao_ref r;
ao_ref_init (&r, op);
if (summary)
record_access (summary->stores, &r);
if (summary_lto)
record_access_lto (summary_lto->stores, &r);
return false;
}
/* Analyze statement STMT of function F.
If IPA is true do not merge in side effects of calls. */
static bool
analyze_stmt (modref_summary *summary, modref_summary_lto *summary_lto,
gimple *stmt, bool ipa, vec *recursive_calls)
{
/* In general we can not ignore clobbers because they are barriers for code
motion, however after inlining it is safe to do because local optimization
passes do not consider clobbers from other functions.
Similar logic is in ipa-pure-const.c. */
if ((ipa || cfun->after_inlining) && gimple_clobber_p (stmt))
return true;
struct summary_ptrs sums = {summary, summary_lto};
/* Analyze all loads and stores in STMT. */
walk_stmt_load_store_ops (stmt, &sums,
analyze_load, analyze_store);
switch (gimple_code (stmt))
{
case GIMPLE_ASM:
/* If the ASM statement does not read nor write memory, there's nothing
to do. Otherwise just give up. */
if (!gimple_asm_clobbers_memory_p (as_a (stmt)))
return true;
if (dump_file)
fprintf (dump_file, " - Function contains GIMPLE_ASM statement "
"which clobbers memory.\n");
return false;
case GIMPLE_CALL:
if (!ipa || gimple_call_internal_p (stmt))
return analyze_call (summary, summary_lto,
as_a (stmt), recursive_calls);
else
{
attr_fnspec fnspec = gimple_call_fnspec (as_a (stmt));
if (fnspec.known_p ()
&& (!fnspec.global_memory_read_p ()
|| !fnspec.global_memory_written_p ()))
{
cgraph_edge *e = cgraph_node::get (current_function_decl)->get_edge (stmt);
if (e->callee)
{
fnspec_summaries->get_create (e)->fnspec = xstrdup (fnspec.get_str ());
if (dump_file)
fprintf (dump_file, " Recorded fnspec %s\n", fnspec.get_str ());
}
}
}
return true;
default:
/* Nothing to do for other types of statements. */
return true;
}
}
/* Remove summary of current function because during the function body
scan we determined it is not useful. LTO, NOLTO and IPA determines the
mode of scan. */
static void
remove_summary (bool lto, bool nolto, bool ipa)
{
cgraph_node *fnode = cgraph_node::get (current_function_decl);
if (!ipa)
optimization_summaries->remove (fnode);
else
{
if (nolto)
summaries->remove (fnode);
if (lto)
summaries_lto->remove (fnode);
remove_modref_edge_summaries (fnode);
}
if (dump_file)
fprintf (dump_file,
" - modref done with result: not tracked.\n");
}
/* Return true if OP accesses memory pointed to by SSA_NAME. */
bool
memory_access_to (tree op, tree ssa_name)
{
tree base = get_base_address (op);
if (!base)
return false;
if (TREE_CODE (base) != MEM_REF && TREE_CODE (base) != TARGET_MEM_REF)
return false;
return TREE_OPERAND (base, 0) == ssa_name;
}
/* Consider statement val = *arg.
return EAF flags of ARG that can be determined from EAF flags of VAL
(which are known to be FLAGS). If IGNORE_STORES is true we can ignore
all stores to VAL, i.e. when handling noreturn function. */
static int
deref_flags (int flags, bool ignore_stores)
{
int ret = EAF_NODIRECTESCAPE;
/* If argument is unused just account for
the read involved in dereference. */
if (flags & EAF_UNUSED)
ret |= EAF_DIRECT | EAF_NOCLOBBER | EAF_NOESCAPE | EAF_NOT_RETURNED;
else
{
if ((flags & EAF_NOCLOBBER) || ignore_stores)
ret |= EAF_NOCLOBBER;
if ((flags & EAF_NOESCAPE) || ignore_stores)
ret |= EAF_NOESCAPE;
/* If the value dereferenced is not used for another load or store
we can still consider ARG as used only directly.
Consider
int
test (int *a)
{
return *a!=0;
}
*/
if ((flags & (EAF_NOREAD | EAF_NOT_RETURNED | EAF_NOESCAPE | EAF_DIRECT))
== (EAF_NOREAD | EAF_NOT_RETURNED | EAF_NOESCAPE | EAF_DIRECT)
&& ((flags & EAF_NOCLOBBER) || ignore_stores))
ret |= EAF_DIRECT;
if (flags & EAF_NOT_RETURNED)
ret |= EAF_NOT_RETURNED;
}
return ret;
}
namespace {
/* Description of an escape point. */
struct escape_point
{
/* Value escapes to this call. */
gcall *call;
/* Argument it escapes to. */
int arg;
/* Flags already known about the argument (this can save us from recording
esape points if local analysis did good job already). */
eaf_flags_t min_flags;
/* Does value escape directly or indiretly? */
bool direct;
};
class modref_lattice
{
public:
/* EAF flags of the SSA name. */
eaf_flags_t flags;
/* DFS bookkkeeping: we don't do real dataflow yet. */
bool known;
bool open;
/* When doing IPA analysis we can not merge in callee escape points;
Only remember them and do the merging at IPA propagation time. */
vec escape_points;
void init ();
void release ();
bool merge (const modref_lattice &with);
bool merge (int flags);
bool merge_deref (const modref_lattice &with, bool ignore_stores);
bool merge_direct_load ();
bool merge_direct_store ();
bool add_escape_point (gcall *call, int arg, int min_flags, bool diret);
void dump (FILE *out, int indent = 0) const;
};
/* Lattices are saved to vectors, so keep them PODs. */
void
modref_lattice::init ()
{
/* All flags we track. */
int f = EAF_DIRECT | EAF_NOCLOBBER | EAF_NOESCAPE | EAF_UNUSED
| EAF_NODIRECTESCAPE | EAF_NOT_RETURNED | EAF_NOREAD;
flags = f;
/* Check that eaf_flags_t is wide enough to hold all flags. */
gcc_checking_assert (f == flags);
open = true;
known = false;
}
/* Release memory. */
void
modref_lattice::release ()
{
escape_points.release ();
}
/* Dump lattice to OUT; indent with INDENT spaces. */
void
modref_lattice::dump (FILE *out, int indent) const
{
dump_eaf_flags (out, flags);
if (escape_points.length ())
{
fprintf (out, "%*sEscapes:\n", indent, "");
for (unsigned int i = 0; i < escape_points.length (); i++)
{
fprintf (out, "%*s Arg %i (%s) min flags", indent, "",
escape_points[i].arg,
escape_points[i].direct ? "direct" : "indirect");
dump_eaf_flags (out, escape_points[i].min_flags, false);
fprintf (out, " in call ");
print_gimple_stmt (out, escape_points[i].call, 0);
}
}
}
/* Add escape point CALL, ARG, MIN_FLAGS, DIRECT. Return false if such escape
point exists. */
bool
modref_lattice::add_escape_point (gcall *call, int arg, int min_flags,
bool direct)
{
escape_point *ep;
unsigned int i;
/* If we already determined flags to be bad enough,
we do not need to record. */
if ((flags & min_flags) == flags || (min_flags & EAF_UNUSED))
return false;
FOR_EACH_VEC_ELT (escape_points, i, ep)
if (ep->call == call && ep->arg == arg && ep->direct == direct)
{
if ((ep->min_flags & min_flags) == min_flags)
return false;
ep->min_flags &= min_flags;
return true;
}
/* Give up if max escape points is met. */
if ((int)escape_points.length () > param_modref_max_escape_points)
{
if (dump_file)
fprintf (dump_file, "--param modref-max-escape-points limit reached\n");
merge (0);
return true;
}
escape_point new_ep = {call, arg, min_flags, direct};
escape_points.safe_push (new_ep);
return true;
}
/* Merge in flags from F. */
bool
modref_lattice::merge (int f)
{
if (f & EAF_UNUSED)
return false;
/* Noescape implies that value also does not escape directly.
Fnspec machinery does set both so compensate for this. */
if (f & EAF_NOESCAPE)
f |= EAF_NODIRECTESCAPE;
if ((flags & f) != flags)
{
flags &= f;
/* Prune obvoiusly useless flags;
We do not have ECF_FLAGS handy which is not big problem since
we will do final flags cleanup before producing summary.
Merging should be fast so it can work well with dataflow. */
flags = remove_useless_eaf_flags (flags, 0, false);
if (!flags)
escape_points.release ();
return true;
}
return false;
}
/* Merge in WITH. Return true if anyting changed. */
bool
modref_lattice::merge (const modref_lattice &with)
{
if (!with.known)
return merge (0);
bool changed = merge (with.flags);
if (!flags)
return changed;
for (unsigned int i = 0; i < with.escape_points.length (); i++)
changed |= add_escape_point (with.escape_points[i].call,
with.escape_points[i].arg,
with.escape_points[i].min_flags,
with.escape_points[i].direct);
return changed;
}
/* Merge in deref of WITH. If IGNORE_STORES is true do not consider
stores. Return true if anyting changed. */
bool
modref_lattice::merge_deref (const modref_lattice &with, bool ignore_stores)
{
if (!with.known)
return merge (0);
bool changed = merge (deref_flags (with.flags, ignore_stores));
if (!flags)
return changed;
for (unsigned int i = 0; i < with.escape_points.length (); i++)
{
int min_flags = with.escape_points[i].min_flags;
if (with.escape_points[i].direct)
min_flags = deref_flags (min_flags, ignore_stores);
else if (ignore_stores)
min_flags |= ignore_stores_eaf_flags;
changed |= add_escape_point (with.escape_points[i].call,
with.escape_points[i].arg,
min_flags,
false);
}
return changed;
}
/* Merge in flags for direct load. */
bool
modref_lattice::merge_direct_load ()
{
return merge (~(EAF_UNUSED | EAF_NOREAD));
}
/* Merge in flags for direct store. */
bool
modref_lattice::merge_direct_store ()
{
return merge (~(EAF_UNUSED | EAF_NOCLOBBER));
}
} /* ANON namespace. */
static void analyze_ssa_name_flags (tree name,
vec &lattice,
int depth, bool ipa);
/* Call statements may return their parameters. Consider argument number
ARG of USE_STMT and determine flags that can needs to be cleared
in case pointer possibly indirectly references from ARG I is returned.
LATTICE, DEPTH and ipa are same as in analyze_ssa_name_flags. */
static void
merge_call_lhs_flags (gcall *call, int arg, int index, bool deref,
vec &lattice,
int depth, bool ipa)
{
/* If there is no return value, no flags are affected. */
if (!gimple_call_lhs (call))
return;
/* If we know that function returns given argument and it is not ARG
we can still be happy. */
int flags = gimple_call_return_flags (call);
if ((flags & ERF_RETURNS_ARG)
&& (flags & ERF_RETURN_ARG_MASK) != arg)
return;
if (gimple_call_arg_flags (call, arg) & (EAF_NOT_RETURNED | EAF_UNUSED))
return;
/* If return value is SSA name determine its flags. */
if (TREE_CODE (gimple_call_lhs (call)) == SSA_NAME)
{
tree lhs = gimple_call_lhs (call);
analyze_ssa_name_flags (lhs, lattice, depth + 1, ipa);
if (deref)
lattice[index].merge_deref (lattice[SSA_NAME_VERSION (lhs)], false);
else
lattice[index].merge (lattice[SSA_NAME_VERSION (lhs)]);
}
/* In the case of memory store we can do nothing. */
else
lattice[index].merge (0);
}
/* Analyze EAF flags for SSA name NAME and store result to LATTICE.
LATTICE is an array of modref_lattices.
DEPTH is a recursion depth used to make debug output prettier.
If IPA is true we analyze for IPA propagation (and thus call escape points
are processed later) */
static void
analyze_ssa_name_flags (tree name, vec &lattice, int depth,
bool ipa)
{
imm_use_iterator ui;
gimple *use_stmt;
int index = SSA_NAME_VERSION (name);
/* See if value is already computed. */
if (lattice[index].known)
return;
if (lattice[index].open)
{
if (dump_file)
fprintf (dump_file,
"%*sGiving up on a cycle in SSA graph\n", depth * 4, "");
return;
}
if (depth == param_modref_max_depth)
{
if (dump_file)
fprintf (dump_file,
"%*sGiving up on max depth\n", depth * 4, "");
return;
}
/* Recursion guard. */
lattice[index].init ();
if (dump_file)
{
fprintf (dump_file,
"%*sAnalyzing flags of ssa name: ", depth * 4, "");
print_generic_expr (dump_file, name);
fprintf (dump_file, "\n");
}
FOR_EACH_IMM_USE_STMT (use_stmt, ui, name)
{
if (lattice[index].flags == 0)
break;
if (is_gimple_debug (use_stmt))
continue;
if (dump_file)
{
fprintf (dump_file, "%*s Analyzing stmt: ", depth * 4, "");
print_gimple_stmt (dump_file, use_stmt, 0);
}
/* If we see a direct non-debug use, clear unused bit.
All dereferneces should be accounted below using deref_flags. */
lattice[index].merge (~EAF_UNUSED);
/* Gimple return may load the return value.
Returning name counts as an use by tree-ssa-structalias.c */
if (greturn *ret = dyn_cast (use_stmt))
{
if (gimple_return_retval (ret) == name)
lattice[index].merge (~(EAF_UNUSED | EAF_NOT_RETURNED));
else if (memory_access_to (gimple_return_retval (ret), name))
{
lattice[index].merge_direct_load ();
lattice[index].merge (~(EAF_UNUSED | EAF_NOT_RETURNED));
}
}
/* Account for LHS store, arg loads and flags from callee function. */
else if (gcall *call = dyn_cast (use_stmt))
{
tree callee = gimple_call_fndecl (call);
/* IPA PTA internally it treats calling a function as "writing" to
the argument space of all functions the function pointer points to
(PR101949). We can not drop EAF_NOCLOBBER only when ipa-pta
is on since that would allow propagation of this from -fno-ipa-pta
to -fipa-pta functions. */
if (gimple_call_fn (use_stmt) == name)
lattice[index].merge (~(EAF_NOCLOBBER | EAF_UNUSED));
/* Recursion would require bit of propagation; give up for now. */
if (callee && !ipa && recursive_call_p (current_function_decl,
callee))
lattice[index].merge (0);
else
{
int ecf_flags = gimple_call_flags (call);
bool ignore_stores = ignore_stores_p (current_function_decl,
ecf_flags);
bool ignore_retval = ignore_retval_p (current_function_decl,
ecf_flags);
/* Handle *name = func (...). */
if (gimple_call_lhs (call)
&& memory_access_to (gimple_call_lhs (call), name))
{
lattice[index].merge_direct_store ();
/* Return slot optimization passes address of
LHS to callee via hidden parameter and this
may make LHS to escape. See PR 98499. */
if (gimple_call_return_slot_opt_p (call)
&& TREE_ADDRESSABLE (TREE_TYPE (gimple_call_lhs (call))))
lattice[index].merge (EAF_NOREAD | EAF_DIRECT);
}
/* We do not track accesses to the static chain (we could)
so give up. */
if (gimple_call_chain (call)
&& (gimple_call_chain (call) == name))
lattice[index].merge (0);
/* Process internal functions and right away. */
bool record_ipa = ipa && !gimple_call_internal_p (call);
/* Handle all function parameters. */
for (unsigned i = 0;
i < gimple_call_num_args (call) && lattice[index].flags; i++)
/* Name is directly passed to the callee. */
if (gimple_call_arg (call, i) == name)
{
if (!(ecf_flags & (ECF_CONST | ECF_NOVOPS)))
{
int call_flags = gimple_call_arg_flags (call, i)
| EAF_NOT_RETURNED;
if (ignore_stores)
call_flags |= ignore_stores_eaf_flags;
if (!record_ipa)
lattice[index].merge (call_flags);
else
lattice[index].add_escape_point (call, i,
call_flags, true);
}
if (!ignore_retval)
merge_call_lhs_flags (call, i, index, false,
lattice, depth, ipa);
}
/* Name is dereferenced and passed to a callee. */
else if (memory_access_to (gimple_call_arg (call, i), name))
{
if (ecf_flags & (ECF_CONST | ECF_NOVOPS))
lattice[index].merge_direct_load ();
else
{
int call_flags = deref_flags
(gimple_call_arg_flags (call, i)
| EAF_NOT_RETURNED, ignore_stores);
if (!record_ipa)
lattice[index].merge (call_flags);
else
lattice[index].add_escape_point (call, i,
call_flags, false);
}
if (!ignore_retval)
merge_call_lhs_flags (call, i, index, true,
lattice, depth, ipa);
}
}
}
else if (gimple_assign_load_p (use_stmt))
{
gassign *assign = as_a (use_stmt);
/* Memory to memory copy. */
if (gimple_store_p (assign))
{
/* Handle *lhs = *name.
We do not track memory locations, so assume that value
is used arbitrarily. */
if (memory_access_to (gimple_assign_rhs1 (assign), name))
lattice[index].merge (0);
/* Handle *name = *exp. */
else if (memory_access_to (gimple_assign_lhs (assign), name))
lattice[index].merge_direct_store ();
}
/* Handle lhs = *name. */
else if (memory_access_to (gimple_assign_rhs1 (assign), name))
{
tree lhs = gimple_assign_lhs (assign);
analyze_ssa_name_flags (lhs, lattice, depth + 1, ipa);
lattice[index].merge_deref (lattice[SSA_NAME_VERSION (lhs)],
false);
}
}
else if (gimple_store_p (use_stmt))
{
gassign *assign = dyn_cast (use_stmt);
/* Handle *lhs = name. */
if (assign && gimple_assign_rhs1 (assign) == name)
{
if (dump_file)
fprintf (dump_file, "%*s ssa name saved to memory\n",
depth * 4, "");
lattice[index].merge (0);
}
/* Handle *name = exp. */
else if (assign
&& memory_access_to (gimple_assign_lhs (assign), name))
{
/* In general we can not ignore clobbers because they are
barriers for code motion, however after inlining it is safe to
do because local optimization passes do not consider clobbers
from other functions. Similar logic is in ipa-pure-const.c. */
if (!cfun->after_inlining || !gimple_clobber_p (assign))
lattice[index].merge_direct_store ();
}
/* ASM statements etc. */
else if (!assign)
{
if (dump_file)
fprintf (dump_file, "%*s Unhandled store\n",
depth * 4, "");
lattice[index].merge (0);
}
}
else if (gassign *assign = dyn_cast (use_stmt))
{
enum tree_code code = gimple_assign_rhs_code (assign);
/* See if operation is a merge as considered by
tree-ssa-structalias.c:find_func_aliases. */
if (!truth_value_p (code)
&& code != POINTER_DIFF_EXPR
&& (code != POINTER_PLUS_EXPR
|| gimple_assign_rhs1 (assign) == name))
{
tree lhs = gimple_assign_lhs (assign);
analyze_ssa_name_flags (lhs, lattice, depth + 1, ipa);
lattice[index].merge (lattice[SSA_NAME_VERSION (lhs)]);
}
}
else if (gphi *phi = dyn_cast (use_stmt))
{
tree result = gimple_phi_result (phi);
analyze_ssa_name_flags (result, lattice, depth + 1, ipa);
lattice[index].merge (lattice[SSA_NAME_VERSION (result)]);
}
/* Conditions are not considered escape points
by tree-ssa-structalias. */
else if (gimple_code (use_stmt) == GIMPLE_COND)
;
else
{
if (dump_file)
fprintf (dump_file, "%*s Unhandled stmt\n", depth * 4, "");
lattice[index].merge (0);
}
if (dump_file)
{
fprintf (dump_file, "%*s current flags of ", depth * 4, "");
print_generic_expr (dump_file, name);
lattice[index].dump (dump_file, depth * 4 + 4);
}
}
if (dump_file)
{
fprintf (dump_file, "%*sflags of ssa name ", depth * 4, "");
print_generic_expr (dump_file, name);
lattice[index].dump (dump_file, depth * 4 + 2);
}
lattice[index].open = false;
lattice[index].known = true;
}
/* Determine EAF flags for function parameters. */
static void
analyze_parms (modref_summary *summary, modref_summary_lto *summary_lto,
bool ipa)
{
unsigned int parm_index = 0;
unsigned int count = 0;
int ecf_flags = flags_from_decl_or_type (current_function_decl);
/* For novops functions we have nothing to gain by EAF flags. */
if (ecf_flags & ECF_NOVOPS)
return;
for (tree parm = DECL_ARGUMENTS (current_function_decl); parm;
parm = TREE_CHAIN (parm))
count++;
if (!count)
return;
auto_vec lattice;
lattice.safe_grow_cleared (num_ssa_names, true);
for (tree parm = DECL_ARGUMENTS (current_function_decl); parm; parm_index++,
parm = TREE_CHAIN (parm))
{
tree name = ssa_default_def (cfun, parm);
if (!name || has_zero_uses (name))
{
/* We do not track non-SSA parameters,
but we want to track unused gimple_regs. */
if (!is_gimple_reg (parm))
continue;
if (summary)
{
if (parm_index >= summary->arg_flags.length ())
summary->arg_flags.safe_grow_cleared (count, true);
summary->arg_flags[parm_index] = EAF_UNUSED;
}
else if (summary_lto)
{
if (parm_index >= summary_lto->arg_flags.length ())
summary_lto->arg_flags.safe_grow_cleared (count, true);
summary_lto->arg_flags[parm_index] = EAF_UNUSED;
}
continue;
}
analyze_ssa_name_flags (name, lattice, 0, ipa);
int flags = lattice[SSA_NAME_VERSION (name)].flags;
/* Eliminate useless flags so we do not end up storing unnecessary
summaries. */
flags = remove_useless_eaf_flags
(flags, ecf_flags,
VOID_TYPE_P (TREE_TYPE (TREE_TYPE (current_function_decl))));
if (flags)
{
if (summary)
{
if (parm_index >= summary->arg_flags.length ())
summary->arg_flags.safe_grow_cleared (count, true);
summary->arg_flags[parm_index] = flags;
}
else if (summary_lto)
{
if (parm_index >= summary_lto->arg_flags.length ())
summary_lto->arg_flags.safe_grow_cleared (count, true);
summary_lto->arg_flags[parm_index] = flags;
}
if (lattice[SSA_NAME_VERSION (name)].escape_points.length ())
{
escape_point *ep;
unsigned int ip;
cgraph_node *node = cgraph_node::get (current_function_decl);
gcc_checking_assert (ipa);
FOR_EACH_VEC_ELT
(lattice[SSA_NAME_VERSION (name)].escape_points, ip, ep)
if ((ep->min_flags & flags) != flags)
{
cgraph_edge *e = node->get_edge (ep->call);
struct escape_entry ee = {parm_index, ep->arg,
ep->min_flags, ep->direct};
escape_summaries->get_create (e)->esc.safe_push (ee);
}
}
}
}
if (ipa)
for (unsigned int i = 0; i < num_ssa_names; i++)
lattice[i].release ();
}
/* Analyze function F. IPA indicates whether we're running in local mode
(false) or the IPA mode (true). */
static void
analyze_function (function *f, bool ipa)
{
if (dump_file)
fprintf (dump_file, "modref analyzing '%s' (ipa=%i)%s%s\n",
function_name (f), ipa,
TREE_READONLY (current_function_decl) ? " (const)" : "",
DECL_PURE_P (current_function_decl) ? " (pure)" : "");
/* Don't analyze this function if it's compiled with -fno-strict-aliasing. */
if (!flag_ipa_modref)
return;
/* Compute no-LTO summaries when local optimization is going to happen. */
bool nolto = (!ipa || ((!flag_lto || flag_fat_lto_objects) && !in_lto_p)
|| (in_lto_p && !flag_wpa
&& flag_incremental_link != INCREMENTAL_LINK_LTO));
/* Compute LTO when LTO streaming is going to happen. */
bool lto = ipa && ((flag_lto && !in_lto_p)
|| flag_wpa
|| flag_incremental_link == INCREMENTAL_LINK_LTO);
cgraph_node *fnode = cgraph_node::get (current_function_decl);
modref_summary *summary = NULL;
modref_summary_lto *summary_lto = NULL;
/* Initialize the summary.
If we run in local mode there is possibly pre-existing summary from
IPA pass. Dump it so it is easy to compare if mod-ref info has
improved. */
if (!ipa)
{
if (!optimization_summaries)
optimization_summaries = modref_summaries::create_ggc (symtab);
else /* Remove existing summary if we are re-running the pass. */
{
if (dump_file
&& (summary
= optimization_summaries->get (cgraph_node::get (f->decl)))
!= NULL
&& summary->loads)
{
fprintf (dump_file, "Past summary:\n");
optimization_summaries->get
(cgraph_node::get (f->decl))->dump (dump_file);
}
optimization_summaries->remove (cgraph_node::get (f->decl));
}
summary = optimization_summaries->get_create (cgraph_node::get (f->decl));
gcc_checking_assert (nolto && !lto);
}
/* In IPA mode we analyze every function precisely once. Assert that. */
else
{
if (nolto)
{
if (!summaries)
summaries = modref_summaries::create_ggc (symtab);
else
summaries->remove (cgraph_node::get (f->decl));
summary = summaries->get_create (cgraph_node::get (f->decl));
}
if (lto)
{
if (!summaries_lto)
summaries_lto = modref_summaries_lto::create_ggc (symtab);
else
summaries_lto->remove (cgraph_node::get (f->decl));
summary_lto = summaries_lto->get_create (cgraph_node::get (f->decl));
}
if (!fnspec_summaries)
fnspec_summaries = new fnspec_summaries_t (symtab);
if (!escape_summaries)
escape_summaries = new escape_summaries_t (symtab);
}
/* Create and initialize summary for F.
Note that summaries may be already allocated from previous
run of the pass. */
if (nolto)
{
gcc_assert (!summary->loads);
summary->loads = modref_records::create_ggc (param_modref_max_bases,
param_modref_max_refs,
param_modref_max_accesses);
gcc_assert (!summary->stores);
summary->stores = modref_records::create_ggc (param_modref_max_bases,
param_modref_max_refs,
param_modref_max_accesses);
summary->writes_errno = false;
}
if (lto)
{
gcc_assert (!summary_lto->loads);
summary_lto->loads = modref_records_lto::create_ggc
(param_modref_max_bases,
param_modref_max_refs,
param_modref_max_accesses);
gcc_assert (!summary_lto->stores);
summary_lto->stores = modref_records_lto::create_ggc
(param_modref_max_bases,
param_modref_max_refs,
param_modref_max_accesses);
summary_lto->writes_errno = false;
}
analyze_parms (summary, summary_lto, ipa);
int ecf_flags = flags_from_decl_or_type (current_function_decl);
auto_vec recursive_calls;
/* Analyze each statement in each basic block of the function. If the
statement cannot be analyzed (for any reason), the entire function cannot
be analyzed by modref. */
basic_block bb;
FOR_EACH_BB_FN (bb, f)
{
gimple_stmt_iterator si;
for (si = gsi_after_labels (bb); !gsi_end_p (si); gsi_next (&si))
{
if (!analyze_stmt (summary, summary_lto,
gsi_stmt (si), ipa, &recursive_calls)
|| ((!summary || !summary->useful_p (ecf_flags, false))
&& (!summary_lto
|| !summary_lto->useful_p (ecf_flags, false))))
{
collapse_loads (summary, summary_lto);
collapse_stores (summary, summary_lto);
break;
}
}
}
/* In non-IPA mode we need to perform iterative datafow on recursive calls.
This needs to be done after all other side effects are computed. */
if (!ipa)
{
bool changed = true;
bool first = true;
while (changed)
{
changed = false;
for (unsigned i = 0; i < recursive_calls.length (); i++)
{
changed |= merge_call_side_effects
(summary, recursive_calls[i], summary,
ignore_stores_p (current_function_decl,
gimple_call_flags
(recursive_calls[i])),
fnode, !first);
if (!summary->useful_p (ecf_flags, false))
{
remove_summary (lto, nolto, ipa);
return;
}
}
first = false;
}
}
if (summary && !summary->useful_p (ecf_flags))
{
if (!ipa)
optimization_summaries->remove (fnode);
else
summaries->remove (fnode);
summary = NULL;
}
if (summary_lto && !summary_lto->useful_p (ecf_flags))
{
summaries_lto->remove (fnode);
summary_lto = NULL;
}
if (ipa && !summary && !summary_lto)
remove_modref_edge_summaries (fnode);
if (dump_file)
{
fprintf (dump_file, " - modref done with result: tracked.\n");
if (summary)
summary->dump (dump_file);
if (summary_lto)
summary_lto->dump (dump_file);
dump_modref_edge_summaries (dump_file, fnode, 2);
}
}
/* Callback for generate_summary. */
static void
modref_generate (void)
{
struct cgraph_node *node;
FOR_EACH_FUNCTION_WITH_GIMPLE_BODY (node)
{
function *f = DECL_STRUCT_FUNCTION (node->decl);
if (!f)
continue;
push_cfun (f);
analyze_function (f, true);
pop_cfun ();
}
}
/* Called when a new function is inserted to callgraph late. */
void
modref_summaries::insert (struct cgraph_node *node, modref_summary *)
{
/* Local passes ought to be executed by the pass manager. */
if (this == optimization_summaries)
{
optimization_summaries->remove (node);
return;
}
if (!DECL_STRUCT_FUNCTION (node->decl)
|| !opt_for_fn (node->decl, flag_ipa_modref))
{
summaries->remove (node);
return;
}
push_cfun (DECL_STRUCT_FUNCTION (node->decl));
analyze_function (DECL_STRUCT_FUNCTION (node->decl), true);
pop_cfun ();
}
/* Called when a new function is inserted to callgraph late. */
void
modref_summaries_lto::insert (struct cgraph_node *node, modref_summary_lto *)
{
/* We do not support adding new function when IPA information is already
propagated. This is done only by SIMD cloning that is not very
critical. */
if (!DECL_STRUCT_FUNCTION (node->decl)
|| !opt_for_fn (node->decl, flag_ipa_modref)
|| propagated)
{
summaries_lto->remove (node);
return;
}
push_cfun (DECL_STRUCT_FUNCTION (node->decl));
analyze_function (DECL_STRUCT_FUNCTION (node->decl), true);
pop_cfun ();
}
/* Called when new clone is inserted to callgraph late. */
void
modref_summaries::duplicate (cgraph_node *, cgraph_node *dst,
modref_summary *src_data,
modref_summary *dst_data)
{
/* Do not duplicate optimization summaries; we do not handle parameter
transforms on them. */
if (this == optimization_summaries)
{
optimization_summaries->remove (dst);
return;
}
dst_data->stores = modref_records::create_ggc
(src_data->stores->max_bases,
src_data->stores->max_refs,
src_data->stores->max_accesses);
dst_data->stores->copy_from (src_data->stores);
dst_data->loads = modref_records::create_ggc
(src_data->loads->max_bases,
src_data->loads->max_refs,
src_data->loads->max_accesses);
dst_data->loads->copy_from (src_data->loads);
dst_data->writes_errno = src_data->writes_errno;
if (src_data->arg_flags.length ())
dst_data->arg_flags = src_data->arg_flags.copy ();
}
/* Called when new clone is inserted to callgraph late. */
void
modref_summaries_lto::duplicate (cgraph_node *, cgraph_node *,
modref_summary_lto *src_data,
modref_summary_lto *dst_data)
{
/* Be sure that no further cloning happens after ipa-modref. If it does
we will need to update signatures for possible param changes. */
gcc_checking_assert (!((modref_summaries_lto *)summaries_lto)->propagated);
dst_data->stores = modref_records_lto::create_ggc
(src_data->stores->max_bases,
src_data->stores->max_refs,
src_data->stores->max_accesses);
dst_data->stores->copy_from (src_data->stores);
dst_data->loads = modref_records_lto::create_ggc
(src_data->loads->max_bases,
src_data->loads->max_refs,
src_data->loads->max_accesses);
dst_data->loads->copy_from (src_data->loads);
dst_data->writes_errno = src_data->writes_errno;
if (src_data->arg_flags.length ())
dst_data->arg_flags = src_data->arg_flags.copy ();
}
namespace
{
/* Definition of the modref pass on GIMPLE. */
const pass_data pass_data_modref = {
GIMPLE_PASS,
"modref",
OPTGROUP_IPA,
TV_TREE_MODREF,
(PROP_cfg | PROP_ssa),
0,
0,
0,
0,
};
class pass_modref : public gimple_opt_pass
{
public:
pass_modref (gcc::context *ctxt)
: gimple_opt_pass (pass_data_modref, ctxt) {}
/* opt_pass methods: */
opt_pass *clone ()
{
return new pass_modref (m_ctxt);
}
virtual bool gate (function *)
{
return flag_ipa_modref;
}
virtual unsigned int execute (function *);
};
/* Encode TT to the output block OB using the summary streaming API. */
static void
write_modref_records (modref_records_lto *tt, struct output_block *ob)
{
streamer_write_uhwi (ob, tt->max_bases);
streamer_write_uhwi (ob, tt->max_refs);
streamer_write_uhwi (ob, tt->max_accesses);
streamer_write_uhwi (ob, tt->every_base);
streamer_write_uhwi (ob, vec_safe_length (tt->bases));
size_t i;
modref_base_node *base_node;
FOR_EACH_VEC_SAFE_ELT (tt->bases, i, base_node)
{
stream_write_tree (ob, base_node->base, true);
streamer_write_uhwi (ob, base_node->every_ref);
streamer_write_uhwi (ob, vec_safe_length (base_node->refs));
size_t j;
modref_ref_node *ref_node;
FOR_EACH_VEC_SAFE_ELT (base_node->refs, j, ref_node)
{
stream_write_tree (ob, ref_node->ref, true);
streamer_write_uhwi (ob, ref_node->every_access);
streamer_write_uhwi (ob, vec_safe_length (ref_node->accesses));
size_t k;
modref_access_node *access_node;
FOR_EACH_VEC_SAFE_ELT (ref_node->accesses, k, access_node)
{
streamer_write_hwi (ob, access_node->parm_index);
if (access_node->parm_index != -1)
{
streamer_write_uhwi (ob, access_node->parm_offset_known);
if (access_node->parm_offset_known)
{
streamer_write_poly_int64 (ob, access_node->parm_offset);
streamer_write_poly_int64 (ob, access_node->offset);
streamer_write_poly_int64 (ob, access_node->size);
streamer_write_poly_int64 (ob, access_node->max_size);
}
}
}
}
}
}
/* Read a modref_tree from the input block IB using the data from DATA_IN.
This assumes that the tree was encoded using write_modref_tree.
Either nolto_ret or lto_ret is initialized by the tree depending whether
LTO streaming is expected or not. */
void
read_modref_records (lto_input_block *ib, struct data_in *data_in,
modref_records **nolto_ret,
modref_records_lto **lto_ret)
{
size_t max_bases = streamer_read_uhwi (ib);
size_t max_refs = streamer_read_uhwi (ib);
size_t max_accesses = streamer_read_uhwi (ib);
if (lto_ret)
*lto_ret = modref_records_lto::create_ggc (max_bases, max_refs,
max_accesses);
if (nolto_ret)
*nolto_ret = modref_records::create_ggc (max_bases, max_refs,
max_accesses);
gcc_checking_assert (lto_ret || nolto_ret);
size_t every_base = streamer_read_uhwi (ib);
size_t nbase = streamer_read_uhwi (ib);
gcc_assert (!every_base || nbase == 0);
if (every_base)
{
if (nolto_ret)
(*nolto_ret)->collapse ();
if (lto_ret)
(*lto_ret)->collapse ();
}
for (size_t i = 0; i < nbase; i++)
{
tree base_tree = stream_read_tree (ib, data_in);
modref_base_node *nolto_base_node = NULL;
modref_base_node *lto_base_node = NULL;
/* At stream in time we have LTO alias info. Check if we streamed in
something obviously unnecessary. Do not glob types by alias sets;
it is not 100% clear that ltrans types will get merged same way.
Types may get refined based on ODR type conflicts. */
if (base_tree && !get_alias_set (base_tree))
{
if (dump_file)
{
fprintf (dump_file, "Streamed in alias set 0 type ");
print_generic_expr (dump_file, base_tree);
fprintf (dump_file, "\n");
}
base_tree = NULL;
}
if (nolto_ret)
nolto_base_node = (*nolto_ret)->insert_base (base_tree
? get_alias_set (base_tree)
: 0, 0);
if (lto_ret)
lto_base_node = (*lto_ret)->insert_base (base_tree, 0);
size_t every_ref = streamer_read_uhwi (ib);
size_t nref = streamer_read_uhwi (ib);
gcc_assert (!every_ref || nref == 0);
if (every_ref)
{
if (nolto_base_node)
nolto_base_node->collapse ();
if (lto_base_node)
lto_base_node->collapse ();
}
for (size_t j = 0; j < nref; j++)
{
tree ref_tree = stream_read_tree (ib, data_in);
if (ref_tree && !get_alias_set (ref_tree))
{
if (dump_file)
{
fprintf (dump_file, "Streamed in alias set 0 type ");
print_generic_expr (dump_file, ref_tree);
fprintf (dump_file, "\n");
}
ref_tree = NULL;
}
modref_ref_node *nolto_ref_node = NULL;
modref_ref_node *lto_ref_node = NULL;
if (nolto_base_node)
nolto_ref_node
= nolto_base_node->insert_ref (ref_tree
? get_alias_set (ref_tree) : 0,
max_refs);
if (lto_base_node)
lto_ref_node = lto_base_node->insert_ref (ref_tree, max_refs);
size_t every_access = streamer_read_uhwi (ib);
size_t naccesses = streamer_read_uhwi (ib);
if (nolto_ref_node)
nolto_ref_node->every_access = every_access;
if (lto_ref_node)
lto_ref_node->every_access = every_access;
for (size_t k = 0; k < naccesses; k++)
{
int parm_index = streamer_read_hwi (ib);
bool parm_offset_known = false;
poly_int64 parm_offset = 0;
poly_int64 offset = 0;
poly_int64 size = -1;
poly_int64 max_size = -1;
if (parm_index != -1)
{
parm_offset_known = streamer_read_uhwi (ib);
if (parm_offset_known)
{
parm_offset = streamer_read_poly_int64 (ib);
offset = streamer_read_poly_int64 (ib);
size = streamer_read_poly_int64 (ib);
max_size = streamer_read_poly_int64 (ib);
}
}
modref_access_node a = {offset, size, max_size, parm_offset,
parm_index, parm_offset_known, false};
if (nolto_ref_node)
nolto_ref_node->insert_access (a, max_accesses, false);
if (lto_ref_node)
lto_ref_node->insert_access (a, max_accesses, false);
}
}
}
if (lto_ret)
(*lto_ret)->cleanup ();
if (nolto_ret)
(*nolto_ret)->cleanup ();
}
/* Write ESUM to BP. */
static void
modref_write_escape_summary (struct bitpack_d *bp, escape_summary *esum)
{
if (!esum)
{
bp_pack_var_len_unsigned (bp, 0);
return;
}
bp_pack_var_len_unsigned (bp, esum->esc.length ());
unsigned int i;
escape_entry *ee;
FOR_EACH_VEC_ELT (esum->esc, i, ee)
{
bp_pack_var_len_unsigned (bp, ee->parm_index);
bp_pack_var_len_unsigned (bp, ee->arg);
bp_pack_var_len_unsigned (bp, ee->min_flags);
bp_pack_value (bp, ee->direct, 1);
}
}
/* Read escape summary for E from BP. */
static void
modref_read_escape_summary (struct bitpack_d *bp, cgraph_edge *e)
{
unsigned int n = bp_unpack_var_len_unsigned (bp);
if (!n)
return;
escape_summary *esum = escape_summaries->get_create (e);
esum->esc.reserve_exact (n);
for (unsigned int i = 0; i < n; i++)
{
escape_entry ee;
ee.parm_index = bp_unpack_var_len_unsigned (bp);
ee.arg = bp_unpack_var_len_unsigned (bp);
ee.min_flags = bp_unpack_var_len_unsigned (bp);
ee.direct = bp_unpack_value (bp, 1);
esum->esc.quick_push (ee);
}
}
/* Callback for write_summary. */
static void
modref_write ()
{
struct output_block *ob = create_output_block (LTO_section_ipa_modref);
lto_symtab_encoder_t encoder = ob->decl_state->symtab_node_encoder;
unsigned int count = 0;
int i;
if (!summaries_lto)
{
streamer_write_uhwi (ob, 0);
streamer_write_char_stream (ob->main_stream, 0);
produce_asm (ob, NULL);
destroy_output_block (ob);
return;
}
for (i = 0; i < lto_symtab_encoder_size (encoder); i++)
{
symtab_node *snode = lto_symtab_encoder_deref (encoder, i);
cgraph_node *cnode = dyn_cast (snode);
modref_summary_lto *r;
if (cnode && cnode->definition && !cnode->alias
&& (r = summaries_lto->get (cnode))
&& r->useful_p (flags_from_decl_or_type (cnode->decl)))
count++;
}
streamer_write_uhwi (ob, count);
for (i = 0; i < lto_symtab_encoder_size (encoder); i++)
{
symtab_node *snode = lto_symtab_encoder_deref (encoder, i);
cgraph_node *cnode = dyn_cast (snode);
if (cnode && cnode->definition && !cnode->alias)
{
modref_summary_lto *r = summaries_lto->get (cnode);
if (!r || !r->useful_p (flags_from_decl_or_type (cnode->decl)))
continue;
streamer_write_uhwi (ob, lto_symtab_encoder_encode (encoder, cnode));
streamer_write_uhwi (ob, r->arg_flags.length ());
for (unsigned int i = 0; i < r->arg_flags.length (); i++)
streamer_write_uhwi (ob, r->arg_flags[i]);
write_modref_records (r->loads, ob);
write_modref_records (r->stores, ob);
struct bitpack_d bp = bitpack_create (ob->main_stream);
bp_pack_value (&bp, r->writes_errno, 1);
if (!flag_wpa)
{
for (cgraph_edge *e = cnode->indirect_calls;
e; e = e->next_callee)
{
class fnspec_summary *sum = fnspec_summaries->get (e);
bp_pack_value (&bp, sum != NULL, 1);
if (sum)
bp_pack_string (ob, &bp, sum->fnspec, true);
class escape_summary *esum = escape_summaries->get (e);
modref_write_escape_summary (&bp,esum);
}
for (cgraph_edge *e = cnode->callees; e; e = e->next_callee)
{
class fnspec_summary *sum = fnspec_summaries->get (e);
bp_pack_value (&bp, sum != NULL, 1);
if (sum)
bp_pack_string (ob, &bp, sum->fnspec, true);
class escape_summary *esum = escape_summaries->get (e);
modref_write_escape_summary (&bp,esum);
}
}
streamer_write_bitpack (&bp);
}
}
streamer_write_char_stream (ob->main_stream, 0);
produce_asm (ob, NULL);
destroy_output_block (ob);
}
static void
read_section (struct lto_file_decl_data *file_data, const char *data,
size_t len)
{
const struct lto_function_header *header
= (const struct lto_function_header *) data;
const int cfg_offset = sizeof (struct lto_function_header);
const int main_offset = cfg_offset + header->cfg_size;
const int string_offset = main_offset + header->main_size;
struct data_in *data_in;
unsigned int i;
unsigned int f_count;
lto_input_block ib ((const char *) data + main_offset, header->main_size,
file_data->mode_table);
data_in
= lto_data_in_create (file_data, (const char *) data + string_offset,
header->string_size, vNULL);
f_count = streamer_read_uhwi (&ib);
for (i = 0; i < f_count; i++)
{
struct cgraph_node *node;
lto_symtab_encoder_t encoder;
unsigned int index = streamer_read_uhwi (&ib);
encoder = file_data->symtab_node_encoder;
node = dyn_cast (lto_symtab_encoder_deref (encoder,
index));
modref_summary *modref_sum = summaries
? summaries->get_create (node) : NULL;
modref_summary_lto *modref_sum_lto = summaries_lto
? summaries_lto->get_create (node)
: NULL;
if (optimization_summaries)
modref_sum = optimization_summaries->get_create (node);
if (modref_sum)
modref_sum->writes_errno = false;
if (modref_sum_lto)
modref_sum_lto->writes_errno = false;
gcc_assert (!modref_sum || (!modref_sum->loads
&& !modref_sum->stores));
gcc_assert (!modref_sum_lto || (!modref_sum_lto->loads
&& !modref_sum_lto->stores));
unsigned int args = streamer_read_uhwi (&ib);
if (args && modref_sum)
modref_sum->arg_flags.reserve_exact (args);
if (args && modref_sum_lto)
modref_sum_lto->arg_flags.reserve_exact (args);
for (unsigned int i = 0; i < args; i++)
{
eaf_flags_t flags = streamer_read_uhwi (&ib);
if (modref_sum)
modref_sum->arg_flags.quick_push (flags);
if (modref_sum_lto)
modref_sum_lto->arg_flags.quick_push (flags);
}
read_modref_records (&ib, data_in,
modref_sum ? &modref_sum->loads : NULL,
modref_sum_lto ? &modref_sum_lto->loads : NULL);
read_modref_records (&ib, data_in,
modref_sum ? &modref_sum->stores : NULL,
modref_sum_lto ? &modref_sum_lto->stores : NULL);
struct bitpack_d bp = streamer_read_bitpack (&ib);
if (bp_unpack_value (&bp, 1))
{
if (modref_sum)
modref_sum->writes_errno = true;
if (modref_sum_lto)
modref_sum_lto->writes_errno = true;
}
if (!flag_ltrans)
{
for (cgraph_edge *e = node->indirect_calls; e; e = e->next_callee)
{
if (bp_unpack_value (&bp, 1))
{
class fnspec_summary *sum = fnspec_summaries->get_create (e);
sum->fnspec = xstrdup (bp_unpack_string (data_in, &bp));
}
modref_read_escape_summary (&bp, e);
}
for (cgraph_edge *e = node->callees; e; e = e->next_callee)
{
if (bp_unpack_value (&bp, 1))
{
class fnspec_summary *sum = fnspec_summaries->get_create (e);
sum->fnspec = xstrdup (bp_unpack_string (data_in, &bp));
}
modref_read_escape_summary (&bp, e);
}
}
if (dump_file)
{
fprintf (dump_file, "Read modref for %s\n",
node->dump_name ());
if (modref_sum)
modref_sum->dump (dump_file);
if (modref_sum_lto)
modref_sum_lto->dump (dump_file);
dump_modref_edge_summaries (dump_file, node, 4);
}
}
lto_free_section_data (file_data, LTO_section_ipa_modref, NULL, data,
len);
lto_data_in_delete (data_in);
}
/* Callback for read_summary. */
static void
modref_read (void)
{
struct lto_file_decl_data **file_data_vec = lto_get_file_decl_data ();
struct lto_file_decl_data *file_data;
unsigned int j = 0;
gcc_checking_assert (!optimization_summaries && !summaries && !summaries_lto);
if (flag_ltrans)
optimization_summaries = modref_summaries::create_ggc (symtab);
else
{
if (flag_wpa || flag_incremental_link == INCREMENTAL_LINK_LTO)
summaries_lto = modref_summaries_lto::create_ggc (symtab);
if (!flag_wpa
|| (flag_incremental_link == INCREMENTAL_LINK_LTO
&& flag_fat_lto_objects))
summaries = modref_summaries::create_ggc (symtab);
if (!fnspec_summaries)
fnspec_summaries = new fnspec_summaries_t (symtab);
if (!escape_summaries)
escape_summaries = new escape_summaries_t (symtab);
}
while ((file_data = file_data_vec[j++]))
{
size_t len;
const char *data = lto_get_summary_section_data (file_data,
LTO_section_ipa_modref,
&len);
if (data)
read_section (file_data, data, len);
else
/* Fatal error here. We do not want to support compiling ltrans units
with different version of compiler or different flags than the WPA
unit, so this should never happen. */
fatal_error (input_location,
"IPA modref summary is missing in input file");
}
}
/* Recompute arg_flags for param adjustments in INFO. */
static void
remap_arg_flags (auto_vec &arg_flags, clone_info *info)
{
auto_vec old = arg_flags.copy ();
int max = -1;
size_t i;
ipa_adjusted_param *p;
arg_flags.release ();
FOR_EACH_VEC_SAFE_ELT (info->param_adjustments->m_adj_params, i, p)
{
int o = info->param_adjustments->get_original_index (i);
if (o >= 0 && (int)old.length () > o && old[o])
max = i;
}
if (max >= 0)
arg_flags.safe_grow_cleared (max + 1, true);
FOR_EACH_VEC_SAFE_ELT (info->param_adjustments->m_adj_params, i, p)
{
int o = info->param_adjustments->get_original_index (i);
if (o >= 0 && (int)old.length () > o && old[o])
arg_flags[i] = old[o];
}
}
/* If signature changed, update the summary. */
static void
update_signature (struct cgraph_node *node)
{
clone_info *info = clone_info::get (node);
if (!info || !info->param_adjustments)
return;
modref_summary *r = optimization_summaries
? optimization_summaries->get (node) : NULL;
modref_summary_lto *r_lto = summaries_lto
? summaries_lto->get (node) : NULL;
if (!r && !r_lto)
return;
if (dump_file)
{
fprintf (dump_file, "Updating summary for %s from:\n",
node->dump_name ());
if (r)
r->dump (dump_file);
if (r_lto)
r_lto->dump (dump_file);
}
size_t i, max = 0;
ipa_adjusted_param *p;
FOR_EACH_VEC_SAFE_ELT (info->param_adjustments->m_adj_params, i, p)
{
int idx = info->param_adjustments->get_original_index (i);
if (idx > (int)max)
max = idx;
}
auto_vec map;
map.reserve (max + 1);
for (i = 0; i <= max; i++)
map.quick_push (-1);
FOR_EACH_VEC_SAFE_ELT (info->param_adjustments->m_adj_params, i, p)
{
int idx = info->param_adjustments->get_original_index (i);
if (idx >= 0)
map[idx] = i;
}
if (r)
{
r->loads->remap_params (&map);
r->stores->remap_params (&map);
if (r->arg_flags.length ())
remap_arg_flags (r->arg_flags, info);
}
if (r_lto)
{
r_lto->loads->remap_params (&map);
r_lto->stores->remap_params (&map);
if (r_lto->arg_flags.length ())
remap_arg_flags (r_lto->arg_flags, info);
}
if (dump_file)
{
fprintf (dump_file, "to:\n");
if (r)
r->dump (dump_file);
if (r_lto)
r_lto->dump (dump_file);
}
return;
}
/* Definition of the modref IPA pass. */
const pass_data pass_data_ipa_modref =
{
IPA_PASS, /* type */
"modref", /* name */
OPTGROUP_IPA, /* optinfo_flags */
TV_IPA_MODREF, /* tv_id */
0, /* properties_required */
0, /* properties_provided */
0, /* properties_destroyed */
0, /* todo_flags_start */
( TODO_dump_symtab ), /* todo_flags_finish */
};
class pass_ipa_modref : public ipa_opt_pass_d
{
public:
pass_ipa_modref (gcc::context *ctxt)
: ipa_opt_pass_d (pass_data_ipa_modref, ctxt,
modref_generate, /* generate_summary */
modref_write, /* write_summary */
modref_read, /* read_summary */
modref_write, /* write_optimization_summary */
modref_read, /* read_optimization_summary */
NULL, /* stmt_fixup */
0, /* function_transform_todo_flags_start */
NULL, /* function_transform */
NULL) /* variable_transform */
{}
/* opt_pass methods: */
opt_pass *clone () { return new pass_ipa_modref (m_ctxt); }
virtual bool gate (function *)
{
return true;
}
virtual unsigned int execute (function *);
};
}
unsigned int pass_modref::execute (function *f)
{
analyze_function (f, false);
return 0;
}
gimple_opt_pass *
make_pass_modref (gcc::context *ctxt)
{
return new pass_modref (ctxt);
}
ipa_opt_pass_d *
make_pass_ipa_modref (gcc::context *ctxt)
{
return new pass_ipa_modref (ctxt);
}
/* Skip edges from and to nodes without ipa_pure_const enabled.
Ignore not available symbols. */
static bool
ignore_edge (struct cgraph_edge *e)
{
/* We merge summaries of inline clones into summaries of functions they
are inlined to. For that reason the complete function bodies must
act as unit. */
if (!e->inline_failed)
return false;
enum availability avail;
cgraph_node *callee = e->callee->function_or_virtual_thunk_symbol
(&avail, e->caller);
return (avail <= AVAIL_INTERPOSABLE
|| ((!optimization_summaries || !optimization_summaries->get (callee))
&& (!summaries_lto || !summaries_lto->get (callee)))
|| flags_from_decl_or_type (e->callee->decl)
& (ECF_CONST | ECF_NOVOPS));
}
/* Compute parm_map for CALLEE_EDGE. */
static bool
compute_parm_map (cgraph_edge *callee_edge, vec *parm_map)
{
class ipa_edge_args *args;
if (ipa_node_params_sum
&& !callee_edge->call_stmt_cannot_inline_p
&& (args = ipa_edge_args_sum->get (callee_edge)) != NULL)
{
int i, count = ipa_get_cs_argument_count (args);
class ipa_node_params *caller_parms_info, *callee_pi;
class ipa_call_summary *es
= ipa_call_summaries->get (callee_edge);
cgraph_node *callee
= callee_edge->callee->function_or_virtual_thunk_symbol
(NULL, callee_edge->caller);
caller_parms_info
= ipa_node_params_sum->get (callee_edge->caller->inlined_to
? callee_edge->caller->inlined_to
: callee_edge->caller);
callee_pi = ipa_node_params_sum->get (callee);
(*parm_map).safe_grow_cleared (count, true);
for (i = 0; i < count; i++)
{
if (es && es->param[i].points_to_local_or_readonly_memory)
{
(*parm_map)[i].parm_index = -2;
continue;
}
struct ipa_jump_func *jf
= ipa_get_ith_jump_func (args, i);
if (jf && callee_pi)
{
tree cst = ipa_value_from_jfunc (caller_parms_info,
jf,
ipa_get_type
(callee_pi, i));
if (cst && points_to_local_or_readonly_memory_p (cst))
{
(*parm_map)[i].parm_index = -2;
continue;
}
}
if (jf && jf->type == IPA_JF_PASS_THROUGH)
{
(*parm_map)[i].parm_index
= ipa_get_jf_pass_through_formal_id (jf);
if (ipa_get_jf_pass_through_operation (jf) == NOP_EXPR)
{
(*parm_map)[i].parm_offset_known = true;
(*parm_map)[i].parm_offset = 0;
}
else if (ipa_get_jf_pass_through_operation (jf)
== POINTER_PLUS_EXPR
&& ptrdiff_tree_p (ipa_get_jf_pass_through_operand (jf),
&(*parm_map)[i].parm_offset))
(*parm_map)[i].parm_offset_known = true;
else
(*parm_map)[i].parm_offset_known = false;
continue;
}
if (jf && jf->type == IPA_JF_ANCESTOR)
{
(*parm_map)[i].parm_index = ipa_get_jf_ancestor_formal_id (jf);
(*parm_map)[i].parm_offset_known = true;
gcc_checking_assert
(!(ipa_get_jf_ancestor_offset (jf) & (BITS_PER_UNIT - 1)));
(*parm_map)[i].parm_offset
= ipa_get_jf_ancestor_offset (jf) >> LOG2_BITS_PER_UNIT;
}
else
(*parm_map)[i].parm_index = -1;
}
if (dump_file)
{
fprintf (dump_file, " Parm map: ");
for (i = 0; i < count; i++)
fprintf (dump_file, " %i", (*parm_map)[i].parm_index);
fprintf (dump_file, "\n");
}
return true;
}
return false;
}
/* Map used to translate escape infos. */
struct escape_map
{
int parm_index;
bool direct;
};
/* Update escape map fo E. */
static void
update_escape_summary_1 (cgraph_edge *e,
vec > &map,
bool ignore_stores)
{
escape_summary *sum = escape_summaries->get (e);
if (!sum)
return;
auto_vec old = sum->esc.copy ();
sum->esc.release ();
unsigned int i;
escape_entry *ee;
FOR_EACH_VEC_ELT (old, i, ee)
{
unsigned int j;
struct escape_map *em;
if (ee->parm_index >= map.length ())
continue;
FOR_EACH_VEC_ELT (map[ee->parm_index], j, em)
{
int min_flags = ee->min_flags;
if (ee->direct && !em->direct)
min_flags = deref_flags (min_flags, ignore_stores);
struct escape_entry entry = {em->parm_index, ee->arg,
ee->min_flags,
ee->direct & em->direct};
sum->esc.safe_push (entry);
}
}
if (!sum->esc.length ())
escape_summaries->remove (e);
}
/* Update escape map fo NODE. */
static void
update_escape_summary (cgraph_node *node,
vec > &map,
bool ignore_stores)
{
if (!escape_summaries)
return;
for (cgraph_edge *e = node->indirect_calls; e; e = e->next_callee)
update_escape_summary_1 (e, map, ignore_stores);
for (cgraph_edge *e = node->callees; e; e = e->next_callee)
{
if (!e->inline_failed)
update_escape_summary (e->callee, map, ignore_stores);
else
update_escape_summary_1 (e, map, ignore_stores);
}
}
/* Call EDGE was inlined; merge summary from callee to the caller. */
void
ipa_merge_modref_summary_after_inlining (cgraph_edge *edge)
{
if (!summaries && !summaries_lto)
return;
struct cgraph_node *to = (edge->caller->inlined_to
? edge->caller->inlined_to : edge->caller);
class modref_summary *to_info = summaries ? summaries->get (to) : NULL;
class modref_summary_lto *to_info_lto = summaries_lto
? summaries_lto->get (to) : NULL;
if (!to_info && !to_info_lto)
{
if (summaries)
summaries->remove (edge->callee);
if (summaries_lto)
summaries_lto->remove (edge->callee);
remove_modref_edge_summaries (edge->callee);
return;
}
class modref_summary *callee_info = summaries ? summaries->get (edge->callee)
: NULL;
class modref_summary_lto *callee_info_lto
= summaries_lto ? summaries_lto->get (edge->callee) : NULL;
int flags = flags_from_decl_or_type (edge->callee->decl);
bool ignore_stores = ignore_stores_p (edge->caller->decl, flags);
if (!callee_info && to_info)
{
if (!(flags & (ECF_CONST | ECF_NOVOPS)))
to_info->loads->collapse ();
if (!ignore_stores)
to_info->stores->collapse ();
}
if (!callee_info_lto && to_info_lto)
{
if (!(flags & (ECF_CONST | ECF_NOVOPS)))
to_info_lto->loads->collapse ();
if (!ignore_stores)
to_info_lto->stores->collapse ();
}
if (callee_info || callee_info_lto)
{
auto_vec parm_map;
compute_parm_map (edge, &parm_map);
if (!ignore_stores)
{
if (to_info && callee_info)
to_info->stores->merge (callee_info->stores, &parm_map, false);
if (to_info_lto && callee_info_lto)
to_info_lto->stores->merge (callee_info_lto->stores, &parm_map,
false);
}
if (!(flags & (ECF_CONST | ECF_NOVOPS)))
{
if (to_info && callee_info)
to_info->loads->merge (callee_info->loads, &parm_map, false);
if (to_info_lto && callee_info_lto)
to_info_lto->loads->merge (callee_info_lto->loads, &parm_map,
false);
}
}
/* Now merge escape summaries.
For every escape to the callee we need to merge calle flags
and remap calees escapes. */
class escape_summary *sum = escape_summaries->get (edge);
int max_escape = -1;
escape_entry *ee;
unsigned int i;
if (sum && !(flags & (ECF_CONST | ECF_NOVOPS)))
FOR_EACH_VEC_ELT (sum->esc, i, ee)
if ((int)ee->arg > max_escape)
max_escape = ee->arg;
auto_vec , 32> emap (max_escape + 1);
emap.safe_grow (max_escape + 1, true);
for (i = 0; (int)i < max_escape + 1; i++)
emap[i] = vNULL;
if (sum && !(flags & (ECF_CONST | ECF_NOVOPS)))
FOR_EACH_VEC_ELT (sum->esc, i, ee)
{
bool needed = false;
if (to_info && to_info->arg_flags.length () > ee->parm_index)
{
int flags = callee_info
&& callee_info->arg_flags.length () > ee->arg
? callee_info->arg_flags[ee->arg] : 0;
if (!ee->direct)
flags = deref_flags (flags, ignore_stores);
else if (ignore_stores)
flags |= ignore_stores_eaf_flags;
flags |= ee->min_flags;
to_info->arg_flags[ee->parm_index] &= flags;
if (to_info->arg_flags[ee->parm_index])
needed = true;
}
if (to_info_lto && to_info_lto->arg_flags.length () > ee->parm_index)
{
int flags = callee_info_lto
&& callee_info_lto->arg_flags.length () > ee->arg
? callee_info_lto->arg_flags[ee->arg] : 0;
if (!ee->direct)
flags = deref_flags (flags, ignore_stores);
else if (ignore_stores)
flags |= ignore_stores_eaf_flags;
flags |= ee->min_flags;
to_info_lto->arg_flags[ee->parm_index] &= flags;
if (to_info_lto->arg_flags[ee->parm_index])
needed = true;
}
struct escape_map entry = {ee->parm_index, ee->direct};
if (needed)
emap[ee->arg].safe_push (entry);
}
update_escape_summary (edge->callee, emap, ignore_stores);
for (i = 0; (int)i < max_escape + 1; i++)
emap[i].release ();
if (sum)
escape_summaries->remove (edge);
if (summaries)
{
if (to_info && !to_info->useful_p (flags))
{
if (dump_file)
fprintf (dump_file, "Removed mod-ref summary for %s\n",
to->dump_name ());
summaries->remove (to);
to_info = NULL;
}
else if (to_info && dump_file)
{
if (dump_file)
fprintf (dump_file, "Updated mod-ref summary for %s\n",
to->dump_name ());
to_info->dump (dump_file);
}
if (callee_info)
summaries->remove (edge->callee);
}
if (summaries_lto)
{
if (to_info_lto && !to_info_lto->useful_p (flags))
{
if (dump_file)
fprintf (dump_file, "Removed mod-ref summary for %s\n",
to->dump_name ());
summaries_lto->remove (to);
}
else if (to_info_lto && dump_file)
{
if (dump_file)
fprintf (dump_file, "Updated mod-ref summary for %s\n",
to->dump_name ());
to_info_lto->dump (dump_file);
to_info_lto = NULL;
}
if (callee_info_lto)
summaries_lto->remove (edge->callee);
}
if (!to_info && !to_info_lto)
remove_modref_edge_summaries (to);
return;
}
/* Get parameter type from DECL. This is only safe for special cases
like builtins we create fnspec for because the type match is checked
at fnspec creation time. */
static tree
get_parm_type (tree decl, unsigned int i)
{
tree t = TYPE_ARG_TYPES (TREE_TYPE (decl));
for (unsigned int p = 0; p < i; p++)
t = TREE_CHAIN (t);
return TREE_VALUE (t);
}
/* Return access mode for argument I of call E with FNSPEC. */
static modref_access_node
get_access_for_fnspec (cgraph_edge *e, attr_fnspec &fnspec,
unsigned int i, modref_parm_map &map)
{
tree size = NULL_TREE;
unsigned int size_arg;
if (!fnspec.arg_specified_p (i))
;
else if (fnspec.arg_max_access_size_given_by_arg_p (i, &size_arg))
{
cgraph_node *node = e->caller->inlined_to
? e->caller->inlined_to : e->caller;
ipa_node_params *caller_parms_info = ipa_node_params_sum->get (node);
ipa_edge_args *args = ipa_edge_args_sum->get (e);
struct ipa_jump_func *jf = ipa_get_ith_jump_func (args, size_arg);
if (jf)
size = ipa_value_from_jfunc (caller_parms_info, jf,
get_parm_type (e->callee->decl, size_arg));
}
else if (fnspec.arg_access_size_given_by_type_p (i))
size = TYPE_SIZE_UNIT (get_parm_type (e->callee->decl, i));
modref_access_node a = {0, -1, -1,
map.parm_offset, map.parm_index,
map.parm_offset_known, 0};
poly_int64 size_hwi;
if (size
&& poly_int_tree_p (size, &size_hwi)
&& coeffs_in_range_p (size_hwi, 0,
HOST_WIDE_INT_MAX / BITS_PER_UNIT))
{
a.size = -1;
a.max_size = size_hwi << LOG2_BITS_PER_UNIT;
}
return a;
}
/* Call E in NODE with ECF_FLAGS has no summary; update MODREF_SUMMARY and
CUR_SUMMARY_LTO accordingly. Return true if something changed. */
static bool
propagate_unknown_call (cgraph_node *node,
cgraph_edge *e, int ecf_flags,
modref_summary *cur_summary,
modref_summary_lto *cur_summary_lto)
{
bool changed = false;
class fnspec_summary *fnspec_sum = fnspec_summaries->get (e);
auto_vec parm_map;
if (fnspec_sum
&& compute_parm_map (e, &parm_map))
{
attr_fnspec fnspec (fnspec_sum->fnspec);
gcc_checking_assert (fnspec.known_p ());
if (fnspec.global_memory_read_p ())
collapse_loads (cur_summary, cur_summary_lto);
else
{
tree t = TYPE_ARG_TYPES (TREE_TYPE (e->callee->decl));
for (unsigned i = 0; i < parm_map.length () && t;
i++, t = TREE_CHAIN (t))
if (!POINTER_TYPE_P (TREE_VALUE (t)))
;
else if (!fnspec.arg_specified_p (i)
|| fnspec.arg_maybe_read_p (i))
{
modref_parm_map map = parm_map[i];
if (map.parm_index == -2)
continue;
if (map.parm_index == -1)
{
collapse_loads (cur_summary, cur_summary_lto);
break;
}
if (cur_summary)
changed |= cur_summary->loads->insert
(0, 0, get_access_for_fnspec (e, fnspec, i, map), false);
if (cur_summary_lto)
changed |= cur_summary_lto->loads->insert
(0, 0, get_access_for_fnspec (e, fnspec, i, map), false);
}
}
if (ignore_stores_p (node->decl, ecf_flags))
;
else if (fnspec.global_memory_written_p ())
collapse_stores (cur_summary, cur_summary_lto);
else
{
tree t = TYPE_ARG_TYPES (TREE_TYPE (e->callee->decl));
for (unsigned i = 0; i < parm_map.length () && t;
i++, t = TREE_CHAIN (t))
if (!POINTER_TYPE_P (TREE_VALUE (t)))
;
else if (!fnspec.arg_specified_p (i)
|| fnspec.arg_maybe_written_p (i))
{
modref_parm_map map = parm_map[i];
if (map.parm_index == -2)
continue;
if (map.parm_index == -1)
{
collapse_stores (cur_summary, cur_summary_lto);
break;
}
if (cur_summary)
changed |= cur_summary->stores->insert
(0, 0, get_access_for_fnspec (e, fnspec, i, map), false);
if (cur_summary_lto)
changed |= cur_summary_lto->stores->insert
(0, 0, get_access_for_fnspec (e, fnspec, i, map), false);
}
}
if (fnspec.errno_maybe_written_p () && flag_errno_math)
{
if (cur_summary && !cur_summary->writes_errno)
{
cur_summary->writes_errno = true;
changed = true;
}
if (cur_summary_lto && !cur_summary_lto->writes_errno)
{
cur_summary_lto->writes_errno = true;
changed = true;
}
}
return changed;
}
if (dump_file)
fprintf (dump_file, " collapsing loads\n");
changed |= collapse_loads (cur_summary, cur_summary_lto);
if (!ignore_stores_p (node->decl, ecf_flags))
{
if (dump_file)
fprintf (dump_file, " collapsing stores\n");
changed |= collapse_stores (cur_summary, cur_summary_lto);
}
return changed;
}
/* Maybe remove summaies of NODE pointed to by CUR_SUMMARY_PTR
and CUR_SUMMARY_LTO_PTR if they are useless according to ECF_FLAGS. */
static void
remove_useless_summaries (cgraph_node *node,
modref_summary **cur_summary_ptr,
modref_summary_lto **cur_summary_lto_ptr,
int ecf_flags)
{
if (*cur_summary_ptr && !(*cur_summary_ptr)->useful_p (ecf_flags, false))
{
optimization_summaries->remove (node);
*cur_summary_ptr = NULL;
}
if (*cur_summary_lto_ptr
&& !(*cur_summary_lto_ptr)->useful_p (ecf_flags, false))
{
summaries_lto->remove (node);
*cur_summary_lto_ptr = NULL;
}
}
/* Perform iterative dataflow on SCC component starting in COMPONENT_NODE
and propagate loads/stores. */
static void
modref_propagate_in_scc (cgraph_node *component_node)
{
bool changed = true;
bool first = true;
int iteration = 0;
while (changed)
{
changed = false;
for (struct cgraph_node *cur = component_node; cur;
cur = ((struct ipa_dfs_info *) cur->aux)->next_cycle)
{
cgraph_node *node = cur->inlined_to ? cur->inlined_to : cur;
modref_summary *cur_summary = optimization_summaries
? optimization_summaries->get (node)
: NULL;
modref_summary_lto *cur_summary_lto = summaries_lto
? summaries_lto->get (node)
: NULL;
if (!cur_summary && !cur_summary_lto)
continue;
int cur_ecf_flags = flags_from_decl_or_type (node->decl);
if (dump_file)
fprintf (dump_file, " Processing %s%s%s\n",
cur->dump_name (),
TREE_READONLY (cur->decl) ? " (const)" : "",
DECL_PURE_P (cur->decl) ? " (pure)" : "");
for (cgraph_edge *e = cur->indirect_calls; e; e = e->next_callee)
{
if (e->indirect_info->ecf_flags & (ECF_CONST | ECF_NOVOPS))
continue;
if (dump_file)
fprintf (dump_file, " Indirect call"
"collapsing loads\n");
if (propagate_unknown_call
(node, e, e->indirect_info->ecf_flags,
cur_summary, cur_summary_lto))
{
changed = true;
remove_useless_summaries (node, &cur_summary,
&cur_summary_lto,
cur_ecf_flags);
if (!cur_summary && !cur_summary_lto)
break;
}
}
if (!cur_summary && !cur_summary_lto)
continue;
for (cgraph_edge *callee_edge = cur->callees; callee_edge;
callee_edge = callee_edge->next_callee)
{
int flags = flags_from_decl_or_type (callee_edge->callee->decl);
modref_summary *callee_summary = NULL;
modref_summary_lto *callee_summary_lto = NULL;
struct cgraph_node *callee;
if (flags & (ECF_CONST | ECF_NOVOPS)
|| !callee_edge->inline_failed)
continue;
/* Get the callee and its summary. */
enum availability avail;
callee = callee_edge->callee->function_or_virtual_thunk_symbol
(&avail, cur);
/* It is not necessary to re-process calls outside of the
SCC component. */
if (iteration > 0
&& (!callee->aux
|| ((struct ipa_dfs_info *)cur->aux)->scc_no
!= ((struct ipa_dfs_info *)callee->aux)->scc_no))
continue;
if (dump_file)
fprintf (dump_file, " Call to %s\n",
callee_edge->callee->dump_name ());
bool ignore_stores = ignore_stores_p (cur->decl, flags);
if (avail <= AVAIL_INTERPOSABLE)
{
if (dump_file)
fprintf (dump_file, " Call target interposable"
" or not available\n");
changed |= propagate_unknown_call
(node, callee_edge, flags,
cur_summary, cur_summary_lto);
if (!cur_summary && !cur_summary_lto)
break;
continue;
}
/* We don't know anything about CALLEE, hence we cannot tell
anything about the entire component. */
if (cur_summary
&& !(callee_summary = optimization_summaries->get (callee)))
{
if (dump_file)
fprintf (dump_file, " No call target summary\n");
changed |= propagate_unknown_call
(node, callee_edge, flags,
cur_summary, NULL);
}
if (cur_summary_lto
&& !(callee_summary_lto = summaries_lto->get (callee)))
{
if (dump_file)
fprintf (dump_file, " No call target summary\n");
changed |= propagate_unknown_call
(node, callee_edge, flags,
NULL, cur_summary_lto);
}
/* We can not safely optimize based on summary of callee if it
does not always bind to current def: it is possible that
memory load was optimized out earlier which may not happen in
the interposed variant. */
if (!callee_edge->binds_to_current_def_p ())
{
changed |= collapse_loads (cur_summary, cur_summary_lto);
if (dump_file)
fprintf (dump_file, " May not bind local;"
" collapsing loads\n");
}
auto_vec parm_map;
compute_parm_map (callee_edge, &parm_map);
/* Merge in callee's information. */
if (callee_summary)
{
changed |= cur_summary->loads->merge
(callee_summary->loads, &parm_map, !first);
if (!ignore_stores)
{
changed |= cur_summary->stores->merge
(callee_summary->stores, &parm_map,
!first);
if (!cur_summary->writes_errno
&& callee_summary->writes_errno)
{
cur_summary->writes_errno = true;
changed = true;
}
}
}
if (callee_summary_lto)
{
changed |= cur_summary_lto->loads->merge
(callee_summary_lto->loads, &parm_map,
!first);
if (!ignore_stores)
{
changed |= cur_summary_lto->stores->merge
(callee_summary_lto->stores, &parm_map,
!first);
if (!cur_summary_lto->writes_errno
&& callee_summary_lto->writes_errno)
{
cur_summary_lto->writes_errno = true;
changed = true;
}
}
}
if (changed)
remove_useless_summaries (node, &cur_summary,
&cur_summary_lto,
cur_ecf_flags);
if (!cur_summary && !cur_summary_lto)
break;
if (dump_file && changed)
{
if (cur_summary)
cur_summary->dump (dump_file);
if (cur_summary_lto)
cur_summary_lto->dump (dump_file);
dump_modref_edge_summaries (dump_file, node, 4);
}
}
}
iteration++;
first = false;
}
if (dump_file)
fprintf (dump_file,
"Propagation finished in %i iterations\n", iteration);
}
/* Dump results of propagation in SCC rooted in COMPONENT_NODE. */
static void
modref_propagate_dump_scc (cgraph_node *component_node)
{
for (struct cgraph_node *cur = component_node; cur;
cur = ((struct ipa_dfs_info *) cur->aux)->next_cycle)
if (!cur->inlined_to)
{
modref_summary *cur_summary = optimization_summaries
? optimization_summaries->get (cur)
: NULL;
modref_summary_lto *cur_summary_lto = summaries_lto
? summaries_lto->get (cur)
: NULL;
fprintf (dump_file, "Propagated modref for %s%s%s\n",
cur->dump_name (),
TREE_READONLY (cur->decl) ? " (const)" : "",
DECL_PURE_P (cur->decl) ? " (pure)" : "");
if (optimization_summaries)
{
if (cur_summary)
cur_summary->dump (dump_file);
else
fprintf (dump_file, " Not tracked\n");
}
if (summaries_lto)
{
if (cur_summary_lto)
cur_summary_lto->dump (dump_file);
else
fprintf (dump_file, " Not tracked (lto)\n");
}
}
}
/* Process escapes in SUM and merge SUMMARY to CUR_SUMMARY
and SUMMARY_LTO to CUR_SUMMARY_LTO.
Return true if something changed. */
static bool
modref_merge_call_site_flags (escape_summary *sum,
modref_summary *cur_summary,
modref_summary_lto *cur_summary_lto,
modref_summary *summary,
modref_summary_lto *summary_lto,
tree caller,
int ecf_flags)
{
escape_entry *ee;
unsigned int i;
bool changed = false;
bool ignore_stores = ignore_stores_p (caller, ecf_flags);
/* If we have no useful info to propagate. */
if ((!cur_summary || !cur_summary->arg_flags.length ())
&& (!cur_summary_lto || !cur_summary_lto->arg_flags.length ()))
return false;
FOR_EACH_VEC_ELT (sum->esc, i, ee)
{
int flags = 0;
int flags_lto = 0;
if (summary && ee->arg < summary->arg_flags.length ())
flags = summary->arg_flags[ee->arg];
if (summary_lto
&& ee->arg < summary_lto->arg_flags.length ())
flags_lto = summary_lto->arg_flags[ee->arg];
if (!ee->direct)
{
flags = deref_flags (flags, ignore_stores);
flags_lto = deref_flags (flags_lto, ignore_stores);
}
else if (ignore_stores)
{
flags |= ignore_stores_eaf_flags;
flags_lto |= ignore_stores_eaf_flags;
}
/* Returning the value is already accounted to at local propagation. */
flags |= ee->min_flags | EAF_NOT_RETURNED;
flags_lto |= ee->min_flags | EAF_NOT_RETURNED;
/* Noescape implies that value also does not escape directly.
Fnspec machinery does set both so compensate for this. */
if (flags & EAF_NOESCAPE)
flags |= EAF_NODIRECTESCAPE;
if (flags_lto & EAF_NOESCAPE)
flags_lto |= EAF_NODIRECTESCAPE;
if (!(flags & EAF_UNUSED)
&& cur_summary && ee->parm_index < cur_summary->arg_flags.length ())
{
int f = cur_summary->arg_flags[ee->parm_index];
if ((f & flags) != f)
{
f = remove_useless_eaf_flags
(f & flags, ecf_flags,
VOID_TYPE_P (TREE_TYPE (TREE_TYPE (caller))));
cur_summary->arg_flags[ee->parm_index] = f;
changed = true;
}
}
if (!(flags_lto & EAF_UNUSED)
&& cur_summary_lto
&& ee->parm_index < cur_summary_lto->arg_flags.length ())
{
int f = cur_summary_lto->arg_flags[ee->parm_index];
if ((f & flags_lto) != f)
{
f = remove_useless_eaf_flags
(f & flags_lto, ecf_flags,
VOID_TYPE_P (TREE_TYPE (TREE_TYPE (caller))));
cur_summary_lto->arg_flags[ee->parm_index] = f;
changed = true;
}
}
}
return changed;
}
/* Perform iterative dataflow on SCC component starting in COMPONENT_NODE
and propagate arg flags. */
static void
modref_propagate_flags_in_scc (cgraph_node *component_node)
{
bool changed = true;
int iteration = 0;
while (changed)
{
changed = false;
for (struct cgraph_node *cur = component_node; cur;
cur = ((struct ipa_dfs_info *) cur->aux)->next_cycle)
{
cgraph_node *node = cur->inlined_to ? cur->inlined_to : cur;
modref_summary *cur_summary = optimization_summaries
? optimization_summaries->get (node)
: NULL;
modref_summary_lto *cur_summary_lto = summaries_lto
? summaries_lto->get (node)
: NULL;
if (!cur_summary && !cur_summary_lto)
continue;
if (dump_file)
fprintf (dump_file, " Processing %s%s%s\n",
cur->dump_name (),
TREE_READONLY (cur->decl) ? " (const)" : "",
DECL_PURE_P (cur->decl) ? " (pure)" : "");
for (cgraph_edge *e = cur->indirect_calls; e; e = e->next_callee)
{
escape_summary *sum = escape_summaries->get (e);
if (!sum || (e->indirect_info->ecf_flags
& (ECF_CONST | ECF_NOVOPS)))
continue;
changed |= modref_merge_call_site_flags
(sum, cur_summary, cur_summary_lto,
NULL, NULL,
node->decl, e->indirect_info->ecf_flags);
}
if (!cur_summary && !cur_summary_lto)
continue;
for (cgraph_edge *callee_edge = cur->callees; callee_edge;
callee_edge = callee_edge->next_callee)
{
int ecf_flags = flags_from_decl_or_type
(callee_edge->callee->decl);
modref_summary *callee_summary = NULL;
modref_summary_lto *callee_summary_lto = NULL;
struct cgraph_node *callee;
if (ecf_flags & (ECF_CONST | ECF_NOVOPS)
|| !callee_edge->inline_failed)
continue;
/* Get the callee and its summary. */
enum availability avail;
callee = callee_edge->callee->function_or_virtual_thunk_symbol
(&avail, cur);
/* It is not necessary to re-process calls outside of the
SCC component. */
if (iteration > 0
&& (!callee->aux
|| ((struct ipa_dfs_info *)cur->aux)->scc_no
!= ((struct ipa_dfs_info *)callee->aux)->scc_no))
continue;
escape_summary *sum = escape_summaries->get (callee_edge);
if (!sum)
continue;
if (dump_file)
fprintf (dump_file, " Call to %s\n",
callee_edge->callee->dump_name ());
if (avail <= AVAIL_INTERPOSABLE
|| callee_edge->call_stmt_cannot_inline_p)
;
else
{
if (cur_summary)
callee_summary = optimization_summaries->get (callee);
if (cur_summary_lto)
callee_summary_lto = summaries_lto->get (callee);
}
changed |= modref_merge_call_site_flags
(sum, cur_summary, cur_summary_lto,
callee_summary, callee_summary_lto,
node->decl, ecf_flags);
if (dump_file && changed)
{
if (cur_summary)
cur_summary->dump (dump_file);
if (cur_summary_lto)
cur_summary_lto->dump (dump_file);
}
}
}
iteration++;
}
if (dump_file)
fprintf (dump_file,
"Propagation of flags finished in %i iterations\n", iteration);
}
/* Run the IPA pass. This will take a function's summaries and calls and
construct new summaries which represent a transitive closure. So that
summary of an analyzed function contains information about the loads and
stores that the function or any function that it calls does. */
unsigned int
pass_ipa_modref::execute (function *)
{
if (!summaries && !summaries_lto)
return 0;
if (optimization_summaries)
ggc_delete (optimization_summaries);
optimization_summaries = summaries;
summaries = NULL;
struct cgraph_node **order = XCNEWVEC (struct cgraph_node *,
symtab->cgraph_count);
int order_pos;
order_pos = ipa_reduced_postorder (order, true, ignore_edge);
int i;
/* Iterate over all strongly connected components in post-order. */
for (i = 0; i < order_pos; i++)
{
/* Get the component's representative. That's just any node in the
component from which we can traverse the entire component. */
struct cgraph_node *component_node = order[i];
if (dump_file)
fprintf (dump_file, "\n\nStart of SCC component\n");
modref_propagate_in_scc (component_node);
modref_propagate_flags_in_scc (component_node);
if (dump_file)
modref_propagate_dump_scc (component_node);
}
cgraph_node *node;
FOR_EACH_FUNCTION (node)
update_signature (node);
if (summaries_lto)
((modref_summaries_lto *)summaries_lto)->propagated = true;
ipa_free_postorder_info ();
free (order);
delete fnspec_summaries;
fnspec_summaries = NULL;
delete escape_summaries;
escape_summaries = NULL;
return 0;
}
/* Summaries must stay alive until end of compilation. */
void
ipa_modref_c_finalize ()
{
if (optimization_summaries)
ggc_delete (optimization_summaries);
optimization_summaries = NULL;
gcc_checking_assert (!summaries
|| flag_incremental_link == INCREMENTAL_LINK_LTO);
if (summaries_lto)
ggc_delete (summaries_lto);
summaries_lto = NULL;
if (fnspec_summaries)
delete fnspec_summaries;
fnspec_summaries = NULL;
if (escape_summaries)
delete escape_summaries;
escape_summaries = NULL;
}
#include "gt-ipa-modref.h"