aboutsummaryrefslogtreecommitdiff
path: root/gcc/tree-ssa-loop-niter.c
diff options
context:
space:
mode:
authorKugan Vivekanandarajah <kuganv@linaro.org>2018-06-16 21:39:31 +0000
committerKugan Vivekanandarajah <kugan@gcc.gnu.org>2018-06-16 21:39:31 +0000
commit5126ae0c6eafd2bba09fc60a23cd9c0b292846c4 (patch)
treee7ade1440d60638b78b1ca38cf5a18a29153c582 /gcc/tree-ssa-loop-niter.c
parente197e64ee8ab8e46de9069a8d951bed720a0fd67 (diff)
downloadgcc-5126ae0c6eafd2bba09fc60a23cd9c0b292846c4.zip
gcc-5126ae0c6eafd2bba09fc60a23cd9c0b292846c4.tar.gz
gcc-5126ae0c6eafd2bba09fc60a23cd9c0b292846c4.tar.bz2
re PR middle-end/82479 (missing popcount builtin detection)
gcc/ChangeLog: 2018-06-16 Kugan Vivekanandarajah <kuganv@linaro.org> PR middle-end/82479 * ipa-fnsummary.c (will_be_nonconstant_expr_predicate): Handle CALL_EXPR. * tree-scalar-evolution.c (interpret_expr): Likewise. (expression_expensive_p): Likewise. * tree-ssa-loop-ivopts.c (contains_abnormal_ssa_name_p): Likewise. * tree-ssa-loop-niter.c (number_of_iterations_popcount): New. (number_of_iterations_exit_assumptions): Use number_of_iterations_popcount. (ssa_defined_by_minus_one_stmt_p): New. gcc/testsuite/ChangeLog: 2018-06-16 Kugan Vivekanandarajah <kuganv@linaro.org> PR middle-end/82479 * gcc.dg/tree-ssa/popcount.c: New test. * gcc.dg/tree-ssa/popcount2.c: New test. From-SVN: r261682
Diffstat (limited to 'gcc/tree-ssa-loop-niter.c')
-rw-r--r--gcc/tree-ssa-loop-niter.c176
1 files changed, 175 insertions, 1 deletions
diff --git a/gcc/tree-ssa-loop-niter.c b/gcc/tree-ssa-loop-niter.c
index 7a54c5f..9365915 100644
--- a/gcc/tree-ssa-loop-niter.c
+++ b/gcc/tree-ssa-loop-niter.c
@@ -63,6 +63,10 @@ struct bounds
mpz_t below, up;
};
+static bool number_of_iterations_popcount (loop_p loop, edge exit,
+ enum tree_code code,
+ struct tree_niter_desc *niter);
+
/* Splits expression EXPR to a variable part VAR and constant OFFSET. */
@@ -2357,7 +2361,7 @@ number_of_iterations_exit_assumptions (struct loop *loop, edge exit,
tree iv0_niters = NULL_TREE;
if (!simple_iv_with_niters (loop, loop_containing_stmt (stmt),
op0, &iv0, safe ? &iv0_niters : NULL, false))
- return false;
+ return number_of_iterations_popcount (loop, exit, code, niter);
tree iv1_niters = NULL_TREE;
if (!simple_iv_with_niters (loop, loop_containing_stmt (stmt),
op1, &iv1, safe ? &iv1_niters : NULL, false))
@@ -2430,6 +2434,176 @@ number_of_iterations_exit_assumptions (struct loop *loop, edge exit,
return (!integer_zerop (niter->assumptions));
}
+
+/* Utility function to check if OP is defined by a stmt
+ that is a val - 1. */
+
+static bool
+ssa_defined_by_minus_one_stmt_p (tree op, tree val)
+{
+ gimple *stmt;
+ return (TREE_CODE (op) == SSA_NAME
+ && (stmt = SSA_NAME_DEF_STMT (op))
+ && is_gimple_assign (stmt)
+ && (gimple_assign_rhs_code (stmt) == PLUS_EXPR)
+ && val == gimple_assign_rhs1 (stmt)
+ && integer_minus_onep (gimple_assign_rhs2 (stmt)));
+}
+
+
+/* See if LOOP is a popcout implementation, determine NITER for the loop
+
+ We match:
+ <bb 2>
+ goto <bb 4>
+
+ <bb 3>
+ _1 = b_11 + -1
+ b_6 = _1 & b_11
+
+ <bb 4>
+ b_11 = PHI <b_5(D)(2), b_6(3)>
+
+ exit block
+ if (b_11 != 0)
+ goto <bb 3>
+ else
+ goto <bb 5>
+
+ OR we match copy-header version:
+ if (b_5 != 0)
+ goto <bb 3>
+ else
+ goto <bb 4>
+
+ <bb 3>
+ b_11 = PHI <b_5(2), b_6(3)>
+ _1 = b_11 + -1
+ b_6 = _1 & b_11
+
+ exit block
+ if (b_6 != 0)
+ goto <bb 3>
+ else
+ goto <bb 4>
+
+ If popcount pattern, update NITER accordingly.
+ i.e., set NITER to __builtin_popcount (b)
+ return true if we did, false otherwise.
+
+ */
+
+static bool
+number_of_iterations_popcount (loop_p loop, edge exit,
+ enum tree_code code,
+ struct tree_niter_desc *niter)
+{
+ bool adjust = true;
+ tree iter;
+ HOST_WIDE_INT max;
+ adjust = true;
+ tree fn = NULL_TREE;
+
+ /* Check loop terminating branch is like
+ if (b != 0). */
+ gimple *stmt = last_stmt (exit->src);
+ if (!stmt
+ || gimple_code (stmt) != GIMPLE_COND
+ || code != NE_EXPR
+ || !integer_zerop (gimple_cond_rhs (stmt))
+ || TREE_CODE (gimple_cond_lhs (stmt)) != SSA_NAME)
+ return false;
+
+ gimple *and_stmt = SSA_NAME_DEF_STMT (gimple_cond_lhs (stmt));
+
+ /* Depending on copy-header is performed, feeding PHI stmts might be in
+ the loop header or loop latch, handle this. */
+ if (gimple_code (and_stmt) == GIMPLE_PHI
+ && gimple_bb (and_stmt) == loop->header
+ && gimple_phi_num_args (and_stmt) == 2
+ && (TREE_CODE (gimple_phi_arg_def (and_stmt,
+ loop_latch_edge (loop)->dest_idx))
+ == SSA_NAME))
+ {
+ /* SSA used in exit condition is defined by PHI stmt
+ b_11 = PHI <b_5(D)(2), b_6(3)>
+ from the PHI stmt, get the and_stmt
+ b_6 = _1 & b_11. */
+ tree t = gimple_phi_arg_def (and_stmt, loop_latch_edge (loop)->dest_idx);
+ and_stmt = SSA_NAME_DEF_STMT (t);
+ adjust = false;
+ }
+
+ /* Make sure it is indeed an and stmt (b_6 = _1 & b_11). */
+ if (!is_gimple_assign (and_stmt)
+ || gimple_assign_rhs_code (and_stmt) != BIT_AND_EXPR)
+ return false;
+
+ tree b_11 = gimple_assign_rhs1 (and_stmt);
+ tree _1 = gimple_assign_rhs2 (and_stmt);
+
+ /* Check that _1 is defined by _b11 + -1 (_1 = b_11 + -1).
+ Also make sure that b_11 is the same in and_stmt and _1 defining stmt.
+ Also canonicalize if _1 and _b11 are revrsed. */
+ if (ssa_defined_by_minus_one_stmt_p (b_11, _1))
+ std::swap (b_11, _1);
+ else if (ssa_defined_by_minus_one_stmt_p (_1, b_11))
+ ;
+ else
+ return false;
+ /* Check the recurrence:
+ ... = PHI <b_5(2), b_6(3)>. */
+ gimple *phi = SSA_NAME_DEF_STMT (b_11);
+ if (gimple_code (phi) != GIMPLE_PHI
+ || (gimple_assign_lhs (and_stmt)
+ != gimple_phi_arg_def (phi, loop_latch_edge (loop)->dest_idx)))
+ return false;
+
+ /* We found a match. Get the corresponding popcount builtin. */
+ tree src = gimple_phi_arg_def (phi, loop_preheader_edge (loop)->dest_idx);
+ if (TYPE_PRECISION (TREE_TYPE (src)) == TYPE_PRECISION (integer_type_node))
+ fn = builtin_decl_implicit (BUILT_IN_POPCOUNT);
+ else if (TYPE_PRECISION (TREE_TYPE (src)) == TYPE_PRECISION
+ (long_integer_type_node))
+ fn = builtin_decl_implicit (BUILT_IN_POPCOUNTL);
+ else if (TYPE_PRECISION (TREE_TYPE (src)) == TYPE_PRECISION
+ (long_long_integer_type_node))
+ fn = builtin_decl_implicit (BUILT_IN_POPCOUNTLL);
+
+ /* ??? Support promoting char/short to int. */
+ if (!fn)
+ return false;
+
+ /* Update NITER params accordingly */
+ max = TYPE_PRECISION (TREE_TYPE (src));
+ if (adjust)
+ max = max - 1;
+ tree utype = unsigned_type_for (TREE_TYPE (src));
+ src = fold_convert (utype, src);
+ tree call = fold_convert (utype, build_call_expr (fn, 1, src));
+ if (adjust)
+ iter = fold_build2 (MINUS_EXPR, utype,
+ call,
+ build_int_cst (utype, 1));
+ else
+ iter = call;
+
+ niter->niter = iter;
+ niter->assumptions = boolean_true_node;
+ if (adjust)
+ niter->may_be_zero = fold_build2 (EQ_EXPR, boolean_type_node, src,
+ build_zero_cst
+ (TREE_TYPE (src)));
+ else
+ niter->may_be_zero = boolean_false_node;
+
+ niter->max = max;
+ niter->bound = NULL_TREE;
+ niter->cmp = ERROR_MARK;
+ return true;
+}
+
+
/* Like number_of_iterations_exit_assumptions, but return TRUE only if
the niter information holds unconditionally. */