diff options
author | Wilco Dijkstra <wdijkstr@arm.com> | 2016-09-28 11:06:41 +0000 |
---|---|---|
committer | Wilco Dijkstra <wilco@gcc.gnu.org> | 2016-09-28 11:06:41 +0000 |
commit | 912d9ec300f1f1262b1ab09798304d0c99ff5778 (patch) | |
tree | 3c170771d3f815d96a6d0ba133a16b9fe28bc717 /gcc/gimple-fold.c | |
parent | 1b4be62ad3e153d2e4eda115698cbf33fca09781 (diff) | |
download | gcc-912d9ec300f1f1262b1ab09798304d0c99ff5778.zip gcc-912d9ec300f1f1262b1ab09798304d0c99ff5778.tar.gz gcc-912d9ec300f1f1262b1ab09798304d0c99ff5778.tar.bz2 |
Optimize strchr (s, 0) to s + strlen (s).
Optimize strchr (s, 0) to s + strlen (s). strchr (s, 0) appears a common
idiom for finding the end of a string, however it is not a very efficient
way of doing so. Strlen is a much simpler operation which is significantly
faster (eg. on x86 strlen is 50% faster for strings of 8 bytes and about
twice as fast as strchr on strings of 1KB).
gcc/
* gimple-fold.c (gimple_fold_builtin_strchr):
New function to optimize strchr (s, 0) to strlen.
(gimple_fold_builtin): Add BUILT_IN_STRCHR case.
testsuite/
* gcc.dg/strlenopt-20.c: Update test.
* gcc.dg/strlenopt-21.c: Likewise.
* gcc.dg/strlenopt-22.c: Likewise.
* gcc.dg/strlenopt-22g.c: Likewise.
* gcc.dg/strlenopt-26.c: Likewise.
* gcc.dg/strlenopt-5.c: Likewise.
* gcc.dg/strlenopt-7.c: Likewise.
* gcc.dg/strlenopt-9.c: Likewise.
From-SVN: r240568
Diffstat (limited to 'gcc/gimple-fold.c')
-rw-r--r-- | gcc/gimple-fold.c | 51 |
1 files changed, 51 insertions, 0 deletions
diff --git a/gcc/gimple-fold.c b/gcc/gimple-fold.c index 23e4516..f5a5e5d 100644 --- a/gcc/gimple-fold.c +++ b/gcc/gimple-fold.c @@ -1457,6 +1457,55 @@ gimple_fold_builtin_strncpy (gimple_stmt_iterator *gsi, return true; } +/* Simplify strchr (str, 0) into str + strlen (str). + In general strlen is significantly faster than strchr + due to being a simpler operation. */ +static bool +gimple_fold_builtin_strchr (gimple_stmt_iterator *gsi) +{ + gimple *stmt = gsi_stmt (*gsi); + tree str = gimple_call_arg (stmt, 0); + tree c = gimple_call_arg (stmt, 1); + location_t loc = gimple_location (stmt); + + if (optimize_function_for_size_p (cfun)) + return false; + + if (!integer_zerop (c) || !gimple_call_lhs (stmt)) + return false; + + tree len; + tree strlen_fn = builtin_decl_implicit (BUILT_IN_STRLEN); + + if (!strlen_fn) + return false; + + /* Create newstr = strlen (str). */ + gimple_seq stmts = NULL; + gimple *new_stmt = gimple_build_call (strlen_fn, 1, str); + gimple_set_location (new_stmt, loc); + if (gimple_in_ssa_p (cfun)) + len = make_ssa_name (size_type_node); + else + len = create_tmp_reg (size_type_node); + gimple_call_set_lhs (new_stmt, len); + gimple_seq_add_stmt_without_update (&stmts, new_stmt); + + /* Create (str p+ strlen (str)). */ + new_stmt = gimple_build_assign (gimple_call_lhs (stmt), + POINTER_PLUS_EXPR, str, len); + gimple_seq_add_stmt_without_update (&stmts, new_stmt); + gsi_replace_with_seq_vops (gsi, stmts); + /* gsi now points at the assignment to the lhs, get a + stmt iterator to the strlen. + ??? We can't use gsi_for_stmt as that doesn't work when the + CFG isn't built yet. */ + gimple_stmt_iterator gsi2 = *gsi; + gsi_prev (&gsi2); + fold_stmt (&gsi2); + return true; +} + /* Simplify a call to the strcat builtin. DST and SRC are the arguments to the call. @@ -2898,6 +2947,8 @@ gimple_fold_builtin (gimple_stmt_iterator *gsi) gimple_call_arg (stmt, 1)); case BUILT_IN_STRNCAT: return gimple_fold_builtin_strncat (gsi); + case BUILT_IN_STRCHR: + return gimple_fold_builtin_strchr (gsi); case BUILT_IN_FPUTS: return gimple_fold_builtin_fputs (gsi, gimple_call_arg (stmt, 0), gimple_call_arg (stmt, 1), false); |