diff mbox

Fold strstr (s, t) eq/ne s to strcmp (s, t) eq/ne 0 if strlen (t) is known

Message ID CAAgBjMmkzh17CUTFZYtTaNrs5=oLvabBrMc=Gvx-2OFPaparMw@mail.gmail.com
State New
Headers show

Commit Message

Prathamesh Kulkarni Dec. 9, 2016, 12:06 p.m. UTC
On 7 December 2016 at 17:36, Jakub Jelinek <jakub@redhat.com> wrote:
> On Wed, Dec 07, 2016 at 05:02:46PM +0530, Prathamesh Kulkarni wrote:

>> +                       if (arg1_len == NULL_TREE)

>> +                         {

>> +                           gimple_stmt_iterator gsi;

>> +                           tree strlen_decl;

>> +                           gimple *strlen_call;

>> +

>> +                           strlen_decl = builtin_decl_explicit (BUILT_IN_STRLEN);

>> +                           strlen_call = gimple_build_call (strlen_decl, 1,

>> +                                                            arg1);

>> +                           arg1_len = make_ssa_name (size_type_node);

>> +                           gimple_call_set_lhs (strlen_call, arg1_len);

>> +                           update_stmt (strlen_call);

>> +                           gsi = gsi_for_stmt (call_stmt);

>> +                           gsi_insert_before (&gsi, strlen_call, GSI_SAME_STMT);

>> +                         }

>

> Why?  If the strlen isn't readily available, do you really think it is

> always a win to replace one call with 2 calls?  The string you want to do

> strlen on can be huge, the haystack could be empty or very short, etc.

> I'd just punt if strlen isn't known.

>> +

>> +                       gimple_stmt_iterator gsi = gsi_for_stmt (call_stmt);

>> +                       tree memcmp_decl = builtin_decl_explicit (BUILT_IN_MEMCMP);

>> +                       gcall *memcmp_call

>> +                         = gimple_build_call (memcmp_decl, 3, arg0, arg1,

>> +                                              arg1_len);

>> +                       tree memcmp_lhs = make_ssa_name (integer_type_node);

>> +                       gimple_call_set_lhs (memcmp_call, memcmp_lhs);

>> +                       update_stmt (memcmp_call);

>> +                       gsi_remove (&gsi, true);

>> +                       gsi_insert_before (&gsi, memcmp_call, GSI_SAME_STMT);

>> +

>> +                       gsi = gsi_for_stmt (stmt);

>> +                       tree zero = build_zero_cst (TREE_TYPE (memcmp_lhs));

>> +                       gassign *ga = gimple_build_assign (lhs, code,

>> +                                                          memcmp_lhs, zero);

>> +                       gsi_replace (&gsi, ga, false);

>> +                       update_ssa (TODO_update_ssa);

>

> And this is certainly even more wrong than the old TODO_update_ssa at the

> end of the pass, now you'll do it for every single replacement in the

> function.  Why do you need it?  The old call stmt has gimple_vdef and

> gimple_vuse, so just copy those over, see how e.g.

> replace_call_with_call_and_fold in gimple-fold.c does that.

> If you don't add strlen, you need to move the vdef/vuse from stmt to

> memcmp_call, if you really want to add strlen (see above note though),

> then that call should have a vuse added (same vuse as the stmt originally

> had).

Hi,
Thanks for the suggestions. In attached patch, I dropped the transform
if strlen (t) is unknown.
Since strstr is marked pure, so IIUC call_stmt for strstr shouldn't
have vdef assoicated with it ?
(gimple_vdef for call_stmt returned NULL for test-cases I tried it
with). Moving gimple_vuse
from call_stmt to memcmp_call worked for me.
Does the patch look OK ?
Bootstrap+tested on x86_64-unknown-linux-gnu with --enable-langauges=all,ada
Cross-tested on arm*-*-*, aarch64*-*-*.

Thanks,
Prathamesh
>

>         Jakub

Comments

Jakub Jelinek Dec. 9, 2016, 12:29 p.m. UTC | #1
On Fri, Dec 09, 2016 at 05:36:41PM +0530, Prathamesh Kulkarni wrote:
> --- a/gcc/tree-ssa-strlen.c

> +++ b/gcc/tree-ssa-strlen.c

> @@ -2302,7 +2302,81 @@ strlen_optimize_stmt (gimple_stmt_iterator *gsi)

>  	  else if (gimple_assign_rhs_code (stmt) == POINTER_PLUS_EXPR)

>  	    handle_pointer_plus (gsi);

>  	}

> -      else if (TREE_CODE (lhs) != SSA_NAME && !TREE_SIDE_EFFECTS (lhs))

> +

> +      /* Fold strstr (s, t) == s to memcmp (s, t, strlen (t)) == 0.

> +	 if strlen (t) is known and var holding return value of strstr

> +	 has single use.  */

> +

> +      else if (TREE_CODE (lhs) == SSA_NAME && INTEGRAL_TYPE_P (TREE_TYPE (lhs)))

> +	{

> +	  enum tree_code code = gimple_assign_rhs_code (stmt);

> +	  if (code == EQ_EXPR || code == NE_EXPR)


This way you handle _8 = _5 == _7;, but not if (_5 == _7) bar ();.  Shouldn't you
also handle GIMPLE_COND similarly (of course, the rhs1 and rhs2 grabbing
and code grabbing is different for GIMPLE_COND.  But the rest should be
the same, except again that you don't want to replace the GIMPLE_COND, but
adjust it.  Maybe also COND_EXPR in gimple_assign (_9 = _5 == _7 ? _10 : _11;).

> +	    {

> +	      tree rhs1 = gimple_assign_rhs1 (stmt);

> +	      tree rhs2 = gimple_assign_rhs2 (stmt);

> +	      if (TREE_CODE (rhs1) == SSA_NAME

> +		  && TREE_CODE (rhs2) == SSA_NAME)

> +		{

> +		  gcall *call_stmt = dyn_cast<gcall *> (SSA_NAME_DEF_STMT (rhs1));

> +		  if (!call_stmt)

> +		    {

> +		      call_stmt = dyn_cast<gcall *> (SSA_NAME_DEF_STMT (rhs2));

> +		      tree tmp = rhs1;

> +		      rhs1 = rhs2;

> +		      rhs2 = tmp;


We use std::swap (rhs1, rhs2); in this case these days.

> +		    }

> +

> +		  tree call_lhs;

> +		  if (call_stmt

> +		      && gimple_call_builtin_p (call_stmt, BUILT_IN_STRSTR)

> +		      && (call_lhs = gimple_call_lhs (call_stmt))

> +		      && has_single_use (call_lhs))


This might not optimize if you have:
  _5 = foo ();
  _7 = __builtin_strstr (_5, "abcd");
  _8 = _5 == _7;

Or even you could have:
  _5 = __builtin_strstr (...);
  _7 = __builtin_strstr (_5, "abcd");
  _8 = _5 == _7;

So I wonder if you shouldn't do:
		  gimple *call_stmt = NULL;
		  for (int pass = 0; pass < 2; pass++)
		    {
		      gimple *g = SSA_NAME_DEF_STMT (rhs1);
		      if (gimple_call_builtin_p (g, BUILT_IN_STRSTR)
			  && gimple_call_lhs (g) == rhs1
			  && has_single_use (rhs1)
			  && gimple_call_arg (g, 0) == rhs2)
			{
			  call_stmt = g;
			  break;
			}
		      std::swap (rhs1, rhs2);
		    }
		  if (call_stmt)
...

I think you don't need operand_equal_p, because SSA_NAMEs should just
be the same pointer if they are the same thing.
The above way you handle both orderings.  Perhaps also it is big enough to
be done in a separate function, which you call with the code/rhs1/rhs2 and
stmt for the EQ/NE_EXPR is_gimple_assign as well as for COND_EXPR and
GIMPLE_COND.

	Jakub
diff mbox

Patch

diff --git a/gcc/testsuite/gcc.dg/strlenopt-30.c b/gcc/testsuite/gcc.dg/strlenopt-30.c
new file mode 100644
index 0000000..329bc25
--- /dev/null
+++ b/gcc/testsuite/gcc.dg/strlenopt-30.c
@@ -0,0 +1,44 @@ 
+/* { dg-do compile } */
+/* { dg-options "-O2 -fdump-tree-strlen" } */
+
+__attribute__((no_icf))
+_Bool f1(char *s)
+{
+  return __builtin_strstr (s, "hello") == s;
+}
+
+__attribute__((no_icf))
+_Bool f2(char *s)
+{
+  return s == __builtin_strstr (s, "hello");
+}
+
+__attribute__((no_icf))
+_Bool f3(char *s)
+{
+  return s != __builtin_strstr (s, "hello");
+}
+
+/* Do not perform transform, since strlen (t)
+   is unknown.  */
+
+__attribute__((no_icf))
+_Bool f4(char *s, char *t)
+{
+  return __builtin_strstr (s, t) == s;
+}
+
+/* Do not perform transform in this case, since
+   t1 doesn't have single use.  */
+
+__attribute__((no_icf))
+_Bool f5(char *s)
+{
+  void foo(char *);
+
+  char *t1 = __builtin_strstr (s, "hello");
+  foo (t1);
+  return (t1 == s);
+}
+
+/* { dg-final { scan-tree-dump-times "__builtin_memcmp" 3 "strlen" } } */
diff --git a/gcc/tree-ssa-strlen.c b/gcc/tree-ssa-strlen.c
index 339812e..06b07b0 100644
--- a/gcc/tree-ssa-strlen.c
+++ b/gcc/tree-ssa-strlen.c
@@ -2302,7 +2302,81 @@  strlen_optimize_stmt (gimple_stmt_iterator *gsi)
 	  else if (gimple_assign_rhs_code (stmt) == POINTER_PLUS_EXPR)
 	    handle_pointer_plus (gsi);
 	}
-      else if (TREE_CODE (lhs) != SSA_NAME && !TREE_SIDE_EFFECTS (lhs))
+
+      /* Fold strstr (s, t) == s to memcmp (s, t, strlen (t)) == 0.
+	 if strlen (t) is known and var holding return value of strstr
+	 has single use.  */
+
+      else if (TREE_CODE (lhs) == SSA_NAME && INTEGRAL_TYPE_P (TREE_TYPE (lhs)))
+	{
+	  enum tree_code code = gimple_assign_rhs_code (stmt);
+	  if (code == EQ_EXPR || code == NE_EXPR)
+	    {
+	      tree rhs1 = gimple_assign_rhs1 (stmt);
+	      tree rhs2 = gimple_assign_rhs2 (stmt);
+	      if (TREE_CODE (rhs1) == SSA_NAME
+		  && TREE_CODE (rhs2) == SSA_NAME)
+		{
+		  gcall *call_stmt = dyn_cast<gcall *> (SSA_NAME_DEF_STMT (rhs1));
+		  if (!call_stmt)
+		    {
+		      call_stmt = dyn_cast<gcall *> (SSA_NAME_DEF_STMT (rhs2));
+		      tree tmp = rhs1;
+		      rhs1 = rhs2;
+		      rhs2 = tmp;
+		    }
+
+		  tree call_lhs;
+		  if (call_stmt
+		      && gimple_call_builtin_p (call_stmt, BUILT_IN_STRSTR)
+		      && (call_lhs = gimple_call_lhs (call_stmt))
+		      && has_single_use (call_lhs))
+		    {
+		      tree arg0 = gimple_call_arg (call_stmt, 0);
+		      if (operand_equal_p (arg0, rhs2, 0))
+			{
+			  tree arg1 = gimple_call_arg (call_stmt, 1);
+			  tree arg1_len = NULL_TREE;
+			  int idx = get_stridx (arg1);
+
+			  if (idx)
+			    {
+			      if (idx < 0)
+				arg1_len = build_int_cst (size_type_node,
+							  ~idx);
+			      else
+				{
+				  strinfo *si = get_strinfo (idx);
+				  if (si)
+				    arg1_len = get_string_length (si);
+				}
+			    }
+
+			  if (arg1_len != NULL_TREE)
+			    {
+			      gimple_stmt_iterator gsi = gsi_for_stmt (call_stmt);
+			      tree memcmp_decl = builtin_decl_explicit (BUILT_IN_MEMCMP);
+			      gcall *memcmp_call
+				= gimple_build_call (memcmp_decl, 3, arg0, arg1,
+						     arg1_len);
+			      tree memcmp_lhs = make_ssa_name (integer_type_node);
+			      gimple_set_vuse (memcmp_call, gimple_vuse (call_stmt));
+			      gimple_call_set_lhs (memcmp_call, memcmp_lhs);
+			      gsi_remove (&gsi, true);
+			      gsi_insert_before (&gsi, memcmp_call, GSI_SAME_STMT);
+			      gsi = gsi_for_stmt (stmt);
+			      tree zero = build_zero_cst (TREE_TYPE (memcmp_lhs));
+			      gassign *ga = gimple_build_assign (lhs, code,
+								 memcmp_lhs,
+								 zero);
+			      gsi_replace (&gsi, ga, false);
+			    }
+			}
+		    }
+		}
+	    }
+	}
+    else if (TREE_CODE (lhs) != SSA_NAME && !TREE_SIDE_EFFECTS (lhs))
 	{
 	  tree type = TREE_TYPE (lhs);
 	  if (TREE_CODE (type) == ARRAY_TYPE)