On 7 December 2016 at 17:36, Jakub Jelinek <ja...@redhat.com> wrote:
> On Wed, Dec 07, 2016 at 05:02:46PM +0530, Prathamesh Kulkarni wrote:
>> +                       if (arg1_len == NULL_TREE)
>> +                         {
>> +                           gimple_stmt_iterator gsi;
>> +                           tree strlen_decl;
>> +                           gimple *strlen_call;
>> +
>> +                           strlen_decl = builtin_decl_explicit 
>> (BUILT_IN_STRLEN);
>> +                           strlen_call = gimple_build_call (strlen_decl, 1,
>> +                                                            arg1);
>> +                           arg1_len = make_ssa_name (size_type_node);
>> +                           gimple_call_set_lhs (strlen_call, arg1_len);
>> +                           update_stmt (strlen_call);
>> +                           gsi = gsi_for_stmt (call_stmt);
>> +                           gsi_insert_before (&gsi, strlen_call, 
>> GSI_SAME_STMT);
>> +                         }
>
> Why?  If the strlen isn't readily available, do you really think it is
> always a win to replace one call with 2 calls?  The string you want to do
> strlen on can be huge, the haystack could be empty or very short, etc.
> I'd just punt if strlen isn't known.
>> +
>> +                       gimple_stmt_iterator gsi = gsi_for_stmt (call_stmt);
>> +                       tree memcmp_decl = builtin_decl_explicit 
>> (BUILT_IN_MEMCMP);
>> +                       gcall *memcmp_call
>> +                         = gimple_build_call (memcmp_decl, 3, arg0, arg1,
>> +                                              arg1_len);
>> +                       tree memcmp_lhs = make_ssa_name (integer_type_node);
>> +                       gimple_call_set_lhs (memcmp_call, memcmp_lhs);
>> +                       update_stmt (memcmp_call);
>> +                       gsi_remove (&gsi, true);
>> +                       gsi_insert_before (&gsi, memcmp_call, GSI_SAME_STMT);
>> +
>> +                       gsi = gsi_for_stmt (stmt);
>> +                       tree zero = build_zero_cst (TREE_TYPE (memcmp_lhs));
>> +                       gassign *ga = gimple_build_assign (lhs, code,
>> +                                                          memcmp_lhs, zero);
>> +                       gsi_replace (&gsi, ga, false);
>> +                       update_ssa (TODO_update_ssa);
>
> And this is certainly even more wrong than the old TODO_update_ssa at the
> end of the pass, now you'll do it for every single replacement in the
> function.  Why do you need it?  The old call stmt has gimple_vdef and
> gimple_vuse, so just copy those over, see how e.g.
> replace_call_with_call_and_fold in gimple-fold.c does that.
> If you don't add strlen, you need to move the vdef/vuse from stmt to
> memcmp_call, if you really want to add strlen (see above note though),
> then that call should have a vuse added (same vuse as the stmt originally
> had).
Hi,
Thanks for the suggestions. In the attached patch, I dropped the transform
when strlen (t) is unknown.
Since strstr is marked pure, IIUC the call_stmt for strstr shouldn't
have a vdef associated with it?
(gimple_vdef for call_stmt returned NULL for test-cases I tried it
with). Moving gimple_vuse
from call_stmt to memcmp_call worked for me.
Does the patch look OK ?
Bootstrapped+tested on x86_64-unknown-linux-gnu with --enable-languages=all,ada
Cross-tested on arm*-*-*, aarch64*-*-*.

Thanks,
Prathamesh
>
>         Jakub
diff --git a/gcc/testsuite/gcc.dg/strlenopt-30.c 
b/gcc/testsuite/gcc.dg/strlenopt-30.c
new file mode 100644
index 0000000..329bc25
--- /dev/null
+++ b/gcc/testsuite/gcc.dg/strlenopt-30.c
@@ -0,0 +1,44 @@
+/* { dg-do compile } */
+/* { dg-options "-O2 -fdump-tree-strlen" } */
+
+__attribute__((no_icf))
+_Bool f1(char *s)
+{
+  return __builtin_strstr (s, "hello") == s;
+}
+
+__attribute__((no_icf))
+_Bool f2(char *s)
+{
+  return s == __builtin_strstr (s, "hello");
+}
+
+__attribute__((no_icf))
+_Bool f3(char *s)
+{
+  return s != __builtin_strstr (s, "hello");
+}
+
+/* Do not perform transform, since strlen (t)
+   is unknown.  */
+
+__attribute__((no_icf))
+_Bool f4(char *s, char *t)
+{
+  return __builtin_strstr (s, t) == s;
+}
+
+/* Do not perform transform in this case, since
+   t1 doesn't have single use.  */
+
+__attribute__((no_icf))
+_Bool f5(char *s)
+{
+  void foo(char *);
+
+  char *t1 = __builtin_strstr (s, "hello");
+  foo (t1);
+  return (t1 == s);
+}
+
+/* { dg-final { scan-tree-dump-times "__builtin_memcmp" 3 "strlen" } } */
diff --git a/gcc/tree-ssa-strlen.c b/gcc/tree-ssa-strlen.c
index 339812e..06b07b0 100644
--- a/gcc/tree-ssa-strlen.c
+++ b/gcc/tree-ssa-strlen.c
@@ -2302,7 +2302,81 @@ strlen_optimize_stmt (gimple_stmt_iterator *gsi)
          else if (gimple_assign_rhs_code (stmt) == POINTER_PLUS_EXPR)
            handle_pointer_plus (gsi);
        }
-      else if (TREE_CODE (lhs) != SSA_NAME && !TREE_SIDE_EFFECTS (lhs))
+
+      /* Fold strstr (s, t) == s to memcmp (s, t, strlen (t)) == 0.
+        if strlen (t) is known and var holding return value of strstr
+        has single use.  */
+
+      else if (TREE_CODE (lhs) == SSA_NAME && INTEGRAL_TYPE_P (TREE_TYPE 
(lhs)))
+       {
+         enum tree_code code = gimple_assign_rhs_code (stmt);
+         if (code == EQ_EXPR || code == NE_EXPR)
+           {
+             tree rhs1 = gimple_assign_rhs1 (stmt);
+             tree rhs2 = gimple_assign_rhs2 (stmt);
+             if (TREE_CODE (rhs1) == SSA_NAME
+                 && TREE_CODE (rhs2) == SSA_NAME)
+               {
+                 gcall *call_stmt = dyn_cast<gcall *> (SSA_NAME_DEF_STMT 
(rhs1));
+                 if (!call_stmt)
+                   {
+                     call_stmt = dyn_cast<gcall *> (SSA_NAME_DEF_STMT (rhs2));
+                     tree tmp = rhs1;
+                     rhs1 = rhs2;
+                     rhs2 = tmp;
+                   }
+
+                 tree call_lhs;
+                 if (call_stmt
+                     && gimple_call_builtin_p (call_stmt, BUILT_IN_STRSTR)
+                     && (call_lhs = gimple_call_lhs (call_stmt))
+                     && has_single_use (call_lhs))
+                   {
+                     tree arg0 = gimple_call_arg (call_stmt, 0);
+                     if (operand_equal_p (arg0, rhs2, 0))
+                       {
+                         tree arg1 = gimple_call_arg (call_stmt, 1);
+                         tree arg1_len = NULL_TREE;
+                         int idx = get_stridx (arg1);
+
+                         if (idx)
+                           {
+                             if (idx < 0)
+                               arg1_len = build_int_cst (size_type_node,
+                                                         ~idx);
+                             else
+                               {
+                                 strinfo *si = get_strinfo (idx);
+                                 if (si)
+                                   arg1_len = get_string_length (si);
+                               }
+                           }
+
+                         if (arg1_len != NULL_TREE)
+                           {
+                             gimple_stmt_iterator gsi = gsi_for_stmt 
(call_stmt);
+                             tree memcmp_decl = builtin_decl_explicit 
(BUILT_IN_MEMCMP);
+                             gcall *memcmp_call
+                               = gimple_build_call (memcmp_decl, 3, arg0, arg1,
+                                                    arg1_len);
+                             tree memcmp_lhs = make_ssa_name 
(integer_type_node);
+                             gimple_set_vuse (memcmp_call, gimple_vuse 
(call_stmt));
+                             gimple_call_set_lhs (memcmp_call, memcmp_lhs);
+                             gsi_remove (&gsi, true);
+                             gsi_insert_before (&gsi, memcmp_call, 
GSI_SAME_STMT);
+                             gsi = gsi_for_stmt (stmt);
+                             tree zero = build_zero_cst (TREE_TYPE 
(memcmp_lhs));
+                             gassign *ga = gimple_build_assign (lhs, code,
+                                                                memcmp_lhs,
+                                                                zero);
+                             gsi_replace (&gsi, ga, false);
+                           }
+                       }
+                   }
+               }
+           }
+       }
+    else if (TREE_CODE (lhs) != SSA_NAME && !TREE_SIDE_EFFECTS (lhs))
        {
          tree type = TREE_TYPE (lhs);
          if (TREE_CODE (type) == ARRAY_TYPE)

Reply via email to