On Thu, 26 Mar 2015, Jakub Jelinek wrote:

> On Thu, Mar 26, 2015 at 09:33:56AM +0100, Richard Biener wrote:
> > this hunk which I think is not really necessary given that
> > the late object-size pass now runs right before FRE which
> 
> Not really immediately before that, but a few passes apart.
> And in the -Og case, while the immediately next pass is fab which doesn't
> manage to optimize it, then there is copyprop pass which does
> (at least on the pr64715-2.c testcase where I had to change objsz2 dump
> in which it doesn't happen to optimized dump (could be also fre2, but
> didn't want to make the testcase too fragile on pass reordering)).
> 
> The propagation was introduced by you in 2013, perhaps it is unnecessary now
> with the introduction of match.pd and trying to fold stuff much more often
> than previously.

I think I simply didn't want to change more testcases at that point,
but I can't see how followup passes at the very point wouldn't
clean things up very quickly (via fre or copyprop).  Possibly
it was -Og and pass_fold_builtins interaction (thinking of
__builtin_constant_p (__builtin_object_size (...)) or so).
If so I'm sure I added a testcase.

> So here is the updated patch I'm going to retest before installing:

Thanks,
Richard.

> 2015-03-26  Jakub Jelinek  <ja...@redhat.com>
> 
>       PR tree-optimization/64715
>       * passes.def: Add another instance of pass_object_sizes before
>       ccp1.
>       * tree-object-size.c (pass_object_sizes::execute): In
>       first_pass_instance, only handle __bos (, 1) and __bos (, 3)
>       calls, and keep the call in the IL, as {MIN,MAX}_EXPR of the
>       __bos result and the computed constant.  Remove redundant
>       checks, obsoleted by gimple_call_builtin_p test.
> 
>       * gcc.dg/builtin-object-size-15.c: New test.
>       * gcc.dg/pr64715-1.c: New test.
>       * gcc.dg/pr64715-2.c: New test.
> 
> --- gcc/passes.def.jj 2015-03-26 09:36:13.117579045 +0100
> +++ gcc/passes.def    2015-03-26 09:44:53.680118862 +0100
> @@ -77,6 +77,7 @@ along with GCC; see the file COPYING3.
>        PUSH_INSERT_PASSES_WITHIN (pass_all_early_optimizations)
>         NEXT_PASS (pass_remove_cgraph_callee_edges);
>         NEXT_PASS (pass_rename_ssa_copies);
> +       NEXT_PASS (pass_object_sizes);
>         NEXT_PASS (pass_ccp);
>         /* After CCP we rewrite no longer addressed locals into SSA
>            form if possible.  */
> --- gcc/tree-object-size.c.jj 2015-03-26 09:36:13.140578671 +0100
> +++ gcc/tree-object-size.c    2015-03-26 09:56:20.335960571 +0100
> @@ -1268,25 +1268,60 @@ pass_object_sizes::execute (function *fu
>           continue;
>  
>         init_object_sizes ();
> +
> +       /* In the first pass instance, only attempt to fold
> +          __builtin_object_size (x, 1) and __builtin_object_size (x, 3),
> +          and rather than folding the builtin to the constant if any,
> +          create a MIN_EXPR or MAX_EXPR of the __builtin_object_size
> +          call result and the computed constant.  */
> +       if (first_pass_instance)
> +         {
> +           tree ost = gimple_call_arg (call, 1);
> +           if (tree_fits_uhwi_p (ost))
> +             {
> +               unsigned HOST_WIDE_INT object_size_type = tree_to_uhwi (ost);
> +               tree ptr = gimple_call_arg (call, 0);
> +               tree lhs = gimple_call_lhs (call);
> +               if ((object_size_type == 1 || object_size_type == 3)
> +                   && (TREE_CODE (ptr) == ADDR_EXPR
> +                       || TREE_CODE (ptr) == SSA_NAME)
> +                   && lhs)
> +                 {
> +                   tree type = TREE_TYPE (lhs);
> +                   unsigned HOST_WIDE_INT bytes
> +                     = compute_builtin_object_size (ptr, object_size_type);
> +                   if (bytes != (unsigned HOST_WIDE_INT) (object_size_type == 1
> +                                                          ? -1 : 0)
> +                       && wi::fits_to_tree_p (bytes, type))
> +                     {
> +                       tree tem = make_ssa_name (type);
> +                       gimple_call_set_lhs (call, tem);
> +                       enum tree_code code
> +                         = object_size_type == 1 ? MIN_EXPR : MAX_EXPR;
> +                       tree cst = build_int_cstu (type, bytes);
> +                       gimple g = gimple_build_assign (lhs, code, tem, cst);
> +                       gsi_insert_after (&i, g, GSI_NEW_STMT);
> +                       update_stmt (call);
> +                     }
> +                 }
> +             }
> +           continue;
> +         }
> +
>         result = fold_call_stmt (as_a <gcall *> (call), false);
>         if (!result)
>           {
> -           if (gimple_call_num_args (call) == 2
> -               && POINTER_TYPE_P (TREE_TYPE (gimple_call_arg (call, 0))))
> -             {
> -               tree ost = gimple_call_arg (call, 1);
> +           tree ost = gimple_call_arg (call, 1);
>  
> -               if (tree_fits_uhwi_p (ost))
> -                 {
> -                   unsigned HOST_WIDE_INT object_size_type
> -                     = tree_to_uhwi (ost);
> +           if (tree_fits_uhwi_p (ost))
> +             {
> +               unsigned HOST_WIDE_INT object_size_type = tree_to_uhwi (ost);
>  
> -                   if (object_size_type < 2)
> -                     result = fold_convert (size_type_node,
> -                                            integer_minus_one_node);
> -                   else if (object_size_type < 4)
> -                     result = build_zero_cst (size_type_node);
> -                 }
> +               if (object_size_type < 2)
> +                 result = fold_convert (size_type_node,
> +                                        integer_minus_one_node);
> +               else if (object_size_type < 4)
> +                 result = build_zero_cst (size_type_node);
>               }
>  
>             if (!result)
> --- gcc/testsuite/gcc.dg/builtin-object-size-15.c.jj  2015-03-26 09:44:53.681118846 +0100
> +++ gcc/testsuite/gcc.dg/builtin-object-size-15.c     2015-03-26 09:44:53.681118846 +0100
> @@ -0,0 +1,27 @@
> +/* { dg-do run } */
> +/* { dg-options "-O2" } */
> +
> +extern void abort (void);
> +
> +int
> +main ()
> +{
> +  struct A { char buf1[9]; char buf2[1]; } a;
> +
> +  if (__builtin_object_size (a.buf1 + (0 + 4), 1) != 5)
> +    abort ();
> +  char *p = a.buf1;
> +  p += 1;
> +  p += 3;
> +  if (__builtin_object_size (p, 1) != 5)
> +    abort ();
> +  p = (char *) &a;
> +  char *q = p + 1;
> +  char *r = q + 3;
> +  char *t = r;
> +  if (r != (char *) &a + 4)
> +    t = (char *) &a + 1;
> +  if (__builtin_object_size (t, 1) != 6)
> +    abort ();
> +  return 0;
> +}
> --- gcc/testsuite/gcc.dg/pr64715-1.c.jj       2015-03-26 09:44:53.682118830 +0100
> +++ gcc/testsuite/gcc.dg/pr64715-1.c  2015-03-26 09:44:53.682118830 +0100
> @@ -0,0 +1,23 @@
> +/* PR tree-optimization/64715 */
> +/* { dg-do compile } */
> +/* { dg-options "-O2 -fdump-tree-optimized" } */
> +
> +extern inline __attribute__ ((always_inline, gnu_inline, artificial, nothrow, leaf)) char *
> +strcpy (char *__restrict dest, const char *__restrict src)
> +{
> +  return __builtin___strcpy_chk (dest, src, __builtin_object_size (dest, 2 > 1));
> +}
> +
> +const char *str1 = "JIHGFEDCBA";
> +void bar (char *);
> +
> +void
> +foo ()
> +{
> +  struct A { char buf1[9]; char buf2[1]; } a;
> +  strcpy (a.buf1 + (0 + 4), str1 + 5);
> +  bar ((char *) &a);
> +}
> +
> +/* { dg-final { scan-tree-dump "__builtin___strcpy_chk\[^;\n\r\]*, 5\\\);" "optimized" } } */
> +/* { dg-final { cleanup-tree-dump "optimized" } } */
> --- gcc/testsuite/gcc.dg/pr64715-2.c.jj       2015-03-26 09:44:53.682118830 +0100
> +++ gcc/testsuite/gcc.dg/pr64715-2.c  2015-03-26 09:57:50.198501347 +0100
> @@ -0,0 +1,19 @@
> +/* PR tree-optimization/64715 */
> +/* { dg-do compile } */
> +/* { dg-options "-O2 -fdump-tree-optimized" } */
> +
> +void bar (char *, int);
> +
> +void
> +foo (int x)
> +{
> +  char p[16], *q;
> +  q = p;
> +  if (x)
> +    q = p + 3;
> +  __builtin___strcpy_chk (q, "abcdefghijkl", __builtin_object_size (q, 1));
> +  bar (p, x);
> +}
> +
> +/* { dg-final { scan-tree-dump "__builtin_memcpy \\\(\[^;\n\r\]*, \"abcdefghijkl\", 13\\\);" "optimized" } } */
> +/* { dg-final { cleanup-tree-dump "optimized" } } */
> 
> 
>       Jakub
> 
> 

-- 
Richard Biener <rguent...@suse.de>
SUSE LINUX GmbH, GF: Felix Imendoerffer, Jane Smithard, Jennifer Guild,
Dilip Upmanyu, Graham Norton HRB 21284 (AG Nuernberg)

Reply via email to