On Sat, Sep 7, 2024 at 1:31 AM Andrew Pinski <quic_apin...@quicinc.com> wrote:
>
> I noticed this folding inside fab could be done else where and could
> even improve inlining decisions and a few other things so let's
> move it to fold_stmt.
> It also fixes PR 116601 because places which call fold_stmt already
> have to deal with the stmt becoming a non-throw statement.
>
> For the fix for PR 116601 on the branches should be the original patch
> rather than a backport of this one.

OK.

Thanks,
Richard.

> Bootstrapped and tested on x86_64-linux-gnu.
>
>         PR tree-optimization/116601
>
> gcc/ChangeLog:
>
>         * gimple-fold.cc (optimize_memcpy_to_memset): Move
>         from tree-ssa-ccp.cc and rename. Also return true
>         if the optimization happened.
>         (gimple_fold_builtin_memory_op): Call
>         optimize_memcpy_to_memset.
>         (fold_stmt_1): Call optimize_memcpy_to_memset for
>         load/store copies.
>         * tree-ssa-ccp.cc (optimize_memcpy): Delete.
>         (pass_fold_builtins::execute): Remove code that
>         calls optimize_memcpy.
>
> gcc/testsuite/ChangeLog:
>
>         * gcc.dg/pr78408-1.c: Adjust dump scan to match where
>         the optimization now happens.
>         * g++.dg/torture/except-2.C: New test.
>
> Signed-off-by: Andrew Pinski <quic_apin...@quicinc.com>
> ---
>  gcc/gimple-fold.cc                      | 134 ++++++++++++++++++++++++
>  gcc/testsuite/g++.dg/torture/except-2.C |  18 ++++
>  gcc/testsuite/gcc.dg/pr78408-1.c        |   5 +-
>  gcc/tree-ssa-ccp.cc                     | 132 +----------------------
>  4 files changed, 156 insertions(+), 133 deletions(-)
>  create mode 100644 gcc/testsuite/g++.dg/torture/except-2.C
>
> diff --git a/gcc/gimple-fold.cc b/gcc/gimple-fold.cc
> index 2746fcfe314..942de7720fd 100644
> --- a/gcc/gimple-fold.cc
> +++ b/gcc/gimple-fold.cc
> @@ -894,6 +894,121 @@ size_must_be_zero_p (tree size)
>    return vr.zero_p ();
>  }
>
> +/* Optimize
> +   a = {};
> +   b = a;
> +   into
> +   a = {};
> +   b = {};
> +   Similarly for memset (&a, ..., sizeof (a)); instead of a = {};
> +   and/or memcpy (&b, &a, sizeof (a)); instead of b = a;  */
> +
> +static bool
> +optimize_memcpy_to_memset (gimple_stmt_iterator *gsip, tree dest, tree src, 
> tree len)
> +{
> +  gimple *stmt = gsi_stmt (*gsip);
> +  if (gimple_has_volatile_ops (stmt))
> +    return false;
> +
> +  tree vuse = gimple_vuse (stmt);
> +  if (vuse == NULL || TREE_CODE (vuse) != SSA_NAME)
> +    return false;
> +
> +  gimple *defstmt = SSA_NAME_DEF_STMT (vuse);
> +  tree src2 = NULL_TREE, len2 = NULL_TREE;
> +  poly_int64 offset, offset2;
> +  tree val = integer_zero_node;
> +  if (gimple_store_p (defstmt)
> +      && gimple_assign_single_p (defstmt)
> +      && TREE_CODE (gimple_assign_rhs1 (defstmt)) == CONSTRUCTOR
> +      && !gimple_clobber_p (defstmt))
> +    src2 = gimple_assign_lhs (defstmt);
> +  else if (gimple_call_builtin_p (defstmt, BUILT_IN_MEMSET)
> +          && TREE_CODE (gimple_call_arg (defstmt, 0)) == ADDR_EXPR
> +          && TREE_CODE (gimple_call_arg (defstmt, 1)) == INTEGER_CST)
> +    {
> +      src2 = TREE_OPERAND (gimple_call_arg (defstmt, 0), 0);
> +      len2 = gimple_call_arg (defstmt, 2);
> +      val = gimple_call_arg (defstmt, 1);
> +      /* For non-0 val, we'd have to transform stmt from assignment
> +        into memset (only if dest is addressable).  */
> +      if (!integer_zerop (val) && is_gimple_assign (stmt))
> +       src2 = NULL_TREE;
> +    }
> +
> +  if (src2 == NULL_TREE)
> +    return false;
> +
> +  if (len == NULL_TREE)
> +    len = (TREE_CODE (src) == COMPONENT_REF
> +          ? DECL_SIZE_UNIT (TREE_OPERAND (src, 1))
> +          : TYPE_SIZE_UNIT (TREE_TYPE (src)));
> +  if (len2 == NULL_TREE)
> +    len2 = (TREE_CODE (src2) == COMPONENT_REF
> +           ? DECL_SIZE_UNIT (TREE_OPERAND (src2, 1))
> +           : TYPE_SIZE_UNIT (TREE_TYPE (src2)));
> +  if (len == NULL_TREE
> +      || !poly_int_tree_p (len)
> +      || len2 == NULL_TREE
> +      || !poly_int_tree_p (len2))
> +    return false;
> +
> +  src = get_addr_base_and_unit_offset (src, &offset);
> +  src2 = get_addr_base_and_unit_offset (src2, &offset2);
> +  if (src == NULL_TREE
> +      || src2 == NULL_TREE
> +      || maybe_lt (offset, offset2))
> +    return false;
> +
> +  if (!operand_equal_p (src, src2, 0))
> +    return false;
> +
> +  /* [ src + offset2, src + offset2 + len2 - 1 ] is set to val.
> +     Make sure that
> +     [ src + offset, src + offset + len - 1 ] is a subset of that.  */
> +  if (maybe_gt (wi::to_poly_offset (len) + (offset - offset2),
> +               wi::to_poly_offset (len2)))
> +    return false;
> +
> +  if (dump_file && (dump_flags & TDF_DETAILS))
> +    {
> +      fprintf (dump_file, "Simplified\n  ");
> +      print_gimple_stmt (dump_file, stmt, 0, dump_flags);
> +      fprintf (dump_file, "after previous\n  ");
> +      print_gimple_stmt (dump_file, defstmt, 0, dump_flags);
> +    }
> +
> +  /* For simplicity, don't change the kind of the stmt,
> +     turn dest = src; into dest = {}; and memcpy (&dest, &src, len);
> +     into memset (&dest, val, len);
> +     In theory we could change dest = src into memset if dest
> +     is addressable (maybe beneficial if val is not 0), or
> +     memcpy (&dest, &src, len) into dest = {} if len is the size
> +     of dest, dest isn't volatile.  */
> +  if (is_gimple_assign (stmt))
> +    {
> +      tree ctor = build_constructor (TREE_TYPE (dest), NULL);
> +      gimple_assign_set_rhs_from_tree (gsip, ctor);
> +      update_stmt (stmt);
> +    }
> +  else /* If stmt is memcpy, transform it into memset.  */
> +    {
> +      gcall *call = as_a <gcall *> (stmt);
> +      tree fndecl = builtin_decl_implicit (BUILT_IN_MEMSET);
> +      gimple_call_set_fndecl (call, fndecl);
> +      gimple_call_set_fntype (call, TREE_TYPE (fndecl));
> +      gimple_call_set_arg (call, 1, val);
> +      update_stmt (stmt);
> +    }
> +
> +  if (dump_file && (dump_flags & TDF_DETAILS))
> +    {
> +      fprintf (dump_file, "into\n  ");
> +      print_gimple_stmt (dump_file, stmt, 0, dump_flags);
> +    }
> +  return true;
> +}
> +
>  /* Fold function call to builtin mem{{,p}cpy,move}.  Try to detect and
>     diagnose (otherwise undefined) overlapping copies without preventing
>     folding.  When folded, GCC guarantees that overlapping memcpy has
> @@ -1171,6 +1286,15 @@ gimple_fold_builtin_memory_op (gimple_stmt_iterator 
> *gsi,
>           return false;
>         }
>
> +     /* Try to optimize the memcpy to memset if src and dest are addresses. 
> */
> +     if (code != BUILT_IN_MEMPCPY
> +        && TREE_CODE (dest) == ADDR_EXPR
> +        && TREE_CODE (src) == ADDR_EXPR
> +        && TREE_CODE (len) == INTEGER_CST
> +        && optimize_memcpy_to_memset (gsi, TREE_OPERAND (dest, 0),
> +                                      TREE_OPERAND (src, 0), len))
> +       return true;
> +
>        if (!tree_fits_shwi_p (len))
>         return false;
>        if (!srctype
> @@ -6475,6 +6599,16 @@ fold_stmt_1 (gimple_stmt_iterator *gsi, bool inplace, 
> tree (*valueize) (tree),
>      {
>      case GIMPLE_ASSIGN:
>        {
> +       if (gimple_assign_load_p (stmt) && gimple_store_p (stmt))
> +         {
> +           if (optimize_memcpy_to_memset (gsi, gimple_assign_lhs (stmt),
> +                                          gimple_assign_rhs1 (stmt),
> +                                          /* len = */NULL_TREE))
> +             {
> +               changed = true;
> +               break;
> +             }
> +         }
>         /* Try to canonicalize for boolean-typed X the comparisons
>            X == 0, X == 1, X != 0, and X != 1.  */
>         if (gimple_assign_rhs_code (stmt) == EQ_EXPR
> diff --git a/gcc/testsuite/g++.dg/torture/except-2.C 
> b/gcc/testsuite/g++.dg/torture/except-2.C
> new file mode 100644
> index 00000000000..d896937a118
> --- /dev/null
> +++ b/gcc/testsuite/g++.dg/torture/except-2.C
> @@ -0,0 +1,18 @@
> +// { dg-do compile }
> +// { dg-additional-options "-fexceptions -fnon-call-exceptions" }
> +// PR tree-optimization/116601
> +
> +struct RefitOption {
> +  char subtype;
> +  int string;
> +} n;
> +void h(RefitOption);
> +void k(RefitOption *__val)
> +{
> +  try {
> +    *__val = RefitOption{};
> +    RefitOption __trans_tmp_2 = *__val;
> +    h(__trans_tmp_2);
> +  }
> +  catch(...){}
> +}
> diff --git a/gcc/testsuite/gcc.dg/pr78408-1.c 
> b/gcc/testsuite/gcc.dg/pr78408-1.c
> index dc9870ac6af..a2d9306848b 100644
> --- a/gcc/testsuite/gcc.dg/pr78408-1.c
> +++ b/gcc/testsuite/gcc.dg/pr78408-1.c
> @@ -1,7 +1,8 @@
>  /* PR c/78408 */
>  /* { dg-do compile { target size32plus } } */
> -/* { dg-options "-O2 -fdump-tree-fab1-details" } */
> -/* { dg-final { scan-tree-dump-times "after previous" 17 "fab1" } } */
> +/* { dg-options "-O2 -fdump-tree-ccp-details -fdump-tree-forwprop-details" } 
> */
> +/* { dg-final { scan-tree-dump-times "after previous" 1 "ccp1" } } */
> +/* { dg-final { scan-tree-dump-times "after previous" 16 "forwprop1" } } */
>
>  struct S { char a[33]; };
>  struct T { char a[65536]; };
> diff --git a/gcc/tree-ssa-ccp.cc b/gcc/tree-ssa-ccp.cc
> index 44711018e0e..47b2ce9441e 100644
> --- a/gcc/tree-ssa-ccp.cc
> +++ b/gcc/tree-ssa-ccp.cc
> @@ -4159,120 +4159,6 @@ optimize_atomic_op_fetch_cmp_0 (gimple_stmt_iterator 
> *gsip,
>    return true;
>  }
>
> -/* Optimize
> -   a = {};
> -   b = a;
> -   into
> -   a = {};
> -   b = {};
> -   Similarly for memset (&a, ..., sizeof (a)); instead of a = {};
> -   and/or memcpy (&b, &a, sizeof (a)); instead of b = a;  */
> -
> -static void
> -optimize_memcpy (gimple_stmt_iterator *gsip, tree dest, tree src, tree len)
> -{
> -  gimple *stmt = gsi_stmt (*gsip);
> -  if (gimple_has_volatile_ops (stmt))
> -    return;
> -
> -  tree vuse = gimple_vuse (stmt);
> -  if (vuse == NULL)
> -    return;
> -
> -  gimple *defstmt = SSA_NAME_DEF_STMT (vuse);
> -  tree src2 = NULL_TREE, len2 = NULL_TREE;
> -  poly_int64 offset, offset2;
> -  tree val = integer_zero_node;
> -  if (gimple_store_p (defstmt)
> -      && gimple_assign_single_p (defstmt)
> -      && TREE_CODE (gimple_assign_rhs1 (defstmt)) == CONSTRUCTOR
> -      && !gimple_clobber_p (defstmt))
> -    src2 = gimple_assign_lhs (defstmt);
> -  else if (gimple_call_builtin_p (defstmt, BUILT_IN_MEMSET)
> -          && TREE_CODE (gimple_call_arg (defstmt, 0)) == ADDR_EXPR
> -          && TREE_CODE (gimple_call_arg (defstmt, 1)) == INTEGER_CST)
> -    {
> -      src2 = TREE_OPERAND (gimple_call_arg (defstmt, 0), 0);
> -      len2 = gimple_call_arg (defstmt, 2);
> -      val = gimple_call_arg (defstmt, 1);
> -      /* For non-0 val, we'd have to transform stmt from assignment
> -        into memset (only if dest is addressable).  */
> -      if (!integer_zerop (val) && is_gimple_assign (stmt))
> -       src2 = NULL_TREE;
> -    }
> -
> -  if (src2 == NULL_TREE)
> -    return;
> -
> -  if (len == NULL_TREE)
> -    len = (TREE_CODE (src) == COMPONENT_REF
> -          ? DECL_SIZE_UNIT (TREE_OPERAND (src, 1))
> -          : TYPE_SIZE_UNIT (TREE_TYPE (src)));
> -  if (len2 == NULL_TREE)
> -    len2 = (TREE_CODE (src2) == COMPONENT_REF
> -           ? DECL_SIZE_UNIT (TREE_OPERAND (src2, 1))
> -           : TYPE_SIZE_UNIT (TREE_TYPE (src2)));
> -  if (len == NULL_TREE
> -      || !poly_int_tree_p (len)
> -      || len2 == NULL_TREE
> -      || !poly_int_tree_p (len2))
> -    return;
> -
> -  src = get_addr_base_and_unit_offset (src, &offset);
> -  src2 = get_addr_base_and_unit_offset (src2, &offset2);
> -  if (src == NULL_TREE
> -      || src2 == NULL_TREE
> -      || maybe_lt (offset, offset2))
> -    return;
> -
> -  if (!operand_equal_p (src, src2, 0))
> -    return;
> -
> -  /* [ src + offset2, src + offset2 + len2 - 1 ] is set to val.
> -     Make sure that
> -     [ src + offset, src + offset + len - 1 ] is a subset of that.  */
> -  if (maybe_gt (wi::to_poly_offset (len) + (offset - offset2),
> -               wi::to_poly_offset (len2)))
> -    return;
> -
> -  if (dump_file && (dump_flags & TDF_DETAILS))
> -    {
> -      fprintf (dump_file, "Simplified\n  ");
> -      print_gimple_stmt (dump_file, stmt, 0, dump_flags);
> -      fprintf (dump_file, "after previous\n  ");
> -      print_gimple_stmt (dump_file, defstmt, 0, dump_flags);
> -    }
> -
> -  /* For simplicity, don't change the kind of the stmt,
> -     turn dest = src; into dest = {}; and memcpy (&dest, &src, len);
> -     into memset (&dest, val, len);
> -     In theory we could change dest = src into memset if dest
> -     is addressable (maybe beneficial if val is not 0), or
> -     memcpy (&dest, &src, len) into dest = {} if len is the size
> -     of dest, dest isn't volatile.  */
> -  if (is_gimple_assign (stmt))
> -    {
> -      tree ctor = build_constructor (TREE_TYPE (dest), NULL);
> -      gimple_assign_set_rhs_from_tree (gsip, ctor);
> -      update_stmt (stmt);
> -    }
> -  else /* If stmt is memcpy, transform it into memset.  */
> -    {
> -      gcall *call = as_a <gcall *> (stmt);
> -      tree fndecl = builtin_decl_implicit (BUILT_IN_MEMSET);
> -      gimple_call_set_fndecl (call, fndecl);
> -      gimple_call_set_fntype (call, TREE_TYPE (fndecl));
> -      gimple_call_set_arg (call, 1, val);
> -      update_stmt (stmt);
> -    }
> -
> -  if (dump_file && (dump_flags & TDF_DETAILS))
> -    {
> -      fprintf (dump_file, "into\n  ");
> -      print_gimple_stmt (dump_file, stmt, 0, dump_flags);
> -    }
> -}
> -
>  /* A simple pass that attempts to fold all builtin functions.  This pass
>     is run after we've propagated as many constants as we can.  */
>
> @@ -4322,11 +4208,8 @@ pass_fold_builtins::execute (function *fun)
>
>           stmt = gsi_stmt (i);
>
> -          if (gimple_code (stmt) != GIMPLE_CALL)
> +         if (gimple_code (stmt) != GIMPLE_CALL)
>             {
> -             if (gimple_assign_load_p (stmt) && gimple_store_p (stmt))
> -               optimize_memcpy (&i, gimple_assign_lhs (stmt),
> -                                gimple_assign_rhs1 (stmt), NULL_TREE);
>               gsi_next (&i);
>               continue;
>             }
> @@ -4532,19 +4415,6 @@ pass_fold_builtins::execute (function *fun)
>                                                   false);
>                   break;
>
> -               case BUILT_IN_MEMCPY:
> -                 if (gimple_call_builtin_p (stmt, BUILT_IN_NORMAL)
> -                     && TREE_CODE (gimple_call_arg (stmt, 0)) == ADDR_EXPR
> -                     && TREE_CODE (gimple_call_arg (stmt, 1)) == ADDR_EXPR
> -                     && TREE_CODE (gimple_call_arg (stmt, 2)) == INTEGER_CST)
> -                   {
> -                     tree dest = TREE_OPERAND (gimple_call_arg (stmt, 0), 0);
> -                     tree src = TREE_OPERAND (gimple_call_arg (stmt, 1), 0);
> -                     tree len = gimple_call_arg (stmt, 2);
> -                     optimize_memcpy (&i, dest, src, len);
> -                   }
> -                 break;
> -
>                 case BUILT_IN_VA_START:
>                 case BUILT_IN_VA_END:
>                 case BUILT_IN_VA_COPY:
> --
> 2.43.0
>

Reply via email to