https://gcc.gnu.org/bugzilla/show_bug.cgi?id=106365

--- Comment #10 from Kewen Lin <linkw at gcc dot gnu.org> ---
(In reply to Richard Biener from comment #7)
> Created attachment 53323 [details]
> prototype
> 
> I'm testing this - for .LEN_STORE you mainly have to compute pd.rhs_off,
> pd.offset, pd.size and do a single
> 
>   return data->push_partial_def (pd, set, set, offseti, maxsizei);

Thanks!  I added the diff below and can confirm that it allows most of the
code to be optimized away, so that the function just generates "return 285;".

diff --git a/gcc/tree-ssa-sccvn.cc b/gcc/tree-ssa-sccvn.cc
index 0a16984d2ca..ea5b7c54f82 100644
--- a/gcc/tree-ssa-sccvn.cc
+++ b/gcc/tree-ssa-sccvn.cc
@@ -3228,6 +3228,7 @@ vn_reference_lookup_3 (ao_ref *ref, tree vuse, void
*data_,
        return (void *)-1;

       tree mask = NULL_TREE;
+      tree len = NULL_TREE;
       switch (fn)
        {
        case IFN_MASK_STORE:
@@ -3236,6 +3237,19 @@ vn_reference_lookup_3 (ao_ref *ref, tree vuse, void
*data_,
          if (TREE_CODE (mask) != VECTOR_CST)
            return (void *)-1;
          break;
+       case IFN_LEN_STORE:
+         {
+           /* Extract the length without bias.  */
+           tree len0 = gimple_call_arg (call, 2);
+           len0 = vn_valueize (len0);
+           if (TREE_CODE (len0) != INTEGER_CST)
+             return (void *) -1;
+           tree bias = gimple_call_arg (call, 4);
+           len = fold_build2 (MINUS_EXPR, TREE_TYPE (len0), len0, bias);
+           /* Bias is either 0 or -1, biased length should be constant.  */
+           gcc_assert (TREE_CODE (len) == INTEGER_CST);
+           break;
+         }
        default:
          return (void *)-1;
        }
@@ -3311,6 +3325,16 @@ vn_reference_lookup_3 (ao_ref *ref, tree vuse, void
*data_,
                                                       offseti, maxsizei);
                    }
                }
+             else if (len)
+               {
+                 pd.rhs_off = 0;
+                 pd.offset = offset2i;
+                 pd.size = tree_to_uhwi (len) * elsz;
+                 if (ranges_known_overlap_p (offset, maxsize, pd.offset,
+                                             pd.size))
+                   return data->push_partial_def (pd, set, set, offseti,
+                                                  maxsizei);
+               }
              else
                gcc_unreachable ();
              return NULL;

But it still keeps the .LEN_STORE there:

int foo ()
{
  int a[10];

  <bb 2> [local count: 97603129]:
  .LEN_STORE (&MEM <int[10]> [(void *)&a + 32B], 128B, 8, { 64, 0, 0, 0, 81, 0,
0, 0, 100, 0, 0, 0, 121, 0, 0, 0 }, 0);
  a ={v} {CLOBBER(eol)};
  return 285;

}

By the way, the above was obtained with the latest commit "Add alias
disambiguation for vectorizer load/store IFNs" already applied.

Reply via email to