On August 29, 2016 9:57:00 PM GMT+02:00, Jakub Jelinek <ja...@redhat.com> wrote: >Hi! > >As the testcase shows, with deep chains of COND_EXPRs with the same >SSA_NAMEs appearing more than once in the various operands we can >hang in search_type_for_mask. Similar check_bool_pattern function >uses a hash_set to handle stmts that have been checked already, this >patch >uses a hash_map in which we cache the return values once we've handled >some >stmt already. > >Bootstrapped/regtested on x86_64-linux and i686-linux, ok for trunk?
OK. Thanks, Richard. >2016-08-29 Jakub Jelinek <ja...@redhat.com> > > PR tree-optimization/72866 > * tree-vect-patterns.c (search_type_for_mask): Turn into > a small wrapper, move all code to ... > (search_type_for_mask_1): ... this new function. Add caching > and adjust recursive calls. > > * gcc.dg/vect/pr72866.c: New test. > >--- gcc/tree-vect-patterns.c.jj 2016-07-21 08:59:55.000000000 +0200 >+++ gcc/tree-vect-patterns.c 2016-08-29 19:26:12.807164641 +0200 >@@ -3459,13 +3459,11 @@ adjust_bool_stmts (hash_set <gimple *> & > return gimple_assign_lhs (pattern_stmt); > } > >-/* Return the proper type for converting bool VAR into >- an integer value or NULL_TREE if no such type exists. >- The type is chosen so that converted value has the >- same number of elements as VAR's vector type. */ >+/* Helper for search_type_for_mask. */ > > static tree >-search_type_for_mask (tree var, vec_info *vinfo) >+search_type_for_mask_1 (tree var, vec_info *vinfo, >+ hash_map<gimple *, tree> &cache) > { > gimple *def_stmt; > enum vect_def_type dt; >@@ -3490,6 +3488,10 @@ search_type_for_mask (tree var, vec_info > if (!is_gimple_assign (def_stmt)) > return NULL_TREE; > >+ tree *c = cache.get (def_stmt); >+ if (c) >+ return *c; >+ > rhs_code = gimple_assign_rhs_code (def_stmt); > rhs1 = gimple_assign_rhs1 (def_stmt); > >@@ -3498,14 +3500,15 @@ search_type_for_mask (tree var, vec_info > case SSA_NAME: > case BIT_NOT_EXPR: > CASE_CONVERT: >- res = search_type_for_mask (rhs1, vinfo); >+ res = search_type_for_mask_1 (rhs1, vinfo, cache); > break; > > case BIT_AND_EXPR: > case BIT_IOR_EXPR: > case BIT_XOR_EXPR: >- res = search_type_for_mask (rhs1, vinfo); >- res2 = search_type_for_mask (gimple_assign_rhs2 (def_stmt), >vinfo); >+ res = search_type_for_mask_1 (rhs1, vinfo, cache); >+ res2 = search_type_for_mask_1 (gimple_assign_rhs2 (def_stmt), >vinfo, >+ cache); > if (!res || (res2 && TYPE_PRECISION (res) > TYPE_PRECISION (res2))) > res = res2; > break; >@@ -3517,8 +3520,9 @@ search_type_for_mask (tree var, vec_info > > if (TREE_CODE (TREE_TYPE (rhs1)) == BOOLEAN_TYPE) > { >- res = search_type_for_mask (rhs1, vinfo); >- res2 = search_type_for_mask (gimple_assign_rhs2 (def_stmt), >vinfo); >+ res = search_type_for_mask_1 (rhs1, vinfo, cache); >+ res2 = search_type_for_mask_1 (gimple_assign_rhs2 (def_stmt), >+ vinfo, cache); > if (!res || (res2 && TYPE_PRECISION (res) > TYPE_PRECISION >(res2))) > res = res2; > break; >@@ -3526,12 +3530,18 @@ search_type_for_mask (tree var, vec_info > > comp_vectype = get_vectype_for_scalar_type (TREE_TYPE (rhs1)); > if (comp_vectype == NULL_TREE) >- return NULL_TREE; >+ { >+ res = NULL_TREE; >+ break; >+ } > > mask_type = get_mask_type_for_scalar_type (TREE_TYPE (rhs1)); > if (!mask_type > || !expand_vec_cmp_expr_p (comp_vectype, mask_type)) >- return NULL_TREE; >+ { >+ res = NULL_TREE; >+ break; >+ } > > if (TREE_CODE (TREE_TYPE (rhs1)) != INTEGER_TYPE > || !TYPE_UNSIGNED (TREE_TYPE (rhs1))) >@@ -3544,9 +3554,21 @@ search_type_for_mask (tree var, vec_info > } > } > >+ cache.put (def_stmt, res); > return res; > } > >+/* Return the proper type for converting bool VAR into >+ an integer value or NULL_TREE if no such type exists. >+ The type is chosen so that converted value has the >+ same number of elements as VAR's vector type. */ >+ >+static tree >+search_type_for_mask (tree var, vec_info *vinfo) >+{ >+ hash_map<gimple *, tree> cache; >+ return search_type_for_mask_1 (var, vinfo, cache); >+} > > /* Function vect_recog_bool_pattern > >--- gcc/testsuite/gcc.dg/vect/pr72866.c.jj 2016-08-29 >19:28:22.453646025 +0200 >+++ gcc/testsuite/gcc.dg/vect/pr72866.c 2016-08-29 19:28:17.000000000 >+0200 >@@ -0,0 +1,19 @@ >+/* PR tree-optimization/72866 */ >+/* { dg-do compile } */ >+ >+unsigned int dl; >+int rx, lb; >+ >+void >+fo (int jv, int be) >+{ >+ const unsigned int xw = 16; >+ unsigned int ya, wo; >+ >+ for (ya = 0; ya < 2; ++ya) >+ for (wo = 0; wo < xw; ++wo) >+ { >+ dl += (jv ? be : rx); >+ rx += ((lb == 0) + 1); >+ } >+} > > Jakub