On Mon, Jul 31, 2023 at 7:35 AM Andrew Pinski via Gcc-patches <gcc-patches@gcc.gnu.org> wrote: > > I noticed that there are patterns that optimize > `(X CMP1 CST1) AND/IOR (X CMP2 CST2)` and we can easily extend > them to support the `(X CMP1 Y) AND/IOR (X CMP2 Y)` by saying they > compare equal. This allows for this kind of optimization for integral > and pointer types (which have the same semantics). > > OK? Bootstrapped and tested on x86_64-linux-gnu with no regressions.
OK. Thanks, Richard. > gcc/ChangeLog: > > PR tree-optimization/106164 > * match.pd: Extend the `(X CMP1 CST1) AND/IOR (X CMP2 CST2)` > patterns to support `(X CMP1 Y) AND/IOR (X CMP2 Y)`. > > gcc/testsuite/ChangeLog: > > PR tree-optimization/106164 > * gcc.dg/tree-ssa/cmpbit-1.c: New test. > --- > gcc/match.pd | 66 +++++++++++++++++++----- > gcc/testsuite/gcc.dg/tree-ssa/cmpbit-1.c | 38 ++++++++++++++ > 2 files changed, 90 insertions(+), 14 deletions(-) > create mode 100644 gcc/testsuite/gcc.dg/tree-ssa/cmpbit-1.c > > diff --git a/gcc/match.pd b/gcc/match.pd > index 73eb249f704..00af5d99119 100644 > --- a/gcc/match.pd > +++ b/gcc/match.pd > @@ -2799,14 +2799,24 @@ DEFINE_INT_AND_FLOAT_ROUND_FN (RINT) > > /* Convert (X == CST1) && (X OP2 CST2) to a known value > based on CST1 OP2 CST2. Similarly for (X != CST1). */ > +/* Convert (X == Y) && (X OP2 Y) to a known value if X is an integral type. > + Similarly for (X != Y). */ > > (for code1 (eq ne) > (for code2 (eq ne lt gt le ge) > (simplify > - (bit_and:c (code1@3 @0 INTEGER_CST@1) (code2@4 @0 INTEGER_CST@2)) > + (bit_and:c (code1@3 @0 @1) (code2@4 @0 @2)) > + (if ((TREE_CODE (@1) == INTEGER_CST > + && TREE_CODE (@2) == INTEGER_CST) > + || ((INTEGRAL_TYPE_P (TREE_TYPE (@1)) > + || POINTER_TYPE_P (TREE_TYPE (@1))) > + && operand_equal_p (@1, @2))) > (with > { > - int cmp = tree_int_cst_compare (@1, @2); > + int cmp = 0; > + if (TREE_CODE (@1) == INTEGER_CST > + && TREE_CODE (@2) == INTEGER_CST) > + cmp = tree_int_cst_compare (@1, @2); > bool val; > switch (code2) > { > @@ -2822,17 +2832,26 @@ DEFINE_INT_AND_FLOAT_ROUND_FN (RINT) > (switch > (if (code1 == EQ_EXPR && val) @3) > (if (code1 == EQ_EXPR && !val) { constant_boolean_node (false, type); > }) > - (if (code1 == NE_EXPR && !val) @4)))))) > + (if (code1 == NE_EXPR && !val) @4))))))) > > -/* Convert (X OP1 CST1) && (X OP2 CST2). */ > +/* Convert (X OP1 CST1) && (X OP2 CST2). > + Convert (X OP1 Y) && (X OP2 Y). */ > > (for code1 (lt le gt ge) > (for code2 (lt le gt ge) > (simplify > - (bit_and (code1:c@3 @0 INTEGER_CST@1) (code2:c@4 @0 INTEGER_CST@2)) > + (bit_and (code1:c@3 @0 @1) (code2:c@4 @0 @2)) > + (if ((TREE_CODE (@1) == INTEGER_CST > + && TREE_CODE (@2) == INTEGER_CST) > + || ((INTEGRAL_TYPE_P (TREE_TYPE (@1)) > + || POINTER_TYPE_P (TREE_TYPE (@1))) > + && operand_equal_p (@1, @2))) > (with > { > - int cmp = tree_int_cst_compare (@1, @2); > + int cmp = 0; > + if (TREE_CODE (@1) == INTEGER_CST > + && TREE_CODE (@2) == INTEGER_CST) > + cmp = tree_int_cst_compare (@1, @2); > } > (switch > /* Choose the more restrictive of two < or <= comparisons. */ > @@ -2861,18 +2880,28 @@ DEFINE_INT_AND_FLOAT_ROUND_FN (RINT) > && (code1 == GT_EXPR || code1 == GE_EXPR) > && (code2 == LT_EXPR || code2 == LE_EXPR)) > { constant_boolean_node (false, type); }) > - ))))) > + )))))) > > /* Convert (X == CST1) || (X OP2 CST2) to a known value > based on CST1 OP2 CST2. Similarly for (X != CST1). */ > +/* Convert (X == Y) || (X OP2 Y) to a known value if X is an integral type. > + Similarly for (X != Y). */ > > (for code1 (eq ne) > (for code2 (eq ne lt gt le ge) > (simplify > - (bit_ior:c (code1@3 @0 INTEGER_CST@1) (code2@4 @0 INTEGER_CST@2)) > + (bit_ior:c (code1@3 @0 @1) (code2@4 @0 @2)) > + (if ((TREE_CODE (@1) == INTEGER_CST > + && TREE_CODE (@2) == INTEGER_CST) > + || ((INTEGRAL_TYPE_P (TREE_TYPE (@1)) > + || POINTER_TYPE_P (TREE_TYPE (@1))) > + && operand_equal_p (@1, @2))) > (with > { > - int cmp = tree_int_cst_compare (@1, @2); > + int cmp = 0; > + if (TREE_CODE (@1) == INTEGER_CST > + && TREE_CODE (@2) == INTEGER_CST) > + cmp = tree_int_cst_compare (@1, @2); > bool val; > switch (code2) > { > @@ -2888,17 +2917,26 @@ DEFINE_INT_AND_FLOAT_ROUND_FN (RINT) > (switch > (if (code1 == EQ_EXPR && val) @4) > (if (code1 == NE_EXPR && val) { constant_boolean_node (true, type); }) > - (if (code1 == NE_EXPR && !val) @3)))))) > + (if (code1 == NE_EXPR && !val) @3))))))) > > -/* Convert (X OP1 CST1) || (X OP2 CST2). */ > +/* Convert (X OP1 CST1) || (X OP2 CST2). > + Convert (X OP1 Y) || (X OP2 Y). */ > > (for code1 (lt le gt ge) > (for code2 (lt le gt ge) > (simplify > - (bit_ior (code1@3 @0 INTEGER_CST@1) (code2@4 @0 INTEGER_CST@2)) > + (bit_ior (code1@3 @0 @1) (code2@4 @0 @2)) > + (if ((TREE_CODE (@1) == INTEGER_CST > + && TREE_CODE (@2) == INTEGER_CST) > + || ((INTEGRAL_TYPE_P (TREE_TYPE (@1)) > + || POINTER_TYPE_P (TREE_TYPE (@1))) > + && operand_equal_p (@1, @2))) > (with > { > - int cmp = tree_int_cst_compare (@1, @2); > + int cmp = 0; > + if (TREE_CODE (@1) == INTEGER_CST > + && TREE_CODE (@2) == INTEGER_CST) > + cmp = tree_int_cst_compare (@1, @2); > } > (switch > /* Choose the more restrictive of two < or <= comparisons. */ > @@ -2927,7 +2965,7 @@ DEFINE_INT_AND_FLOAT_ROUND_FN (RINT) > && (code1 == GT_EXPR || code1 == GE_EXPR) > && (code2 == LT_EXPR || code2 == LE_EXPR)) > { constant_boolean_node (true, type); }) > - ))))) > + )))))) > > /* We can't reassociate at all for saturating types. */ > (if (!TYPE_SATURATING (type)) > diff --git a/gcc/testsuite/gcc.dg/tree-ssa/cmpbit-1.c > b/gcc/testsuite/gcc.dg/tree-ssa/cmpbit-1.c > new file mode 100644 > index 00000000000..c219e047ba8 > --- /dev/null > +++ b/gcc/testsuite/gcc.dg/tree-ssa/cmpbit-1.c > @@ -0,0 +1,38 @@ > +/* { dg-do compile } */ > +/* { dg-options "-O1 -fno-tree-reassoc -fdump-tree-optimized-raw" } */ > +_Bool f(int a, int b) > +{ > + _Bool c = a > b; > + _Bool d = a >= b; > + return c & d; > +} > + > +_Bool f1(int a, int b) > +{ > + _Bool c = a > b; > + _Bool d = a >= b; > + return c | d; > +} > + > +_Bool g(int a, int b) > +{ > + _Bool c = a < b; > + _Bool d = a <= b; > + return c & d; > +} > + > +_Bool g1(int a, int b) > +{ > + _Bool c = a < b; > + _Bool d = a <= b; > + return c | d; > +} > + > + > +/* We should be able to optimize these without reassociation too. */ > +/* { dg-final { scan-tree-dump-not "bit_and_expr," "optimized" } } */ > +/* { dg-final { scan-tree-dump-not "bit_ior_expr," "optimized" } } */ > +/* { dg-final { scan-tree-dump-times "gt_expr," 1 "optimized" } } */ > +/* { dg-final { scan-tree-dump-times "ge_expr," 1 "optimized" } } */ > +/* { dg-final { scan-tree-dump-times "lt_expr," 1 "optimized" } } */ > +/* { dg-final { scan-tree-dump-times "le_expr," 1 "optimized" } } */ > -- > 2.31.1 >