I noticed that there are patterns that optimize `(X CMP1 CST1) AND/IOR (X CMP2 CST2)` and we can easily extend them to support the `(X CMP1 Y) AND/IOR (X CMP2 Y)` by saying they compare equal. This allows for this kind of optimization for integral and pointer types (which have the same semantics).
OK? Bootstrapped and tested on x86_64-linux-gnu with no regressions. gcc/ChangeLog: PR tree-optimization/106164 * match.pd: Extend the `(X CMP1 CST1) AND/IOR (X CMP2 CST2)` patterns to support `(X CMP1 Y) AND/IOR (X CMP2 Y)`. gcc/testsuite/ChangeLog: PR tree-optimization/106164 * gcc.dg/tree-ssa/cmpbit-1.c: New test. --- gcc/match.pd | 66 +++++++++++++++++++----- gcc/testsuite/gcc.dg/tree-ssa/cmpbit-1.c | 38 ++++++++++++++ 2 files changed, 90 insertions(+), 14 deletions(-) create mode 100644 gcc/testsuite/gcc.dg/tree-ssa/cmpbit-1.c diff --git a/gcc/match.pd b/gcc/match.pd index 73eb249f704..00af5d99119 100644 --- a/gcc/match.pd +++ b/gcc/match.pd @@ -2799,14 +2799,24 @@ DEFINE_INT_AND_FLOAT_ROUND_FN (RINT) /* Convert (X == CST1) && (X OP2 CST2) to a known value based on CST1 OP2 CST2. Similarly for (X != CST1). */ +/* Convert (X == Y) && (X OP2 Y) to a known value if X is an integral type. + Similarly for (X != Y). */ (for code1 (eq ne) (for code2 (eq ne lt gt le ge) (simplify - (bit_and:c (code1@3 @0 INTEGER_CST@1) (code2@4 @0 INTEGER_CST@2)) + (bit_and:c (code1@3 @0 @1) (code2@4 @0 @2)) + (if ((TREE_CODE (@1) == INTEGER_CST + && TREE_CODE (@2) == INTEGER_CST) + || ((INTEGRAL_TYPE_P (TREE_TYPE (@1)) + || POINTER_TYPE_P (TREE_TYPE (@1))) + && operand_equal_p (@1, @2))) (with { - int cmp = tree_int_cst_compare (@1, @2); + int cmp = 0; + if (TREE_CODE (@1) == INTEGER_CST + && TREE_CODE (@2) == INTEGER_CST) + cmp = tree_int_cst_compare (@1, @2); bool val; switch (code2) { @@ -2822,17 +2832,26 @@ DEFINE_INT_AND_FLOAT_ROUND_FN (RINT) (switch (if (code1 == EQ_EXPR && val) @3) (if (code1 == EQ_EXPR && !val) { constant_boolean_node (false, type); }) - (if (code1 == NE_EXPR && !val) @4)))))) + (if (code1 == NE_EXPR && !val) @4))))))) -/* Convert (X OP1 CST1) && (X OP2 CST2). */ +/* Convert (X OP1 CST1) && (X OP2 CST2). + Convert (X OP1 Y) && (X OP2 Y). */ (for code1 (lt le gt ge) (for code2 (lt le gt ge) (simplify - (bit_and (code1:c@3 @0 INTEGER_CST@1) (code2:c@4 @0 INTEGER_CST@2)) + (bit_and (code1:c@3 @0 @1) (code2:c@4 @0 @2)) + (if ((TREE_CODE (@1) == INTEGER_CST + && TREE_CODE (@2) == INTEGER_CST) + || ((INTEGRAL_TYPE_P (TREE_TYPE (@1)) + || POINTER_TYPE_P (TREE_TYPE (@1))) + && operand_equal_p (@1, @2))) (with { - int cmp = tree_int_cst_compare (@1, @2); + int cmp = 0; + if (TREE_CODE (@1) == INTEGER_CST + && TREE_CODE (@2) == INTEGER_CST) + cmp = tree_int_cst_compare (@1, @2); } (switch /* Choose the more restrictive of two < or <= comparisons. */ @@ -2861,18 +2880,28 @@ DEFINE_INT_AND_FLOAT_ROUND_FN (RINT) && (code1 == GT_EXPR || code1 == GE_EXPR) && (code2 == LT_EXPR || code2 == LE_EXPR)) { constant_boolean_node (false, type); }) - ))))) + )))))) /* Convert (X == CST1) || (X OP2 CST2) to a known value based on CST1 OP2 CST2. Similarly for (X != CST1). */ +/* Convert (X == Y) || (X OP2 Y) to a known value if X is an integral type. + Similarly for (X != Y). */ (for code1 (eq ne) (for code2 (eq ne lt gt le ge) (simplify - (bit_ior:c (code1@3 @0 INTEGER_CST@1) (code2@4 @0 INTEGER_CST@2)) + (bit_ior:c (code1@3 @0 @1) (code2@4 @0 @2)) + (if ((TREE_CODE (@1) == INTEGER_CST + && TREE_CODE (@2) == INTEGER_CST) + || ((INTEGRAL_TYPE_P (TREE_TYPE (@1)) + || POINTER_TYPE_P (TREE_TYPE (@1))) + && operand_equal_p (@1, @2))) (with { - int cmp = tree_int_cst_compare (@1, @2); + int cmp = 0; + if (TREE_CODE (@1) == INTEGER_CST + && TREE_CODE (@2) == INTEGER_CST) + cmp = tree_int_cst_compare (@1, @2); bool val; switch (code2) { @@ -2888,17 +2917,26 @@ DEFINE_INT_AND_FLOAT_ROUND_FN (RINT) (switch (if (code1 == EQ_EXPR && val) @4) (if (code1 == NE_EXPR && val) { constant_boolean_node (true, type); }) - (if (code1 == NE_EXPR && !val) @3)))))) + (if (code1 == NE_EXPR && !val) @3))))))) -/* Convert (X OP1 CST1) || (X OP2 CST2). */ +/* Convert (X OP1 CST1) || (X OP2 CST2). + Convert (X OP1 Y) || (X OP2 Y). */ (for code1 (lt le gt ge) (for code2 (lt le gt ge) (simplify - (bit_ior (code1@3 @0 INTEGER_CST@1) (code2@4 @0 INTEGER_CST@2)) + (bit_ior (code1@3 @0 @1) (code2@4 @0 @2)) + (if ((TREE_CODE (@1) == INTEGER_CST + && TREE_CODE (@2) == INTEGER_CST) + || ((INTEGRAL_TYPE_P (TREE_TYPE (@1)) + || POINTER_TYPE_P (TREE_TYPE (@1))) + && operand_equal_p (@1, @2))) (with { - int cmp = tree_int_cst_compare (@1, @2); + int cmp = 0; + if (TREE_CODE (@1) == INTEGER_CST + && TREE_CODE (@2) == INTEGER_CST) + cmp = tree_int_cst_compare (@1, @2); } (switch /* Choose the more restrictive of two < or <= comparisons. */ @@ -2927,7 +2965,7 @@ DEFINE_INT_AND_FLOAT_ROUND_FN (RINT) && (code1 == GT_EXPR || code1 == GE_EXPR) && (code2 == LT_EXPR || code2 == LE_EXPR)) { constant_boolean_node (true, type); }) - ))))) + )))))) /* We can't reassociate at all for saturating types. */ (if (!TYPE_SATURATING (type)) diff --git a/gcc/testsuite/gcc.dg/tree-ssa/cmpbit-1.c b/gcc/testsuite/gcc.dg/tree-ssa/cmpbit-1.c new file mode 100644 index 00000000000..c219e047ba8 --- /dev/null +++ b/gcc/testsuite/gcc.dg/tree-ssa/cmpbit-1.c @@ -0,0 +1,38 @@ +/* { dg-do compile } */ +/* { dg-options "-O1 -fno-tree-reassoc -fdump-tree-optimized-raw" } */ +_Bool f(int a, int b) +{ + _Bool c = a > b; + _Bool d = a >= b; + return c & d; +} + +_Bool f1(int a, int b) +{ + _Bool c = a > b; + _Bool d = a >= b; + return c | d; +} + +_Bool g(int a, int b) +{ + _Bool c = a < b; + _Bool d = a <= b; + return c & d; +} + +_Bool g1(int a, int b) +{ + _Bool c = a < b; + _Bool d = a <= b; + return c | d; +} + + +/* We should be able to optimize these without reassociation too. */ +/* { dg-final { scan-tree-dump-not "bit_and_expr," "optimized" } } */ +/* { dg-final { scan-tree-dump-not "bit_ior_expr," "optimized" } } */ +/* { dg-final { scan-tree-dump-times "gt_expr," 1 "optimized" } } */ +/* { dg-final { scan-tree-dump-times "ge_expr," 1 "optimized" } } */ +/* { dg-final { scan-tree-dump-times "lt_expr," 1 "optimized" } } */ +/* { dg-final { scan-tree-dump-times "le_expr," 1 "optimized" } } */ -- 2.31.1