On Fri, Nov 12, 2021 at 07:30:35AM +0000, Tamar Christina via Gcc-patches wrote: > @@ -2099,7 +2124,7 @@ spaceship_replacement (basic_block cond_bb, basic_block > middle_bb, > || !tree_fits_shwi_p (rhs) > || !IN_RANGE (tree_to_shwi (rhs), -1, 1)) > return false; > - if (orig_use_lhs) > + if (orig_use_lhs && !is_cast) > { > if ((cmp != EQ_EXPR && cmp != NE_EXPR) || !integer_zerop (rhs)) > return false;
I actually meant that you'd do the if (is_cast) handling right above the if (orig_use_lhs), i.e. if (is_cast) { if (TREE_CODE (rhs) != INTEGER_CST) return false; /* As for -ffast-math we assume the 2 return to be impossible, canonicalize (unsigned) res <= 1U or (unsigned) res < 2U into res >= 0 and (unsigned) res > 1U or (unsigned) res >= 2U as res < 0. */ switch (cmp) { case LE_EXPR: if (!integer_onep (rhs)) return false; cmp = GE_EXPR; break; case LT_EXPR: if (wi::ne_p (wi::to_widest (rhs), 2)) return false; cmp = GE_EXPR; break; case GT_EXPR: if (!integer_onep (rhs)) return false; cmp = LT_EXPR; break; case GE_EXPR: if (wi::ne_p (wi::to_widest (rhs), 2)) return false; cmp = LT_EXPR; break; default: return false; } rhs = build_zero_cst (TREE_TYPE (phires)); } else if (orig_use_lhs) ... and keep the code in the following hunk untouched. Similarly to how for the BIT_AND_EXPR if (orig_use_lhs), it virtually undoes the match.pd optimization. Because in the place you've placed it you're totally ignoring one_cmp, and I'm pretty sure that is the wrong thing. one_cmp is computed as: /* lhs1 one_cmp rhs1 results in phires of 1. */ enum tree_code one_cmp; if ((cmp1 == LT_EXPR || cmp1 == LE_EXPR) ^ (!integer_onep ((e1->flags & EDGE_TRUE_VALUE) ? arg1 : arg0))) one_cmp = LT_EXPR; else one_cmp = GT_EXPR; and it is something unrelated to what actual comparison is done or virtually done on the phires. > @@ -2310,62 +2335,101 @@ spaceship_replacement (basic_block cond_bb, > basic_block middle_bb, > one_cmp = GT_EXPR; > > enum tree_code res_cmp; > - switch (cmp) > + > + if (is_cast) > { > - case EQ_EXPR: > - if (integer_zerop (rhs)) > - res_cmp = EQ_EXPR; > - else if (integer_minus_onep (rhs)) > - res_cmp = one_cmp == LT_EXPR ? GT_EXPR : LT_EXPR; > - else if (integer_onep (rhs)) > - res_cmp = one_cmp; > - else > + if (TREE_CODE (rhs) != INTEGER_CST) > return false; > - break; > - case NE_EXPR: > - if (integer_zerop (rhs)) > - res_cmp = NE_EXPR; > - else if (integer_minus_onep (rhs)) > - res_cmp = one_cmp == LT_EXPR ? LE_EXPR : GE_EXPR; > - else if (integer_onep (rhs)) > - res_cmp = one_cmp == LT_EXPR ? GE_EXPR : LE_EXPR; > - else > - return false; > - break; > - case LT_EXPR: > - if (integer_onep (rhs)) > - res_cmp = one_cmp == LT_EXPR ? GE_EXPR : LE_EXPR; > - else if (integer_zerop (rhs)) > - res_cmp = one_cmp == LT_EXPR ? GT_EXPR : LT_EXPR; > - else > - return false; > - break; > - case LE_EXPR: > - if (integer_zerop (rhs)) > - res_cmp = one_cmp == LT_EXPR ? GE_EXPR : LE_EXPR; > - else if (integer_minus_onep (rhs)) > - res_cmp = one_cmp == LT_EXPR ? GT_EXPR : LT_EXPR; > - else > - return false; > - break; > - case GT_EXPR: > - if (integer_minus_onep (rhs)) > - res_cmp = one_cmp == LT_EXPR ? LE_EXPR : GE_EXPR; > - else if (integer_zerop (rhs)) > - res_cmp = one_cmp; > - else > - return false; > - break; > - case GE_EXPR: > - if (integer_zerop (rhs)) > - res_cmp = one_cmp == LT_EXPR ? LE_EXPR : GE_EXPR; > - else if (integer_onep (rhs)) > - res_cmp = one_cmp; > - else > - return false; > - break; > - default: > - gcc_unreachable (); > + /* As for -ffast-math we assume the 2 return to be > + impossible, canonicalize (unsigned) res <= 1U or > + (unsigned) res < 2U into res >= 0 and (unsigned) res > 1U > + or (unsigned) res >= 2U as res < 0. */ > + switch (cmp) > + { > + case LE_EXPR: > + if (!integer_onep (rhs)) > + return false; > + res_cmp = GE_EXPR; > + break; > + case LT_EXPR: > + if (wi::ne_p (wi::to_widest (rhs), 2)) > + return false; > + res_cmp = GE_EXPR; > + break; > + case GT_EXPR: > + if (!integer_onep (rhs)) > + return false; > + res_cmp = LT_EXPR; > + break; > + case GE_EXPR: > + if (wi::ne_p (wi::to_widest (rhs), 2)) > + return false; > + res_cmp = LT_EXPR; > + break; > + default: > + return false; > + } > + rhs = build_zero_cst (TREE_TYPE (phires)); > + } > + else > + { > + switch (cmp) > + { > + case EQ_EXPR: > + if (integer_zerop (rhs)) > + res_cmp = EQ_EXPR; > + else if (integer_minus_onep (rhs)) > + res_cmp = one_cmp == LT_EXPR ? GT_EXPR : LT_EXPR; > + else if (integer_onep (rhs)) > + res_cmp = one_cmp; > + else > + return false; > + break; > + case NE_EXPR: > + if (integer_zerop (rhs)) > + res_cmp = NE_EXPR; > + else if (integer_minus_onep (rhs)) > + res_cmp = one_cmp == LT_EXPR ? LE_EXPR : GE_EXPR; > + else if (integer_onep (rhs)) > + res_cmp = one_cmp == LT_EXPR ? GE_EXPR : LE_EXPR; > + else > + return false; > + break; > + case LT_EXPR: > + if (integer_onep (rhs)) > + res_cmp = one_cmp == LT_EXPR ? GE_EXPR : LE_EXPR; > + else if (integer_zerop (rhs)) > + res_cmp = one_cmp == LT_EXPR ? GT_EXPR : LT_EXPR; > + else > + return false; > + break; > + case LE_EXPR: > + if (integer_zerop (rhs)) > + res_cmp = one_cmp == LT_EXPR ? GE_EXPR : LE_EXPR; > + else if (integer_minus_onep (rhs)) > + res_cmp = one_cmp == LT_EXPR ? GT_EXPR : LT_EXPR; > + else > + return false; > + break; > + case GT_EXPR: > + if (integer_minus_onep (rhs)) > + res_cmp = one_cmp == LT_EXPR ? LE_EXPR : GE_EXPR; > + else if (integer_zerop (rhs)) > + res_cmp = one_cmp; > + else > + return false; > + break; > + case GE_EXPR: > + if (integer_zerop (rhs)) > + res_cmp = one_cmp == LT_EXPR ? LE_EXPR : GE_EXPR; > + else if (integer_onep (rhs)) > + res_cmp = one_cmp; > + else > + return false; > + break; > + default: > + gcc_unreachable (); > + } > } > > if (gimple_code (use_stmt) == GIMPLE_COND) > @@ -2405,12 +2470,14 @@ spaceship_replacement (basic_block cond_bb, > basic_block middle_bb, > } > if (orig_use_lhs) > { > - if (!has_debug_uses) > + if (!has_debug_uses || is_cast) > FOR_EACH_IMM_USE_FAST (use_p, iter, orig_use_lhs) > { > gimple *use_stmt = USE_STMT (use_p); > gcc_assert (is_gimple_debug (use_stmt)); > has_debug_uses = true; > + if (is_cast) > + has_cast_debug_uses = true; > } > gimple_stmt_iterator gsi = gsi_for_stmt (orig_use_stmt); > tree zero = build_zero_cst (TREE_TYPE (orig_use_lhs)); > @@ -2448,7 +2515,23 @@ spaceship_replacement (basic_block cond_bb, > basic_block middle_bb, > gsi_insert_before (&gsi, g, GSI_SAME_STMT); > replace_uses_by (phires, temp2); > if (orig_use_lhs) > - replace_uses_by (orig_use_lhs, temp2); > + { > + if (has_cast_debug_uses) > + { > + tree temp3 = make_node (DEBUG_EXPR_DECL); > + DECL_ARTIFICIAL (temp3) = 1; > + TREE_TYPE (temp3) = TREE_TYPE (orig_use_lhs); > + SET_DECL_MODE (temp3, TYPE_MODE (type)); > + t = build2 (EQ_EXPR, boolean_type_node, lhs1, rhs2); > + t = build3 (COND_EXPR, type, t, build_zero_cst (type), > + temp1); This will create a debug stmt with correct type on lhs, but incorrect on the rhs (type rather than TREE_TYPE (orig_use_lhs). You should instead of the above 3 lines do: t = fold_convert (TREE_TYPE (temp3), temp2); Otherwise LGTM. Jakub