Hi! The following testcases FAIL because EH cleanup is performed only before IPA and then again right before the musttail pass. At -O2 etc. (everything except -O0/-Og) we handle musttail calls in the tailc pass though, and we can fail at that point because the calls might appear to throw internal exceptions for which the cleanup code doesn't do anything interesting (it perhaps has just debug statements or clobber statements in it) before it continues by resuming the exception (i.e. throwing it externally).
As Richi said in the PR (and I agree), moving passes is risky at this point, so the following patch instead teaches the tail{r,c} and musttail passes to deal with such extra EDGE_EH edges. It is a fairly simple thing: if we see an EDGE_EH edge from the call, we just look up where it lands, and if there are no non-debug/non-clobber/non-label statements before a resx which throws externally, such an edge can be ignored for tail call optimization or tail recursion. At other spots I just need to avoid using single_succ/single_succ_edge, because the bb might have another edge - EDGE_EH. To make this less risky, this is done solely for the musttail calls for now. Bootstrapped/regtested on x86_64-linux and i686-linux, ok for trunk? 2025-04-02 Jakub Jelinek <ja...@redhat.com> PR tree-optimization/119491 * tree-tailcall.cc (single_non_eh_succ_edge): New function. (independent_of_stmt_p): Use single_non_eh_succ_edge (bb)->dest instead of single_succ (bb). (empty_eh_cleanup): New function. (find_tail_calls): Diagnose throwing of exceptions which do not propagate only if there are no EDGE_EH successor edges. If there are and the call is musttail, use empty_eh_cleanup to find if the cleanup is not empty. If not or the call is not musttail, use different diagnostics. Set is_noreturn even if there are successor edges. Use single_non_eh_succ_edge (abb) instead of single_succ_edge (abb). Punt on internal noreturn calls. (decrease_profile): Don't assert 0 or 1 successor edges. (eliminate_tail_call): Use single_non_eh_succ_edge (gsi_bb (t->call_gsi)) instead of single_succ_edge (gsi_bb (t->call_gsi)). (tree_optimize_tail_calls_1): Also look into basic blocks with single succ edge which is EDGE_EH for noreturn musttail calls. * g++.dg/opt/musttail3.C: New test. * g++.dg/opt/musttail4.C: New test. * g++.dg/opt/musttail5.C: New test. 
--- gcc/tree-tailcall.cc.jj 2025-04-01 16:47:30.373502796 +0200 +++ gcc/tree-tailcall.cc 2025-04-02 09:02:35.572760732 +0200 @@ -219,6 +219,23 @@ suitable_for_tail_call_opt_p (gcall *cal return true; } +/* Return single successor edge ignoring EDGE_EH edges. */ + +static edge +single_non_eh_succ_edge (basic_block bb) +{ + edge e, ret = NULL; + edge_iterator ei; + FOR_EACH_EDGE (e, ei, bb->succs) + if ((e->flags & EDGE_EH) == 0) + { + gcc_assert (ret == NULL); + ret = e; + } + gcc_assert (ret); + return ret; +} + /* Checks whether the expression EXPR in stmt AT is independent of the statement pointed to by GSI (in a sense that we already know EXPR's value at GSI). We use the fact that we are only called from the chain of @@ -245,7 +262,7 @@ independent_of_stmt_p (tree expr, gimple /* Mark the blocks in the chain leading to the end. */ at_bb = gimple_bb (at); call_bb = gimple_bb (gsi_stmt (gsi)); - for (bb = call_bb; bb != at_bb; bb = single_succ (bb)) + for (bb = call_bb; bb != at_bb; bb = single_non_eh_succ_edge (bb)->dest) bb->aux = &bb->aux; bb->aux = &bb->aux; @@ -289,7 +306,7 @@ independent_of_stmt_p (tree expr, gimple } /* Unmark the blocks. */ - for (bb = call_bb; bb != at_bb; bb = single_succ (bb)) + for (bb = call_bb; bb != at_bb; bb = single_non_eh_succ_edge (bb)->dest) bb->aux = NULL; bb->aux = NULL; @@ -462,6 +479,33 @@ maybe_error_musttail (gcall *call, const } } +/* Return true if there is no real work performed in the exception + path starting at BB and it will in the end result in external exception. + Search at most CNT basic blocks (so that we don't need to do trivial + loop discovery). 
*/ +static bool +empty_eh_cleanup (basic_block bb, int cnt) +{ + if (EDGE_COUNT (bb->succs) > 1) + return false; + + for (gimple_stmt_iterator gsi = gsi_after_labels (bb); !gsi_end_p (gsi); + gsi_next (&gsi)) + { + gimple *g = gsi_stmt (gsi); + if (is_gimple_debug (g) || gimple_clobber_p (g)) + continue; + if (is_gimple_resx (g) && stmt_can_throw_external (cfun, g)) + return true; + return false; + } + if (!single_succ_p (bb)) + return false; + if (cnt == 1) + return false; + return empty_eh_cleanup (single_succ (bb), cnt - 1); +} + /* Argument for compute_live_vars/live_vars_at_stmt and what compute_live_vars returns. Computed lazily, but just once for the function. */ static live_vars_map *live_vars; @@ -612,14 +656,36 @@ find_tail_calls (basic_block bb, struct if ((stmt_could_throw_p (cfun, stmt) && !stmt_can_throw_external (cfun, stmt)) || EDGE_COUNT (bb->succs) > 1) { - if (stmt == last_stmt) - maybe_error_musttail (call, - _("call may throw exception that does not " - "propagate"), diag_musttail); - else - maybe_error_musttail (call, _("code between call and return"), - diag_musttail); - return; + if (stmt != last_stmt) + { + maybe_error_musttail (call, _("code between call and return"), + diag_musttail); + return; + } + + edge e; + edge_iterator ei; + FOR_EACH_EDGE (e, ei, bb->succs) + if (e->flags & EDGE_EH) + break; + + if (!e) + { + maybe_error_musttail (call, + _("call may throw exception that does not " + "propagate"), diag_musttail); + return; + } + + if (!gimple_call_must_tail_p (call) + || !empty_eh_cleanup (e->dest, 20) + || EDGE_COUNT (bb->succs) > 2) + { + maybe_error_musttail (call, + _("call may throw exception caught locally " + "or perform cleanups"), diag_musttail); + return; + } } /* If the function returns a value, then at present, the tail call @@ -763,8 +829,7 @@ find_tail_calls (basic_block bb, struct a = NULL_TREE; auto_bitmap to_move_defs; auto_vec<gimple *> to_move_stmts; - bool is_noreturn - = EDGE_COUNT (bb->succs) == 0 && 
gimple_call_noreturn_p (call); + bool is_noreturn = gimple_call_noreturn_p (call); abb = bb; agsi = gsi; @@ -776,8 +841,9 @@ find_tail_calls (basic_block bb, struct while (gsi_end_p (agsi)) { - ass_var = propagate_through_phis (ass_var, single_succ_edge (abb)); - abb = single_succ (abb); + edge e = single_non_eh_succ_edge (abb); + ass_var = propagate_through_phis (ass_var, e); + abb = e->dest; agsi = gsi_start_bb (abb); } @@ -851,6 +917,11 @@ find_tail_calls (basic_block bb, struct /* See if this is a tail call we can handle. */ if (is_noreturn) { + if (gimple_call_internal_p (call)) + { + maybe_error_musttail (call, _("internal call"), diag_musttail); + return; + } tree rettype = TREE_TYPE (TREE_TYPE (current_function_decl)); tree calltype = TREE_TYPE (gimple_call_fntype (call)); if (!VOID_TYPE_P (rettype) @@ -1112,11 +1183,6 @@ static void decrease_profile (basic_block bb, profile_count count) { bb->count = bb->count - count; - if (!single_succ_p (bb)) - { - gcc_assert (!EDGE_COUNT (bb->succs)); - return; - } } /* Eliminates tail call described by T. TMP_VARS is a list of @@ -1181,7 +1247,7 @@ eliminate_tail_call (struct tailcall *t, else { /* Number of executions of function has reduced by the tailcall. */ - e = single_succ_edge (gsi_bb (t->call_gsi)); + e = single_non_eh_succ_edge (gsi_bb (t->call_gsi)); profile_count count = e->count (); @@ -1196,8 +1262,7 @@ eliminate_tail_call (struct tailcall *t, decrease_profile (e->dest, count); /* Replace the call by a jump to the start of function. 
*/ - e = redirect_edge_and_branch (single_succ_edge (gsi_bb (t->call_gsi)), - first); + e = redirect_edge_and_branch (e, first); } gcc_assert (e); PENDING_STMT (e) = NULL; @@ -1362,7 +1427,9 @@ tree_optimize_tail_calls_1 (bool opt_tai { basic_block bb; FOR_EACH_BB_FN (bb, cfun) - if (EDGE_COUNT (bb->succs) == 0) + if (EDGE_COUNT (bb->succs) == 0 + || (single_succ_p (bb) + && (single_succ_edge (bb)->flags & EDGE_EH))) if (gimple *c = last_nondebug_stmt (bb)) if (is_gimple_call (c) && gimple_call_must_tail_p (as_a <gcall *> (c)) --- gcc/testsuite/g++.dg/opt/musttail3.C.jj 2025-04-01 18:47:10.474945080 +0200 +++ gcc/testsuite/g++.dg/opt/musttail3.C 2025-04-01 18:49:27.063068029 +0200 @@ -0,0 +1,41 @@ +// PR tree-optimization/119491 +// { dg-do compile { target { external_musttail && c++11 } } } +// { dg-options "-O2" } + +struct A { + struct B {}; + A () {} +}; +void qux (); +unsigned char v; +A w; +void foo (A); + +template <typename T> +[[gnu::always_inline]] static inline void +bar (int &) +{ +} + +[[gnu::always_inline]] static inline void +baz (int *) +{ + int r = 0; + bar<int> (r); +} + +[[gnu::always_inline]] inline void +corge (A) +{ + if (v) + qux (); + [[gnu::musttail]] return foo (w); +} + +void +freddy (A) +{ + int t; + baz (&t); + [[gnu::musttail]] return corge (A{}); +} --- gcc/testsuite/g++.dg/opt/musttail4.C.jj 2025-04-01 19:10:56.389350911 +0200 +++ gcc/testsuite/g++.dg/opt/musttail4.C 2025-04-01 19:28:18.285020409 +0200 @@ -0,0 +1,35 @@ +// { dg-do compile { target { external_musttail && c++11 } } } +// { dg-options "-O2 -fexceptions" } + +struct S { ~S (); }; +volatile int v; +struct T { ~T () { v = v + 1; } }; +struct U { ~U () {} }; +int foo (); + +int +bar () noexcept +{ + [[gnu::musttail]] return foo (); // { dg-error "cannot tail-call: call may throw exception that does not propagate" } +} + +int +baz () +{ + S s; + [[gnu::musttail]] return foo (); // { dg-error "cannot tail-call: other reasons" } +} + +int +qux () +{ + T t; + [[gnu::musttail]] 
return foo (); // { dg-error "cannot tail-call: other reasons" } +} + +int +corge () +{ + U u; + [[gnu::musttail]] return foo (); +} --- gcc/testsuite/g++.dg/opt/musttail5.C.jj 2025-04-01 19:14:50.981127712 +0200 +++ gcc/testsuite/g++.dg/opt/musttail5.C 2025-04-01 19:11:25.249954382 +0200 @@ -0,0 +1,41 @@ +// PR tree-optimization/119491 +// { dg-do compile { target { external_musttail && c++11 } } } +// { dg-options "-O2" } + +struct A { + struct B {}; + A () {} +}; +void qux (); +unsigned char v; +A w; +[[noreturn]] void foo (A); + +template <typename T> +[[gnu::always_inline]] static inline void +bar (int &) +{ +} + +[[gnu::always_inline]] static inline void +baz (int *) +{ + int r = 0; + bar<int> (r); +} + +[[gnu::always_inline]] inline void +corge (A) +{ + if (v) + qux (); + [[gnu::musttail]] return foo (w); +} + +void +freddy (A) +{ + int t; + baz (&t); + [[gnu::musttail]] return corge (A{}); +} Jakub