Hello world, the attached patch fixes the PR by removing common function elimination in FORALL statements.
In the course of fixing this PR, I had originally fixed the ICE only to find that the transformation (where f is a function) from forall (i=1:2) a(i) = f(i) + f(i) end forall to forall (i=1:2) tmp = f(i) a(i) = tmp + tmp end forall did the Wrong Thing. Oh well... Regression-tested. OK for trunk? Thomas 2011-10-09 Thomas Koenig <tkoe...@gcc.gnu.org> PR fortran/50564 * frontend-passes.c (forall_level): New variable. (cfe_register_funcs): Don't register functions if we are within a forall loop. (optimize_namespace): Set forall_level to 0 before entry. (gfc_code_walker): Increase/decrease forall_level. 2011-10-09 Thomas Koenig <tkoe...@gcc.gnu.org> PR fortran/50564 * gfortran.dg/forall_15.f90: New test case.
Index: frontend-passes.c =================================================================== --- frontend-passes.c (Revision 179709) +++ frontend-passes.c (Arbeitskopie) @@ -62,6 +62,10 @@ static gfc_code *inserted_block, **changed_stateme gfc_namespace *current_ns; +/* If we are within any forall loop. */ + +static int forall_level; + /* Entry point - run all passes for a namespace. So far, only an optimization pass is run. */ @@ -165,6 +169,12 @@ cfe_register_funcs (gfc_expr **e, int *walk_subtre || (*e)->ts.u.cl->length->expr_type != EXPR_CONSTANT)) return 0; + /* We don't do function elimination within FORALL statements, it can + lead to wrong-code in certain circumstances. */ + + if (forall_level > 0) + return 0; + /* If we don't know the shape at compile time, we create an allocatable temporary variable to hold the intermediate result, but only if allocation on assignment is active. */ @@ -493,6 +503,7 @@ optimize_namespace (gfc_namespace *ns) { current_ns = ns; + forall_level = 0; gfc_code_walker (&ns->code, convert_do_while, dummy_expr_callback, NULL); gfc_code_walker (&ns->code, cfe_code, cfe_expr_0, NULL); @@ -1193,6 +1204,7 @@ gfc_code_walker (gfc_code **c, walk_code_fn_t code WALK_SUBEXPR (fa->end); WALK_SUBEXPR (fa->stride); } + forall_level ++; break; } @@ -1335,6 +1347,10 @@ gfc_code_walker (gfc_code **c, walk_code_fn_t code WALK_SUBEXPR (b->expr2); WALK_SUBCODE (b->next); } + + if (co->op == EXEC_FORALL || co->op == EXEC_DO_CONCURRENT) + forall_level --; + } } return 0;
! { dg-do run }
! { dg-options "-ffrontend-optimize -fdump-tree-original" }
! PR 50564 - this used to ICE with front end optimization.
! Original test case by Andrew Benson.
!
! The program computes the same expression twice: element by element
! outside of a FORALL (into "control") and inside a FORALL (into
! "timeSteps"), then aborts if the two results differ.  The right-hand
! side calls dble() on the same argument twice, which is the repeated
! function call pattern that front-end optimization looks at.
program test
  implicit none
  double precision, dimension(2) :: timeSteps, control
  integer :: iTime
  double precision :: ratio
  double precision :: a

  ratio = 0.7d0
  ! Reference values, computed with literal indices and no FORALL.
  control(1) = ratio**(dble(1)-0.5d0)-ratio**(dble(1)-1.5d0)
  control(2) = ratio**(dble(2)-0.5d0)-ratio**(dble(2)-1.5d0)
  ! Same expression with the FORALL index in place of the literal.
  forall(iTime=1:2)
     timeSteps(iTime)=ratio**(dble(iTime)-0.5d0)-ratio**(dble(iTime)-1.5d0)
  end forall
  ! Run-time check: the FORALL result must match the reference values.
  if (any(abs(timesteps - control) > 1d-10)) call abort
  ! Make sure we still do the front-end optimization after a forall
  ! (cos(ratio) and sin(ratio) each appear twice in the source; the
  ! dg-final scans below expect each builtin exactly once in the dump).
  a = cos(ratio)*cos(ratio) + sin(ratio)*sin(ratio)
  if (abs(a-1.d0) > 1d-10) call abort
end program test
! { dg-final { scan-tree-dump-times "__builtin_cos" 1 "original" } }
! { dg-final { scan-tree-dump-times "__builtin_sin" 1 "original" } }
! { dg-final { cleanup-tree-dump "original" } }