Hi Tobias,
> On 10.06.21 20:52, Harald Anlauf via Fortran wrote:
> > +static bool
> > +substring_has_constant_len (gfc_expr *e)
> > +{
> > + ptrdiff_t istart, iend;
> > + size_t length;
> > + bool equal_length = false;
> > +
> > + if (e->ts.type != BT_CHARACTER
> > + || !e->ref
> > + || e->ref->type != REF_SUBSTRING
>
> Is there a reason why you do not handle:
>
> type t
> character(len=5) :: str1
> character(len=:), allocatable :: str2
> end type
> type(t) :: x
>
> allocate(x%str2, source="abd")
> if (len (x%str1) /= 1) ...
> if (len (x%str2(1:2)) /= 2) ...
> etc.
>
> Namely: search for the last ref (last_ref = expr->ref->next->next ...)
> and then check that last_ref?
I was assuming that the argument passed to LEN() is already the ultimate
component for the case of substrings, and I was unable to find a case which
requires implementing that iteration. The cases you provided do not seem
to apply here:
- derived type component str1, which is a string of given length, poses no
problem. I added a case to the testcase, see attached updated patch.
- derived type component str2 has deferred length. I do not see that the
simplification can be applied here, as the allocation could lead to str2
being too short, and we do not want to simplify invalid code, such as:
type t
character(len=:), allocatable :: str2
end type
type(t) :: x
allocate(x%str2, source="z")
if (len (x%str2(1:2)) /= 2) stop 1
end
If we want this to be catchable by bounds checking, we need to punt
on simplifying this case. The updated patch skips deferred-length strings.
> * * *
>
> Slightly unrelated: I think the following does not violate
> F2018's R916 / C923 – but is rejected, namely:
> R916 type-param-inquiry is designator % type-param-name
> the latter is 'len' or 'kind' for intrinsic types. And:
> R901 designator is ...
> or substring
> But
>
> character(len=5) :: str
> print *, str(1:3)%len
> end
>
> fails with
>
> 2 | print *, str(1:3)%len
> | 1
> Error: Syntax error in PRINT statement at (1)
>
>
> Assuming you don't want to handle it, can you open a new PR?
> Thanks!
Good point. I'd rather open a separate PR for this, though.
> > + istart = gfc_mpz_get_hwi (e->ref->u.ss.start->value.integer);
> > + iend = gfc_mpz_get_hwi (e->ref->u.ss.end->value.integer);
> > + length = gfc_mpz_get_hwi (e->ref->u.ss.length->length->value.integer);
> > +
> > + if (istart <= iend)
> > + {
> > + if (istart < 1)
> > + {
> > + gfc_error ("Substring start index (%ld) at %L below 1",
> > + (long) istart, &e->ref->u.ss.start->where);
>
> As mentioned by Bernhard, you could use HOST_WIDE_INT_PRINT_DEC.
>
> (It probably only matters on Windows, where long == int == 32 bit, and only
> for strings longer than INT_MAX.)
I am not familiar enough with Windows. What is HOST_WIDE_INT
on that system? (As compared to e.g. size_t, ptrdiff_t).
The (slightly) updated patch regtests fine.
Thanks,
Harald
diff --git a/gcc/fortran/simplify.c b/gcc/fortran/simplify.c
index c27b47aa98f..7f22372afec 100644
--- a/gcc/fortran/simplify.c
+++ b/gcc/fortran/simplify.c
@@ -4512,6 +4512,62 @@ gfc_simplify_leadz (gfc_expr *e)
}
+/* Return true if E is a substring with constant bounds; sets E's length. */
+
+static bool
+substring_has_constant_len (gfc_expr *e)
+{
+ ptrdiff_t istart, iend;
+ size_t length;
+ bool equal_length = false;
+
+ if (e->ts.type != BT_CHARACTER
+ || e->ts.deferred /* Deferred length: do not simplify. */
+ || !e->ref
+ || e->ref->type != REF_SUBSTRING /* Only the first ref is examined. */
+ || !e->ref->u.ss.start
+ || e->ref->u.ss.start->expr_type != EXPR_CONSTANT
+ || !e->ref->u.ss.end
+ || e->ref->u.ss.end->expr_type != EXPR_CONSTANT
+ || !e->ref->u.ss.length
+ || !e->ref->u.ss.length->length
+ || e->ref->u.ss.length->length->expr_type != EXPR_CONSTANT)
+ return false;
+
+ /* Basic checks on substring starting and ending indices. */
+ if (!gfc_resolve_substring (e->ref, &equal_length))
+ return false;
+
+ istart = gfc_mpz_get_hwi (e->ref->u.ss.start->value.integer);
+ iend = gfc_mpz_get_hwi (e->ref->u.ss.end->value.integer);
+ length = gfc_mpz_get_hwi (e->ref->u.ss.length->length->value.integer);
+
+ if (istart <= iend) /* Non-empty substring: validate both bounds. */
+ {
+ if (istart < 1)
+ {
+ gfc_error ("Substring start index (%ld) at %L below 1",
+ (long) istart, &e->ref->u.ss.start->where);
+ return false;
+ }
+ if (iend > (ssize_t) length) /* LENGTH is still the string length here. */
+ {
+ gfc_error ("Substring end index (%ld) at %L exceeds string "
+ "length", (long) iend, &e->ref->u.ss.end->where);
+ return false;
+ }
+ length = iend - istart + 1; /* From here on LENGTH is the substring's. */
+ }
+ else
+ length = 0; /* Start beyond end: zero-length substring. */
+
+ /* Record the computed substring length in the expression itself. */
+ e->value.character.length = length;
+
+ return true;
+}
+
+
gfc_expr *
gfc_simplify_len (gfc_expr *e, gfc_expr *kind)
{
@@ -4521,7 +4577,11 @@ gfc_simplify_len (gfc_expr *e, gfc_expr *kind)
if (k == -1)
return &gfc_bad_expr;
- if (e->expr_type == EXPR_CONSTANT)
+ if (e->ts.deferred)
+ return NULL;
+
+ if (e->expr_type == EXPR_CONSTANT
+ || substring_has_constant_len (e))
{
result = gfc_get_constant_expr (BT_INTEGER, k, &e->where);
mpz_set_si (result->value.integer, e->value.character.length);
diff --git a/gcc/testsuite/gfortran.dg/pr100950.f90 b/gcc/testsuite/gfortran.dg/pr100950.f90
new file mode 100644
index 00000000000..f082cfea795
--- /dev/null
+++ b/gcc/testsuite/gfortran.dg/pr100950.f90
@@ -0,0 +1,28 @@
+! { dg-do run }
+! PR fortran/100950 - ICE in output_constructor_regular_field, at varasm.c:5514
+
+program p
+ character(8), parameter :: u = "123"
+ character(8) :: x = "", s
+ character(2) :: w(2) = [character(len(x(3:4))) :: 'a','b' ]
+ character(*), parameter :: y(*) = [character(len(u(3:4))) :: 'a','b' ] ! substring of a parameter
+ character(*), parameter :: z(*) = [character(len(x(3:4))) :: 'a','b' ] ! substring of a variable
+ character(*), parameter :: t(*) = [character(len(x( :2))) :: 'a','b' ] ! start index omitted
+ character(*), parameter :: v(*) = [character(len(x(7: ))) :: 'a','b' ] ! end index omitted
+ type t_
+ character(len=5) :: s ! fixed-length component
+ end type t_
+ type(t_) :: q, r(1)
+ if (len (y) /= 2) stop 1
+ if (len (z) /= 2) stop 2
+ if (any (w /= y)) stop 3
+ if (len ([character(len(u(3:4))) :: 'a','b' ]) /= 2) stop 4
+ if (len ([character(len(x(3:4))) :: 'a','b' ]) /= 2) stop 5
+ if (any ([character(len(x(3:4))) :: 'a','b' ] /= y)) stop 6
+ write(s,*) [character(len(x(3:4))) :: 'a','b' ]
+ if (s /= " a b ") stop 7
+ if (len (t) /= 2) stop 8
+ if (len (v) /= 2) stop 9
+ if (len (q%s) /= 5) stop 10 ! scalar derived-type component
+ if (len (r%s) /= 5) stop 11 ! component of a derived-type array
+end