The following revises the original fix for PR101173 to correctly
check for a reversed dependence rather than disallowing a zero
distance.  It also adds a testcase from TSVC that requires this
kind of interchange (but with a valid dependence).

Bootstrapped and tested on x86_64-unknown-linux-gnu, pushed.

2021-07-01  Richard Biener  <rguent...@suse.de>

        PR tree-optimization/101280
        PR tree-optimization/101173
        * gimple-loop-interchange.cc
        (tree_loop_interchange::valid_data_dependences): Revert
        previous change and instead correctly handle DDR_REVERSED_P
        dependence.

        * gcc.dg/tree-ssa/loop-interchange-16.c: New testcase.
---
 gcc/gimple-loop-interchange.cc                |  7 ++++--
 .../gcc.dg/tree-ssa/loop-interchange-16.c     | 22 +++++++++++++++++++
 2 files changed, 27 insertions(+), 2 deletions(-)
 create mode 100644 gcc/testsuite/gcc.dg/tree-ssa/loop-interchange-16.c

diff --git a/gcc/gimple-loop-interchange.cc b/gcc/gimple-loop-interchange.cc
index 43045c5455e..43ef112a2d0 100644
--- a/gcc/gimple-loop-interchange.cc
+++ b/gcc/gimple-loop-interchange.cc
@@ -1043,8 +1043,11 @@ tree_loop_interchange::valid_data_dependences (unsigned i_idx, unsigned o_idx,
            continue;
 
          /* Be conservative, skip case if either direction at i_idx/o_idx
-            levels is not '=' (for the inner loop) or '<'.  */
-         if (dist_vect[i_idx] < 0 || dist_vect[o_idx] <= 0)
+            levels is not '=' or '<'.  */
+         if (dist_vect[i_idx] < 0
+             || (DDR_REVERSED_P (ddr) && dist_vect[i_idx] > 0)
+             || dist_vect[o_idx] < 0
+             || (DDR_REVERSED_P (ddr) && dist_vect[o_idx] > 0))
            return false;
        }
     }
diff --git a/gcc/testsuite/gcc.dg/tree-ssa/loop-interchange-16.c b/gcc/testsuite/gcc.dg/tree-ssa/loop-interchange-16.c
new file mode 100644
index 00000000000..781555e085d
--- /dev/null
+++ b/gcc/testsuite/gcc.dg/tree-ssa/loop-interchange-16.c
@@ -0,0 +1,22 @@
+/* PR/101280 */
+/* { dg-do compile } */
+/* { dg-options "-O3 -fdump-tree-linterchange-details" } */
+
+void dummy (double *, double *);
+#define LEN_2D 32
+double aa[LEN_2D][LEN_2D], bb[LEN_2D][LEN_2D];
+double s231(int iterations)
+{
+//    loop interchange candidate: the i and j loops below form the nest
+//    loop with data dependency: aa[j][i] reads aa[j - 1][i] from the previous j
+    for (int nl = 0; nl < 100*(iterations/LEN_2D); nl++) {
+        for (int i = 0; i < LEN_2D; ++i) {
+            for (int j = 1; j < LEN_2D; j++) {
+                aa[j][i] = aa[j - 1][i] + bb[j][i];
+            }
+        }
+        dummy(aa[0],bb[0]);
+    }
+}
+
+/* { dg-final { scan-tree-dump "loops interchanged" "linterchange" } } */
-- 
2.26.2

Reply via email to