https://gcc.gnu.org/g:76048bd0693e30a5abc67aa6dcce9f4973ea208e

commit r15-5012-g76048bd0693e30a5abc67aa6dcce9f4973ea208e
Author: Richard Biener <rguent...@suse.de>
Date:   Mon Nov 4 13:03:33 2024 +0100

    Check LOOP_VINFO_PEELING_FOR_GAPS on epilog is supported
    
    We need to check that an epilogue doesn't require
    LOOP_VINFO_PEELING_FOR_GAPS
    in case the main loop didn't (the other way around is OK), the
    computation whether the epilog is executed or not gets out of sync
    otherwise.
    
            * tree-vect-loop.cc (vect_analyze_loop_2): Move
            vect_analyze_loop_costing after check whether we can do
            peeling.  Add check on LOOP_VINFO_PEELING_FOR_GAPS for
            epilogues.

Diff:
---
 gcc/tree-vect-loop.cc | 30 ++++++++++++++++++++----------
 1 file changed, 20 insertions(+), 10 deletions(-)

diff --git a/gcc/tree-vect-loop.cc b/gcc/tree-vect-loop.cc
index e6d241482ce3..e91549a643b9 100644
--- a/gcc/tree-vect-loop.cc
+++ b/gcc/tree-vect-loop.cc
@@ -3143,17 +3143,15 @@ start_over:
                                       " epilogue loop.\n");
     }
 
-  /* Check the costings of the loop make vectorizing worthwhile.  */
-  res = vect_analyze_loop_costing (loop_vinfo, suggested_unroll_factor);
-  if (res < 0)
-    {
-      ok = opt_result::failure_at (vect_location,
-                                  "Loop costings may not be worthwhile.\n");
-      goto again;
-    }
-  if (!res)
+  /* If the epilogue needs peeling for gaps but the main loop doesn't give
+     up on the epilogue.  */
+  if (LOOP_VINFO_EPILOGUE_P (loop_vinfo)
+      && LOOP_VINFO_PEELING_FOR_GAPS (loop_vinfo)
+      && (LOOP_VINFO_PEELING_FOR_GAPS (orig_loop_vinfo)
+         != LOOP_VINFO_PEELING_FOR_GAPS (loop_vinfo)))
     return opt_result::failure_at (vect_location,
-                                  "Loop costings not worthwhile.\n");
+                                  "Epilogue loop requires peeling for gaps "
+                                  "but main loop does not.\n");
 
   /* If an epilogue loop is required make sure we can create one.  */
   if (LOOP_VINFO_PEELING_FOR_GAPS (loop_vinfo)
@@ -3174,6 +3172,18 @@ start_over:
         }
     }
 
+  /* Check the costings of the loop make vectorizing worthwhile.  */
+  res = vect_analyze_loop_costing (loop_vinfo, suggested_unroll_factor);
+  if (res < 0)
+    {
+      ok = opt_result::failure_at (vect_location,
+                                  "Loop costings may not be worthwhile.\n");
+      goto again;
+    }
+  if (!res)
+    return opt_result::failure_at (vect_location,
+                                  "Loop costings not worthwhile.\n");
+
   /* During peeling, we need to check if number of loop iterations is
      enough for both peeled prolog loop and vector loop.  This check
      can be merged along with threshold check of loop versioning, so

Reply via email to