https://gcc.gnu.org/g:6fc3da8fa2af1d4ee154ea803636eabde358b553

commit r15-6091-g6fc3da8fa2af1d4ee154ea803636eabde358b553
Author: Vladimir N. Makarov <vmaka...@redhat.com>
Date:   Tue Dec 10 12:50:27 2024 -0500

    [PR117946][LRA]: When assigning hard reg use biggest mode to check 
ira_prohibited_class_mode_regs
    
    A pseudo in the PR test case gets hard reg 43 which is x86 r15 (after
    r15, xmm regs go).  The pseudo is of INT_SSE_CLASS and SImode but is
    used in TImode as paradoxical subreg.  r15 in TImode is wrong and does
    not satisfy constraint 'r'.  Therefore LRA creates moves involving the
    pseudo in TImode until the limit of reload insns is achieved.
    Unfortunately x86 hard_regno_mode_ok (as some hooks for other targets)
    says that it is ok to use r15 for TImode pseudo.  Therefore LRA uses
    ira_prohibited_class_mode_regs for such cases but it was checked
    against native pseudo mode.  The patch fixes it by using the biggest
    pseudo mode.
    
    gcc/ChangeLog:
    
            PR rtl-optimization/117946
            * lra-assigns.cc: (find_hard_regno_for_1): Use the biggest mode to
            check ira_prohibited_class_mode_regs.
    
    gcc/testsuite/ChangeLog:
    
            PR rtl-optimization/117946
            * gcc.target/i386/pr117946.c: New.

Diff:
---
 gcc/lra-assigns.cc                       |  5 ++---
 gcc/testsuite/gcc.target/i386/pr117946.c | 16 ++++++++++++++++
 2 files changed, 18 insertions(+), 3 deletions(-)

diff --git a/gcc/lra-assigns.cc b/gcc/lra-assigns.cc
index 0a14bde5e743..405afc06f57e 100644
--- a/gcc/lra-assigns.cc
+++ b/gcc/lra-assigns.cc
@@ -629,13 +629,12 @@ find_hard_regno_for_1 (int regno, int *cost, int 
try_only_hard_regno,
        hard_regno = ira_class_hard_regs[rclass][i];
       if (! overlaps_hard_reg_set_p (conflict_set,
                                     PSEUDO_REGNO_MODE (regno), hard_regno)
-         && targetm.hard_regno_mode_ok (hard_regno,
-                                        PSEUDO_REGNO_MODE (regno))
+         && targetm.hard_regno_mode_ok (hard_regno, PSEUDO_REGNO_MODE (regno))
          /* We cannot use prohibited_class_mode_regs for all classes
             because it is not defined for all classes.  */
          && (ira_allocno_class_translate[rclass] != rclass
              || ! TEST_HARD_REG_BIT (ira_prohibited_class_mode_regs
-                                     [rclass][PSEUDO_REGNO_MODE (regno)],
+                                     [rclass][biggest_mode],
                                      hard_regno))
          && ! TEST_HARD_REG_BIT (impossible_start_hard_regs, hard_regno)
          && (nregs_diff == 0
diff --git a/gcc/testsuite/gcc.target/i386/pr117946.c 
b/gcc/testsuite/gcc.target/i386/pr117946.c
new file mode 100644
index 000000000000..7304e01d1a7e
--- /dev/null
+++ b/gcc/testsuite/gcc.target/i386/pr117946.c
@@ -0,0 +1,16 @@
+/* { dg-do compile  { target { ! ia32 } } } */
+/* { dg-options "-O -favoid-store-forwarding -mavx10.1 -mprefer-avx128 
--param=store-forwarding-max-distance=128 -Wno-psabi" } */
+typedef __attribute__((__vector_size__ (64))) _Decimal32 V;
+
+void
+bar (float, float, float, float, float, _Complex, float, float, float,
+     _BitInt(1023), _BitInt (1023), float, float, float, float, float, float,
+     float, float, float, float, float, float, _Decimal64, float, float, float,
+     V, float, _Decimal64);
+
+void
+foo ()
+{
+  bar (0, 0, 0, 0, 0, 0, 0, __builtin_nand64 ("nan"), 0, 0, 0, 0, 0, 0, 0, 0,
+       0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, (V){}, 0, 0);
+}

Reply via email to