On Mon, Jun 23, 2025 at 07:30:51PM +0530, Surya Kumari Jangala wrote:
> Hi Mike,
>
> On 14/06/25 2:07 pm, Michael Meissner wrote:
> > This is patch #1 of 4 that adds the support that can be used in developing
> > GCC
> > support for future PowerPC processors.
>
> Please reword the commit message, perhaps something like:
> This is patch #1 of 4 that adds support for the option -mcpu=future. This
> enables
> future enhancements to GCC for supporting upcoming PowerPC processors.
Ok.
> > diff --git a/gcc/config/rs6000/rs6000-cpus.def
> > b/gcc/config/rs6000/rs6000-cpus.def
> > index 4a1037616d7..228d0b5e7b5 100644
> > --- a/gcc/config/rs6000/rs6000-cpus.def
> > +++ b/gcc/config/rs6000/rs6000-cpus.def
> > @@ -83,6 +83,9 @@
> > #define POWER11_MASKS_SERVER (ISA_3_1_MASKS_SERVER \
> > | OPTION_MASK_POWER11)
> >
> > +#define FUTURE_MASKS_SERVER (POWER11_MASKS_SERVER
> > \
> > + | OPTION_MASK_FUTURE)
> > +
> > /* Flags that need to be turned off if -mno-vsx. */
> > #define OTHER_VSX_VECTOR_MASKS (OPTION_MASK_EFFICIENT_UNALIGNED_VSX
> > \
> > | OPTION_MASK_FLOAT128_KEYWORD \
> > @@ -119,6 +122,7 @@
> > | OPTION_MASK_FLOAT128_HW \
> > | OPTION_MASK_FLOAT128_KEYWORD \
> > | OPTION_MASK_FPRND \
> > + | OPTION_MASK_FUTURE \
> > | OPTION_MASK_POWER10 \
> > | OPTION_MASK_POWER11 \
>
> Please add OPTION_MASK_FUTURE after OPTION_MASK_POWER11.
The style in rs6000-cpus.def for the POWERPC_MASKS macro is to have all of the
option masks be sorted alphabetically. This macro is a list of all of the
options that need to be toggled as setting ISA bits when using either:
#pragma GCC target "..."
or
__attribute__((__target__("...")))
But if desired, I can certainly change it.
> > | OPTION_MASK_P10_FUSION \
> > @@ -249,6 +253,7 @@ RS6000_CPU ("power9", PROCESSOR_POWER9, MASK_POWERPC64
> > | ISA_3_0_MASKS_SERVER
> > | OPTION_MASK_HTM)
> > RS6000_CPU ("power10", PROCESSOR_POWER10, MASK_POWERPC64 |
> > ISA_3_1_MASKS_SERVER)
> > RS6000_CPU ("power11", PROCESSOR_POWER11, MASK_POWERPC64 |
> > POWER11_MASKS_SERVER)
> > +RS6000_CPU ("future", PROCESSOR_FUTURE, MASK_POWERPC64 |
> > FUTURE_MASKS_SERVER)
> > RS6000_CPU ("powerpc", PROCESSOR_POWERPC, 0)
> > RS6000_CPU ("powerpc64", PROCESSOR_POWERPC64, OPTION_MASK_PPC_GFXOPT
> > | MASK_POWERPC64)
> > diff --git a/gcc/config/rs6000/rs6000-opts.h
> > b/gcc/config/rs6000/rs6000-opts.h
> > index c31d2975f04..3983d463e31 100644
> > --- a/gcc/config/rs6000/rs6000-opts.h
> > +++ b/gcc/config/rs6000/rs6000-opts.h
> > @@ -63,6 +63,7 @@ enum processor_type
> > PROCESSOR_POWER9,
> > PROCESSOR_POWER10,
> > PROCESSOR_POWER11,
> > + PROCESSOR_FUTURE,
> >
> > PROCESSOR_RS64A,
> > PROCESSOR_MPCCORE,
> > diff --git a/gcc/config/rs6000/rs6000-tables.opt
> > b/gcc/config/rs6000/rs6000-tables.opt
> > index f5bbed5ea74..518324e7aea 100644
> > --- a/gcc/config/rs6000/rs6000-tables.opt
> > +++ b/gcc/config/rs6000/rs6000-tables.opt
> > @@ -189,14 +189,17 @@ EnumValue
> > Enum(rs6000_cpu_opt_value) String(power11) Value(53)
> >
> > EnumValue
> > -Enum(rs6000_cpu_opt_value) String(powerpc) Value(54)
> > +Enum(rs6000_cpu_opt_value) String(future) Value(54)
> >
> > EnumValue
> > -Enum(rs6000_cpu_opt_value) String(powerpc64) Value(55)
> > +Enum(rs6000_cpu_opt_value) String(powerpc) Value(55)
> >
> > EnumValue
> > -Enum(rs6000_cpu_opt_value) String(powerpc64le) Value(56)
> > +Enum(rs6000_cpu_opt_value) String(powerpc64) Value(56)
> >
> > EnumValue
> > -Enum(rs6000_cpu_opt_value) String(rs64) Value(57)
> > +Enum(rs6000_cpu_opt_value) String(powerpc64le) Value(57)
> > +
> > +EnumValue
> > +Enum(rs6000_cpu_opt_value) String(rs64) Value(58)
> >
> > diff --git a/gcc/config/rs6000/rs6000.cc b/gcc/config/rs6000/rs6000.cc
> > index 7ee26e52b13..141d53b1a12 100644
> > --- a/gcc/config/rs6000/rs6000.cc
> > +++ b/gcc/config/rs6000/rs6000.cc
> > @@ -1066,7 +1066,7 @@ struct processor_costs power9_cost = {
> > COSTS_N_INSNS (3), /* SF->DF convert */
> > };
> >
> > -/* Instruction costs on Power10/Power11 processors. */
> > +/* Instruction costs on Power10/Power11/future processors. */
> > static const
> > struct processor_costs power10_cost = {
> > COSTS_N_INSNS (2), /* mulsi */
> > @@ -4388,7 +4388,8 @@ rs6000_option_override_internal (bool global_init_p)
> > if (!(rs6000_isa_flags_explicit & OPTION_MASK_P10_FUSION))
> > {
> > if (rs6000_tune == PROCESSOR_POWER10
> > - || rs6000_tune == PROCESSOR_POWER11)
> > + || rs6000_tune == PROCESSOR_POWER11
> > + || rs6000_tune == PROCESSOR_FUTURE)
> > rs6000_isa_flags |= OPTION_MASK_P10_FUSION;
> > else
> > rs6000_isa_flags &= ~OPTION_MASK_P10_FUSION;
> > @@ -4418,6 +4419,7 @@ rs6000_option_override_internal (bool global_init_p)
> > && rs6000_tune != PROCESSOR_POWER9
> > && rs6000_tune != PROCESSOR_POWER10
> > && rs6000_tune != PROCESSOR_POWER11
> > + && rs6000_tune != PROCESSOR_FUTURE
> > && rs6000_tune != PROCESSOR_PPCA2
> > && rs6000_tune != PROCESSOR_CELL
> > && rs6000_tune != PROCESSOR_PPC476);
> > @@ -4433,6 +4435,7 @@ rs6000_option_override_internal (bool global_init_p)
> > || rs6000_tune == PROCESSOR_POWER9
> > || rs6000_tune == PROCESSOR_POWER10
> > || rs6000_tune == PROCESSOR_POWER11
> > + || rs6000_tune == PROCESSOR_FUTURE
> > || rs6000_tune == PROCESSOR_PPCE500MC
> > || rs6000_tune == PROCESSOR_PPCE500MC64
> > || rs6000_tune == PROCESSOR_PPCE5500
> > @@ -4733,6 +4736,7 @@ rs6000_option_override_internal (bool global_init_p)
> >
> > case PROCESSOR_POWER10:
> > case PROCESSOR_POWER11:
> > + case PROCESSOR_FUTURE:
> > rs6000_cost = &power10_cost;
> > break;
> >
> > @@ -5905,6 +5909,8 @@ rs6000_machine_from_flags (void)
> > flags &= ~(OPTION_MASK_PPC_GFXOPT | OPTION_MASK_PPC_GPOPT |
> > OPTION_MASK_ISEL
> > | OPTION_MASK_ALTIVEC);
> >
> > + if ((flags & (FUTURE_MASKS_SERVER & ~ISA_3_1_MASKS_SERVER)) != 0)
>
> The test should be against POWER11_MASKS_SERVER, not ISA_3_1_MASKS_SERVER.
>
> > + return "future";
> > if ((flags & (POWER11_MASKS_SERVER & ~ISA_3_1_MASKS_SERVER)) != 0)
> > return "power11";
> > if ((flags & (ISA_3_1_MASKS_SERVER & ~ISA_3_0_MASKS_SERVER)) != 0)
> > @@ -10155,6 +10161,7 @@ rs6000_reassociation_width (unsigned int opc
> > ATTRIBUTE_UNUSED,
> > case PROCESSOR_POWER9:
> > case PROCESSOR_POWER10:
> > case PROCESSOR_POWER11:
> > + case PROCESSOR_FUTURE:
> > if (DECIMAL_FLOAT_MODE_P (mode))
> > return 1;
> > if (VECTOR_MODE_P (mode))
> > @@ -18197,7 +18204,8 @@ rs6000_adjust_cost (rtx_insn *insn, int dep_type,
> > rtx_insn *dep_insn, int cost,
> > /* Separate a load from a narrower, dependent store. */
> > if ((rs6000_sched_groups || rs6000_tune == PROCESSOR_POWER9
> > || rs6000_tune == PROCESSOR_POWER10
> > - || rs6000_tune == PROCESSOR_POWER11)
> > + || rs6000_tune == PROCESSOR_POWER11
> > + || rs6000_tune == PROCESSOR_FUTURE)
> > && GET_CODE (PATTERN (insn)) == SET
> > && GET_CODE (PATTERN (dep_insn)) == SET
> > && MEM_P (XEXP (PATTERN (insn), 1))
> > @@ -18237,6 +18245,7 @@ rs6000_adjust_cost (rtx_insn *insn, int dep_type,
> > rtx_insn *dep_insn, int cost,
> > || rs6000_tune == PROCESSOR_POWER9
> > || rs6000_tune == PROCESSOR_POWER10
> > || rs6000_tune == PROCESSOR_POWER11
> > + || rs6000_tune == PROCESSOR_FUTURE
> > || rs6000_tune == PROCESSOR_CELL)
> > && recog_memoized (dep_insn)
> > && (INSN_CODE (dep_insn) >= 0))
> > @@ -18812,6 +18821,7 @@ rs6000_issue_rate (void)
> > return 6;
> > case PROCESSOR_POWER10:
> > case PROCESSOR_POWER11:
> > + case PROCESSOR_FUTURE:
> > return 8;
> > default:
> > return 1;
> > @@ -19527,10 +19537,11 @@ rs6000_sched_reorder (FILE *dump
> > ATTRIBUTE_UNUSED, int sched_verbose,
> > if (rs6000_tune == PROCESSOR_POWER6)
> > load_store_pendulum = 0;
> >
> > - /* Do Power10/Power11 dependent reordering. */
> > + /* Do Power10/Power11/future dependent reordering. */
> > if (last_scheduled_insn
> > && (rs6000_tune == PROCESSOR_POWER10
> > - || rs6000_tune == PROCESSOR_POWER11))
> > + || rs6000_tune == PROCESSOR_POWER11
> > + || rs6000_tune == PROCESSOR_FUTURE))
> > power10_sched_reorder (ready, n_ready - 1);
> >
> > return rs6000_issue_rate ();
> > @@ -19554,10 +19565,11 @@ rs6000_sched_reorder2 (FILE *dump, int
> > sched_verbose, rtx_insn **ready,
> > && recog_memoized (last_scheduled_insn) >= 0)
> > return power9_sched_reorder2 (ready, *pn_ready - 1);
> >
> > - /* Do Power10/Power11 dependent reordering. */
> > + /* Do Power10/Power11/future dependent reordering. */
> > if (last_scheduled_insn
> > && (rs6000_tune == PROCESSOR_POWER10
> > - || rs6000_tune == PROCESSOR_POWER11))
> > + || rs6000_tune == PROCESSOR_POWER11
> > + || rs6000_tune == PROCESSOR_FUTURE))
> > return power10_sched_reorder (ready, *pn_ready - 1);
> >
> > return cached_can_issue_more;
> > @@ -22780,7 +22792,8 @@ rs6000_register_move_cost (machine_mode mode,
> > out to be a nop. */
> > if (rs6000_tune == PROCESSOR_POWER9
> > || rs6000_tune == PROCESSOR_POWER10
> > - || rs6000_tune == PROCESSOR_POWER11)
> > + || rs6000_tune == PROCESSOR_POWER11
> > + || rs6000_tune == PROCESSOR_FUTURE)
> > ret = 3 * hard_regno_nregs (FIRST_GPR_REGNO, mode);
> > else
> > ret = 4 * hard_regno_nregs (FIRST_GPR_REGNO, mode);
> > @@ -24450,6 +24463,7 @@ static struct rs6000_opt_mask const
> > rs6000_opt_masks[] =
> > { "float128", OPTION_MASK_FLOAT128_KEYWORD, false,
> > true },
> > { "float128-hardware", OPTION_MASK_FLOAT128_HW, false, true },
> > { "fprnd", OPTION_MASK_FPRND, false,
> > true },
> > + { "future", OPTION_MASK_FUTURE, false,
> > false },
>
> Please add this line after the "power11" line.
>
>
> > { "power10", OPTION_MASK_POWER10, false,
> > true },
> > { "power11", OPTION_MASK_POWER11, false,
> > false },
> > { "hard-dfp", OPTION_MASK_DFP, false,
> > true },
> > diff --git a/gcc/config/rs6000/rs6000.h b/gcc/config/rs6000/rs6000.h
> > index db6112a09e1..76c6cd1ab8e 100644
> > --- a/gcc/config/rs6000/rs6000.h
> > +++ b/gcc/config/rs6000/rs6000.h
> > @@ -101,6 +101,7 @@
> > you make changes here, make them also there. */
> > #define ASM_CPU_SPEC \
> > "%{mcpu=native: %(asm_cpu_native); \
> > + mcpu=future: -mfuture; \
> > mcpu=power11: -mpower11; \
> > mcpu=power10: -mpower10; \
> > mcpu=power9: -mpower9; \
> > diff --git a/gcc/config/rs6000/rs6000.md b/gcc/config/rs6000/rs6000.md
> > index 9c718ca2a22..605047f99a8 100644
> > --- a/gcc/config/rs6000/rs6000.md
> > +++ b/gcc/config/rs6000/rs6000.md
> > @@ -364,7 +364,7 @@ (define_attr "cpu"
> > ppc750,ppc7400,ppc7450,
> > ppc403,ppc405,ppc440,ppc476,
> >
> > ppc8540,ppc8548,ppce300c2,ppce300c3,ppce500mc,ppce500mc64,ppce5500,ppce6500,
> > - power4,power5,power6,power7,power8,power9,power10,power11,
> > + power4,power5,power6,power7,power8,power9,power10,power11,future,
> > rs64a,mpccore,cell,ppca2,titan"
> > (const (symbol_ref "(enum attr_cpu) rs6000_tune")))
> >
> > diff --git a/gcc/config/rs6000/rs6000.opt b/gcc/config/rs6000/rs6000.opt
> > index 88cf16ca581..7e1af7120bc 100644
> > --- a/gcc/config/rs6000/rs6000.opt
> > +++ b/gcc/config/rs6000/rs6000.opt
> > @@ -634,6 +634,12 @@ mieee128-constant
> > Target Var(TARGET_IEEE128_CONSTANT) Init(1) Save
> > Generate (do not generate) code that uses the LXVKQ instruction.
> >
> > +;; Users should not use -mfuture, but we need to use a bit to identify when
> > +;; the user changes the default cpu via #pragma GCC target("cpu=future")
> > +;; and then resets it later.
> > +mfuture
> > +Target Undocumented Mask(FUTURE) Var(rs6000_isa_flags) WarnRemoved
> > +
>
> Please add this after 'mpower11'
Historically, we have always added new flag bits at the end, which is what I
did in this patch. The -mpower11 option should have been added after
-mieee128-constant (-mprefixed, -mpcrel, -mpcrel-opt, -mmma,
-msplat-* are all power10 options).
Granted -mrelative-jumptables, -mrop-protect, and -mprivileged are not power10
specific, but they were added after the basic power10 support was added (hence,
add new ISA options at the end).
I mentioned in my other reply, that I have a set of patches that separates the
option bits (i.e. -mpopcntb, -mcmpb, etc.) from the ISA bits set via
-mcpu=<xxx>. If/when those sets of patches go in, then it allows use to remove
these fake option bits. This patch would allow us to delete:
-mpower8-internal
-mpower10
-mpower11
-mfuture
> Also, in the routine expand_compare_loop(), we should handle PROCESSOR_FUTURE
> when computing max_bytes.
Ok, I'll look at it.
>
> -Surya
>
> > ; Documented parameters
> >
> > -param=rs6000-vect-unroll-limit=
>
--
Michael Meissner, IBM
PO Box 98, Ayer, Massachusetts, USA, 01432
email: [email protected]