Pushed, thanks :)
On Fri, Feb 2, 2024 at 11:59 AM Monk Chiang <monk.chi...@sifive.com> wrote: > > Add sifive p400 series scheduler module. For more information > see https://www.sifive.com/cores/performance-p450-470. > > gcc/ChangeLog: > > * config/riscv/riscv.md: Include sifive-p400.md. > * config/riscv/sifive-p400.md: New file. > * config/riscv/riscv-cores.def (RISCV_TUNE): Add parameter. > * config/riscv/riscv-opts.h (enum riscv_microarchitecture_type): > Add sifive_p400. > * config/riscv/riscv.cc (sifive_p400_tune_info): New. > * config/riscv/riscv.h (TARGET_SFB_ALU): Update. > * doc/invoke.texi (RISC-V Options): Add sifive-p400-series > --- > gcc/config/riscv/riscv-cores.def | 1 + > gcc/config/riscv/riscv-opts.h | 1 + > gcc/config/riscv/riscv.cc | 17 +++ > gcc/config/riscv/riscv.h | 1 + > gcc/config/riscv/riscv.md | 3 +- > gcc/config/riscv/sifive-p400.md | 174 +++++++++++++++++++++++++++++++ > gcc/doc/invoke.texi | 4 +- > 7 files changed, 198 insertions(+), 3 deletions(-) > create mode 100644 gcc/config/riscv/sifive-p400.md > > diff --git a/gcc/config/riscv/riscv-cores.def > b/gcc/config/riscv/riscv-cores.def > index a07a79e2cb7..0785e8f3fbd 100644 > --- a/gcc/config/riscv/riscv-cores.def > +++ b/gcc/config/riscv/riscv-cores.def > @@ -37,6 +37,7 @@ RISCV_TUNE("rocket", generic, rocket_tune_info) > RISCV_TUNE("sifive-3-series", generic, rocket_tune_info) > RISCV_TUNE("sifive-5-series", generic, rocket_tune_info) > RISCV_TUNE("sifive-7-series", sifive_7, sifive_7_tune_info) > +RISCV_TUNE("sifive-p400-series", sifive_p400, sifive_p400_tune_info) > RISCV_TUNE("sifive-p600-series", sifive_p600, sifive_p600_tune_info) > RISCV_TUNE("thead-c906", generic, thead_c906_tune_info) > RISCV_TUNE("generic-ooo", generic_ooo, generic_ooo_tune_info) > diff --git a/gcc/config/riscv/riscv-opts.h b/gcc/config/riscv/riscv-opts.h > index 25951665b13..4edddbadc37 100644 > --- a/gcc/config/riscv/riscv-opts.h > +++ b/gcc/config/riscv/riscv-opts.h > @@ -55,6 +55,7 @@ extern enum riscv_isa_spec_class 
riscv_isa_spec; > enum riscv_microarchitecture_type { > generic, > sifive_7, > + sifive_p400, > sifive_p600, > generic_ooo > }; > diff --git a/gcc/config/riscv/riscv.cc b/gcc/config/riscv/riscv.cc > index cead76fe1a2..4b24e4b9a0a 100644 > --- a/gcc/config/riscv/riscv.cc > +++ b/gcc/config/riscv/riscv.cc > @@ -447,6 +447,23 @@ static const struct riscv_tune_param sifive_7_tune_info > = { > NULL, /* vector cost */ > }; > > +/* Costs to use when optimizing for Sifive p400 Series. */ > +static const struct riscv_tune_param sifive_p400_tune_info = { > + {COSTS_N_INSNS (4), COSTS_N_INSNS (4)}, /* fp_add */ > + {COSTS_N_INSNS (4), COSTS_N_INSNS (4)}, /* fp_mul */ > + {COSTS_N_INSNS (20), COSTS_N_INSNS (20)}, /* fp_div */ > + {COSTS_N_INSNS (4), COSTS_N_INSNS (4)}, /* int_mul */ > + {COSTS_N_INSNS (6), COSTS_N_INSNS (6)}, /* int_div */ > + 3, /* issue_rate */ > + 4, /* branch_cost */ > + 3, /* memory_cost */ > + 4, /* fmv_cost */ > + true, /* > slow_unaligned_access */ > + false, /* use_divmod_expansion */ > + RISCV_FUSE_LUI_ADDI | RISCV_FUSE_AUIPC_ADDI, /* fusible_ops */ > + &generic_vector_cost, /* vector cost */ > +}; > + > /* Costs to use when optimizing for Sifive p600 Series. 
*/ > static const struct riscv_tune_param sifive_p600_tune_info = { > {COSTS_N_INSNS (4), COSTS_N_INSNS (4)}, /* fp_add */ > diff --git a/gcc/config/riscv/riscv.h b/gcc/config/riscv/riscv.h > index e0cb3ba08d4..669308cc96d 100644 > --- a/gcc/config/riscv/riscv.h > +++ b/gcc/config/riscv/riscv.h > @@ -898,6 +898,7 @@ extern enum riscv_cc get_riscv_cc (const rtx use); > > #define TARGET_SFB_ALU \ > ((riscv_microarchitecture == sifive_7) \ > + || (riscv_microarchitecture == sifive_p400) \ > || (riscv_microarchitecture == sifive_p600)) > > #define LOGICAL_OP_NON_SHORT_CIRCUIT 0 > diff --git a/gcc/config/riscv/riscv.md b/gcc/config/riscv/riscv.md > index 2a164a03dbd..39b29795cd6 100644 > --- a/gcc/config/riscv/riscv.md > +++ b/gcc/config/riscv/riscv.md > @@ -687,7 +687,7 @@ > ;; Microarchitectures we know how to tune for. > ;; Keep this in sync with enum riscv_microarchitecture. > (define_attr "tune" > - "generic,sifive_7,sifive_p600,generic_ooo" > + "generic,sifive_7,sifive_p400,sifive_p600,generic_ooo" > (const (symbol_ref "((enum attr_tune) riscv_microarchitecture)"))) > > ;; Describe a user's asm statement. > @@ -3850,6 +3850,7 @@ > (include "pic.md") > (include "generic.md") > (include "sifive-7.md") > +(include "sifive-p400.md") > (include "sifive-p600.md") > (include "thead.md") > (include "generic-ooo.md") > diff --git a/gcc/config/riscv/sifive-p400.md b/gcc/config/riscv/sifive-p400.md > new file mode 100644 > index 00000000000..cc244d3c3e6 > --- /dev/null > +++ b/gcc/config/riscv/sifive-p400.md > @@ -0,0 +1,174 @@ > +;; Scheduling description for Sifive p400. > + > +;; Sifive p400 series is a triple-issue, superscalar, out-of-order processor. > + > +;; CPU execution units: > +;; ialu Integer Units: all arithmetic and logic. > +;; > +;; bru Branch Resolution Unit: all branches. > +;; > +;; st Memory Write Unit: all writes to memory. > +;; > +;; ld Memory Read Unit: all reads from memory. 
> +;; > +;; imul Integer Multiply Unit > +;; > +;; idiv Integer Divide Unit > +;; > +;; system System Unit: all coprocessor accesses. > +;; > +;; fpu Floating Point Unit > +;; > +;; fmul Floating Point Multiply Unit > +;; > +;; fdiv Floating Point Divide Unit > + > +;; Four automata are defined to reduce number of states > +;; which a single large automaton will have. > +(define_automaton > "sifive_p400_iex,sifive_p400_fex,sifive_p400_mem,sifive_p400_div") > + > +;; The Sifive p400 has six pipelines: > +;; A-pipe Load, Store > +;; B-pipe ALU, Branch > +;; M-pipe ALU, MUL, DIV and I2F(integer to float instruction) > +;; C-pipe ALU, Conditional move and system for coprocessor accesses > +;; F-pipe FPU, MUL, F2I(float to integer instruction) > +;; FM-pipe FPU, MUL, DIV > + > +(define_cpu_unit "sifive_p400_A" "sifive_p400_mem") > +(define_cpu_unit "sifive_p400_B" "sifive_p400_iex") > +(define_cpu_unit "sifive_p400_M" "sifive_p400_iex") > +(define_cpu_unit "sifive_p400_C" "sifive_p400_iex") > +(define_cpu_unit "sifive_p400_F" "sifive_p400_fex") > +(define_cpu_unit "sifive_p400_FM" "sifive_p400_fex") > + > +;; Load and store unit. > +(define_cpu_unit "sifive_p400_ld" "sifive_p400_mem") > +(define_cpu_unit "sifive_p400_st" "sifive_p400_mem") > + > +;; Branch unit. > +(define_cpu_unit "sifive_p400_bru" "sifive_p400_iex") > + > +;; Integer and multiply unit. > +(define_cpu_unit "sifive_p400_ialu" "sifive_p400_iex") > +(define_cpu_unit "sifive_p400_imul" "sifive_p400_iex") > +(define_cpu_unit "sifive_p400_system" "sifive_p400_iex") > + > +;; Divide unit. > +(define_cpu_unit "sifive_p400_idiv" "sifive_p400_div") > +(define_cpu_unit "sifive_p400_fdiv" "sifive_p400_div") > + > +;; Float and multiply unit. > +(define_cpu_unit "sifive_p400_fmul" "sifive_p400_fex") > +(define_cpu_unit "sifive_p400_fpu" "sifive_p400_fex") > + > +;; ALU instruction can use pipeline C, B and M. 
> +(define_reservation "p400_int_pipe" > "(sifive_p400_C|sifive_p400_B|sifive_p400_M)") > +;; FPU instruction can use pipeline F and FM. > +(define_reservation "p400_float_pipe" "(sifive_p400_F|sifive_p400_FM)") > + > +(define_insn_reservation "sifive_p400_load" 3 > + (and (eq_attr "tune" "sifive_p400") > + (eq_attr "type" "load")) > + "sifive_p400_A,sifive_p400_ld*2") > + > +(define_insn_reservation "sifive_p400_fpload" 4 > + (and (eq_attr "tune" "sifive_p400") > + (eq_attr "type" "fpload")) > + "sifive_p400_A,sifive_p400_ld*3") > + > +(define_insn_reservation "sifive_p400_store" 1 > + (and (eq_attr "tune" "sifive_p400") > + (eq_attr "type" "store")) > + "sifive_p400_A+sifive_p400_st") > + > +(define_insn_reservation "sifive_p400_fpstore" 1 > + (and (eq_attr "tune" "sifive_p400") > + (eq_attr "type" "fpstore")) > + "sifive_p400_A+sifive_p400_st") > + > +(define_insn_reservation "sifive_p400_branch" 1 > + (and (eq_attr "tune" "sifive_p400") > + (eq_attr "type" "branch,jump,call")) > + "sifive_p400_B+sifive_p400_bru") > + > +(define_insn_reservation "sifive_p400_sfb_alu" 1 > + (and (eq_attr "tune" "sifive_p400") > + (eq_attr "type" "sfb_alu")) > + "sifive_p400_C+sifive_p400_bru+sifive_p400_ialu") > + > +(define_insn_reservation "sifive_p400_atomic" 3 > + (and (eq_attr "tune" "sifive_p400") > + (eq_attr "type" "atomic")) > + "sifive_p400_C,sifive_p400_system*2") > + > +(define_insn_reservation "sifive_p400_mul" 3 > + (and (eq_attr "tune" "sifive_p400") > + (eq_attr "type" "imul")) > + "sifive_p400_M,sifive_p400_imul*2") > + > +(define_insn_reservation "sifive_p400_div" 31 > + (and (eq_attr "tune" "sifive_p400") > + (eq_attr "type" "idiv")) > + "sifive_p400_M, sifive_p400_idiv*5") > + > +(define_insn_reservation "sifive_p400_alu" 1 > + (and (eq_attr "tune" "sifive_p400") > + (eq_attr "type" > "unknown,arith,logical,shift,slt,multi,bitmanip,clz,ctz,rotate")) > + "p400_int_pipe+sifive_p400_ialu") > + > +(define_insn_reservation "sifive_p400_cpop" 3 > + (and (eq_attr 
"tune" "sifive_p400") > + (eq_attr "type" "cpop")) > + "p400_int_pipe,sifive_p400_ialu*2") > + > +(define_insn_reservation "sifive_p400_load_immediate" 1 > + (and (eq_attr "tune" "sifive_p400") > + (eq_attr "type" "nop,const,auipc,move")) > + "p400_int_pipe") > + > +(define_insn_reservation "sifive_p400_fma" 4 > + (and (eq_attr "tune" "sifive_p400") > + (eq_attr "type" "fadd,fmul,fmadd")) > + "p400_float_pipe,sifive_p400_fmul*3") > + > +(define_insn_reservation "sifive_p400_i2f" 2 > + (and (eq_attr "tune" "sifive_p400") > + (eq_attr "type" "mtc,fcvt_i2f")) > + "sifive_p400_M,sifive_p400_ialu") > + > +(define_insn_reservation "sifive_p400_f2i" 2 > + (and (eq_attr "tune" "sifive_p400") > + (eq_attr "type" "mfc,fcmp,fcvt_f2i")) > + "sifive_p400_F,sifive_p400_fpu") > + > +(define_insn_reservation "sifive_p400_fmove" 2 > + (and (eq_attr "tune" "sifive_p400") > + (eq_attr "type" "fmove,fcvt")) > + "p400_float_pipe,sifive_p400_fpu") > + > +(define_insn_reservation "sifive_p400_fdiv_s" 18 > + (and (eq_attr "tune" "sifive_p400") > + (eq_attr "type" "fdiv,fsqrt") > + (eq_attr "mode" "SF")) > + "sifive_p400_FM, sifive_p400_fdiv*5") > + > +(define_insn_reservation "sifive_p400_fdiv_d" 31 > + (and (eq_attr "tune" "sifive_p400") > + (eq_attr "type" "fdiv,fsqrt") > + (eq_attr "mode" "DF")) > + "sifive_p400_FM, sifive_p400_fdiv*5") > + > +(define_bypass 1 > "sifive_p400_load,sifive_p400_alu,sifive_p400_mul,sifive_p400_sfb_alu" > + "sifive_p400_alu,sifive_p400_branch") > + > +(define_bypass 1 "sifive_p400_load,sifive_p400_alu,sifive_p400_mul, > + sifive_p400_f2i,sifive_p400_fmove,sifive_p400_sfb_alu" > + "sifive_p400_store" "riscv_store_data_bypass_p") > + > +(define_bypass 1 "sifive_p400_i2f" > + > "sifive_p400_fma,sifive_p400_f2i,sifive_p400_fmove,sifive_p400_fdiv_s,sifive_p400_fdiv_d") > + > +(define_bypass 1 "sifive_p400_f2i" > + "sifive_p400_branch,sifive_p400_sfb_alu,sifive_p400_mul, > + sifive_p400_div,sifive_p400_alu,sifive_p400_cpop") > diff --git a/gcc/doc/invoke.texi 
b/gcc/doc/invoke.texi > index e9c691d63da..f8645822ca4 100644 > --- a/gcc/doc/invoke.texi > +++ b/gcc/doc/invoke.texi > @@ -30714,8 +30714,8 @@ Permissible values for this option are: > @samp{sifive-e20}, @samp{sifive-e21}, > Optimize the output for the given processor, specified by microarchitecture > or > particular CPU name. Permissible values for this option are: @samp{rocket}, > @samp{sifive-3-series}, @samp{sifive-5-series}, @samp{sifive-7-series}, > -@samp{thead-c906}, @samp{size}, @samp{sifive-p600-series}, > -and all valid options for @option{-mcpu=}. > +@samp{thead-c906}, @samp{size}, @samp{sifive-p400-series}, > +@samp{sifive-p600-series}, and all valid options for @option{-mcpu=}. > > When @option{-mtune=} is not specified, use the setting from @option{-mcpu}, > the default is @samp{rocket} if both are not specified. > -- > 2.40.1 >