RISC-V: Support scheduling for sifive p600 series
Checks
Commit Message
Add sifive p600 series scheduler module. For more information
see https://www.sifive.com/cores/performance-p650-670.
Add sifive-p650, sifive-p670 for mcpu option will come in separate patches.
gcc/ChangeLog:
* config/riscv/riscv.md: Add "fcvt_i2f", "fcvt_f2i" type
attribute, and include sifive-p600.md.
* config/riscv/generic-ooo.md: Update type attribute.
* config/riscv/sifive-7.md: Update type attribute.
* config/riscv/sifive-p600.md: New file.
* config/riscv/riscv-cores.def (RISCV_TUNE): Add parameter.
* config/riscv/riscv-opts.h (enum riscv_microarchitecture_type):
Add sifive_p600.
* config/riscv/riscv.c (sifive_p600_tune_info): New.
* config/riscv/riscv.h (TARGET_SFB_ALU): Update.
* doc/invoke.texi (RISC-V Options): Add sifive-p600-series
---
gcc/config/riscv/generic-ooo.md | 2 +-
gcc/config/riscv/generic.md | 2 +-
gcc/config/riscv/riscv-cores.def | 1 +
gcc/config/riscv/riscv-opts.h | 1 +
gcc/config/riscv/riscv.cc | 17 +++
gcc/config/riscv/riscv.h | 4 +-
gcc/config/riscv/riscv.md | 19 ++--
gcc/config/riscv/sifive-7.md | 2 +-
gcc/config/riscv/sifive-p600.md | 174 +++++++++++++++++++++++++++++++
gcc/doc/invoke.texi | 3 +-
10 files changed, 212 insertions(+), 13 deletions(-)
create mode 100644 gcc/config/riscv/sifive-p600.md
Comments
> + NULL, /* vector cost */
> +};
Does the P600 series include a vector unit? From what I found on
the web it looks like it. If so I would suggest specifying at least
the default (generic) vector cost model here. We fall back to the
default one for NULL but I find it more explicit to specify one.
> +;; The Sifive 8 has six pipelines:
P600? Is 8 the generation and P600 the official name?
> +(define_insn_reservation "sifive_p600_div" 33
> + (and (eq_attr "tune" "sifive_p600")
> + (eq_attr "type" "idiv"))
> + "sifive_p600_M, sifive_p600_idiv*32")
> +
> +(define_insn_reservation "sifive_p600_fdiv_s" 18
> + (and (eq_attr "tune" "sifive_p600")
> + (eq_attr "type" "fdiv,fsqrt")
> + (eq_attr "mode" "SF"))
> + "sifive_p600_FM, sifive_p600_fdiv*17")
> +
> +(define_insn_reservation "sifive_p600_fdiv_d" 31
> + (and (eq_attr "tune" "sifive_p600")
> + (eq_attr "type" "fdiv,fsqrt")
> + (eq_attr "mode" "DF"))
> + "sifive_p600_FM, sifive_p600_fdiv*30")
I would suggest not to block the units for that long. It will
needlessly increase the automata's complexity causing longer build
times. Even if you want to keep the latency high (doubtful if
that's beneficial in terms of spilling) you could just block the
unit for maybe 3-5 cycles. Up to you in the end, though and not
a blocker.
Regards
Robin
I recently committed changes modifying the scheduling reservations. Some
things may need to be retested with the newly enabled asserts.
Edwin
On 1/31/2024 1:40 AM, Monk Chiang wrote:
> Add sifive p600 series scheduler module. For more information
> see https://www.sifive.com/cores/performance-p650-670.
> Add sifive-p650, sifive-p670 for mcpu option will come in separate patches.
>
> gcc/ChangeLog:
> * config/riscv/riscv.md: Add "fcvt_i2f", "fcvt_f2i" type
> attribute, and include sifive-p600.md.
> * config/riscv/generic-ooo.md: Update type attribute.
> * config/riscv/sifive-7.md: Update type attribute.
> * config/riscv/sifive-p600.md: New file.
> * config/riscv/riscv-cores.def (RISCV_TUNE): Add parameter.
> * config/riscv/riscv-opts.h (enum riscv_microarchitecture_type):
> Add sifive_p600.
> * config/riscv/riscv.c (sifive_p600_tune_info): New.
> * config/riscv/riscv.h (TARGET_SFB_ALU): Update.
> * doc/invoke.texi (RISC-V Options): Add sifive-p600-series
> ---
> gcc/config/riscv/generic-ooo.md | 2 +-
> gcc/config/riscv/generic.md | 2 +-
> gcc/config/riscv/riscv-cores.def | 1 +
> gcc/config/riscv/riscv-opts.h | 1 +
> gcc/config/riscv/riscv.cc | 17 +++
> gcc/config/riscv/riscv.h | 4 +-
> gcc/config/riscv/riscv.md | 19 ++--
> gcc/config/riscv/sifive-7.md | 2 +-
> gcc/config/riscv/sifive-p600.md | 174 +++++++++++++++++++++++++++++++
> gcc/doc/invoke.texi | 3 +-
> 10 files changed, 212 insertions(+), 13 deletions(-)
> create mode 100644 gcc/config/riscv/sifive-p600.md
>
> diff --git a/gcc/config/riscv/generic-ooo.md b/gcc/config/riscv/generic-ooo.md
> index 421a7bb929d..a22f8a3e079 100644
> --- a/gcc/config/riscv/generic-ooo.md
> +++ b/gcc/config/riscv/generic-ooo.md
> @@ -127,7 +127,7 @@
>
> (define_insn_reservation "generic_ooo_fcvt" 3
> (and (eq_attr "tune" "generic_ooo")
> - (eq_attr "type" "fcvt"))
> + (eq_attr "type" "fcvt,fcvt_i2f,fcvt_f2i"))
> "generic_ooo_issue,generic_ooo_fxu")
>
> (define_insn_reservation "generic_ooo_fcmp" 2
> diff --git a/gcc/config/riscv/generic.md b/gcc/config/riscv/generic.md
> index b99ae345bb3..3f0eaa2ea08 100644
> --- a/gcc/config/riscv/generic.md
> +++ b/gcc/config/riscv/generic.md
> @@ -42,7 +42,7 @@
>
> (define_insn_reservation "generic_xfer" 3
> (and (eq_attr "tune" "generic")
> - (eq_attr "type" "mfc,mtc,fcvt,fmove,fcmp"))
> + (eq_attr "type" "mfc,mtc,fcvt,fcvt_i2f,fcvt_f2i,fmove,fcmp"))
> "alu")
>
> (define_insn_reservation "generic_branch" 1
> diff --git a/gcc/config/riscv/riscv-cores.def b/gcc/config/riscv/riscv-cores.def
> index b30f4dfb08e..a07a79e2cb7 100644
> --- a/gcc/config/riscv/riscv-cores.def
> +++ b/gcc/config/riscv/riscv-cores.def
> @@ -37,6 +37,7 @@ RISCV_TUNE("rocket", generic, rocket_tune_info)
> RISCV_TUNE("sifive-3-series", generic, rocket_tune_info)
> RISCV_TUNE("sifive-5-series", generic, rocket_tune_info)
> RISCV_TUNE("sifive-7-series", sifive_7, sifive_7_tune_info)
> +RISCV_TUNE("sifive-p600-series", sifive_p600, sifive_p600_tune_info)
> RISCV_TUNE("thead-c906", generic, thead_c906_tune_info)
> RISCV_TUNE("generic-ooo", generic_ooo, generic_ooo_tune_info)
> RISCV_TUNE("size", generic, optimize_size_tune_info)
> diff --git a/gcc/config/riscv/riscv-opts.h b/gcc/config/riscv/riscv-opts.h
> index 1500f8811ef..25951665b13 100644
> --- a/gcc/config/riscv/riscv-opts.h
> +++ b/gcc/config/riscv/riscv-opts.h
> @@ -55,6 +55,7 @@ extern enum riscv_isa_spec_class riscv_isa_spec;
> enum riscv_microarchitecture_type {
> generic,
> sifive_7,
> + sifive_p600,
> generic_ooo
> };
> extern enum riscv_microarchitecture_type riscv_microarchitecture;
> diff --git a/gcc/config/riscv/riscv.cc b/gcc/config/riscv/riscv.cc
> index 7b6111aa545..92d6fd5cf47 100644
> --- a/gcc/config/riscv/riscv.cc
> +++ b/gcc/config/riscv/riscv.cc
> @@ -447,6 +447,23 @@ static const struct riscv_tune_param sifive_7_tune_info = {
> NULL, /* vector cost */
> };
>
> +/* Costs to use when optimizing for Sifive p600 Series. */
> +static const struct riscv_tune_param sifive_p600_tune_info = {
> + {COSTS_N_INSNS (4), COSTS_N_INSNS (4)}, /* fp_add */
> + {COSTS_N_INSNS (4), COSTS_N_INSNS (4)}, /* fp_mul */
> + {COSTS_N_INSNS (20), COSTS_N_INSNS (20)}, /* fp_div */
> + {COSTS_N_INSNS (4), COSTS_N_INSNS (4)}, /* int_mul */
> + {COSTS_N_INSNS (6), COSTS_N_INSNS (6)}, /* int_div */
> + 4, /* issue_rate */
> + 4, /* branch_cost */
> + 3, /* memory_cost */
> + 4, /* fmv_cost */
> + true, /* slow_unaligned_access */
> + false, /* use_divmod_expansion */
> + RISCV_FUSE_LUI_ADDI | RISCV_FUSE_AUIPC_ADDI, /* fusible_ops */
> + NULL, /* vector cost */
> +};
> +
> /* Costs to use when optimizing for T-HEAD c906. */
> static const struct riscv_tune_param thead_c906_tune_info = {
> {COSTS_N_INSNS (4), COSTS_N_INSNS (5)}, /* fp_add */
> diff --git a/gcc/config/riscv/riscv.h b/gcc/config/riscv/riscv.h
> index 627eba12548..e0cb3ba08d4 100644
> --- a/gcc/config/riscv/riscv.h
> +++ b/gcc/config/riscv/riscv.h
> @@ -896,7 +896,9 @@ extern enum riscv_cc get_riscv_cc (const rtx use);
> SLT[I][U], AND[I], XOR[I], OR[I], LUI, AUIPC, and their compressed
> counterparts, including C.MV and C.LI) can be in the branch shadow. */
>
> -#define TARGET_SFB_ALU (riscv_microarchitecture == sifive_7)
> +#define TARGET_SFB_ALU \
> + ((riscv_microarchitecture == sifive_7) \
> + || (riscv_microarchitecture == sifive_p600))
>
> #define LOGICAL_OP_NON_SHORT_CIRCUIT 0
>
> diff --git a/gcc/config/riscv/riscv.md b/gcc/config/riscv/riscv.md
> index edcaec4a786..02aefc76400 100644
> --- a/gcc/config/riscv/riscv.md
> +++ b/gcc/config/riscv/riscv.md
> @@ -314,6 +314,8 @@
> ;; fdiv floating point divide
> ;; fcmp floating point compare
> ;; fcvt floating point convert
> +;; fcvt_i2f integer to floating point convert
> +;; fcvt_f2i floating point to integer convert
> ;; fsqrt floating point square root
> ;; multi multiword sequence (or user asm statements)
> ;; auipc integer addition to PC
> @@ -466,8 +468,8 @@
> (define_attr "type"
> "unknown,branch,jump,jalr,ret,call,load,fpload,store,fpstore,
> mtc,mfc,const,arith,logical,shift,slt,imul,idiv,move,fmove,fadd,fmul,
> - fmadd,fdiv,fcmp,fcvt,fsqrt,multi,auipc,sfb_alu,nop,trap,ghost,bitmanip,
> - rotate,clmul,min,max,minu,maxu,clz,ctz,cpop,
> + fmadd,fdiv,fcmp,fcvt,fcvt_i2f,fcvt_f2i,fsqrt,multi,auipc,sfb_alu,nop,trap,
> + ghost,bitmanip,rotate,clmul,min,max,minu,maxu,clz,ctz,cpop,
> atomic,condmove,cbo,crypto,pushpop,mvpair,zicond,rdvlenb,rdvl,wrvxrm,wrfrm,
> rdfrm,vsetvl,vsetvl_pre,vlde,vste,vldm,vstm,vlds,vsts,
> vldux,vldox,vstux,vstox,vldff,vldr,vstr,
> @@ -685,7 +687,7 @@
> ;; Microarchitectures we know how to tune for.
> ;; Keep this in sync with enum riscv_microarchitecture.
> (define_attr "tune"
> - "generic,sifive_7,generic_ooo"
> + "generic,sifive_7,sifive_p600,generic_ooo"
> (const (symbol_ref "((enum attr_tune) riscv_microarchitecture)")))
>
> ;; Describe a user's asm statement.
> @@ -1973,7 +1975,7 @@
> (match_operand:ANYF 1 "register_operand" " f")))]
> "TARGET_HARD_FLOAT || TARGET_ZFINX"
> "fcvt.<GPR:ifmt>.<ANYF:fmt> %0,%1,rtz"
> - [(set_attr "type" "fcvt")
> + [(set_attr "type" "fcvt_f2i")
> (set_attr "mode" "<ANYF:MODE>")])
>
> (define_insn "fixuns_trunc<ANYF:mode><GPR:mode>2"
> @@ -1982,7 +1984,7 @@
> (match_operand:ANYF 1 "register_operand" " f")))]
> "TARGET_HARD_FLOAT || TARGET_ZFINX"
> "fcvt.<GPR:ifmt>u.<ANYF:fmt> %0,%1,rtz"
> - [(set_attr "type" "fcvt")
> + [(set_attr "type" "fcvt_f2i")
> (set_attr "mode" "<ANYF:MODE>")])
>
> (define_insn "float<GPR:mode><ANYF:mode>2"
> @@ -1991,7 +1993,7 @@
> (match_operand:GPR 1 "reg_or_0_operand" " rJ")))]
> "TARGET_HARD_FLOAT || TARGET_ZFINX"
> "fcvt.<ANYF:fmt>.<GPR:ifmt>\t%0,%z1"
> - [(set_attr "type" "fcvt")
> + [(set_attr "type" "fcvt_i2f")
> (set_attr "mode" "<ANYF:MODE>")])
>
> (define_insn "floatuns<GPR:mode><ANYF:mode>2"
> @@ -2000,7 +2002,7 @@
> (match_operand:GPR 1 "reg_or_0_operand" " rJ")))]
> "TARGET_HARD_FLOAT || TARGET_ZFINX"
> "fcvt.<ANYF:fmt>.<GPR:ifmt>u\t%0,%z1"
> - [(set_attr "type" "fcvt")
> + [(set_attr "type" "fcvt_i2f")
> (set_attr "mode" "<ANYF:MODE>")])
>
> (define_insn "l<rint_pattern><ANYF:mode><GPR:mode>2"
> @@ -2010,7 +2012,7 @@
> RINT))]
> "TARGET_HARD_FLOAT || TARGET_ZFINX"
> "fcvt.<GPR:ifmt>.<ANYF:fmt> %0,%1,<rint_rm>"
> - [(set_attr "type" "fcvt")
> + [(set_attr "type" "fcvt_f2i")
> (set_attr "mode" "<ANYF:MODE>")])
>
> (define_insn "<round_pattern><ANYF:mode>2"
> @@ -3848,6 +3850,7 @@
> (include "pic.md")
> (include "generic.md")
> (include "sifive-7.md")
> +(include "sifive-p600.md")
> (include "thead.md")
> (include "generic-ooo.md")
> (include "vector.md")
> diff --git a/gcc/config/riscv/sifive-7.md b/gcc/config/riscv/sifive-7.md
> index a63394c8c58..48bdba48190 100644
> --- a/gcc/config/riscv/sifive-7.md
> +++ b/gcc/config/riscv/sifive-7.md
> @@ -81,7 +81,7 @@
>
> (define_insn_reservation "sifive_7_fp_other" 3
> (and (eq_attr "tune" "sifive_7")
> - (eq_attr "type" "fcvt,fcmp,fmove"))
> + (eq_attr "type" "fcvt,fcvt_i2f,fcvt_f2i,fcmp,fmove"))
> "sifive_7_B")
>
> (define_insn_reservation "sifive_7_fdiv_s" 27
> diff --git a/gcc/config/riscv/sifive-p600.md b/gcc/config/riscv/sifive-p600.md
> new file mode 100644
> index 00000000000..1529d1b743c
> --- /dev/null
> +++ b/gcc/config/riscv/sifive-p600.md
> @@ -0,0 +1,174 @@
> +;; Scheduling description for Sifive p600 series.
> +
> +;; Sifive p600 series is a triple-issue, superscalar, out-of-order processor.
> +
> +;; CPU execution units:
> +;; ialu Integer Units: all arithmetic and logic.
> +;;
> +;; bru Branch Resolution Unit: all branches.
> +;;
> +;; st Memory Write Unit: all writes to memory.
> +;;
> +;; ld Memory Read Unit: all reads from memory.
> +;;
> +;; imul Integer Multiply Unit
> +;;
> +;; idiv Integer Divide Unit
> +;;
> +;; system System Unit: all coprocessor accesses.
> +;;
> +;; fpu Floating Point Unit
> +;;
> +;; fmul Floating Point Multiply Unit
> +;;
> +;; fdiv Floating Point Divide Unit
> +
> +;; Four automata are defined to reduce number of states
> +;; which a single large automaton will have.
> +(define_automaton "sifive_p600_iex,sifive_p600_fex,sifive_p600_mem,sifive_p600_div")
> +
> +;; The Sifive 8 has six pipelines:
> +;; A-pipe Load, Store
> +;; B-pipe ALU, Branch
> +;; M-pipe ALU, MUL, DIV and I2F(integer to float instruction)
> +;; C-pipe ALU, Conditional move and system for coprocessor accesses
> +;; F-pipe FPU, MUL, F2I(float to integer instruction)
> +;; FM-pipe FPU, MUL, DIV
> +
> +(define_cpu_unit "sifive_p600_A" "sifive_p600_mem")
> +(define_cpu_unit "sifive_p600_B" "sifive_p600_iex")
> +(define_cpu_unit "sifive_p600_M" "sifive_p600_iex")
> +(define_cpu_unit "sifive_p600_C" "sifive_p600_iex")
> +(define_cpu_unit "sifive_p600_F" "sifive_p600_fex")
> +(define_cpu_unit "sifive_p600_FM" "sifive_p600_fex")
> +
> +;; Load and store unit.
> +(define_cpu_unit "sifive_p600_ld" "sifive_p600_mem")
> +(define_cpu_unit "sifive_p600_st" "sifive_p600_mem")
> +
> +;; Branch unit.
> +(define_cpu_unit "sifive_p600_bru" "sifive_p600_iex")
> +
> +;; Integer and multiply unit.
> +(define_cpu_unit "sifive_p600_ialu" "sifive_p600_iex")
> +(define_cpu_unit "sifive_p600_imul" "sifive_p600_iex")
> +(define_cpu_unit "sifive_p600_system" "sifive_p600_iex")
> +
> +;; Divide unit.
> +(define_cpu_unit "sifive_p600_idiv" "sifive_p600_div")
> +(define_cpu_unit "sifive_p600_fdiv" "sifive_p600_div")
> +
> +;; Float and multiply unit.
> +(define_cpu_unit "sifive_p600_fmul" "sifive_p600_fex")
> +(define_cpu_unit "sifive_p600_fpu" "sifive_p600_fex")
> +
> +;; ALU instruction can use pipeline C, B and M.
> +(define_reservation "int_pipe" "(sifive_p600_C|sifive_p600_B|sifive_p600_M)")
> +;; FPU instruction can use pipeline F and FM.
> +(define_reservation "float_pipe" "(sifive_p600_F|sifive_p600_FM)")
> +
> +(define_insn_reservation "sifive_p600_load" 3
> + (and (eq_attr "tune" "sifive_p600")
> + (eq_attr "type" "load"))
> + "sifive_p600_A,sifive_p600_ld*2")
> +
> +(define_insn_reservation "sifive_p600_fpload" 4
> + (and (eq_attr "tune" "sifive_p600")
> + (eq_attr "type" "fpload"))
> + "sifive_p600_A,sifive_p600_ld*3")
> +
> +(define_insn_reservation "sifive_p600_store" 1
> + (and (eq_attr "tune" "sifive_p600")
> + (eq_attr "type" "store"))
> + "sifive_p600_A+sifive_p600_st")
> +
> +(define_insn_reservation "sifive_p600_fpstore" 1
> + (and (eq_attr "tune" "sifive_p600")
> + (eq_attr "type" "fpstore"))
> + "sifive_p600_A+sifive_p600_st")
> +
> +(define_insn_reservation "sifive_p600_branch" 1
> + (and (eq_attr "tune" "sifive_p600")
> + (eq_attr "type" "branch,jump,call"))
> + "sifive_p600_B+sifive_p600_bru")
> +
> +(define_insn_reservation "sifive_p600_sfb_alu" 1
> + (and (eq_attr "tune" "sifive_p600")
> + (eq_attr "type" "sfb_alu"))
> + "sifive_p600_C+sifive_p600_bru+sifive_p600_ialu")
> +
> +(define_insn_reservation "sifive_p600_atomic" 3
> + (and (eq_attr "tune" "sifive_p600")
> + (eq_attr "type" "atomic"))
> + "sifive_p600_C,sifive_p600_system*2")
> +
> +(define_insn_reservation "sifive_p600_mul" 3
> + (and (eq_attr "tune" "sifive_p600")
> + (eq_attr "type" "imul"))
> + "sifive_p600_M,sifive_p600_imul*2")
> +
> +(define_insn_reservation "sifive_p600_div" 33
> + (and (eq_attr "tune" "sifive_p600")
> + (eq_attr "type" "idiv"))
> + "sifive_p600_M, sifive_p600_idiv*32")
> +
> +(define_insn_reservation "sifive_p600_alu" 1
> + (and (eq_attr "tune" "sifive_p600")
> + (eq_attr "type" "unknown,arith,logical,shift,slt,multi,bitmanip,clz,ctz,rotate"))
> + "int_pipe+sifive_p600_ialu")
> +
> +(define_insn_reservation "sifive_p600_cpop" 3
> + (and (eq_attr "tune" "sifive_p600")
> + (eq_attr "type" "cpop"))
> + "int_pipe,sifive_p600_ialu*2")
> +
> +(define_insn_reservation "sifive_p600_load_immediate" 1
> + (and (eq_attr "tune" "sifive_p600")
> + (eq_attr "type" "nop,const,auipc,move"))
> + "int_pipe")
> +
> +(define_insn_reservation "sifive_p600_fma" 4
> + (and (eq_attr "tune" "sifive_p600")
> + (eq_attr "type" "fadd,fmul,fmadd"))
> + "float_pipe,sifive_p600_fmul*3")
> +
> +(define_insn_reservation "sifive_p600_i2f" 2
> + (and (eq_attr "tune" "sifive_p600")
> + (eq_attr "type" "mtc,fcvt_i2f"))
> + "sifive_p600_M,sifive_p600_ialu")
> +
> +(define_insn_reservation "sifive_p600_f2i" 2
> + (and (eq_attr "tune" "sifive_p600")
> + (eq_attr "type" "mfc,fcmp,fcvt_f2i"))
> + "sifive_p600_F,sifive_p600_fpu")
> +
> +(define_insn_reservation "sifive_p600_fmove" 2
> + (and (eq_attr "tune" "sifive_p600")
> + (eq_attr "type" "fmove,fcvt"))
> + "float_pipe,sifive_p600_fpu")
> +
> +(define_insn_reservation "sifive_p600_fdiv_s" 18
> + (and (eq_attr "tune" "sifive_p600")
> + (eq_attr "type" "fdiv,fsqrt")
> + (eq_attr "mode" "SF"))
> + "sifive_p600_FM, sifive_p600_fdiv*17")
> +
> +(define_insn_reservation "sifive_p600_fdiv_d" 31
> + (and (eq_attr "tune" "sifive_p600")
> + (eq_attr "type" "fdiv,fsqrt")
> + (eq_attr "mode" "DF"))
> + "sifive_p600_FM, sifive_p600_fdiv*30")
> +
> +(define_bypass 1 "sifive_p600_load,sifive_p600_alu,sifive_p600_mul,sifive_p600_sfb_alu"
> + "sifive_p600_alu,sifive_p600_branch")
> +
> +(define_bypass 1 "sifive_p600_load,sifive_p600_alu,sifive_p600_mul,
> + sifive_p600_f2i,sifive_p600_fmove,sifive_p600_sfb_alu"
> + "sifive_p600_store" "riscv_store_data_bypass_p")
> +
> +(define_bypass 1 "sifive_p600_i2f"
> + "sifive_p600_fma,sifive_p600_f2i,sifive_p600_fmove,sifive_p600_fdiv_s,sifive_p600_fdiv_d")
> +
> +(define_bypass 1 "sifive_p600_f2i"
> + "sifive_p600_branch,sifive_p600_sfb_alu,sifive_p600_mul,
> + sifive_p600_div,sifive_p600_alu,sifive_p600_cpop")
> diff --git a/gcc/doc/invoke.texi b/gcc/doc/invoke.texi
> index 819a75dfe94..1017f4de8d2 100644
> --- a/gcc/doc/invoke.texi
> +++ b/gcc/doc/invoke.texi
> @@ -30670,7 +30670,8 @@ Permissible values for this option are: @samp{sifive-e20}, @samp{sifive-e21},
> Optimize the output for the given processor, specified by microarchitecture or
> particular CPU name. Permissible values for this option are: @samp{rocket},
> @samp{sifive-3-series}, @samp{sifive-5-series}, @samp{sifive-7-series},
> -@samp{thead-c906}, @samp{size}, and all valid options for @option{-mcpu=}.
> +@samp{thead-c906}, @samp{size}, @samp{sifive-p600-series},
> +and all valid options for @option{-mcpu=}.
>
> When @option{-mtune=} is not specified, use the setting from @option{-mcpu},
> the default is @samp{rocket} if both are not specified.
Thanks, I will push a V2 patch, to fix the typo and add a vector cost model
for p600 series.
About block the div units, I decided to use your suggestion. The P600
series
divider is 4 bits per cycle. So blocking 3-5 cycles is enough.
On Thu, Feb 1, 2024 at 9:50 AM Edwin Lu <ewlu@rivosinc.com> wrote:
> I recently committed changes modifying the scheduling reservations. Some
> things may need to be retested with the newly enabled asserts.
>
> Edwin
>
> On 1/31/2024 1:40 AM, Monk Chiang wrote:
> > Add sifive p600 series scheduler module. For more information
> > see https://www.sifive.com/cores/performance-p650-670.
> > Add sifive-p650, sifive-p670 for mcpu option will come in separate
> patches.
> >
> > gcc/ChangeLog:
> > * config/riscv/riscv.md: Add "fcvt_i2f", "fcvt_f2i" type
> > attribute, and include sifive-p600.md.
> > * config/riscv/generic-ooo.md: Update type attribute.
> > * config/riscv/sifive-7.md: Update type attribute.
> > * config/riscv/sifive-p600.md: New file.
> > * config/riscv/riscv-cores.def (RISCV_TUNE): Add parameter.
> > * config/riscv/riscv-opts.h (enum riscv_microarchitecture_type):
> > Add sifive_p600.
> > * config/riscv/riscv.c (sifive_p600_tune_info): New.
> > * config/riscv/riscv.h (TARGET_SFB_ALU): Update.
> > * doc/invoke.texi (RISC-V Options): Add sifive-p600-series
> > ---
> > gcc/config/riscv/generic-ooo.md | 2 +-
> > gcc/config/riscv/generic.md | 2 +-
> > gcc/config/riscv/riscv-cores.def | 1 +
> > gcc/config/riscv/riscv-opts.h | 1 +
> > gcc/config/riscv/riscv.cc | 17 +++
> > gcc/config/riscv/riscv.h | 4 +-
> > gcc/config/riscv/riscv.md | 19 ++--
> > gcc/config/riscv/sifive-7.md | 2 +-
> > gcc/config/riscv/sifive-p600.md | 174 +++++++++++++++++++++++++++++++
> > gcc/doc/invoke.texi | 3 +-
> > 10 files changed, 212 insertions(+), 13 deletions(-)
> > create mode 100644 gcc/config/riscv/sifive-p600.md
> >
> > diff --git a/gcc/config/riscv/generic-ooo.md
> b/gcc/config/riscv/generic-ooo.md
> > index 421a7bb929d..a22f8a3e079 100644
> > --- a/gcc/config/riscv/generic-ooo.md
> > +++ b/gcc/config/riscv/generic-ooo.md
> > @@ -127,7 +127,7 @@
> >
> > (define_insn_reservation "generic_ooo_fcvt" 3
> > (and (eq_attr "tune" "generic_ooo")
> > - (eq_attr "type" "fcvt"))
> > + (eq_attr "type" "fcvt,fcvt_i2f,fcvt_f2i"))
> > "generic_ooo_issue,generic_ooo_fxu")
> >
> > (define_insn_reservation "generic_ooo_fcmp" 2
> > diff --git a/gcc/config/riscv/generic.md b/gcc/config/riscv/generic.md
> > index b99ae345bb3..3f0eaa2ea08 100644
> > --- a/gcc/config/riscv/generic.md
> > +++ b/gcc/config/riscv/generic.md
> > @@ -42,7 +42,7 @@
> >
> > (define_insn_reservation "generic_xfer" 3
> > (and (eq_attr "tune" "generic")
> > - (eq_attr "type" "mfc,mtc,fcvt,fmove,fcmp"))
> > + (eq_attr "type" "mfc,mtc,fcvt,fcvt_i2f,fcvt_f2i,fmove,fcmp"))
> > "alu")
> >
> > (define_insn_reservation "generic_branch" 1
> > diff --git a/gcc/config/riscv/riscv-cores.def
> b/gcc/config/riscv/riscv-cores.def
> > index b30f4dfb08e..a07a79e2cb7 100644
> > --- a/gcc/config/riscv/riscv-cores.def
> > +++ b/gcc/config/riscv/riscv-cores.def
> > @@ -37,6 +37,7 @@ RISCV_TUNE("rocket", generic, rocket_tune_info)
> > RISCV_TUNE("sifive-3-series", generic, rocket_tune_info)
> > RISCV_TUNE("sifive-5-series", generic, rocket_tune_info)
> > RISCV_TUNE("sifive-7-series", sifive_7, sifive_7_tune_info)
> > +RISCV_TUNE("sifive-p600-series", sifive_p600, sifive_p600_tune_info)
> > RISCV_TUNE("thead-c906", generic, thead_c906_tune_info)
> > RISCV_TUNE("generic-ooo", generic_ooo, generic_ooo_tune_info)
> > RISCV_TUNE("size", generic, optimize_size_tune_info)
> > diff --git a/gcc/config/riscv/riscv-opts.h
> b/gcc/config/riscv/riscv-opts.h
> > index 1500f8811ef..25951665b13 100644
> > --- a/gcc/config/riscv/riscv-opts.h
> > +++ b/gcc/config/riscv/riscv-opts.h
> > @@ -55,6 +55,7 @@ extern enum riscv_isa_spec_class riscv_isa_spec;
> > enum riscv_microarchitecture_type {
> > generic,
> > sifive_7,
> > + sifive_p600,
> > generic_ooo
> > };
> > extern enum riscv_microarchitecture_type riscv_microarchitecture;
> > diff --git a/gcc/config/riscv/riscv.cc b/gcc/config/riscv/riscv.cc
> > index 7b6111aa545..92d6fd5cf47 100644
> > --- a/gcc/config/riscv/riscv.cc
> > +++ b/gcc/config/riscv/riscv.cc
> > @@ -447,6 +447,23 @@ static const struct riscv_tune_param
> sifive_7_tune_info = {
> > NULL, /* vector cost */
> > };
> >
> > +/* Costs to use when optimizing for Sifive p600 Series. */
> > +static const struct riscv_tune_param sifive_p600_tune_info = {
> > + {COSTS_N_INSNS (4), COSTS_N_INSNS (4)}, /* fp_add */
> > + {COSTS_N_INSNS (4), COSTS_N_INSNS (4)}, /* fp_mul */
> > + {COSTS_N_INSNS (20), COSTS_N_INSNS (20)}, /* fp_div */
> > + {COSTS_N_INSNS (4), COSTS_N_INSNS (4)}, /* int_mul */
> > + {COSTS_N_INSNS (6), COSTS_N_INSNS (6)}, /* int_div */
> > + 4, /* issue_rate */
> > + 4, /* branch_cost */
> > + 3, /* memory_cost */
> > + 4, /* fmv_cost */
> > + true, /*
> slow_unaligned_access */
> > + false, /* use_divmod_expansion */
> > + RISCV_FUSE_LUI_ADDI | RISCV_FUSE_AUIPC_ADDI, /* fusible_ops */
> > + NULL, /* vector cost */
> > +};
> > +
> > /* Costs to use when optimizing for T-HEAD c906. */
> > static const struct riscv_tune_param thead_c906_tune_info = {
> > {COSTS_N_INSNS (4), COSTS_N_INSNS (5)}, /* fp_add */
> > diff --git a/gcc/config/riscv/riscv.h b/gcc/config/riscv/riscv.h
> > index 627eba12548..e0cb3ba08d4 100644
> > --- a/gcc/config/riscv/riscv.h
> > +++ b/gcc/config/riscv/riscv.h
> > @@ -896,7 +896,9 @@ extern enum riscv_cc get_riscv_cc (const rtx use);
> > SLT[I][U], AND[I], XOR[I], OR[I], LUI, AUIPC, and their compressed
> > counterparts, including C.MV and C.LI) can be in the branch
> shadow. */
> >
> > -#define TARGET_SFB_ALU (riscv_microarchitecture == sifive_7)
> > +#define TARGET_SFB_ALU \
> > + ((riscv_microarchitecture == sifive_7) \
> > + || (riscv_microarchitecture == sifive_p600))
> >
> > #define LOGICAL_OP_NON_SHORT_CIRCUIT 0
> >
> > diff --git a/gcc/config/riscv/riscv.md b/gcc/config/riscv/riscv.md
> > index edcaec4a786..02aefc76400 100644
> > --- a/gcc/config/riscv/riscv.md
> > +++ b/gcc/config/riscv/riscv.md
> > @@ -314,6 +314,8 @@
> > ;; fdiv floating point divide
> > ;; fcmp floating point compare
> > ;; fcvt floating point convert
> > +;; fcvt_i2f integer to floating point convert
> > +;; fcvt_f2i floating point to integer convert
> > ;; fsqrt floating point square root
> > ;; multi multiword sequence (or user asm statements)
> > ;; auipc integer addition to PC
> > @@ -466,8 +468,8 @@
> > (define_attr "type"
> > "unknown,branch,jump,jalr,ret,call,load,fpload,store,fpstore,
> >
> mtc,mfc,const,arith,logical,shift,slt,imul,idiv,move,fmove,fadd,fmul,
> > -
> fmadd,fdiv,fcmp,fcvt,fsqrt,multi,auipc,sfb_alu,nop,trap,ghost,bitmanip,
> > - rotate,clmul,min,max,minu,maxu,clz,ctz,cpop,
> > +
> fmadd,fdiv,fcmp,fcvt,fcvt_i2f,fcvt_f2i,fsqrt,multi,auipc,sfb_alu,nop,trap,
> > + ghost,bitmanip,rotate,clmul,min,max,minu,maxu,clz,ctz,cpop,
> >
> atomic,condmove,cbo,crypto,pushpop,mvpair,zicond,rdvlenb,rdvl,wrvxrm,wrfrm,
> > rdfrm,vsetvl,vsetvl_pre,vlde,vste,vldm,vstm,vlds,vsts,
> > vldux,vldox,vstux,vstox,vldff,vldr,vstr,
> > @@ -685,7 +687,7 @@
> > ;; Microarchitectures we know how to tune for.
> > ;; Keep this in sync with enum riscv_microarchitecture.
> > (define_attr "tune"
> > - "generic,sifive_7,generic_ooo"
> > + "generic,sifive_7,sifive_p600,generic_ooo"
> > (const (symbol_ref "((enum attr_tune) riscv_microarchitecture)")))
> >
> > ;; Describe a user's asm statement.
> > @@ -1973,7 +1975,7 @@
> > (match_operand:ANYF 1 "register_operand" " f")))]
> > "TARGET_HARD_FLOAT || TARGET_ZFINX"
> > "fcvt.<GPR:ifmt>.<ANYF:fmt> %0,%1,rtz"
> > - [(set_attr "type" "fcvt")
> > + [(set_attr "type" "fcvt_f2i")
> > (set_attr "mode" "<ANYF:MODE>")])
> >
> > (define_insn "fixuns_trunc<ANYF:mode><GPR:mode>2"
> > @@ -1982,7 +1984,7 @@
> > (match_operand:ANYF 1 "register_operand" " f")))]
> > "TARGET_HARD_FLOAT || TARGET_ZFINX"
> > "fcvt.<GPR:ifmt>u.<ANYF:fmt> %0,%1,rtz"
> > - [(set_attr "type" "fcvt")
> > + [(set_attr "type" "fcvt_f2i")
> > (set_attr "mode" "<ANYF:MODE>")])
> >
> > (define_insn "float<GPR:mode><ANYF:mode>2"
> > @@ -1991,7 +1993,7 @@
> > (match_operand:GPR 1 "reg_or_0_operand" " rJ")))]
> > "TARGET_HARD_FLOAT || TARGET_ZFINX"
> > "fcvt.<ANYF:fmt>.<GPR:ifmt>\t%0,%z1"
> > - [(set_attr "type" "fcvt")
> > + [(set_attr "type" "fcvt_i2f")
> > (set_attr "mode" "<ANYF:MODE>")])
> >
> > (define_insn "floatuns<GPR:mode><ANYF:mode>2"
> > @@ -2000,7 +2002,7 @@
> > (match_operand:GPR 1 "reg_or_0_operand" " rJ")))]
> > "TARGET_HARD_FLOAT || TARGET_ZFINX"
> > "fcvt.<ANYF:fmt>.<GPR:ifmt>u\t%0,%z1"
> > - [(set_attr "type" "fcvt")
> > + [(set_attr "type" "fcvt_i2f")
> > (set_attr "mode" "<ANYF:MODE>")])
> >
> > (define_insn "l<rint_pattern><ANYF:mode><GPR:mode>2"
> > @@ -2010,7 +2012,7 @@
> > RINT))]
> > "TARGET_HARD_FLOAT || TARGET_ZFINX"
> > "fcvt.<GPR:ifmt>.<ANYF:fmt> %0,%1,<rint_rm>"
> > - [(set_attr "type" "fcvt")
> > + [(set_attr "type" "fcvt_f2i")
> > (set_attr "mode" "<ANYF:MODE>")])
> >
> > (define_insn "<round_pattern><ANYF:mode>2"
> > @@ -3848,6 +3850,7 @@
> > (include "pic.md")
> > (include "generic.md")
> > (include "sifive-7.md")
> > +(include "sifive-p600.md")
> > (include "thead.md")
> > (include "generic-ooo.md")
> > (include "vector.md")
> > diff --git a/gcc/config/riscv/sifive-7.md b/gcc/config/riscv/sifive-7.md
> > index a63394c8c58..48bdba48190 100644
> > --- a/gcc/config/riscv/sifive-7.md
> > +++ b/gcc/config/riscv/sifive-7.md
> > @@ -81,7 +81,7 @@
> >
> > (define_insn_reservation "sifive_7_fp_other" 3
> > (and (eq_attr "tune" "sifive_7")
> > - (eq_attr "type" "fcvt,fcmp,fmove"))
> > + (eq_attr "type" "fcvt,fcvt_i2f,fcvt_f2i,fcmp,fmove"))
> > "sifive_7_B")
> >
> > (define_insn_reservation "sifive_7_fdiv_s" 27
> > diff --git a/gcc/config/riscv/sifive-p600.md
> b/gcc/config/riscv/sifive-p600.md
> > new file mode 100644
> > index 00000000000..1529d1b743c
> > --- /dev/null
> > +++ b/gcc/config/riscv/sifive-p600.md
> > @@ -0,0 +1,174 @@
> > +;; Scheduling description for Sifive p600 series.
> > +
> > +;; Sifive p600 series is a triple-issue, superscalar, out-of-order
> processor.
> > +
> > +;; CPU execution units:
> > +;; ialu Integer Units: all arithmetic and logic.
> > +;;
> > +;; bru Branch Resolution Unit: all branches.
> > +;;
> > +;; st Memory Write Unit: all writes to memory.
> > +;;
> > +;; ld Memory Read Unit: all reads from memory.
> > +;;
> > +;; imul Integer Multiply Unit
> > +;;
> > +;; idiv Integer Divide Unit
> > +;;
> > +;; system System Unit: all coprocessor accesses.
> > +;;
> > +;; fpu Floating Point Unit
> > +;;
> > +;; fmul Floating Point Multiply Unit
> > +;;
> > +;; fdiv Floating Point Divide Unit
> > +
> > +;; Four automata are defined to reduce number of states
> > +;; which a single large automaton will have.
> > +(define_automaton
> "sifive_p600_iex,sifive_p600_fex,sifive_p600_mem,sifive_p600_div")
> > +
> > +;; The Sifive 8 has six pipelines:
> > +;; A-pipe Load, Store
> > +;; B-pipe ALU, Branch
> > +;; M-pipe ALU, MUL, DIV and I2F(integer to float instruction)
> > +;; C-pipe ALU, Conditional move and system for coprocessor
> accesses
> > +;; F-pipe FPU, MUL, F2I(float to integer instruction)
> > +;; FM-pipe FPU, MUL, DIV
> > +
> > +(define_cpu_unit "sifive_p600_A" "sifive_p600_mem")
> > +(define_cpu_unit "sifive_p600_B" "sifive_p600_iex")
> > +(define_cpu_unit "sifive_p600_M" "sifive_p600_iex")
> > +(define_cpu_unit "sifive_p600_C" "sifive_p600_iex")
> > +(define_cpu_unit "sifive_p600_F" "sifive_p600_fex")
> > +(define_cpu_unit "sifive_p600_FM" "sifive_p600_fex")
> > +
> > +;; Load and store unit.
> > +(define_cpu_unit "sifive_p600_ld" "sifive_p600_mem")
> > +(define_cpu_unit "sifive_p600_st" "sifive_p600_mem")
> > +
> > +;; Branch unit.
> > +(define_cpu_unit "sifive_p600_bru" "sifive_p600_iex")
> > +
> > +;; Integer and multiply unit.
> > +(define_cpu_unit "sifive_p600_ialu" "sifive_p600_iex")
> > +(define_cpu_unit "sifive_p600_imul" "sifive_p600_iex")
> > +(define_cpu_unit "sifive_p600_system" "sifive_p600_iex")
> > +
> > +;; Divide unit.
> > +(define_cpu_unit "sifive_p600_idiv" "sifive_p600_div")
> > +(define_cpu_unit "sifive_p600_fdiv" "sifive_p600_div")
> > +
> > +;; Float and multiply unit.
> > +(define_cpu_unit "sifive_p600_fmul" "sifive_p600_fex")
> > +(define_cpu_unit "sifive_p600_fpu" "sifive_p600_fex")
> > +
> > +;; ALU instruction can use pipeline C, B and M.
> > +(define_reservation "int_pipe"
> "(sifive_p600_C|sifive_p600_B|sifive_p600_M)")
> > +;; FPU instruction can use pipeline F and FM.
> > +(define_reservation "float_pipe" "(sifive_p600_F|sifive_p600_FM)")
> > +
> > +(define_insn_reservation "sifive_p600_load" 3
> > + (and (eq_attr "tune" "sifive_p600")
> > + (eq_attr "type" "load"))
> > + "sifive_p600_A,sifive_p600_ld*2")
> > +
> > +(define_insn_reservation "sifive_p600_fpload" 4
> > + (and (eq_attr "tune" "sifive_p600")
> > + (eq_attr "type" "fpload"))
> > + "sifive_p600_A,sifive_p600_ld*3")
> > +
> > +(define_insn_reservation "sifive_p600_store" 1
> > + (and (eq_attr "tune" "sifive_p600")
> > + (eq_attr "type" "store"))
> > + "sifive_p600_A+sifive_p600_st")
> > +
> > +(define_insn_reservation "sifive_p600_fpstore" 1
> > + (and (eq_attr "tune" "sifive_p600")
> > + (eq_attr "type" "fpstore"))
> > + "sifive_p600_A+sifive_p600_st")
> > +
> > +(define_insn_reservation "sifive_p600_branch" 1
> > + (and (eq_attr "tune" "sifive_p600")
> > + (eq_attr "type" "branch,jump,call"))
> > + "sifive_p600_B+sifive_p600_bru")
> > +
> > +(define_insn_reservation "sifive_p600_sfb_alu" 1
> > + (and (eq_attr "tune" "sifive_p600")
> > + (eq_attr "type" "sfb_alu"))
> > + "sifive_p600_C+sifive_p600_bru+sifive_p600_ialu")
> > +
> > +(define_insn_reservation "sifive_p600_atomic" 3
> > + (and (eq_attr "tune" "sifive_p600")
> > + (eq_attr "type" "atomic"))
> > + "sifive_p600_C,sifive_p600_system*2")
> > +
> > +(define_insn_reservation "sifive_p600_mul" 3
> > + (and (eq_attr "tune" "sifive_p600")
> > + (eq_attr "type" "imul"))
> > + "sifive_p600_M,sifive_p600_imul*2")
> > +
> > +(define_insn_reservation "sifive_p600_div" 33
> > + (and (eq_attr "tune" "sifive_p600")
> > + (eq_attr "type" "idiv"))
> > + "sifive_p600_M, sifive_p600_idiv*32")
> > +
> > +(define_insn_reservation "sifive_p600_alu" 1
> > + (and (eq_attr "tune" "sifive_p600")
> > + (eq_attr "type"
> "unknown,arith,logical,shift,slt,multi,bitmanip,clz,ctz,rotate"))
> > + "int_pipe+sifive_p600_ialu")
> > +
> > +(define_insn_reservation "sifive_p600_cpop" 3
> > + (and (eq_attr "tune" "sifive_p600")
> > + (eq_attr "type" "cpop"))
> > + "int_pipe,sifive_p600_ialu*2")
> > +
> > +(define_insn_reservation "sifive_p600_load_immediate" 1
> > + (and (eq_attr "tune" "sifive_p600")
> > + (eq_attr "type" "nop,const,auipc,move"))
> > + "int_pipe")
> > +
> > +(define_insn_reservation "sifive_p600_fma" 4
> > + (and (eq_attr "tune" "sifive_p600")
> > + (eq_attr "type" "fadd,fmul,fmadd"))
> > + "float_pipe,sifive_p600_fmul*3")
> > +
> > +(define_insn_reservation "sifive_p600_i2f" 2
> > + (and (eq_attr "tune" "sifive_p600")
> > + (eq_attr "type" "mtc,fcvt_i2f"))
> > + "sifive_p600_M,sifive_p600_ialu")
> > +
> > +(define_insn_reservation "sifive_p600_f2i" 2
> > + (and (eq_attr "tune" "sifive_p600")
> > + (eq_attr "type" "mfc,fcmp,fcvt_f2i"))
> > + "sifive_p600_F,sifive_p600_fpu")
> > +
> > +(define_insn_reservation "sifive_p600_fmove" 2
> > + (and (eq_attr "tune" "sifive_p600")
> > + (eq_attr "type" "fmove,fcvt"))
> > + "float_pipe,sifive_p600_fpu")
> > +
> > +(define_insn_reservation "sifive_p600_fdiv_s" 18
> > + (and (eq_attr "tune" "sifive_p600")
> > + (eq_attr "type" "fdiv,fsqrt")
> > + (eq_attr "mode" "SF"))
> > + "sifive_p600_FM, sifive_p600_fdiv*17")
> > +
> > +(define_insn_reservation "sifive_p600_fdiv_d" 31
> > + (and (eq_attr "tune" "sifive_p600")
> > + (eq_attr "type" "fdiv,fsqrt")
> > + (eq_attr "mode" "DF"))
> > + "sifive_p600_FM, sifive_p600_fdiv*30")
> > +
> > +(define_bypass 1
> "sifive_p600_load,sifive_p600_alu,sifive_p600_mul,sifive_p600_sfb_alu"
> > + "sifive_p600_alu,sifive_p600_branch")
> > +
> > +(define_bypass 1 "sifive_p600_load,sifive_p600_alu,sifive_p600_mul,
> > + sifive_p600_f2i,sifive_p600_fmove,sifive_p600_sfb_alu"
> > + "sifive_p600_store" "riscv_store_data_bypass_p")
> > +
> > +(define_bypass 1 "sifive_p600_i2f"
> > +
> "sifive_p600_fma,sifive_p600_f2i,sifive_p600_fmove,sifive_p600_fdiv_s,sifive_p600_fdiv_d")
> > +
> > +(define_bypass 1 "sifive_p600_f2i"
> > + "sifive_p600_branch,sifive_p600_sfb_alu,sifive_p600_mul,
> > + sifive_p600_div,sifive_p600_alu,sifive_p600_cpop")
> > diff --git a/gcc/doc/invoke.texi b/gcc/doc/invoke.texi
> > index 819a75dfe94..1017f4de8d2 100644
> > --- a/gcc/doc/invoke.texi
> > +++ b/gcc/doc/invoke.texi
> > @@ -30670,7 +30670,8 @@ Permissible values for this option are:
> @samp{sifive-e20}, @samp{sifive-e21},
> > Optimize the output for the given processor, specified by
> microarchitecture or
> > particular CPU name. Permissible values for this option are:
> @samp{rocket},
> > @samp{sifive-3-series}, @samp{sifive-5-series}, @samp{sifive-7-series},
> > -@samp{thead-c906}, @samp{size}, and all valid options for
> @option{-mcpu=}.
> > +@samp{thead-c906}, @samp{size}, @samp{sifive-p600-series},
> > +and all valid options for @option{-mcpu=}.
> >
> > When @option{-mtune=} is not specified, use the setting from
> @option{-mcpu},
> > the default is @samp{rocket} if both are not specified.
>
>
@@ -127,7 +127,7 @@
(define_insn_reservation "generic_ooo_fcvt" 3
(and (eq_attr "tune" "generic_ooo")
- (eq_attr "type" "fcvt"))
+ (eq_attr "type" "fcvt,fcvt_i2f,fcvt_f2i"))
"generic_ooo_issue,generic_ooo_fxu")
(define_insn_reservation "generic_ooo_fcmp" 2
@@ -42,7 +42,7 @@
(define_insn_reservation "generic_xfer" 3
(and (eq_attr "tune" "generic")
- (eq_attr "type" "mfc,mtc,fcvt,fmove,fcmp"))
+ (eq_attr "type" "mfc,mtc,fcvt,fcvt_i2f,fcvt_f2i,fmove,fcmp"))
"alu")
(define_insn_reservation "generic_branch" 1
@@ -37,6 +37,7 @@ RISCV_TUNE("rocket", generic, rocket_tune_info)
RISCV_TUNE("sifive-3-series", generic, rocket_tune_info)
RISCV_TUNE("sifive-5-series", generic, rocket_tune_info)
RISCV_TUNE("sifive-7-series", sifive_7, sifive_7_tune_info)
+RISCV_TUNE("sifive-p600-series", sifive_p600, sifive_p600_tune_info)
RISCV_TUNE("thead-c906", generic, thead_c906_tune_info)
RISCV_TUNE("generic-ooo", generic_ooo, generic_ooo_tune_info)
RISCV_TUNE("size", generic, optimize_size_tune_info)
@@ -55,6 +55,7 @@ extern enum riscv_isa_spec_class riscv_isa_spec;
enum riscv_microarchitecture_type {
generic,
sifive_7,
+ sifive_p600,
generic_ooo
};
extern enum riscv_microarchitecture_type riscv_microarchitecture;
@@ -447,6 +447,23 @@ static const struct riscv_tune_param sifive_7_tune_info = {
NULL, /* vector cost */
};
+/* Costs to use when optimizing for Sifive p600 Series. */
+static const struct riscv_tune_param sifive_p600_tune_info = {
+ {COSTS_N_INSNS (4), COSTS_N_INSNS (4)}, /* fp_add */
+ {COSTS_N_INSNS (4), COSTS_N_INSNS (4)}, /* fp_mul */
+ {COSTS_N_INSNS (20), COSTS_N_INSNS (20)}, /* fp_div */
+ {COSTS_N_INSNS (4), COSTS_N_INSNS (4)}, /* int_mul */
+ {COSTS_N_INSNS (6), COSTS_N_INSNS (6)}, /* int_div */
+ 4, /* issue_rate */
+ 4, /* branch_cost */
+ 3, /* memory_cost */
+ 4, /* fmv_cost */
+ true, /* slow_unaligned_access */
+ false, /* use_divmod_expansion */
+ RISCV_FUSE_LUI_ADDI | RISCV_FUSE_AUIPC_ADDI, /* fusible_ops */
+ NULL, /* vector cost */
+};
+
/* Costs to use when optimizing for T-HEAD c906. */
static const struct riscv_tune_param thead_c906_tune_info = {
{COSTS_N_INSNS (4), COSTS_N_INSNS (5)}, /* fp_add */
@@ -896,7 +896,9 @@ extern enum riscv_cc get_riscv_cc (const rtx use);
SLT[I][U], AND[I], XOR[I], OR[I], LUI, AUIPC, and their compressed
counterparts, including C.MV and C.LI) can be in the branch shadow. */
-#define TARGET_SFB_ALU (riscv_microarchitecture == sifive_7)
+#define TARGET_SFB_ALU \
+ ((riscv_microarchitecture == sifive_7) \
+ || (riscv_microarchitecture == sifive_p600))
#define LOGICAL_OP_NON_SHORT_CIRCUIT 0
@@ -314,6 +314,8 @@
;; fdiv floating point divide
;; fcmp floating point compare
;; fcvt floating point convert
+;; fcvt_i2f integer to floating point convert
+;; fcvt_f2i floating point to integer convert
;; fsqrt floating point square root
;; multi multiword sequence (or user asm statements)
;; auipc integer addition to PC
@@ -466,8 +468,8 @@
(define_attr "type"
"unknown,branch,jump,jalr,ret,call,load,fpload,store,fpstore,
mtc,mfc,const,arith,logical,shift,slt,imul,idiv,move,fmove,fadd,fmul,
- fmadd,fdiv,fcmp,fcvt,fsqrt,multi,auipc,sfb_alu,nop,trap,ghost,bitmanip,
- rotate,clmul,min,max,minu,maxu,clz,ctz,cpop,
+ fmadd,fdiv,fcmp,fcvt,fcvt_i2f,fcvt_f2i,fsqrt,multi,auipc,sfb_alu,nop,trap,
+ ghost,bitmanip,rotate,clmul,min,max,minu,maxu,clz,ctz,cpop,
atomic,condmove,cbo,crypto,pushpop,mvpair,zicond,rdvlenb,rdvl,wrvxrm,wrfrm,
rdfrm,vsetvl,vsetvl_pre,vlde,vste,vldm,vstm,vlds,vsts,
vldux,vldox,vstux,vstox,vldff,vldr,vstr,
@@ -685,7 +687,7 @@
;; Microarchitectures we know how to tune for.
;; Keep this in sync with enum riscv_microarchitecture.
(define_attr "tune"
- "generic,sifive_7,generic_ooo"
+ "generic,sifive_7,sifive_p600,generic_ooo"
(const (symbol_ref "((enum attr_tune) riscv_microarchitecture)")))
;; Describe a user's asm statement.
@@ -1973,7 +1975,7 @@
(match_operand:ANYF 1 "register_operand" " f")))]
"TARGET_HARD_FLOAT || TARGET_ZFINX"
"fcvt.<GPR:ifmt>.<ANYF:fmt> %0,%1,rtz"
- [(set_attr "type" "fcvt")
+ [(set_attr "type" "fcvt_f2i")
(set_attr "mode" "<ANYF:MODE>")])
(define_insn "fixuns_trunc<ANYF:mode><GPR:mode>2"
@@ -1982,7 +1984,7 @@
(match_operand:ANYF 1 "register_operand" " f")))]
"TARGET_HARD_FLOAT || TARGET_ZFINX"
"fcvt.<GPR:ifmt>u.<ANYF:fmt> %0,%1,rtz"
- [(set_attr "type" "fcvt")
+ [(set_attr "type" "fcvt_f2i")
(set_attr "mode" "<ANYF:MODE>")])
(define_insn "float<GPR:mode><ANYF:mode>2"
@@ -1991,7 +1993,7 @@
(match_operand:GPR 1 "reg_or_0_operand" " rJ")))]
"TARGET_HARD_FLOAT || TARGET_ZFINX"
"fcvt.<ANYF:fmt>.<GPR:ifmt>\t%0,%z1"
- [(set_attr "type" "fcvt")
+ [(set_attr "type" "fcvt_i2f")
(set_attr "mode" "<ANYF:MODE>")])
(define_insn "floatuns<GPR:mode><ANYF:mode>2"
@@ -2000,7 +2002,7 @@
(match_operand:GPR 1 "reg_or_0_operand" " rJ")))]
"TARGET_HARD_FLOAT || TARGET_ZFINX"
"fcvt.<ANYF:fmt>.<GPR:ifmt>u\t%0,%z1"
- [(set_attr "type" "fcvt")
+ [(set_attr "type" "fcvt_i2f")
(set_attr "mode" "<ANYF:MODE>")])
(define_insn "l<rint_pattern><ANYF:mode><GPR:mode>2"
@@ -2010,7 +2012,7 @@
RINT))]
"TARGET_HARD_FLOAT || TARGET_ZFINX"
"fcvt.<GPR:ifmt>.<ANYF:fmt> %0,%1,<rint_rm>"
- [(set_attr "type" "fcvt")
+ [(set_attr "type" "fcvt_f2i")
(set_attr "mode" "<ANYF:MODE>")])
(define_insn "<round_pattern><ANYF:mode>2"
@@ -3848,6 +3850,7 @@
(include "pic.md")
(include "generic.md")
(include "sifive-7.md")
+(include "sifive-p600.md")
(include "thead.md")
(include "generic-ooo.md")
(include "vector.md")
@@ -81,7 +81,7 @@
(define_insn_reservation "sifive_7_fp_other" 3
(and (eq_attr "tune" "sifive_7")
- (eq_attr "type" "fcvt,fcmp,fmove"))
+ (eq_attr "type" "fcvt,fcvt_i2f,fcvt_f2i,fcmp,fmove"))
"sifive_7_B")
(define_insn_reservation "sifive_7_fdiv_s" 27
new file mode 100644
@@ -0,0 +1,174 @@
+;; Scheduling description for Sifive p600 series.
+
+;; Sifive p600 series is a triple-issue, superscalar, out-of-order processor.
+
+;; CPU execution units:
+;; ialu Integer Units: all arithmetic and logic.
+;;
+;; bru Branch Resolution Unit: all branches.
+;;
+;; st Memory Write Unit: all writes to memory.
+;;
+;; ld Memory Read Unit: all reads from memory.
+;;
+;; imul Integer Multiply Unit
+;;
+;; idiv Integer Divide Unit
+;;
+;; system System Unit: all coprocessor accesses.
+;;
+;; fpu Floating Point Unit
+;;
+;; fmul Floating Point Multiply Unit
+;;
+;; fdiv Floating Point Divide Unit
+
+;; Four automata are defined to reduce number of states
+;; which a single large automaton will have.
+(define_automaton "sifive_p600_iex,sifive_p600_fex,sifive_p600_mem,sifive_p600_div")
+
+;; The Sifive 8 has six pipelines:
+;; A-pipe Load, Store
+;; B-pipe ALU, Branch
+;; M-pipe ALU, MUL, DIV and I2F(integer to float instruction)
+;; C-pipe ALU, Conditional move and system for coprocessor accesses
+;; F-pipe FPU, MUL, F2I(float to integer instruction)
+;; FM-pipe FPU, MUL, DIV
+
+(define_cpu_unit "sifive_p600_A" "sifive_p600_mem")
+(define_cpu_unit "sifive_p600_B" "sifive_p600_iex")
+(define_cpu_unit "sifive_p600_M" "sifive_p600_iex")
+(define_cpu_unit "sifive_p600_C" "sifive_p600_iex")
+(define_cpu_unit "sifive_p600_F" "sifive_p600_fex")
+(define_cpu_unit "sifive_p600_FM" "sifive_p600_fex")
+
+;; Load and store unit.
+(define_cpu_unit "sifive_p600_ld" "sifive_p600_mem")
+(define_cpu_unit "sifive_p600_st" "sifive_p600_mem")
+
+;; Branch unit.
+(define_cpu_unit "sifive_p600_bru" "sifive_p600_iex")
+
+;; Integer and multiply unit.
+(define_cpu_unit "sifive_p600_ialu" "sifive_p600_iex")
+(define_cpu_unit "sifive_p600_imul" "sifive_p600_iex")
+(define_cpu_unit "sifive_p600_system" "sifive_p600_iex")
+
+;; Divide unit.
+(define_cpu_unit "sifive_p600_idiv" "sifive_p600_div")
+(define_cpu_unit "sifive_p600_fdiv" "sifive_p600_div")
+
+;; Float and multiply unit.
+(define_cpu_unit "sifive_p600_fmul" "sifive_p600_fex")
+(define_cpu_unit "sifive_p600_fpu" "sifive_p600_fex")
+
+;; ALU instruction can use pipeline C, B and M.
+(define_reservation "int_pipe" "(sifive_p600_C|sifive_p600_B|sifive_p600_M)")
+;; FPU instruction can use pipeline F and FM.
+(define_reservation "float_pipe" "(sifive_p600_F|sifive_p600_FM)")
+
+(define_insn_reservation "sifive_p600_load" 3
+ (and (eq_attr "tune" "sifive_p600")
+ (eq_attr "type" "load"))
+ "sifive_p600_A,sifive_p600_ld*2")
+
+(define_insn_reservation "sifive_p600_fpload" 4
+ (and (eq_attr "tune" "sifive_p600")
+ (eq_attr "type" "fpload"))
+ "sifive_p600_A,sifive_p600_ld*3")
+
+(define_insn_reservation "sifive_p600_store" 1
+ (and (eq_attr "tune" "sifive_p600")
+ (eq_attr "type" "store"))
+ "sifive_p600_A+sifive_p600_st")
+
+(define_insn_reservation "sifive_p600_fpstore" 1
+ (and (eq_attr "tune" "sifive_p600")
+ (eq_attr "type" "fpstore"))
+ "sifive_p600_A+sifive_p600_st")
+
+(define_insn_reservation "sifive_p600_branch" 1
+ (and (eq_attr "tune" "sifive_p600")
+ (eq_attr "type" "branch,jump,call"))
+ "sifive_p600_B+sifive_p600_bru")
+
+(define_insn_reservation "sifive_p600_sfb_alu" 1
+ (and (eq_attr "tune" "sifive_p600")
+ (eq_attr "type" "sfb_alu"))
+ "sifive_p600_C+sifive_p600_bru+sifive_p600_ialu")
+
+(define_insn_reservation "sifive_p600_atomic" 3
+ (and (eq_attr "tune" "sifive_p600")
+ (eq_attr "type" "atomic"))
+ "sifive_p600_C,sifive_p600_system*2")
+
+(define_insn_reservation "sifive_p600_mul" 3
+ (and (eq_attr "tune" "sifive_p600")
+ (eq_attr "type" "imul"))
+ "sifive_p600_M,sifive_p600_imul*2")
+
+(define_insn_reservation "sifive_p600_div" 33
+ (and (eq_attr "tune" "sifive_p600")
+ (eq_attr "type" "idiv"))
+ "sifive_p600_M, sifive_p600_idiv*32")
+
+(define_insn_reservation "sifive_p600_alu" 1
+ (and (eq_attr "tune" "sifive_p600")
+ (eq_attr "type" "unknown,arith,logical,shift,slt,multi,bitmanip,clz,ctz,rotate"))
+ "int_pipe+sifive_p600_ialu")
+
+(define_insn_reservation "sifive_p600_cpop" 3
+ (and (eq_attr "tune" "sifive_p600")
+ (eq_attr "type" "cpop"))
+ "int_pipe,sifive_p600_ialu*2")
+
+(define_insn_reservation "sifive_p600_load_immediate" 1
+ (and (eq_attr "tune" "sifive_p600")
+ (eq_attr "type" "nop,const,auipc,move"))
+ "int_pipe")
+
+(define_insn_reservation "sifive_p600_fma" 4
+ (and (eq_attr "tune" "sifive_p600")
+ (eq_attr "type" "fadd,fmul,fmadd"))
+ "float_pipe,sifive_p600_fmul*3")
+
+(define_insn_reservation "sifive_p600_i2f" 2
+ (and (eq_attr "tune" "sifive_p600")
+ (eq_attr "type" "mtc,fcvt_i2f"))
+ "sifive_p600_M,sifive_p600_ialu")
+
+(define_insn_reservation "sifive_p600_f2i" 2
+ (and (eq_attr "tune" "sifive_p600")
+ (eq_attr "type" "mfc,fcmp,fcvt_f2i"))
+ "sifive_p600_F,sifive_p600_fpu")
+
+(define_insn_reservation "sifive_p600_fmove" 2
+ (and (eq_attr "tune" "sifive_p600")
+ (eq_attr "type" "fmove,fcvt"))
+ "float_pipe,sifive_p600_fpu")
+
+(define_insn_reservation "sifive_p600_fdiv_s" 18
+ (and (eq_attr "tune" "sifive_p600")
+ (eq_attr "type" "fdiv,fsqrt")
+ (eq_attr "mode" "SF"))
+ "sifive_p600_FM, sifive_p600_fdiv*17")
+
+(define_insn_reservation "sifive_p600_fdiv_d" 31
+ (and (eq_attr "tune" "sifive_p600")
+ (eq_attr "type" "fdiv,fsqrt")
+ (eq_attr "mode" "DF"))
+ "sifive_p600_FM, sifive_p600_fdiv*30")
+
+(define_bypass 1 "sifive_p600_load,sifive_p600_alu,sifive_p600_mul,sifive_p600_sfb_alu"
+ "sifive_p600_alu,sifive_p600_branch")
+
+(define_bypass 1 "sifive_p600_load,sifive_p600_alu,sifive_p600_mul,
+ sifive_p600_f2i,sifive_p600_fmove,sifive_p600_sfb_alu"
+ "sifive_p600_store" "riscv_store_data_bypass_p")
+
+(define_bypass 1 "sifive_p600_i2f"
+ "sifive_p600_fma,sifive_p600_f2i,sifive_p600_fmove,sifive_p600_fdiv_s,sifive_p600_fdiv_d")
+
+(define_bypass 1 "sifive_p600_f2i"
+ "sifive_p600_branch,sifive_p600_sfb_alu,sifive_p600_mul,
+ sifive_p600_div,sifive_p600_alu,sifive_p600_cpop")
@@ -30670,7 +30670,8 @@ Permissible values for this option are: @samp{sifive-e20}, @samp{sifive-e21},
Optimize the output for the given processor, specified by microarchitecture or
particular CPU name. Permissible values for this option are: @samp{rocket},
@samp{sifive-3-series}, @samp{sifive-5-series}, @samp{sifive-7-series},
-@samp{thead-c906}, @samp{size}, and all valid options for @option{-mcpu=}.
+@samp{thead-c906}, @samp{size}, @samp{sifive-p600-series},
+and all valid options for @option{-mcpu=}.
When @option{-mtune=} is not specified, use the setting from @option{-mcpu},
the default is @samp{rocket} if both are not specified.