LGTM juzhe.zh...@rivai.ai <juzhe.zh...@rivai.ai> 於 2023年5月11日 週四 18:36 寫道:
> LGTM. Plz commit it now. Then I can rebase vec_init patch. > > > > juzhe.zh...@rivai.ai > > From: Robin Dapp > Date: 2023-05-11 18:29 > To: Kito Cheng; Palmer Dabbelt > CC: gcc-patches; juzhe.zhong; collison; jeffreyalaw > Subject: [PATCH v2] RISC-V: Clarify vlmax and length handling. > Changes from v1: > - Change subject to RISC-V ;) > - Minor comment updates and rebasing. > > This patch tries to improve the wrappers that emit either vlmax or > non-vlmax operations. Now, emit_len_op can be used to > emit a regular operation. Depending on whether a length != NULL > is passed either no VLMAX flags are set or we emit a vsetvli and > set VLMAX flags. The patch also adds some comments that describes > some of the rationale of the current handling of vlmax/nonvlmax > operations. > > gcc/ChangeLog: > > * config/riscv/autovec.md: Use renamed functions. > * config/riscv/riscv-protos.h (emit_vlmax_op): Rename. > (emit_vlmax_reg_op): To this. > (emit_nonvlmax_op): Rename. > (emit_len_op): To this. > (emit_nonvlmax_binop): Rename. > (emit_len_binop): To this. > * config/riscv/riscv-v.cc (emit_pred_op): Add default parameter. > (emit_pred_binop): Remove vlmax_p. > (emit_vlmax_op): Rename. > (emit_vlmax_reg_op): To this. > (emit_nonvlmax_op): Rename. > (emit_len_op): To this. > (emit_nonvlmax_binop): Rename. > (emit_len_binop): To this. > (sew64_scalar_helper): Use renamed functions. > (expand_tuple_move): Use renamed functions. > * config/riscv/riscv.cc (vector_zero_call_used_regs): Use > renamed functions. > * config/riscv/vector.md: Use renamed functions. > --- > gcc/config/riscv/autovec.md | 26 ++++----- > gcc/config/riscv/riscv-protos.h | 8 +-- > gcc/config/riscv/riscv-v.cc | 94 ++++++++++++++++++++------------- > gcc/config/riscv/riscv.cc | 4 +- > gcc/config/riscv/vector.md | 12 +++-- > 5 files changed, 83 insertions(+), 61 deletions(-) > > diff --git a/gcc/config/riscv/autovec.md b/gcc/config/riscv/autovec.md > index e249f4be704..58926ed3e67 100644 > --- a/gcc/config/riscv/autovec.md > +++ b/gcc/config/riscv/autovec.md > @@ -31,8 +31,8 @@ (define_expand "len_load_<mode>" > (match_operand 3 "const_0_operand")] > "TARGET_VECTOR" > { > - riscv_vector::emit_nonvlmax_op (code_for_pred_mov (<MODE>mode), > operands[0], > - operands[1], operands[2], <VM>mode); > + riscv_vector::emit_len_op (code_for_pred_mov (<MODE>mode), operands[0], > + operands[1], operands[2], <VM>mode); > DONE; > }) > @@ -43,8 +43,8 @@ (define_expand "len_store_<mode>" > (match_operand 3 "const_0_operand")] > "TARGET_VECTOR" > { > - riscv_vector::emit_nonvlmax_op (code_for_pred_mov (<MODE>mode), > operands[0], > - operands[1], operands[2], <VM>mode); > + riscv_vector::emit_len_op (code_for_pred_mov (<MODE>mode), operands[0], > + operands[1], operands[2], <VM>mode); > DONE; > }) > @@ -106,16 +106,16 @@ (define_expand "<optab><mode>3" > { > rtx cst; > gcc_assert (const_vec_duplicate_p(operands[2], &cst)); > - riscv_vector::emit_nonvlmax_binop (code_for_pred_scalar > - (<CODE>, <MODE>mode), > - operands[0], operands[1], cst, > - NULL, <VM>mode, > - <VEL>mode); > + riscv_vector::emit_len_binop (code_for_pred_scalar > + (<CODE>, <MODE>mode), > + operands[0], operands[1], cst, > + NULL, <VM>mode, > + <VEL>mode); > } > else > - riscv_vector::emit_nonvlmax_binop (code_for_pred > - (<CODE>, <MODE>mode), > - operands[0], operands[1], operands[2], > - NULL, <VM>mode); > + riscv_vector::emit_len_binop (code_for_pred > + (<CODE>, <MODE>mode), > + operands[0], operands[1], operands[2], > + NULL, <VM>mode); > DONE; > }) > diff --git a/gcc/config/riscv/riscv-protos.h > b/gcc/config/riscv/riscv-protos.h > index 4d0589e502c..55a43d6270e 100644 > --- a/gcc/config/riscv/riscv-protos.h > +++ b/gcc/config/riscv/riscv-protos.h > @@ -167,10 +167,10 @@ bool legitimize_move (rtx, rtx, machine_mode); > void emit_vlmax_vsetvl (machine_mode, rtx); > void emit_hard_vlmax_vsetvl (machine_mode, rtx); > void emit_vlmax_op (unsigned, rtx, rtx, machine_mode); > -void emit_vlmax_op (unsigned, rtx, rtx, rtx, machine_mode); > -void emit_nonvlmax_op (unsigned, rtx, rtx, rtx, machine_mode); > -void emit_nonvlmax_binop (unsigned, rtx, rtx, rtx, rtx, machine_mode, > - machine_mode = VOIDmode); > +void emit_vlmax_reg_op (unsigned, rtx, rtx, rtx, machine_mode); > +void emit_len_op (unsigned, rtx, rtx, rtx, machine_mode); > +void emit_len_binop (unsigned, rtx, rtx, rtx, rtx, machine_mode, > + machine_mode = VOIDmode); > enum vlmul_type get_vlmul (machine_mode); > unsigned int get_ratio (machine_mode); > unsigned int get_nf (machine_mode); > diff --git a/gcc/config/riscv/riscv-v.cc b/gcc/config/riscv/riscv-v.cc > index 8f46226d571..7cf5ec9f3ba 100644 > --- a/gcc/config/riscv/riscv-v.cc > +++ b/gcc/config/riscv/riscv-v.cc > @@ -99,27 +99,24 @@ public: > add_vundef_operand (dest_mode); > } > - void set_len_and_policy (rtx len, bool vlmax_p) > + void set_len_and_policy (rtx len, bool force_vlmax = false) > { > + bool vlmax_p = force_vlmax; > gcc_assert (has_dest); > - gcc_assert (len || vlmax_p); > - if (len) > - add_input_operand (len, Pmode); > - else > + if (!len) > { > - rtx vlmax = gen_reg_rtx (Pmode); > - emit_vlmax_vsetvl (dest_mode, vlmax); > - add_input_operand (vlmax, Pmode); > + vlmax_p = true; > + len = gen_reg_rtx (Pmode); > + emit_vlmax_vsetvl (dest_mode, len); > } > + add_input_operand (len, Pmode); > + > if (GET_MODE_CLASS (dest_mode) != MODE_VECTOR_BOOL) > add_policy_operand (get_prefer_tail_policy (), get_prefer_mask_policy ()); > - if (vlmax_p) > - add_avl_type_operand (avl_type::VLMAX); > - else > - add_avl_type_operand (avl_type::NONVLMAX); > + add_avl_type_operand (vlmax_p ? avl_type::VLMAX : > avl_type::NONVLMAX); > } > void expand (enum insn_code icode, bool temporary_volatile_p = false) > @@ -232,14 +229,14 @@ autovec_use_vlmax_p (void) > /* Emit an RVV unmask && vl mov from SRC to DEST. */ > static void > emit_pred_op (unsigned icode, rtx mask, rtx dest, rtx src, rtx len, > - machine_mode mask_mode, bool vlmax_p) > + machine_mode mask_mode, bool force_vlmax = false) > { > insn_expander<8> e; > e.set_dest_and_mask (mask, dest, mask_mode); > e.add_input_operand (src, GET_MODE (src)); > - e.set_len_and_policy (len, vlmax_p); > + e.set_len_and_policy (len, force_vlmax); > e.expand ((enum insn_code) icode, MEM_P (dest) || MEM_P (src)); > } > @@ -248,8 +245,8 @@ emit_pred_op (unsigned icode, rtx mask, rtx dest, rtx > src, rtx len, > specified using SCALAR_MODE. */ > static void > emit_pred_binop (unsigned icode, rtx mask, rtx dest, rtx src1, rtx src2, > - rtx len, machine_mode mask_mode, machine_mode scalar_mode, > - bool vlmax_p) > + rtx len, machine_mode mask_mode, > + machine_mode scalar_mode = VOIDmode) > { > insn_expander<9> e; > e.set_dest_and_mask (mask, dest, mask_mode); > @@ -267,37 +264,60 @@ emit_pred_binop (unsigned icode, rtx mask, rtx dest, > rtx src1, rtx src2, > else > e.add_input_operand (src2, scalar_mode); > - e.set_len_and_policy (len, vlmax_p); > + e.set_len_and_policy (len); > e.expand ((enum insn_code) icode, MEM_P (dest) || MEM_P (src1) || MEM_P > (src2)); > } > +/* The RISC-V vsetvli pass uses "known vlmax" operations for optimization. > + Whether or not an instruction actually is a vlmax operation is not > + recognizable from the length operand alone but the avl_type operand > + is used instead. In general, there are two cases: > + > + - Emit a vlmax operation by passing a NULL length. Here we emit > + a vsetvli with vlmax configuration and set the avl_type to VLMAX. > + - Emit an operation that uses the existing (last-set) length and > + set the avl_type to NONVLMAX. > + > + Sometimes we also need to set the VLMAX avl_type to an operation that > + already uses a given length register. This can happen during or after > + register allocation when we are not allowed to create a new register. > + For that case we also allow to set the avl_type to VLMAX. > +*/ > + > +/* This function emits a VLMAX vsetvli followed by the actual operation. > */ > void > emit_vlmax_op (unsigned icode, rtx dest, rtx src, machine_mode mask_mode) > { > - emit_pred_op (icode, NULL_RTX, dest, src, NULL_RTX, mask_mode, true); > + emit_pred_op (icode, NULL_RTX, dest, src, NULL_RTX, mask_mode); > } > +/* This function emits an operation with a given LEN that is determined > + by a previously emitted VLMAX vsetvli. */ > void > -emit_vlmax_op (unsigned icode, rtx dest, rtx src, rtx len, > - machine_mode mask_mode) > +emit_len_op (unsigned icode, rtx dest, rtx src, rtx len, > + machine_mode mask_mode) > { > - emit_pred_op (icode, NULL_RTX, dest, src, len, mask_mode, true); > + emit_pred_op (icode, NULL_RTX, dest, src, len, mask_mode); > } > +/* This function emits an operation with a given LEN that is known to be > + a preceding VLMAX. It also sets the VLMAX flag which allows further > + optimization in the vsetvli pass. */ > void > -emit_nonvlmax_op (unsigned icode, rtx dest, rtx src, rtx len, > - machine_mode mask_mode) > +emit_vlmax_reg_op (unsigned icode, rtx dest, rtx src, rtx len, > + machine_mode mask_mode) > { > - emit_pred_op (icode, NULL_RTX, dest, src, len, mask_mode, false); > + emit_pred_op (icode, NULL_RTX, dest, src, len, mask_mode, > + /* Force VLMAX */ true); > } > void > -emit_nonvlmax_binop (unsigned icode, rtx dest, rtx src1, rtx src2, rtx > len, > - machine_mode mask_mode, machine_mode scalar_mode) > +emit_len_binop (unsigned icode, rtx dest, rtx src1, rtx src2, rtx len, > + machine_mode mask_mode, machine_mode scalar_mode) > { > - emit_pred_binop (icode, NULL_RTX, dest, src1, src2, len, mask_mode, > - scalar_mode, len ? false : true); > + emit_pred_binop (icode, NULL_RTX, dest, src1, src2, len, > + mask_mode, scalar_mode); > } > /* Emit vid.v instruction. */ > @@ -345,14 +365,14 @@ expand_vec_series (rtx dest, rtx base, rtx step) > int shift = exact_log2 (INTVAL (step)); > rtx shift_amount = gen_int_mode (shift, Pmode); > insn_code icode = code_for_pred_scalar (ASHIFT, mode); > - emit_nonvlmax_binop (icode, step_adj, vid, shift_amount, > - NULL, mask_mode, Pmode); > + emit_len_binop (icode, step_adj, vid, shift_amount, > + NULL, mask_mode, Pmode); > } > else > { > insn_code icode = code_for_pred_scalar (MULT, mode); > - emit_nonvlmax_binop (icode, step_adj, vid, step, > - NULL, mask_mode, inner_mode); > + emit_len_binop (icode, step_adj, vid, step, > + NULL, mask_mode, inner_mode); > } > } > @@ -367,7 +387,7 @@ expand_vec_series (rtx dest, rtx base, rtx step) > { > rtx result = gen_reg_rtx (mode); > insn_code icode = code_for_pred_scalar (PLUS, mode); > - emit_nonvlmax_binop (icode, result, step_adj, base, > + emit_len_binop (icode, result, step_adj, base, > NULL, mask_mode, inner_mode); > emit_move_insn (dest, result); > } > @@ -739,8 +759,8 @@ sew64_scalar_helper (rtx *operands, rtx *scalar_op, > rtx vl, > *scalar_op = force_reg (scalar_mode, *scalar_op); > rtx tmp = gen_reg_rtx (vector_mode); > - riscv_vector::emit_nonvlmax_op (code_for_pred_broadcast (vector_mode), > tmp, > - *scalar_op, vl, mask_mode); > + riscv_vector::emit_len_op (code_for_pred_broadcast (vector_mode), tmp, > + *scalar_op, vl, mask_mode); > emit_vector_func (operands, tmp); > return true; > @@ -1046,7 +1066,7 @@ expand_tuple_move (machine_mode mask_mode, rtx *ops) > rtx mem = gen_rtx_MEM (subpart_mode, ops[3]); > if (fractional_p) > - emit_vlmax_op (code_for_pred_mov (subpart_mode), subreg, mem, > + emit_vlmax_reg_op (code_for_pred_mov (subpart_mode), subreg, mem, > ops[4], mask_mode); > else > emit_move_insn (subreg, mem); > @@ -1068,7 +1088,7 @@ expand_tuple_move (machine_mode mask_mode, rtx *ops) > rtx mem = gen_rtx_MEM (subpart_mode, ops[3]); > if (fractional_p) > - emit_vlmax_op (code_for_pred_mov (subpart_mode), mem, subreg, > + emit_vlmax_reg_op (code_for_pred_mov (subpart_mode), mem, subreg, > ops[4], mask_mode); > else > emit_move_insn (mem, subreg); > diff --git a/gcc/config/riscv/riscv.cc b/gcc/config/riscv/riscv.cc > index 02d581589ac..cecb4d49092 100644 > --- a/gcc/config/riscv/riscv.cc > +++ b/gcc/config/riscv/riscv.cc > @@ -7391,8 +7391,8 @@ vector_zero_call_used_regs (HARD_REG_SET > need_zeroed_hardregs) > emitted_vlmax_vsetvl = true; > } > - riscv_vector::emit_vlmax_op (code_for_pred_mov (mode), target, > - CONST0_RTX (mode), vl, mask_mode); > + riscv_vector::emit_vlmax_reg_op (code_for_pred_mov (mode), target, > + CONST0_RTX (mode), vl, mask_mode); > SET_HARD_REG_BIT (zeroed_hardregs, regno); > } > diff --git a/gcc/config/riscv/vector.md b/gcc/config/riscv/vector.md > index 9ccc0d6a513..75479f27bcd 100644 > --- a/gcc/config/riscv/vector.md > +++ b/gcc/config/riscv/vector.md > @@ -721,8 +721,9 @@ (define_insn_and_split "*mov<V_FRACT:mode><P:mode>_lra" > else > { > riscv_vector::emit_vlmax_vsetvl (<V_FRACT:MODE>mode, operands[2]); > - riscv_vector::emit_vlmax_op (code_for_pred_mov (<V_FRACT:MODE>mode), > - operands[0], operands[1], operands[2], <VM>mode); > + riscv_vector::emit_vlmax_reg_op (code_for_pred_mov > (<V_FRACT:MODE>mode), > + operands[0], operands[1], operands[2], > + <VM>mode); > } > DONE; > }) > @@ -741,8 +742,9 @@ (define_insn_and_split "*mov<VB:mode><P:mode>_lra" > else > { > riscv_vector::emit_vlmax_vsetvl (<VB:MODE>mode, operands[2]); > - riscv_vector::emit_vlmax_op (code_for_pred_mov (<VB:MODE>mode), > - operands[0], operands[1], operands[2], <VB:MODE>mode); > + riscv_vector::emit_vlmax_reg_op (code_for_pred_mov (<VB:MODE>mode), > + operands[0], operands[1], operands[2], > + <VB:MODE>mode); > } > DONE; > }) > @@ -806,7 +808,7 @@ (define_expand "vec_duplicate<mode>" > "TARGET_VECTOR" > { > riscv_vector::emit_vlmax_op (code_for_pred_broadcast (<MODE>mode), > - operands[0], operands[1], <VM>mode); > + operands[0], operands[1], <VM>mode); > DONE; > } > ) > -- > 2.40.0 > > > >