On Tue, May 3, 2022 at 9:40 AM ~eopxd <[email protected]> wrote: > > From: eopXD <[email protected]> > > Compares write mask registers, and so always operate under a tail-agnostic policy. > > Signed-off-by: eop Chen <[email protected]> > Reviewed-by: Frank Chang <[email protected]> > Reviewed-by: Weiwei Li <[email protected]>
Acked-by: Alistair Francis <[email protected]> Alistair > --- > target/riscv/vector_helper.c | 18 ++++++++++++++++++ > 1 file changed, 18 insertions(+) > > diff --git a/target/riscv/vector_helper.c b/target/riscv/vector_helper.c > index c1ae2ea2f1..ddaf364573 100644 > --- a/target/riscv/vector_helper.c > +++ b/target/riscv/vector_helper.c > @@ -1373,6 +1373,8 @@ void HELPER(NAME)(void *vd, void *v0, void *vs1, void > *vs2, \ > { \ > uint32_t vm = vext_vm(desc); \ > uint32_t vl = env->vl; \ > + uint32_t total_elems = env_archcpu(env)->cfg.vlen; \ > + uint32_t vta_all_1s = vext_vta_all_1s(desc); \ > uint32_t i; \ > \ > for (i = env->vstart; i < vl; i++) { \ > @@ -1384,6 +1386,13 @@ void HELPER(NAME)(void *vd, void *v0, void *vs1, void > *vs2, \ > vext_set_elem_mask(vd, i, DO_OP(s2, s1)); \ > } \ > env->vstart = 0; \ > + /* mask destination register are always tail-agnostic */ \ > + /* set tail elements to 1s */ \ > + if (vta_all_1s) { \ > + for (; i < total_elems; i++) { \ > + vext_set_elem_mask(vd, i, 1); \ > + } \ > + } \ > } > > GEN_VEXT_CMP_VV(vmseq_vv_b, uint8_t, H1, DO_MSEQ) > @@ -1422,6 +1431,8 @@ void HELPER(NAME)(void *vd, void *v0, target_ulong s1, > void *vs2, \ > { \ > uint32_t vm = vext_vm(desc); \ > uint32_t vl = env->vl; \ > + uint32_t total_elems = env_archcpu(env)->cfg.vlen; \ > + uint32_t vta_all_1s = vext_vta_all_1s(desc); \ > uint32_t i; \ > \ > for (i = env->vstart; i < vl; i++) { \ > @@ -1433,6 +1444,13 @@ void HELPER(NAME)(void *vd, void *v0, target_ulong s1, > void *vs2, \ > DO_OP(s2, (ETYPE)(target_long)s1)); \ > } \ > env->vstart = 0; \ > + /* mask destination register are always tail-agnostic */ \ > + /* set tail elements to 1s */ \ > + if (vta_all_1s) { \ > + for (; i < total_elems; i++) { \ > + vext_set_elem_mask(vd, i, 1); \ > + } \ > + } \ > } > > GEN_VEXT_CMP_VX(vmseq_vx_b, uint8_t, H1, DO_MSEQ) > -- > 2.34.2 > >
