XTheadVector floating-point scalar move instructions diff from RVV1.0 in the following points: 1. When src width < dst width, RVV1.0 checks whether the input value is a valid NaN-boxed value, in which case the least-significant dst-width bits are used, else the canonical NaN value is used. XTheadVector always use the least-significant bits. 2. different tail elements process policy.
Signed-off-by: Huang Tao <eric.hu...@linux.alibaba.com> --- .../riscv/insn_trans/trans_xtheadvector.c.inc | 59 ++++++++++++++++++- 1 file changed, 57 insertions(+), 2 deletions(-) diff --git a/target/riscv/insn_trans/trans_xtheadvector.c.inc b/target/riscv/insn_trans/trans_xtheadvector.c.inc index a8a1ec7b3f..54ccd933c0 100644 --- a/target/riscv/insn_trans/trans_xtheadvector.c.inc +++ b/target/riscv/insn_trans/trans_xtheadvector.c.inc @@ -2740,14 +2740,69 @@ static bool trans_th_vmv_s_x(DisasContext *s, arg_th_vmv_s_x *a) return false; } +/* Floating-Point Scalar Move Instructions */ +static bool trans_th_vfmv_f_s(DisasContext *s, arg_th_vfmv_f_s *a) +{ + if (require_xtheadvector(s) && + !s->vill && has_ext(s, RVF) && + (s->mstatus_fs != 0) && + (s->sew != 0)) { + unsigned int len = 8 << s->sew; + + th_element_loadi(s, cpu_fpr[a->rd], a->rs2, 0); + if (len < 64) { + tcg_gen_ori_i64(cpu_fpr[a->rd], cpu_fpr[a->rd], + MAKE_64BIT_MASK(len, 64 - len)); + } + + mark_fs_dirty(s); + tcg_gen_movi_tl(cpu_vstart, 0); + finalize_rvv_inst(s); + return true; + } + return false; +} + +/* vfmv.s.f vd, rs1 # vd[0] = rs1 (vs2=0) */ +static bool trans_th_vfmv_s_f(DisasContext *s, arg_th_vfmv_s_f *a) +{ + if (require_xtheadvector(s) && + !s->vill && has_ext(s, RVF) && + (s->sew != 0)) { + TCGv_i64 t1; + /* The instructions ignore LMUL and vector register group. */ + uint32_t vlmax = s->cfg_ptr->vlenb; + + /* if vl == 0, skip vector register write back */ + TCGLabel *over = gen_new_label(); + tcg_gen_brcond_tl(TCG_COND_GEU, cpu_vstart, cpu_vl, over); + + /* zeroed all elements */ + tcg_gen_gvec_dup_imm(MO_64, vreg_ofs(s, a->rd), vlmax, vlmax, 0); + + /* NaN-box f[rs1] as necessary for SEW */ + t1 = tcg_temp_new_i64(); + if (s->sew == MO_64 && !has_ext(s, RVD)) { + tcg_gen_ori_i64(t1, cpu_fpr[a->rs1], MAKE_64BIT_MASK(32, 32)); + } else { + tcg_gen_mov_i64(t1, cpu_fpr[a->rs1]); + } + th_element_storei(s, a->rd, 0, t1); + + gen_set_label(over); + tcg_gen_movi_tl(cpu_vstart, 0); + finalize_rvv_inst(s); + return true; + } + return false; +} + #define TH_TRANS_STUB(NAME) \ static bool trans_##NAME(DisasContext *s, arg_##NAME *a) \ { \ return require_xtheadvector(s); \ } -TH_TRANS_STUB(th_vfmv_f_s) -TH_TRANS_STUB(th_vfmv_s_f) TH_TRANS_STUB(th_vslideup_vx) TH_TRANS_STUB(th_vslideup_vi) TH_TRANS_STUB(th_vslide1up_vx) -- 2.44.0