[RFC,v3,12/71] target/riscv: rvv-1.0: add fractional LMUL

Message ID	20200806104709.13235-13-frank.chang@sifive.com
State	New
Headers	show Return-Path: <qemu-devel-bounces+incoming=patchwork.ozlabs.org@nongnu.org> From: frank.chang@sifive.com To: qemu-devel@nongnu.org, qemu-riscv@nongnu.org Subject: [RFC v3 12/71] target/riscv: rvv-1.0: add fractional LMUL Date: Thu, 6 Aug 2020 18:46:09 +0800 Message-Id: <20200806104709.13235-13-frank.chang@sifive.com> In-Reply-To: <20200806104709.13235-1-frank.chang@sifive.com> References: <20200806104709.13235-1-frank.chang@sifive.com> Received-SPF: pass client-ip=2607:f8b0:4864:20::102b; envelope-from=frank.chang@sifive.com; helo=mail-pj1-x102b.google.com Precedence: list Cc: Frank Chang <frank.chang@sifive.com>, Alistair Francis <Alistair.Francis@wdc.com>, Palmer Dabbelt <palmer@dabbelt.com>, Sagar Karandikar <sagark@eecs.berkeley.edu>, Bastian Koppelmann <kbastian@mail.uni-paderborn.de> Errors-To: qemu-devel-bounces+incoming=patchwork.ozlabs.org@nongnu.org Sender: "Qemu-devel" <qemu-devel-bounces+incoming=patchwork.ozlabs.org@nongnu.org>
Series	target/riscv: support vector extension v1.0 \| expand [RFC,v3,00/71] target/riscv: support vector extension v1.0 [RFC,v3,01/71] target/riscv: drop vector 0.7.1 and add 1.0 support [RFC,v3,02/71] target/riscv: Use FIELD_EX32() to extract wd field [RFC,v3,03/71] target/riscv: rvv-1.0: add mstatus VS field [RFC,v3,04/71] target/riscv: rvv-1.0: add sstatus VS field [RFC,v3,05/71] target/riscv: rvv-1.0: introduce writable misa.v field [RFC,v3,06/71] target/riscv: rvv-1.0: add translation-time vector context status [RFC,v3,07/71] target/riscv: rvv-1.0: remove vxrm and vxsat fields from fcsr register [RFC,v3,08/71] target/riscv: rvv-1.0: add vcsr register [RFC,v3,09/71] target/riscv: rvv-1.0: add vlenb register [RFC,v3,10/71] target/riscv: rvv-1.0: check MSTATUS_VS when accessing vector csr registers [RFC,v3,11/71] target/riscv: rvv-1.0: remove MLEN calculations [RFC,v3,12/71] target/riscv: rvv-1.0: add fractional LMUL [RFC,v3,13/71] target/riscv: rvv-1.0: add VMA and VTA [RFC,v3,14/71] target/riscv: rvv-1.0: update check functions [RFC,v3,15/71] target/riscv: introduce more imm value modes in translator functions [RFC,v3,16/71] target/riscv: add fp16 nan-box check generator function [RFC,v3,17/71] target/riscv: rvv:1.0: add translation-time nan-box helper function [RFC,v3,18/71] target/riscv: rvv-1.0: apply nanbox helper in opfvf_trans [RFC,v3,19/71] target/riscv: rvv-1.0: configure instructions [RFC,v3,20/71] target/riscv: rvv-1.0: stride load and store instructions [RFC,v3,21/71] target/riscv: rvv-1.0: index load and store instructions [RFC,v3,22/71] target/riscv: rvv-1.0: fix address index overflow bug of indexed load/store insns [RFC,v3,23/71] target/riscv: rvv-1.0: fault-only-first unit stride load [RFC,v3,24/71] target/riscv: rvv-1.0: amo operations [RFC,v3,25/71] target/riscv: rvv-1.0: load/store whole register instructions [RFC,v3,26/71] target/riscv: rvv-1.0: update vext_max_elems() for load/store insns [RFC,v3,27/71] target/riscv: rvv-1.0: take 
fractional LMUL into vector max elements calculation [RFC,v3,28/71] target/riscv: rvv-1.0: floating-point square-root instruction [RFC,v3,29/71] target/riscv: rvv-1.0: floating-point classify instructions [RFC,v3,30/71] target/riscv: rvv-1.0: mask population count instruction [RFC,v3,31/71] target/riscv: rvv-1.0: find-first-set mask bit instruction [RFC,v3,32/71] target/riscv: rvv-1.0: set-X-first mask bit instructions [RFC,v3,33/71] target/riscv: rvv-1.0: iota instruction [RFC,v3,34/71] target/riscv: rvv-1.0: element index instruction [RFC,v3,35/71] target/riscv: rvv-1.0: allow load element with sign-extended [RFC,v3,36/71] target/riscv: rvv-1.0: register gather instructions [RFC,v3,37/71] target/riscv: rvv-1.0: integer scalar move instructions [RFC,v3,38/71] target/riscv: rvv-1.0: floating-point move instruction [RFC,v3,39/71] target/riscv: rvv-1.0: floating-point scalar move instructions [RFC,v3,40/71] target/riscv: rvv-1.0: whole register move instructions [RFC,v3,41/71] target/riscv: rvv-1.0: integer extension instructions [RFC,v3,42/71] target/riscv: rvv-1.0: single-width averaging add and subtract instructions [RFC,v3,43/71] target/riscv: rvv-1.0: single-width bit shift instructions [RFC,v3,44/71] target/riscv: rvv-1.0: integer add-with-carry/subtract-with-borrow [RFC,v3,45/71] target/riscv: rvv-1.0: narrowing integer right shift instructions [RFC,v3,46/71] target/riscv: rvv-1.0: widening integer multiply-add instructions [RFC,v3,47/71] target/riscv: rvv-1.0: add Zvqmac extension [RFC,v3,48/71] target/riscv: rvv-1.0: quad-widening integer multiply-add instructions [RFC,v3,49/71] target/riscv: rvv-1.0: single-width saturating add and subtract instructions [RFC,v3,50/71] target/riscv: rvv-1.0: integer comparison instructions [RFC,v3,51/71] target/riscv: use softfloat lib float16 comparison functions [RFC,v3,52/71] target/riscv: rvv-1.0: floating-point compare instructions [RFC,v3,53/71] target/riscv: rvv-1.0: mask-register logical instructions [RFC,v3,54/71] 
target/riscv: rvv-1.0: slide instructions [RFC,v3,55/71] target/riscv: rvv-1.0: floating-point slide instructions [RFC,v3,56/71] target/riscv: rvv-1.0: narrowing fixed-point clip instructions [RFC,v3,57/71] target/riscv: rvv-1.0: single-width floating-point reduction [RFC,v3,58/71] target/riscv: rvv-1.0: widening floating-point reduction instructions [RFC,v3,59/71] target/riscv: rvv-1.0: single-width scaling shift instructions [RFC,v3,60/71] target/riscv: rvv-1.0: remove widening saturating scaled multiply-add [RFC,v3,61/71] target/riscv: rvv-1.0: remove vmford.vv and vmford.vf [RFC,v3,62/71] target/riscv: rvv-1.0: remove integer extract instruction [RFC,v3,63/71] target/riscv: rvv-1.0: floating-point min/max instructions [RFC,v3,64/71] target/riscv: introduce floating-point rounding mode enum [RFC,v3,65/71] target/riscv: rvv-1.0: floating-point/integer type-convert instructions [RFC,v3,66/71] target/riscv: rvv-1.0: widening floating-point/integer type-convert [RFC,v3,67/71] target/riscv: add "set round to odd" rounding mode helper function [RFC,v3,68/71] target/riscv: rvv-1.0: narrowing floating-point/integer type-convert [RFC,v3,69/71] target/riscv: gdb: modify gdb csr xml file to align with csr register map [RFC,v3,70/71] target/riscv: gdb: support vector registers for rv64 [RFC,v3,71/71] target/riscv: gdb: support vector registers for rv32

Message ID

20200806104709.13235-13-frank.chang@sifive.com

State

New

Headers

From: frank.chang@sifive.com
To: qemu-devel@nongnu.org,
	qemu-riscv@nongnu.org
Subject: [RFC v3 12/71] target/riscv: rvv-1.0: add fractional LMUL
Date: Thu,  6 Aug 2020 18:46:09 +0800
Message-Id: <20200806104709.13235-13-frank.chang@sifive.com>
In-Reply-To: <20200806104709.13235-1-frank.chang@sifive.com>
References: <20200806104709.13235-1-frank.chang@sifive.com>
Received-SPF: pass client-ip=2607:f8b0:4864:20::102b;
 envelope-from=frank.chang@sifive.com; helo=mail-pj1-x102b.google.com
X-Spam_score_int: -20
X-Spam_score: -2.1
X-Spam_bar: --
X-Spam_report: (-2.1 / 5.0 requ) BAYES_00=-1.9, DKIM_SIGNED=0.1,
 DKIM_VALID=-0.1, DKIM_VALID_AU=-0.1, DKIM_VALID_EF=-0.1,
 RCVD_IN_DNSWL_NONE=-0.0001, SPF_HELO_NONE=0.001, SPF_PASS=-0.001,
 URIBL_BLOCKED=0.001 autolearn=unavailable autolearn_force=no
X-Spam_action: no action
X-BeenThere: qemu-devel@nongnu.org
X-Mailman-Version: 2.1.23
Precedence: list
List-Id: <qemu-devel.nongnu.org>
List-Unsubscribe: <https://lists.nongnu.org/mailman/options/qemu-devel>,
 <mailto:qemu-devel-request@nongnu.org?subject=unsubscribe>
List-Archive: <https://lists.nongnu.org/archive/html/qemu-devel>
List-Post: <mailto:qemu-devel@nongnu.org>
List-Help: <mailto:qemu-devel-request@nongnu.org?subject=help>
List-Subscribe: <https://lists.nongnu.org/mailman/listinfo/qemu-devel>,
 <mailto:qemu-devel-request@nongnu.org?subject=subscribe>
Cc: Frank Chang <frank.chang@sifive.com>,
 Alistair Francis <Alistair.Francis@wdc.com>,
 Palmer Dabbelt <palmer@dabbelt.com>,
 Sagar Karandikar <sagark@eecs.berkeley.edu>,
 Bastian Koppelmann <kbastian@mail.uni-paderborn.de>
Errors-To: qemu-devel-bounces+incoming=patchwork.ozlabs.org@nongnu.org
Sender: "Qemu-devel"
 <qemu-devel-bounces+incoming=patchwork.ozlabs.org@nongnu.org>

Series

target/riscv: support vector extension v1.0 | expand

Commit Message

Frank Chang Aug. 6, 2020, 10:46 a.m. UTC

From: Frank Chang <frank.chang@sifive.com>

Introduce the concept of fractional LMUL for RVV 1.0.
In RVV 1.0, the LMUL bits are contiguous in the vtype register.

Signed-off-by: Frank Chang <frank.chang@sifive.com>
---
 target/riscv/cpu.h                      | 15 ++++++++-------
 target/riscv/insn_trans/trans_rvv.inc.c |  9 ++++++---
 target/riscv/translate.c                |  3 +++
 target/riscv/vector_helper.c            | 17 +++++++++++++++--
 4 files changed, 32 insertions(+), 12 deletions(-)

Comments

Richard Henderson Aug. 6, 2020, 6:36 p.m. UTC | #1

On 8/6/20 3:46 AM, frank.chang@sifive.com wrote:
> +    float flmul;

int8_t?  It seems weird that the translator wouldn't also use...

> +/*
> + * Encode LMUL to lmul as following:
> + *     LMUL    vlmul    lmul
> + *      1       000       0
> + *      2       001       1
> + *      4       010       2
> + *      8       011       3
> + *      -       100       -
> + *     1/8      101      -3
> + *     1/4      110      -2
> + *     1/2      111      -1
> + */
> +static inline int32_t vext_lmul(uint32_t desc)
>  {
> -    return FIELD_EX32(simd_data(desc), VDATA, LMUL);
> +    uint32_t lmul = FIELD_EX32(simd_data(desc), VDATA, LMUL);
> +    return (int8_t)(lmul << 5) >> 5;
>  }

... this encoding?

Oh, and sextract32(lmul, 0, 3) instead of those shifts.


r~

Frank Chang Aug. 14, 2020, 3:12 a.m. UTC | #2

On Fri, Aug 7, 2020 at 2:36 AM Richard Henderson <
richard.henderson@linaro.org> wrote:

> On 8/6/20 3:46 AM, frank.chang@sifive.com wrote:
> > +    float flmul;
>
> int8_t?  It seems weird that the translator wouldn't also use...
>

It was kept for vector check functions.
However, I've removed float flmul and changed my
vector check functions to something like:

> static bool vext_check_sss(DisasContext *s, int vd, int vs1,
>                            int vs2, int vm, bool is_vs1)
> {
>     bool ret = require_vm(vm, vd);
>     if (s->lmul > 0) {
>         ret &= require_align(vd, 1 << s->lmul) &&
>                require_align(vs2, 1 << s->lmul);
>         if (is_vs1) {
>             ret &= require_align(vs1, 1 << s->lmul);
>         }
>     }
>     return ret;
> }

which uses shifts to check the alignment/non-overlap of vector registers.

The parameters passed to require_align() and require_noover()
have also been changed to const uint8_t, so that the shifted value
wraps within 8 bits.

The int8_t lmul in DisasContext is also encoded this way:
ctx->lmul = sextract32(FIELD_EX32(tb_flags, TB_FLAGS, LMUL), 0, 3);


> > +/*
> > + * Encode LMUL to lmul as following:
> > + *     LMUL    vlmul    lmul
> > + *      1       000       0
> > + *      2       001       1
> > + *      4       010       2
> > + *      8       011       3
> > + *      -       100       -
> > + *     1/8      101      -3
> > + *     1/4      110      -2
> > + *     1/2      111      -1
> > + */
> > +static inline int32_t vext_lmul(uint32_t desc)
> >  {
> > -    return FIELD_EX32(simd_data(desc), VDATA, LMUL);
> > +    uint32_t lmul = FIELD_EX32(simd_data(desc), VDATA, LMUL);
> > +    return (int8_t)(lmul << 5) >> 5;
> >  }
>
> ... this encoding?
>
> Oh, and sextract32(lmul, 0, 3) instead of those shifts.
>

OK~


>
>
> r~
>

Thanks
Frank Chang

diff --git a/target/riscv/cpu.h b/target/riscv/cpu.h
index 08d2c10a024..d0f9a76ca01 100644
--- a/target/riscv/cpu.h
+++ b/target/riscv/cpu.h
@@ -94,10 +94,10 @@  typedef struct CPURISCVState CPURISCVState;
 
 #define RV_VLEN_MAX 256
 
-FIELD(VTYPE, VLMUL, 0, 2)
-FIELD(VTYPE, VSEW, 2, 3)
-FIELD(VTYPE, VEDIV, 5, 2)
-FIELD(VTYPE, RESERVED, 7, sizeof(target_ulong) * 8 - 9)
+FIELD(VTYPE, VLMUL, 0, 3)
+FIELD(VTYPE, VSEW, 3, 3)
+FIELD(VTYPE, VEDIV, 8, 2)
+FIELD(VTYPE, RESERVED, 10, sizeof(target_ulong) * 8 - 11)
 FIELD(VTYPE, VILL, sizeof(target_ulong) * 8 - 1, 1)
 
 struct CPURISCVState {
@@ -368,9 +368,10 @@  typedef RISCVCPU ArchCPU;
 #include "exec/cpu-all.h"
 
 FIELD(TB_FLAGS, VL_EQ_VLMAX, 2, 1)
-FIELD(TB_FLAGS, LMUL, 3, 2)
-FIELD(TB_FLAGS, SEW, 5, 3)
-FIELD(TB_FLAGS, VILL, 8, 1)
+FIELD(TB_FLAGS, LMUL, 3, 3)
+FIELD(TB_FLAGS, SEW, 6, 3)
+/* Skip MSTATUS_VS (0x600) fields */
+FIELD(TB_FLAGS, VILL, 11, 1)
 
 /*
  * A simplification for VLMAX
diff --git a/target/riscv/insn_trans/trans_rvv.inc.c b/target/riscv/insn_trans/trans_rvv.inc.c
index b529474403e..75aab0a50f9 100644
--- a/target/riscv/insn_trans/trans_rvv.inc.c
+++ b/target/riscv/insn_trans/trans_rvv.inc.c
@@ -1653,7 +1653,8 @@  static bool trans_vmv_v_v(DisasContext *s, arg_vmv_v_v *a)
                              vreg_ofs(s, a->rs1),
                              MAXSZ(s), MAXSZ(s));
         } else {
-            uint32_t data = FIELD_DP32(0, VDATA, LMUL, s->lmul);
+            uint32_t data = 0;
+            data = FIELD_DP32(data, VDATA, LMUL, s->lmul);
             static gen_helper_gvec_2_ptr * const fns[4] = {
                 gen_helper_vmv_v_v_b, gen_helper_vmv_v_v_h,
                 gen_helper_vmv_v_v_w, gen_helper_vmv_v_v_d,
@@ -1691,7 +1692,8 @@  static bool trans_vmv_v_x(DisasContext *s, arg_vmv_v_x *a)
             TCGv_i32 desc ;
             TCGv_i64 s1_i64 = tcg_temp_new_i64();
             TCGv_ptr dest = tcg_temp_new_ptr();
-            uint32_t data = FIELD_DP32(0, VDATA, LMUL, s->lmul);
+            uint32_t data = 0;
+            data = FIELD_DP32(data, VDATA, LMUL, s->lmul);
             static gen_helper_vmv_vx * const fns[4] = {
                 gen_helper_vmv_v_x_b, gen_helper_vmv_v_x_h,
                 gen_helper_vmv_v_x_w, gen_helper_vmv_v_x_d,
@@ -1729,7 +1731,8 @@  static bool trans_vmv_v_i(DisasContext *s, arg_vmv_v_i *a)
             TCGv_i32 desc;
             TCGv_i64 s1;
             TCGv_ptr dest;
-            uint32_t data = FIELD_DP32(0, VDATA, LMUL, s->lmul);
+            uint32_t data = 0;
+            data = FIELD_DP32(data, VDATA, LMUL, s->lmul);
             static gen_helper_vmv_vx * const fns[4] = {
                 gen_helper_vmv_v_x_b, gen_helper_vmv_v_x_h,
                 gen_helper_vmv_v_x_w, gen_helper_vmv_v_x_d,
diff --git a/target/riscv/translate.c b/target/riscv/translate.c
index 7b6088677d4..24026f901d1 100644
--- a/target/riscv/translate.c
+++ b/target/riscv/translate.c
@@ -60,6 +60,7 @@  typedef struct DisasContext {
     /* vector extension */
     bool vill;
     uint8_t lmul;
+    float flmul;
     uint8_t sew;
     uint16_t vlen;
     bool vl_eq_vlmax;
@@ -852,6 +853,8 @@  static void riscv_tr_init_disas_context(DisasContextBase *dcbase, CPUState *cs)
     ctx->vill = FIELD_EX32(tb_flags, TB_FLAGS, VILL);
     ctx->sew = FIELD_EX32(tb_flags, TB_FLAGS, SEW);
     ctx->lmul = FIELD_EX32(tb_flags, TB_FLAGS, LMUL);
+    ctx->flmul = (ctx->lmul < 4) ?
+                    (1 << ctx->lmul) : 1.0f / (1 << (8 - ctx->lmul));
     ctx->vl_eq_vlmax = FIELD_EX32(tb_flags, TB_FLAGS, VL_EQ_VLMAX);
 }
 
diff --git a/target/riscv/vector_helper.c b/target/riscv/vector_helper.c
index f42346cb9ca..4a4c18b8a96 100644
--- a/target/riscv/vector_helper.c
+++ b/target/riscv/vector_helper.c
@@ -86,9 +86,22 @@  static inline uint32_t vext_vm(uint32_t desc)
     return FIELD_EX32(simd_data(desc), VDATA, VM);
 }
 
-static inline uint32_t vext_lmul(uint32_t desc)
+/*
+ * Encode LMUL to lmul as following:
+ *     LMUL    vlmul    lmul
+ *      1       000       0
+ *      2       001       1
+ *      4       010       2
+ *      8       011       3
+ *      -       100       -
+ *     1/8      101      -3
+ *     1/4      110      -2
+ *     1/2      111      -1
+ */
+static inline int32_t vext_lmul(uint32_t desc)
 {
-    return FIELD_EX32(simd_data(desc), VDATA, LMUL);
+    uint32_t lmul = FIELD_EX32(simd_data(desc), VDATA, LMUL);
+    return (int8_t)(lmul << 5) >> 5;
 }
 
 static uint32_t vext_wd(uint32_t desc)

[RFC,v3,12/71] target/riscv: rvv-1.0: add fractional LMUL

Commit Message

Comments

Patch