Commit 1f4ad39
committed Dec 30, 2024

wip

1 parent 2e8cf99 commit 1f4ad39

4 files changed: +515 -486 lines
‎src/decode.c

Lines changed: 88 additions & 85 deletions
@@ -1982,7 +1982,8 @@ static inline bool op_cfsw(rv_insn_t *ir, const uint32_t insn)
 #define op_cflwsp OP_UNIMP
 #endif /* RV32_HAS(EXT_C) && RV32_HAS(EXT_F) */
 
-static inline bool op_ivv(rv_insn_t *ir, const uint32_t insn) {
+static inline bool op_ivv(rv_insn_t *ir, const uint32_t insn)
+{
 #define MASK 0xfc00707f
 #define MATCH_VADD_VI 0x3057
 #define MATCH_VAND_VI 0x24003057
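
Note on the constants above: MASK 0xfc00707f keeps exactly the fields that distinguish one OP-V arithmetic instruction from another, namely funct6 (bits 31:26), funct3 (bits 14:12) and the major opcode (bits 6:0), so each MATCH_* value is just an instruction word with those fields filled in. A small standalone sketch using the standard RISC-V field positions (the helper name here is illustrative, not part of the commit):

```c
#include <stdint.h>
#include <stdio.h>

/* Break a MATCH_* constant into the fields selected by MASK 0xfc00707f. */
static void explain_match(uint32_t match)
{
    unsigned opcode = match & 0x7f;         /* bits 6:0   */
    unsigned funct3 = (match >> 12) & 0x7;  /* bits 14:12 */
    unsigned funct6 = (match >> 26) & 0x3f; /* bits 31:26 */
    printf("0x%08x -> opcode=0x%02x funct3=%u funct6=0x%02x\n",
           (unsigned) match, opcode, funct3, funct6);
}

int main(void)
{
    explain_match(0x3057);     /* MATCH_VADD_VI: opcode 0x57, funct3 3 (OPIVI), funct6 0x00 */
    explain_match(0x24003057); /* MATCH_VAND_VI: opcode 0x57, funct3 3 (OPIVI), funct6 0x09 */
    return 0;
}
```
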
@@ -2011,74 +2012,74 @@ static inline bool op_ivv(rv_insn_t *ir, const uint32_t insn) {
     ir->rs2 = decode_rs2(insn);
     ir->vm = decode_rvv_vm(insn);
     switch (insn & MASK) {
-    case MATCH_VADD_VI:
+    case MATCH_VADD_VI:
         ir->opcode = rv_insn_vadd_vi;
-        break;
-    case MATCH_VAND_VI:
+        break;
+    case MATCH_VAND_VI:
         ir->opcode = rv_insn_vand_vi;
-        break;
-    case MATCH_VMADC_VI:
+        break;
+    case MATCH_VMADC_VI:
         ir->opcode = rv_insn_vmadc_vi;
-        break;
-    case MATCH_VMSEQ_VI:
+        break;
+    case MATCH_VMSEQ_VI:
         ir->opcode = rv_insn_vmseq_vi;
-        break;
-    case MATCH_VMSGT_VI:
+        break;
+    case MATCH_VMSGT_VI:
         ir->opcode = rv_insn_vmsgt_vi;
-        break;
-    case MATCH_VMSGTU_VI:
+        break;
+    case MATCH_VMSGTU_VI:
         ir->opcode = rv_insn_vmsgtu_vi;
-        break;
-    case MATCH_VMSLE_VI:
+        break;
+    case MATCH_VMSLE_VI:
         ir->opcode = rv_insn_vmsle_vi;
-        break;
-    case MATCH_VMSLEU_VI:
+        break;
+    case MATCH_VMSLEU_VI:
         ir->opcode = rv_insn_vmsleu_vi;
-        break;
-    case MATCH_VMSNE_VI:
+        break;
+    case MATCH_VMSNE_VI:
         ir->opcode = rv_insn_vmsne_vi;
-        break;
-    case MATCH_VOR_VI:
+        break;
+    case MATCH_VOR_VI:
         ir->opcode = rv_insn_vor_vi;
-        break;
-    case MATCH_VRGATHER_VI:
+        break;
+    case MATCH_VRGATHER_VI:
         ir->opcode = rv_insn_vrgather_vi;
-        break;
-    case MATCH_VRSUB_VI:
+        break;
+    case MATCH_VRSUB_VI:
         ir->opcode = rv_insn_vrsub_vi;
-        break;
-    case MATCH_VSADD_VI:
+        break;
+    case MATCH_VSADD_VI:
         ir->opcode = rv_insn_vsadd_vi;
-        break;
-    case MATCH_VSADDU_VI:
+        break;
+    case MATCH_VSADDU_VI:
         ir->opcode = rv_insn_vsaddu_vi;
-        break;
-    case MATCH_VSLIDEDOWN_VI:
+        break;
+    case MATCH_VSLIDEDOWN_VI:
         ir->opcode = rv_insn_vslidedown_vi;
-        break;
-    case MATCH_VSLIDEUP_VI:
+        break;
+    case MATCH_VSLIDEUP_VI:
         ir->opcode = rv_insn_vslideup_vi;
-        break;
-    case MATCH_VSLL_VI:
+        break;
+    case MATCH_VSLL_VI:
         ir->opcode = rv_insn_vsll_vi;
-        break;
-    case MATCH_VSRA_VI:
+        break;
+    case MATCH_VSRA_VI:
         ir->opcode = rv_insn_vsra_vi;
-        break;
-    case MATCH_VSRL_VI:
+        break;
+    case MATCH_VSRL_VI:
         ir->opcode = rv_insn_vsrl_vi;
-        break;
-    case MATCH_VSSRA_VI:
+        break;
+    case MATCH_VSSRA_VI:
         ir->opcode = rv_insn_vssra_vi;
-        break;
-    case MATCH_VSSRL_VI:
+        break;
+    case MATCH_VSSRL_VI:
         ir->opcode = rv_insn_vssrl_vi;
-        break;
-    case MATCH_VXOR_VI:
+        break;
+    case MATCH_VXOR_VI:
         ir->opcode = rv_insn_vxor_vi;
-        break;
-    default:
-        return false;
+        break;
+    default:
+        return false;
     }
 }

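The switch in the hunk above is a one-to-one match-to-opcode mapping. Purely as an illustration of the same decode step (not the commit's code), it could also be driven by a lookup table; the sketch below assumes the surrounding decode.c context, i.e. the rv_insn_t type, MASK, and the MATCH_ and rv_insn_ identifiers that appear in the diff:

```c
/* Illustrative table-driven variant of the *_VI match above; assumes the
 * MASK, MATCH_ and rv_insn_ definitions already present in decode.c. */
typedef struct {
    uint32_t match;  /* value of (insn & MASK) */
    uint32_t opcode; /* corresponding rv_insn_ identifier */
} vi_match_t;

static const vi_match_t vi_table[] = {
    {MATCH_VADD_VI, rv_insn_vadd_vi},
    {MATCH_VAND_VI, rv_insn_vand_vi},
    {MATCH_VXOR_VI, rv_insn_vxor_vi},
    /* ... remaining entries ... */
};

static inline bool match_vi(rv_insn_t *ir, const uint32_t insn)
{
    for (unsigned i = 0; i < sizeof(vi_table) / sizeof(vi_table[0]); i++) {
        if ((insn & MASK) == vi_table[i].match) {
            ir->opcode = vi_table[i].opcode;
            return true;
        }
    }
    return false;
}
```
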
@@ -2090,43 +2091,45 @@ static inline bool op_fvf(rv_insn_t *ir, const uint32_t insn) {}
 static inline bool op_mvx(rv_insn_t *ir, const uint32_t insn) {}
 
 /* OP: RVV
- * opcode is 0x57 for VALU and VCFG
+ * opcode is 0x57 for VALU and VCFG
  *
  * VALU format:
  * 31 26 25 24 20 19 15 14 12 11 7 6 0
- * funct6 | vm | vs2 | vs1 | 0 0 0 (funct3) | vd |1010111| OP-V (OPIVV)
- * funct6 | vm | vs2 | vs1 | 0 0 1 (funct3) | vd/rd |1010111| OP-V (OPFVV)
- * funct6 | vm | vs2 | vs1 | 0 1 0 (funct3) | vd/rd |1010111| OP-V (OPMVV)
- * funct6 | vm | vs2 | imm[4:0] | 0 1 1 (funct3) | vd |1010111| OP-V (OPIVI)
- * funct6 | vm | vs2 | rs1 | 1 0 0 (funct3) | vd |1010111| OP-V (OPIVX)
- * funct6 | vm | vs2 | rs1 | 1 0 1 (funct3) | vd |1010111| OP-V (OPFVF)
- * funct6 | vm | vs2 | rs1 | 1 1 0 (funct3) | vd/rd |1010111| OP-V (OPMVX)
- * 6 1 5 5 3 5 7
- *
+ * funct6 | vm | vs2 | vs1 | 0 0 0 (funct3) | vd |1010111|
+ * OP-V (OPIVV) funct6 | vm | vs2 | vs1 | 0 0 1 (funct3) | vd/rd
+ * |1010111| OP-V (OPFVV) funct6 | vm | vs2 | vs1 | 0 1 0 (funct3)
+ * | vd/rd |1010111| OP-V (OPMVV) funct6 | vm | vs2 | imm[4:0] | 0 1 1
+ * (funct3) | vd |1010111| OP-V (OPIVI) funct6 | vm | vs2 | rs1
+ * | 1 0 0 (funct3) | vd |1010111| OP-V (OPIVX) funct6 | vm | vs2 |
+ * rs1 | 1 0 1 (funct3) | vd |1010111| OP-V (OPFVF) funct6 | vm | vs2
+ * | rs1 | 1 1 0 (funct3) | vd/rd |1010111| OP-V (OPMVX) 6 1 5 5
+ * 3 5 7
+ *
  * Where 'vm' is the bit indicates whether masking is enabled
- * see https://github.com/riscv/riscv-v-spec/blob/master/v-spec.adoc#531-mask-encoding
- *
+ * see
+ * https://github.com/riscv/riscv-v-spec/blob/master/v-spec.adoc#531-mask-encoding
+ *
  * VMEM format:
- *
+ *
  * 31 29 28 27 26 25 24 20 19 15 14 12 11 7 6 0
- * nf | mew| mop | vm | lumop | rs1 | width | vd |0000111| VL* unit-stride
- * nf | mew| mop | vm | rs2 | rs1 | width | vd |0000111| VLS* strided
- * nf | mew| mop | vm | vs2 | rs1 | width | vd |0000111| VLX* indexed
- * 3 1 2 1 5 5 3 5 7
- *
+ * nf | mew| mop | vm | lumop | rs1 | width | vd |0000111| VL*
+ * unit-stride nf | mew| mop | vm | rs2 | rs1 | width | vd
+ * |0000111| VLS* strided nf | mew| mop | vm | vs2 | rs1 | width | vd
+ * |0000111| VLX* indexed 3 1 2 1 5 5 3 5 7
+ *
  * VCFG format:
- *
+ *
  * 31 30 25 24 20 19 15 14 12 11 7 6 0
  * 0 | zimm[10:0] | rs1 | 1 1 1 | rd |1010111| vsetvli
  * 1 | 1| zimm[ 9:0] | uimm[4:0]| 1 1 1 | rd |1010111| vsetivli
 * 1 | 000000 | rs2 | rs1 | 1 1 1 | rd |1010111| vsetvl
 * 1 6 5 5 3 5 7
- *
+ *
 * reference:
 * https://github.com/riscv/riscv-isa-manual/blob/main/src/images/wavedrom/valu-format.edn
 * https://github.com/riscv/riscv-isa-manual/blob/main/src/images/wavedrom/v-inst-table.edn
 * https://observablehq.com/@drom/risc-v-v
- *
+ *
 * funct3
 * | 0 | 0 | 0 | OPIVV | vector-vector | N/A
 * | 0 | 0 | 1 | OPFVV | vector-vector | N/A
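
The VALU layout spelled out in this comment (in its pre-reflow form on the '-' side) maps directly onto shift-and-mask extraction. A minimal sketch with the bit positions from that comment; the helper names are illustrative and are not the decode_* helpers this file actually uses:

```c
#include <stdint.h>

/* OP-V (opcode 0x57) VALU fields, as laid out in the comment above:
 * funct6[31:26] | vm[25] | vs2[24:20] | vs1 or imm[19:15] | funct3[14:12] | vd[11:7] | opcode[6:0] */
static inline uint32_t v_funct6(uint32_t insn) { return (insn >> 26) & 0x3f; }
static inline uint32_t v_vm(uint32_t insn)     { return (insn >> 25) & 0x1; }
static inline uint32_t v_vs2(uint32_t insn)    { return (insn >> 20) & 0x1f; }
static inline uint32_t v_vs1(uint32_t insn)    { return (insn >> 15) & 0x1f; } /* imm[4:0] for OPIVI */
static inline uint32_t v_funct3(uint32_t insn) { return (insn >> 12) & 0x7; }
static inline uint32_t v_vd(uint32_t insn)     { return (insn >> 7) & 0x1f; }
```
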
@@ -2140,22 +2143,22 @@ static inline bool op_v(rv_insn_t *ir, const uint32_t insn)
 {
     uint32_t funct3_mask = 0x7000;
     switch ((insn & funct3_mask) >> 7) {
-    case 0:
-        return op_ivv(ir, insn);
-    case 1:
-        return op_fvv(ir, insn);
-    case 2:
-        return op_mvv(ir, insn);
-    case 3:
-        return op_ivi(ir, insn);
-    case 4:
-        return op_ivx(ir, insn);
-    case 5:
-        return op_fvf(ir, insn);
-    case 6:
-        return op_mvx(ir, insn);
-    default:
-        return false;
+    case 0:
+        return op_ivv(ir, insn);
+    case 1:
+        return op_fvv(ir, insn);
+    case 2:
+        return op_mvv(ir, insn);
+    case 3:
+        return op_ivi(ir, insn);
+    case 4:
+        return op_ivx(ir, insn);
+    case 5:
+        return op_fvf(ir, insn);
+    case 6:
+        return op_mvx(ir, insn);
+    default:
+        return false;
     }
 
     if ((insn & MASK_VSETVLI) == MATCH_VSETVLI) {
@@ -2167,7 +2170,7 @@ static inline bool op_v(rv_insn_t *ir, const uint32_t insn)
         // vsetivli
         ir->rd = (insn >> 7) & 0x1f;
         ir->uimm = (insn >> 15) & 0x1f;
-        ir->zimm = (insn >> 20) & 0x3ff; // zimm[9:0]
+        ir->zimm = (insn >> 20) & 0x3ff; // zimm[9:0]
 
     } else if ((insn & MASK_VSETVL) == MATCH_VSETVL) {
         // vsetvl

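For the VCFG forms in the comment block above, funct3 is fixed at 111 and the configuration immediates sit above rs1: vsetvli carries zimm[10:0] in bits 30:20, while vsetivli carries uimm[4:0] in the rs1 slot and zimm[9:0] in bits 29:20. A standalone sketch of that extraction on a synthetic instruction word (field positions per the table; this is not code from the commit):

```c
#include <stdint.h>
#include <stdio.h>

int main(void)
{
    /* Build a synthetic vsetvli word: opcode 0x57, funct3 111, rd = x10,
     * rs1 = x11, zimm[10:0] = 1 (a vtype value), per the VCFG table above. */
    uint32_t insn = (1u << 20)   /* zimm[10:0]           */
                  | (11u << 15)  /* rs1 (AVL source)     */
                  | (0x7u << 12) /* funct3 = 111         */
                  | (10u << 7)   /* rd                   */
                  | 0x57u;       /* OP-V major opcode    */

    unsigned funct3 = (insn >> 12) & 0x7;  /* bits 14:12 */
    unsigned rd = (insn >> 7) & 0x1f;
    unsigned rs1 = (insn >> 15) & 0x1f;
    unsigned zimm = (insn >> 20) & 0x7ff;  /* zimm[10:0] for vsetvli */

    printf("funct3=%u rd=x%u rs1=x%u zimm=0x%03x\n", funct3, rd, rs1, zimm);
    return 0;
}
```
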
‎src/encoding.h

Lines changed: 357 additions & 346 deletions
Large diffs are not rendered by default.

‎src/riscv_private.h

Lines changed: 4 additions & 4 deletions
@@ -136,10 +136,10 @@ struct riscv_internal {
 #endif
 
 #if RV32_HAS(EXT_RVV)
-#define VLEN 128 // FIXME should not use a const and not even here for VLEN
-    uint8_t V1[(VLEN>>3)];
-    uint8_t V2[(VLEN>>3)];
-    uint8_t Vd[(VLEN>>3)];
+#define VLEN 128 // FIXME should not use a const and not even here for VLEN
+    uint8_t V1[(VLEN >> 3)];
+    uint8_t V2[(VLEN >> 3)];
+    uint8_t Vd[(VLEN >> 3)];
     uint8_t vl; /* current vl size */
     uint8_t lmul;
     uint8_t sew; /* current sew size */
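
With VLEN hard-coded to 128 as in the hunk above, each of V1/V2/Vd is VLEN >> 3 = 16 bytes of storage, and the element capacity of one register follows from the selected SEW (VLMAX = VLEN/SEW at LMUL = 1). A tiny illustration, assuming only the VLEN value shown in the diff:

```c
#include <stdint.h>
#include <stdio.h>

#define VLEN 128 /* bits per vector register, matching the hard-coded value above */

int main(void)
{
    uint8_t reg[VLEN >> 3]; /* 16 bytes, the same sizing used for V1/V2/Vd */
    (void) reg;

    for (unsigned sew = 8; sew <= 64; sew <<= 1)
        printf("SEW=%2u -> %u bytes/element, %u elements per register\n",
               sew, sew / 8, VLEN / sew);
    return 0;
}
```
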

‎src/rv32_vector.c

Lines changed: 66 additions & 51 deletions
@@ -1,67 +1,82 @@
 /* RV32 RVV Instruction Set */
 
 
-RVOP(vsetvli, {
-    // | `vlmul[2:0]` | LMUL | #groups | VLMAX | Registers grouped with register `n` |
-    // |--------------|--------|---------|-----------------|--------------------------------------------------|
-    // | `1 0 0` | - | - | - | Reserved |
-    // | `1 0 1` | `1/8` | 32 | `VLEN/SEW/8` | `v_n` (single register in group) |
-    // | `1 1 0` | `1/4` | 32 | `VLEN/SEW/4` | `v_n` (single register in group) |
-    // | `1 1 1` | `1/2` | 32 | `VLEN/SEW/2` | `v_n` (single register in group) |
-    // | `0 0 0` | `1` | 32 | `VLEN/SEW` | `v_n` (single register in group) |
-    // | `0 0 1` | `2` | 16 | `2*VLEN/SEW` | `v_n`, `v_n+1` |
-    // | `0 1 0` | `4` | 8 | `4*VLEN/SEW` | `v_n`, ..., `v_n+3` |
-    // | `0 1 1` | `8` | 4 | `8*VLEN/SEW` | `v_n`, ..., `v_n+7` |
-    rv->lmul = 1<<(ir->zimm & 0x3);
-    if (ir->zimm & 0x4) {
-        rv->lmul = 1;
-    }
+RVOP(
+    vsetvli,
+    {
+        // | `vlmul[2:0]` | LMUL | #groups | VLMAX | Registers
+        // grouped with register `n` |
+        // |--------------|--------|---------|-----------------|--------------------------------------------------|
+        // | `1 0 0` | - | - | - | Reserved | | `1
+        // 0 1` | `1/8` | 32 | `VLEN/SEW/8` | `v_n` (single
+        // register in group) | | `1 1 0` | `1/4` | 32 |
+        // `VLEN/SEW/4` | `v_n` (single register in group) |
+        // | `1 1 1` | `1/2` | 32 | `VLEN/SEW/2` | `v_n` (single
+        // register in group) | | `0 0 0` | `1` | 32 |
+        // `VLEN/SEW` | `v_n` (single register in group) |
+        // | `0 0 1` | `2` | 16 | `2*VLEN/SEW` | `v_n`, `v_n+1`
+        // | | `0 1 0` | `4` | 8 | `4*VLEN/SEW` | `v_n`, ...,
+        // `v_n+3` | | `0 1 1` | `8` | 4 |
+        // `8*VLEN/SEW` | `v_n`, ..., `v_n+7` |
+        rv->lmul = 1 << (ir->zimm & 0x3);
+        if (ir->zimm & 0x4) {
+            rv->lmul = 1;
+        }
 
-    // | `vsew[2:0]` | SEW |
-    // |-------------|----------|
-    // | 0 0 0 | 8 |
-    // | 0 0 1 | 16 |
-    // | 0 1 0 | 32 |
-    // | 0 1 1 | 64 |
-    // | 1 X X | Reserved |
-    rv->sew = 8 << (ir->zimm & 0xf);
-}, GEN({/* no operation */}))
+        // | `vsew[2:0]` | SEW |
+        // |-------------|----------|
+        // | 0 0 0 | 8 |
+        // | 0 0 1 | 16 |
+        // | 0 1 0 | 32 |
+        // | 0 1 1 | 64 |
+        // | 1 X X | Reserved |
+        rv->sew = 8 << (ir->zimm & 0xf);
+    },
+    GEN({/* no operation */}))
 
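For reference, the two tables quoted in the comment above correspond to the vtype fields vlmul (vtype[2:0]) and vsew (vtype[5:3]) from the V spec. A standalone sketch that decodes a vtype value according to those tables (this follows the spec layout and is not the handler's code):

```c
#include <stdio.h>

/* Decode vtype per the tables above: vlmul = vtype[2:0], vsew = vtype[5:3].
 * Fractional LMUL (vlmul[2] set) and the reserved encodings are only
 * reported here, not handled. */
static void decode_vtype(unsigned vtype)
{
    unsigned vlmul = vtype & 0x7;
    unsigned vsew = (vtype >> 3) & 0x7;

    if ((vlmul & 0x4) || (vsew & 0x4)) {
        printf("vtype=0x%03x -> fractional or reserved encoding\n", vtype);
        return;
    }
    unsigned sew = 8u << vsew;   /* 000->8, 001->16, 010->32, 011->64 */
    unsigned lmul = 1u << vlmul; /* 000->1, 001->2, 010->4, 011->8 */
    printf("vtype=0x%03x -> SEW=%u LMUL=%u VLMAX=%u (VLEN=128)\n",
           vtype, sew, lmul, 128u * lmul / sew);
}

int main(void)
{
    decode_vtype(0x00); /* SEW=8,  LMUL=1 */
    decode_vtype(0x09); /* SEW=16, LMUL=2 */
    decode_vtype(0x10); /* SEW=32, LMUL=1 */
    return 0;
}
```
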
-#define ADD_VV(BIT) \
-static inline *int##BIT##_t add_vv_i##BIT##(int##BIT##_t *a, int##BIT##_t *b, size_t size) { \
-    int##BIT##_t c[size];\
-    for (int i = 0; i < size; i++) {\
-        c[i]=a[i]+b[i];\
-    }\
-    return c;\
-}
+#define ADD_VV(BIT)                                                    \
+    static inline *int##BIT##_t add_vv_i##BIT##(int##BIT##_t *a,       \
+                                                int##BIT##_t *b, size_t size) \
+    {                                                                  \
+        int##BIT##_t c[size];                                          \
+        for (int i = 0; i < size; i++) {                               \
+            c[i] = a[i] + b[i];                                        \
+        }                                                              \
+        return c;                                                      \
+    }
 ADD_VV(8)
 ADD_VV(16)
 ADD_VV(32)
 ADD_VV(64)
 
 
 RVOP(vadd_vi, { rv->V1[rv_reg_zero] = 0; }, GEN({/* no operation */}))
-RVOP(vadd_vv, {
-    switch (rv->sew) {
-    case 8:
-        rv->Vd = (* int8_t)add_vv_i8((*int8_t)rv->V1, (*int8_t)rv->V2, rv-vl/8);
-        break;
-    case 16:
-        rv->Vd = (* int8_t)add_vv_i16((*int16_t)rv->V1, (*int16_t)rv->V2, rv-vl/16);
-        break;
-    case 32:
-        rv->Vd = (* int8_t)add_vv_i32((*int32_t)rv->V1, (*int32_t)rv->V2, rv-vl/32);
-        break;
-    case 64:
-        rv->Vd = (* int8_t)add_vv_i64((*int64_t)rv->V1, (*int64_t)rv->V2, rv-vl/64);
-        break;
-
-    default:
-        break;
-    }
+RVOP(
+    vadd_vv,
+    {
+        switch (rv->sew) {
+        case 8:
+            rv->Vd = (*int8_t) add_vv_i8((*int8_t) rv->V1, (*int8_t) rv->V2,
+                                         rv - vl / 8);
+            break;
+        case 16:
+            rv->Vd = (*int8_t) add_vv_i16((*int16_t) rv->V1, (*int16_t) rv->V2,
+                                          rv - vl / 16);
+            break;
+        case 32:
+            rv->Vd = (*int8_t) add_vv_i32((*int32_t) rv->V1, (*int32_t) rv->V2,
+                                          rv - vl / 32);
+            break;
+        case 64:
+            rv->Vd = (*int8_t) add_vv_i64((*int64_t) rv->V1, (*int64_t) rv->V2,
+                                          rv - vl / 64);
+            break;
 
-}, GEN({/* no operation */}))
+        default:
+            break;
+        }
+    },
+    GEN({/* no operation */}))
 RVOP(vand_vi, { rv->Vd[rv_reg_zero] = 0; }, GEN({/* no operation */}))
 RVOP(vand_vv, { rv->Vd[rv_reg_zero] = 0; }, GEN({/* no operation */}))
 RVOP(vmadc_vi, { rv->Vd[rv_reg_zero] = 0; }, GEN({/* no operation */}))

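One way to make the ADD_VV helpers above usable is to have them write into a caller-provided destination buffer instead of returning a local array. The sketch below is only an illustration of that shape: the macro and function names, the byte-buffer convention, and the assumption that the element count comes from vl are mine, not the emulator's API.

```c
#include <stddef.h>
#include <stdint.h>
#include <string.h>

/* Illustrative element-wise add over byte-backed vector register storage
 * (a + b -> dst), generated per element width.  'count' is the number of
 * active elements (e.g. vl for the current SEW); unsigned arithmetic gives
 * the usual two's-complement wrap-around. */
#define DEF_ADD_VV(BIT)                                              \
    static inline void add_vv_u##BIT(uint8_t *dst, const uint8_t *a, \
                                     const uint8_t *b, size_t count) \
    {                                                                \
        for (size_t i = 0; i < count; i++) {                         \
            uint##BIT##_t x, y, z;                                   \
            memcpy(&x, a + i * sizeof(x), sizeof(x));                \
            memcpy(&y, b + i * sizeof(y), sizeof(y));                \
            z = (uint##BIT##_t) (x + y);                             \
            memcpy(dst + i * sizeof(z), &z, sizeof(z));              \
        }                                                            \
    }

DEF_ADD_VV(8)
DEF_ADD_VV(16)
DEF_ADD_VV(32)
DEF_ADD_VV(64)

/* Usage sketch (assuming vl counts elements of the current SEW):
 *     add_vv_u32(rv->Vd, rv->V1, rv->V2, rv->vl);
 */
```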