Vector Integer Arithmetic Intrinsics

Vector Single-Width Integer Add and Subtract Intrinsics

vint8mf8_t __riscv_vadd_vv_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2,
                                    vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vadd_vx_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2, int8_t rs1,
                                    size_t vl);
vint8mf4_t __riscv_vadd_vv_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2,
                                    vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vadd_vx_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2, int8_t rs1,
                                    size_t vl);
vint8mf2_t __riscv_vadd_vv_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2,
                                    vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vadd_vx_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2, int8_t rs1,
                                    size_t vl);
vint8m1_t __riscv_vadd_vv_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, vint8m1_t vs1,
                                  size_t vl);
vint8m1_t __riscv_vadd_vx_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, int8_t rs1,
                                  size_t vl);
vint8m2_t __riscv_vadd_vv_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, vint8m2_t vs1,
                                  size_t vl);
vint8m2_t __riscv_vadd_vx_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, int8_t rs1,
                                  size_t vl);
vint8m4_t __riscv_vadd_vv_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, vint8m4_t vs1,
                                  size_t vl);
vint8m4_t __riscv_vadd_vx_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, int8_t rs1,
                                  size_t vl);
vint8m8_t __riscv_vadd_vv_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, vint8m8_t vs1,
                                  size_t vl);
vint8m8_t __riscv_vadd_vx_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, int8_t rs1,
                                  size_t vl);
vint16mf4_t __riscv_vadd_vv_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                      vint16mf4_t vs1, size_t vl);
vint16mf4_t __riscv_vadd_vx_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                      int16_t rs1, size_t vl);
vint16mf2_t __riscv_vadd_vv_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                      vint16mf2_t vs1, size_t vl);
vint16mf2_t __riscv_vadd_vx_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                      int16_t rs1, size_t vl);
vint16m1_t __riscv_vadd_vv_i16m1_tu(vint16m1_t vd, vint16m1_t vs2,
                                    vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vadd_vx_i16m1_tu(vint16m1_t vd, vint16m1_t vs2, int16_t rs1,
                                    size_t vl);
vint16m2_t __riscv_vadd_vv_i16m2_tu(vint16m2_t vd, vint16m2_t vs2,
                                    vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vadd_vx_i16m2_tu(vint16m2_t vd, vint16m2_t vs2, int16_t rs1,
                                    size_t vl);
vint16m4_t __riscv_vadd_vv_i16m4_tu(vint16m4_t vd, vint16m4_t vs2,
                                    vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vadd_vx_i16m4_tu(vint16m4_t vd, vint16m4_t vs2, int16_t rs1,
                                    size_t vl);
vint16m8_t __riscv_vadd_vv_i16m8_tu(vint16m8_t vd, vint16m8_t vs2,
                                    vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vadd_vx_i16m8_tu(vint16m8_t vd, vint16m8_t vs2, int16_t rs1,
                                    size_t vl);
vint32mf2_t __riscv_vadd_vv_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                      vint32mf2_t vs1, size_t vl);
vint32mf2_t __riscv_vadd_vx_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                      int32_t rs1, size_t vl);
vint32m1_t __riscv_vadd_vv_i32m1_tu(vint32m1_t vd, vint32m1_t vs2,
                                    vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vadd_vx_i32m1_tu(vint32m1_t vd, vint32m1_t vs2, int32_t rs1,
                                    size_t vl);
vint32m2_t __riscv_vadd_vv_i32m2_tu(vint32m2_t vd, vint32m2_t vs2,
                                    vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vadd_vx_i32m2_tu(vint32m2_t vd, vint32m2_t vs2, int32_t rs1,
                                    size_t vl);
vint32m4_t __riscv_vadd_vv_i32m4_tu(vint32m4_t vd, vint32m4_t vs2,
                                    vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vadd_vx_i32m4_tu(vint32m4_t vd, vint32m4_t vs2, int32_t rs1,
                                    size_t vl);
vint32m8_t __riscv_vadd_vv_i32m8_tu(vint32m8_t vd, vint32m8_t vs2,
                                    vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vadd_vx_i32m8_tu(vint32m8_t vd, vint32m8_t vs2, int32_t rs1,
                                    size_t vl);
vint64m1_t __riscv_vadd_vv_i64m1_tu(vint64m1_t vd, vint64m1_t vs2,
                                    vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vadd_vx_i64m1_tu(vint64m1_t vd, vint64m1_t vs2, int64_t rs1,
                                    size_t vl);
vint64m2_t __riscv_vadd_vv_i64m2_tu(vint64m2_t vd, vint64m2_t vs2,
                                    vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vadd_vx_i64m2_tu(vint64m2_t vd, vint64m2_t vs2, int64_t rs1,
                                    size_t vl);
vint64m4_t __riscv_vadd_vv_i64m4_tu(vint64m4_t vd, vint64m4_t vs2,
                                    vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vadd_vx_i64m4_tu(vint64m4_t vd, vint64m4_t vs2, int64_t rs1,
                                    size_t vl);
vint64m8_t __riscv_vadd_vv_i64m8_tu(vint64m8_t vd, vint64m8_t vs2,
                                    vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vadd_vx_i64m8_tu(vint64m8_t vd, vint64m8_t vs2, int64_t rs1,
                                    size_t vl);
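// Usage sketch (not part of the generated listing): the _tu suffix selects the
// tail-undisturbed policy, so lanes at indices >= vl keep the value of the vd
// (first) operand instead of being overwritten. A typical use is an accumulator
// whose partial sums must survive a shorter final strip-mined iteration. The
// function and buffer names below are hypothetical.

#include <riscv_vector.h>
#include <stdint.h>
#include <stddef.h>

int32_t sum_i32(const int32_t *src, size_t n) {
  size_t vlmax = __riscv_vsetvlmax_e32m1();
  vint32m1_t vacc = __riscv_vmv_v_x_i32m1(0, vlmax);     // zeroed accumulator
  for (size_t i = 0; i < n;) {
    size_t vl = __riscv_vsetvl_e32m1(n - i);
    vint32m1_t v = __riscv_vle32_v_i32m1(&src[i], vl);
    // _tu: only the first vl lanes are rewritten; lanes >= vl keep vacc's values.
    vacc = __riscv_vadd_vv_i32m1_tu(vacc, vacc, v, vl);
    i += vl;
  }
  vint32m1_t vzero = __riscv_vmv_v_x_i32m1(0, vlmax);
  vint32m1_t vsum = __riscv_vredsum_vs_i32m1_i32m1(vacc, vzero, vlmax);
  return __riscv_vmv_x_s_i32m1_i32(vsum);
}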
vint8mf8_t __riscv_vsub_vv_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2,
                                    vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vsub_vx_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2, int8_t rs1,
                                    size_t vl);
vint8mf4_t __riscv_vsub_vv_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2,
                                    vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vsub_vx_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2, int8_t rs1,
                                    size_t vl);
vint8mf2_t __riscv_vsub_vv_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2,
                                    vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vsub_vx_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2, int8_t rs1,
                                    size_t vl);
vint8m1_t __riscv_vsub_vv_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, vint8m1_t vs1,
                                  size_t vl);
vint8m1_t __riscv_vsub_vx_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, int8_t rs1,
                                  size_t vl);
vint8m2_t __riscv_vsub_vv_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, vint8m2_t vs1,
                                  size_t vl);
vint8m2_t __riscv_vsub_vx_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, int8_t rs1,
                                  size_t vl);
vint8m4_t __riscv_vsub_vv_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, vint8m4_t vs1,
                                  size_t vl);
vint8m4_t __riscv_vsub_vx_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, int8_t rs1,
                                  size_t vl);
vint8m8_t __riscv_vsub_vv_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, vint8m8_t vs1,
                                  size_t vl);
vint8m8_t __riscv_vsub_vx_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, int8_t rs1,
                                  size_t vl);
vint16mf4_t __riscv_vsub_vv_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                      vint16mf4_t vs1, size_t vl);
vint16mf4_t __riscv_vsub_vx_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                      int16_t rs1, size_t vl);
vint16mf2_t __riscv_vsub_vv_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                      vint16mf2_t vs1, size_t vl);
vint16mf2_t __riscv_vsub_vx_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                      int16_t rs1, size_t vl);
vint16m1_t __riscv_vsub_vv_i16m1_tu(vint16m1_t vd, vint16m1_t vs2,
                                    vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vsub_vx_i16m1_tu(vint16m1_t vd, vint16m1_t vs2, int16_t rs1,
                                    size_t vl);
vint16m2_t __riscv_vsub_vv_i16m2_tu(vint16m2_t vd, vint16m2_t vs2,
                                    vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vsub_vx_i16m2_tu(vint16m2_t vd, vint16m2_t vs2, int16_t rs1,
                                    size_t vl);
vint16m4_t __riscv_vsub_vv_i16m4_tu(vint16m4_t vd, vint16m4_t vs2,
                                    vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vsub_vx_i16m4_tu(vint16m4_t vd, vint16m4_t vs2, int16_t rs1,
                                    size_t vl);
vint16m8_t __riscv_vsub_vv_i16m8_tu(vint16m8_t vd, vint16m8_t vs2,
                                    vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vsub_vx_i16m8_tu(vint16m8_t vd, vint16m8_t vs2, int16_t rs1,
                                    size_t vl);
vint32mf2_t __riscv_vsub_vv_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                      vint32mf2_t vs1, size_t vl);
vint32mf2_t __riscv_vsub_vx_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                      int32_t rs1, size_t vl);
vint32m1_t __riscv_vsub_vv_i32m1_tu(vint32m1_t vd, vint32m1_t vs2,
                                    vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vsub_vx_i32m1_tu(vint32m1_t vd, vint32m1_t vs2, int32_t rs1,
                                    size_t vl);
vint32m2_t __riscv_vsub_vv_i32m2_tu(vint32m2_t vd, vint32m2_t vs2,
                                    vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vsub_vx_i32m2_tu(vint32m2_t vd, vint32m2_t vs2, int32_t rs1,
                                    size_t vl);
vint32m4_t __riscv_vsub_vv_i32m4_tu(vint32m4_t vd, vint32m4_t vs2,
                                    vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vsub_vx_i32m4_tu(vint32m4_t vd, vint32m4_t vs2, int32_t rs1,
                                    size_t vl);
vint32m8_t __riscv_vsub_vv_i32m8_tu(vint32m8_t vd, vint32m8_t vs2,
                                    vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vsub_vx_i32m8_tu(vint32m8_t vd, vint32m8_t vs2, int32_t rs1,
                                    size_t vl);
vint64m1_t __riscv_vsub_vv_i64m1_tu(vint64m1_t vd, vint64m1_t vs2,
                                    vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vsub_vx_i64m1_tu(vint64m1_t vd, vint64m1_t vs2, int64_t rs1,
                                    size_t vl);
vint64m2_t __riscv_vsub_vv_i64m2_tu(vint64m2_t vd, vint64m2_t vs2,
                                    vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vsub_vx_i64m2_tu(vint64m2_t vd, vint64m2_t vs2, int64_t rs1,
                                    size_t vl);
vint64m4_t __riscv_vsub_vv_i64m4_tu(vint64m4_t vd, vint64m4_t vs2,
                                    vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vsub_vx_i64m4_tu(vint64m4_t vd, vint64m4_t vs2, int64_t rs1,
                                    size_t vl);
vint64m8_t __riscv_vsub_vv_i64m8_tu(vint64m8_t vd, vint64m8_t vs2,
                                    vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vsub_vx_i64m8_tu(vint64m8_t vd, vint64m8_t vs2, int64_t rs1,
                                    size_t vl);
vint8mf8_t __riscv_vrsub_vx_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2, int8_t rs1,
                                     size_t vl);
vint8mf4_t __riscv_vrsub_vx_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2, int8_t rs1,
                                     size_t vl);
vint8mf2_t __riscv_vrsub_vx_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2, int8_t rs1,
                                     size_t vl);
vint8m1_t __riscv_vrsub_vx_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, int8_t rs1,
                                   size_t vl);
vint8m2_t __riscv_vrsub_vx_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, int8_t rs1,
                                   size_t vl);
vint8m4_t __riscv_vrsub_vx_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, int8_t rs1,
                                   size_t vl);
vint8m8_t __riscv_vrsub_vx_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, int8_t rs1,
                                   size_t vl);
vint16mf4_t __riscv_vrsub_vx_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                       int16_t rs1, size_t vl);
vint16mf2_t __riscv_vrsub_vx_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                       int16_t rs1, size_t vl);
vint16m1_t __riscv_vrsub_vx_i16m1_tu(vint16m1_t vd, vint16m1_t vs2, int16_t rs1,
                                     size_t vl);
vint16m2_t __riscv_vrsub_vx_i16m2_tu(vint16m2_t vd, vint16m2_t vs2, int16_t rs1,
                                     size_t vl);
vint16m4_t __riscv_vrsub_vx_i16m4_tu(vint16m4_t vd, vint16m4_t vs2, int16_t rs1,
                                     size_t vl);
vint16m8_t __riscv_vrsub_vx_i16m8_tu(vint16m8_t vd, vint16m8_t vs2, int16_t rs1,
                                     size_t vl);
vint32mf2_t __riscv_vrsub_vx_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                       int32_t rs1, size_t vl);
vint32m1_t __riscv_vrsub_vx_i32m1_tu(vint32m1_t vd, vint32m1_t vs2, int32_t rs1,
                                     size_t vl);
vint32m2_t __riscv_vrsub_vx_i32m2_tu(vint32m2_t vd, vint32m2_t vs2, int32_t rs1,
                                     size_t vl);
vint32m4_t __riscv_vrsub_vx_i32m4_tu(vint32m4_t vd, vint32m4_t vs2, int32_t rs1,
                                     size_t vl);
vint32m8_t __riscv_vrsub_vx_i32m8_tu(vint32m8_t vd, vint32m8_t vs2, int32_t rs1,
                                     size_t vl);
vint64m1_t __riscv_vrsub_vx_i64m1_tu(vint64m1_t vd, vint64m1_t vs2, int64_t rs1,
                                     size_t vl);
vint64m2_t __riscv_vrsub_vx_i64m2_tu(vint64m2_t vd, vint64m2_t vs2, int64_t rs1,
                                     size_t vl);
vint64m4_t __riscv_vrsub_vx_i64m4_tu(vint64m4_t vd, vint64m4_t vs2, int64_t rs1,
                                     size_t vl);
vint64m8_t __riscv_vrsub_vx_i64m8_tu(vint64m8_t vd, vint64m8_t vs2, int64_t rs1,
                                     size_t vl);
vint8mf8_t __riscv_vneg_v_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs, size_t vl);
vint8mf4_t __riscv_vneg_v_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs, size_t vl);
vint8mf2_t __riscv_vneg_v_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs, size_t vl);
vint8m1_t __riscv_vneg_v_i8m1_tu(vint8m1_t vd, vint8m1_t vs, size_t vl);
vint8m2_t __riscv_vneg_v_i8m2_tu(vint8m2_t vd, vint8m2_t vs, size_t vl);
vint8m4_t __riscv_vneg_v_i8m4_tu(vint8m4_t vd, vint8m4_t vs, size_t vl);
vint8m8_t __riscv_vneg_v_i8m8_tu(vint8m8_t vd, vint8m8_t vs, size_t vl);
vint16mf4_t __riscv_vneg_v_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs, size_t vl);
vint16mf2_t __riscv_vneg_v_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs, size_t vl);
vint16m1_t __riscv_vneg_v_i16m1_tu(vint16m1_t vd, vint16m1_t vs, size_t vl);
vint16m2_t __riscv_vneg_v_i16m2_tu(vint16m2_t vd, vint16m2_t vs, size_t vl);
vint16m4_t __riscv_vneg_v_i16m4_tu(vint16m4_t vd, vint16m4_t vs, size_t vl);
vint16m8_t __riscv_vneg_v_i16m8_tu(vint16m8_t vd, vint16m8_t vs, size_t vl);
vint32mf2_t __riscv_vneg_v_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs, size_t vl);
vint32m1_t __riscv_vneg_v_i32m1_tu(vint32m1_t vd, vint32m1_t vs, size_t vl);
vint32m2_t __riscv_vneg_v_i32m2_tu(vint32m2_t vd, vint32m2_t vs, size_t vl);
vint32m4_t __riscv_vneg_v_i32m4_tu(vint32m4_t vd, vint32m4_t vs, size_t vl);
vint32m8_t __riscv_vneg_v_i32m8_tu(vint32m8_t vd, vint32m8_t vs, size_t vl);
vint64m1_t __riscv_vneg_v_i64m1_tu(vint64m1_t vd, vint64m1_t vs, size_t vl);
vint64m2_t __riscv_vneg_v_i64m2_tu(vint64m2_t vd, vint64m2_t vs, size_t vl);
vint64m4_t __riscv_vneg_v_i64m4_tu(vint64m4_t vd, vint64m4_t vs, size_t vl);
vint64m8_t __riscv_vneg_v_i64m8_tu(vint64m8_t vd, vint64m8_t vs, size_t vl);
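// Usage sketch (not part of the generated listing): vrsub reverses the
// subtraction operands, computing rs1 - vs2[i] per element, and vneg is the
// element-wise negation -vs[i]. The helpers below, with hypothetical names,
// show both under the tail-undisturbed policy, where lanes >= vl keep the
// values already in the vd operand ('prev').

#include <riscv_vector.h>
#include <stdint.h>
#include <stddef.h>

// result[i] = 100 - src[i] for the first vl lanes; lanes >= vl keep 'prev'.
vint16m1_t rsub_from_100(vint16m1_t prev, const int16_t *src, size_t vl) {
  vint16m1_t v = __riscv_vle16_v_i16m1(src, vl);
  return __riscv_vrsub_vx_i16m1_tu(prev, v, 100, vl);
}

// result[i] = -src[i] for the first vl lanes; lanes >= vl keep 'prev'.
vint16m1_t negate(vint16m1_t prev, const int16_t *src, size_t vl) {
  vint16m1_t v = __riscv_vle16_v_i16m1(src, vl);
  return __riscv_vneg_v_i16m1_tu(prev, v, vl);
}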
vuint8mf8_t __riscv_vadd_vv_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                     vuint8mf8_t vs1, size_t vl);
vuint8mf8_t __riscv_vadd_vx_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vadd_vv_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                     vuint8mf4_t vs1, size_t vl);
vuint8mf4_t __riscv_vadd_vx_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vadd_vv_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                     vuint8mf2_t vs1, size_t vl);
vuint8mf2_t __riscv_vadd_vx_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vadd_vv_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2,
                                   vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vadd_vx_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2, uint8_t rs1,
                                   size_t vl);
vuint8m2_t __riscv_vadd_vv_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2,
                                   vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vadd_vx_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2, uint8_t rs1,
                                   size_t vl);
vuint8m4_t __riscv_vadd_vv_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2,
                                   vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vadd_vx_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2, uint8_t rs1,
                                   size_t vl);
vuint8m8_t __riscv_vadd_vv_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2,
                                   vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vadd_vx_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2, uint8_t rs1,
                                   size_t vl);
vuint16mf4_t __riscv_vadd_vv_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                       vuint16mf4_t vs1, size_t vl);
vuint16mf4_t __riscv_vadd_vx_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                       uint16_t rs1, size_t vl);
vuint16mf2_t __riscv_vadd_vv_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                       vuint16mf2_t vs1, size_t vl);
vuint16mf2_t __riscv_vadd_vx_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                       uint16_t rs1, size_t vl);
vuint16m1_t __riscv_vadd_vv_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                     vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vadd_vx_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                     uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vadd_vv_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                     vuint16m2_t vs1, size_t vl);
vuint16m2_t __riscv_vadd_vx_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                     uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vadd_vv_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                     vuint16m4_t vs1, size_t vl);
vuint16m4_t __riscv_vadd_vx_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                     uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vadd_vv_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                     vuint16m8_t vs1, size_t vl);
vuint16m8_t __riscv_vadd_vx_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                     uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vadd_vv_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                       vuint32mf2_t vs1, size_t vl);
vuint32mf2_t __riscv_vadd_vx_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                       uint32_t rs1, size_t vl);
vuint32m1_t __riscv_vadd_vv_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                     vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vadd_vx_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                     uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vadd_vv_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                     vuint32m2_t vs1, size_t vl);
vuint32m2_t __riscv_vadd_vx_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                     uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vadd_vv_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                     vuint32m4_t vs1, size_t vl);
vuint32m4_t __riscv_vadd_vx_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                     uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vadd_vv_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                     vuint32m8_t vs1, size_t vl);
vuint32m8_t __riscv_vadd_vx_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                     uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vadd_vv_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                     vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vadd_vx_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                     uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vadd_vv_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                     vuint64m2_t vs1, size_t vl);
vuint64m2_t __riscv_vadd_vx_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                     uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vadd_vv_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                     vuint64m4_t vs1, size_t vl);
vuint64m4_t __riscv_vadd_vx_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                     uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vadd_vv_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                     vuint64m8_t vs1, size_t vl);
vuint64m8_t __riscv_vadd_vx_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                     uint64_t rs1, size_t vl);
vuint8mf8_t __riscv_vsub_vv_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                     vuint8mf8_t vs1, size_t vl);
vuint8mf8_t __riscv_vsub_vx_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vsub_vv_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                     vuint8mf4_t vs1, size_t vl);
vuint8mf4_t __riscv_vsub_vx_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vsub_vv_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                     vuint8mf2_t vs1, size_t vl);
vuint8mf2_t __riscv_vsub_vx_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vsub_vv_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2,
                                   vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vsub_vx_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2, uint8_t rs1,
                                   size_t vl);
vuint8m2_t __riscv_vsub_vv_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2,
                                   vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vsub_vx_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2, uint8_t rs1,
                                   size_t vl);
vuint8m4_t __riscv_vsub_vv_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2,
                                   vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vsub_vx_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2, uint8_t rs1,
                                   size_t vl);
vuint8m8_t __riscv_vsub_vv_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2,
                                   vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vsub_vx_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2, uint8_t rs1,
                                   size_t vl);
vuint16mf4_t __riscv_vsub_vv_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                       vuint16mf4_t vs1, size_t vl);
vuint16mf4_t __riscv_vsub_vx_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                       uint16_t rs1, size_t vl);
vuint16mf2_t __riscv_vsub_vv_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                       vuint16mf2_t vs1, size_t vl);
vuint16mf2_t __riscv_vsub_vx_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                       uint16_t rs1, size_t vl);
vuint16m1_t __riscv_vsub_vv_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                     vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vsub_vx_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                     uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vsub_vv_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                     vuint16m2_t vs1, size_t vl);
vuint16m2_t __riscv_vsub_vx_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                     uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vsub_vv_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                     vuint16m4_t vs1, size_t vl);
vuint16m4_t __riscv_vsub_vx_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                     uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vsub_vv_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                     vuint16m8_t vs1, size_t vl);
vuint16m8_t __riscv_vsub_vx_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                     uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vsub_vv_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                       vuint32mf2_t vs1, size_t vl);
vuint32mf2_t __riscv_vsub_vx_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                       uint32_t rs1, size_t vl);
vuint32m1_t __riscv_vsub_vv_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                     vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vsub_vx_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                     uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vsub_vv_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                     vuint32m2_t vs1, size_t vl);
vuint32m2_t __riscv_vsub_vx_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                     uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vsub_vv_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                     vuint32m4_t vs1, size_t vl);
vuint32m4_t __riscv_vsub_vx_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                     uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vsub_vv_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                     vuint32m8_t vs1, size_t vl);
vuint32m8_t __riscv_vsub_vx_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                     uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vsub_vv_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                     vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vsub_vx_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                     uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vsub_vv_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                     vuint64m2_t vs1, size_t vl);
vuint64m2_t __riscv_vsub_vx_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                     uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vsub_vv_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                     vuint64m4_t vs1, size_t vl);
vuint64m4_t __riscv_vsub_vx_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                     uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vsub_vv_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                     vuint64m8_t vs1, size_t vl);
vuint64m8_t __riscv_vsub_vx_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                     uint64_t rs1, size_t vl);
vuint8mf8_t __riscv_vrsub_vx_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                      uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vrsub_vx_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                      uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vrsub_vx_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                      uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vrsub_vx_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2, uint8_t rs1,
                                    size_t vl);
vuint8m2_t __riscv_vrsub_vx_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2, uint8_t rs1,
                                    size_t vl);
vuint8m4_t __riscv_vrsub_vx_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2, uint8_t rs1,
                                    size_t vl);
vuint8m8_t __riscv_vrsub_vx_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2, uint8_t rs1,
                                    size_t vl);
vuint16mf4_t __riscv_vrsub_vx_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                        uint16_t rs1, size_t vl);
vuint16mf2_t __riscv_vrsub_vx_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                        uint16_t rs1, size_t vl);
vuint16m1_t __riscv_vrsub_vx_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                      uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vrsub_vx_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                      uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vrsub_vx_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                      uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vrsub_vx_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                      uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vrsub_vx_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                        uint32_t rs1, size_t vl);
vuint32m1_t __riscv_vrsub_vx_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                      uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vrsub_vx_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                      uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vrsub_vx_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                      uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vrsub_vx_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                      uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vrsub_vx_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                      uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vrsub_vx_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                      uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vrsub_vx_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                      uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vrsub_vx_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                      uint64_t rs1, size_t vl);
// masked functions
vint8mf8_t __riscv_vadd_vv_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                     vint8mf8_t vs2, vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vadd_vx_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                     vint8mf8_t vs2, int8_t rs1, size_t vl);
vint8mf4_t __riscv_vadd_vv_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                     vint8mf4_t vs2, vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vadd_vx_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                     vint8mf4_t vs2, int8_t rs1, size_t vl);
vint8mf2_t __riscv_vadd_vv_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                     vint8mf2_t vs2, vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vadd_vx_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                     vint8mf2_t vs2, int8_t rs1, size_t vl);
vint8m1_t __riscv_vadd_vv_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                   vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vadd_vx_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                   int8_t rs1, size_t vl);
vint8m2_t __riscv_vadd_vv_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                   vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vadd_vx_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                   int8_t rs1, size_t vl);
vint8m4_t __riscv_vadd_vv_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                   vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vadd_vx_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                   int8_t rs1, size_t vl);
vint8m8_t __riscv_vadd_vv_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                   vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vadd_vx_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                   int8_t rs1, size_t vl);
vint16mf4_t __riscv_vadd_vv_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs2, vint16mf4_t vs1,
                                       size_t vl);
vint16mf4_t __riscv_vadd_vx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs2, int16_t rs1, size_t vl);
vint16mf2_t __riscv_vadd_vv_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs2, vint16mf2_t vs1,
                                       size_t vl);
vint16mf2_t __riscv_vadd_vx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs2, int16_t rs1, size_t vl);
vint16m1_t __riscv_vadd_vv_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs2, vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vadd_vx_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs2, int16_t rs1, size_t vl);
vint16m2_t __riscv_vadd_vv_i16m2_tum(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                     vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vadd_vx_i16m2_tum(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                     int16_t rs1, size_t vl);
vint16m4_t __riscv_vadd_vv_i16m4_tum(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                     vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vadd_vx_i16m4_tum(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                     int16_t rs1, size_t vl);
vint16m8_t __riscv_vadd_vv_i16m8_tum(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                     vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vadd_vx_i16m8_tum(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                     int16_t rs1, size_t vl);
vint32mf2_t __riscv_vadd_vv_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs2, vint32mf2_t vs1,
                                       size_t vl);
vint32mf2_t __riscv_vadd_vx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs2, int32_t rs1, size_t vl);
vint32m1_t __riscv_vadd_vv_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs2, vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vadd_vx_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs2, int32_t rs1, size_t vl);
vint32m2_t __riscv_vadd_vv_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs2, vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vadd_vx_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs2, int32_t rs1, size_t vl);
vint32m4_t __riscv_vadd_vv_i32m4_tum(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                     vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vadd_vx_i32m4_tum(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                     int32_t rs1, size_t vl);
vint32m8_t __riscv_vadd_vv_i32m8_tum(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                     vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vadd_vx_i32m8_tum(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                     int32_t rs1, size_t vl);
vint64m1_t __riscv_vadd_vv_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs2, vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vadd_vx_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs2, int64_t rs1, size_t vl);
vint64m2_t __riscv_vadd_vv_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs2, vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vadd_vx_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs2, int64_t rs1, size_t vl);
vint64m4_t __riscv_vadd_vv_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs2, vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vadd_vx_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs2, int64_t rs1, size_t vl);
vint64m8_t __riscv_vadd_vv_i64m8_tum(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                     vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vadd_vx_i64m8_tum(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                     int64_t rs1, size_t vl);
vint8mf8_t __riscv_vsub_vv_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                     vint8mf8_t vs2, vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vsub_vx_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                     vint8mf8_t vs2, int8_t rs1, size_t vl);
vint8mf4_t __riscv_vsub_vv_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                     vint8mf4_t vs2, vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vsub_vx_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                     vint8mf4_t vs2, int8_t rs1, size_t vl);
vint8mf2_t __riscv_vsub_vv_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                     vint8mf2_t vs2, vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vsub_vx_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                     vint8mf2_t vs2, int8_t rs1, size_t vl);
vint8m1_t __riscv_vsub_vv_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                   vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vsub_vx_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                   int8_t rs1, size_t vl);
vint8m2_t __riscv_vsub_vv_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                   vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vsub_vx_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                   int8_t rs1, size_t vl);
vint8m4_t __riscv_vsub_vv_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                   vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vsub_vx_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                   int8_t rs1, size_t vl);
vint8m8_t __riscv_vsub_vv_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                   vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vsub_vx_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                   int8_t rs1, size_t vl);
vint16mf4_t __riscv_vsub_vv_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs2, vint16mf4_t vs1,
                                       size_t vl);
vint16mf4_t __riscv_vsub_vx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs2, int16_t rs1, size_t vl);
vint16mf2_t __riscv_vsub_vv_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs2, vint16mf2_t vs1,
                                       size_t vl);
vint16mf2_t __riscv_vsub_vx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs2, int16_t rs1, size_t vl);
vint16m1_t __riscv_vsub_vv_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs2, vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vsub_vx_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs2, int16_t rs1, size_t vl);
vint16m2_t __riscv_vsub_vv_i16m2_tum(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                     vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vsub_vx_i16m2_tum(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                     int16_t rs1, size_t vl);
vint16m4_t __riscv_vsub_vv_i16m4_tum(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                     vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vsub_vx_i16m4_tum(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                     int16_t rs1, size_t vl);
vint16m8_t __riscv_vsub_vv_i16m8_tum(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                     vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vsub_vx_i16m8_tum(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                     int16_t rs1, size_t vl);
vint32mf2_t __riscv_vsub_vv_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs2, vint32mf2_t vs1,
                                       size_t vl);
vint32mf2_t __riscv_vsub_vx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs2, int32_t rs1, size_t vl);
vint32m1_t __riscv_vsub_vv_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs2, vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vsub_vx_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs2, int32_t rs1, size_t vl);
vint32m2_t __riscv_vsub_vv_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs2, vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vsub_vx_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs2, int32_t rs1, size_t vl);
vint32m4_t __riscv_vsub_vv_i32m4_tum(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                     vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vsub_vx_i32m4_tum(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                     int32_t rs1, size_t vl);
vint32m8_t __riscv_vsub_vv_i32m8_tum(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                     vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vsub_vx_i32m8_tum(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                     int32_t rs1, size_t vl);
vint64m1_t __riscv_vsub_vv_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs2, vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vsub_vx_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs2, int64_t rs1, size_t vl);
vint64m2_t __riscv_vsub_vv_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs2, vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vsub_vx_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs2, int64_t rs1, size_t vl);
vint64m4_t __riscv_vsub_vv_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs2, vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vsub_vx_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs2, int64_t rs1, size_t vl);
vint64m8_t __riscv_vsub_vv_i64m8_tum(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                     vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vsub_vx_i64m8_tum(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                     int64_t rs1, size_t vl);
vint8mf8_t __riscv_vrsub_vx_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                      vint8mf8_t vs2, int8_t rs1, size_t vl);
vint8mf4_t __riscv_vrsub_vx_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                      vint8mf4_t vs2, int8_t rs1, size_t vl);
vint8mf2_t __riscv_vrsub_vx_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                      vint8mf2_t vs2, int8_t rs1, size_t vl);
vint8m1_t __riscv_vrsub_vx_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                    int8_t rs1, size_t vl);
vint8m2_t __riscv_vrsub_vx_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                    int8_t rs1, size_t vl);
vint8m4_t __riscv_vrsub_vx_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                    int8_t rs1, size_t vl);
vint8m8_t __riscv_vrsub_vx_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                    int8_t rs1, size_t vl);
vint16mf4_t __riscv_vrsub_vx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs2, int16_t rs1,
                                        size_t vl);
vint16mf2_t __riscv_vrsub_vx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs2, int16_t rs1,
                                        size_t vl);
vint16m1_t __riscv_vrsub_vx_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs2, int16_t rs1, size_t vl);
vint16m2_t __riscv_vrsub_vx_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs2, int16_t rs1, size_t vl);
vint16m4_t __riscv_vrsub_vx_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs2, int16_t rs1, size_t vl);
vint16m8_t __riscv_vrsub_vx_i16m8_tum(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs2, int16_t rs1, size_t vl);
vint32mf2_t __riscv_vrsub_vx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs2, int32_t rs1,
                                        size_t vl);
vint32m1_t __riscv_vrsub_vx_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs2, int32_t rs1, size_t vl);
vint32m2_t __riscv_vrsub_vx_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs2, int32_t rs1, size_t vl);
vint32m4_t __riscv_vrsub_vx_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs2, int32_t rs1, size_t vl);
vint32m8_t __riscv_vrsub_vx_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs2, int32_t rs1, size_t vl);
vint64m1_t __riscv_vrsub_vx_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs2, int64_t rs1, size_t vl);
vint64m2_t __riscv_vrsub_vx_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs2, int64_t rs1, size_t vl);
vint64m4_t __riscv_vrsub_vx_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs2, int64_t rs1, size_t vl);
vint64m8_t __riscv_vrsub_vx_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs2, int64_t rs1, size_t vl);
vint8mf8_t __riscv_vneg_v_i8mf8_tum(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs,
                                    size_t vl);
vint8mf4_t __riscv_vneg_v_i8mf4_tum(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs,
                                    size_t vl);
vint8mf2_t __riscv_vneg_v_i8mf2_tum(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs,
                                    size_t vl);
vint8m1_t __riscv_vneg_v_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs,
                                  size_t vl);
vint8m2_t __riscv_vneg_v_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs,
                                  size_t vl);
vint8m4_t __riscv_vneg_v_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs,
                                  size_t vl);
vint8m8_t __riscv_vneg_v_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs,
                                  size_t vl);
vint16mf4_t __riscv_vneg_v_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                      vint16mf4_t vs, size_t vl);
vint16mf2_t __riscv_vneg_v_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                      vint16mf2_t vs, size_t vl);
vint16m1_t __riscv_vneg_v_i16m1_tum(vbool16_t vm, vint16m1_t vd, vint16m1_t vs,
                                    size_t vl);
vint16m2_t __riscv_vneg_v_i16m2_tum(vbool8_t vm, vint16m2_t vd, vint16m2_t vs,
                                    size_t vl);
vint16m4_t __riscv_vneg_v_i16m4_tum(vbool4_t vm, vint16m4_t vd, vint16m4_t vs,
                                    size_t vl);
vint16m8_t __riscv_vneg_v_i16m8_tum(vbool2_t vm, vint16m8_t vd, vint16m8_t vs,
                                    size_t vl);
vint32mf2_t __riscv_vneg_v_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                      vint32mf2_t vs, size_t vl);
vint32m1_t __riscv_vneg_v_i32m1_tum(vbool32_t vm, vint32m1_t vd, vint32m1_t vs,
                                    size_t vl);
vint32m2_t __riscv_vneg_v_i32m2_tum(vbool16_t vm, vint32m2_t vd, vint32m2_t vs,
                                    size_t vl);
vint32m4_t __riscv_vneg_v_i32m4_tum(vbool8_t vm, vint32m4_t vd, vint32m4_t vs,
                                    size_t vl);
vint32m8_t __riscv_vneg_v_i32m8_tum(vbool4_t vm, vint32m8_t vd, vint32m8_t vs,
                                    size_t vl);
vint64m1_t __riscv_vneg_v_i64m1_tum(vbool64_t vm, vint64m1_t vd, vint64m1_t vs,
                                    size_t vl);
vint64m2_t __riscv_vneg_v_i64m2_tum(vbool32_t vm, vint64m2_t vd, vint64m2_t vs,
                                    size_t vl);
vint64m4_t __riscv_vneg_v_i64m4_tum(vbool16_t vm, vint64m4_t vd, vint64m4_t vs,
                                    size_t vl);
vint64m8_t __riscv_vneg_v_i64m8_tum(vbool8_t vm, vint64m8_t vd, vint64m8_t vs,
                                    size_t vl);
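// Usage sketch (not part of the generated listing): in the _tum variants the vm
// operand predicates the operation, and both masked-off lanes and tail lanes
// are left undisturbed, i.e. they keep the values already in vd. The predicate
// and function names below are hypothetical.

#include <riscv_vector.h>
#include <stdint.h>
#include <stddef.h>

// acc[i] += src[i] only where src[i] >= 0; masked-off lanes and lanes >= vl
// keep the values already in 'acc'.
vint32m1_t add_nonnegative(vint32m1_t acc, const int32_t *src, size_t vl) {
  vint32m1_t v = __riscv_vle32_v_i32m1(src, vl);
  vbool32_t vm = __riscv_vmsge_vx_i32m1_b32(v, 0, vl);  // lanes with src[i] >= 0
  return __riscv_vadd_vv_i32m1_tum(vm, acc, acc, v, vl);
}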
vuint8mf8_t __riscv_vadd_vv_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                      vuint8mf8_t vs2, vuint8mf8_t vs1,
                                      size_t vl);
vuint8mf8_t __riscv_vadd_vx_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                      vuint8mf8_t vs2, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vadd_vv_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                      vuint8mf4_t vs2, vuint8mf4_t vs1,
                                      size_t vl);
vuint8mf4_t __riscv_vadd_vx_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                      vuint8mf4_t vs2, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vadd_vv_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                      vuint8mf2_t vs2, vuint8mf2_t vs1,
                                      size_t vl);
vuint8mf2_t __riscv_vadd_vx_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                      vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vadd_vv_u8m1_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                    vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vadd_vx_u8m1_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vadd_vv_u8m2_tum(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                    vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vadd_vx_u8m2_tum(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vadd_vv_u8m4_tum(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                    vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vadd_vx_u8m4_tum(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vadd_vv_u8m8_tum(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                    vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vadd_vx_u8m8_tum(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                    uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vadd_vv_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                        vuint16mf4_t vs2, vuint16mf4_t vs1,
                                        size_t vl);
vuint16mf4_t __riscv_vadd_vx_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                        vuint16mf4_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16mf2_t __riscv_vadd_vv_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                        vuint16mf2_t vs2, vuint16mf2_t vs1,
                                        size_t vl);
vuint16mf2_t __riscv_vadd_vx_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                        vuint16mf2_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16m1_t __riscv_vadd_vv_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                      vuint16m1_t vs2, vuint16m1_t vs1,
                                      size_t vl);
vuint16m1_t __riscv_vadd_vx_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                      vuint16m1_t vs2, uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vadd_vv_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                      vuint16m2_t vs2, vuint16m2_t vs1,
                                      size_t vl);
vuint16m2_t __riscv_vadd_vx_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                      vuint16m2_t vs2, uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vadd_vv_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                      vuint16m4_t vs2, vuint16m4_t vs1,
                                      size_t vl);
vuint16m4_t __riscv_vadd_vx_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                      vuint16m4_t vs2, uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vadd_vv_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                      vuint16m8_t vs2, vuint16m8_t vs1,
                                      size_t vl);
vuint16m8_t __riscv_vadd_vx_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                      vuint16m8_t vs2, uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vadd_vv_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                        vuint32mf2_t vs2, vuint32mf2_t vs1,
                                        size_t vl);
vuint32mf2_t __riscv_vadd_vx_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                        vuint32mf2_t vs2, uint32_t rs1,
                                        size_t vl);
vuint32m1_t __riscv_vadd_vv_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                      vuint32m1_t vs2, vuint32m1_t vs1,
                                      size_t vl);
vuint32m1_t __riscv_vadd_vx_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                      vuint32m1_t vs2, uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vadd_vv_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                      vuint32m2_t vs2, vuint32m2_t vs1,
                                      size_t vl);
vuint32m2_t __riscv_vadd_vx_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                      vuint32m2_t vs2, uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vadd_vv_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                      vuint32m4_t vs2, vuint32m4_t vs1,
                                      size_t vl);
vuint32m4_t __riscv_vadd_vx_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                      vuint32m4_t vs2, uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vadd_vv_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                      vuint32m8_t vs2, vuint32m8_t vs1,
                                      size_t vl);
vuint32m8_t __riscv_vadd_vx_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                      vuint32m8_t vs2, uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vadd_vv_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                      vuint64m1_t vs2, vuint64m1_t vs1,
                                      size_t vl);
vuint64m1_t __riscv_vadd_vx_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                      vuint64m1_t vs2, uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vadd_vv_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                      vuint64m2_t vs2, vuint64m2_t vs1,
                                      size_t vl);
vuint64m2_t __riscv_vadd_vx_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                      vuint64m2_t vs2, uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vadd_vv_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                      vuint64m4_t vs2, vuint64m4_t vs1,
                                      size_t vl);
vuint64m4_t __riscv_vadd_vx_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                      vuint64m4_t vs2, uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vadd_vv_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                      vuint64m8_t vs2, vuint64m8_t vs1,
                                      size_t vl);
vuint64m8_t __riscv_vadd_vx_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                      vuint64m8_t vs2, uint64_t rs1, size_t vl);
vuint8mf8_t __riscv_vsub_vv_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                      vuint8mf8_t vs2, vuint8mf8_t vs1,
                                      size_t vl);
vuint8mf8_t __riscv_vsub_vx_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                      vuint8mf8_t vs2, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vsub_vv_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                      vuint8mf4_t vs2, vuint8mf4_t vs1,
                                      size_t vl);
vuint8mf4_t __riscv_vsub_vx_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                      vuint8mf4_t vs2, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vsub_vv_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                      vuint8mf2_t vs2, vuint8mf2_t vs1,
                                      size_t vl);
vuint8mf2_t __riscv_vsub_vx_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                      vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vsub_vv_u8m1_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                    vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vsub_vx_u8m1_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vsub_vv_u8m2_tum(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                    vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vsub_vx_u8m2_tum(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vsub_vv_u8m4_tum(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                    vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vsub_vx_u8m4_tum(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vsub_vv_u8m8_tum(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                    vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vsub_vx_u8m8_tum(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                    uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vsub_vv_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                        vuint16mf4_t vs2, vuint16mf4_t vs1,
                                        size_t vl);
vuint16mf4_t __riscv_vsub_vx_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                        vuint16mf4_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16mf2_t __riscv_vsub_vv_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                        vuint16mf2_t vs2, vuint16mf2_t vs1,
                                        size_t vl);
vuint16mf2_t __riscv_vsub_vx_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                        vuint16mf2_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16m1_t __riscv_vsub_vv_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                      vuint16m1_t vs2, vuint16m1_t vs1,
                                      size_t vl);
vuint16m1_t __riscv_vsub_vx_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                      vuint16m1_t vs2, uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vsub_vv_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                      vuint16m2_t vs2, vuint16m2_t vs1,
                                      size_t vl);
vuint16m2_t __riscv_vsub_vx_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                      vuint16m2_t vs2, uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vsub_vv_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                      vuint16m4_t vs2, vuint16m4_t vs1,
                                      size_t vl);
vuint16m4_t __riscv_vsub_vx_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                      vuint16m4_t vs2, uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vsub_vv_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                      vuint16m8_t vs2, vuint16m8_t vs1,
                                      size_t vl);
vuint16m8_t __riscv_vsub_vx_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                      vuint16m8_t vs2, uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vsub_vv_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                        vuint32mf2_t vs2, vuint32mf2_t vs1,
                                        size_t vl);
vuint32mf2_t __riscv_vsub_vx_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                        vuint32mf2_t vs2, uint32_t rs1,
                                        size_t vl);
vuint32m1_t __riscv_vsub_vv_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                      vuint32m1_t vs2, vuint32m1_t vs1,
                                      size_t vl);
vuint32m1_t __riscv_vsub_vx_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                      vuint32m1_t vs2, uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vsub_vv_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                      vuint32m2_t vs2, vuint32m2_t vs1,
                                      size_t vl);
vuint32m2_t __riscv_vsub_vx_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                      vuint32m2_t vs2, uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vsub_vv_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                      vuint32m4_t vs2, vuint32m4_t vs1,
                                      size_t vl);
vuint32m4_t __riscv_vsub_vx_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                      vuint32m4_t vs2, uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vsub_vv_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                      vuint32m8_t vs2, vuint32m8_t vs1,
                                      size_t vl);
vuint32m8_t __riscv_vsub_vx_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                      vuint32m8_t vs2, uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vsub_vv_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                      vuint64m1_t vs2, vuint64m1_t vs1,
                                      size_t vl);
vuint64m1_t __riscv_vsub_vx_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                      vuint64m1_t vs2, uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vsub_vv_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                      vuint64m2_t vs2, vuint64m2_t vs1,
                                      size_t vl);
vuint64m2_t __riscv_vsub_vx_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                      vuint64m2_t vs2, uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vsub_vv_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                      vuint64m4_t vs2, vuint64m4_t vs1,
                                      size_t vl);
vuint64m4_t __riscv_vsub_vx_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                      vuint64m4_t vs2, uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vsub_vv_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                      vuint64m8_t vs2, vuint64m8_t vs1,
                                      size_t vl);
vuint64m8_t __riscv_vsub_vx_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                      vuint64m8_t vs2, uint64_t rs1, size_t vl);
vuint8mf8_t __riscv_vrsub_vx_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                       vuint8mf8_t vs2, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vrsub_vx_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                       vuint8mf4_t vs2, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vrsub_vx_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                       vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vrsub_vx_u8m1_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vrsub_vx_u8m2_tum(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vrsub_vx_u8m4_tum(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vrsub_vx_u8m8_tum(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                     uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vrsub_vx_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs2, uint16_t rs1,
                                         size_t vl);
vuint16mf2_t __riscv_vrsub_vx_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs2, uint16_t rs1,
                                         size_t vl);
vuint16m1_t __riscv_vrsub_vx_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m2_t __riscv_vrsub_vx_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m4_t __riscv_vrsub_vx_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m8_t __riscv_vrsub_vx_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs2, uint16_t rs1,
                                       size_t vl);
vuint32mf2_t __riscv_vrsub_vx_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs2, uint32_t rs1,
                                         size_t vl);
vuint32m1_t __riscv_vrsub_vx_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m2_t __riscv_vrsub_vx_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m4_t __riscv_vrsub_vx_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m8_t __riscv_vrsub_vx_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs2, uint32_t rs1,
                                       size_t vl);
vuint64m1_t __riscv_vrsub_vx_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m2_t __riscv_vrsub_vx_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m4_t __riscv_vrsub_vx_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m8_t __riscv_vrsub_vx_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs2, uint64_t rs1,
                                       size_t vl);
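A minimal usage sketch for the tail-undisturbed, masked (_tum) variants listed above. It assumes the standard configuration, load/store, and compare intrinsics from <riscv_vector.h> (__riscv_vsetvl_e32m1, __riscv_vle32_v_u32m1, __riscv_vmsltu_vx_u32m1_b32, and the masked store __riscv_vse32_v_u32m1_m), which are specified elsewhere in this document; the function name and buffers are illustrative only.

#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

// Adds `bias` to every element of `src` that is below `limit` and writes only
// those elements to `dst`; all other elements of `dst` stay untouched in
// memory because the store is masked.
void add_bias_below_limit(uint32_t *dst, const uint32_t *src, uint32_t limit,
                          uint32_t bias, size_t n) {
  for (size_t i = 0; i < n;) {
    size_t vl = __riscv_vsetvl_e32m1(n - i);
    vuint32m1_t vs2 = __riscv_vle32_v_u32m1(src + i, vl);
    vbool32_t vm = __riscv_vmsltu_vx_u32m1_b32(vs2, limit, vl);
    // _tum: the vd operand (here vs2) supplies the values kept in the tail
    // (element indices >= vl); masked-off body elements follow the
    // mask-agnostic policy, so the store below is masked as well.
    vuint32m1_t vr = __riscv_vadd_vx_u32m1_tum(vm, vs2, vs2, bias, vl);
    __riscv_vse32_v_u32m1_m(vm, dst + i, vr, vl);
    i += vl;
  }
}
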
// masked functions (tail undisturbed, mask undisturbed: _tumu suffix)
vint8mf8_t __riscv_vadd_vv_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                      vint8mf8_t vs2, vint8mf8_t vs1,
                                      size_t vl);
vint8mf8_t __riscv_vadd_vx_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                      vint8mf8_t vs2, int8_t rs1, size_t vl);
vint8mf4_t __riscv_vadd_vv_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                      vint8mf4_t vs2, vint8mf4_t vs1,
                                      size_t vl);
vint8mf4_t __riscv_vadd_vx_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                      vint8mf4_t vs2, int8_t rs1, size_t vl);
vint8mf2_t __riscv_vadd_vv_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                      vint8mf2_t vs2, vint8mf2_t vs1,
                                      size_t vl);
vint8mf2_t __riscv_vadd_vx_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                      vint8mf2_t vs2, int8_t rs1, size_t vl);
vint8m1_t __riscv_vadd_vv_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                    vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vadd_vx_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                    int8_t rs1, size_t vl);
vint8m2_t __riscv_vadd_vv_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                    vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vadd_vx_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                    int8_t rs1, size_t vl);
vint8m4_t __riscv_vadd_vv_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                    vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vadd_vx_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                    int8_t rs1, size_t vl);
vint8m8_t __riscv_vadd_vv_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                    vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vadd_vx_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                    int8_t rs1, size_t vl);
vint16mf4_t __riscv_vadd_vv_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs2, vint16mf4_t vs1,
                                        size_t vl);
vint16mf4_t __riscv_vadd_vx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs2, int16_t rs1,
                                        size_t vl);
vint16mf2_t __riscv_vadd_vv_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs2, vint16mf2_t vs1,
                                        size_t vl);
vint16mf2_t __riscv_vadd_vx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs2, int16_t rs1,
                                        size_t vl);
vint16m1_t __riscv_vadd_vv_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs2, vint16m1_t vs1,
                                      size_t vl);
vint16m1_t __riscv_vadd_vx_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs2, int16_t rs1, size_t vl);
vint16m2_t __riscv_vadd_vv_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs2, vint16m2_t vs1,
                                      size_t vl);
vint16m2_t __riscv_vadd_vx_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs2, int16_t rs1, size_t vl);
vint16m4_t __riscv_vadd_vv_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs2, vint16m4_t vs1,
                                      size_t vl);
vint16m4_t __riscv_vadd_vx_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs2, int16_t rs1, size_t vl);
vint16m8_t __riscv_vadd_vv_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs2, vint16m8_t vs1,
                                      size_t vl);
vint16m8_t __riscv_vadd_vx_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs2, int16_t rs1, size_t vl);
vint32mf2_t __riscv_vadd_vv_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs2, vint32mf2_t vs1,
                                        size_t vl);
vint32mf2_t __riscv_vadd_vx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs2, int32_t rs1,
                                        size_t vl);
vint32m1_t __riscv_vadd_vv_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs2, vint32m1_t vs1,
                                      size_t vl);
vint32m1_t __riscv_vadd_vx_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs2, int32_t rs1, size_t vl);
vint32m2_t __riscv_vadd_vv_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs2, vint32m2_t vs1,
                                      size_t vl);
vint32m2_t __riscv_vadd_vx_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs2, int32_t rs1, size_t vl);
vint32m4_t __riscv_vadd_vv_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs2, vint32m4_t vs1,
                                      size_t vl);
vint32m4_t __riscv_vadd_vx_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs2, int32_t rs1, size_t vl);
vint32m8_t __riscv_vadd_vv_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs2, vint32m8_t vs1,
                                      size_t vl);
vint32m8_t __riscv_vadd_vx_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs2, int32_t rs1, size_t vl);
vint64m1_t __riscv_vadd_vv_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs2, vint64m1_t vs1,
                                      size_t vl);
vint64m1_t __riscv_vadd_vx_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs2, int64_t rs1, size_t vl);
vint64m2_t __riscv_vadd_vv_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs2, vint64m2_t vs1,
                                      size_t vl);
vint64m2_t __riscv_vadd_vx_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs2, int64_t rs1, size_t vl);
vint64m4_t __riscv_vadd_vv_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs2, vint64m4_t vs1,
                                      size_t vl);
vint64m4_t __riscv_vadd_vx_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs2, int64_t rs1, size_t vl);
vint64m8_t __riscv_vadd_vv_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs2, vint64m8_t vs1,
                                      size_t vl);
vint64m8_t __riscv_vadd_vx_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs2, int64_t rs1, size_t vl);
vint8mf8_t __riscv_vsub_vv_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                      vint8mf8_t vs2, vint8mf8_t vs1,
                                      size_t vl);
vint8mf8_t __riscv_vsub_vx_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                      vint8mf8_t vs2, int8_t rs1, size_t vl);
vint8mf4_t __riscv_vsub_vv_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                      vint8mf4_t vs2, vint8mf4_t vs1,
                                      size_t vl);
vint8mf4_t __riscv_vsub_vx_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                      vint8mf4_t vs2, int8_t rs1, size_t vl);
vint8mf2_t __riscv_vsub_vv_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                      vint8mf2_t vs2, vint8mf2_t vs1,
                                      size_t vl);
vint8mf2_t __riscv_vsub_vx_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                      vint8mf2_t vs2, int8_t rs1, size_t vl);
vint8m1_t __riscv_vsub_vv_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                    vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vsub_vx_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                    int8_t rs1, size_t vl);
vint8m2_t __riscv_vsub_vv_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                    vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vsub_vx_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                    int8_t rs1, size_t vl);
vint8m4_t __riscv_vsub_vv_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                    vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vsub_vx_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                    int8_t rs1, size_t vl);
vint8m8_t __riscv_vsub_vv_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                    vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vsub_vx_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                    int8_t rs1, size_t vl);
vint16mf4_t __riscv_vsub_vv_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs2, vint16mf4_t vs1,
                                        size_t vl);
vint16mf4_t __riscv_vsub_vx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs2, int16_t rs1,
                                        size_t vl);
vint16mf2_t __riscv_vsub_vv_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs2, vint16mf2_t vs1,
                                        size_t vl);
vint16mf2_t __riscv_vsub_vx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs2, int16_t rs1,
                                        size_t vl);
vint16m1_t __riscv_vsub_vv_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs2, vint16m1_t vs1,
                                      size_t vl);
vint16m1_t __riscv_vsub_vx_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs2, int16_t rs1, size_t vl);
vint16m2_t __riscv_vsub_vv_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs2, vint16m2_t vs1,
                                      size_t vl);
vint16m2_t __riscv_vsub_vx_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs2, int16_t rs1, size_t vl);
vint16m4_t __riscv_vsub_vv_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs2, vint16m4_t vs1,
                                      size_t vl);
vint16m4_t __riscv_vsub_vx_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs2, int16_t rs1, size_t vl);
vint16m8_t __riscv_vsub_vv_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs2, vint16m8_t vs1,
                                      size_t vl);
vint16m8_t __riscv_vsub_vx_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs2, int16_t rs1, size_t vl);
vint32mf2_t __riscv_vsub_vv_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs2, vint32mf2_t vs1,
                                        size_t vl);
vint32mf2_t __riscv_vsub_vx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs2, int32_t rs1,
                                        size_t vl);
vint32m1_t __riscv_vsub_vv_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs2, vint32m1_t vs1,
                                      size_t vl);
vint32m1_t __riscv_vsub_vx_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs2, int32_t rs1, size_t vl);
vint32m2_t __riscv_vsub_vv_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs2, vint32m2_t vs1,
                                      size_t vl);
vint32m2_t __riscv_vsub_vx_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs2, int32_t rs1, size_t vl);
vint32m4_t __riscv_vsub_vv_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs2, vint32m4_t vs1,
                                      size_t vl);
vint32m4_t __riscv_vsub_vx_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs2, int32_t rs1, size_t vl);
vint32m8_t __riscv_vsub_vv_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs2, vint32m8_t vs1,
                                      size_t vl);
vint32m8_t __riscv_vsub_vx_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs2, int32_t rs1, size_t vl);
vint64m1_t __riscv_vsub_vv_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs2, vint64m1_t vs1,
                                      size_t vl);
vint64m1_t __riscv_vsub_vx_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs2, int64_t rs1, size_t vl);
vint64m2_t __riscv_vsub_vv_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs2, vint64m2_t vs1,
                                      size_t vl);
vint64m2_t __riscv_vsub_vx_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs2, int64_t rs1, size_t vl);
vint64m4_t __riscv_vsub_vv_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs2, vint64m4_t vs1,
                                      size_t vl);
vint64m4_t __riscv_vsub_vx_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs2, int64_t rs1, size_t vl);
vint64m8_t __riscv_vsub_vv_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs2, vint64m8_t vs1,
                                      size_t vl);
vint64m8_t __riscv_vsub_vx_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs2, int64_t rs1, size_t vl);
vint8mf8_t __riscv_vrsub_vx_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                       vint8mf8_t vs2, int8_t rs1, size_t vl);
vint8mf4_t __riscv_vrsub_vx_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                       vint8mf4_t vs2, int8_t rs1, size_t vl);
vint8mf2_t __riscv_vrsub_vx_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                       vint8mf2_t vs2, int8_t rs1, size_t vl);
vint8m1_t __riscv_vrsub_vx_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                     int8_t rs1, size_t vl);
vint8m2_t __riscv_vrsub_vx_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                     int8_t rs1, size_t vl);
vint8m4_t __riscv_vrsub_vx_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                     int8_t rs1, size_t vl);
vint8m8_t __riscv_vrsub_vx_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                     int8_t rs1, size_t vl);
vint16mf4_t __riscv_vrsub_vx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                         vint16mf4_t vs2, int16_t rs1,
                                         size_t vl);
vint16mf2_t __riscv_vrsub_vx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                         vint16mf2_t vs2, int16_t rs1,
                                         size_t vl);
vint16m1_t __riscv_vrsub_vx_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                       vint16m1_t vs2, int16_t rs1, size_t vl);
vint16m2_t __riscv_vrsub_vx_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                       vint16m2_t vs2, int16_t rs1, size_t vl);
vint16m4_t __riscv_vrsub_vx_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                       vint16m4_t vs2, int16_t rs1, size_t vl);
vint16m8_t __riscv_vrsub_vx_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                       vint16m8_t vs2, int16_t rs1, size_t vl);
vint32mf2_t __riscv_vrsub_vx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                         vint32mf2_t vs2, int32_t rs1,
                                         size_t vl);
vint32m1_t __riscv_vrsub_vx_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                       vint32m1_t vs2, int32_t rs1, size_t vl);
vint32m2_t __riscv_vrsub_vx_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                       vint32m2_t vs2, int32_t rs1, size_t vl);
vint32m4_t __riscv_vrsub_vx_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                       vint32m4_t vs2, int32_t rs1, size_t vl);
vint32m8_t __riscv_vrsub_vx_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                       vint32m8_t vs2, int32_t rs1, size_t vl);
vint64m1_t __riscv_vrsub_vx_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                       vint64m1_t vs2, int64_t rs1, size_t vl);
vint64m2_t __riscv_vrsub_vx_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                       vint64m2_t vs2, int64_t rs1, size_t vl);
vint64m4_t __riscv_vrsub_vx_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                       vint64m4_t vs2, int64_t rs1, size_t vl);
vint64m8_t __riscv_vrsub_vx_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                       vint64m8_t vs2, int64_t rs1, size_t vl);
vint8mf8_t __riscv_vneg_v_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs,
                                     size_t vl);
vint8mf4_t __riscv_vneg_v_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs,
                                     size_t vl);
vint8mf2_t __riscv_vneg_v_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs,
                                     size_t vl);
vint8m1_t __riscv_vneg_v_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs,
                                   size_t vl);
vint8m2_t __riscv_vneg_v_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs,
                                   size_t vl);
vint8m4_t __riscv_vneg_v_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs,
                                   size_t vl);
vint8m8_t __riscv_vneg_v_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs,
                                   size_t vl);
vint16mf4_t __riscv_vneg_v_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs, size_t vl);
vint16mf2_t __riscv_vneg_v_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs, size_t vl);
vint16m1_t __riscv_vneg_v_i16m1_tumu(vbool16_t vm, vint16m1_t vd, vint16m1_t vs,
                                     size_t vl);
vint16m2_t __riscv_vneg_v_i16m2_tumu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs,
                                     size_t vl);
vint16m4_t __riscv_vneg_v_i16m4_tumu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs,
                                     size_t vl);
vint16m8_t __riscv_vneg_v_i16m8_tumu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs,
                                     size_t vl);
vint32mf2_t __riscv_vneg_v_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs, size_t vl);
vint32m1_t __riscv_vneg_v_i32m1_tumu(vbool32_t vm, vint32m1_t vd, vint32m1_t vs,
                                     size_t vl);
vint32m2_t __riscv_vneg_v_i32m2_tumu(vbool16_t vm, vint32m2_t vd, vint32m2_t vs,
                                     size_t vl);
vint32m4_t __riscv_vneg_v_i32m4_tumu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs,
                                     size_t vl);
vint32m8_t __riscv_vneg_v_i32m8_tumu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs,
                                     size_t vl);
vint64m1_t __riscv_vneg_v_i64m1_tumu(vbool64_t vm, vint64m1_t vd, vint64m1_t vs,
                                     size_t vl);
vint64m2_t __riscv_vneg_v_i64m2_tumu(vbool32_t vm, vint64m2_t vd, vint64m2_t vs,
                                     size_t vl);
vint64m4_t __riscv_vneg_v_i64m4_tumu(vbool16_t vm, vint64m4_t vd, vint64m4_t vs,
                                     size_t vl);
vint64m8_t __riscv_vneg_v_i64m8_tumu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs,
                                     size_t vl);
vuint8mf8_t __riscv_vadd_vv_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                       vuint8mf8_t vs2, vuint8mf8_t vs1,
                                       size_t vl);
vuint8mf8_t __riscv_vadd_vx_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                       vuint8mf8_t vs2, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vadd_vv_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                       vuint8mf4_t vs2, vuint8mf4_t vs1,
                                       size_t vl);
vuint8mf4_t __riscv_vadd_vx_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                       vuint8mf4_t vs2, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vadd_vv_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                       vuint8mf2_t vs2, vuint8mf2_t vs1,
                                       size_t vl);
vuint8mf2_t __riscv_vadd_vx_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                       vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vadd_vv_u8m1_tumu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                     vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vadd_vx_u8m1_tumu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vadd_vv_u8m2_tumu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                     vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vadd_vx_u8m2_tumu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vadd_vv_u8m4_tumu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                     vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vadd_vx_u8m4_tumu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vadd_vv_u8m8_tumu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                     vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vadd_vx_u8m8_tumu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                     uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vadd_vv_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs2, vuint16mf4_t vs1,
                                         size_t vl);
vuint16mf4_t __riscv_vadd_vx_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs2, uint16_t rs1,
                                         size_t vl);
vuint16mf2_t __riscv_vadd_vv_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs2, vuint16mf2_t vs1,
                                         size_t vl);
vuint16mf2_t __riscv_vadd_vx_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs2, uint16_t rs1,
                                         size_t vl);
vuint16m1_t __riscv_vadd_vv_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs2, vuint16m1_t vs1,
                                       size_t vl);
vuint16m1_t __riscv_vadd_vx_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m2_t __riscv_vadd_vv_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs2, vuint16m2_t vs1,
                                       size_t vl);
vuint16m2_t __riscv_vadd_vx_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m4_t __riscv_vadd_vv_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs2, vuint16m4_t vs1,
                                       size_t vl);
vuint16m4_t __riscv_vadd_vx_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m8_t __riscv_vadd_vv_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs2, vuint16m8_t vs1,
                                       size_t vl);
vuint16m8_t __riscv_vadd_vx_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs2, uint16_t rs1,
                                       size_t vl);
vuint32mf2_t __riscv_vadd_vv_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs2, vuint32mf2_t vs1,
                                         size_t vl);
vuint32mf2_t __riscv_vadd_vx_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs2, uint32_t rs1,
                                         size_t vl);
vuint32m1_t __riscv_vadd_vv_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs2, vuint32m1_t vs1,
                                       size_t vl);
vuint32m1_t __riscv_vadd_vx_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m2_t __riscv_vadd_vv_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs2, vuint32m2_t vs1,
                                       size_t vl);
vuint32m2_t __riscv_vadd_vx_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m4_t __riscv_vadd_vv_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs2, vuint32m4_t vs1,
                                       size_t vl);
vuint32m4_t __riscv_vadd_vx_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m8_t __riscv_vadd_vv_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs2, vuint32m8_t vs1,
                                       size_t vl);
vuint32m8_t __riscv_vadd_vx_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs2, uint32_t rs1,
                                       size_t vl);
vuint64m1_t __riscv_vadd_vv_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs2, vuint64m1_t vs1,
                                       size_t vl);
vuint64m1_t __riscv_vadd_vx_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m2_t __riscv_vadd_vv_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs2, vuint64m2_t vs1,
                                       size_t vl);
vuint64m2_t __riscv_vadd_vx_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m4_t __riscv_vadd_vv_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs2, vuint64m4_t vs1,
                                       size_t vl);
vuint64m4_t __riscv_vadd_vx_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m8_t __riscv_vadd_vv_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs2, vuint64m8_t vs1,
                                       size_t vl);
vuint64m8_t __riscv_vadd_vx_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs2, uint64_t rs1,
                                       size_t vl);
vuint8mf8_t __riscv_vsub_vv_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                       vuint8mf8_t vs2, vuint8mf8_t vs1,
                                       size_t vl);
vuint8mf8_t __riscv_vsub_vx_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                       vuint8mf8_t vs2, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vsub_vv_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                       vuint8mf4_t vs2, vuint8mf4_t vs1,
                                       size_t vl);
vuint8mf4_t __riscv_vsub_vx_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                       vuint8mf4_t vs2, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vsub_vv_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                       vuint8mf2_t vs2, vuint8mf2_t vs1,
                                       size_t vl);
vuint8mf2_t __riscv_vsub_vx_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                       vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vsub_vv_u8m1_tumu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                     vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vsub_vx_u8m1_tumu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vsub_vv_u8m2_tumu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                     vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vsub_vx_u8m2_tumu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vsub_vv_u8m4_tumu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                     vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vsub_vx_u8m4_tumu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vsub_vv_u8m8_tumu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                     vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vsub_vx_u8m8_tumu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                     uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vsub_vv_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs2, vuint16mf4_t vs1,
                                         size_t vl);
vuint16mf4_t __riscv_vsub_vx_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs2, uint16_t rs1,
                                         size_t vl);
vuint16mf2_t __riscv_vsub_vv_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs2, vuint16mf2_t vs1,
                                         size_t vl);
vuint16mf2_t __riscv_vsub_vx_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs2, uint16_t rs1,
                                         size_t vl);
vuint16m1_t __riscv_vsub_vv_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs2, vuint16m1_t vs1,
                                       size_t vl);
vuint16m1_t __riscv_vsub_vx_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m2_t __riscv_vsub_vv_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs2, vuint16m2_t vs1,
                                       size_t vl);
vuint16m2_t __riscv_vsub_vx_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m4_t __riscv_vsub_vv_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs2, vuint16m4_t vs1,
                                       size_t vl);
vuint16m4_t __riscv_vsub_vx_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m8_t __riscv_vsub_vv_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs2, vuint16m8_t vs1,
                                       size_t vl);
vuint16m8_t __riscv_vsub_vx_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs2, uint16_t rs1,
                                       size_t vl);
vuint32mf2_t __riscv_vsub_vv_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs2, vuint32mf2_t vs1,
                                         size_t vl);
vuint32mf2_t __riscv_vsub_vx_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs2, uint32_t rs1,
                                         size_t vl);
vuint32m1_t __riscv_vsub_vv_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs2, vuint32m1_t vs1,
                                       size_t vl);
vuint32m1_t __riscv_vsub_vx_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m2_t __riscv_vsub_vv_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs2, vuint32m2_t vs1,
                                       size_t vl);
vuint32m2_t __riscv_vsub_vx_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m4_t __riscv_vsub_vv_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs2, vuint32m4_t vs1,
                                       size_t vl);
vuint32m4_t __riscv_vsub_vx_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m8_t __riscv_vsub_vv_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs2, vuint32m8_t vs1,
                                       size_t vl);
vuint32m8_t __riscv_vsub_vx_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs2, uint32_t rs1,
                                       size_t vl);
vuint64m1_t __riscv_vsub_vv_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs2, vuint64m1_t vs1,
                                       size_t vl);
vuint64m1_t __riscv_vsub_vx_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m2_t __riscv_vsub_vv_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs2, vuint64m2_t vs1,
                                       size_t vl);
vuint64m2_t __riscv_vsub_vx_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m4_t __riscv_vsub_vv_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs2, vuint64m4_t vs1,
                                       size_t vl);
vuint64m4_t __riscv_vsub_vx_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m8_t __riscv_vsub_vv_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs2, vuint64m8_t vs1,
                                       size_t vl);
vuint64m8_t __riscv_vsub_vx_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs2, uint64_t rs1,
                                       size_t vl);
vuint8mf8_t __riscv_vrsub_vx_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                        vuint8mf8_t vs2, uint8_t rs1,
                                        size_t vl);
vuint8mf4_t __riscv_vrsub_vx_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                        vuint8mf4_t vs2, uint8_t rs1,
                                        size_t vl);
vuint8mf2_t __riscv_vrsub_vx_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                        vuint8mf2_t vs2, uint8_t rs1,
                                        size_t vl);
vuint8m1_t __riscv_vrsub_vx_u8m1_tumu(vbool8_t vm, vuint8m1_t vd,
                                      vuint8m1_t vs2, uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vrsub_vx_u8m2_tumu(vbool4_t vm, vuint8m2_t vd,
                                      vuint8m2_t vs2, uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vrsub_vx_u8m4_tumu(vbool2_t vm, vuint8m4_t vd,
                                      vuint8m4_t vs2, uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vrsub_vx_u8m8_tumu(vbool1_t vm, vuint8m8_t vd,
                                      vuint8m8_t vs2, uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vrsub_vx_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                          vuint16mf4_t vs2, uint16_t rs1,
                                          size_t vl);
vuint16mf2_t __riscv_vrsub_vx_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                          vuint16mf2_t vs2, uint16_t rs1,
                                          size_t vl);
vuint16m1_t __riscv_vrsub_vx_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                        vuint16m1_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16m2_t __riscv_vrsub_vx_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                        vuint16m2_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16m4_t __riscv_vrsub_vx_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                        vuint16m4_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16m8_t __riscv_vrsub_vx_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                        vuint16m8_t vs2, uint16_t rs1,
                                        size_t vl);
vuint32mf2_t __riscv_vrsub_vx_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                          vuint32mf2_t vs2, uint32_t rs1,
                                          size_t vl);
vuint32m1_t __riscv_vrsub_vx_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                        vuint32m1_t vs2, uint32_t rs1,
                                        size_t vl);
vuint32m2_t __riscv_vrsub_vx_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                        vuint32m2_t vs2, uint32_t rs1,
                                        size_t vl);
vuint32m4_t __riscv_vrsub_vx_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                        vuint32m4_t vs2, uint32_t rs1,
                                        size_t vl);
vuint32m8_t __riscv_vrsub_vx_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                        vuint32m8_t vs2, uint32_t rs1,
                                        size_t vl);
vuint64m1_t __riscv_vrsub_vx_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                        vuint64m1_t vs2, uint64_t rs1,
                                        size_t vl);
vuint64m2_t __riscv_vrsub_vx_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                        vuint64m2_t vs2, uint64_t rs1,
                                        size_t vl);
vuint64m4_t __riscv_vrsub_vx_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                        vuint64m4_t vs2, uint64_t rs1,
                                        size_t vl);
vuint64m8_t __riscv_vrsub_vx_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                        vuint64m8_t vs2, uint64_t rs1,
                                        size_t vl);
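The tail-undisturbed, mask-undisturbed (_tumu) variants above keep both tail elements and masked-off elements from vd, which makes them a natural fit for in-place conditional updates. A brief sketch under the same assumptions as the earlier example (standard __riscv_vsetvl_e32m1, __riscv_vle32_v_i32m1, __riscv_vmslt_vx_i32m1_b32, and __riscv_vse32_v_i32m1 intrinsics; the function name is illustrative):

#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

// Adds `offset` to every negative element of `v` in place; non-negative
// elements pass through unchanged because _tumu keeps masked-off elements
// of vd, and elements past vl are never stored.
void add_offset_to_negatives(int32_t *v, int32_t offset, size_t n) {
  for (size_t i = 0; i < n;) {
    size_t vl = __riscv_vsetvl_e32m1(n - i);
    vint32m1_t vd = __riscv_vle32_v_i32m1(v + i, vl);
    vbool32_t vm = __riscv_vmslt_vx_i32m1_b32(vd, 0, vl);
    // _tumu: inactive (masked-off) and tail elements of the result keep the
    // values already in vd, so the unmasked store writes them back verbatim.
    vd = __riscv_vadd_vx_i32m1_tumu(vm, vd, vd, offset, vl);
    __riscv_vse32_v_i32m1(v + i, vd, vl);
    i += vl;
  }
}
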
// masked functions (mask undisturbed: _mu suffix)
vint8mf8_t __riscv_vadd_vv_i8mf8_mu(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs2,
                                    vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vadd_vx_i8mf8_mu(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs2,
                                    int8_t rs1, size_t vl);
vint8mf4_t __riscv_vadd_vv_i8mf4_mu(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs2,
                                    vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vadd_vx_i8mf4_mu(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs2,
                                    int8_t rs1, size_t vl);
vint8mf2_t __riscv_vadd_vv_i8mf2_mu(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs2,
                                    vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vadd_vx_i8mf2_mu(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs2,
                                    int8_t rs1, size_t vl);
vint8m1_t __riscv_vadd_vv_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                  vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vadd_vx_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                  int8_t rs1, size_t vl);
vint8m2_t __riscv_vadd_vv_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                  vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vadd_vx_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                  int8_t rs1, size_t vl);
vint8m4_t __riscv_vadd_vv_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                  vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vadd_vx_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                  int8_t rs1, size_t vl);
vint8m8_t __riscv_vadd_vv_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                  vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vadd_vx_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                  int8_t rs1, size_t vl);
vint16mf4_t __riscv_vadd_vv_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                      vint16mf4_t vs2, vint16mf4_t vs1,
                                      size_t vl);
vint16mf4_t __riscv_vadd_vx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                      vint16mf4_t vs2, int16_t rs1, size_t vl);
vint16mf2_t __riscv_vadd_vv_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                      vint16mf2_t vs2, vint16mf2_t vs1,
                                      size_t vl);
vint16mf2_t __riscv_vadd_vx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                      vint16mf2_t vs2, int16_t rs1, size_t vl);
vint16m1_t __riscv_vadd_vv_i16m1_mu(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                                    vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vadd_vx_i16m1_mu(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                                    int16_t rs1, size_t vl);
vint16m2_t __riscv_vadd_vv_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                    vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vadd_vx_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                    int16_t rs1, size_t vl);
vint16m4_t __riscv_vadd_vv_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                    vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vadd_vx_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                    int16_t rs1, size_t vl);
vint16m8_t __riscv_vadd_vv_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                    vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vadd_vx_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                    int16_t rs1, size_t vl);
vint32mf2_t __riscv_vadd_vv_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                      vint32mf2_t vs2, vint32mf2_t vs1,
                                      size_t vl);
vint32mf2_t __riscv_vadd_vx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                      vint32mf2_t vs2, int32_t rs1, size_t vl);
vint32m1_t __riscv_vadd_vv_i32m1_mu(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                                    vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vadd_vx_i32m1_mu(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                                    int32_t rs1, size_t vl);
vint32m2_t __riscv_vadd_vv_i32m2_mu(vbool16_t vm, vint32m2_t vd, vint32m2_t vs2,
                                    vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vadd_vx_i32m2_mu(vbool16_t vm, vint32m2_t vd, vint32m2_t vs2,
                                    int32_t rs1, size_t vl);
vint32m4_t __riscv_vadd_vv_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                    vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vadd_vx_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                    int32_t rs1, size_t vl);
vint32m8_t __riscv_vadd_vv_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                    vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vadd_vx_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                    int32_t rs1, size_t vl);
vint64m1_t __riscv_vadd_vv_i64m1_mu(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                                    vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vadd_vx_i64m1_mu(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                                    int64_t rs1, size_t vl);
vint64m2_t __riscv_vadd_vv_i64m2_mu(vbool32_t vm, vint64m2_t vd, vint64m2_t vs2,
                                    vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vadd_vx_i64m2_mu(vbool32_t vm, vint64m2_t vd, vint64m2_t vs2,
                                    int64_t rs1, size_t vl);
vint64m4_t __riscv_vadd_vv_i64m4_mu(vbool16_t vm, vint64m4_t vd, vint64m4_t vs2,
                                    vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vadd_vx_i64m4_mu(vbool16_t vm, vint64m4_t vd, vint64m4_t vs2,
                                    int64_t rs1, size_t vl);
vint64m8_t __riscv_vadd_vv_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                    vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vadd_vx_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                    int64_t rs1, size_t vl);
vint8mf8_t __riscv_vsub_vv_i8mf8_mu(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs2,
                                    vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vsub_vx_i8mf8_mu(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs2,
                                    int8_t rs1, size_t vl);
vint8mf4_t __riscv_vsub_vv_i8mf4_mu(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs2,
                                    vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vsub_vx_i8mf4_mu(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs2,
                                    int8_t rs1, size_t vl);
vint8mf2_t __riscv_vsub_vv_i8mf2_mu(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs2,
                                    vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vsub_vx_i8mf2_mu(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs2,
                                    int8_t rs1, size_t vl);
vint8m1_t __riscv_vsub_vv_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                  vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vsub_vx_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                  int8_t rs1, size_t vl);
vint8m2_t __riscv_vsub_vv_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                  vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vsub_vx_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                  int8_t rs1, size_t vl);
vint8m4_t __riscv_vsub_vv_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                  vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vsub_vx_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                  int8_t rs1, size_t vl);
vint8m8_t __riscv_vsub_vv_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                  vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vsub_vx_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                  int8_t rs1, size_t vl);
vint16mf4_t __riscv_vsub_vv_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                      vint16mf4_t vs2, vint16mf4_t vs1,
                                      size_t vl);
vint16mf4_t __riscv_vsub_vx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                      vint16mf4_t vs2, int16_t rs1, size_t vl);
vint16mf2_t __riscv_vsub_vv_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                      vint16mf2_t vs2, vint16mf2_t vs1,
                                      size_t vl);
vint16mf2_t __riscv_vsub_vx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                      vint16mf2_t vs2, int16_t rs1, size_t vl);
vint16m1_t __riscv_vsub_vv_i16m1_mu(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                                    vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vsub_vx_i16m1_mu(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                                    int16_t rs1, size_t vl);
vint16m2_t __riscv_vsub_vv_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                    vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vsub_vx_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                    int16_t rs1, size_t vl);
vint16m4_t __riscv_vsub_vv_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                    vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vsub_vx_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                    int16_t rs1, size_t vl);
vint16m8_t __riscv_vsub_vv_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                    vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vsub_vx_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                    int16_t rs1, size_t vl);
vint32mf2_t __riscv_vsub_vv_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                      vint32mf2_t vs2, vint32mf2_t vs1,
                                      size_t vl);
vint32mf2_t __riscv_vsub_vx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                      vint32mf2_t vs2, int32_t rs1, size_t vl);
vint32m1_t __riscv_vsub_vv_i32m1_mu(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                                    vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vsub_vx_i32m1_mu(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                                    int32_t rs1, size_t vl);
vint32m2_t __riscv_vsub_vv_i32m2_mu(vbool16_t vm, vint32m2_t vd, vint32m2_t vs2,
                                    vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vsub_vx_i32m2_mu(vbool16_t vm, vint32m2_t vd, vint32m2_t vs2,
                                    int32_t rs1, size_t vl);
vint32m4_t __riscv_vsub_vv_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                    vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vsub_vx_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                    int32_t rs1, size_t vl);
vint32m8_t __riscv_vsub_vv_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                    vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vsub_vx_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                    int32_t rs1, size_t vl);
vint64m1_t __riscv_vsub_vv_i64m1_mu(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                                    vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vsub_vx_i64m1_mu(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                                    int64_t rs1, size_t vl);
vint64m2_t __riscv_vsub_vv_i64m2_mu(vbool32_t vm, vint64m2_t vd, vint64m2_t vs2,
                                    vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vsub_vx_i64m2_mu(vbool32_t vm, vint64m2_t vd, vint64m2_t vs2,
                                    int64_t rs1, size_t vl);
vint64m4_t __riscv_vsub_vv_i64m4_mu(vbool16_t vm, vint64m4_t vd, vint64m4_t vs2,
                                    vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vsub_vx_i64m4_mu(vbool16_t vm, vint64m4_t vd, vint64m4_t vs2,
                                    int64_t rs1, size_t vl);
vint64m8_t __riscv_vsub_vv_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                    vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vsub_vx_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                    int64_t rs1, size_t vl);
vint8mf8_t __riscv_vrsub_vx_i8mf8_mu(vbool64_t vm, vint8mf8_t vd,
                                     vint8mf8_t vs2, int8_t rs1, size_t vl);
vint8mf4_t __riscv_vrsub_vx_i8mf4_mu(vbool32_t vm, vint8mf4_t vd,
                                     vint8mf4_t vs2, int8_t rs1, size_t vl);
vint8mf2_t __riscv_vrsub_vx_i8mf2_mu(vbool16_t vm, vint8mf2_t vd,
                                     vint8mf2_t vs2, int8_t rs1, size_t vl);
vint8m1_t __riscv_vrsub_vx_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                   int8_t rs1, size_t vl);
vint8m2_t __riscv_vrsub_vx_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                   int8_t rs1, size_t vl);
vint8m4_t __riscv_vrsub_vx_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                   int8_t rs1, size_t vl);
vint8m8_t __riscv_vrsub_vx_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                   int8_t rs1, size_t vl);
vint16mf4_t __riscv_vrsub_vx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs2, int16_t rs1, size_t vl);
vint16mf2_t __riscv_vrsub_vx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs2, int16_t rs1, size_t vl);
vint16m1_t __riscv_vrsub_vx_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs2, int16_t rs1, size_t vl);
vint16m2_t __riscv_vrsub_vx_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                     int16_t rs1, size_t vl);
vint16m4_t __riscv_vrsub_vx_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                     int16_t rs1, size_t vl);
vint16m8_t __riscv_vrsub_vx_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                     int16_t rs1, size_t vl);
vint32mf2_t __riscv_vrsub_vx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs2, int32_t rs1, size_t vl);
vint32m1_t __riscv_vrsub_vx_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs2, int32_t rs1, size_t vl);
vint32m2_t __riscv_vrsub_vx_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs2, int32_t rs1, size_t vl);
vint32m4_t __riscv_vrsub_vx_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                     int32_t rs1, size_t vl);
vint32m8_t __riscv_vrsub_vx_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                     int32_t rs1, size_t vl);
vint64m1_t __riscv_vrsub_vx_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs2, int64_t rs1, size_t vl);
vint64m2_t __riscv_vrsub_vx_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs2, int64_t rs1, size_t vl);
vint64m4_t __riscv_vrsub_vx_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs2, int64_t rs1, size_t vl);
vint64m8_t __riscv_vrsub_vx_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                     int64_t rs1, size_t vl);
vint8mf8_t __riscv_vneg_v_i8mf8_mu(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs,
                                   size_t vl);
vint8mf4_t __riscv_vneg_v_i8mf4_mu(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs,
                                   size_t vl);
vint8mf2_t __riscv_vneg_v_i8mf2_mu(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs,
                                   size_t vl);
vint8m1_t __riscv_vneg_v_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs,
                                 size_t vl);
vint8m2_t __riscv_vneg_v_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs,
                                 size_t vl);
vint8m4_t __riscv_vneg_v_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs,
                                 size_t vl);
vint8m8_t __riscv_vneg_v_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs,
                                 size_t vl);
vint16mf4_t __riscv_vneg_v_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                     vint16mf4_t vs, size_t vl);
vint16mf2_t __riscv_vneg_v_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                     vint16mf2_t vs, size_t vl);
vint16m1_t __riscv_vneg_v_i16m1_mu(vbool16_t vm, vint16m1_t vd, vint16m1_t vs,
                                   size_t vl);
vint16m2_t __riscv_vneg_v_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs,
                                   size_t vl);
vint16m4_t __riscv_vneg_v_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs,
                                   size_t vl);
vint16m8_t __riscv_vneg_v_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs,
                                   size_t vl);
vint32mf2_t __riscv_vneg_v_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                     vint32mf2_t vs, size_t vl);
vint32m1_t __riscv_vneg_v_i32m1_mu(vbool32_t vm, vint32m1_t vd, vint32m1_t vs,
                                   size_t vl);
vint32m2_t __riscv_vneg_v_i32m2_mu(vbool16_t vm, vint32m2_t vd, vint32m2_t vs,
                                   size_t vl);
vint32m4_t __riscv_vneg_v_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs,
                                   size_t vl);
vint32m8_t __riscv_vneg_v_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs,
                                   size_t vl);
vint64m1_t __riscv_vneg_v_i64m1_mu(vbool64_t vm, vint64m1_t vd, vint64m1_t vs,
                                   size_t vl);
vint64m2_t __riscv_vneg_v_i64m2_mu(vbool32_t vm, vint64m2_t vd, vint64m2_t vs,
                                   size_t vl);
vint64m4_t __riscv_vneg_v_i64m4_mu(vbool16_t vm, vint64m4_t vd, vint64m4_t vs,
                                   size_t vl);
vint64m8_t __riscv_vneg_v_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs,
                                   size_t vl);
vuint8mf8_t __riscv_vadd_vv_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                     vuint8mf8_t vs2, vuint8mf8_t vs1,
                                     size_t vl);
vuint8mf8_t __riscv_vadd_vx_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                     vuint8mf8_t vs2, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vadd_vv_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                     vuint8mf4_t vs2, vuint8mf4_t vs1,
                                     size_t vl);
vuint8mf4_t __riscv_vadd_vx_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                     vuint8mf4_t vs2, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vadd_vv_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                     vuint8mf2_t vs2, vuint8mf2_t vs1,
                                     size_t vl);
vuint8mf2_t __riscv_vadd_vx_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                     vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vadd_vv_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                   vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vadd_vx_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                   uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vadd_vv_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                   vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vadd_vx_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                   uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vadd_vv_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                   vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vadd_vx_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                   uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vadd_vv_u8m8_mu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                   vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vadd_vx_u8m8_mu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                   uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vadd_vv_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                       vuint16mf4_t vs2, vuint16mf4_t vs1,
                                       size_t vl);
vuint16mf4_t __riscv_vadd_vx_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                       vuint16mf4_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16mf2_t __riscv_vadd_vv_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                       vuint16mf2_t vs2, vuint16mf2_t vs1,
                                       size_t vl);
vuint16mf2_t __riscv_vadd_vx_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                       vuint16mf2_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m1_t __riscv_vadd_vv_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                     vuint16m1_t vs2, vuint16m1_t vs1,
                                     size_t vl);
vuint16m1_t __riscv_vadd_vx_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                     vuint16m1_t vs2, uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vadd_vv_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                     vuint16m2_t vs2, vuint16m2_t vs1,
                                     size_t vl);
vuint16m2_t __riscv_vadd_vx_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                     vuint16m2_t vs2, uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vadd_vv_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                     vuint16m4_t vs2, vuint16m4_t vs1,
                                     size_t vl);
vuint16m4_t __riscv_vadd_vx_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                     vuint16m4_t vs2, uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vadd_vv_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                     vuint16m8_t vs2, vuint16m8_t vs1,
                                     size_t vl);
vuint16m8_t __riscv_vadd_vx_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                     vuint16m8_t vs2, uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vadd_vv_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                       vuint32mf2_t vs2, vuint32mf2_t vs1,
                                       size_t vl);
vuint32mf2_t __riscv_vadd_vx_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                       vuint32mf2_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m1_t __riscv_vadd_vv_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                     vuint32m1_t vs2, vuint32m1_t vs1,
                                     size_t vl);
vuint32m1_t __riscv_vadd_vx_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                     vuint32m1_t vs2, uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vadd_vv_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                     vuint32m2_t vs2, vuint32m2_t vs1,
                                     size_t vl);
vuint32m2_t __riscv_vadd_vx_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                     vuint32m2_t vs2, uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vadd_vv_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                     vuint32m4_t vs2, vuint32m4_t vs1,
                                     size_t vl);
vuint32m4_t __riscv_vadd_vx_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                     vuint32m4_t vs2, uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vadd_vv_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                     vuint32m8_t vs2, vuint32m8_t vs1,
                                     size_t vl);
vuint32m8_t __riscv_vadd_vx_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                     vuint32m8_t vs2, uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vadd_vv_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                     vuint64m1_t vs2, vuint64m1_t vs1,
                                     size_t vl);
vuint64m1_t __riscv_vadd_vx_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                     vuint64m1_t vs2, uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vadd_vv_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                     vuint64m2_t vs2, vuint64m2_t vs1,
                                     size_t vl);
vuint64m2_t __riscv_vadd_vx_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                     vuint64m2_t vs2, uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vadd_vv_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                     vuint64m4_t vs2, vuint64m4_t vs1,
                                     size_t vl);
vuint64m4_t __riscv_vadd_vx_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                     vuint64m4_t vs2, uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vadd_vv_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                     vuint64m8_t vs2, vuint64m8_t vs1,
                                     size_t vl);
vuint64m8_t __riscv_vadd_vx_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                     vuint64m8_t vs2, uint64_t rs1, size_t vl);
vuint8mf8_t __riscv_vsub_vv_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                     vuint8mf8_t vs2, vuint8mf8_t vs1,
                                     size_t vl);
vuint8mf8_t __riscv_vsub_vx_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                     vuint8mf8_t vs2, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vsub_vv_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                     vuint8mf4_t vs2, vuint8mf4_t vs1,
                                     size_t vl);
vuint8mf4_t __riscv_vsub_vx_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                     vuint8mf4_t vs2, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vsub_vv_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                     vuint8mf2_t vs2, vuint8mf2_t vs1,
                                     size_t vl);
vuint8mf2_t __riscv_vsub_vx_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                     vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vsub_vv_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                   vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vsub_vx_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                   uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vsub_vv_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                   vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vsub_vx_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                   uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vsub_vv_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                   vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vsub_vx_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                   uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vsub_vv_u8m8_mu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                   vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vsub_vx_u8m8_mu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                   uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vsub_vv_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                       vuint16mf4_t vs2, vuint16mf4_t vs1,
                                       size_t vl);
vuint16mf4_t __riscv_vsub_vx_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                       vuint16mf4_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16mf2_t __riscv_vsub_vv_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                       vuint16mf2_t vs2, vuint16mf2_t vs1,
                                       size_t vl);
vuint16mf2_t __riscv_vsub_vx_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                       vuint16mf2_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m1_t __riscv_vsub_vv_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                     vuint16m1_t vs2, vuint16m1_t vs1,
                                     size_t vl);
vuint16m1_t __riscv_vsub_vx_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                     vuint16m1_t vs2, uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vsub_vv_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                     vuint16m2_t vs2, vuint16m2_t vs1,
                                     size_t vl);
vuint16m2_t __riscv_vsub_vx_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                     vuint16m2_t vs2, uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vsub_vv_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                     vuint16m4_t vs2, vuint16m4_t vs1,
                                     size_t vl);
vuint16m4_t __riscv_vsub_vx_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                     vuint16m4_t vs2, uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vsub_vv_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                     vuint16m8_t vs2, vuint16m8_t vs1,
                                     size_t vl);
vuint16m8_t __riscv_vsub_vx_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                     vuint16m8_t vs2, uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vsub_vv_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                       vuint32mf2_t vs2, vuint32mf2_t vs1,
                                       size_t vl);
vuint32mf2_t __riscv_vsub_vx_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                       vuint32mf2_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m1_t __riscv_vsub_vv_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                     vuint32m1_t vs2, vuint32m1_t vs1,
                                     size_t vl);
vuint32m1_t __riscv_vsub_vx_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                     vuint32m1_t vs2, uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vsub_vv_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                     vuint32m2_t vs2, vuint32m2_t vs1,
                                     size_t vl);
vuint32m2_t __riscv_vsub_vx_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                     vuint32m2_t vs2, uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vsub_vv_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                     vuint32m4_t vs2, vuint32m4_t vs1,
                                     size_t vl);
vuint32m4_t __riscv_vsub_vx_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                     vuint32m4_t vs2, uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vsub_vv_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                     vuint32m8_t vs2, vuint32m8_t vs1,
                                     size_t vl);
vuint32m8_t __riscv_vsub_vx_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                     vuint32m8_t vs2, uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vsub_vv_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                     vuint64m1_t vs2, vuint64m1_t vs1,
                                     size_t vl);
vuint64m1_t __riscv_vsub_vx_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                     vuint64m1_t vs2, uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vsub_vv_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                     vuint64m2_t vs2, vuint64m2_t vs1,
                                     size_t vl);
vuint64m2_t __riscv_vsub_vx_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                     vuint64m2_t vs2, uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vsub_vv_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                     vuint64m4_t vs2, vuint64m4_t vs1,
                                     size_t vl);
vuint64m4_t __riscv_vsub_vx_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                     vuint64m4_t vs2, uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vsub_vv_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                     vuint64m8_t vs2, vuint64m8_t vs1,
                                     size_t vl);
vuint64m8_t __riscv_vsub_vx_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                     vuint64m8_t vs2, uint64_t rs1, size_t vl);
vuint8mf8_t __riscv_vrsub_vx_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                      vuint8mf8_t vs2, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vrsub_vx_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                      vuint8mf4_t vs2, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vrsub_vx_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                      vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vrsub_vx_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vrsub_vx_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vrsub_vx_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vrsub_vx_u8m8_mu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                    uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vrsub_vx_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                        vuint16mf4_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16mf2_t __riscv_vrsub_vx_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                        vuint16mf2_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16m1_t __riscv_vrsub_vx_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                      vuint16m1_t vs2, uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vrsub_vx_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                      vuint16m2_t vs2, uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vrsub_vx_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                      vuint16m4_t vs2, uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vrsub_vx_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                      vuint16m8_t vs2, uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vrsub_vx_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                        vuint32mf2_t vs2, uint32_t rs1,
                                        size_t vl);
vuint32m1_t __riscv_vrsub_vx_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                      vuint32m1_t vs2, uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vrsub_vx_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                      vuint32m2_t vs2, uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vrsub_vx_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                      vuint32m4_t vs2, uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vrsub_vx_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                      vuint32m8_t vs2, uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vrsub_vx_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                      vuint64m1_t vs2, uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vrsub_vx_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                      vuint64m2_t vs2, uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vrsub_vx_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                      vuint64m4_t vs2, uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vrsub_vx_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                      vuint64m8_t vs2, uint64_t rs1, size_t vl);

Vector Widening Integer Add/Subtract Intrinsics
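
The widening forms produce a result whose element width is twice that of the
narrower source: the .vv/.vx forms take two narrow operands, while the .wv/.wx
forms take an already-widened vs2 and a narrow vs1/rs1. The sketch below is
illustrative only (the function and buffer names are assumptions, not part of
this reference) and assumes the V extension with <riscv_vector.h>; it uses the
tail-undisturbed __riscv_vwadd_vv_i16m2_tu to sum two int8_t arrays into an
int16_t destination so the additions cannot overflow the narrow element type:

#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

/* Illustrative only: dst[i] = (int16_t)a[i] + (int16_t)b[i] for i < n.
 * The _tu form keeps elements of the destination operand past vl
 * undisturbed; since only vl elements are stored back here, the tail
 * policy has no visible effect in this particular sketch. */
void widening_add_i8_to_i16(int16_t *dst, const int8_t *a, const int8_t *b,
                            size_t n) {
  for (size_t i = 0; i < n;) {
    size_t vl = __riscv_vsetvl_e8m1(n - i);
    vint8m1_t va = __riscv_vle8_v_i8m1(a + i, vl);
    vint8m1_t vb = __riscv_vle8_v_i8m1(b + i, vl);
    vint16m2_t acc = __riscv_vle16_v_i16m2(dst + i, vl);
    /* Elements 0..vl-1 become sext(va) + sext(vb); tail elements of acc
     * are left undisturbed by the _tu policy. */
    acc = __riscv_vwadd_vv_i16m2_tu(acc, va, vb, vl);
    __riscv_vse16_v_i16m2(dst + i, acc, vl);
    i += vl;
  }
}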

vint16mf4_t __riscv_vwadd_vv_i16mf4_tu(vint16mf4_t vd, vint8mf8_t vs2,
                                       vint8mf8_t vs1, size_t vl);
vint16mf4_t __riscv_vwadd_vx_i16mf4_tu(vint16mf4_t vd, vint8mf8_t vs2,
                                       int8_t rs1, size_t vl);
vint16mf4_t __riscv_vwadd_wv_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                       vint8mf8_t vs1, size_t vl);
vint16mf4_t __riscv_vwadd_wx_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                       int8_t rs1, size_t vl);
vint16mf2_t __riscv_vwadd_vv_i16mf2_tu(vint16mf2_t vd, vint8mf4_t vs2,
                                       vint8mf4_t vs1, size_t vl);
vint16mf2_t __riscv_vwadd_vx_i16mf2_tu(vint16mf2_t vd, vint8mf4_t vs2,
                                       int8_t rs1, size_t vl);
vint16mf2_t __riscv_vwadd_wv_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                       vint8mf4_t vs1, size_t vl);
vint16mf2_t __riscv_vwadd_wx_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                       int8_t rs1, size_t vl);
vint16m1_t __riscv_vwadd_vv_i16m1_tu(vint16m1_t vd, vint8mf2_t vs2,
                                     vint8mf2_t vs1, size_t vl);
vint16m1_t __riscv_vwadd_vx_i16m1_tu(vint16m1_t vd, vint8mf2_t vs2, int8_t rs1,
                                     size_t vl);
vint16m1_t __riscv_vwadd_wv_i16m1_tu(vint16m1_t vd, vint16m1_t vs2,
                                     vint8mf2_t vs1, size_t vl);
vint16m1_t __riscv_vwadd_wx_i16m1_tu(vint16m1_t vd, vint16m1_t vs2, int8_t rs1,
                                     size_t vl);
vint16m2_t __riscv_vwadd_vv_i16m2_tu(vint16m2_t vd, vint8m1_t vs2,
                                     vint8m1_t vs1, size_t vl);
vint16m2_t __riscv_vwadd_vx_i16m2_tu(vint16m2_t vd, vint8m1_t vs2, int8_t rs1,
                                     size_t vl);
vint16m2_t __riscv_vwadd_wv_i16m2_tu(vint16m2_t vd, vint16m2_t vs2,
                                     vint8m1_t vs1, size_t vl);
vint16m2_t __riscv_vwadd_wx_i16m2_tu(vint16m2_t vd, vint16m2_t vs2, int8_t rs1,
                                     size_t vl);
vint16m4_t __riscv_vwadd_vv_i16m4_tu(vint16m4_t vd, vint8m2_t vs2,
                                     vint8m2_t vs1, size_t vl);
vint16m4_t __riscv_vwadd_vx_i16m4_tu(vint16m4_t vd, vint8m2_t vs2, int8_t rs1,
                                     size_t vl);
vint16m4_t __riscv_vwadd_wv_i16m4_tu(vint16m4_t vd, vint16m4_t vs2,
                                     vint8m2_t vs1, size_t vl);
vint16m4_t __riscv_vwadd_wx_i16m4_tu(vint16m4_t vd, vint16m4_t vs2, int8_t rs1,
                                     size_t vl);
vint16m8_t __riscv_vwadd_vv_i16m8_tu(vint16m8_t vd, vint8m4_t vs2,
                                     vint8m4_t vs1, size_t vl);
vint16m8_t __riscv_vwadd_vx_i16m8_tu(vint16m8_t vd, vint8m4_t vs2, int8_t rs1,
                                     size_t vl);
vint16m8_t __riscv_vwadd_wv_i16m8_tu(vint16m8_t vd, vint16m8_t vs2,
                                     vint8m4_t vs1, size_t vl);
vint16m8_t __riscv_vwadd_wx_i16m8_tu(vint16m8_t vd, vint16m8_t vs2, int8_t rs1,
                                     size_t vl);
vint32mf2_t __riscv_vwadd_vv_i32mf2_tu(vint32mf2_t vd, vint16mf4_t vs2,
                                       vint16mf4_t vs1, size_t vl);
vint32mf2_t __riscv_vwadd_vx_i32mf2_tu(vint32mf2_t vd, vint16mf4_t vs2,
                                       int16_t rs1, size_t vl);
vint32mf2_t __riscv_vwadd_wv_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                       vint16mf4_t vs1, size_t vl);
vint32mf2_t __riscv_vwadd_wx_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                       int16_t rs1, size_t vl);
vint32m1_t __riscv_vwadd_vv_i32m1_tu(vint32m1_t vd, vint16mf2_t vs2,
                                     vint16mf2_t vs1, size_t vl);
vint32m1_t __riscv_vwadd_vx_i32m1_tu(vint32m1_t vd, vint16mf2_t vs2,
                                     int16_t rs1, size_t vl);
vint32m1_t __riscv_vwadd_wv_i32m1_tu(vint32m1_t vd, vint32m1_t vs2,
                                     vint16mf2_t vs1, size_t vl);
vint32m1_t __riscv_vwadd_wx_i32m1_tu(vint32m1_t vd, vint32m1_t vs2, int16_t rs1,
                                     size_t vl);
vint32m2_t __riscv_vwadd_vv_i32m2_tu(vint32m2_t vd, vint16m1_t vs2,
                                     vint16m1_t vs1, size_t vl);
vint32m2_t __riscv_vwadd_vx_i32m2_tu(vint32m2_t vd, vint16m1_t vs2, int16_t rs1,
                                     size_t vl);
vint32m2_t __riscv_vwadd_wv_i32m2_tu(vint32m2_t vd, vint32m2_t vs2,
                                     vint16m1_t vs1, size_t vl);
vint32m2_t __riscv_vwadd_wx_i32m2_tu(vint32m2_t vd, vint32m2_t vs2, int16_t rs1,
                                     size_t vl);
vint32m4_t __riscv_vwadd_vv_i32m4_tu(vint32m4_t vd, vint16m2_t vs2,
                                     vint16m2_t vs1, size_t vl);
vint32m4_t __riscv_vwadd_vx_i32m4_tu(vint32m4_t vd, vint16m2_t vs2, int16_t rs1,
                                     size_t vl);
vint32m4_t __riscv_vwadd_wv_i32m4_tu(vint32m4_t vd, vint32m4_t vs2,
                                     vint16m2_t vs1, size_t vl);
vint32m4_t __riscv_vwadd_wx_i32m4_tu(vint32m4_t vd, vint32m4_t vs2, int16_t rs1,
                                     size_t vl);
vint32m8_t __riscv_vwadd_vv_i32m8_tu(vint32m8_t vd, vint16m4_t vs2,
                                     vint16m4_t vs1, size_t vl);
vint32m8_t __riscv_vwadd_vx_i32m8_tu(vint32m8_t vd, vint16m4_t vs2, int16_t rs1,
                                     size_t vl);
vint32m8_t __riscv_vwadd_wv_i32m8_tu(vint32m8_t vd, vint32m8_t vs2,
                                     vint16m4_t vs1, size_t vl);
vint32m8_t __riscv_vwadd_wx_i32m8_tu(vint32m8_t vd, vint32m8_t vs2, int16_t rs1,
                                     size_t vl);
vint64m1_t __riscv_vwadd_vv_i64m1_tu(vint64m1_t vd, vint32mf2_t vs2,
                                     vint32mf2_t vs1, size_t vl);
vint64m1_t __riscv_vwadd_vx_i64m1_tu(vint64m1_t vd, vint32mf2_t vs2,
                                     int32_t rs1, size_t vl);
vint64m1_t __riscv_vwadd_wv_i64m1_tu(vint64m1_t vd, vint64m1_t vs2,
                                     vint32mf2_t vs1, size_t vl);
vint64m1_t __riscv_vwadd_wx_i64m1_tu(vint64m1_t vd, vint64m1_t vs2, int32_t rs1,
                                     size_t vl);
vint64m2_t __riscv_vwadd_vv_i64m2_tu(vint64m2_t vd, vint32m1_t vs2,
                                     vint32m1_t vs1, size_t vl);
vint64m2_t __riscv_vwadd_vx_i64m2_tu(vint64m2_t vd, vint32m1_t vs2, int32_t rs1,
                                     size_t vl);
vint64m2_t __riscv_vwadd_wv_i64m2_tu(vint64m2_t vd, vint64m2_t vs2,
                                     vint32m1_t vs1, size_t vl);
vint64m2_t __riscv_vwadd_wx_i64m2_tu(vint64m2_t vd, vint64m2_t vs2, int32_t rs1,
                                     size_t vl);
vint64m4_t __riscv_vwadd_vv_i64m4_tu(vint64m4_t vd, vint32m2_t vs2,
                                     vint32m2_t vs1, size_t vl);
vint64m4_t __riscv_vwadd_vx_i64m4_tu(vint64m4_t vd, vint32m2_t vs2, int32_t rs1,
                                     size_t vl);
vint64m4_t __riscv_vwadd_wv_i64m4_tu(vint64m4_t vd, vint64m4_t vs2,
                                     vint32m2_t vs1, size_t vl);
vint64m4_t __riscv_vwadd_wx_i64m4_tu(vint64m4_t vd, vint64m4_t vs2, int32_t rs1,
                                     size_t vl);
vint64m8_t __riscv_vwadd_vv_i64m8_tu(vint64m8_t vd, vint32m4_t vs2,
                                     vint32m4_t vs1, size_t vl);
vint64m8_t __riscv_vwadd_vx_i64m8_tu(vint64m8_t vd, vint32m4_t vs2, int32_t rs1,
                                     size_t vl);
vint64m8_t __riscv_vwadd_wv_i64m8_tu(vint64m8_t vd, vint64m8_t vs2,
                                     vint32m4_t vs1, size_t vl);
vint64m8_t __riscv_vwadd_wx_i64m8_tu(vint64m8_t vd, vint64m8_t vs2, int32_t rs1,
                                     size_t vl);
vint16mf4_t __riscv_vwsub_vv_i16mf4_tu(vint16mf4_t vd, vint8mf8_t vs2,
                                       vint8mf8_t vs1, size_t vl);
vint16mf4_t __riscv_vwsub_vx_i16mf4_tu(vint16mf4_t vd, vint8mf8_t vs2,
                                       int8_t rs1, size_t vl);
vint16mf4_t __riscv_vwsub_wv_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                       vint8mf8_t vs1, size_t vl);
vint16mf4_t __riscv_vwsub_wx_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                       int8_t rs1, size_t vl);
vint16mf2_t __riscv_vwsub_vv_i16mf2_tu(vint16mf2_t vd, vint8mf4_t vs2,
                                       vint8mf4_t vs1, size_t vl);
vint16mf2_t __riscv_vwsub_vx_i16mf2_tu(vint16mf2_t vd, vint8mf4_t vs2,
                                       int8_t rs1, size_t vl);
vint16mf2_t __riscv_vwsub_wv_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                       vint8mf4_t vs1, size_t vl);
vint16mf2_t __riscv_vwsub_wx_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                       int8_t rs1, size_t vl);
vint16m1_t __riscv_vwsub_vv_i16m1_tu(vint16m1_t vd, vint8mf2_t vs2,
                                     vint8mf2_t vs1, size_t vl);
vint16m1_t __riscv_vwsub_vx_i16m1_tu(vint16m1_t vd, vint8mf2_t vs2, int8_t rs1,
                                     size_t vl);
vint16m1_t __riscv_vwsub_wv_i16m1_tu(vint16m1_t vd, vint16m1_t vs2,
                                     vint8mf2_t vs1, size_t vl);
vint16m1_t __riscv_vwsub_wx_i16m1_tu(vint16m1_t vd, vint16m1_t vs2, int8_t rs1,
                                     size_t vl);
vint16m2_t __riscv_vwsub_vv_i16m2_tu(vint16m2_t vd, vint8m1_t vs2,
                                     vint8m1_t vs1, size_t vl);
vint16m2_t __riscv_vwsub_vx_i16m2_tu(vint16m2_t vd, vint8m1_t vs2, int8_t rs1,
                                     size_t vl);
vint16m2_t __riscv_vwsub_wv_i16m2_tu(vint16m2_t vd, vint16m2_t vs2,
                                     vint8m1_t vs1, size_t vl);
vint16m2_t __riscv_vwsub_wx_i16m2_tu(vint16m2_t vd, vint16m2_t vs2, int8_t rs1,
                                     size_t vl);
vint16m4_t __riscv_vwsub_vv_i16m4_tu(vint16m4_t vd, vint8m2_t vs2,
                                     vint8m2_t vs1, size_t vl);
vint16m4_t __riscv_vwsub_vx_i16m4_tu(vint16m4_t vd, vint8m2_t vs2, int8_t rs1,
                                     size_t vl);
vint16m4_t __riscv_vwsub_wv_i16m4_tu(vint16m4_t vd, vint16m4_t vs2,
                                     vint8m2_t vs1, size_t vl);
vint16m4_t __riscv_vwsub_wx_i16m4_tu(vint16m4_t vd, vint16m4_t vs2, int8_t rs1,
                                     size_t vl);
vint16m8_t __riscv_vwsub_vv_i16m8_tu(vint16m8_t vd, vint8m4_t vs2,
                                     vint8m4_t vs1, size_t vl);
vint16m8_t __riscv_vwsub_vx_i16m8_tu(vint16m8_t vd, vint8m4_t vs2, int8_t rs1,
                                     size_t vl);
vint16m8_t __riscv_vwsub_wv_i16m8_tu(vint16m8_t vd, vint16m8_t vs2,
                                     vint8m4_t vs1, size_t vl);
vint16m8_t __riscv_vwsub_wx_i16m8_tu(vint16m8_t vd, vint16m8_t vs2, int8_t rs1,
                                     size_t vl);
vint32mf2_t __riscv_vwsub_vv_i32mf2_tu(vint32mf2_t vd, vint16mf4_t vs2,
                                       vint16mf4_t vs1, size_t vl);
vint32mf2_t __riscv_vwsub_vx_i32mf2_tu(vint32mf2_t vd, vint16mf4_t vs2,
                                       int16_t rs1, size_t vl);
vint32mf2_t __riscv_vwsub_wv_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                       vint16mf4_t vs1, size_t vl);
vint32mf2_t __riscv_vwsub_wx_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                       int16_t rs1, size_t vl);
vint32m1_t __riscv_vwsub_vv_i32m1_tu(vint32m1_t vd, vint16mf2_t vs2,
                                     vint16mf2_t vs1, size_t vl);
vint32m1_t __riscv_vwsub_vx_i32m1_tu(vint32m1_t vd, vint16mf2_t vs2,
                                     int16_t rs1, size_t vl);
vint32m1_t __riscv_vwsub_wv_i32m1_tu(vint32m1_t vd, vint32m1_t vs2,
                                     vint16mf2_t vs1, size_t vl);
vint32m1_t __riscv_vwsub_wx_i32m1_tu(vint32m1_t vd, vint32m1_t vs2, int16_t rs1,
                                     size_t vl);
vint32m2_t __riscv_vwsub_vv_i32m2_tu(vint32m2_t vd, vint16m1_t vs2,
                                     vint16m1_t vs1, size_t vl);
vint32m2_t __riscv_vwsub_vx_i32m2_tu(vint32m2_t vd, vint16m1_t vs2, int16_t rs1,
                                     size_t vl);
vint32m2_t __riscv_vwsub_wv_i32m2_tu(vint32m2_t vd, vint32m2_t vs2,
                                     vint16m1_t vs1, size_t vl);
vint32m2_t __riscv_vwsub_wx_i32m2_tu(vint32m2_t vd, vint32m2_t vs2, int16_t rs1,
                                     size_t vl);
vint32m4_t __riscv_vwsub_vv_i32m4_tu(vint32m4_t vd, vint16m2_t vs2,
                                     vint16m2_t vs1, size_t vl);
vint32m4_t __riscv_vwsub_vx_i32m4_tu(vint32m4_t vd, vint16m2_t vs2, int16_t rs1,
                                     size_t vl);
vint32m4_t __riscv_vwsub_wv_i32m4_tu(vint32m4_t vd, vint32m4_t vs2,
                                     vint16m2_t vs1, size_t vl);
vint32m4_t __riscv_vwsub_wx_i32m4_tu(vint32m4_t vd, vint32m4_t vs2, int16_t rs1,
                                     size_t vl);
vint32m8_t __riscv_vwsub_vv_i32m8_tu(vint32m8_t vd, vint16m4_t vs2,
                                     vint16m4_t vs1, size_t vl);
vint32m8_t __riscv_vwsub_vx_i32m8_tu(vint32m8_t vd, vint16m4_t vs2, int16_t rs1,
                                     size_t vl);
vint32m8_t __riscv_vwsub_wv_i32m8_tu(vint32m8_t vd, vint32m8_t vs2,
                                     vint16m4_t vs1, size_t vl);
vint32m8_t __riscv_vwsub_wx_i32m8_tu(vint32m8_t vd, vint32m8_t vs2, int16_t rs1,
                                     size_t vl);
vint64m1_t __riscv_vwsub_vv_i64m1_tu(vint64m1_t vd, vint32mf2_t vs2,
                                     vint32mf2_t vs1, size_t vl);
vint64m1_t __riscv_vwsub_vx_i64m1_tu(vint64m1_t vd, vint32mf2_t vs2,
                                     int32_t rs1, size_t vl);
vint64m1_t __riscv_vwsub_wv_i64m1_tu(vint64m1_t vd, vint64m1_t vs2,
                                     vint32mf2_t vs1, size_t vl);
vint64m1_t __riscv_vwsub_wx_i64m1_tu(vint64m1_t vd, vint64m1_t vs2, int32_t rs1,
                                     size_t vl);
vint64m2_t __riscv_vwsub_vv_i64m2_tu(vint64m2_t vd, vint32m1_t vs2,
                                     vint32m1_t vs1, size_t vl);
vint64m2_t __riscv_vwsub_vx_i64m2_tu(vint64m2_t vd, vint32m1_t vs2, int32_t rs1,
                                     size_t vl);
vint64m2_t __riscv_vwsub_wv_i64m2_tu(vint64m2_t vd, vint64m2_t vs2,
                                     vint32m1_t vs1, size_t vl);
vint64m2_t __riscv_vwsub_wx_i64m2_tu(vint64m2_t vd, vint64m2_t vs2, int32_t rs1,
                                     size_t vl);
vint64m4_t __riscv_vwsub_vv_i64m4_tu(vint64m4_t vd, vint32m2_t vs2,
                                     vint32m2_t vs1, size_t vl);
vint64m4_t __riscv_vwsub_vx_i64m4_tu(vint64m4_t vd, vint32m2_t vs2, int32_t rs1,
                                     size_t vl);
vint64m4_t __riscv_vwsub_wv_i64m4_tu(vint64m4_t vd, vint64m4_t vs2,
                                     vint32m2_t vs1, size_t vl);
vint64m4_t __riscv_vwsub_wx_i64m4_tu(vint64m4_t vd, vint64m4_t vs2, int32_t rs1,
                                     size_t vl);
vint64m8_t __riscv_vwsub_vv_i64m8_tu(vint64m8_t vd, vint32m4_t vs2,
                                     vint32m4_t vs1, size_t vl);
vint64m8_t __riscv_vwsub_vx_i64m8_tu(vint64m8_t vd, vint32m4_t vs2, int32_t rs1,
                                     size_t vl);
vint64m8_t __riscv_vwsub_wv_i64m8_tu(vint64m8_t vd, vint64m8_t vs2,
                                     vint32m4_t vs1, size_t vl);
vint64m8_t __riscv_vwsub_wx_i64m8_tu(vint64m8_t vd, vint64m8_t vs2, int32_t rs1,
                                     size_t vl);
vuint16mf4_t __riscv_vwaddu_vv_u16mf4_tu(vuint16mf4_t vd, vuint8mf8_t vs2,
                                         vuint8mf8_t vs1, size_t vl);
vuint16mf4_t __riscv_vwaddu_vx_u16mf4_tu(vuint16mf4_t vd, vuint8mf8_t vs2,
                                         uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vwaddu_wv_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                         vuint8mf8_t vs1, size_t vl);
vuint16mf4_t __riscv_vwaddu_wx_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                         uint8_t rs1, size_t vl);
vuint16mf2_t __riscv_vwaddu_vv_u16mf2_tu(vuint16mf2_t vd, vuint8mf4_t vs2,
                                         vuint8mf4_t vs1, size_t vl);
vuint16mf2_t __riscv_vwaddu_vx_u16mf2_tu(vuint16mf2_t vd, vuint8mf4_t vs2,
                                         uint8_t rs1, size_t vl);
vuint16mf2_t __riscv_vwaddu_wv_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                         vuint8mf4_t vs1, size_t vl);
vuint16mf2_t __riscv_vwaddu_wx_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                         uint8_t rs1, size_t vl);
vuint16m1_t __riscv_vwaddu_vv_u16m1_tu(vuint16m1_t vd, vuint8mf2_t vs2,
                                       vuint8mf2_t vs1, size_t vl);
vuint16m1_t __riscv_vwaddu_vx_u16m1_tu(vuint16m1_t vd, vuint8mf2_t vs2,
                                       uint8_t rs1, size_t vl);
vuint16m1_t __riscv_vwaddu_wv_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                       vuint8mf2_t vs1, size_t vl);
vuint16m1_t __riscv_vwaddu_wx_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                       uint8_t rs1, size_t vl);
vuint16m2_t __riscv_vwaddu_vv_u16m2_tu(vuint16m2_t vd, vuint8m1_t vs2,
                                       vuint8m1_t vs1, size_t vl);
vuint16m2_t __riscv_vwaddu_vx_u16m2_tu(vuint16m2_t vd, vuint8m1_t vs2,
                                       uint8_t rs1, size_t vl);
vuint16m2_t __riscv_vwaddu_wv_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                       vuint8m1_t vs1, size_t vl);
vuint16m2_t __riscv_vwaddu_wx_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                       uint8_t rs1, size_t vl);
vuint16m4_t __riscv_vwaddu_vv_u16m4_tu(vuint16m4_t vd, vuint8m2_t vs2,
                                       vuint8m2_t vs1, size_t vl);
vuint16m4_t __riscv_vwaddu_vx_u16m4_tu(vuint16m4_t vd, vuint8m2_t vs2,
                                       uint8_t rs1, size_t vl);
vuint16m4_t __riscv_vwaddu_wv_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                       vuint8m2_t vs1, size_t vl);
vuint16m4_t __riscv_vwaddu_wx_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                       uint8_t rs1, size_t vl);
vuint16m8_t __riscv_vwaddu_vv_u16m8_tu(vuint16m8_t vd, vuint8m4_t vs2,
                                       vuint8m4_t vs1, size_t vl);
vuint16m8_t __riscv_vwaddu_vx_u16m8_tu(vuint16m8_t vd, vuint8m4_t vs2,
                                       uint8_t rs1, size_t vl);
vuint16m8_t __riscv_vwaddu_wv_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                       vuint8m4_t vs1, size_t vl);
vuint16m8_t __riscv_vwaddu_wx_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                       uint8_t rs1, size_t vl);
vuint32mf2_t __riscv_vwaddu_vv_u32mf2_tu(vuint32mf2_t vd, vuint16mf4_t vs2,
                                         vuint16mf4_t vs1, size_t vl);
vuint32mf2_t __riscv_vwaddu_vx_u32mf2_tu(vuint32mf2_t vd, vuint16mf4_t vs2,
                                         uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vwaddu_wv_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                         vuint16mf4_t vs1, size_t vl);
vuint32mf2_t __riscv_vwaddu_wx_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                         uint16_t rs1, size_t vl);
vuint32m1_t __riscv_vwaddu_vv_u32m1_tu(vuint32m1_t vd, vuint16mf2_t vs2,
                                       vuint16mf2_t vs1, size_t vl);
vuint32m1_t __riscv_vwaddu_vx_u32m1_tu(vuint32m1_t vd, vuint16mf2_t vs2,
                                       uint16_t rs1, size_t vl);
vuint32m1_t __riscv_vwaddu_wv_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                       vuint16mf2_t vs1, size_t vl);
vuint32m1_t __riscv_vwaddu_wx_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                       uint16_t rs1, size_t vl);
vuint32m2_t __riscv_vwaddu_vv_u32m2_tu(vuint32m2_t vd, vuint16m1_t vs2,
                                       vuint16m1_t vs1, size_t vl);
vuint32m2_t __riscv_vwaddu_vx_u32m2_tu(vuint32m2_t vd, vuint16m1_t vs2,
                                       uint16_t rs1, size_t vl);
vuint32m2_t __riscv_vwaddu_wv_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                       vuint16m1_t vs1, size_t vl);
vuint32m2_t __riscv_vwaddu_wx_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                       uint16_t rs1, size_t vl);
vuint32m4_t __riscv_vwaddu_vv_u32m4_tu(vuint32m4_t vd, vuint16m2_t vs2,
                                       vuint16m2_t vs1, size_t vl);
vuint32m4_t __riscv_vwaddu_vx_u32m4_tu(vuint32m4_t vd, vuint16m2_t vs2,
                                       uint16_t rs1, size_t vl);
vuint32m4_t __riscv_vwaddu_wv_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                       vuint16m2_t vs1, size_t vl);
vuint32m4_t __riscv_vwaddu_wx_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                       uint16_t rs1, size_t vl);
vuint32m8_t __riscv_vwaddu_vv_u32m8_tu(vuint32m8_t vd, vuint16m4_t vs2,
                                       vuint16m4_t vs1, size_t vl);
vuint32m8_t __riscv_vwaddu_vx_u32m8_tu(vuint32m8_t vd, vuint16m4_t vs2,
                                       uint16_t rs1, size_t vl);
vuint32m8_t __riscv_vwaddu_wv_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                       vuint16m4_t vs1, size_t vl);
vuint32m8_t __riscv_vwaddu_wx_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                       uint16_t rs1, size_t vl);
vuint64m1_t __riscv_vwaddu_vv_u64m1_tu(vuint64m1_t vd, vuint32mf2_t vs2,
                                       vuint32mf2_t vs1, size_t vl);
vuint64m1_t __riscv_vwaddu_vx_u64m1_tu(vuint64m1_t vd, vuint32mf2_t vs2,
                                       uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vwaddu_wv_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                       vuint32mf2_t vs1, size_t vl);
vuint64m1_t __riscv_vwaddu_wx_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                       uint32_t rs1, size_t vl);
vuint64m2_t __riscv_vwaddu_vv_u64m2_tu(vuint64m2_t vd, vuint32m1_t vs2,
                                       vuint32m1_t vs1, size_t vl);
vuint64m2_t __riscv_vwaddu_vx_u64m2_tu(vuint64m2_t vd, vuint32m1_t vs2,
                                       uint32_t rs1, size_t vl);
vuint64m2_t __riscv_vwaddu_wv_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                       vuint32m1_t vs1, size_t vl);
vuint64m2_t __riscv_vwaddu_wx_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                       uint32_t rs1, size_t vl);
vuint64m4_t __riscv_vwaddu_vv_u64m4_tu(vuint64m4_t vd, vuint32m2_t vs2,
                                       vuint32m2_t vs1, size_t vl);
vuint64m4_t __riscv_vwaddu_vx_u64m4_tu(vuint64m4_t vd, vuint32m2_t vs2,
                                       uint32_t rs1, size_t vl);
vuint64m4_t __riscv_vwaddu_wv_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                       vuint32m2_t vs1, size_t vl);
vuint64m4_t __riscv_vwaddu_wx_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                       uint32_t rs1, size_t vl);
vuint64m8_t __riscv_vwaddu_vv_u64m8_tu(vuint64m8_t vd, vuint32m4_t vs2,
                                       vuint32m4_t vs1, size_t vl);
vuint64m8_t __riscv_vwaddu_vx_u64m8_tu(vuint64m8_t vd, vuint32m4_t vs2,
                                       uint32_t rs1, size_t vl);
vuint64m8_t __riscv_vwaddu_wv_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                       vuint32m4_t vs1, size_t vl);
vuint64m8_t __riscv_vwaddu_wx_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                       uint32_t rs1, size_t vl);
vuint16mf4_t __riscv_vwsubu_vv_u16mf4_tu(vuint16mf4_t vd, vuint8mf8_t vs2,
                                         vuint8mf8_t vs1, size_t vl);
vuint16mf4_t __riscv_vwsubu_vx_u16mf4_tu(vuint16mf4_t vd, vuint8mf8_t vs2,
                                         uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vwsubu_wv_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                         vuint8mf8_t vs1, size_t vl);
vuint16mf4_t __riscv_vwsubu_wx_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                         uint8_t rs1, size_t vl);
vuint16mf2_t __riscv_vwsubu_vv_u16mf2_tu(vuint16mf2_t vd, vuint8mf4_t vs2,
                                         vuint8mf4_t vs1, size_t vl);
vuint16mf2_t __riscv_vwsubu_vx_u16mf2_tu(vuint16mf2_t vd, vuint8mf4_t vs2,
                                         uint8_t rs1, size_t vl);
vuint16mf2_t __riscv_vwsubu_wv_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                         vuint8mf4_t vs1, size_t vl);
vuint16mf2_t __riscv_vwsubu_wx_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                         uint8_t rs1, size_t vl);
vuint16m1_t __riscv_vwsubu_vv_u16m1_tu(vuint16m1_t vd, vuint8mf2_t vs2,
                                       vuint8mf2_t vs1, size_t vl);
vuint16m1_t __riscv_vwsubu_vx_u16m1_tu(vuint16m1_t vd, vuint8mf2_t vs2,
                                       uint8_t rs1, size_t vl);
vuint16m1_t __riscv_vwsubu_wv_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                       vuint8mf2_t vs1, size_t vl);
vuint16m1_t __riscv_vwsubu_wx_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                       uint8_t rs1, size_t vl);
vuint16m2_t __riscv_vwsubu_vv_u16m2_tu(vuint16m2_t vd, vuint8m1_t vs2,
                                       vuint8m1_t vs1, size_t vl);
vuint16m2_t __riscv_vwsubu_vx_u16m2_tu(vuint16m2_t vd, vuint8m1_t vs2,
                                       uint8_t rs1, size_t vl);
vuint16m2_t __riscv_vwsubu_wv_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                       vuint8m1_t vs1, size_t vl);
vuint16m2_t __riscv_vwsubu_wx_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                       uint8_t rs1, size_t vl);
vuint16m4_t __riscv_vwsubu_vv_u16m4_tu(vuint16m4_t vd, vuint8m2_t vs2,
                                       vuint8m2_t vs1, size_t vl);
vuint16m4_t __riscv_vwsubu_vx_u16m4_tu(vuint16m4_t vd, vuint8m2_t vs2,
                                       uint8_t rs1, size_t vl);
vuint16m4_t __riscv_vwsubu_wv_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                       vuint8m2_t vs1, size_t vl);
vuint16m4_t __riscv_vwsubu_wx_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                       uint8_t rs1, size_t vl);
vuint16m8_t __riscv_vwsubu_vv_u16m8_tu(vuint16m8_t vd, vuint8m4_t vs2,
                                       vuint8m4_t vs1, size_t vl);
vuint16m8_t __riscv_vwsubu_vx_u16m8_tu(vuint16m8_t vd, vuint8m4_t vs2,
                                       uint8_t rs1, size_t vl);
vuint16m8_t __riscv_vwsubu_wv_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                       vuint8m4_t vs1, size_t vl);
vuint16m8_t __riscv_vwsubu_wx_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                       uint8_t rs1, size_t vl);
vuint32mf2_t __riscv_vwsubu_vv_u32mf2_tu(vuint32mf2_t vd, vuint16mf4_t vs2,
                                         vuint16mf4_t vs1, size_t vl);
vuint32mf2_t __riscv_vwsubu_vx_u32mf2_tu(vuint32mf2_t vd, vuint16mf4_t vs2,
                                         uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vwsubu_wv_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                         vuint16mf4_t vs1, size_t vl);
vuint32mf2_t __riscv_vwsubu_wx_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                         uint16_t rs1, size_t vl);
vuint32m1_t __riscv_vwsubu_vv_u32m1_tu(vuint32m1_t vd, vuint16mf2_t vs2,
                                       vuint16mf2_t vs1, size_t vl);
vuint32m1_t __riscv_vwsubu_vx_u32m1_tu(vuint32m1_t vd, vuint16mf2_t vs2,
                                       uint16_t rs1, size_t vl);
vuint32m1_t __riscv_vwsubu_wv_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                       vuint16mf2_t vs1, size_t vl);
vuint32m1_t __riscv_vwsubu_wx_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                       uint16_t rs1, size_t vl);
vuint32m2_t __riscv_vwsubu_vv_u32m2_tu(vuint32m2_t vd, vuint16m1_t vs2,
                                       vuint16m1_t vs1, size_t vl);
vuint32m2_t __riscv_vwsubu_vx_u32m2_tu(vuint32m2_t vd, vuint16m1_t vs2,
                                       uint16_t rs1, size_t vl);
vuint32m2_t __riscv_vwsubu_wv_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                       vuint16m1_t vs1, size_t vl);
vuint32m2_t __riscv_vwsubu_wx_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                       uint16_t rs1, size_t vl);
vuint32m4_t __riscv_vwsubu_vv_u32m4_tu(vuint32m4_t vd, vuint16m2_t vs2,
                                       vuint16m2_t vs1, size_t vl);
vuint32m4_t __riscv_vwsubu_vx_u32m4_tu(vuint32m4_t vd, vuint16m2_t vs2,
                                       uint16_t rs1, size_t vl);
vuint32m4_t __riscv_vwsubu_wv_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                       vuint16m2_t vs1, size_t vl);
vuint32m4_t __riscv_vwsubu_wx_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                       uint16_t rs1, size_t vl);
vuint32m8_t __riscv_vwsubu_vv_u32m8_tu(vuint32m8_t vd, vuint16m4_t vs2,
                                       vuint16m4_t vs1, size_t vl);
vuint32m8_t __riscv_vwsubu_vx_u32m8_tu(vuint32m8_t vd, vuint16m4_t vs2,
                                       uint16_t rs1, size_t vl);
vuint32m8_t __riscv_vwsubu_wv_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                       vuint16m4_t vs1, size_t vl);
vuint32m8_t __riscv_vwsubu_wx_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                       uint16_t rs1, size_t vl);
vuint64m1_t __riscv_vwsubu_vv_u64m1_tu(vuint64m1_t vd, vuint32mf2_t vs2,
                                       vuint32mf2_t vs1, size_t vl);
vuint64m1_t __riscv_vwsubu_vx_u64m1_tu(vuint64m1_t vd, vuint32mf2_t vs2,
                                       uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vwsubu_wv_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                       vuint32mf2_t vs1, size_t vl);
vuint64m1_t __riscv_vwsubu_wx_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                       uint32_t rs1, size_t vl);
vuint64m2_t __riscv_vwsubu_vv_u64m2_tu(vuint64m2_t vd, vuint32m1_t vs2,
                                       vuint32m1_t vs1, size_t vl);
vuint64m2_t __riscv_vwsubu_vx_u64m2_tu(vuint64m2_t vd, vuint32m1_t vs2,
                                       uint32_t rs1, size_t vl);
vuint64m2_t __riscv_vwsubu_wv_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                       vuint32m1_t vs1, size_t vl);
vuint64m2_t __riscv_vwsubu_wx_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                       uint32_t rs1, size_t vl);
vuint64m4_t __riscv_vwsubu_vv_u64m4_tu(vuint64m4_t vd, vuint32m2_t vs2,
                                       vuint32m2_t vs1, size_t vl);
vuint64m4_t __riscv_vwsubu_vx_u64m4_tu(vuint64m4_t vd, vuint32m2_t vs2,
                                       uint32_t rs1, size_t vl);
vuint64m4_t __riscv_vwsubu_wv_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                       vuint32m2_t vs1, size_t vl);
vuint64m4_t __riscv_vwsubu_wx_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                       uint32_t rs1, size_t vl);
vuint64m8_t __riscv_vwsubu_vv_u64m8_tu(vuint64m8_t vd, vuint32m4_t vs2,
                                       vuint32m4_t vs1, size_t vl);
vuint64m8_t __riscv_vwsubu_vx_u64m8_tu(vuint64m8_t vd, vuint32m4_t vs2,
                                       uint32_t rs1, size_t vl);
vuint64m8_t __riscv_vwsubu_wv_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                       vuint32m4_t vs1, size_t vl);
vuint64m8_t __riscv_vwsubu_wx_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                       uint32_t rs1, size_t vl);
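A brief usage illustration (not part of the listing): a minimal strip-mined sketch of the tail-undisturbed (`_tu`) policy. Only `__riscv_vwaddu_wv_u64m1_tu` is taken from the prototypes above; the `<riscv_vector.h>` header and the `vsetvl`/load/store intrinsics are the standard ones from other sections of this document and are assumed here. With `_tu`, result lanes at indices >= vl keep the values of `vd`, so partial sums in the accumulator survive the shorter final iteration.

#include <riscv_vector.h>

// Per-lane accumulation of zero-extended u32 inputs into a u64 accumulator.
uint64_t sum_widen_u32(const uint32_t *src, size_t n) {
  size_t vlmax = __riscv_vsetvlmax_e64m1();
  vuint64m1_t acc = __riscv_vmv_v_x_u64m1(0, vlmax);
  for (size_t i = 0; i < n;) {
    size_t vl = __riscv_vsetvl_e32mf2(n - i);
    vuint32mf2_t vx = __riscv_vle32_v_u32mf2(src + i, vl);
    // acc[lane] += (uint64_t)vx[lane] for lane < vl; lanes >= vl keep their
    // previously accumulated values because of the _tu policy.
    acc = __riscv_vwaddu_wv_u64m1_tu(acc, acc, vx, vl);
    i += vl;
  }
  // Horizontal sum of the accumulator lanes (plain scalar loop for brevity).
  uint64_t lanes[vlmax];
  __riscv_vse64_v_u64m1(lanes, acc, vlmax);
  uint64_t total = 0;
  for (size_t j = 0; j < vlmax; j++)
    total += lanes[j];
  return total;
}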
// masked functions
vint16mf4_t __riscv_vwadd_vv_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                        vint8mf8_t vs2, vint8mf8_t vs1,
                                        size_t vl);
vint16mf4_t __riscv_vwadd_vx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                        vint8mf8_t vs2, int8_t rs1, size_t vl);
vint16mf4_t __riscv_vwadd_wv_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs2, vint8mf8_t vs1,
                                        size_t vl);
vint16mf4_t __riscv_vwadd_wx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs2, int8_t rs1, size_t vl);
vint16mf2_t __riscv_vwadd_vv_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                        vint8mf4_t vs2, vint8mf4_t vs1,
                                        size_t vl);
vint16mf2_t __riscv_vwadd_vx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                        vint8mf4_t vs2, int8_t rs1, size_t vl);
vint16mf2_t __riscv_vwadd_wv_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs2, vint8mf4_t vs1,
                                        size_t vl);
vint16mf2_t __riscv_vwadd_wx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs2, int8_t rs1, size_t vl);
vint16m1_t __riscv_vwadd_vv_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                      vint8mf2_t vs2, vint8mf2_t vs1,
                                      size_t vl);
vint16m1_t __riscv_vwadd_vx_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                      vint8mf2_t vs2, int8_t rs1, size_t vl);
vint16m1_t __riscv_vwadd_wv_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs2, vint8mf2_t vs1,
                                      size_t vl);
vint16m1_t __riscv_vwadd_wx_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs2, int8_t rs1, size_t vl);
vint16m2_t __riscv_vwadd_vv_i16m2_tum(vbool8_t vm, vint16m2_t vd, vint8m1_t vs2,
                                      vint8m1_t vs1, size_t vl);
vint16m2_t __riscv_vwadd_vx_i16m2_tum(vbool8_t vm, vint16m2_t vd, vint8m1_t vs2,
                                      int8_t rs1, size_t vl);
vint16m2_t __riscv_vwadd_wv_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs2, vint8m1_t vs1, size_t vl);
vint16m2_t __riscv_vwadd_wx_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs2, int8_t rs1, size_t vl);
vint16m4_t __riscv_vwadd_vv_i16m4_tum(vbool4_t vm, vint16m4_t vd, vint8m2_t vs2,
                                      vint8m2_t vs1, size_t vl);
vint16m4_t __riscv_vwadd_vx_i16m4_tum(vbool4_t vm, vint16m4_t vd, vint8m2_t vs2,
                                      int8_t rs1, size_t vl);
vint16m4_t __riscv_vwadd_wv_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs2, vint8m2_t vs1, size_t vl);
vint16m4_t __riscv_vwadd_wx_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs2, int8_t rs1, size_t vl);
vint16m8_t __riscv_vwadd_vv_i16m8_tum(vbool2_t vm, vint16m8_t vd, vint8m4_t vs2,
                                      vint8m4_t vs1, size_t vl);
vint16m8_t __riscv_vwadd_vx_i16m8_tum(vbool2_t vm, vint16m8_t vd, vint8m4_t vs2,
                                      int8_t rs1, size_t vl);
vint16m8_t __riscv_vwadd_wv_i16m8_tum(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs2, vint8m4_t vs1, size_t vl);
vint16m8_t __riscv_vwadd_wx_i16m8_tum(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs2, int8_t rs1, size_t vl);
vint32mf2_t __riscv_vwadd_vv_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                        vint16mf4_t vs2, vint16mf4_t vs1,
                                        size_t vl);
vint32mf2_t __riscv_vwadd_vx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                        vint16mf4_t vs2, int16_t rs1,
                                        size_t vl);
vint32mf2_t __riscv_vwadd_wv_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs2, vint16mf4_t vs1,
                                        size_t vl);
vint32mf2_t __riscv_vwadd_wx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs2, int16_t rs1,
                                        size_t vl);
vint32m1_t __riscv_vwadd_vv_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                      vint16mf2_t vs2, vint16mf2_t vs1,
                                      size_t vl);
vint32m1_t __riscv_vwadd_vx_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                      vint16mf2_t vs2, int16_t rs1, size_t vl);
vint32m1_t __riscv_vwadd_wv_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs2, vint16mf2_t vs1,
                                      size_t vl);
vint32m1_t __riscv_vwadd_wx_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs2, int16_t rs1, size_t vl);
vint32m2_t __riscv_vwadd_vv_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                      vint16m1_t vs2, vint16m1_t vs1,
                                      size_t vl);
vint32m2_t __riscv_vwadd_vx_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                      vint16m1_t vs2, int16_t rs1, size_t vl);
vint32m2_t __riscv_vwadd_wv_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs2, vint16m1_t vs1,
                                      size_t vl);
vint32m2_t __riscv_vwadd_wx_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs2, int16_t rs1, size_t vl);
vint32m4_t __riscv_vwadd_vv_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                      vint16m2_t vs2, vint16m2_t vs1,
                                      size_t vl);
vint32m4_t __riscv_vwadd_vx_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                      vint16m2_t vs2, int16_t rs1, size_t vl);
vint32m4_t __riscv_vwadd_wv_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs2, vint16m2_t vs1,
                                      size_t vl);
vint32m4_t __riscv_vwadd_wx_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs2, int16_t rs1, size_t vl);
vint32m8_t __riscv_vwadd_vv_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                      vint16m4_t vs2, vint16m4_t vs1,
                                      size_t vl);
vint32m8_t __riscv_vwadd_vx_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                      vint16m4_t vs2, int16_t rs1, size_t vl);
vint32m8_t __riscv_vwadd_wv_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs2, vint16m4_t vs1,
                                      size_t vl);
vint32m8_t __riscv_vwadd_wx_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs2, int16_t rs1, size_t vl);
vint64m1_t __riscv_vwadd_vv_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                      vint32mf2_t vs2, vint32mf2_t vs1,
                                      size_t vl);
vint64m1_t __riscv_vwadd_vx_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                      vint32mf2_t vs2, int32_t rs1, size_t vl);
vint64m1_t __riscv_vwadd_wv_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs2, vint32mf2_t vs1,
                                      size_t vl);
vint64m1_t __riscv_vwadd_wx_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs2, int32_t rs1, size_t vl);
vint64m2_t __riscv_vwadd_vv_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                      vint32m1_t vs2, vint32m1_t vs1,
                                      size_t vl);
vint64m2_t __riscv_vwadd_vx_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                      vint32m1_t vs2, int32_t rs1, size_t vl);
vint64m2_t __riscv_vwadd_wv_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs2, vint32m1_t vs1,
                                      size_t vl);
vint64m2_t __riscv_vwadd_wx_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs2, int32_t rs1, size_t vl);
vint64m4_t __riscv_vwadd_vv_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                      vint32m2_t vs2, vint32m2_t vs1,
                                      size_t vl);
vint64m4_t __riscv_vwadd_vx_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                      vint32m2_t vs2, int32_t rs1, size_t vl);
vint64m4_t __riscv_vwadd_wv_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs2, vint32m2_t vs1,
                                      size_t vl);
vint64m4_t __riscv_vwadd_wx_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs2, int32_t rs1, size_t vl);
vint64m8_t __riscv_vwadd_vv_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                      vint32m4_t vs2, vint32m4_t vs1,
                                      size_t vl);
vint64m8_t __riscv_vwadd_vx_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                      vint32m4_t vs2, int32_t rs1, size_t vl);
vint64m8_t __riscv_vwadd_wv_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs2, vint32m4_t vs1,
                                      size_t vl);
vint64m8_t __riscv_vwadd_wx_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs2, int32_t rs1, size_t vl);
vint16mf4_t __riscv_vwsub_vv_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                        vint8mf8_t vs2, vint8mf8_t vs1,
                                        size_t vl);
vint16mf4_t __riscv_vwsub_vx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                        vint8mf8_t vs2, int8_t rs1, size_t vl);
vint16mf4_t __riscv_vwsub_wv_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs2, vint8mf8_t vs1,
                                        size_t vl);
vint16mf4_t __riscv_vwsub_wx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs2, int8_t rs1, size_t vl);
vint16mf2_t __riscv_vwsub_vv_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                        vint8mf4_t vs2, vint8mf4_t vs1,
                                        size_t vl);
vint16mf2_t __riscv_vwsub_vx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                        vint8mf4_t vs2, int8_t rs1, size_t vl);
vint16mf2_t __riscv_vwsub_wv_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs2, vint8mf4_t vs1,
                                        size_t vl);
vint16mf2_t __riscv_vwsub_wx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs2, int8_t rs1, size_t vl);
vint16m1_t __riscv_vwsub_vv_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                      vint8mf2_t vs2, vint8mf2_t vs1,
                                      size_t vl);
vint16m1_t __riscv_vwsub_vx_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                      vint8mf2_t vs2, int8_t rs1, size_t vl);
vint16m1_t __riscv_vwsub_wv_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs2, vint8mf2_t vs1,
                                      size_t vl);
vint16m1_t __riscv_vwsub_wx_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs2, int8_t rs1, size_t vl);
vint16m2_t __riscv_vwsub_vv_i16m2_tum(vbool8_t vm, vint16m2_t vd, vint8m1_t vs2,
                                      vint8m1_t vs1, size_t vl);
vint16m2_t __riscv_vwsub_vx_i16m2_tum(vbool8_t vm, vint16m2_t vd, vint8m1_t vs2,
                                      int8_t rs1, size_t vl);
vint16m2_t __riscv_vwsub_wv_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs2, vint8m1_t vs1, size_t vl);
vint16m2_t __riscv_vwsub_wx_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs2, int8_t rs1, size_t vl);
vint16m4_t __riscv_vwsub_vv_i16m4_tum(vbool4_t vm, vint16m4_t vd, vint8m2_t vs2,
                                      vint8m2_t vs1, size_t vl);
vint16m4_t __riscv_vwsub_vx_i16m4_tum(vbool4_t vm, vint16m4_t vd, vint8m2_t vs2,
                                      int8_t rs1, size_t vl);
vint16m4_t __riscv_vwsub_wv_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs2, vint8m2_t vs1, size_t vl);
vint16m4_t __riscv_vwsub_wx_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs2, int8_t rs1, size_t vl);
vint16m8_t __riscv_vwsub_vv_i16m8_tum(vbool2_t vm, vint16m8_t vd, vint8m4_t vs2,
                                      vint8m4_t vs1, size_t vl);
vint16m8_t __riscv_vwsub_vx_i16m8_tum(vbool2_t vm, vint16m8_t vd, vint8m4_t vs2,
                                      int8_t rs1, size_t vl);
vint16m8_t __riscv_vwsub_wv_i16m8_tum(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs2, vint8m4_t vs1, size_t vl);
vint16m8_t __riscv_vwsub_wx_i16m8_tum(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs2, int8_t rs1, size_t vl);
vint32mf2_t __riscv_vwsub_vv_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                        vint16mf4_t vs2, vint16mf4_t vs1,
                                        size_t vl);
vint32mf2_t __riscv_vwsub_vx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                        vint16mf4_t vs2, int16_t rs1,
                                        size_t vl);
vint32mf2_t __riscv_vwsub_wv_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs2, vint16mf4_t vs1,
                                        size_t vl);
vint32mf2_t __riscv_vwsub_wx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs2, int16_t rs1,
                                        size_t vl);
vint32m1_t __riscv_vwsub_vv_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                      vint16mf2_t vs2, vint16mf2_t vs1,
                                      size_t vl);
vint32m1_t __riscv_vwsub_vx_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                      vint16mf2_t vs2, int16_t rs1, size_t vl);
vint32m1_t __riscv_vwsub_wv_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs2, vint16mf2_t vs1,
                                      size_t vl);
vint32m1_t __riscv_vwsub_wx_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs2, int16_t rs1, size_t vl);
vint32m2_t __riscv_vwsub_vv_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                      vint16m1_t vs2, vint16m1_t vs1,
                                      size_t vl);
vint32m2_t __riscv_vwsub_vx_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                      vint16m1_t vs2, int16_t rs1, size_t vl);
vint32m2_t __riscv_vwsub_wv_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs2, vint16m1_t vs1,
                                      size_t vl);
vint32m2_t __riscv_vwsub_wx_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs2, int16_t rs1, size_t vl);
vint32m4_t __riscv_vwsub_vv_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                      vint16m2_t vs2, vint16m2_t vs1,
                                      size_t vl);
vint32m4_t __riscv_vwsub_vx_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                      vint16m2_t vs2, int16_t rs1, size_t vl);
vint32m4_t __riscv_vwsub_wv_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs2, vint16m2_t vs1,
                                      size_t vl);
vint32m4_t __riscv_vwsub_wx_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs2, int16_t rs1, size_t vl);
vint32m8_t __riscv_vwsub_vv_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                      vint16m4_t vs2, vint16m4_t vs1,
                                      size_t vl);
vint32m8_t __riscv_vwsub_vx_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                      vint16m4_t vs2, int16_t rs1, size_t vl);
vint32m8_t __riscv_vwsub_wv_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs2, vint16m4_t vs1,
                                      size_t vl);
vint32m8_t __riscv_vwsub_wx_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs2, int16_t rs1, size_t vl);
vint64m1_t __riscv_vwsub_vv_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                      vint32mf2_t vs2, vint32mf2_t vs1,
                                      size_t vl);
vint64m1_t __riscv_vwsub_vx_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                      vint32mf2_t vs2, int32_t rs1, size_t vl);
vint64m1_t __riscv_vwsub_wv_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs2, vint32mf2_t vs1,
                                      size_t vl);
vint64m1_t __riscv_vwsub_wx_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs2, int32_t rs1, size_t vl);
vint64m2_t __riscv_vwsub_vv_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                      vint32m1_t vs2, vint32m1_t vs1,
                                      size_t vl);
vint64m2_t __riscv_vwsub_vx_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                      vint32m1_t vs2, int32_t rs1, size_t vl);
vint64m2_t __riscv_vwsub_wv_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs2, vint32m1_t vs1,
                                      size_t vl);
vint64m2_t __riscv_vwsub_wx_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs2, int32_t rs1, size_t vl);
vint64m4_t __riscv_vwsub_vv_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                      vint32m2_t vs2, vint32m2_t vs1,
                                      size_t vl);
vint64m4_t __riscv_vwsub_vx_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                      vint32m2_t vs2, int32_t rs1, size_t vl);
vint64m4_t __riscv_vwsub_wv_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs2, vint32m2_t vs1,
                                      size_t vl);
vint64m4_t __riscv_vwsub_wx_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs2, int32_t rs1, size_t vl);
vint64m8_t __riscv_vwsub_vv_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                      vint32m4_t vs2, vint32m4_t vs1,
                                      size_t vl);
vint64m8_t __riscv_vwsub_vx_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                      vint32m4_t vs2, int32_t rs1, size_t vl);
vint64m8_t __riscv_vwsub_wv_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs2, vint32m4_t vs1,
                                      size_t vl);
vint64m8_t __riscv_vwsub_wx_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs2, int32_t rs1, size_t vl);
vuint16mf4_t __riscv_vwaddu_vv_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                          vuint8mf8_t vs2, vuint8mf8_t vs1,
                                          size_t vl);
vuint16mf4_t __riscv_vwaddu_vx_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                          vuint8mf8_t vs2, uint8_t rs1,
                                          size_t vl);
vuint16mf4_t __riscv_vwaddu_wv_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                          vuint16mf4_t vs2, vuint8mf8_t vs1,
                                          size_t vl);
vuint16mf4_t __riscv_vwaddu_wx_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                          vuint16mf4_t vs2, uint8_t rs1,
                                          size_t vl);
vuint16mf2_t __riscv_vwaddu_vv_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                          vuint8mf4_t vs2, vuint8mf4_t vs1,
                                          size_t vl);
vuint16mf2_t __riscv_vwaddu_vx_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                          vuint8mf4_t vs2, uint8_t rs1,
                                          size_t vl);
vuint16mf2_t __riscv_vwaddu_wv_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                          vuint16mf2_t vs2, vuint8mf4_t vs1,
                                          size_t vl);
vuint16mf2_t __riscv_vwaddu_wx_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                          vuint16mf2_t vs2, uint8_t rs1,
                                          size_t vl);
vuint16m1_t __riscv_vwaddu_vv_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                        vuint8mf2_t vs2, vuint8mf2_t vs1,
                                        size_t vl);
vuint16m1_t __riscv_vwaddu_vx_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                        vuint8mf2_t vs2, uint8_t rs1,
                                        size_t vl);
vuint16m1_t __riscv_vwaddu_wv_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                        vuint16m1_t vs2, vuint8mf2_t vs1,
                                        size_t vl);
vuint16m1_t __riscv_vwaddu_wx_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                        vuint16m1_t vs2, uint8_t rs1,
                                        size_t vl);
vuint16m2_t __riscv_vwaddu_vv_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                        vuint8m1_t vs2, vuint8m1_t vs1,
                                        size_t vl);
vuint16m2_t __riscv_vwaddu_vx_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                        vuint8m1_t vs2, uint8_t rs1, size_t vl);
vuint16m2_t __riscv_vwaddu_wv_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                        vuint16m2_t vs2, vuint8m1_t vs1,
                                        size_t vl);
vuint16m2_t __riscv_vwaddu_wx_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                        vuint16m2_t vs2, uint8_t rs1,
                                        size_t vl);
vuint16m4_t __riscv_vwaddu_vv_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                        vuint8m2_t vs2, vuint8m2_t vs1,
                                        size_t vl);
vuint16m4_t __riscv_vwaddu_vx_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                        vuint8m2_t vs2, uint8_t rs1, size_t vl);
vuint16m4_t __riscv_vwaddu_wv_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                        vuint16m4_t vs2, vuint8m2_t vs1,
                                        size_t vl);
vuint16m4_t __riscv_vwaddu_wx_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                        vuint16m4_t vs2, uint8_t rs1,
                                        size_t vl);
vuint16m8_t __riscv_vwaddu_vv_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                        vuint8m4_t vs2, vuint8m4_t vs1,
                                        size_t vl);
vuint16m8_t __riscv_vwaddu_vx_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                        vuint8m4_t vs2, uint8_t rs1, size_t vl);
vuint16m8_t __riscv_vwaddu_wv_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                        vuint16m8_t vs2, vuint8m4_t vs1,
                                        size_t vl);
vuint16m8_t __riscv_vwaddu_wx_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                        vuint16m8_t vs2, uint8_t rs1,
                                        size_t vl);
vuint32mf2_t __riscv_vwaddu_vv_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                          vuint16mf4_t vs2, vuint16mf4_t vs1,
                                          size_t vl);
vuint32mf2_t __riscv_vwaddu_vx_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                          vuint16mf4_t vs2, uint16_t rs1,
                                          size_t vl);
vuint32mf2_t __riscv_vwaddu_wv_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                          vuint32mf2_t vs2, vuint16mf4_t vs1,
                                          size_t vl);
vuint32mf2_t __riscv_vwaddu_wx_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                          vuint32mf2_t vs2, uint16_t rs1,
                                          size_t vl);
vuint32m1_t __riscv_vwaddu_vv_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                        vuint16mf2_t vs2, vuint16mf2_t vs1,
                                        size_t vl);
vuint32m1_t __riscv_vwaddu_vx_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                        vuint16mf2_t vs2, uint16_t rs1,
                                        size_t vl);
vuint32m1_t __riscv_vwaddu_wv_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                        vuint32m1_t vs2, vuint16mf2_t vs1,
                                        size_t vl);
vuint32m1_t __riscv_vwaddu_wx_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                        vuint32m1_t vs2, uint16_t rs1,
                                        size_t vl);
vuint32m2_t __riscv_vwaddu_vv_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                        vuint16m1_t vs2, vuint16m1_t vs1,
                                        size_t vl);
vuint32m2_t __riscv_vwaddu_vx_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                        vuint16m1_t vs2, uint16_t rs1,
                                        size_t vl);
vuint32m2_t __riscv_vwaddu_wv_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                        vuint32m2_t vs2, vuint16m1_t vs1,
                                        size_t vl);
vuint32m2_t __riscv_vwaddu_wx_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                        vuint32m2_t vs2, uint16_t rs1,
                                        size_t vl);
vuint32m4_t __riscv_vwaddu_vv_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                        vuint16m2_t vs2, vuint16m2_t vs1,
                                        size_t vl);
vuint32m4_t __riscv_vwaddu_vx_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                        vuint16m2_t vs2, uint16_t rs1,
                                        size_t vl);
vuint32m4_t __riscv_vwaddu_wv_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                        vuint32m4_t vs2, vuint16m2_t vs1,
                                        size_t vl);
vuint32m4_t __riscv_vwaddu_wx_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                        vuint32m4_t vs2, uint16_t rs1,
                                        size_t vl);
vuint32m8_t __riscv_vwaddu_vv_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                        vuint16m4_t vs2, vuint16m4_t vs1,
                                        size_t vl);
vuint32m8_t __riscv_vwaddu_vx_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                        vuint16m4_t vs2, uint16_t rs1,
                                        size_t vl);
vuint32m8_t __riscv_vwaddu_wv_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                        vuint32m8_t vs2, vuint16m4_t vs1,
                                        size_t vl);
vuint32m8_t __riscv_vwaddu_wx_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                        vuint32m8_t vs2, uint16_t rs1,
                                        size_t vl);
vuint64m1_t __riscv_vwaddu_vv_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                        vuint32mf2_t vs2, vuint32mf2_t vs1,
                                        size_t vl);
vuint64m1_t __riscv_vwaddu_vx_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                        vuint32mf2_t vs2, uint32_t rs1,
                                        size_t vl);
vuint64m1_t __riscv_vwaddu_wv_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                        vuint64m1_t vs2, vuint32mf2_t vs1,
                                        size_t vl);
vuint64m1_t __riscv_vwaddu_wx_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                        vuint64m1_t vs2, uint32_t rs1,
                                        size_t vl);
vuint64m2_t __riscv_vwaddu_vv_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                        vuint32m1_t vs2, vuint32m1_t vs1,
                                        size_t vl);
vuint64m2_t __riscv_vwaddu_vx_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                        vuint32m1_t vs2, uint32_t rs1,
                                        size_t vl);
vuint64m2_t __riscv_vwaddu_wv_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                        vuint64m2_t vs2, vuint32m1_t vs1,
                                        size_t vl);
vuint64m2_t __riscv_vwaddu_wx_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                        vuint64m2_t vs2, uint32_t rs1,
                                        size_t vl);
vuint64m4_t __riscv_vwaddu_vv_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                        vuint32m2_t vs2, vuint32m2_t vs1,
                                        size_t vl);
vuint64m4_t __riscv_vwaddu_vx_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                        vuint32m2_t vs2, uint32_t rs1,
                                        size_t vl);
vuint64m4_t __riscv_vwaddu_wv_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                        vuint64m4_t vs2, vuint32m2_t vs1,
                                        size_t vl);
vuint64m4_t __riscv_vwaddu_wx_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                        vuint64m4_t vs2, uint32_t rs1,
                                        size_t vl);
vuint64m8_t __riscv_vwaddu_vv_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                        vuint32m4_t vs2, vuint32m4_t vs1,
                                        size_t vl);
vuint64m8_t __riscv_vwaddu_vx_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                        vuint32m4_t vs2, uint32_t rs1,
                                        size_t vl);
vuint64m8_t __riscv_vwaddu_wv_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                        vuint64m8_t vs2, vuint32m4_t vs1,
                                        size_t vl);
vuint64m8_t __riscv_vwaddu_wx_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                        vuint64m8_t vs2, uint32_t rs1,
                                        size_t vl);
vuint16mf4_t __riscv_vwsubu_vv_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                          vuint8mf8_t vs2, vuint8mf8_t vs1,
                                          size_t vl);
vuint16mf4_t __riscv_vwsubu_vx_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                          vuint8mf8_t vs2, uint8_t rs1,
                                          size_t vl);
vuint16mf4_t __riscv_vwsubu_wv_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                          vuint16mf4_t vs2, vuint8mf8_t vs1,
                                          size_t vl);
vuint16mf4_t __riscv_vwsubu_wx_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                          vuint16mf4_t vs2, uint8_t rs1,
                                          size_t vl);
vuint16mf2_t __riscv_vwsubu_vv_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                          vuint8mf4_t vs2, vuint8mf4_t vs1,
                                          size_t vl);
vuint16mf2_t __riscv_vwsubu_vx_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                          vuint8mf4_t vs2, uint8_t rs1,
                                          size_t vl);
vuint16mf2_t __riscv_vwsubu_wv_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                          vuint16mf2_t vs2, vuint8mf4_t vs1,
                                          size_t vl);
vuint16mf2_t __riscv_vwsubu_wx_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                          vuint16mf2_t vs2, uint8_t rs1,
                                          size_t vl);
vuint16m1_t __riscv_vwsubu_vv_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                        vuint8mf2_t vs2, vuint8mf2_t vs1,
                                        size_t vl);
vuint16m1_t __riscv_vwsubu_vx_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                        vuint8mf2_t vs2, uint8_t rs1,
                                        size_t vl);
vuint16m1_t __riscv_vwsubu_wv_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                        vuint16m1_t vs2, vuint8mf2_t vs1,
                                        size_t vl);
vuint16m1_t __riscv_vwsubu_wx_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                        vuint16m1_t vs2, uint8_t rs1,
                                        size_t vl);
vuint16m2_t __riscv_vwsubu_vv_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                        vuint8m1_t vs2, vuint8m1_t vs1,
                                        size_t vl);
vuint16m2_t __riscv_vwsubu_vx_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                        vuint8m1_t vs2, uint8_t rs1, size_t vl);
vuint16m2_t __riscv_vwsubu_wv_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                        vuint16m2_t vs2, vuint8m1_t vs1,
                                        size_t vl);
vuint16m2_t __riscv_vwsubu_wx_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                        vuint16m2_t vs2, uint8_t rs1,
                                        size_t vl);
vuint16m4_t __riscv_vwsubu_vv_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                        vuint8m2_t vs2, vuint8m2_t vs1,
                                        size_t vl);
vuint16m4_t __riscv_vwsubu_vx_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                        vuint8m2_t vs2, uint8_t rs1, size_t vl);
vuint16m4_t __riscv_vwsubu_wv_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                        vuint16m4_t vs2, vuint8m2_t vs1,
                                        size_t vl);
vuint16m4_t __riscv_vwsubu_wx_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                        vuint16m4_t vs2, uint8_t rs1,
                                        size_t vl);
vuint16m8_t __riscv_vwsubu_vv_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                        vuint8m4_t vs2, vuint8m4_t vs1,
                                        size_t vl);
vuint16m8_t __riscv_vwsubu_vx_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                        vuint8m4_t vs2, uint8_t rs1, size_t vl);
vuint16m8_t __riscv_vwsubu_wv_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                        vuint16m8_t vs2, vuint8m4_t vs1,
                                        size_t vl);
vuint16m8_t __riscv_vwsubu_wx_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                        vuint16m8_t vs2, uint8_t rs1,
                                        size_t vl);
vuint32mf2_t __riscv_vwsubu_vv_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                          vuint16mf4_t vs2, vuint16mf4_t vs1,
                                          size_t vl);
vuint32mf2_t __riscv_vwsubu_vx_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                          vuint16mf4_t vs2, uint16_t rs1,
                                          size_t vl);
vuint32mf2_t __riscv_vwsubu_wv_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                          vuint32mf2_t vs2, vuint16mf4_t vs1,
                                          size_t vl);
vuint32mf2_t __riscv_vwsubu_wx_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                          vuint32mf2_t vs2, uint16_t rs1,
                                          size_t vl);
vuint32m1_t __riscv_vwsubu_vv_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                        vuint16mf2_t vs2, vuint16mf2_t vs1,
                                        size_t vl);
vuint32m1_t __riscv_vwsubu_vx_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                        vuint16mf2_t vs2, uint16_t rs1,
                                        size_t vl);
vuint32m1_t __riscv_vwsubu_wv_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                        vuint32m1_t vs2, vuint16mf2_t vs1,
                                        size_t vl);
vuint32m1_t __riscv_vwsubu_wx_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                        vuint32m1_t vs2, uint16_t rs1,
                                        size_t vl);
vuint32m2_t __riscv_vwsubu_vv_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                        vuint16m1_t vs2, vuint16m1_t vs1,
                                        size_t vl);
vuint32m2_t __riscv_vwsubu_vx_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                        vuint16m1_t vs2, uint16_t rs1,
                                        size_t vl);
vuint32m2_t __riscv_vwsubu_wv_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                        vuint32m2_t vs2, vuint16m1_t vs1,
                                        size_t vl);
vuint32m2_t __riscv_vwsubu_wx_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                        vuint32m2_t vs2, uint16_t rs1,
                                        size_t vl);
vuint32m4_t __riscv_vwsubu_vv_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                        vuint16m2_t vs2, vuint16m2_t vs1,
                                        size_t vl);
vuint32m4_t __riscv_vwsubu_vx_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                        vuint16m2_t vs2, uint16_t rs1,
                                        size_t vl);
vuint32m4_t __riscv_vwsubu_wv_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                        vuint32m4_t vs2, vuint16m2_t vs1,
                                        size_t vl);
vuint32m4_t __riscv_vwsubu_wx_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                        vuint32m4_t vs2, uint16_t rs1,
                                        size_t vl);
vuint32m8_t __riscv_vwsubu_vv_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                        vuint16m4_t vs2, vuint16m4_t vs1,
                                        size_t vl);
vuint32m8_t __riscv_vwsubu_vx_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                        vuint16m4_t vs2, uint16_t rs1,
                                        size_t vl);
vuint32m8_t __riscv_vwsubu_wv_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                        vuint32m8_t vs2, vuint16m4_t vs1,
                                        size_t vl);
vuint32m8_t __riscv_vwsubu_wx_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                        vuint32m8_t vs2, uint16_t rs1,
                                        size_t vl);
vuint64m1_t __riscv_vwsubu_vv_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                        vuint32mf2_t vs2, vuint32mf2_t vs1,
                                        size_t vl);
vuint64m1_t __riscv_vwsubu_vx_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                        vuint32mf2_t vs2, uint32_t rs1,
                                        size_t vl);
vuint64m1_t __riscv_vwsubu_wv_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                        vuint64m1_t vs2, vuint32mf2_t vs1,
                                        size_t vl);
vuint64m1_t __riscv_vwsubu_wx_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                        vuint64m1_t vs2, uint32_t rs1,
                                        size_t vl);
vuint64m2_t __riscv_vwsubu_vv_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                        vuint32m1_t vs2, vuint32m1_t vs1,
                                        size_t vl);
vuint64m2_t __riscv_vwsubu_vx_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                        vuint32m1_t vs2, uint32_t rs1,
                                        size_t vl);
vuint64m2_t __riscv_vwsubu_wv_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                        vuint64m2_t vs2, vuint32m1_t vs1,
                                        size_t vl);
vuint64m2_t __riscv_vwsubu_wx_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                        vuint64m2_t vs2, uint32_t rs1,
                                        size_t vl);
vuint64m4_t __riscv_vwsubu_vv_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                        vuint32m2_t vs2, vuint32m2_t vs1,
                                        size_t vl);
vuint64m4_t __riscv_vwsubu_vx_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                        vuint32m2_t vs2, uint32_t rs1,
                                        size_t vl);
vuint64m4_t __riscv_vwsubu_wv_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                        vuint64m4_t vs2, vuint32m2_t vs1,
                                        size_t vl);
vuint64m4_t __riscv_vwsubu_wx_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                        vuint64m4_t vs2, uint32_t rs1,
                                        size_t vl);
vuint64m8_t __riscv_vwsubu_vv_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                        vuint32m4_t vs2, vuint32m4_t vs1,
                                        size_t vl);
vuint64m8_t __riscv_vwsubu_vx_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                        vuint32m4_t vs2, uint32_t rs1,
                                        size_t vl);
vuint64m8_t __riscv_vwsubu_wv_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                        vuint64m8_t vs2, vuint32m4_t vs1,
                                        size_t vl);
vuint64m8_t __riscv_vwsubu_wx_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                        vuint64m8_t vs2, uint32_t rs1,
                                        size_t vl);
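A brief usage illustration (not part of the listing): a sketch of the masked, tail-undisturbed (`_tum`) variants. Only `__riscv_vwsubu_wx_u32m1_tum` is taken from the prototypes above; the `vsetvl`, load/store, and compare intrinsics are the standard ones from other sections and are assumed here. Under `_tum`, tail lanes of the result keep the values of `vd`, while masked-off lanes follow the mask-agnostic policy, so this sketch writes back only the active lanes with a masked store.

#include <riscv_vector.h>

// Where flags[i] is nonzero, counters[i] -= debit (counters are 32-bit,
// debit is 16-bit and zero-extended by the widening subtract). All other
// counters are left untouched in memory by the masked store.
void debit_where(uint32_t *counters, const uint8_t *flags, uint16_t debit,
                 size_t n) {
  for (size_t i = 0; i < n;) {
    size_t vl = __riscv_vsetvl_e32m1(n - i);
    vuint32m1_t vc = __riscv_vle32_v_u32m1(counters + i, vl);
    vuint8mf4_t vf = __riscv_vle8_v_u8mf4(flags + i, vl);
    vbool32_t vm = __riscv_vmsne_vx_u8mf4_b32(vf, 0, vl);
    // _tum: tail lanes of vr keep vd (= vc); masked-off lanes are
    // mask-agnostic, so only active lanes are stored below.
    vuint32m1_t vr = __riscv_vwsubu_wx_u32m1_tum(vm, vc, vc, debit, vl);
    __riscv_vse32_v_u32m1_m(vm, counters + i, vr, vl);
    i += vl;
  }
}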
// masked functions
vint16mf4_t __riscv_vwadd_vv_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                         vint8mf8_t vs2, vint8mf8_t vs1,
                                         size_t vl);
vint16mf4_t __riscv_vwadd_vx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                         vint8mf8_t vs2, int8_t rs1, size_t vl);
vint16mf4_t __riscv_vwadd_wv_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                         vint16mf4_t vs2, vint8mf8_t vs1,
                                         size_t vl);
vint16mf4_t __riscv_vwadd_wx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                         vint16mf4_t vs2, int8_t rs1,
                                         size_t vl);
vint16mf2_t __riscv_vwadd_vv_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                         vint8mf4_t vs2, vint8mf4_t vs1,
                                         size_t vl);
vint16mf2_t __riscv_vwadd_vx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                         vint8mf4_t vs2, int8_t rs1, size_t vl);
vint16mf2_t __riscv_vwadd_wv_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                         vint16mf2_t vs2, vint8mf4_t vs1,
                                         size_t vl);
vint16mf2_t __riscv_vwadd_wx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                         vint16mf2_t vs2, int8_t rs1,
                                         size_t vl);
vint16m1_t __riscv_vwadd_vv_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                       vint8mf2_t vs2, vint8mf2_t vs1,
                                       size_t vl);
vint16m1_t __riscv_vwadd_vx_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                       vint8mf2_t vs2, int8_t rs1, size_t vl);
vint16m1_t __riscv_vwadd_wv_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                       vint16m1_t vs2, vint8mf2_t vs1,
                                       size_t vl);
vint16m1_t __riscv_vwadd_wx_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                       vint16m1_t vs2, int8_t rs1, size_t vl);
vint16m2_t __riscv_vwadd_vv_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                       vint8m1_t vs2, vint8m1_t vs1, size_t vl);
vint16m2_t __riscv_vwadd_vx_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                       vint8m1_t vs2, int8_t rs1, size_t vl);
vint16m2_t __riscv_vwadd_wv_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                       vint16m2_t vs2, vint8m1_t vs1,
                                       size_t vl);
vint16m2_t __riscv_vwadd_wx_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                       vint16m2_t vs2, int8_t rs1, size_t vl);
vint16m4_t __riscv_vwadd_vv_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                       vint8m2_t vs2, vint8m2_t vs1, size_t vl);
vint16m4_t __riscv_vwadd_vx_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                       vint8m2_t vs2, int8_t rs1, size_t vl);
vint16m4_t __riscv_vwadd_wv_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                       vint16m4_t vs2, vint8m2_t vs1,
                                       size_t vl);
vint16m4_t __riscv_vwadd_wx_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                       vint16m4_t vs2, int8_t rs1, size_t vl);
vint16m8_t __riscv_vwadd_vv_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                       vint8m4_t vs2, vint8m4_t vs1, size_t vl);
vint16m8_t __riscv_vwadd_vx_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                       vint8m4_t vs2, int8_t rs1, size_t vl);
vint16m8_t __riscv_vwadd_wv_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                       vint16m8_t vs2, vint8m4_t vs1,
                                       size_t vl);
vint16m8_t __riscv_vwadd_wx_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                       vint16m8_t vs2, int8_t rs1, size_t vl);
vint32mf2_t __riscv_vwadd_vv_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                         vint16mf4_t vs2, vint16mf4_t vs1,
                                         size_t vl);
vint32mf2_t __riscv_vwadd_vx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                         vint16mf4_t vs2, int16_t rs1,
                                         size_t vl);
vint32mf2_t __riscv_vwadd_wv_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                         vint32mf2_t vs2, vint16mf4_t vs1,
                                         size_t vl);
vint32mf2_t __riscv_vwadd_wx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                         vint32mf2_t vs2, int16_t rs1,
                                         size_t vl);
vint32m1_t __riscv_vwadd_vv_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                       vint16mf2_t vs2, vint16mf2_t vs1,
                                       size_t vl);
vint32m1_t __riscv_vwadd_vx_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                       vint16mf2_t vs2, int16_t rs1, size_t vl);
vint32m1_t __riscv_vwadd_wv_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                       vint32m1_t vs2, vint16mf2_t vs1,
                                       size_t vl);
vint32m1_t __riscv_vwadd_wx_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                       vint32m1_t vs2, int16_t rs1, size_t vl);
vint32m2_t __riscv_vwadd_vv_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                       vint16m1_t vs2, vint16m1_t vs1,
                                       size_t vl);
vint32m2_t __riscv_vwadd_vx_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                       vint16m1_t vs2, int16_t rs1, size_t vl);
vint32m2_t __riscv_vwadd_wv_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                       vint32m2_t vs2, vint16m1_t vs1,
                                       size_t vl);
vint32m2_t __riscv_vwadd_wx_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                       vint32m2_t vs2, int16_t rs1, size_t vl);
vint32m4_t __riscv_vwadd_vv_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                       vint16m2_t vs2, vint16m2_t vs1,
                                       size_t vl);
vint32m4_t __riscv_vwadd_vx_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                       vint16m2_t vs2, int16_t rs1, size_t vl);
vint32m4_t __riscv_vwadd_wv_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                       vint32m4_t vs2, vint16m2_t vs1,
                                       size_t vl);
vint32m4_t __riscv_vwadd_wx_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                       vint32m4_t vs2, int16_t rs1, size_t vl);
vint32m8_t __riscv_vwadd_vv_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                       vint16m4_t vs2, vint16m4_t vs1,
                                       size_t vl);
vint32m8_t __riscv_vwadd_vx_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                       vint16m4_t vs2, int16_t rs1, size_t vl);
vint32m8_t __riscv_vwadd_wv_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                       vint32m8_t vs2, vint16m4_t vs1,
                                       size_t vl);
vint32m8_t __riscv_vwadd_wx_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                       vint32m8_t vs2, int16_t rs1, size_t vl);
vint64m1_t __riscv_vwadd_vv_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                       vint32mf2_t vs2, vint32mf2_t vs1,
                                       size_t vl);
vint64m1_t __riscv_vwadd_vx_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                       vint32mf2_t vs2, int32_t rs1, size_t vl);
vint64m1_t __riscv_vwadd_wv_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                       vint64m1_t vs2, vint32mf2_t vs1,
                                       size_t vl);
vint64m1_t __riscv_vwadd_wx_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                       vint64m1_t vs2, int32_t rs1, size_t vl);
vint64m2_t __riscv_vwadd_vv_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                       vint32m1_t vs2, vint32m1_t vs1,
                                       size_t vl);
vint64m2_t __riscv_vwadd_vx_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                       vint32m1_t vs2, int32_t rs1, size_t vl);
vint64m2_t __riscv_vwadd_wv_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                       vint64m2_t vs2, vint32m1_t vs1,
                                       size_t vl);
vint64m2_t __riscv_vwadd_wx_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                       vint64m2_t vs2, int32_t rs1, size_t vl);
vint64m4_t __riscv_vwadd_vv_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                       vint32m2_t vs2, vint32m2_t vs1,
                                       size_t vl);
vint64m4_t __riscv_vwadd_vx_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                       vint32m2_t vs2, int32_t rs1, size_t vl);
vint64m4_t __riscv_vwadd_wv_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                       vint64m4_t vs2, vint32m2_t vs1,
                                       size_t vl);
vint64m4_t __riscv_vwadd_wx_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                       vint64m4_t vs2, int32_t rs1, size_t vl);
vint64m8_t __riscv_vwadd_vv_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                       vint32m4_t vs2, vint32m4_t vs1,
                                       size_t vl);
vint64m8_t __riscv_vwadd_vx_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                       vint32m4_t vs2, int32_t rs1, size_t vl);
vint64m8_t __riscv_vwadd_wv_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                       vint64m8_t vs2, vint32m4_t vs1,
                                       size_t vl);
vint64m8_t __riscv_vwadd_wx_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                       vint64m8_t vs2, int32_t rs1, size_t vl);
vint16mf4_t __riscv_vwsub_vv_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                         vint8mf8_t vs2, vint8mf8_t vs1,
                                         size_t vl);
vint16mf4_t __riscv_vwsub_vx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                         vint8mf8_t vs2, int8_t rs1, size_t vl);
vint16mf4_t __riscv_vwsub_wv_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                         vint16mf4_t vs2, vint8mf8_t vs1,
                                         size_t vl);
vint16mf4_t __riscv_vwsub_wx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                         vint16mf4_t vs2, int8_t rs1,
                                         size_t vl);
vint16mf2_t __riscv_vwsub_vv_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                         vint8mf4_t vs2, vint8mf4_t vs1,
                                         size_t vl);
vint16mf2_t __riscv_vwsub_vx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                         vint8mf4_t vs2, int8_t rs1, size_t vl);
vint16mf2_t __riscv_vwsub_wv_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                         vint16mf2_t vs2, vint8mf4_t vs1,
                                         size_t vl);
vint16mf2_t __riscv_vwsub_wx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                         vint16mf2_t vs2, int8_t rs1,
                                         size_t vl);
vint16m1_t __riscv_vwsub_vv_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                       vint8mf2_t vs2, vint8mf2_t vs1,
                                       size_t vl);
vint16m1_t __riscv_vwsub_vx_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                       vint8mf2_t vs2, int8_t rs1, size_t vl);
vint16m1_t __riscv_vwsub_wv_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                       vint16m1_t vs2, vint8mf2_t vs1,
                                       size_t vl);
vint16m1_t __riscv_vwsub_wx_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                       vint16m1_t vs2, int8_t rs1, size_t vl);
vint16m2_t __riscv_vwsub_vv_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                       vint8m1_t vs2, vint8m1_t vs1, size_t vl);
vint16m2_t __riscv_vwsub_vx_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                       vint8m1_t vs2, int8_t rs1, size_t vl);
vint16m2_t __riscv_vwsub_wv_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                       vint16m2_t vs2, vint8m1_t vs1,
                                       size_t vl);
vint16m2_t __riscv_vwsub_wx_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                       vint16m2_t vs2, int8_t rs1, size_t vl);
vint16m4_t __riscv_vwsub_vv_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                       vint8m2_t vs2, vint8m2_t vs1, size_t vl);
vint16m4_t __riscv_vwsub_vx_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                       vint8m2_t vs2, int8_t rs1, size_t vl);
vint16m4_t __riscv_vwsub_wv_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                       vint16m4_t vs2, vint8m2_t vs1,
                                       size_t vl);
vint16m4_t __riscv_vwsub_wx_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                       vint16m4_t vs2, int8_t rs1, size_t vl);
vint16m8_t __riscv_vwsub_vv_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                       vint8m4_t vs2, vint8m4_t vs1, size_t vl);
vint16m8_t __riscv_vwsub_vx_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                       vint8m4_t vs2, int8_t rs1, size_t vl);
vint16m8_t __riscv_vwsub_wv_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                       vint16m8_t vs2, vint8m4_t vs1,
                                       size_t vl);
vint16m8_t __riscv_vwsub_wx_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                       vint16m8_t vs2, int8_t rs1, size_t vl);
vint32mf2_t __riscv_vwsub_vv_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                         vint16mf4_t vs2, vint16mf4_t vs1,
                                         size_t vl);
vint32mf2_t __riscv_vwsub_vx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                         vint16mf4_t vs2, int16_t rs1,
                                         size_t vl);
vint32mf2_t __riscv_vwsub_wv_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                         vint32mf2_t vs2, vint16mf4_t vs1,
                                         size_t vl);
vint32mf2_t __riscv_vwsub_wx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                         vint32mf2_t vs2, int16_t rs1,
                                         size_t vl);
vint32m1_t __riscv_vwsub_vv_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                       vint16mf2_t vs2, vint16mf2_t vs1,
                                       size_t vl);
vint32m1_t __riscv_vwsub_vx_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                       vint16mf2_t vs2, int16_t rs1, size_t vl);
vint32m1_t __riscv_vwsub_wv_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                       vint32m1_t vs2, vint16mf2_t vs1,
                                       size_t vl);
vint32m1_t __riscv_vwsub_wx_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                       vint32m1_t vs2, int16_t rs1, size_t vl);
vint32m2_t __riscv_vwsub_vv_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                       vint16m1_t vs2, vint16m1_t vs1,
                                       size_t vl);
vint32m2_t __riscv_vwsub_vx_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                       vint16m1_t vs2, int16_t rs1, size_t vl);
vint32m2_t __riscv_vwsub_wv_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                       vint32m2_t vs2, vint16m1_t vs1,
                                       size_t vl);
vint32m2_t __riscv_vwsub_wx_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                       vint32m2_t vs2, int16_t rs1, size_t vl);
vint32m4_t __riscv_vwsub_vv_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                       vint16m2_t vs2, vint16m2_t vs1,
                                       size_t vl);
vint32m4_t __riscv_vwsub_vx_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                       vint16m2_t vs2, int16_t rs1, size_t vl);
vint32m4_t __riscv_vwsub_wv_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                       vint32m4_t vs2, vint16m2_t vs1,
                                       size_t vl);
vint32m4_t __riscv_vwsub_wx_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                       vint32m4_t vs2, int16_t rs1, size_t vl);
vint32m8_t __riscv_vwsub_vv_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                       vint16m4_t vs2, vint16m4_t vs1,
                                       size_t vl);
vint32m8_t __riscv_vwsub_vx_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                       vint16m4_t vs2, int16_t rs1, size_t vl);
vint32m8_t __riscv_vwsub_wv_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                       vint32m8_t vs2, vint16m4_t vs1,
                                       size_t vl);
vint32m8_t __riscv_vwsub_wx_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                       vint32m8_t vs2, int16_t rs1, size_t vl);
vint64m1_t __riscv_vwsub_vv_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                       vint32mf2_t vs2, vint32mf2_t vs1,
                                       size_t vl);
vint64m1_t __riscv_vwsub_vx_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                       vint32mf2_t vs2, int32_t rs1, size_t vl);
vint64m1_t __riscv_vwsub_wv_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                       vint64m1_t vs2, vint32mf2_t vs1,
                                       size_t vl);
vint64m1_t __riscv_vwsub_wx_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                       vint64m1_t vs2, int32_t rs1, size_t vl);
vint64m2_t __riscv_vwsub_vv_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                       vint32m1_t vs2, vint32m1_t vs1,
                                       size_t vl);
vint64m2_t __riscv_vwsub_vx_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                       vint32m1_t vs2, int32_t rs1, size_t vl);
vint64m2_t __riscv_vwsub_wv_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                       vint64m2_t vs2, vint32m1_t vs1,
                                       size_t vl);
vint64m2_t __riscv_vwsub_wx_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                       vint64m2_t vs2, int32_t rs1, size_t vl);
vint64m4_t __riscv_vwsub_vv_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                       vint32m2_t vs2, vint32m2_t vs1,
                                       size_t vl);
vint64m4_t __riscv_vwsub_vx_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                       vint32m2_t vs2, int32_t rs1, size_t vl);
vint64m4_t __riscv_vwsub_wv_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                       vint64m4_t vs2, vint32m2_t vs1,
                                       size_t vl);
vint64m4_t __riscv_vwsub_wx_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                       vint64m4_t vs2, int32_t rs1, size_t vl);
vint64m8_t __riscv_vwsub_vv_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                       vint32m4_t vs2, vint32m4_t vs1,
                                       size_t vl);
vint64m8_t __riscv_vwsub_vx_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                       vint32m4_t vs2, int32_t rs1, size_t vl);
vint64m8_t __riscv_vwsub_wv_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                       vint64m8_t vs2, vint32m4_t vs1,
                                       size_t vl);
vint64m8_t __riscv_vwsub_wx_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                       vint64m8_t vs2, int32_t rs1, size_t vl);
vuint16mf4_t __riscv_vwaddu_vv_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                           vuint8mf8_t vs2, vuint8mf8_t vs1,
                                           size_t vl);
vuint16mf4_t __riscv_vwaddu_vx_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                           vuint8mf8_t vs2, uint8_t rs1,
                                           size_t vl);
vuint16mf4_t __riscv_vwaddu_wv_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                           vuint16mf4_t vs2, vuint8mf8_t vs1,
                                           size_t vl);
vuint16mf4_t __riscv_vwaddu_wx_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                           vuint16mf4_t vs2, uint8_t rs1,
                                           size_t vl);
vuint16mf2_t __riscv_vwaddu_vv_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                           vuint8mf4_t vs2, vuint8mf4_t vs1,
                                           size_t vl);
vuint16mf2_t __riscv_vwaddu_vx_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                           vuint8mf4_t vs2, uint8_t rs1,
                                           size_t vl);
vuint16mf2_t __riscv_vwaddu_wv_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                           vuint16mf2_t vs2, vuint8mf4_t vs1,
                                           size_t vl);
vuint16mf2_t __riscv_vwaddu_wx_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                           vuint16mf2_t vs2, uint8_t rs1,
                                           size_t vl);
vuint16m1_t __riscv_vwaddu_vv_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                         vuint8mf2_t vs2, vuint8mf2_t vs1,
                                         size_t vl);
vuint16m1_t __riscv_vwaddu_vx_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                         vuint8mf2_t vs2, uint8_t rs1,
                                         size_t vl);
vuint16m1_t __riscv_vwaddu_wv_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                         vuint16m1_t vs2, vuint8mf2_t vs1,
                                         size_t vl);
vuint16m1_t __riscv_vwaddu_wx_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                         vuint16m1_t vs2, uint8_t rs1,
                                         size_t vl);
vuint16m2_t __riscv_vwaddu_vv_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                         vuint8m1_t vs2, vuint8m1_t vs1,
                                         size_t vl);
vuint16m2_t __riscv_vwaddu_vx_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                         vuint8m1_t vs2, uint8_t rs1,
                                         size_t vl);
vuint16m2_t __riscv_vwaddu_wv_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                         vuint16m2_t vs2, vuint8m1_t vs1,
                                         size_t vl);
vuint16m2_t __riscv_vwaddu_wx_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                         vuint16m2_t vs2, uint8_t rs1,
                                         size_t vl);
vuint16m4_t __riscv_vwaddu_vv_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                         vuint8m2_t vs2, vuint8m2_t vs1,
                                         size_t vl);
vuint16m4_t __riscv_vwaddu_vx_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                         vuint8m2_t vs2, uint8_t rs1,
                                         size_t vl);
vuint16m4_t __riscv_vwaddu_wv_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                         vuint16m4_t vs2, vuint8m2_t vs1,
                                         size_t vl);
vuint16m4_t __riscv_vwaddu_wx_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                         vuint16m4_t vs2, uint8_t rs1,
                                         size_t vl);
vuint16m8_t __riscv_vwaddu_vv_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                         vuint8m4_t vs2, vuint8m4_t vs1,
                                         size_t vl);
vuint16m8_t __riscv_vwaddu_vx_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                         vuint8m4_t vs2, uint8_t rs1,
                                         size_t vl);
vuint16m8_t __riscv_vwaddu_wv_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                         vuint16m8_t vs2, vuint8m4_t vs1,
                                         size_t vl);
vuint16m8_t __riscv_vwaddu_wx_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                         vuint16m8_t vs2, uint8_t rs1,
                                         size_t vl);
vuint32mf2_t __riscv_vwaddu_vv_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                           vuint16mf4_t vs2, vuint16mf4_t vs1,
                                           size_t vl);
vuint32mf2_t __riscv_vwaddu_vx_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                           vuint16mf4_t vs2, uint16_t rs1,
                                           size_t vl);
vuint32mf2_t __riscv_vwaddu_wv_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                           vuint32mf2_t vs2, vuint16mf4_t vs1,
                                           size_t vl);
vuint32mf2_t __riscv_vwaddu_wx_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                           vuint32mf2_t vs2, uint16_t rs1,
                                           size_t vl);
vuint32m1_t __riscv_vwaddu_vv_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                         vuint16mf2_t vs2, vuint16mf2_t vs1,
                                         size_t vl);
vuint32m1_t __riscv_vwaddu_vx_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                         vuint16mf2_t vs2, uint16_t rs1,
                                         size_t vl);
vuint32m1_t __riscv_vwaddu_wv_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                         vuint32m1_t vs2, vuint16mf2_t vs1,
                                         size_t vl);
vuint32m1_t __riscv_vwaddu_wx_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                         vuint32m1_t vs2, uint16_t rs1,
                                         size_t vl);
vuint32m2_t __riscv_vwaddu_vv_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                         vuint16m1_t vs2, vuint16m1_t vs1,
                                         size_t vl);
vuint32m2_t __riscv_vwaddu_vx_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                         vuint16m1_t vs2, uint16_t rs1,
                                         size_t vl);
vuint32m2_t __riscv_vwaddu_wv_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                         vuint32m2_t vs2, vuint16m1_t vs1,
                                         size_t vl);
vuint32m2_t __riscv_vwaddu_wx_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                         vuint32m2_t vs2, uint16_t rs1,
                                         size_t vl);
vuint32m4_t __riscv_vwaddu_vv_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                         vuint16m2_t vs2, vuint16m2_t vs1,
                                         size_t vl);
vuint32m4_t __riscv_vwaddu_vx_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                         vuint16m2_t vs2, uint16_t rs1,
                                         size_t vl);
vuint32m4_t __riscv_vwaddu_wv_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                         vuint32m4_t vs2, vuint16m2_t vs1,
                                         size_t vl);
vuint32m4_t __riscv_vwaddu_wx_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                         vuint32m4_t vs2, uint16_t rs1,
                                         size_t vl);
vuint32m8_t __riscv_vwaddu_vv_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                         vuint16m4_t vs2, vuint16m4_t vs1,
                                         size_t vl);
vuint32m8_t __riscv_vwaddu_vx_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                         vuint16m4_t vs2, uint16_t rs1,
                                         size_t vl);
vuint32m8_t __riscv_vwaddu_wv_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                         vuint32m8_t vs2, vuint16m4_t vs1,
                                         size_t vl);
vuint32m8_t __riscv_vwaddu_wx_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                         vuint32m8_t vs2, uint16_t rs1,
                                         size_t vl);
vuint64m1_t __riscv_vwaddu_vv_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                         vuint32mf2_t vs2, vuint32mf2_t vs1,
                                         size_t vl);
vuint64m1_t __riscv_vwaddu_vx_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                         vuint32mf2_t vs2, uint32_t rs1,
                                         size_t vl);
vuint64m1_t __riscv_vwaddu_wv_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                         vuint64m1_t vs2, vuint32mf2_t vs1,
                                         size_t vl);
vuint64m1_t __riscv_vwaddu_wx_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                         vuint64m1_t vs2, uint32_t rs1,
                                         size_t vl);
vuint64m2_t __riscv_vwaddu_vv_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                         vuint32m1_t vs2, vuint32m1_t vs1,
                                         size_t vl);
vuint64m2_t __riscv_vwaddu_vx_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                         vuint32m1_t vs2, uint32_t rs1,
                                         size_t vl);
vuint64m2_t __riscv_vwaddu_wv_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                         vuint64m2_t vs2, vuint32m1_t vs1,
                                         size_t vl);
vuint64m2_t __riscv_vwaddu_wx_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                         vuint64m2_t vs2, uint32_t rs1,
                                         size_t vl);
vuint64m4_t __riscv_vwaddu_vv_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                         vuint32m2_t vs2, vuint32m2_t vs1,
                                         size_t vl);
vuint64m4_t __riscv_vwaddu_vx_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                         vuint32m2_t vs2, uint32_t rs1,
                                         size_t vl);
vuint64m4_t __riscv_vwaddu_wv_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                         vuint64m4_t vs2, vuint32m2_t vs1,
                                         size_t vl);
vuint64m4_t __riscv_vwaddu_wx_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                         vuint64m4_t vs2, uint32_t rs1,
                                         size_t vl);
vuint64m8_t __riscv_vwaddu_vv_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                         vuint32m4_t vs2, vuint32m4_t vs1,
                                         size_t vl);
vuint64m8_t __riscv_vwaddu_vx_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                         vuint32m4_t vs2, uint32_t rs1,
                                         size_t vl);
vuint64m8_t __riscv_vwaddu_wv_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                         vuint64m8_t vs2, vuint32m4_t vs1,
                                         size_t vl);
vuint64m8_t __riscv_vwaddu_wx_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                         vuint64m8_t vs2, uint32_t rs1,
                                         size_t vl);
vuint16mf4_t __riscv_vwsubu_vv_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                           vuint8mf8_t vs2, vuint8mf8_t vs1,
                                           size_t vl);
vuint16mf4_t __riscv_vwsubu_vx_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                           vuint8mf8_t vs2, uint8_t rs1,
                                           size_t vl);
vuint16mf4_t __riscv_vwsubu_wv_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                           vuint16mf4_t vs2, vuint8mf8_t vs1,
                                           size_t vl);
vuint16mf4_t __riscv_vwsubu_wx_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                           vuint16mf4_t vs2, uint8_t rs1,
                                           size_t vl);
vuint16mf2_t __riscv_vwsubu_vv_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                           vuint8mf4_t vs2, vuint8mf4_t vs1,
                                           size_t vl);
vuint16mf2_t __riscv_vwsubu_vx_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                           vuint8mf4_t vs2, uint8_t rs1,
                                           size_t vl);
vuint16mf2_t __riscv_vwsubu_wv_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                           vuint16mf2_t vs2, vuint8mf4_t vs1,
                                           size_t vl);
vuint16mf2_t __riscv_vwsubu_wx_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                           vuint16mf2_t vs2, uint8_t rs1,
                                           size_t vl);
vuint16m1_t __riscv_vwsubu_vv_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                         vuint8mf2_t vs2, vuint8mf2_t vs1,
                                         size_t vl);
vuint16m1_t __riscv_vwsubu_vx_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                         vuint8mf2_t vs2, uint8_t rs1,
                                         size_t vl);
vuint16m1_t __riscv_vwsubu_wv_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                         vuint16m1_t vs2, vuint8mf2_t vs1,
                                         size_t vl);
vuint16m1_t __riscv_vwsubu_wx_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                         vuint16m1_t vs2, uint8_t rs1,
                                         size_t vl);
vuint16m2_t __riscv_vwsubu_vv_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                         vuint8m1_t vs2, vuint8m1_t vs1,
                                         size_t vl);
vuint16m2_t __riscv_vwsubu_vx_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                         vuint8m1_t vs2, uint8_t rs1,
                                         size_t vl);
vuint16m2_t __riscv_vwsubu_wv_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                         vuint16m2_t vs2, vuint8m1_t vs1,
                                         size_t vl);
vuint16m2_t __riscv_vwsubu_wx_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                         vuint16m2_t vs2, uint8_t rs1,
                                         size_t vl);
vuint16m4_t __riscv_vwsubu_vv_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                         vuint8m2_t vs2, vuint8m2_t vs1,
                                         size_t vl);
vuint16m4_t __riscv_vwsubu_vx_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                         vuint8m2_t vs2, uint8_t rs1,
                                         size_t vl);
vuint16m4_t __riscv_vwsubu_wv_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                         vuint16m4_t vs2, vuint8m2_t vs1,
                                         size_t vl);
vuint16m4_t __riscv_vwsubu_wx_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                         vuint16m4_t vs2, uint8_t rs1,
                                         size_t vl);
vuint16m8_t __riscv_vwsubu_vv_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                         vuint8m4_t vs2, vuint8m4_t vs1,
                                         size_t vl);
vuint16m8_t __riscv_vwsubu_vx_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                         vuint8m4_t vs2, uint8_t rs1,
                                         size_t vl);
vuint16m8_t __riscv_vwsubu_wv_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                         vuint16m8_t vs2, vuint8m4_t vs1,
                                         size_t vl);
vuint16m8_t __riscv_vwsubu_wx_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                         vuint16m8_t vs2, uint8_t rs1,
                                         size_t vl);
vuint32mf2_t __riscv_vwsubu_vv_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                           vuint16mf4_t vs2, vuint16mf4_t vs1,
                                           size_t vl);
vuint32mf2_t __riscv_vwsubu_vx_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                           vuint16mf4_t vs2, uint16_t rs1,
                                           size_t vl);
vuint32mf2_t __riscv_vwsubu_wv_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                           vuint32mf2_t vs2, vuint16mf4_t vs1,
                                           size_t vl);
vuint32mf2_t __riscv_vwsubu_wx_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                           vuint32mf2_t vs2, uint16_t rs1,
                                           size_t vl);
vuint32m1_t __riscv_vwsubu_vv_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                         vuint16mf2_t vs2, vuint16mf2_t vs1,
                                         size_t vl);
vuint32m1_t __riscv_vwsubu_vx_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                         vuint16mf2_t vs2, uint16_t rs1,
                                         size_t vl);
vuint32m1_t __riscv_vwsubu_wv_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                         vuint32m1_t vs2, vuint16mf2_t vs1,
                                         size_t vl);
vuint32m1_t __riscv_vwsubu_wx_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                         vuint32m1_t vs2, uint16_t rs1,
                                         size_t vl);
vuint32m2_t __riscv_vwsubu_vv_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                         vuint16m1_t vs2, vuint16m1_t vs1,
                                         size_t vl);
vuint32m2_t __riscv_vwsubu_vx_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                         vuint16m1_t vs2, uint16_t rs1,
                                         size_t vl);
vuint32m2_t __riscv_vwsubu_wv_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                         vuint32m2_t vs2, vuint16m1_t vs1,
                                         size_t vl);
vuint32m2_t __riscv_vwsubu_wx_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                         vuint32m2_t vs2, uint16_t rs1,
                                         size_t vl);
vuint32m4_t __riscv_vwsubu_vv_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                         vuint16m2_t vs2, vuint16m2_t vs1,
                                         size_t vl);
vuint32m4_t __riscv_vwsubu_vx_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                         vuint16m2_t vs2, uint16_t rs1,
                                         size_t vl);
vuint32m4_t __riscv_vwsubu_wv_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                         vuint32m4_t vs2, vuint16m2_t vs1,
                                         size_t vl);
vuint32m4_t __riscv_vwsubu_wx_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                         vuint32m4_t vs2, uint16_t rs1,
                                         size_t vl);
vuint32m8_t __riscv_vwsubu_vv_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                         vuint16m4_t vs2, vuint16m4_t vs1,
                                         size_t vl);
vuint32m8_t __riscv_vwsubu_vx_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                         vuint16m4_t vs2, uint16_t rs1,
                                         size_t vl);
vuint32m8_t __riscv_vwsubu_wv_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                         vuint32m8_t vs2, vuint16m4_t vs1,
                                         size_t vl);
vuint32m8_t __riscv_vwsubu_wx_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                         vuint32m8_t vs2, uint16_t rs1,
                                         size_t vl);
vuint64m1_t __riscv_vwsubu_vv_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                         vuint32mf2_t vs2, vuint32mf2_t vs1,
                                         size_t vl);
vuint64m1_t __riscv_vwsubu_vx_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                         vuint32mf2_t vs2, uint32_t rs1,
                                         size_t vl);
vuint64m1_t __riscv_vwsubu_wv_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                         vuint64m1_t vs2, vuint32mf2_t vs1,
                                         size_t vl);
vuint64m1_t __riscv_vwsubu_wx_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                         vuint64m1_t vs2, uint32_t rs1,
                                         size_t vl);
vuint64m2_t __riscv_vwsubu_vv_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                         vuint32m1_t vs2, vuint32m1_t vs1,
                                         size_t vl);
vuint64m2_t __riscv_vwsubu_vx_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                         vuint32m1_t vs2, uint32_t rs1,
                                         size_t vl);
vuint64m2_t __riscv_vwsubu_wv_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                         vuint64m2_t vs2, vuint32m1_t vs1,
                                         size_t vl);
vuint64m2_t __riscv_vwsubu_wx_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                         vuint64m2_t vs2, uint32_t rs1,
                                         size_t vl);
vuint64m4_t __riscv_vwsubu_vv_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                         vuint32m2_t vs2, vuint32m2_t vs1,
                                         size_t vl);
vuint64m4_t __riscv_vwsubu_vx_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                         vuint32m2_t vs2, uint32_t rs1,
                                         size_t vl);
vuint64m4_t __riscv_vwsubu_wv_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                         vuint64m4_t vs2, vuint32m2_t vs1,
                                         size_t vl);
vuint64m4_t __riscv_vwsubu_wx_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                         vuint64m4_t vs2, uint32_t rs1,
                                         size_t vl);
vuint64m8_t __riscv_vwsubu_vv_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                         vuint32m4_t vs2, vuint32m4_t vs1,
                                         size_t vl);
vuint64m8_t __riscv_vwsubu_vx_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                         vuint32m4_t vs2, uint32_t rs1,
                                         size_t vl);
vuint64m8_t __riscv_vwsubu_wv_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                         vuint64m8_t vs2, vuint32m4_t vs1,
                                         size_t vl);
vuint64m8_t __riscv_vwsubu_wx_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                         vuint64m8_t vs2, uint32_t rs1,
                                         size_t vl);
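
As a brief usage sketch (not part of the listing itself, and using hypothetical buffer and function names): the tail-undisturbed, mask-undisturbed (_tumu) variants above take the destination operand vd immediately after the mask, and both masked-off and tail elements keep whatever vd already holds. The fragment below widens and adds two int8_t inputs into an int16_t output only where the first input is positive.

#include <riscv_vector.h>

// Hypothetical helper: out[i] = a[i] + b[i] (widened to int16_t) where a[i] > 0.
// Where a[i] <= 0, the _tumu policy leaves vd undisturbed, so the old contents
// of out[] (loaded into vd beforehand) are written back unchanged.
void widen_add_pos_tumu(int16_t *out, const int8_t *a, const int8_t *b,
                        size_t n) {
  for (size_t i = 0; i < n;) {
    size_t vl = __riscv_vsetvl_e8m1(n - i);
    vint8m1_t va = __riscv_vle8_v_i8m1(a + i, vl);
    vint8m1_t vb = __riscv_vle8_v_i8m1(b + i, vl);
    vint16m2_t vd = __riscv_vle16_v_i16m2(out + i, vl);   // previous destination values
    vbool8_t vm = __riscv_vmsgt_vx_i8m1_b8(va, 0, vl);    // mask: a[i] > 0
    vd = __riscv_vwadd_vv_i16m2_tumu(vm, vd, va, vb, vl); // masked widening add
    __riscv_vse16_v_i16m2(out + i, vd, vl);
    i += vl;
  }
}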
// masked functions
vint16mf4_t __riscv_vwadd_vv_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                       vint8mf8_t vs2, vint8mf8_t vs1,
                                       size_t vl);
vint16mf4_t __riscv_vwadd_vx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                       vint8mf8_t vs2, int8_t rs1, size_t vl);
vint16mf4_t __riscv_vwadd_wv_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs2, vint8mf8_t vs1,
                                       size_t vl);
vint16mf4_t __riscv_vwadd_wx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs2, int8_t rs1, size_t vl);
vint16mf2_t __riscv_vwadd_vv_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                       vint8mf4_t vs2, vint8mf4_t vs1,
                                       size_t vl);
vint16mf2_t __riscv_vwadd_vx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                       vint8mf4_t vs2, int8_t rs1, size_t vl);
vint16mf2_t __riscv_vwadd_wv_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs2, vint8mf4_t vs1,
                                       size_t vl);
vint16mf2_t __riscv_vwadd_wx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs2, int8_t rs1, size_t vl);
vint16m1_t __riscv_vwadd_vv_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                     vint8mf2_t vs2, vint8mf2_t vs1, size_t vl);
vint16m1_t __riscv_vwadd_vx_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                     vint8mf2_t vs2, int8_t rs1, size_t vl);
vint16m1_t __riscv_vwadd_wv_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs2, vint8mf2_t vs1, size_t vl);
vint16m1_t __riscv_vwadd_wx_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs2, int8_t rs1, size_t vl);
vint16m2_t __riscv_vwadd_vv_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint8m1_t vs2,
                                     vint8m1_t vs1, size_t vl);
vint16m2_t __riscv_vwadd_vx_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint8m1_t vs2,
                                     int8_t rs1, size_t vl);
vint16m2_t __riscv_vwadd_wv_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                     vint8m1_t vs1, size_t vl);
vint16m2_t __riscv_vwadd_wx_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                     int8_t rs1, size_t vl);
vint16m4_t __riscv_vwadd_vv_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint8m2_t vs2,
                                     vint8m2_t vs1, size_t vl);
vint16m4_t __riscv_vwadd_vx_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint8m2_t vs2,
                                     int8_t rs1, size_t vl);
vint16m4_t __riscv_vwadd_wv_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                     vint8m2_t vs1, size_t vl);
vint16m4_t __riscv_vwadd_wx_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                     int8_t rs1, size_t vl);
vint16m8_t __riscv_vwadd_vv_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint8m4_t vs2,
                                     vint8m4_t vs1, size_t vl);
vint16m8_t __riscv_vwadd_vx_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint8m4_t vs2,
                                     int8_t rs1, size_t vl);
vint16m8_t __riscv_vwadd_wv_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                     vint8m4_t vs1, size_t vl);
vint16m8_t __riscv_vwadd_wx_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                     int8_t rs1, size_t vl);
vint32mf2_t __riscv_vwadd_vv_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                       vint16mf4_t vs2, vint16mf4_t vs1,
                                       size_t vl);
vint32mf2_t __riscv_vwadd_vx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                       vint16mf4_t vs2, int16_t rs1, size_t vl);
vint32mf2_t __riscv_vwadd_wv_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs2, vint16mf4_t vs1,
                                       size_t vl);
vint32mf2_t __riscv_vwadd_wx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs2, int16_t rs1, size_t vl);
vint32m1_t __riscv_vwadd_vv_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                     vint16mf2_t vs2, vint16mf2_t vs1,
                                     size_t vl);
vint32m1_t __riscv_vwadd_vx_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                     vint16mf2_t vs2, int16_t rs1, size_t vl);
vint32m1_t __riscv_vwadd_wv_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs2, vint16mf2_t vs1,
                                     size_t vl);
vint32m1_t __riscv_vwadd_wx_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs2, int16_t rs1, size_t vl);
vint32m2_t __riscv_vwadd_vv_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                     vint16m1_t vs2, vint16m1_t vs1, size_t vl);
vint32m2_t __riscv_vwadd_vx_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                     vint16m1_t vs2, int16_t rs1, size_t vl);
vint32m2_t __riscv_vwadd_wv_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs2, vint16m1_t vs1, size_t vl);
vint32m2_t __riscv_vwadd_wx_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs2, int16_t rs1, size_t vl);
vint32m4_t __riscv_vwadd_vv_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint16m2_t vs2,
                                     vint16m2_t vs1, size_t vl);
vint32m4_t __riscv_vwadd_vx_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint16m2_t vs2,
                                     int16_t rs1, size_t vl);
vint32m4_t __riscv_vwadd_wv_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                     vint16m2_t vs1, size_t vl);
vint32m4_t __riscv_vwadd_wx_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                     int16_t rs1, size_t vl);
vint32m8_t __riscv_vwadd_vv_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint16m4_t vs2,
                                     vint16m4_t vs1, size_t vl);
vint32m8_t __riscv_vwadd_vx_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint16m4_t vs2,
                                     int16_t rs1, size_t vl);
vint32m8_t __riscv_vwadd_wv_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                     vint16m4_t vs1, size_t vl);
vint32m8_t __riscv_vwadd_wx_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                     int16_t rs1, size_t vl);
vint64m1_t __riscv_vwadd_vv_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                     vint32mf2_t vs2, vint32mf2_t vs1,
                                     size_t vl);
vint64m1_t __riscv_vwadd_vx_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                     vint32mf2_t vs2, int32_t rs1, size_t vl);
vint64m1_t __riscv_vwadd_wv_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs2, vint32mf2_t vs1,
                                     size_t vl);
vint64m1_t __riscv_vwadd_wx_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs2, int32_t rs1, size_t vl);
vint64m2_t __riscv_vwadd_vv_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                     vint32m1_t vs2, vint32m1_t vs1, size_t vl);
vint64m2_t __riscv_vwadd_vx_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                     vint32m1_t vs2, int32_t rs1, size_t vl);
vint64m2_t __riscv_vwadd_wv_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs2, vint32m1_t vs1, size_t vl);
vint64m2_t __riscv_vwadd_wx_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs2, int32_t rs1, size_t vl);
vint64m4_t __riscv_vwadd_vv_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                     vint32m2_t vs2, vint32m2_t vs1, size_t vl);
vint64m4_t __riscv_vwadd_vx_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                     vint32m2_t vs2, int32_t rs1, size_t vl);
vint64m4_t __riscv_vwadd_wv_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs2, vint32m2_t vs1, size_t vl);
vint64m4_t __riscv_vwadd_wx_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs2, int32_t rs1, size_t vl);
vint64m8_t __riscv_vwadd_vv_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint32m4_t vs2,
                                     vint32m4_t vs1, size_t vl);
vint64m8_t __riscv_vwadd_vx_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint32m4_t vs2,
                                     int32_t rs1, size_t vl);
vint64m8_t __riscv_vwadd_wv_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                     vint32m4_t vs1, size_t vl);
vint64m8_t __riscv_vwadd_wx_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                     int32_t rs1, size_t vl);
vint16mf4_t __riscv_vwsub_vv_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                       vint8mf8_t vs2, vint8mf8_t vs1,
                                       size_t vl);
vint16mf4_t __riscv_vwsub_vx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                       vint8mf8_t vs2, int8_t rs1, size_t vl);
vint16mf4_t __riscv_vwsub_wv_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs2, vint8mf8_t vs1,
                                       size_t vl);
vint16mf4_t __riscv_vwsub_wx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs2, int8_t rs1, size_t vl);
vint16mf2_t __riscv_vwsub_vv_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                       vint8mf4_t vs2, vint8mf4_t vs1,
                                       size_t vl);
vint16mf2_t __riscv_vwsub_vx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                       vint8mf4_t vs2, int8_t rs1, size_t vl);
vint16mf2_t __riscv_vwsub_wv_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs2, vint8mf4_t vs1,
                                       size_t vl);
vint16mf2_t __riscv_vwsub_wx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs2, int8_t rs1, size_t vl);
vint16m1_t __riscv_vwsub_vv_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                     vint8mf2_t vs2, vint8mf2_t vs1, size_t vl);
vint16m1_t __riscv_vwsub_vx_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                     vint8mf2_t vs2, int8_t rs1, size_t vl);
vint16m1_t __riscv_vwsub_wv_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs2, vint8mf2_t vs1, size_t vl);
vint16m1_t __riscv_vwsub_wx_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs2, int8_t rs1, size_t vl);
vint16m2_t __riscv_vwsub_vv_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint8m1_t vs2,
                                     vint8m1_t vs1, size_t vl);
vint16m2_t __riscv_vwsub_vx_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint8m1_t vs2,
                                     int8_t rs1, size_t vl);
vint16m2_t __riscv_vwsub_wv_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                     vint8m1_t vs1, size_t vl);
vint16m2_t __riscv_vwsub_wx_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                     int8_t rs1, size_t vl);
vint16m4_t __riscv_vwsub_vv_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint8m2_t vs2,
                                     vint8m2_t vs1, size_t vl);
vint16m4_t __riscv_vwsub_vx_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint8m2_t vs2,
                                     int8_t rs1, size_t vl);
vint16m4_t __riscv_vwsub_wv_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                     vint8m2_t vs1, size_t vl);
vint16m4_t __riscv_vwsub_wx_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                     int8_t rs1, size_t vl);
vint16m8_t __riscv_vwsub_vv_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint8m4_t vs2,
                                     vint8m4_t vs1, size_t vl);
vint16m8_t __riscv_vwsub_vx_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint8m4_t vs2,
                                     int8_t rs1, size_t vl);
vint16m8_t __riscv_vwsub_wv_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                     vint8m4_t vs1, size_t vl);
vint16m8_t __riscv_vwsub_wx_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                     int8_t rs1, size_t vl);
vint32mf2_t __riscv_vwsub_vv_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                       vint16mf4_t vs2, vint16mf4_t vs1,
                                       size_t vl);
vint32mf2_t __riscv_vwsub_vx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                       vint16mf4_t vs2, int16_t rs1, size_t vl);
vint32mf2_t __riscv_vwsub_wv_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs2, vint16mf4_t vs1,
                                       size_t vl);
vint32mf2_t __riscv_vwsub_wx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs2, int16_t rs1, size_t vl);
vint32m1_t __riscv_vwsub_vv_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                     vint16mf2_t vs2, vint16mf2_t vs1,
                                     size_t vl);
vint32m1_t __riscv_vwsub_vx_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                     vint16mf2_t vs2, int16_t rs1, size_t vl);
vint32m1_t __riscv_vwsub_wv_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs2, vint16mf2_t vs1,
                                     size_t vl);
vint32m1_t __riscv_vwsub_wx_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs2, int16_t rs1, size_t vl);
vint32m2_t __riscv_vwsub_vv_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                     vint16m1_t vs2, vint16m1_t vs1, size_t vl);
vint32m2_t __riscv_vwsub_vx_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                     vint16m1_t vs2, int16_t rs1, size_t vl);
vint32m2_t __riscv_vwsub_wv_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs2, vint16m1_t vs1, size_t vl);
vint32m2_t __riscv_vwsub_wx_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs2, int16_t rs1, size_t vl);
vint32m4_t __riscv_vwsub_vv_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint16m2_t vs2,
                                     vint16m2_t vs1, size_t vl);
vint32m4_t __riscv_vwsub_vx_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint16m2_t vs2,
                                     int16_t rs1, size_t vl);
vint32m4_t __riscv_vwsub_wv_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                     vint16m2_t vs1, size_t vl);
vint32m4_t __riscv_vwsub_wx_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                     int16_t rs1, size_t vl);
vint32m8_t __riscv_vwsub_vv_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint16m4_t vs2,
                                     vint16m4_t vs1, size_t vl);
vint32m8_t __riscv_vwsub_vx_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint16m4_t vs2,
                                     int16_t rs1, size_t vl);
vint32m8_t __riscv_vwsub_wv_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                     vint16m4_t vs1, size_t vl);
vint32m8_t __riscv_vwsub_wx_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                     int16_t rs1, size_t vl);
vint64m1_t __riscv_vwsub_vv_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                     vint32mf2_t vs2, vint32mf2_t vs1,
                                     size_t vl);
vint64m1_t __riscv_vwsub_vx_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                     vint32mf2_t vs2, int32_t rs1, size_t vl);
vint64m1_t __riscv_vwsub_wv_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs2, vint32mf2_t vs1,
                                     size_t vl);
vint64m1_t __riscv_vwsub_wx_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs2, int32_t rs1, size_t vl);
vint64m2_t __riscv_vwsub_vv_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                     vint32m1_t vs2, vint32m1_t vs1, size_t vl);
vint64m2_t __riscv_vwsub_vx_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                     vint32m1_t vs2, int32_t rs1, size_t vl);
vint64m2_t __riscv_vwsub_wv_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs2, vint32m1_t vs1, size_t vl);
vint64m2_t __riscv_vwsub_wx_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs2, int32_t rs1, size_t vl);
vint64m4_t __riscv_vwsub_vv_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                     vint32m2_t vs2, vint32m2_t vs1, size_t vl);
vint64m4_t __riscv_vwsub_vx_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                     vint32m2_t vs2, int32_t rs1, size_t vl);
vint64m4_t __riscv_vwsub_wv_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs2, vint32m2_t vs1, size_t vl);
vint64m4_t __riscv_vwsub_wx_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs2, int32_t rs1, size_t vl);
vint64m8_t __riscv_vwsub_vv_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint32m4_t vs2,
                                     vint32m4_t vs1, size_t vl);
vint64m8_t __riscv_vwsub_vx_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint32m4_t vs2,
                                     int32_t rs1, size_t vl);
vint64m8_t __riscv_vwsub_wv_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                     vint32m4_t vs1, size_t vl);
vint64m8_t __riscv_vwsub_wx_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                     int32_t rs1, size_t vl);
vuint16mf4_t __riscv_vwaddu_vv_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                         vuint8mf8_t vs2, vuint8mf8_t vs1,
                                         size_t vl);
vuint16mf4_t __riscv_vwaddu_vx_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                         vuint8mf8_t vs2, uint8_t rs1,
                                         size_t vl);
vuint16mf4_t __riscv_vwaddu_wv_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs2, vuint8mf8_t vs1,
                                         size_t vl);
vuint16mf4_t __riscv_vwaddu_wx_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs2, uint8_t rs1,
                                         size_t vl);
vuint16mf2_t __riscv_vwaddu_vv_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                         vuint8mf4_t vs2, vuint8mf4_t vs1,
                                         size_t vl);
vuint16mf2_t __riscv_vwaddu_vx_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                         vuint8mf4_t vs2, uint8_t rs1,
                                         size_t vl);
vuint16mf2_t __riscv_vwaddu_wv_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs2, vuint8mf4_t vs1,
                                         size_t vl);
vuint16mf2_t __riscv_vwaddu_wx_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs2, uint8_t rs1,
                                         size_t vl);
vuint16m1_t __riscv_vwaddu_vv_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                       vuint8mf2_t vs2, vuint8mf2_t vs1,
                                       size_t vl);
vuint16m1_t __riscv_vwaddu_vx_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                       vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint16m1_t __riscv_vwaddu_wv_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs2, vuint8mf2_t vs1,
                                       size_t vl);
vuint16m1_t __riscv_vwaddu_wx_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs2, uint8_t rs1, size_t vl);
vuint16m2_t __riscv_vwaddu_vv_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                       vuint8m1_t vs2, vuint8m1_t vs1,
                                       size_t vl);
vuint16m2_t __riscv_vwaddu_vx_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                       vuint8m1_t vs2, uint8_t rs1, size_t vl);
vuint16m2_t __riscv_vwaddu_wv_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs2, vuint8m1_t vs1,
                                       size_t vl);
vuint16m2_t __riscv_vwaddu_wx_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs2, uint8_t rs1, size_t vl);
vuint16m4_t __riscv_vwaddu_vv_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                       vuint8m2_t vs2, vuint8m2_t vs1,
                                       size_t vl);
vuint16m4_t __riscv_vwaddu_vx_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                       vuint8m2_t vs2, uint8_t rs1, size_t vl);
vuint16m4_t __riscv_vwaddu_wv_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs2, vuint8m2_t vs1,
                                       size_t vl);
vuint16m4_t __riscv_vwaddu_wx_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs2, uint8_t rs1, size_t vl);
vuint16m8_t __riscv_vwaddu_vv_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                       vuint8m4_t vs2, vuint8m4_t vs1,
                                       size_t vl);
vuint16m8_t __riscv_vwaddu_vx_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                       vuint8m4_t vs2, uint8_t rs1, size_t vl);
vuint16m8_t __riscv_vwaddu_wv_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs2, vuint8m4_t vs1,
                                       size_t vl);
vuint16m8_t __riscv_vwaddu_wx_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs2, uint8_t rs1, size_t vl);
vuint32mf2_t __riscv_vwaddu_vv_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                         vuint16mf4_t vs2, vuint16mf4_t vs1,
                                         size_t vl);
vuint32mf2_t __riscv_vwaddu_vx_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                         vuint16mf4_t vs2, uint16_t rs1,
                                         size_t vl);
vuint32mf2_t __riscv_vwaddu_wv_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs2, vuint16mf4_t vs1,
                                         size_t vl);
vuint32mf2_t __riscv_vwaddu_wx_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs2, uint16_t rs1,
                                         size_t vl);
vuint32m1_t __riscv_vwaddu_vv_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                       vuint16mf2_t vs2, vuint16mf2_t vs1,
                                       size_t vl);
vuint32m1_t __riscv_vwaddu_vx_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                       vuint16mf2_t vs2, uint16_t rs1,
                                       size_t vl);
vuint32m1_t __riscv_vwaddu_wv_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs2, vuint16mf2_t vs1,
                                       size_t vl);
vuint32m1_t __riscv_vwaddu_wx_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs2, uint16_t rs1,
                                       size_t vl);
vuint32m2_t __riscv_vwaddu_vv_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                       vuint16m1_t vs2, vuint16m1_t vs1,
                                       size_t vl);
vuint32m2_t __riscv_vwaddu_vx_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                       vuint16m1_t vs2, uint16_t rs1,
                                       size_t vl);
vuint32m2_t __riscv_vwaddu_wv_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs2, vuint16m1_t vs1,
                                       size_t vl);
vuint32m2_t __riscv_vwaddu_wx_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs2, uint16_t rs1,
                                       size_t vl);
vuint32m4_t __riscv_vwaddu_vv_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                       vuint16m2_t vs2, vuint16m2_t vs1,
                                       size_t vl);
vuint32m4_t __riscv_vwaddu_vx_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                       vuint16m2_t vs2, uint16_t rs1,
                                       size_t vl);
vuint32m4_t __riscv_vwaddu_wv_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs2, vuint16m2_t vs1,
                                       size_t vl);
vuint32m4_t __riscv_vwaddu_wx_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs2, uint16_t rs1,
                                       size_t vl);
vuint32m8_t __riscv_vwaddu_vv_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                       vuint16m4_t vs2, vuint16m4_t vs1,
                                       size_t vl);
vuint32m8_t __riscv_vwaddu_vx_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                       vuint16m4_t vs2, uint16_t rs1,
                                       size_t vl);
vuint32m8_t __riscv_vwaddu_wv_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs2, vuint16m4_t vs1,
                                       size_t vl);
vuint32m8_t __riscv_vwaddu_wx_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs2, uint16_t rs1,
                                       size_t vl);
vuint64m1_t __riscv_vwaddu_vv_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                       vuint32mf2_t vs2, vuint32mf2_t vs1,
                                       size_t vl);
vuint64m1_t __riscv_vwaddu_vx_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                       vuint32mf2_t vs2, uint32_t rs1,
                                       size_t vl);
vuint64m1_t __riscv_vwaddu_wv_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs2, vuint32mf2_t vs1,
                                       size_t vl);
vuint64m1_t __riscv_vwaddu_wx_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs2, uint32_t rs1,
                                       size_t vl);
vuint64m2_t __riscv_vwaddu_vv_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                       vuint32m1_t vs2, vuint32m1_t vs1,
                                       size_t vl);
vuint64m2_t __riscv_vwaddu_vx_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                       vuint32m1_t vs2, uint32_t rs1,
                                       size_t vl);
vuint64m2_t __riscv_vwaddu_wv_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs2, vuint32m1_t vs1,
                                       size_t vl);
vuint64m2_t __riscv_vwaddu_wx_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs2, uint32_t rs1,
                                       size_t vl);
vuint64m4_t __riscv_vwaddu_vv_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                       vuint32m2_t vs2, vuint32m2_t vs1,
                                       size_t vl);
vuint64m4_t __riscv_vwaddu_vx_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                       vuint32m2_t vs2, uint32_t rs1,
                                       size_t vl);
vuint64m4_t __riscv_vwaddu_wv_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs2, vuint32m2_t vs1,
                                       size_t vl);
vuint64m4_t __riscv_vwaddu_wx_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs2, uint32_t rs1,
                                       size_t vl);
vuint64m8_t __riscv_vwaddu_vv_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                       vuint32m4_t vs2, vuint32m4_t vs1,
                                       size_t vl);
vuint64m8_t __riscv_vwaddu_vx_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                       vuint32m4_t vs2, uint32_t rs1,
                                       size_t vl);
vuint64m8_t __riscv_vwaddu_wv_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs2, vuint32m4_t vs1,
                                       size_t vl);
vuint64m8_t __riscv_vwaddu_wx_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs2, uint32_t rs1,
                                       size_t vl);
vuint16mf4_t __riscv_vwsubu_vv_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                         vuint8mf8_t vs2, vuint8mf8_t vs1,
                                         size_t vl);
vuint16mf4_t __riscv_vwsubu_vx_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                         vuint8mf8_t vs2, uint8_t rs1,
                                         size_t vl);
vuint16mf4_t __riscv_vwsubu_wv_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs2, vuint8mf8_t vs1,
                                         size_t vl);
vuint16mf4_t __riscv_vwsubu_wx_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs2, uint8_t rs1,
                                         size_t vl);
vuint16mf2_t __riscv_vwsubu_vv_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                         vuint8mf4_t vs2, vuint8mf4_t vs1,
                                         size_t vl);
vuint16mf2_t __riscv_vwsubu_vx_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                         vuint8mf4_t vs2, uint8_t rs1,
                                         size_t vl);
vuint16mf2_t __riscv_vwsubu_wv_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs2, vuint8mf4_t vs1,
                                         size_t vl);
vuint16mf2_t __riscv_vwsubu_wx_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs2, uint8_t rs1,
                                         size_t vl);
vuint16m1_t __riscv_vwsubu_vv_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                       vuint8mf2_t vs2, vuint8mf2_t vs1,
                                       size_t vl);
vuint16m1_t __riscv_vwsubu_vx_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                       vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint16m1_t __riscv_vwsubu_wv_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs2, vuint8mf2_t vs1,
                                       size_t vl);
vuint16m1_t __riscv_vwsubu_wx_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs2, uint8_t rs1, size_t vl);
vuint16m2_t __riscv_vwsubu_vv_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                       vuint8m1_t vs2, vuint8m1_t vs1,
                                       size_t vl);
vuint16m2_t __riscv_vwsubu_vx_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                       vuint8m1_t vs2, uint8_t rs1, size_t vl);
vuint16m2_t __riscv_vwsubu_wv_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs2, vuint8m1_t vs1,
                                       size_t vl);
vuint16m2_t __riscv_vwsubu_wx_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs2, uint8_t rs1, size_t vl);
vuint16m4_t __riscv_vwsubu_vv_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                       vuint8m2_t vs2, vuint8m2_t vs1,
                                       size_t vl);
vuint16m4_t __riscv_vwsubu_vx_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                       vuint8m2_t vs2, uint8_t rs1, size_t vl);
vuint16m4_t __riscv_vwsubu_wv_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs2, vuint8m2_t vs1,
                                       size_t vl);
vuint16m4_t __riscv_vwsubu_wx_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs2, uint8_t rs1, size_t vl);
vuint16m8_t __riscv_vwsubu_vv_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                       vuint8m4_t vs2, vuint8m4_t vs1,
                                       size_t vl);
vuint16m8_t __riscv_vwsubu_vx_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                       vuint8m4_t vs2, uint8_t rs1, size_t vl);
vuint16m8_t __riscv_vwsubu_wv_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs2, vuint8m4_t vs1,
                                       size_t vl);
vuint16m8_t __riscv_vwsubu_wx_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs2, uint8_t rs1, size_t vl);
vuint32mf2_t __riscv_vwsubu_vv_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                         vuint16mf4_t vs2, vuint16mf4_t vs1,
                                         size_t vl);
vuint32mf2_t __riscv_vwsubu_vx_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                         vuint16mf4_t vs2, uint16_t rs1,
                                         size_t vl);
vuint32mf2_t __riscv_vwsubu_wv_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs2, vuint16mf4_t vs1,
                                         size_t vl);
vuint32mf2_t __riscv_vwsubu_wx_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs2, uint16_t rs1,
                                         size_t vl);
vuint32m1_t __riscv_vwsubu_vv_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                       vuint16mf2_t vs2, vuint16mf2_t vs1,
                                       size_t vl);
vuint32m1_t __riscv_vwsubu_vx_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                       vuint16mf2_t vs2, uint16_t rs1,
                                       size_t vl);
vuint32m1_t __riscv_vwsubu_wv_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs2, vuint16mf2_t vs1,
                                       size_t vl);
vuint32m1_t __riscv_vwsubu_wx_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs2, uint16_t rs1,
                                       size_t vl);
vuint32m2_t __riscv_vwsubu_vv_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                       vuint16m1_t vs2, vuint16m1_t vs1,
                                       size_t vl);
vuint32m2_t __riscv_vwsubu_vx_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                       vuint16m1_t vs2, uint16_t rs1,
                                       size_t vl);
vuint32m2_t __riscv_vwsubu_wv_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs2, vuint16m1_t vs1,
                                       size_t vl);
vuint32m2_t __riscv_vwsubu_wx_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs2, uint16_t rs1,
                                       size_t vl);
vuint32m4_t __riscv_vwsubu_vv_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                       vuint16m2_t vs2, vuint16m2_t vs1,
                                       size_t vl);
vuint32m4_t __riscv_vwsubu_vx_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                       vuint16m2_t vs2, uint16_t rs1,
                                       size_t vl);
vuint32m4_t __riscv_vwsubu_wv_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs2, vuint16m2_t vs1,
                                       size_t vl);
vuint32m4_t __riscv_vwsubu_wx_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs2, uint16_t rs1,
                                       size_t vl);
vuint32m8_t __riscv_vwsubu_vv_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                       vuint16m4_t vs2, vuint16m4_t vs1,
                                       size_t vl);
vuint32m8_t __riscv_vwsubu_vx_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                       vuint16m4_t vs2, uint16_t rs1,
                                       size_t vl);
vuint32m8_t __riscv_vwsubu_wv_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs2, vuint16m4_t vs1,
                                       size_t vl);
vuint32m8_t __riscv_vwsubu_wx_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs2, uint16_t rs1,
                                       size_t vl);
vuint64m1_t __riscv_vwsubu_vv_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                       vuint32mf2_t vs2, vuint32mf2_t vs1,
                                       size_t vl);
vuint64m1_t __riscv_vwsubu_vx_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                       vuint32mf2_t vs2, uint32_t rs1,
                                       size_t vl);
vuint64m1_t __riscv_vwsubu_wv_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs2, vuint32mf2_t vs1,
                                       size_t vl);
vuint64m1_t __riscv_vwsubu_wx_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs2, uint32_t rs1,
                                       size_t vl);
vuint64m2_t __riscv_vwsubu_vv_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                       vuint32m1_t vs2, vuint32m1_t vs1,
                                       size_t vl);
vuint64m2_t __riscv_vwsubu_vx_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                       vuint32m1_t vs2, uint32_t rs1,
                                       size_t vl);
vuint64m2_t __riscv_vwsubu_wv_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs2, vuint32m1_t vs1,
                                       size_t vl);
vuint64m2_t __riscv_vwsubu_wx_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs2, uint32_t rs1,
                                       size_t vl);
vuint64m4_t __riscv_vwsubu_vv_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                       vuint32m2_t vs2, vuint32m2_t vs1,
                                       size_t vl);
vuint64m4_t __riscv_vwsubu_vx_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                       vuint32m2_t vs2, uint32_t rs1,
                                       size_t vl);
vuint64m4_t __riscv_vwsubu_wv_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs2, vuint32m2_t vs1,
                                       size_t vl);
vuint64m4_t __riscv_vwsubu_wx_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs2, uint32_t rs1,
                                       size_t vl);
vuint64m8_t __riscv_vwsubu_vv_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                       vuint32m4_t vs2, vuint32m4_t vs1,
                                       size_t vl);
vuint64m8_t __riscv_vwsubu_vx_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                       vuint32m4_t vs2, uint32_t rs1,
                                       size_t vl);
vuint64m8_t __riscv_vwsubu_wv_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs2, vuint32m4_t vs1,
                                       size_t vl);
vuint64m8_t __riscv_vwsubu_wx_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs2, uint32_t rs1,
                                       size_t vl);
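
As a quick illustration of the masked "_mu" widening forms above, the sketch below uses
__riscv_vwsubu_vv_u16m2_mu to subtract a background level from unsigned 8-bit samples.
Only lanes where the sample is at least the background are updated with the widened
difference; lanes with a clear mask bit keep the value already held in the accumulator
(mask-undisturbed). The helper name and the strip-mining loop are illustrative only and
are not part of the intrinsic listing.

#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

// Sketch only: acc[i] = src[i] - bg[i] (widened to u16) where src[i] >= bg[i];
// all other lanes of acc are left untouched by the _mu (mask-undisturbed) policy.
static void sub_background_masked(const uint8_t *src, const uint8_t *bg,
                                  uint16_t *acc, size_t n) {
  for (size_t i = 0; i < n;) {
    size_t vl = __riscv_vsetvl_e8m1(n - i);
    vuint8m1_t v = __riscv_vle8_v_u8m1(src + i, vl);
    vuint8m1_t b = __riscv_vle8_v_u8m1(bg + i, vl);
    vuint16m2_t a = __riscv_vle16_v_u16m2(acc + i, vl);
    vbool8_t m = __riscv_vmsleu_vv_u8m1_b8(b, v, vl);  // active where bg <= src
    a = __riscv_vwsubu_vv_u16m2_mu(m, a, v, b, vl);    // widening subtract, active lanes only
    __riscv_vse16_v_u16m2(acc + i, a, vl);
    i += vl;
  }
}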

Vector Integer Widening Intrinsics

vint16mf4_t __riscv_vwcvt_x_x_v_i16mf4_tu(vint16mf4_t vd, vint8mf8_t vs2,
                                          size_t vl);
vint16mf2_t __riscv_vwcvt_x_x_v_i16mf2_tu(vint16mf2_t vd, vint8mf4_t vs2,
                                          size_t vl);
vint16m1_t __riscv_vwcvt_x_x_v_i16m1_tu(vint16m1_t vd, vint8mf2_t vs2,
                                        size_t vl);
vint16m2_t __riscv_vwcvt_x_x_v_i16m2_tu(vint16m2_t vd, vint8m1_t vs2,
                                        size_t vl);
vint16m4_t __riscv_vwcvt_x_x_v_i16m4_tu(vint16m4_t vd, vint8m2_t vs2,
                                        size_t vl);
vint16m8_t __riscv_vwcvt_x_x_v_i16m8_tu(vint16m8_t vd, vint8m4_t vs2,
                                        size_t vl);
vuint16mf4_t __riscv_vwcvtu_x_x_v_u16mf4_tu(vuint16mf4_t vd, vuint8mf8_t vs2,
                                            size_t vl);
vuint16mf2_t __riscv_vwcvtu_x_x_v_u16mf2_tu(vuint16mf2_t vd, vuint8mf4_t vs2,
                                            size_t vl);
vuint16m1_t __riscv_vwcvtu_x_x_v_u16m1_tu(vuint16m1_t vd, vuint8mf2_t vs2,
                                          size_t vl);
vuint16m2_t __riscv_vwcvtu_x_x_v_u16m2_tu(vuint16m2_t vd, vuint8m1_t vs2,
                                          size_t vl);
vuint16m4_t __riscv_vwcvtu_x_x_v_u16m4_tu(vuint16m4_t vd, vuint8m2_t vs2,
                                          size_t vl);
vuint16m8_t __riscv_vwcvtu_x_x_v_u16m8_tu(vuint16m8_t vd, vuint8m4_t vs2,
                                          size_t vl);
vint32mf2_t __riscv_vwcvt_x_x_v_i32mf2_tu(vint32mf2_t vd, vint16mf4_t vs2,
                                          size_t vl);
vint32m1_t __riscv_vwcvt_x_x_v_i32m1_tu(vint32m1_t vd, vint16mf2_t vs2,
                                        size_t vl);
vint32m2_t __riscv_vwcvt_x_x_v_i32m2_tu(vint32m2_t vd, vint16m1_t vs2,
                                        size_t vl);
vint32m4_t __riscv_vwcvt_x_x_v_i32m4_tu(vint32m4_t vd, vint16m2_t vs2,
                                        size_t vl);
vint32m8_t __riscv_vwcvt_x_x_v_i32m8_tu(vint32m8_t vd, vint16m4_t vs2,
                                        size_t vl);
vuint32mf2_t __riscv_vwcvtu_x_x_v_u32mf2_tu(vuint32mf2_t vd, vuint16mf4_t vs2,
                                            size_t vl);
vuint32m1_t __riscv_vwcvtu_x_x_v_u32m1_tu(vuint32m1_t vd, vuint16mf2_t vs2,
                                          size_t vl);
vuint32m2_t __riscv_vwcvtu_x_x_v_u32m2_tu(vuint32m2_t vd, vuint16m1_t vs2,
                                          size_t vl);
vuint32m4_t __riscv_vwcvtu_x_x_v_u32m4_tu(vuint32m4_t vd, vuint16m2_t vs2,
                                          size_t vl);
vuint32m8_t __riscv_vwcvtu_x_x_v_u32m8_tu(vuint32m8_t vd, vuint16m4_t vs2,
                                          size_t vl);
vint64m1_t __riscv_vwcvt_x_x_v_i64m1_tu(vint64m1_t vd, vint32mf2_t vs2,
                                        size_t vl);
vint64m2_t __riscv_vwcvt_x_x_v_i64m2_tu(vint64m2_t vd, vint32m1_t vs2,
                                        size_t vl);
vint64m4_t __riscv_vwcvt_x_x_v_i64m4_tu(vint64m4_t vd, vint32m2_t vs2,
                                        size_t vl);
vint64m8_t __riscv_vwcvt_x_x_v_i64m8_tu(vint64m8_t vd, vint32m4_t vs2,
                                        size_t vl);
vuint64m1_t __riscv_vwcvtu_x_x_v_u64m1_tu(vuint64m1_t vd, vuint32mf2_t vs2,
                                          size_t vl);
vuint64m2_t __riscv_vwcvtu_x_x_v_u64m2_tu(vuint64m2_t vd, vuint32m1_t vs2,
                                          size_t vl);
vuint64m4_t __riscv_vwcvtu_x_x_v_u64m4_tu(vuint64m4_t vd, vuint32m2_t vs2,
                                          size_t vl);
vuint64m8_t __riscv_vwcvtu_x_x_v_u64m8_tu(vuint64m8_t vd, vuint32m4_t vs2,
                                          size_t vl);
// masked functions (_tum policy: tail undisturbed, masked-off elements agnostic)
vint16mf4_t __riscv_vwcvt_x_x_v_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                           vint8mf8_t vs2, size_t vl);
vint16mf2_t __riscv_vwcvt_x_x_v_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                           vint8mf4_t vs2, size_t vl);
vint16m1_t __riscv_vwcvt_x_x_v_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                         vint8mf2_t vs2, size_t vl);
vint16m2_t __riscv_vwcvt_x_x_v_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                         vint8m1_t vs2, size_t vl);
vint16m4_t __riscv_vwcvt_x_x_v_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                         vint8m2_t vs2, size_t vl);
vint16m8_t __riscv_vwcvt_x_x_v_i16m8_tum(vbool2_t vm, vint16m8_t vd,
                                         vint8m4_t vs2, size_t vl);
vuint16mf4_t __riscv_vwcvtu_x_x_v_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                             vuint8mf8_t vs2, size_t vl);
vuint16mf2_t __riscv_vwcvtu_x_x_v_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                             vuint8mf4_t vs2, size_t vl);
vuint16m1_t __riscv_vwcvtu_x_x_v_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                           vuint8mf2_t vs2, size_t vl);
vuint16m2_t __riscv_vwcvtu_x_x_v_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                           vuint8m1_t vs2, size_t vl);
vuint16m4_t __riscv_vwcvtu_x_x_v_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                           vuint8m2_t vs2, size_t vl);
vuint16m8_t __riscv_vwcvtu_x_x_v_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                           vuint8m4_t vs2, size_t vl);
vint32mf2_t __riscv_vwcvt_x_x_v_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                           vint16mf4_t vs2, size_t vl);
vint32m1_t __riscv_vwcvt_x_x_v_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                         vint16mf2_t vs2, size_t vl);
vint32m2_t __riscv_vwcvt_x_x_v_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                         vint16m1_t vs2, size_t vl);
vint32m4_t __riscv_vwcvt_x_x_v_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                         vint16m2_t vs2, size_t vl);
vint32m8_t __riscv_vwcvt_x_x_v_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                         vint16m4_t vs2, size_t vl);
vuint32mf2_t __riscv_vwcvtu_x_x_v_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                             vuint16mf4_t vs2, size_t vl);
vuint32m1_t __riscv_vwcvtu_x_x_v_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                           vuint16mf2_t vs2, size_t vl);
vuint32m2_t __riscv_vwcvtu_x_x_v_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                           vuint16m1_t vs2, size_t vl);
vuint32m4_t __riscv_vwcvtu_x_x_v_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                           vuint16m2_t vs2, size_t vl);
vuint32m8_t __riscv_vwcvtu_x_x_v_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                           vuint16m4_t vs2, size_t vl);
vint64m1_t __riscv_vwcvt_x_x_v_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                         vint32mf2_t vs2, size_t vl);
vint64m2_t __riscv_vwcvt_x_x_v_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                         vint32m1_t vs2, size_t vl);
vint64m4_t __riscv_vwcvt_x_x_v_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                         vint32m2_t vs2, size_t vl);
vint64m8_t __riscv_vwcvt_x_x_v_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                         vint32m4_t vs2, size_t vl);
vuint64m1_t __riscv_vwcvtu_x_x_v_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                           vuint32mf2_t vs2, size_t vl);
vuint64m2_t __riscv_vwcvtu_x_x_v_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                           vuint32m1_t vs2, size_t vl);
vuint64m4_t __riscv_vwcvtu_x_x_v_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                           vuint32m2_t vs2, size_t vl);
vuint64m8_t __riscv_vwcvtu_x_x_v_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                           vuint32m4_t vs2, size_t vl);
// masked functions (_tumu policy: tail undisturbed, masked-off elements undisturbed)
vint16mf4_t __riscv_vwcvt_x_x_v_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                            vint8mf8_t vs2, size_t vl);
vint16mf2_t __riscv_vwcvt_x_x_v_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                            vint8mf4_t vs2, size_t vl);
vint16m1_t __riscv_vwcvt_x_x_v_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                          vint8mf2_t vs2, size_t vl);
vint16m2_t __riscv_vwcvt_x_x_v_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                          vint8m1_t vs2, size_t vl);
vint16m4_t __riscv_vwcvt_x_x_v_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                          vint8m2_t vs2, size_t vl);
vint16m8_t __riscv_vwcvt_x_x_v_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                          vint8m4_t vs2, size_t vl);
vuint16mf4_t __riscv_vwcvtu_x_x_v_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                              vuint8mf8_t vs2, size_t vl);
vuint16mf2_t __riscv_vwcvtu_x_x_v_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                              vuint8mf4_t vs2, size_t vl);
vuint16m1_t __riscv_vwcvtu_x_x_v_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                            vuint8mf2_t vs2, size_t vl);
vuint16m2_t __riscv_vwcvtu_x_x_v_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                            vuint8m1_t vs2, size_t vl);
vuint16m4_t __riscv_vwcvtu_x_x_v_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                            vuint8m2_t vs2, size_t vl);
vuint16m8_t __riscv_vwcvtu_x_x_v_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                            vuint8m4_t vs2, size_t vl);
vint32mf2_t __riscv_vwcvt_x_x_v_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                            vint16mf4_t vs2, size_t vl);
vint32m1_t __riscv_vwcvt_x_x_v_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                          vint16mf2_t vs2, size_t vl);
vint32m2_t __riscv_vwcvt_x_x_v_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                          vint16m1_t vs2, size_t vl);
vint32m4_t __riscv_vwcvt_x_x_v_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                          vint16m2_t vs2, size_t vl);
vint32m8_t __riscv_vwcvt_x_x_v_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                          vint16m4_t vs2, size_t vl);
vuint32mf2_t __riscv_vwcvtu_x_x_v_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                              vuint16mf4_t vs2, size_t vl);
vuint32m1_t __riscv_vwcvtu_x_x_v_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                            vuint16mf2_t vs2, size_t vl);
vuint32m2_t __riscv_vwcvtu_x_x_v_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                            vuint16m1_t vs2, size_t vl);
vuint32m4_t __riscv_vwcvtu_x_x_v_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                            vuint16m2_t vs2, size_t vl);
vuint32m8_t __riscv_vwcvtu_x_x_v_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                            vuint16m4_t vs2, size_t vl);
vint64m1_t __riscv_vwcvt_x_x_v_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                          vint32mf2_t vs2, size_t vl);
vint64m2_t __riscv_vwcvt_x_x_v_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                          vint32m1_t vs2, size_t vl);
vint64m4_t __riscv_vwcvt_x_x_v_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                          vint32m2_t vs2, size_t vl);
vint64m8_t __riscv_vwcvt_x_x_v_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                          vint32m4_t vs2, size_t vl);
vuint64m1_t __riscv_vwcvtu_x_x_v_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                            vuint32mf2_t vs2, size_t vl);
vuint64m2_t __riscv_vwcvtu_x_x_v_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                            vuint32m1_t vs2, size_t vl);
vuint64m4_t __riscv_vwcvtu_x_x_v_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                            vuint32m2_t vs2, size_t vl);
vuint64m8_t __riscv_vwcvtu_x_x_v_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                            vuint32m4_t vs2, size_t vl);
// masked functions (_mu policy: tail agnostic, masked-off elements undisturbed)
vint16mf4_t __riscv_vwcvt_x_x_v_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                          vint8mf8_t vs2, size_t vl);
vint16mf2_t __riscv_vwcvt_x_x_v_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                          vint8mf4_t vs2, size_t vl);
vint16m1_t __riscv_vwcvt_x_x_v_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                        vint8mf2_t vs2, size_t vl);
vint16m2_t __riscv_vwcvt_x_x_v_i16m2_mu(vbool8_t vm, vint16m2_t vd,
                                        vint8m1_t vs2, size_t vl);
vint16m4_t __riscv_vwcvt_x_x_v_i16m4_mu(vbool4_t vm, vint16m4_t vd,
                                        vint8m2_t vs2, size_t vl);
vint16m8_t __riscv_vwcvt_x_x_v_i16m8_mu(vbool2_t vm, vint16m8_t vd,
                                        vint8m4_t vs2, size_t vl);
vuint16mf4_t __riscv_vwcvtu_x_x_v_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                            vuint8mf8_t vs2, size_t vl);
vuint16mf2_t __riscv_vwcvtu_x_x_v_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                            vuint8mf4_t vs2, size_t vl);
vuint16m1_t __riscv_vwcvtu_x_x_v_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                          vuint8mf2_t vs2, size_t vl);
vuint16m2_t __riscv_vwcvtu_x_x_v_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                          vuint8m1_t vs2, size_t vl);
vuint16m4_t __riscv_vwcvtu_x_x_v_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                          vuint8m2_t vs2, size_t vl);
vuint16m8_t __riscv_vwcvtu_x_x_v_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                          vuint8m4_t vs2, size_t vl);
vint32mf2_t __riscv_vwcvt_x_x_v_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                          vint16mf4_t vs2, size_t vl);
vint32m1_t __riscv_vwcvt_x_x_v_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                        vint16mf2_t vs2, size_t vl);
vint32m2_t __riscv_vwcvt_x_x_v_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                        vint16m1_t vs2, size_t vl);
vint32m4_t __riscv_vwcvt_x_x_v_i32m4_mu(vbool8_t vm, vint32m4_t vd,
                                        vint16m2_t vs2, size_t vl);
vint32m8_t __riscv_vwcvt_x_x_v_i32m8_mu(vbool4_t vm, vint32m8_t vd,
                                        vint16m4_t vs2, size_t vl);
vuint32mf2_t __riscv_vwcvtu_x_x_v_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                            vuint16mf4_t vs2, size_t vl);
vuint32m1_t __riscv_vwcvtu_x_x_v_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                          vuint16mf2_t vs2, size_t vl);
vuint32m2_t __riscv_vwcvtu_x_x_v_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                          vuint16m1_t vs2, size_t vl);
vuint32m4_t __riscv_vwcvtu_x_x_v_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                          vuint16m2_t vs2, size_t vl);
vuint32m8_t __riscv_vwcvtu_x_x_v_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                          vuint16m4_t vs2, size_t vl);
vint64m1_t __riscv_vwcvt_x_x_v_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                        vint32mf2_t vs2, size_t vl);
vint64m2_t __riscv_vwcvt_x_x_v_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                        vint32m1_t vs2, size_t vl);
vint64m4_t __riscv_vwcvt_x_x_v_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                        vint32m2_t vs2, size_t vl);
vint64m8_t __riscv_vwcvt_x_x_v_i64m8_mu(vbool8_t vm, vint64m8_t vd,
                                        vint32m4_t vs2, size_t vl);
vuint64m1_t __riscv_vwcvtu_x_x_v_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                          vuint32mf2_t vs2, size_t vl);
vuint64m2_t __riscv_vwcvtu_x_x_v_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                          vuint32m1_t vs2, size_t vl);
vuint64m4_t __riscv_vwcvtu_x_x_v_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                          vuint32m2_t vs2, size_t vl);
vuint64m8_t __riscv_vwcvtu_x_x_v_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                          vuint32m4_t vs2, size_t vl);
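
A short sketch of the masked widening convert above (the function name, the selector
array, and the loop are illustrative, not part of the listing): __riscv_vwcvt_x_x_v_i16m2_mu
sign-extends 8-bit samples to 16 bits, updating only lanes whose selector byte is
non-zero; the remaining lanes of dst keep their previous contents under the
mask-undisturbed policy.

#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

// Sketch only: dst[i] = (int16_t)src[i] where sel[i] != 0, dst[i] unchanged otherwise.
static void widen_selected(const int8_t *src, const uint8_t *sel,
                           int16_t *dst, size_t n) {
  for (size_t i = 0; i < n;) {
    size_t vl = __riscv_vsetvl_e8m1(n - i);
    vint8m1_t v = __riscv_vle8_v_i8m1(src + i, vl);
    vuint8m1_t s = __riscv_vle8_v_u8m1(sel + i, vl);
    vint16m2_t d = __riscv_vle16_v_i16m2(dst + i, vl);
    vbool8_t m = __riscv_vmsne_vx_u8m1_b8(s, 0, vl);   // active where sel != 0
    d = __riscv_vwcvt_x_x_v_i16m2_mu(m, d, v, vl);     // sign-extend active lanes
    __riscv_vse16_v_i16m2(dst + i, d, vl);
    i += vl;
  }
}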

Vector Integer Extension Intrinsics

vint16mf4_t __riscv_vsext_vf2_i16mf4_tu(vint16mf4_t vd, vint8mf8_t vs2,
                                        size_t vl);
vint16mf2_t __riscv_vsext_vf2_i16mf2_tu(vint16mf2_t vd, vint8mf4_t vs2,
                                        size_t vl);
vint16m1_t __riscv_vsext_vf2_i16m1_tu(vint16m1_t vd, vint8mf2_t vs2, size_t vl);
vint16m2_t __riscv_vsext_vf2_i16m2_tu(vint16m2_t vd, vint8m1_t vs2, size_t vl);
vint16m4_t __riscv_vsext_vf2_i16m4_tu(vint16m4_t vd, vint8m2_t vs2, size_t vl);
vint16m8_t __riscv_vsext_vf2_i16m8_tu(vint16m8_t vd, vint8m4_t vs2, size_t vl);
vint32mf2_t __riscv_vsext_vf4_i32mf2_tu(vint32mf2_t vd, vint8mf8_t vs2,
                                        size_t vl);
vint32m1_t __riscv_vsext_vf4_i32m1_tu(vint32m1_t vd, vint8mf4_t vs2, size_t vl);
vint32m2_t __riscv_vsext_vf4_i32m2_tu(vint32m2_t vd, vint8mf2_t vs2, size_t vl);
vint32m4_t __riscv_vsext_vf4_i32m4_tu(vint32m4_t vd, vint8m1_t vs2, size_t vl);
vint32m8_t __riscv_vsext_vf4_i32m8_tu(vint32m8_t vd, vint8m2_t vs2, size_t vl);
vint64m1_t __riscv_vsext_vf8_i64m1_tu(vint64m1_t vd, vint8mf8_t vs2, size_t vl);
vint64m2_t __riscv_vsext_vf8_i64m2_tu(vint64m2_t vd, vint8mf4_t vs2, size_t vl);
vint64m4_t __riscv_vsext_vf8_i64m4_tu(vint64m4_t vd, vint8mf2_t vs2, size_t vl);
vint64m8_t __riscv_vsext_vf8_i64m8_tu(vint64m8_t vd, vint8m1_t vs2, size_t vl);
vint32mf2_t __riscv_vsext_vf2_i32mf2_tu(vint32mf2_t vd, vint16mf4_t vs2,
                                        size_t vl);
vint32m1_t __riscv_vsext_vf2_i32m1_tu(vint32m1_t vd, vint16mf2_t vs2,
                                      size_t vl);
vint32m2_t __riscv_vsext_vf2_i32m2_tu(vint32m2_t vd, vint16m1_t vs2, size_t vl);
vint32m4_t __riscv_vsext_vf2_i32m4_tu(vint32m4_t vd, vint16m2_t vs2, size_t vl);
vint32m8_t __riscv_vsext_vf2_i32m8_tu(vint32m8_t vd, vint16m4_t vs2, size_t vl);
vint64m1_t __riscv_vsext_vf4_i64m1_tu(vint64m1_t vd, vint16mf4_t vs2,
                                      size_t vl);
vint64m2_t __riscv_vsext_vf4_i64m2_tu(vint64m2_t vd, vint16mf2_t vs2,
                                      size_t vl);
vint64m4_t __riscv_vsext_vf4_i64m4_tu(vint64m4_t vd, vint16m1_t vs2, size_t vl);
vint64m8_t __riscv_vsext_vf4_i64m8_tu(vint64m8_t vd, vint16m2_t vs2, size_t vl);
vint64m1_t __riscv_vsext_vf2_i64m1_tu(vint64m1_t vd, vint32mf2_t vs2,
                                      size_t vl);
vint64m2_t __riscv_vsext_vf2_i64m2_tu(vint64m2_t vd, vint32m1_t vs2, size_t vl);
vint64m4_t __riscv_vsext_vf2_i64m4_tu(vint64m4_t vd, vint32m2_t vs2, size_t vl);
vint64m8_t __riscv_vsext_vf2_i64m8_tu(vint64m8_t vd, vint32m4_t vs2, size_t vl);
vuint16mf4_t __riscv_vzext_vf2_u16mf4_tu(vuint16mf4_t vd, vuint8mf8_t vs2,
                                         size_t vl);
vuint16mf2_t __riscv_vzext_vf2_u16mf2_tu(vuint16mf2_t vd, vuint8mf4_t vs2,
                                         size_t vl);
vuint16m1_t __riscv_vzext_vf2_u16m1_tu(vuint16m1_t vd, vuint8mf2_t vs2,
                                       size_t vl);
vuint16m2_t __riscv_vzext_vf2_u16m2_tu(vuint16m2_t vd, vuint8m1_t vs2,
                                       size_t vl);
vuint16m4_t __riscv_vzext_vf2_u16m4_tu(vuint16m4_t vd, vuint8m2_t vs2,
                                       size_t vl);
vuint16m8_t __riscv_vzext_vf2_u16m8_tu(vuint16m8_t vd, vuint8m4_t vs2,
                                       size_t vl);
vuint32mf2_t __riscv_vzext_vf4_u32mf2_tu(vuint32mf2_t vd, vuint8mf8_t vs2,
                                         size_t vl);
vuint32m1_t __riscv_vzext_vf4_u32m1_tu(vuint32m1_t vd, vuint8mf4_t vs2,
                                       size_t vl);
vuint32m2_t __riscv_vzext_vf4_u32m2_tu(vuint32m2_t vd, vuint8mf2_t vs2,
                                       size_t vl);
vuint32m4_t __riscv_vzext_vf4_u32m4_tu(vuint32m4_t vd, vuint8m1_t vs2,
                                       size_t vl);
vuint32m8_t __riscv_vzext_vf4_u32m8_tu(vuint32m8_t vd, vuint8m2_t vs2,
                                       size_t vl);
vuint64m1_t __riscv_vzext_vf8_u64m1_tu(vuint64m1_t vd, vuint8mf8_t vs2,
                                       size_t vl);
vuint64m2_t __riscv_vzext_vf8_u64m2_tu(vuint64m2_t vd, vuint8mf4_t vs2,
                                       size_t vl);
vuint64m4_t __riscv_vzext_vf8_u64m4_tu(vuint64m4_t vd, vuint8mf2_t vs2,
                                       size_t vl);
vuint64m8_t __riscv_vzext_vf8_u64m8_tu(vuint64m8_t vd, vuint8m1_t vs2,
                                       size_t vl);
vuint32mf2_t __riscv_vzext_vf2_u32mf2_tu(vuint32mf2_t vd, vuint16mf4_t vs2,
                                         size_t vl);
vuint32m1_t __riscv_vzext_vf2_u32m1_tu(vuint32m1_t vd, vuint16mf2_t vs2,
                                       size_t vl);
vuint32m2_t __riscv_vzext_vf2_u32m2_tu(vuint32m2_t vd, vuint16m1_t vs2,
                                       size_t vl);
vuint32m4_t __riscv_vzext_vf2_u32m4_tu(vuint32m4_t vd, vuint16m2_t vs2,
                                       size_t vl);
vuint32m8_t __riscv_vzext_vf2_u32m8_tu(vuint32m8_t vd, vuint16m4_t vs2,
                                       size_t vl);
vuint64m1_t __riscv_vzext_vf4_u64m1_tu(vuint64m1_t vd, vuint16mf4_t vs2,
                                       size_t vl);
vuint64m2_t __riscv_vzext_vf4_u64m2_tu(vuint64m2_t vd, vuint16mf2_t vs2,
                                       size_t vl);
vuint64m4_t __riscv_vzext_vf4_u64m4_tu(vuint64m4_t vd, vuint16m1_t vs2,
                                       size_t vl);
vuint64m8_t __riscv_vzext_vf4_u64m8_tu(vuint64m8_t vd, vuint16m2_t vs2,
                                       size_t vl);
vuint64m1_t __riscv_vzext_vf2_u64m1_tu(vuint64m1_t vd, vuint32mf2_t vs2,
                                       size_t vl);
vuint64m2_t __riscv_vzext_vf2_u64m2_tu(vuint64m2_t vd, vuint32m1_t vs2,
                                       size_t vl);
vuint64m4_t __riscv_vzext_vf2_u64m4_tu(vuint64m4_t vd, vuint32m2_t vs2,
                                       size_t vl);
vuint64m8_t __riscv_vzext_vf2_u64m8_tu(vuint64m8_t vd, vuint32m4_t vs2,
                                       size_t vl);
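
Before the masked variants below, a minimal sketch of the tail-undisturbed form (the
helper name is illustrative): __riscv_vzext_vf2_u32m2_tu widens the first vl unsigned
16-bit elements into a 32-bit register group while elements past vl keep whatever the
destination operand already held.

#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

// Sketch only: zero-extend the first vl elements of src into vd; elements of vd at
// index >= vl are preserved because of the _tu (tail-undisturbed) policy.
static vuint32m2_t zext_prefix_tu(vuint32m2_t vd, const uint16_t *src, size_t avl) {
  size_t vl = __riscv_vsetvl_e16m1(avl);
  vuint16m1_t v = __riscv_vle16_v_u16m1(src, vl);
  return __riscv_vzext_vf2_u32m2_tu(vd, v, vl);
}
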
// masked functions (_tum policy: tail undisturbed, masked-off elements agnostic)
vint16mf4_t __riscv_vsext_vf2_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                         vint8mf8_t vs2, size_t vl);
vint16mf2_t __riscv_vsext_vf2_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                         vint8mf4_t vs2, size_t vl);
vint16m1_t __riscv_vsext_vf2_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                       vint8mf2_t vs2, size_t vl);
vint16m2_t __riscv_vsext_vf2_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                       vint8m1_t vs2, size_t vl);
vint16m4_t __riscv_vsext_vf2_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                       vint8m2_t vs2, size_t vl);
vint16m8_t __riscv_vsext_vf2_i16m8_tum(vbool2_t vm, vint16m8_t vd,
                                       vint8m4_t vs2, size_t vl);
vint32mf2_t __riscv_vsext_vf4_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                         vint8mf8_t vs2, size_t vl);
vint32m1_t __riscv_vsext_vf4_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                       vint8mf4_t vs2, size_t vl);
vint32m2_t __riscv_vsext_vf4_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                       vint8mf2_t vs2, size_t vl);
vint32m4_t __riscv_vsext_vf4_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                       vint8m1_t vs2, size_t vl);
vint32m8_t __riscv_vsext_vf4_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                       vint8m2_t vs2, size_t vl);
vint64m1_t __riscv_vsext_vf8_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                       vint8mf8_t vs2, size_t vl);
vint64m2_t __riscv_vsext_vf8_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                       vint8mf4_t vs2, size_t vl);
vint64m4_t __riscv_vsext_vf8_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                       vint8mf2_t vs2, size_t vl);
vint64m8_t __riscv_vsext_vf8_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                       vint8m1_t vs2, size_t vl);
vint32mf2_t __riscv_vsext_vf2_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                         vint16mf4_t vs2, size_t vl);
vint32m1_t __riscv_vsext_vf2_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                       vint16mf2_t vs2, size_t vl);
vint32m2_t __riscv_vsext_vf2_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                       vint16m1_t vs2, size_t vl);
vint32m4_t __riscv_vsext_vf2_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                       vint16m2_t vs2, size_t vl);
vint32m8_t __riscv_vsext_vf2_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                       vint16m4_t vs2, size_t vl);
vint64m1_t __riscv_vsext_vf4_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                       vint16mf4_t vs2, size_t vl);
vint64m2_t __riscv_vsext_vf4_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                       vint16mf2_t vs2, size_t vl);
vint64m4_t __riscv_vsext_vf4_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                       vint16m1_t vs2, size_t vl);
vint64m8_t __riscv_vsext_vf4_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                       vint16m2_t vs2, size_t vl);
vint64m1_t __riscv_vsext_vf2_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                       vint32mf2_t vs2, size_t vl);
vint64m2_t __riscv_vsext_vf2_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                       vint32m1_t vs2, size_t vl);
vint64m4_t __riscv_vsext_vf2_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                       vint32m2_t vs2, size_t vl);
vint64m8_t __riscv_vsext_vf2_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                       vint32m4_t vs2, size_t vl);
vuint16mf4_t __riscv_vzext_vf2_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                          vuint8mf8_t vs2, size_t vl);
vuint16mf2_t __riscv_vzext_vf2_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                          vuint8mf4_t vs2, size_t vl);
vuint16m1_t __riscv_vzext_vf2_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                        vuint8mf2_t vs2, size_t vl);
vuint16m2_t __riscv_vzext_vf2_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                        vuint8m1_t vs2, size_t vl);
vuint16m4_t __riscv_vzext_vf2_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                        vuint8m2_t vs2, size_t vl);
vuint16m8_t __riscv_vzext_vf2_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                        vuint8m4_t vs2, size_t vl);
vuint32mf2_t __riscv_vzext_vf4_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                          vuint8mf8_t vs2, size_t vl);
vuint32m1_t __riscv_vzext_vf4_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                        vuint8mf4_t vs2, size_t vl);
vuint32m2_t __riscv_vzext_vf4_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                        vuint8mf2_t vs2, size_t vl);
vuint32m4_t __riscv_vzext_vf4_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                        vuint8m1_t vs2, size_t vl);
vuint32m8_t __riscv_vzext_vf4_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                        vuint8m2_t vs2, size_t vl);
vuint64m1_t __riscv_vzext_vf8_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                        vuint8mf8_t vs2, size_t vl);
vuint64m2_t __riscv_vzext_vf8_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                        vuint8mf4_t vs2, size_t vl);
vuint64m4_t __riscv_vzext_vf8_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                        vuint8mf2_t vs2, size_t vl);
vuint64m8_t __riscv_vzext_vf8_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                        vuint8m1_t vs2, size_t vl);
vuint32mf2_t __riscv_vzext_vf2_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                          vuint16mf4_t vs2, size_t vl);
vuint32m1_t __riscv_vzext_vf2_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                        vuint16mf2_t vs2, size_t vl);
vuint32m2_t __riscv_vzext_vf2_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                        vuint16m1_t vs2, size_t vl);
vuint32m4_t __riscv_vzext_vf2_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                        vuint16m2_t vs2, size_t vl);
vuint32m8_t __riscv_vzext_vf2_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                        vuint16m4_t vs2, size_t vl);
vuint64m1_t __riscv_vzext_vf4_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                        vuint16mf4_t vs2, size_t vl);
vuint64m2_t __riscv_vzext_vf4_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                        vuint16mf2_t vs2, size_t vl);
vuint64m4_t __riscv_vzext_vf4_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                        vuint16m1_t vs2, size_t vl);
vuint64m8_t __riscv_vzext_vf4_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                        vuint16m2_t vs2, size_t vl);
vuint64m1_t __riscv_vzext_vf2_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                        vuint32mf2_t vs2, size_t vl);
vuint64m2_t __riscv_vzext_vf2_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                        vuint32m1_t vs2, size_t vl);
vuint64m4_t __riscv_vzext_vf2_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                        vuint32m2_t vs2, size_t vl);
vuint64m8_t __riscv_vzext_vf2_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                        vuint32m4_t vs2, size_t vl);
// masked functions (_tumu policy: tail undisturbed, masked-off elements undisturbed)
vint16mf4_t __riscv_vsext_vf2_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                          vint8mf8_t vs2, size_t vl);
vint16mf2_t __riscv_vsext_vf2_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                          vint8mf4_t vs2, size_t vl);
vint16m1_t __riscv_vsext_vf2_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                        vint8mf2_t vs2, size_t vl);
vint16m2_t __riscv_vsext_vf2_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                        vint8m1_t vs2, size_t vl);
vint16m4_t __riscv_vsext_vf2_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                        vint8m2_t vs2, size_t vl);
vint16m8_t __riscv_vsext_vf2_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                        vint8m4_t vs2, size_t vl);
vint32mf2_t __riscv_vsext_vf4_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                          vint8mf8_t vs2, size_t vl);
vint32m1_t __riscv_vsext_vf4_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                        vint8mf4_t vs2, size_t vl);
vint32m2_t __riscv_vsext_vf4_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                        vint8mf2_t vs2, size_t vl);
vint32m4_t __riscv_vsext_vf4_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                        vint8m1_t vs2, size_t vl);
vint32m8_t __riscv_vsext_vf4_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                        vint8m2_t vs2, size_t vl);
vint64m1_t __riscv_vsext_vf8_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                        vint8mf8_t vs2, size_t vl);
vint64m2_t __riscv_vsext_vf8_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                        vint8mf4_t vs2, size_t vl);
vint64m4_t __riscv_vsext_vf8_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                        vint8mf2_t vs2, size_t vl);
vint64m8_t __riscv_vsext_vf8_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                        vint8m1_t vs2, size_t vl);
vint32mf2_t __riscv_vsext_vf2_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                          vint16mf4_t vs2, size_t vl);
vint32m1_t __riscv_vsext_vf2_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                        vint16mf2_t vs2, size_t vl);
vint32m2_t __riscv_vsext_vf2_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                        vint16m1_t vs2, size_t vl);
vint32m4_t __riscv_vsext_vf2_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                        vint16m2_t vs2, size_t vl);
vint32m8_t __riscv_vsext_vf2_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                        vint16m4_t vs2, size_t vl);
vint64m1_t __riscv_vsext_vf4_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                        vint16mf4_t vs2, size_t vl);
vint64m2_t __riscv_vsext_vf4_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                        vint16mf2_t vs2, size_t vl);
vint64m4_t __riscv_vsext_vf4_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                        vint16m1_t vs2, size_t vl);
vint64m8_t __riscv_vsext_vf4_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                        vint16m2_t vs2, size_t vl);
vint64m1_t __riscv_vsext_vf2_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                        vint32mf2_t vs2, size_t vl);
vint64m2_t __riscv_vsext_vf2_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                        vint32m1_t vs2, size_t vl);
vint64m4_t __riscv_vsext_vf2_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                        vint32m2_t vs2, size_t vl);
vint64m8_t __riscv_vsext_vf2_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                        vint32m4_t vs2, size_t vl);
vuint16mf4_t __riscv_vzext_vf2_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                           vuint8mf8_t vs2, size_t vl);
vuint16mf2_t __riscv_vzext_vf2_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                           vuint8mf4_t vs2, size_t vl);
vuint16m1_t __riscv_vzext_vf2_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                         vuint8mf2_t vs2, size_t vl);
vuint16m2_t __riscv_vzext_vf2_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                         vuint8m1_t vs2, size_t vl);
vuint16m4_t __riscv_vzext_vf2_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                         vuint8m2_t vs2, size_t vl);
vuint16m8_t __riscv_vzext_vf2_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                         vuint8m4_t vs2, size_t vl);
vuint32mf2_t __riscv_vzext_vf4_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                           vuint8mf8_t vs2, size_t vl);
vuint32m1_t __riscv_vzext_vf4_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                         vuint8mf4_t vs2, size_t vl);
vuint32m2_t __riscv_vzext_vf4_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                         vuint8mf2_t vs2, size_t vl);
vuint32m4_t __riscv_vzext_vf4_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                         vuint8m1_t vs2, size_t vl);
vuint32m8_t __riscv_vzext_vf4_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                         vuint8m2_t vs2, size_t vl);
vuint64m1_t __riscv_vzext_vf8_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                         vuint8mf8_t vs2, size_t vl);
vuint64m2_t __riscv_vzext_vf8_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                         vuint8mf4_t vs2, size_t vl);
vuint64m4_t __riscv_vzext_vf8_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                         vuint8mf2_t vs2, size_t vl);
vuint64m8_t __riscv_vzext_vf8_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                         vuint8m1_t vs2, size_t vl);
vuint32mf2_t __riscv_vzext_vf2_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                           vuint16mf4_t vs2, size_t vl);
vuint32m1_t __riscv_vzext_vf2_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                         vuint16mf2_t vs2, size_t vl);
vuint32m2_t __riscv_vzext_vf2_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                         vuint16m1_t vs2, size_t vl);
vuint32m4_t __riscv_vzext_vf2_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                         vuint16m2_t vs2, size_t vl);
vuint32m8_t __riscv_vzext_vf2_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                         vuint16m4_t vs2, size_t vl);
vuint64m1_t __riscv_vzext_vf4_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                         vuint16mf4_t vs2, size_t vl);
vuint64m2_t __riscv_vzext_vf4_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                         vuint16mf2_t vs2, size_t vl);
vuint64m4_t __riscv_vzext_vf4_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                         vuint16m1_t vs2, size_t vl);
vuint64m8_t __riscv_vzext_vf4_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                         vuint16m2_t vs2, size_t vl);
vuint64m1_t __riscv_vzext_vf2_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                         vuint32mf2_t vs2, size_t vl);
vuint64m2_t __riscv_vzext_vf2_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                         vuint32m1_t vs2, size_t vl);
vuint64m4_t __riscv_vzext_vf2_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                         vuint32m2_t vs2, size_t vl);
vuint64m8_t __riscv_vzext_vf2_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                         vuint32m4_t vs2, size_t vl);
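
The sketch below is a hedged illustration of the tail-undisturbed, mask-undisturbed (_tumu) extension intrinsics listed above; the function name, the choice of u32m2, and the surrounding state are hypothetical, and only intrinsics whose prototypes appear in this listing (plus the standard vsetvl/load intrinsics from the base API) are relied on.

#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

// Sketch: zero-extend up to 'count' uint8_t values into a uint32_t register.
// With the _tumu policy, lanes beyond vl (the tail) and lanes where 'sel' is
// 0 (masked-off) both keep their previous contents from 'state'.
vuint32m2_t update_state_tumu(vbool16_t sel, vuint32m2_t state,
                              const uint8_t *src, size_t count) {
  size_t vl = __riscv_vsetvl_e8mf2(count);
  vuint8mf2_t bytes = __riscv_vle8_v_u8mf2(src, vl);
  return __riscv_vzext_vf4_u32m2_tumu(sel, state, bytes, vl);
}
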
// masked functions
vint16mf4_t __riscv_vsext_vf2_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                        vint8mf8_t vs2, size_t vl);
vint16mf2_t __riscv_vsext_vf2_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                        vint8mf4_t vs2, size_t vl);
vint16m1_t __riscv_vsext_vf2_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                      vint8mf2_t vs2, size_t vl);
vint16m2_t __riscv_vsext_vf2_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint8m1_t vs2,
                                      size_t vl);
vint16m4_t __riscv_vsext_vf2_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint8m2_t vs2,
                                      size_t vl);
vint16m8_t __riscv_vsext_vf2_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint8m4_t vs2,
                                      size_t vl);
vint32mf2_t __riscv_vsext_vf4_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                        vint8mf8_t vs2, size_t vl);
vint32m1_t __riscv_vsext_vf4_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                      vint8mf4_t vs2, size_t vl);
vint32m2_t __riscv_vsext_vf4_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                      vint8mf2_t vs2, size_t vl);
vint32m4_t __riscv_vsext_vf4_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint8m1_t vs2,
                                      size_t vl);
vint32m8_t __riscv_vsext_vf4_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint8m2_t vs2,
                                      size_t vl);
vint64m1_t __riscv_vsext_vf8_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                      vint8mf8_t vs2, size_t vl);
vint64m2_t __riscv_vsext_vf8_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                      vint8mf4_t vs2, size_t vl);
vint64m4_t __riscv_vsext_vf8_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                      vint8mf2_t vs2, size_t vl);
vint64m8_t __riscv_vsext_vf8_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint8m1_t vs2,
                                      size_t vl);
vint32mf2_t __riscv_vsext_vf2_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                        vint16mf4_t vs2, size_t vl);
vint32m1_t __riscv_vsext_vf2_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                      vint16mf2_t vs2, size_t vl);
vint32m2_t __riscv_vsext_vf2_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                      vint16m1_t vs2, size_t vl);
vint32m4_t __riscv_vsext_vf2_i32m4_mu(vbool8_t vm, vint32m4_t vd,
                                      vint16m2_t vs2, size_t vl);
vint32m8_t __riscv_vsext_vf2_i32m8_mu(vbool4_t vm, vint32m8_t vd,
                                      vint16m4_t vs2, size_t vl);
vint64m1_t __riscv_vsext_vf4_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                      vint16mf4_t vs2, size_t vl);
vint64m2_t __riscv_vsext_vf4_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                      vint16mf2_t vs2, size_t vl);
vint64m4_t __riscv_vsext_vf4_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                      vint16m1_t vs2, size_t vl);
vint64m8_t __riscv_vsext_vf4_i64m8_mu(vbool8_t vm, vint64m8_t vd,
                                      vint16m2_t vs2, size_t vl);
vint64m1_t __riscv_vsext_vf2_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                      vint32mf2_t vs2, size_t vl);
vint64m2_t __riscv_vsext_vf2_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                      vint32m1_t vs2, size_t vl);
vint64m4_t __riscv_vsext_vf2_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                      vint32m2_t vs2, size_t vl);
vint64m8_t __riscv_vsext_vf2_i64m8_mu(vbool8_t vm, vint64m8_t vd,
                                      vint32m4_t vs2, size_t vl);
vuint16mf4_t __riscv_vzext_vf2_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                         vuint8mf8_t vs2, size_t vl);
vuint16mf2_t __riscv_vzext_vf2_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                         vuint8mf4_t vs2, size_t vl);
vuint16m1_t __riscv_vzext_vf2_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                       vuint8mf2_t vs2, size_t vl);
vuint16m2_t __riscv_vzext_vf2_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                       vuint8m1_t vs2, size_t vl);
vuint16m4_t __riscv_vzext_vf2_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                       vuint8m2_t vs2, size_t vl);
vuint16m8_t __riscv_vzext_vf2_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                       vuint8m4_t vs2, size_t vl);
vuint32mf2_t __riscv_vzext_vf4_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                         vuint8mf8_t vs2, size_t vl);
vuint32m1_t __riscv_vzext_vf4_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                       vuint8mf4_t vs2, size_t vl);
vuint32m2_t __riscv_vzext_vf4_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                       vuint8mf2_t vs2, size_t vl);
vuint32m4_t __riscv_vzext_vf4_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                       vuint8m1_t vs2, size_t vl);
vuint32m8_t __riscv_vzext_vf4_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                       vuint8m2_t vs2, size_t vl);
vuint64m1_t __riscv_vzext_vf8_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                       vuint8mf8_t vs2, size_t vl);
vuint64m2_t __riscv_vzext_vf8_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                       vuint8mf4_t vs2, size_t vl);
vuint64m4_t __riscv_vzext_vf8_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                       vuint8mf2_t vs2, size_t vl);
vuint64m8_t __riscv_vzext_vf8_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                       vuint8m1_t vs2, size_t vl);
vuint32mf2_t __riscv_vzext_vf2_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                         vuint16mf4_t vs2, size_t vl);
vuint32m1_t __riscv_vzext_vf2_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                       vuint16mf2_t vs2, size_t vl);
vuint32m2_t __riscv_vzext_vf2_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                       vuint16m1_t vs2, size_t vl);
vuint32m4_t __riscv_vzext_vf2_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                       vuint16m2_t vs2, size_t vl);
vuint32m8_t __riscv_vzext_vf2_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                       vuint16m4_t vs2, size_t vl);
vuint64m1_t __riscv_vzext_vf4_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                       vuint16mf4_t vs2, size_t vl);
vuint64m2_t __riscv_vzext_vf4_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                       vuint16mf2_t vs2, size_t vl);
vuint64m4_t __riscv_vzext_vf4_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                       vuint16m1_t vs2, size_t vl);
vuint64m8_t __riscv_vzext_vf4_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                       vuint16m2_t vs2, size_t vl);
vuint64m1_t __riscv_vzext_vf2_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                       vuint32mf2_t vs2, size_t vl);
vuint64m2_t __riscv_vzext_vf2_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                       vuint32m1_t vs2, size_t vl);
vuint64m4_t __riscv_vzext_vf2_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                       vuint32m2_t vs2, size_t vl);
vuint64m8_t __riscv_vzext_vf2_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                       vuint32m4_t vs2, size_t vl);
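
As a hedged usage sketch for the masked (_mu) extension intrinsics above, the loop below sign-extends selected int8_t lanes into an int16_t accumulator, leaving unselected lanes untouched. The buffer and function names are illustrative; the load/store, vsetvl and compare intrinsics come from the base (non-policy) API and are assumed here.

#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

// Sketch: widen int8_t elements to int16_t only where 'sel' is non-zero.
// The _mu (mask-undisturbed) policy leaves masked-off lanes of 'acc' intact.
void widen_selected(int16_t *acc, const int8_t *src, const uint8_t *sel,
                    size_t n) {
  for (size_t i = 0; i < n;) {
    size_t vl = __riscv_vsetvl_e8m1(n - i);

    vint8m1_t v8 = __riscv_vle8_v_i8m1(src + i, vl);
    vint16m2_t vacc = __riscv_vle16_v_i16m2(acc + i, vl);

    // Build the mask from the selection array (non-zero selects the lane).
    vuint8m1_t vsel = __riscv_vle8_v_u8m1(sel + i, vl);
    vbool8_t vm = __riscv_vmsne_vx_u8m1_b8(vsel, 0, vl);

    // Sign-extend only the selected lanes; the rest of vacc is undisturbed.
    vacc = __riscv_vsext_vf2_i16m2_mu(vm, vacc, v8, vl);

    __riscv_vse16_v_i16m2(acc + i, vacc, vl);
    i += vl;
  }
}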

Vector Integer Add-with-Carry / Subtract-with-Borrow Intrinsics

vint8mf8_t __riscv_vadc_vvm_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2,
                                     vint8mf8_t vs1, vbool64_t v0, size_t vl);
vint8mf8_t __riscv_vadc_vxm_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2, int8_t rs1,
                                     vbool64_t v0, size_t vl);
vint8mf4_t __riscv_vadc_vvm_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2,
                                     vint8mf4_t vs1, vbool32_t v0, size_t vl);
vint8mf4_t __riscv_vadc_vxm_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2, int8_t rs1,
                                     vbool32_t v0, size_t vl);
vint8mf2_t __riscv_vadc_vvm_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2,
                                     vint8mf2_t vs1, vbool16_t v0, size_t vl);
vint8mf2_t __riscv_vadc_vxm_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2, int8_t rs1,
                                     vbool16_t v0, size_t vl);
vint8m1_t __riscv_vadc_vvm_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, vint8m1_t vs1,
                                   vbool8_t v0, size_t vl);
vint8m1_t __riscv_vadc_vxm_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, int8_t rs1,
                                   vbool8_t v0, size_t vl);
vint8m2_t __riscv_vadc_vvm_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, vint8m2_t vs1,
                                   vbool4_t v0, size_t vl);
vint8m2_t __riscv_vadc_vxm_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, int8_t rs1,
                                   vbool4_t v0, size_t vl);
vint8m4_t __riscv_vadc_vvm_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, vint8m4_t vs1,
                                   vbool2_t v0, size_t vl);
vint8m4_t __riscv_vadc_vxm_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, int8_t rs1,
                                   vbool2_t v0, size_t vl);
vint8m8_t __riscv_vadc_vvm_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, vint8m8_t vs1,
                                   vbool1_t v0, size_t vl);
vint8m8_t __riscv_vadc_vxm_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, int8_t rs1,
                                   vbool1_t v0, size_t vl);
vint16mf4_t __riscv_vadc_vvm_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                       vint16mf4_t vs1, vbool64_t v0,
                                       size_t vl);
vint16mf4_t __riscv_vadc_vxm_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                       int16_t rs1, vbool64_t v0, size_t vl);
vint16mf2_t __riscv_vadc_vvm_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                       vint16mf2_t vs1, vbool32_t v0,
                                       size_t vl);
vint16mf2_t __riscv_vadc_vxm_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                       int16_t rs1, vbool32_t v0, size_t vl);
vint16m1_t __riscv_vadc_vvm_i16m1_tu(vint16m1_t vd, vint16m1_t vs2,
                                     vint16m1_t vs1, vbool16_t v0, size_t vl);
vint16m1_t __riscv_vadc_vxm_i16m1_tu(vint16m1_t vd, vint16m1_t vs2, int16_t rs1,
                                     vbool16_t v0, size_t vl);
vint16m2_t __riscv_vadc_vvm_i16m2_tu(vint16m2_t vd, vint16m2_t vs2,
                                     vint16m2_t vs1, vbool8_t v0, size_t vl);
vint16m2_t __riscv_vadc_vxm_i16m2_tu(vint16m2_t vd, vint16m2_t vs2, int16_t rs1,
                                     vbool8_t v0, size_t vl);
vint16m4_t __riscv_vadc_vvm_i16m4_tu(vint16m4_t vd, vint16m4_t vs2,
                                     vint16m4_t vs1, vbool4_t v0, size_t vl);
vint16m4_t __riscv_vadc_vxm_i16m4_tu(vint16m4_t vd, vint16m4_t vs2, int16_t rs1,
                                     vbool4_t v0, size_t vl);
vint16m8_t __riscv_vadc_vvm_i16m8_tu(vint16m8_t vd, vint16m8_t vs2,
                                     vint16m8_t vs1, vbool2_t v0, size_t vl);
vint16m8_t __riscv_vadc_vxm_i16m8_tu(vint16m8_t vd, vint16m8_t vs2, int16_t rs1,
                                     vbool2_t v0, size_t vl);
vint32mf2_t __riscv_vadc_vvm_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                       vint32mf2_t vs1, vbool64_t v0,
                                       size_t vl);
vint32mf2_t __riscv_vadc_vxm_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                       int32_t rs1, vbool64_t v0, size_t vl);
vint32m1_t __riscv_vadc_vvm_i32m1_tu(vint32m1_t vd, vint32m1_t vs2,
                                     vint32m1_t vs1, vbool32_t v0, size_t vl);
vint32m1_t __riscv_vadc_vxm_i32m1_tu(vint32m1_t vd, vint32m1_t vs2, int32_t rs1,
                                     vbool32_t v0, size_t vl);
vint32m2_t __riscv_vadc_vvm_i32m2_tu(vint32m2_t vd, vint32m2_t vs2,
                                     vint32m2_t vs1, vbool16_t v0, size_t vl);
vint32m2_t __riscv_vadc_vxm_i32m2_tu(vint32m2_t vd, vint32m2_t vs2, int32_t rs1,
                                     vbool16_t v0, size_t vl);
vint32m4_t __riscv_vadc_vvm_i32m4_tu(vint32m4_t vd, vint32m4_t vs2,
                                     vint32m4_t vs1, vbool8_t v0, size_t vl);
vint32m4_t __riscv_vadc_vxm_i32m4_tu(vint32m4_t vd, vint32m4_t vs2, int32_t rs1,
                                     vbool8_t v0, size_t vl);
vint32m8_t __riscv_vadc_vvm_i32m8_tu(vint32m8_t vd, vint32m8_t vs2,
                                     vint32m8_t vs1, vbool4_t v0, size_t vl);
vint32m8_t __riscv_vadc_vxm_i32m8_tu(vint32m8_t vd, vint32m8_t vs2, int32_t rs1,
                                     vbool4_t v0, size_t vl);
vint64m1_t __riscv_vadc_vvm_i64m1_tu(vint64m1_t vd, vint64m1_t vs2,
                                     vint64m1_t vs1, vbool64_t v0, size_t vl);
vint64m1_t __riscv_vadc_vxm_i64m1_tu(vint64m1_t vd, vint64m1_t vs2, int64_t rs1,
                                     vbool64_t v0, size_t vl);
vint64m2_t __riscv_vadc_vvm_i64m2_tu(vint64m2_t vd, vint64m2_t vs2,
                                     vint64m2_t vs1, vbool32_t v0, size_t vl);
vint64m2_t __riscv_vadc_vxm_i64m2_tu(vint64m2_t vd, vint64m2_t vs2, int64_t rs1,
                                     vbool32_t v0, size_t vl);
vint64m4_t __riscv_vadc_vvm_i64m4_tu(vint64m4_t vd, vint64m4_t vs2,
                                     vint64m4_t vs1, vbool16_t v0, size_t vl);
vint64m4_t __riscv_vadc_vxm_i64m4_tu(vint64m4_t vd, vint64m4_t vs2, int64_t rs1,
                                     vbool16_t v0, size_t vl);
vint64m8_t __riscv_vadc_vvm_i64m8_tu(vint64m8_t vd, vint64m8_t vs2,
                                     vint64m8_t vs1, vbool8_t v0, size_t vl);
vint64m8_t __riscv_vadc_vxm_i64m8_tu(vint64m8_t vd, vint64m8_t vs2, int64_t rs1,
                                     vbool8_t v0, size_t vl);
vint8mf8_t __riscv_vsbc_vvm_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2,
                                     vint8mf8_t vs1, vbool64_t v0, size_t vl);
vint8mf8_t __riscv_vsbc_vxm_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2, int8_t rs1,
                                     vbool64_t v0, size_t vl);
vint8mf4_t __riscv_vsbc_vvm_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2,
                                     vint8mf4_t vs1, vbool32_t v0, size_t vl);
vint8mf4_t __riscv_vsbc_vxm_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2, int8_t rs1,
                                     vbool32_t v0, size_t vl);
vint8mf2_t __riscv_vsbc_vvm_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2,
                                     vint8mf2_t vs1, vbool16_t v0, size_t vl);
vint8mf2_t __riscv_vsbc_vxm_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2, int8_t rs1,
                                     vbool16_t v0, size_t vl);
vint8m1_t __riscv_vsbc_vvm_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, vint8m1_t vs1,
                                   vbool8_t v0, size_t vl);
vint8m1_t __riscv_vsbc_vxm_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, int8_t rs1,
                                   vbool8_t v0, size_t vl);
vint8m2_t __riscv_vsbc_vvm_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, vint8m2_t vs1,
                                   vbool4_t v0, size_t vl);
vint8m2_t __riscv_vsbc_vxm_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, int8_t rs1,
                                   vbool4_t v0, size_t vl);
vint8m4_t __riscv_vsbc_vvm_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, vint8m4_t vs1,
                                   vbool2_t v0, size_t vl);
vint8m4_t __riscv_vsbc_vxm_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, int8_t rs1,
                                   vbool2_t v0, size_t vl);
vint8m8_t __riscv_vsbc_vvm_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, vint8m8_t vs1,
                                   vbool1_t v0, size_t vl);
vint8m8_t __riscv_vsbc_vxm_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, int8_t rs1,
                                   vbool1_t v0, size_t vl);
vint16mf4_t __riscv_vsbc_vvm_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                       vint16mf4_t vs1, vbool64_t v0,
                                       size_t vl);
vint16mf4_t __riscv_vsbc_vxm_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                       int16_t rs1, vbool64_t v0, size_t vl);
vint16mf2_t __riscv_vsbc_vvm_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                       vint16mf2_t vs1, vbool32_t v0,
                                       size_t vl);
vint16mf2_t __riscv_vsbc_vxm_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                       int16_t rs1, vbool32_t v0, size_t vl);
vint16m1_t __riscv_vsbc_vvm_i16m1_tu(vint16m1_t vd, vint16m1_t vs2,
                                     vint16m1_t vs1, vbool16_t v0, size_t vl);
vint16m1_t __riscv_vsbc_vxm_i16m1_tu(vint16m1_t vd, vint16m1_t vs2, int16_t rs1,
                                     vbool16_t v0, size_t vl);
vint16m2_t __riscv_vsbc_vvm_i16m2_tu(vint16m2_t vd, vint16m2_t vs2,
                                     vint16m2_t vs1, vbool8_t v0, size_t vl);
vint16m2_t __riscv_vsbc_vxm_i16m2_tu(vint16m2_t vd, vint16m2_t vs2, int16_t rs1,
                                     vbool8_t v0, size_t vl);
vint16m4_t __riscv_vsbc_vvm_i16m4_tu(vint16m4_t vd, vint16m4_t vs2,
                                     vint16m4_t vs1, vbool4_t v0, size_t vl);
vint16m4_t __riscv_vsbc_vxm_i16m4_tu(vint16m4_t vd, vint16m4_t vs2, int16_t rs1,
                                     vbool4_t v0, size_t vl);
vint16m8_t __riscv_vsbc_vvm_i16m8_tu(vint16m8_t vd, vint16m8_t vs2,
                                     vint16m8_t vs1, vbool2_t v0, size_t vl);
vint16m8_t __riscv_vsbc_vxm_i16m8_tu(vint16m8_t vd, vint16m8_t vs2, int16_t rs1,
                                     vbool2_t v0, size_t vl);
vint32mf2_t __riscv_vsbc_vvm_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                       vint32mf2_t vs1, vbool64_t v0,
                                       size_t vl);
vint32mf2_t __riscv_vsbc_vxm_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                       int32_t rs1, vbool64_t v0, size_t vl);
vint32m1_t __riscv_vsbc_vvm_i32m1_tu(vint32m1_t vd, vint32m1_t vs2,
                                     vint32m1_t vs1, vbool32_t v0, size_t vl);
vint32m1_t __riscv_vsbc_vxm_i32m1_tu(vint32m1_t vd, vint32m1_t vs2, int32_t rs1,
                                     vbool32_t v0, size_t vl);
vint32m2_t __riscv_vsbc_vvm_i32m2_tu(vint32m2_t vd, vint32m2_t vs2,
                                     vint32m2_t vs1, vbool16_t v0, size_t vl);
vint32m2_t __riscv_vsbc_vxm_i32m2_tu(vint32m2_t vd, vint32m2_t vs2, int32_t rs1,
                                     vbool16_t v0, size_t vl);
vint32m4_t __riscv_vsbc_vvm_i32m4_tu(vint32m4_t vd, vint32m4_t vs2,
                                     vint32m4_t vs1, vbool8_t v0, size_t vl);
vint32m4_t __riscv_vsbc_vxm_i32m4_tu(vint32m4_t vd, vint32m4_t vs2, int32_t rs1,
                                     vbool8_t v0, size_t vl);
vint32m8_t __riscv_vsbc_vvm_i32m8_tu(vint32m8_t vd, vint32m8_t vs2,
                                     vint32m8_t vs1, vbool4_t v0, size_t vl);
vint32m8_t __riscv_vsbc_vxm_i32m8_tu(vint32m8_t vd, vint32m8_t vs2, int32_t rs1,
                                     vbool4_t v0, size_t vl);
vint64m1_t __riscv_vsbc_vvm_i64m1_tu(vint64m1_t vd, vint64m1_t vs2,
                                     vint64m1_t vs1, vbool64_t v0, size_t vl);
vint64m1_t __riscv_vsbc_vxm_i64m1_tu(vint64m1_t vd, vint64m1_t vs2, int64_t rs1,
                                     vbool64_t v0, size_t vl);
vint64m2_t __riscv_vsbc_vvm_i64m2_tu(vint64m2_t vd, vint64m2_t vs2,
                                     vint64m2_t vs1, vbool32_t v0, size_t vl);
vint64m2_t __riscv_vsbc_vxm_i64m2_tu(vint64m2_t vd, vint64m2_t vs2, int64_t rs1,
                                     vbool32_t v0, size_t vl);
vint64m4_t __riscv_vsbc_vvm_i64m4_tu(vint64m4_t vd, vint64m4_t vs2,
                                     vint64m4_t vs1, vbool16_t v0, size_t vl);
vint64m4_t __riscv_vsbc_vxm_i64m4_tu(vint64m4_t vd, vint64m4_t vs2, int64_t rs1,
                                     vbool16_t v0, size_t vl);
vint64m8_t __riscv_vsbc_vvm_i64m8_tu(vint64m8_t vd, vint64m8_t vs2,
                                     vint64m8_t vs1, vbool8_t v0, size_t vl);
vint64m8_t __riscv_vsbc_vxm_i64m8_tu(vint64m8_t vd, vint64m8_t vs2, int64_t rs1,
                                     vbool8_t v0, size_t vl);
vuint8mf8_t __riscv_vadc_vvm_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                      vuint8mf8_t vs1, vbool64_t v0, size_t vl);
vuint8mf8_t __riscv_vadc_vxm_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                      uint8_t rs1, vbool64_t v0, size_t vl);
vuint8mf4_t __riscv_vadc_vvm_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                      vuint8mf4_t vs1, vbool32_t v0, size_t vl);
vuint8mf4_t __riscv_vadc_vxm_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                      uint8_t rs1, vbool32_t v0, size_t vl);
vuint8mf2_t __riscv_vadc_vvm_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                      vuint8mf2_t vs1, vbool16_t v0, size_t vl);
vuint8mf2_t __riscv_vadc_vxm_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                      uint8_t rs1, vbool16_t v0, size_t vl);
vuint8m1_t __riscv_vadc_vvm_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2,
                                    vuint8m1_t vs1, vbool8_t v0, size_t vl);
vuint8m1_t __riscv_vadc_vxm_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2, uint8_t rs1,
                                    vbool8_t v0, size_t vl);
vuint8m2_t __riscv_vadc_vvm_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2,
                                    vuint8m2_t vs1, vbool4_t v0, size_t vl);
vuint8m2_t __riscv_vadc_vxm_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2, uint8_t rs1,
                                    vbool4_t v0, size_t vl);
vuint8m4_t __riscv_vadc_vvm_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2,
                                    vuint8m4_t vs1, vbool2_t v0, size_t vl);
vuint8m4_t __riscv_vadc_vxm_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2, uint8_t rs1,
                                    vbool2_t v0, size_t vl);
vuint8m8_t __riscv_vadc_vvm_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2,
                                    vuint8m8_t vs1, vbool1_t v0, size_t vl);
vuint8m8_t __riscv_vadc_vxm_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2, uint8_t rs1,
                                    vbool1_t v0, size_t vl);
vuint16mf4_t __riscv_vadc_vvm_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                        vuint16mf4_t vs1, vbool64_t v0,
                                        size_t vl);
vuint16mf4_t __riscv_vadc_vxm_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                        uint16_t rs1, vbool64_t v0, size_t vl);
vuint16mf2_t __riscv_vadc_vvm_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                        vuint16mf2_t vs1, vbool32_t v0,
                                        size_t vl);
vuint16mf2_t __riscv_vadc_vxm_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                        uint16_t rs1, vbool32_t v0, size_t vl);
vuint16m1_t __riscv_vadc_vvm_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                      vuint16m1_t vs1, vbool16_t v0, size_t vl);
vuint16m1_t __riscv_vadc_vxm_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                      uint16_t rs1, vbool16_t v0, size_t vl);
vuint16m2_t __riscv_vadc_vvm_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                      vuint16m2_t vs1, vbool8_t v0, size_t vl);
vuint16m2_t __riscv_vadc_vxm_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                      uint16_t rs1, vbool8_t v0, size_t vl);
vuint16m4_t __riscv_vadc_vvm_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                      vuint16m4_t vs1, vbool4_t v0, size_t vl);
vuint16m4_t __riscv_vadc_vxm_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                      uint16_t rs1, vbool4_t v0, size_t vl);
vuint16m8_t __riscv_vadc_vvm_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                      vuint16m8_t vs1, vbool2_t v0, size_t vl);
vuint16m8_t __riscv_vadc_vxm_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                      uint16_t rs1, vbool2_t v0, size_t vl);
vuint32mf2_t __riscv_vadc_vvm_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                        vuint32mf2_t vs1, vbool64_t v0,
                                        size_t vl);
vuint32mf2_t __riscv_vadc_vxm_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                        uint32_t rs1, vbool64_t v0, size_t vl);
vuint32m1_t __riscv_vadc_vvm_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                      vuint32m1_t vs1, vbool32_t v0, size_t vl);
vuint32m1_t __riscv_vadc_vxm_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                      uint32_t rs1, vbool32_t v0, size_t vl);
vuint32m2_t __riscv_vadc_vvm_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                      vuint32m2_t vs1, vbool16_t v0, size_t vl);
vuint32m2_t __riscv_vadc_vxm_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                      uint32_t rs1, vbool16_t v0, size_t vl);
vuint32m4_t __riscv_vadc_vvm_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                      vuint32m4_t vs1, vbool8_t v0, size_t vl);
vuint32m4_t __riscv_vadc_vxm_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                      uint32_t rs1, vbool8_t v0, size_t vl);
vuint32m8_t __riscv_vadc_vvm_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                      vuint32m8_t vs1, vbool4_t v0, size_t vl);
vuint32m8_t __riscv_vadc_vxm_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                      uint32_t rs1, vbool4_t v0, size_t vl);
vuint64m1_t __riscv_vadc_vvm_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                      vuint64m1_t vs1, vbool64_t v0, size_t vl);
vuint64m1_t __riscv_vadc_vxm_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                      uint64_t rs1, vbool64_t v0, size_t vl);
vuint64m2_t __riscv_vadc_vvm_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                      vuint64m2_t vs1, vbool32_t v0, size_t vl);
vuint64m2_t __riscv_vadc_vxm_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                      uint64_t rs1, vbool32_t v0, size_t vl);
vuint64m4_t __riscv_vadc_vvm_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                      vuint64m4_t vs1, vbool16_t v0, size_t vl);
vuint64m4_t __riscv_vadc_vxm_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                      uint64_t rs1, vbool16_t v0, size_t vl);
vuint64m8_t __riscv_vadc_vvm_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                      vuint64m8_t vs1, vbool8_t v0, size_t vl);
vuint64m8_t __riscv_vadc_vxm_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                      uint64_t rs1, vbool8_t v0, size_t vl);
vuint8mf8_t __riscv_vsbc_vvm_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                      vuint8mf8_t vs1, vbool64_t v0, size_t vl);
vuint8mf8_t __riscv_vsbc_vxm_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                      uint8_t rs1, vbool64_t v0, size_t vl);
vuint8mf4_t __riscv_vsbc_vvm_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                      vuint8mf4_t vs1, vbool32_t v0, size_t vl);
vuint8mf4_t __riscv_vsbc_vxm_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                      uint8_t rs1, vbool32_t v0, size_t vl);
vuint8mf2_t __riscv_vsbc_vvm_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                      vuint8mf2_t vs1, vbool16_t v0, size_t vl);
vuint8mf2_t __riscv_vsbc_vxm_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                      uint8_t rs1, vbool16_t v0, size_t vl);
vuint8m1_t __riscv_vsbc_vvm_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2,
                                    vuint8m1_t vs1, vbool8_t v0, size_t vl);
vuint8m1_t __riscv_vsbc_vxm_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2, uint8_t rs1,
                                    vbool8_t v0, size_t vl);
vuint8m2_t __riscv_vsbc_vvm_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2,
                                    vuint8m2_t vs1, vbool4_t v0, size_t vl);
vuint8m2_t __riscv_vsbc_vxm_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2, uint8_t rs1,
                                    vbool4_t v0, size_t vl);
vuint8m4_t __riscv_vsbc_vvm_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2,
                                    vuint8m4_t vs1, vbool2_t v0, size_t vl);
vuint8m4_t __riscv_vsbc_vxm_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2, uint8_t rs1,
                                    vbool2_t v0, size_t vl);
vuint8m8_t __riscv_vsbc_vvm_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2,
                                    vuint8m8_t vs1, vbool1_t v0, size_t vl);
vuint8m8_t __riscv_vsbc_vxm_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2, uint8_t rs1,
                                    vbool1_t v0, size_t vl);
vuint16mf4_t __riscv_vsbc_vvm_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                        vuint16mf4_t vs1, vbool64_t v0,
                                        size_t vl);
vuint16mf4_t __riscv_vsbc_vxm_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                        uint16_t rs1, vbool64_t v0, size_t vl);
vuint16mf2_t __riscv_vsbc_vvm_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                        vuint16mf2_t vs1, vbool32_t v0,
                                        size_t vl);
vuint16mf2_t __riscv_vsbc_vxm_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                        uint16_t rs1, vbool32_t v0, size_t vl);
vuint16m1_t __riscv_vsbc_vvm_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                      vuint16m1_t vs1, vbool16_t v0, size_t vl);
vuint16m1_t __riscv_vsbc_vxm_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                      uint16_t rs1, vbool16_t v0, size_t vl);
vuint16m2_t __riscv_vsbc_vvm_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                      vuint16m2_t vs1, vbool8_t v0, size_t vl);
vuint16m2_t __riscv_vsbc_vxm_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                      uint16_t rs1, vbool8_t v0, size_t vl);
vuint16m4_t __riscv_vsbc_vvm_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                      vuint16m4_t vs1, vbool4_t v0, size_t vl);
vuint16m4_t __riscv_vsbc_vxm_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                      uint16_t rs1, vbool4_t v0, size_t vl);
vuint16m8_t __riscv_vsbc_vvm_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                      vuint16m8_t vs1, vbool2_t v0, size_t vl);
vuint16m8_t __riscv_vsbc_vxm_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                      uint16_t rs1, vbool2_t v0, size_t vl);
vuint32mf2_t __riscv_vsbc_vvm_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                        vuint32mf2_t vs1, vbool64_t v0,
                                        size_t vl);
vuint32mf2_t __riscv_vsbc_vxm_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                        uint32_t rs1, vbool64_t v0, size_t vl);
vuint32m1_t __riscv_vsbc_vvm_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                      vuint32m1_t vs1, vbool32_t v0, size_t vl);
vuint32m1_t __riscv_vsbc_vxm_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                      uint32_t rs1, vbool32_t v0, size_t vl);
vuint32m2_t __riscv_vsbc_vvm_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                      vuint32m2_t vs1, vbool16_t v0, size_t vl);
vuint32m2_t __riscv_vsbc_vxm_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                      uint32_t rs1, vbool16_t v0, size_t vl);
vuint32m4_t __riscv_vsbc_vvm_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                      vuint32m4_t vs1, vbool8_t v0, size_t vl);
vuint32m4_t __riscv_vsbc_vxm_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                      uint32_t rs1, vbool8_t v0, size_t vl);
vuint32m8_t __riscv_vsbc_vvm_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                      vuint32m8_t vs1, vbool4_t v0, size_t vl);
vuint32m8_t __riscv_vsbc_vxm_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                      uint32_t rs1, vbool4_t v0, size_t vl);
vuint64m1_t __riscv_vsbc_vvm_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                      vuint64m1_t vs1, vbool64_t v0, size_t vl);
vuint64m1_t __riscv_vsbc_vxm_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                      uint64_t rs1, vbool64_t v0, size_t vl);
vuint64m2_t __riscv_vsbc_vvm_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                      vuint64m2_t vs1, vbool32_t v0, size_t vl);
vuint64m2_t __riscv_vsbc_vxm_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                      uint64_t rs1, vbool32_t v0, size_t vl);
vuint64m4_t __riscv_vsbc_vvm_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                      vuint64m4_t vs1, vbool16_t v0, size_t vl);
vuint64m4_t __riscv_vsbc_vxm_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                      uint64_t rs1, vbool16_t v0, size_t vl);
vuint64m8_t __riscv_vsbc_vvm_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                      vuint64m8_t vs1, vbool8_t v0, size_t vl);
vuint64m8_t __riscv_vsbc_vxm_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                      uint64_t rs1, vbool8_t v0, size_t vl);
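
A minimal, hedged sketch of the tail-undisturbed add-with-carry / subtract-with-borrow forms above: the helpers fold a pre-computed per-lane carry or borrow mask into a high-limb operation while preserving the tail of the previous destination. The helper names are hypothetical, and the masks are assumed to come from the carry-out / borrow-out intrinsics in the next section.

#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

// Sketch: hi = hi_a + hi_b + carry, with tail lanes of 'hi_prev' preserved.
static inline vuint64m1_t add_high_limb(vuint64m1_t hi_prev, vuint64m1_t hi_a,
                                        vuint64m1_t hi_b, vbool64_t carry,
                                        size_t vl) {
  return __riscv_vadc_vvm_u64m1_tu(hi_prev, hi_a, hi_b, carry, vl);
}

// Sketch: hi = hi_a - hi_b - borrow, with tail lanes of 'hi_prev' preserved.
static inline vuint64m1_t sub_high_limb(vuint64m1_t hi_prev, vuint64m1_t hi_a,
                                        vuint64m1_t hi_b, vbool64_t borrow,
                                        size_t vl) {
  return __riscv_vsbc_vvm_u64m1_tu(hi_prev, hi_a, hi_b, borrow, vl);
}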

Vector Integer Carry-out / Borrow-out Intrinsics

The intrinsics in this section do not have policy variants.
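
Because the carry-out / borrow-out intrinsics exist only in the base (non-policy) form, a common pattern combines them with the policy-variant carry-in intrinsics from the previous section. The sketch below adds two arrays of 128-bit values stored as separate low/high 64-bit limbs; the function and array names are hypothetical, and __riscv_vadd_vv_u64m1, __riscv_vmadc_vv_u64m1_b64 and __riscv_vadc_vvm_u64m1 are assumed from the non-policy API rather than taken from this listing.

#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

// Sketch: per-lane 128-bit addition, each value split into low/high 64-bit
// limbs. vmadc computes the per-lane carry out of the low-limb add, and vadc
// folds that carry into the high-limb add.
void add_u128(uint64_t *lo_r, uint64_t *hi_r, const uint64_t *lo_a,
              const uint64_t *hi_a, const uint64_t *lo_b,
              const uint64_t *hi_b, size_t n) {
  for (size_t i = 0; i < n;) {
    size_t vl = __riscv_vsetvl_e64m1(n - i);

    vuint64m1_t la = __riscv_vle64_v_u64m1(lo_a + i, vl);
    vuint64m1_t lb = __riscv_vle64_v_u64m1(lo_b + i, vl);
    vuint64m1_t ha = __riscv_vle64_v_u64m1(hi_a + i, vl);
    vuint64m1_t hb = __riscv_vle64_v_u64m1(hi_b + i, vl);

    vuint64m1_t lo = __riscv_vadd_vv_u64m1(la, lb, vl);        // low limb sum
    vbool64_t carry = __riscv_vmadc_vv_u64m1_b64(la, lb, vl);  // its carry out

    vuint64m1_t hi = __riscv_vadc_vvm_u64m1(ha, hb, carry, vl);  // high limb

    __riscv_vse64_v_u64m1(lo_r + i, lo, vl);
    __riscv_vse64_v_u64m1(hi_r + i, hi, vl);
    i += vl;
  }
}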

Vector Bitwise Binary Logical Intrinsics

vint8mf8_t __riscv_vand_vv_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2,
                                    vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vand_vx_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2, int8_t rs1,
                                    size_t vl);
vint8mf4_t __riscv_vand_vv_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2,
                                    vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vand_vx_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2, int8_t rs1,
                                    size_t vl);
vint8mf2_t __riscv_vand_vv_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2,
                                    vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vand_vx_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2, int8_t rs1,
                                    size_t vl);
vint8m1_t __riscv_vand_vv_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, vint8m1_t vs1,
                                  size_t vl);
vint8m1_t __riscv_vand_vx_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, int8_t rs1,
                                  size_t vl);
vint8m2_t __riscv_vand_vv_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, vint8m2_t vs1,
                                  size_t vl);
vint8m2_t __riscv_vand_vx_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, int8_t rs1,
                                  size_t vl);
vint8m4_t __riscv_vand_vv_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, vint8m4_t vs1,
                                  size_t vl);
vint8m4_t __riscv_vand_vx_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, int8_t rs1,
                                  size_t vl);
vint8m8_t __riscv_vand_vv_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, vint8m8_t vs1,
                                  size_t vl);
vint8m8_t __riscv_vand_vx_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, int8_t rs1,
                                  size_t vl);
vint16mf4_t __riscv_vand_vv_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                      vint16mf4_t vs1, size_t vl);
vint16mf4_t __riscv_vand_vx_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                      int16_t rs1, size_t vl);
vint16mf2_t __riscv_vand_vv_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                      vint16mf2_t vs1, size_t vl);
vint16mf2_t __riscv_vand_vx_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                      int16_t rs1, size_t vl);
vint16m1_t __riscv_vand_vv_i16m1_tu(vint16m1_t vd, vint16m1_t vs2,
                                    vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vand_vx_i16m1_tu(vint16m1_t vd, vint16m1_t vs2, int16_t rs1,
                                    size_t vl);
vint16m2_t __riscv_vand_vv_i16m2_tu(vint16m2_t vd, vint16m2_t vs2,
                                    vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vand_vx_i16m2_tu(vint16m2_t vd, vint16m2_t vs2, int16_t rs1,
                                    size_t vl);
vint16m4_t __riscv_vand_vv_i16m4_tu(vint16m4_t vd, vint16m4_t vs2,
                                    vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vand_vx_i16m4_tu(vint16m4_t vd, vint16m4_t vs2, int16_t rs1,
                                    size_t vl);
vint16m8_t __riscv_vand_vv_i16m8_tu(vint16m8_t vd, vint16m8_t vs2,
                                    vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vand_vx_i16m8_tu(vint16m8_t vd, vint16m8_t vs2, int16_t rs1,
                                    size_t vl);
vint32mf2_t __riscv_vand_vv_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                      vint32mf2_t vs1, size_t vl);
vint32mf2_t __riscv_vand_vx_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                      int32_t rs1, size_t vl);
vint32m1_t __riscv_vand_vv_i32m1_tu(vint32m1_t vd, vint32m1_t vs2,
                                    vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vand_vx_i32m1_tu(vint32m1_t vd, vint32m1_t vs2, int32_t rs1,
                                    size_t vl);
vint32m2_t __riscv_vand_vv_i32m2_tu(vint32m2_t vd, vint32m2_t vs2,
                                    vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vand_vx_i32m2_tu(vint32m2_t vd, vint32m2_t vs2, int32_t rs1,
                                    size_t vl);
vint32m4_t __riscv_vand_vv_i32m4_tu(vint32m4_t vd, vint32m4_t vs2,
                                    vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vand_vx_i32m4_tu(vint32m4_t vd, vint32m4_t vs2, int32_t rs1,
                                    size_t vl);
vint32m8_t __riscv_vand_vv_i32m8_tu(vint32m8_t vd, vint32m8_t vs2,
                                    vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vand_vx_i32m8_tu(vint32m8_t vd, vint32m8_t vs2, int32_t rs1,
                                    size_t vl);
vint64m1_t __riscv_vand_vv_i64m1_tu(vint64m1_t vd, vint64m1_t vs2,
                                    vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vand_vx_i64m1_tu(vint64m1_t vd, vint64m1_t vs2, int64_t rs1,
                                    size_t vl);
vint64m2_t __riscv_vand_vv_i64m2_tu(vint64m2_t vd, vint64m2_t vs2,
                                    vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vand_vx_i64m2_tu(vint64m2_t vd, vint64m2_t vs2, int64_t rs1,
                                    size_t vl);
vint64m4_t __riscv_vand_vv_i64m4_tu(vint64m4_t vd, vint64m4_t vs2,
                                    vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vand_vx_i64m4_tu(vint64m4_t vd, vint64m4_t vs2, int64_t rs1,
                                    size_t vl);
vint64m8_t __riscv_vand_vv_i64m8_tu(vint64m8_t vd, vint64m8_t vs2,
                                    vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vand_vx_i64m8_tu(vint64m8_t vd, vint64m8_t vs2, int64_t rs1,
                                    size_t vl);
vint8mf8_t __riscv_vor_vv_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2,
                                   vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vor_vx_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2, int8_t rs1,
                                   size_t vl);
vint8mf4_t __riscv_vor_vv_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2,
                                   vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vor_vx_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2, int8_t rs1,
                                   size_t vl);
vint8mf2_t __riscv_vor_vv_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2,
                                   vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vor_vx_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2, int8_t rs1,
                                   size_t vl);
vint8m1_t __riscv_vor_vv_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, vint8m1_t vs1,
                                 size_t vl);
vint8m1_t __riscv_vor_vx_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, int8_t rs1,
                                 size_t vl);
vint8m2_t __riscv_vor_vv_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, vint8m2_t vs1,
                                 size_t vl);
vint8m2_t __riscv_vor_vx_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, int8_t rs1,
                                 size_t vl);
vint8m4_t __riscv_vor_vv_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, vint8m4_t vs1,
                                 size_t vl);
vint8m4_t __riscv_vor_vx_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, int8_t rs1,
                                 size_t vl);
vint8m8_t __riscv_vor_vv_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, vint8m8_t vs1,
                                 size_t vl);
vint8m8_t __riscv_vor_vx_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, int8_t rs1,
                                 size_t vl);
vint16mf4_t __riscv_vor_vv_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                     vint16mf4_t vs1, size_t vl);
vint16mf4_t __riscv_vor_vx_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                     int16_t rs1, size_t vl);
vint16mf2_t __riscv_vor_vv_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                     vint16mf2_t vs1, size_t vl);
vint16mf2_t __riscv_vor_vx_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                     int16_t rs1, size_t vl);
vint16m1_t __riscv_vor_vv_i16m1_tu(vint16m1_t vd, vint16m1_t vs2,
                                   vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vor_vx_i16m1_tu(vint16m1_t vd, vint16m1_t vs2, int16_t rs1,
                                   size_t vl);
vint16m2_t __riscv_vor_vv_i16m2_tu(vint16m2_t vd, vint16m2_t vs2,
                                   vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vor_vx_i16m2_tu(vint16m2_t vd, vint16m2_t vs2, int16_t rs1,
                                   size_t vl);
vint16m4_t __riscv_vor_vv_i16m4_tu(vint16m4_t vd, vint16m4_t vs2,
                                   vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vor_vx_i16m4_tu(vint16m4_t vd, vint16m4_t vs2, int16_t rs1,
                                   size_t vl);
vint16m8_t __riscv_vor_vv_i16m8_tu(vint16m8_t vd, vint16m8_t vs2,
                                   vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vor_vx_i16m8_tu(vint16m8_t vd, vint16m8_t vs2, int16_t rs1,
                                   size_t vl);
vint32mf2_t __riscv_vor_vv_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                     vint32mf2_t vs1, size_t vl);
vint32mf2_t __riscv_vor_vx_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                     int32_t rs1, size_t vl);
vint32m1_t __riscv_vor_vv_i32m1_tu(vint32m1_t vd, vint32m1_t vs2,
                                   vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vor_vx_i32m1_tu(vint32m1_t vd, vint32m1_t vs2, int32_t rs1,
                                   size_t vl);
vint32m2_t __riscv_vor_vv_i32m2_tu(vint32m2_t vd, vint32m2_t vs2,
                                   vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vor_vx_i32m2_tu(vint32m2_t vd, vint32m2_t vs2, int32_t rs1,
                                   size_t vl);
vint32m4_t __riscv_vor_vv_i32m4_tu(vint32m4_t vd, vint32m4_t vs2,
                                   vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vor_vx_i32m4_tu(vint32m4_t vd, vint32m4_t vs2, int32_t rs1,
                                   size_t vl);
vint32m8_t __riscv_vor_vv_i32m8_tu(vint32m8_t vd, vint32m8_t vs2,
                                   vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vor_vx_i32m8_tu(vint32m8_t vd, vint32m8_t vs2, int32_t rs1,
                                   size_t vl);
vint64m1_t __riscv_vor_vv_i64m1_tu(vint64m1_t vd, vint64m1_t vs2,
                                   vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vor_vx_i64m1_tu(vint64m1_t vd, vint64m1_t vs2, int64_t rs1,
                                   size_t vl);
vint64m2_t __riscv_vor_vv_i64m2_tu(vint64m2_t vd, vint64m2_t vs2,
                                   vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vor_vx_i64m2_tu(vint64m2_t vd, vint64m2_t vs2, int64_t rs1,
                                   size_t vl);
vint64m4_t __riscv_vor_vv_i64m4_tu(vint64m4_t vd, vint64m4_t vs2,
                                   vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vor_vx_i64m4_tu(vint64m4_t vd, vint64m4_t vs2, int64_t rs1,
                                   size_t vl);
vint64m8_t __riscv_vor_vv_i64m8_tu(vint64m8_t vd, vint64m8_t vs2,
                                   vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vor_vx_i64m8_tu(vint64m8_t vd, vint64m8_t vs2, int64_t rs1,
                                   size_t vl);
vint8mf8_t __riscv_vxor_vv_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2,
                                    vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vxor_vx_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2, int8_t rs1,
                                    size_t vl);
vint8mf4_t __riscv_vxor_vv_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2,
                                    vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vxor_vx_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2, int8_t rs1,
                                    size_t vl);
vint8mf2_t __riscv_vxor_vv_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2,
                                    vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vxor_vx_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2, int8_t rs1,
                                    size_t vl);
vint8m1_t __riscv_vxor_vv_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, vint8m1_t vs1,
                                  size_t vl);
vint8m1_t __riscv_vxor_vx_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, int8_t rs1,
                                  size_t vl);
vint8m2_t __riscv_vxor_vv_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, vint8m2_t vs1,
                                  size_t vl);
vint8m2_t __riscv_vxor_vx_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, int8_t rs1,
                                  size_t vl);
vint8m4_t __riscv_vxor_vv_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, vint8m4_t vs1,
                                  size_t vl);
vint8m4_t __riscv_vxor_vx_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, int8_t rs1,
                                  size_t vl);
vint8m8_t __riscv_vxor_vv_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, vint8m8_t vs1,
                                  size_t vl);
vint8m8_t __riscv_vxor_vx_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, int8_t rs1,
                                  size_t vl);
vint16mf4_t __riscv_vxor_vv_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                      vint16mf4_t vs1, size_t vl);
vint16mf4_t __riscv_vxor_vx_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                      int16_t rs1, size_t vl);
vint16mf2_t __riscv_vxor_vv_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                      vint16mf2_t vs1, size_t vl);
vint16mf2_t __riscv_vxor_vx_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                      int16_t rs1, size_t vl);
vint16m1_t __riscv_vxor_vv_i16m1_tu(vint16m1_t vd, vint16m1_t vs2,
                                    vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vxor_vx_i16m1_tu(vint16m1_t vd, vint16m1_t vs2, int16_t rs1,
                                    size_t vl);
vint16m2_t __riscv_vxor_vv_i16m2_tu(vint16m2_t vd, vint16m2_t vs2,
                                    vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vxor_vx_i16m2_tu(vint16m2_t vd, vint16m2_t vs2, int16_t rs1,
                                    size_t vl);
vint16m4_t __riscv_vxor_vv_i16m4_tu(vint16m4_t vd, vint16m4_t vs2,
                                    vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vxor_vx_i16m4_tu(vint16m4_t vd, vint16m4_t vs2, int16_t rs1,
                                    size_t vl);
vint16m8_t __riscv_vxor_vv_i16m8_tu(vint16m8_t vd, vint16m8_t vs2,
                                    vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vxor_vx_i16m8_tu(vint16m8_t vd, vint16m8_t vs2, int16_t rs1,
                                    size_t vl);
vint32mf2_t __riscv_vxor_vv_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                      vint32mf2_t vs1, size_t vl);
vint32mf2_t __riscv_vxor_vx_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                      int32_t rs1, size_t vl);
vint32m1_t __riscv_vxor_vv_i32m1_tu(vint32m1_t vd, vint32m1_t vs2,
                                    vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vxor_vx_i32m1_tu(vint32m1_t vd, vint32m1_t vs2, int32_t rs1,
                                    size_t vl);
vint32m2_t __riscv_vxor_vv_i32m2_tu(vint32m2_t vd, vint32m2_t vs2,
                                    vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vxor_vx_i32m2_tu(vint32m2_t vd, vint32m2_t vs2, int32_t rs1,
                                    size_t vl);
vint32m4_t __riscv_vxor_vv_i32m4_tu(vint32m4_t vd, vint32m4_t vs2,
                                    vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vxor_vx_i32m4_tu(vint32m4_t vd, vint32m4_t vs2, int32_t rs1,
                                    size_t vl);
vint32m8_t __riscv_vxor_vv_i32m8_tu(vint32m8_t vd, vint32m8_t vs2,
                                    vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vxor_vx_i32m8_tu(vint32m8_t vd, vint32m8_t vs2, int32_t rs1,
                                    size_t vl);
vint64m1_t __riscv_vxor_vv_i64m1_tu(vint64m1_t vd, vint64m1_t vs2,
                                    vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vxor_vx_i64m1_tu(vint64m1_t vd, vint64m1_t vs2, int64_t rs1,
                                    size_t vl);
vint64m2_t __riscv_vxor_vv_i64m2_tu(vint64m2_t vd, vint64m2_t vs2,
                                    vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vxor_vx_i64m2_tu(vint64m2_t vd, vint64m2_t vs2, int64_t rs1,
                                    size_t vl);
vint64m4_t __riscv_vxor_vv_i64m4_tu(vint64m4_t vd, vint64m4_t vs2,
                                    vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vxor_vx_i64m4_tu(vint64m4_t vd, vint64m4_t vs2, int64_t rs1,
                                    size_t vl);
vint64m8_t __riscv_vxor_vv_i64m8_tu(vint64m8_t vd, vint64m8_t vs2,
                                    vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vxor_vx_i64m8_tu(vint64m8_t vd, vint64m8_t vs2, int64_t rs1,
                                    size_t vl);
vuint8mf8_t __riscv_vand_vv_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                     vuint8mf8_t vs1, size_t vl);
vuint8mf8_t __riscv_vand_vx_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vand_vv_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                     vuint8mf4_t vs1, size_t vl);
vuint8mf4_t __riscv_vand_vx_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vand_vv_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                     vuint8mf2_t vs1, size_t vl);
vuint8mf2_t __riscv_vand_vx_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vand_vv_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2,
                                   vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vand_vx_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2, uint8_t rs1,
                                   size_t vl);
vuint8m2_t __riscv_vand_vv_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2,
                                   vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vand_vx_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2, uint8_t rs1,
                                   size_t vl);
vuint8m4_t __riscv_vand_vv_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2,
                                   vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vand_vx_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2, uint8_t rs1,
                                   size_t vl);
vuint8m8_t __riscv_vand_vv_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2,
                                   vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vand_vx_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2, uint8_t rs1,
                                   size_t vl);
vuint16mf4_t __riscv_vand_vv_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                       vuint16mf4_t vs1, size_t vl);
vuint16mf4_t __riscv_vand_vx_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                       uint16_t rs1, size_t vl);
vuint16mf2_t __riscv_vand_vv_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                       vuint16mf2_t vs1, size_t vl);
vuint16mf2_t __riscv_vand_vx_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                       uint16_t rs1, size_t vl);
vuint16m1_t __riscv_vand_vv_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                     vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vand_vx_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                     uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vand_vv_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                     vuint16m2_t vs1, size_t vl);
vuint16m2_t __riscv_vand_vx_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                     uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vand_vv_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                     vuint16m4_t vs1, size_t vl);
vuint16m4_t __riscv_vand_vx_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                     uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vand_vv_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                     vuint16m8_t vs1, size_t vl);
vuint16m8_t __riscv_vand_vx_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                     uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vand_vv_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                       vuint32mf2_t vs1, size_t vl);
vuint32mf2_t __riscv_vand_vx_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                       uint32_t rs1, size_t vl);
vuint32m1_t __riscv_vand_vv_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                     vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vand_vx_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                     uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vand_vv_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                     vuint32m2_t vs1, size_t vl);
vuint32m2_t __riscv_vand_vx_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                     uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vand_vv_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                     vuint32m4_t vs1, size_t vl);
vuint32m4_t __riscv_vand_vx_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                     uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vand_vv_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                     vuint32m8_t vs1, size_t vl);
vuint32m8_t __riscv_vand_vx_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                     uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vand_vv_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                     vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vand_vx_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                     uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vand_vv_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                     vuint64m2_t vs1, size_t vl);
vuint64m2_t __riscv_vand_vx_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                     uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vand_vv_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                     vuint64m4_t vs1, size_t vl);
vuint64m4_t __riscv_vand_vx_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                     uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vand_vv_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                     vuint64m8_t vs1, size_t vl);
vuint64m8_t __riscv_vand_vx_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                     uint64_t rs1, size_t vl);
vuint8mf8_t __riscv_vor_vv_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                    vuint8mf8_t vs1, size_t vl);
vuint8mf8_t __riscv_vor_vx_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vor_vv_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                    vuint8mf4_t vs1, size_t vl);
vuint8mf4_t __riscv_vor_vx_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vor_vv_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                    vuint8mf2_t vs1, size_t vl);
vuint8mf2_t __riscv_vor_vx_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vor_vv_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2, vuint8m1_t vs1,
                                  size_t vl);
vuint8m1_t __riscv_vor_vx_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2, uint8_t rs1,
                                  size_t vl);
vuint8m2_t __riscv_vor_vv_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2, vuint8m2_t vs1,
                                  size_t vl);
vuint8m2_t __riscv_vor_vx_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2, uint8_t rs1,
                                  size_t vl);
vuint8m4_t __riscv_vor_vv_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2, vuint8m4_t vs1,
                                  size_t vl);
vuint8m4_t __riscv_vor_vx_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2, uint8_t rs1,
                                  size_t vl);
vuint8m8_t __riscv_vor_vv_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2, vuint8m8_t vs1,
                                  size_t vl);
vuint8m8_t __riscv_vor_vx_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2, uint8_t rs1,
                                  size_t vl);
vuint16mf4_t __riscv_vor_vv_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                      vuint16mf4_t vs1, size_t vl);
vuint16mf4_t __riscv_vor_vx_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                      uint16_t rs1, size_t vl);
vuint16mf2_t __riscv_vor_vv_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                      vuint16mf2_t vs1, size_t vl);
vuint16mf2_t __riscv_vor_vx_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                      uint16_t rs1, size_t vl);
vuint16m1_t __riscv_vor_vv_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                    vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vor_vx_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                    uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vor_vv_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                    vuint16m2_t vs1, size_t vl);
vuint16m2_t __riscv_vor_vx_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                    uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vor_vv_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                    vuint16m4_t vs1, size_t vl);
vuint16m4_t __riscv_vor_vx_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                    uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vor_vv_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                    vuint16m8_t vs1, size_t vl);
vuint16m8_t __riscv_vor_vx_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                    uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vor_vv_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                      vuint32mf2_t vs1, size_t vl);
vuint32mf2_t __riscv_vor_vx_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                      uint32_t rs1, size_t vl);
vuint32m1_t __riscv_vor_vv_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                    vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vor_vx_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                    uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vor_vv_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                    vuint32m2_t vs1, size_t vl);
vuint32m2_t __riscv_vor_vx_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                    uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vor_vv_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                    vuint32m4_t vs1, size_t vl);
vuint32m4_t __riscv_vor_vx_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                    uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vor_vv_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                    vuint32m8_t vs1, size_t vl);
vuint32m8_t __riscv_vor_vx_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                    uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vor_vv_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                    vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vor_vx_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                    uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vor_vv_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                    vuint64m2_t vs1, size_t vl);
vuint64m2_t __riscv_vor_vx_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                    uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vor_vv_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                    vuint64m4_t vs1, size_t vl);
vuint64m4_t __riscv_vor_vx_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                    uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vor_vv_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                    vuint64m8_t vs1, size_t vl);
vuint64m8_t __riscv_vor_vx_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                    uint64_t rs1, size_t vl);
vuint8mf8_t __riscv_vxor_vv_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                     vuint8mf8_t vs1, size_t vl);
vuint8mf8_t __riscv_vxor_vx_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vxor_vv_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                     vuint8mf4_t vs1, size_t vl);
vuint8mf4_t __riscv_vxor_vx_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vxor_vv_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                     vuint8mf2_t vs1, size_t vl);
vuint8mf2_t __riscv_vxor_vx_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vxor_vv_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2,
                                   vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vxor_vx_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2, uint8_t rs1,
                                   size_t vl);
vuint8m2_t __riscv_vxor_vv_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2,
                                   vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vxor_vx_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2, uint8_t rs1,
                                   size_t vl);
vuint8m4_t __riscv_vxor_vv_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2,
                                   vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vxor_vx_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2, uint8_t rs1,
                                   size_t vl);
vuint8m8_t __riscv_vxor_vv_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2,
                                   vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vxor_vx_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2, uint8_t rs1,
                                   size_t vl);
vuint16mf4_t __riscv_vxor_vv_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                       vuint16mf4_t vs1, size_t vl);
vuint16mf4_t __riscv_vxor_vx_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                       uint16_t rs1, size_t vl);
vuint16mf2_t __riscv_vxor_vv_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                       vuint16mf2_t vs1, size_t vl);
vuint16mf2_t __riscv_vxor_vx_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                       uint16_t rs1, size_t vl);
vuint16m1_t __riscv_vxor_vv_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                     vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vxor_vx_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                     uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vxor_vv_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                     vuint16m2_t vs1, size_t vl);
vuint16m2_t __riscv_vxor_vx_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                     uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vxor_vv_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                     vuint16m4_t vs1, size_t vl);
vuint16m4_t __riscv_vxor_vx_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                     uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vxor_vv_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                     vuint16m8_t vs1, size_t vl);
vuint16m8_t __riscv_vxor_vx_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                     uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vxor_vv_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                       vuint32mf2_t vs1, size_t vl);
vuint32mf2_t __riscv_vxor_vx_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                       uint32_t rs1, size_t vl);
vuint32m1_t __riscv_vxor_vv_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                     vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vxor_vx_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                     uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vxor_vv_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                     vuint32m2_t vs1, size_t vl);
vuint32m2_t __riscv_vxor_vx_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                     uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vxor_vv_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                     vuint32m4_t vs1, size_t vl);
vuint32m4_t __riscv_vxor_vx_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                     uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vxor_vv_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                     vuint32m8_t vs1, size_t vl);
vuint32m8_t __riscv_vxor_vx_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                     uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vxor_vv_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                     vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vxor_vx_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                     uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vxor_vv_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                     vuint64m2_t vs1, size_t vl);
vuint64m2_t __riscv_vxor_vx_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                     uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vxor_vv_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                     vuint64m4_t vs1, size_t vl);
vuint64m4_t __riscv_vxor_vx_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                     uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vxor_vv_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                     vuint64m8_t vs1, size_t vl);
vuint64m8_t __riscv_vxor_vx_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                     uint64_t rs1, size_t vl);
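The _tu (tail-undisturbed) variants above take the extra destination operand vd as the source of the tail elements (indices >= vl). As a rough illustration of how that composes with vxor, here is a minimal sketch; it is not part of the listing, the helper name is made up, and it assumes the whole array fits in a single e32/m1 strip (total <= VLMAX) with n <= total:

#include <riscv_vector.h>

// XOR src into the first n elements of dst, leaving dst[n..total-1] unchanged.
void xor_prefix_tu(uint32_t *dst, const uint32_t *src, size_t n, size_t total) {
  size_t vl = __riscv_vsetvl_e32m1(total);         // one strip: vl == total here
  vuint32m1_t vd = __riscv_vle32_v_u32m1(dst, vl); // old destination values
  vuint32m1_t vs = __riscv_vle32_v_u32m1(src, vl);
  // Operate on n elements only; with the _tu policy, elements n..vl-1 of the
  // result are taken from vd, so the stored tail equals the original dst.
  vuint32m1_t vr = __riscv_vxor_vv_u32m1_tu(vd, vd, vs, n);
  __riscv_vse32_v_u32m1(dst, vr, vl);
}
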
// masked functions (_tum: tail undisturbed, masked-off elements agnostic)
vint8mf8_t __riscv_vand_vv_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                     vint8mf8_t vs2, vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vand_vx_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                     vint8mf8_t vs2, int8_t rs1, size_t vl);
vint8mf4_t __riscv_vand_vv_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                     vint8mf4_t vs2, vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vand_vx_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                     vint8mf4_t vs2, int8_t rs1, size_t vl);
vint8mf2_t __riscv_vand_vv_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                     vint8mf2_t vs2, vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vand_vx_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                     vint8mf2_t vs2, int8_t rs1, size_t vl);
vint8m1_t __riscv_vand_vv_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                   vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vand_vx_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                   int8_t rs1, size_t vl);
vint8m2_t __riscv_vand_vv_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                   vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vand_vx_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                   int8_t rs1, size_t vl);
vint8m4_t __riscv_vand_vv_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                   vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vand_vx_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                   int8_t rs1, size_t vl);
vint8m8_t __riscv_vand_vv_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                   vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vand_vx_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                   int8_t rs1, size_t vl);
vint16mf4_t __riscv_vand_vv_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs2, vint16mf4_t vs1,
                                       size_t vl);
vint16mf4_t __riscv_vand_vx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs2, int16_t rs1, size_t vl);
vint16mf2_t __riscv_vand_vv_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs2, vint16mf2_t vs1,
                                       size_t vl);
vint16mf2_t __riscv_vand_vx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs2, int16_t rs1, size_t vl);
vint16m1_t __riscv_vand_vv_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs2, vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vand_vx_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs2, int16_t rs1, size_t vl);
vint16m2_t __riscv_vand_vv_i16m2_tum(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                     vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vand_vx_i16m2_tum(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                     int16_t rs1, size_t vl);
vint16m4_t __riscv_vand_vv_i16m4_tum(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                     vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vand_vx_i16m4_tum(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                     int16_t rs1, size_t vl);
vint16m8_t __riscv_vand_vv_i16m8_tum(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                     vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vand_vx_i16m8_tum(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                     int16_t rs1, size_t vl);
vint32mf2_t __riscv_vand_vv_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs2, vint32mf2_t vs1,
                                       size_t vl);
vint32mf2_t __riscv_vand_vx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs2, int32_t rs1, size_t vl);
vint32m1_t __riscv_vand_vv_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs2, vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vand_vx_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs2, int32_t rs1, size_t vl);
vint32m2_t __riscv_vand_vv_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs2, vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vand_vx_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs2, int32_t rs1, size_t vl);
vint32m4_t __riscv_vand_vv_i32m4_tum(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                     vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vand_vx_i32m4_tum(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                     int32_t rs1, size_t vl);
vint32m8_t __riscv_vand_vv_i32m8_tum(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                     vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vand_vx_i32m8_tum(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                     int32_t rs1, size_t vl);
vint64m1_t __riscv_vand_vv_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs2, vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vand_vx_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs2, int64_t rs1, size_t vl);
vint64m2_t __riscv_vand_vv_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs2, vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vand_vx_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs2, int64_t rs1, size_t vl);
vint64m4_t __riscv_vand_vv_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs2, vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vand_vx_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs2, int64_t rs1, size_t vl);
vint64m8_t __riscv_vand_vv_i64m8_tum(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                     vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vand_vx_i64m8_tum(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                     int64_t rs1, size_t vl);
vint8mf8_t __riscv_vor_vv_i8mf8_tum(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs2,
                                    vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vor_vx_i8mf8_tum(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs2,
                                    int8_t rs1, size_t vl);
vint8mf4_t __riscv_vor_vv_i8mf4_tum(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs2,
                                    vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vor_vx_i8mf4_tum(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs2,
                                    int8_t rs1, size_t vl);
vint8mf2_t __riscv_vor_vv_i8mf2_tum(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs2,
                                    vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vor_vx_i8mf2_tum(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs2,
                                    int8_t rs1, size_t vl);
vint8m1_t __riscv_vor_vv_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                  vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vor_vx_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                  int8_t rs1, size_t vl);
vint8m2_t __riscv_vor_vv_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                  vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vor_vx_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                  int8_t rs1, size_t vl);
vint8m4_t __riscv_vor_vv_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                  vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vor_vx_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                  int8_t rs1, size_t vl);
vint8m8_t __riscv_vor_vv_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                  vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vor_vx_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                  int8_t rs1, size_t vl);
vint16mf4_t __riscv_vor_vv_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                      vint16mf4_t vs2, vint16mf4_t vs1,
                                      size_t vl);
vint16mf4_t __riscv_vor_vx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                      vint16mf4_t vs2, int16_t rs1, size_t vl);
vint16mf2_t __riscv_vor_vv_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                      vint16mf2_t vs2, vint16mf2_t vs1,
                                      size_t vl);
vint16mf2_t __riscv_vor_vx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                      vint16mf2_t vs2, int16_t rs1, size_t vl);
vint16m1_t __riscv_vor_vv_i16m1_tum(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                                    vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vor_vx_i16m1_tum(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                                    int16_t rs1, size_t vl);
vint16m2_t __riscv_vor_vv_i16m2_tum(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                    vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vor_vx_i16m2_tum(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                    int16_t rs1, size_t vl);
vint16m4_t __riscv_vor_vv_i16m4_tum(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                    vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vor_vx_i16m4_tum(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                    int16_t rs1, size_t vl);
vint16m8_t __riscv_vor_vv_i16m8_tum(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                    vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vor_vx_i16m8_tum(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                    int16_t rs1, size_t vl);
vint32mf2_t __riscv_vor_vv_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                      vint32mf2_t vs2, vint32mf2_t vs1,
                                      size_t vl);
vint32mf2_t __riscv_vor_vx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                      vint32mf2_t vs2, int32_t rs1, size_t vl);
vint32m1_t __riscv_vor_vv_i32m1_tum(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                                    vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vor_vx_i32m1_tum(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                                    int32_t rs1, size_t vl);
vint32m2_t __riscv_vor_vv_i32m2_tum(vbool16_t vm, vint32m2_t vd, vint32m2_t vs2,
                                    vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vor_vx_i32m2_tum(vbool16_t vm, vint32m2_t vd, vint32m2_t vs2,
                                    int32_t rs1, size_t vl);
vint32m4_t __riscv_vor_vv_i32m4_tum(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                    vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vor_vx_i32m4_tum(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                    int32_t rs1, size_t vl);
vint32m8_t __riscv_vor_vv_i32m8_tum(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                    vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vor_vx_i32m8_tum(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                    int32_t rs1, size_t vl);
vint64m1_t __riscv_vor_vv_i64m1_tum(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                                    vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vor_vx_i64m1_tum(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                                    int64_t rs1, size_t vl);
vint64m2_t __riscv_vor_vv_i64m2_tum(vbool32_t vm, vint64m2_t vd, vint64m2_t vs2,
                                    vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vor_vx_i64m2_tum(vbool32_t vm, vint64m2_t vd, vint64m2_t vs2,
                                    int64_t rs1, size_t vl);
vint64m4_t __riscv_vor_vv_i64m4_tum(vbool16_t vm, vint64m4_t vd, vint64m4_t vs2,
                                    vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vor_vx_i64m4_tum(vbool16_t vm, vint64m4_t vd, vint64m4_t vs2,
                                    int64_t rs1, size_t vl);
vint64m8_t __riscv_vor_vv_i64m8_tum(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                    vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vor_vx_i64m8_tum(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                    int64_t rs1, size_t vl);
vint8mf8_t __riscv_vxor_vv_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                     vint8mf8_t vs2, vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vxor_vx_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                     vint8mf8_t vs2, int8_t rs1, size_t vl);
vint8mf4_t __riscv_vxor_vv_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                     vint8mf4_t vs2, vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vxor_vx_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                     vint8mf4_t vs2, int8_t rs1, size_t vl);
vint8mf2_t __riscv_vxor_vv_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                     vint8mf2_t vs2, vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vxor_vx_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                     vint8mf2_t vs2, int8_t rs1, size_t vl);
vint8m1_t __riscv_vxor_vv_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                   vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vxor_vx_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                   int8_t rs1, size_t vl);
vint8m2_t __riscv_vxor_vv_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                   vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vxor_vx_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                   int8_t rs1, size_t vl);
vint8m4_t __riscv_vxor_vv_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                   vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vxor_vx_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                   int8_t rs1, size_t vl);
vint8m8_t __riscv_vxor_vv_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                   vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vxor_vx_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                   int8_t rs1, size_t vl);
vint16mf4_t __riscv_vxor_vv_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs2, vint16mf4_t vs1,
                                       size_t vl);
vint16mf4_t __riscv_vxor_vx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs2, int16_t rs1, size_t vl);
vint16mf2_t __riscv_vxor_vv_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs2, vint16mf2_t vs1,
                                       size_t vl);
vint16mf2_t __riscv_vxor_vx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs2, int16_t rs1, size_t vl);
vint16m1_t __riscv_vxor_vv_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs2, vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vxor_vx_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs2, int16_t rs1, size_t vl);
vint16m2_t __riscv_vxor_vv_i16m2_tum(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                     vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vxor_vx_i16m2_tum(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                     int16_t rs1, size_t vl);
vint16m4_t __riscv_vxor_vv_i16m4_tum(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                     vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vxor_vx_i16m4_tum(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                     int16_t rs1, size_t vl);
vint16m8_t __riscv_vxor_vv_i16m8_tum(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                     vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vxor_vx_i16m8_tum(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                     int16_t rs1, size_t vl);
vint32mf2_t __riscv_vxor_vv_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs2, vint32mf2_t vs1,
                                       size_t vl);
vint32mf2_t __riscv_vxor_vx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs2, int32_t rs1, size_t vl);
vint32m1_t __riscv_vxor_vv_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs2, vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vxor_vx_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs2, int32_t rs1, size_t vl);
vint32m2_t __riscv_vxor_vv_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs2, vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vxor_vx_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs2, int32_t rs1, size_t vl);
vint32m4_t __riscv_vxor_vv_i32m4_tum(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                     vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vxor_vx_i32m4_tum(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                     int32_t rs1, size_t vl);
vint32m8_t __riscv_vxor_vv_i32m8_tum(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                     vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vxor_vx_i32m8_tum(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                     int32_t rs1, size_t vl);
vint64m1_t __riscv_vxor_vv_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs2, vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vxor_vx_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs2, int64_t rs1, size_t vl);
vint64m2_t __riscv_vxor_vv_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs2, vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vxor_vx_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs2, int64_t rs1, size_t vl);
vint64m4_t __riscv_vxor_vv_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs2, vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vxor_vx_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs2, int64_t rs1, size_t vl);
vint64m8_t __riscv_vxor_vv_i64m8_tum(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                     vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vxor_vx_i64m8_tum(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                     int64_t rs1, size_t vl);
vuint8mf8_t __riscv_vand_vv_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                      vuint8mf8_t vs2, vuint8mf8_t vs1,
                                      size_t vl);
vuint8mf8_t __riscv_vand_vx_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                      vuint8mf8_t vs2, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vand_vv_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                      vuint8mf4_t vs2, vuint8mf4_t vs1,
                                      size_t vl);
vuint8mf4_t __riscv_vand_vx_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                      vuint8mf4_t vs2, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vand_vv_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                      vuint8mf2_t vs2, vuint8mf2_t vs1,
                                      size_t vl);
vuint8mf2_t __riscv_vand_vx_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                      vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vand_vv_u8m1_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                    vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vand_vx_u8m1_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vand_vv_u8m2_tum(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                    vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vand_vx_u8m2_tum(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vand_vv_u8m4_tum(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                    vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vand_vx_u8m4_tum(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vand_vv_u8m8_tum(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                    vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vand_vx_u8m8_tum(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                    uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vand_vv_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                        vuint16mf4_t vs2, vuint16mf4_t vs1,
                                        size_t vl);
vuint16mf4_t __riscv_vand_vx_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                        vuint16mf4_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16mf2_t __riscv_vand_vv_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                        vuint16mf2_t vs2, vuint16mf2_t vs1,
                                        size_t vl);
vuint16mf2_t __riscv_vand_vx_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                        vuint16mf2_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16m1_t __riscv_vand_vv_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                      vuint16m1_t vs2, vuint16m1_t vs1,
                                      size_t vl);
vuint16m1_t __riscv_vand_vx_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                      vuint16m1_t vs2, uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vand_vv_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                      vuint16m2_t vs2, vuint16m2_t vs1,
                                      size_t vl);
vuint16m2_t __riscv_vand_vx_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                      vuint16m2_t vs2, uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vand_vv_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                      vuint16m4_t vs2, vuint16m4_t vs1,
                                      size_t vl);
vuint16m4_t __riscv_vand_vx_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                      vuint16m4_t vs2, uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vand_vv_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                      vuint16m8_t vs2, vuint16m8_t vs1,
                                      size_t vl);
vuint16m8_t __riscv_vand_vx_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                      vuint16m8_t vs2, uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vand_vv_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                        vuint32mf2_t vs2, vuint32mf2_t vs1,
                                        size_t vl);
vuint32mf2_t __riscv_vand_vx_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                        vuint32mf2_t vs2, uint32_t rs1,
                                        size_t vl);
vuint32m1_t __riscv_vand_vv_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                      vuint32m1_t vs2, vuint32m1_t vs1,
                                      size_t vl);
vuint32m1_t __riscv_vand_vx_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                      vuint32m1_t vs2, uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vand_vv_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                      vuint32m2_t vs2, vuint32m2_t vs1,
                                      size_t vl);
vuint32m2_t __riscv_vand_vx_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                      vuint32m2_t vs2, uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vand_vv_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                      vuint32m4_t vs2, vuint32m4_t vs1,
                                      size_t vl);
vuint32m4_t __riscv_vand_vx_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                      vuint32m4_t vs2, uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vand_vv_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                      vuint32m8_t vs2, vuint32m8_t vs1,
                                      size_t vl);
vuint32m8_t __riscv_vand_vx_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                      vuint32m8_t vs2, uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vand_vv_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                      vuint64m1_t vs2, vuint64m1_t vs1,
                                      size_t vl);
vuint64m1_t __riscv_vand_vx_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                      vuint64m1_t vs2, uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vand_vv_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                      vuint64m2_t vs2, vuint64m2_t vs1,
                                      size_t vl);
vuint64m2_t __riscv_vand_vx_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                      vuint64m2_t vs2, uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vand_vv_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                      vuint64m4_t vs2, vuint64m4_t vs1,
                                      size_t vl);
vuint64m4_t __riscv_vand_vx_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                      vuint64m4_t vs2, uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vand_vv_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                      vuint64m8_t vs2, vuint64m8_t vs1,
                                      size_t vl);
vuint64m8_t __riscv_vand_vx_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                      vuint64m8_t vs2, uint64_t rs1, size_t vl);
vuint8mf8_t __riscv_vor_vv_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                     vuint8mf8_t vs2, vuint8mf8_t vs1,
                                     size_t vl);
vuint8mf8_t __riscv_vor_vx_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                     vuint8mf8_t vs2, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vor_vv_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                     vuint8mf4_t vs2, vuint8mf4_t vs1,
                                     size_t vl);
vuint8mf4_t __riscv_vor_vx_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                     vuint8mf4_t vs2, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vor_vv_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                     vuint8mf2_t vs2, vuint8mf2_t vs1,
                                     size_t vl);
vuint8mf2_t __riscv_vor_vx_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                     vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vor_vv_u8m1_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                   vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vor_vx_u8m1_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                   uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vor_vv_u8m2_tum(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                   vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vor_vx_u8m2_tum(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                   uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vor_vv_u8m4_tum(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                   vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vor_vx_u8m4_tum(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                   uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vor_vv_u8m8_tum(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                   vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vor_vx_u8m8_tum(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                   uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vor_vv_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                       vuint16mf4_t vs2, vuint16mf4_t vs1,
                                       size_t vl);
vuint16mf4_t __riscv_vor_vx_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                       vuint16mf4_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16mf2_t __riscv_vor_vv_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                       vuint16mf2_t vs2, vuint16mf2_t vs1,
                                       size_t vl);
vuint16mf2_t __riscv_vor_vx_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                       vuint16mf2_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m1_t __riscv_vor_vv_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                     vuint16m1_t vs2, vuint16m1_t vs1,
                                     size_t vl);
vuint16m1_t __riscv_vor_vx_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                     vuint16m1_t vs2, uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vor_vv_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                     vuint16m2_t vs2, vuint16m2_t vs1,
                                     size_t vl);
vuint16m2_t __riscv_vor_vx_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                     vuint16m2_t vs2, uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vor_vv_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                     vuint16m4_t vs2, vuint16m4_t vs1,
                                     size_t vl);
vuint16m4_t __riscv_vor_vx_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                     vuint16m4_t vs2, uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vor_vv_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                     vuint16m8_t vs2, vuint16m8_t vs1,
                                     size_t vl);
vuint16m8_t __riscv_vor_vx_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                     vuint16m8_t vs2, uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vor_vv_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                       vuint32mf2_t vs2, vuint32mf2_t vs1,
                                       size_t vl);
vuint32mf2_t __riscv_vor_vx_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                       vuint32mf2_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m1_t __riscv_vor_vv_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                     vuint32m1_t vs2, vuint32m1_t vs1,
                                     size_t vl);
vuint32m1_t __riscv_vor_vx_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                     vuint32m1_t vs2, uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vor_vv_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                     vuint32m2_t vs2, vuint32m2_t vs1,
                                     size_t vl);
vuint32m2_t __riscv_vor_vx_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                     vuint32m2_t vs2, uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vor_vv_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                     vuint32m4_t vs2, vuint32m4_t vs1,
                                     size_t vl);
vuint32m4_t __riscv_vor_vx_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                     vuint32m4_t vs2, uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vor_vv_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                     vuint32m8_t vs2, vuint32m8_t vs1,
                                     size_t vl);
vuint32m8_t __riscv_vor_vx_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                     vuint32m8_t vs2, uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vor_vv_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                     vuint64m1_t vs2, vuint64m1_t vs1,
                                     size_t vl);
vuint64m1_t __riscv_vor_vx_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                     vuint64m1_t vs2, uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vor_vv_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                     vuint64m2_t vs2, vuint64m2_t vs1,
                                     size_t vl);
vuint64m2_t __riscv_vor_vx_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                     vuint64m2_t vs2, uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vor_vv_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                     vuint64m4_t vs2, vuint64m4_t vs1,
                                     size_t vl);
vuint64m4_t __riscv_vor_vx_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                     vuint64m4_t vs2, uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vor_vv_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                     vuint64m8_t vs2, vuint64m8_t vs1,
                                     size_t vl);
vuint64m8_t __riscv_vor_vx_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                     vuint64m8_t vs2, uint64_t rs1, size_t vl);
vuint8mf8_t __riscv_vxor_vv_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                      vuint8mf8_t vs2, vuint8mf8_t vs1,
                                      size_t vl);
vuint8mf8_t __riscv_vxor_vx_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                      vuint8mf8_t vs2, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vxor_vv_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                      vuint8mf4_t vs2, vuint8mf4_t vs1,
                                      size_t vl);
vuint8mf4_t __riscv_vxor_vx_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                      vuint8mf4_t vs2, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vxor_vv_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                      vuint8mf2_t vs2, vuint8mf2_t vs1,
                                      size_t vl);
vuint8mf2_t __riscv_vxor_vx_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                      vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vxor_vv_u8m1_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                    vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vxor_vx_u8m1_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vxor_vv_u8m2_tum(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                    vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vxor_vx_u8m2_tum(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vxor_vv_u8m4_tum(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                    vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vxor_vx_u8m4_tum(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vxor_vv_u8m8_tum(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                    vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vxor_vx_u8m8_tum(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                    uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vxor_vv_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                        vuint16mf4_t vs2, vuint16mf4_t vs1,
                                        size_t vl);
vuint16mf4_t __riscv_vxor_vx_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                        vuint16mf4_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16mf2_t __riscv_vxor_vv_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                        vuint16mf2_t vs2, vuint16mf2_t vs1,
                                        size_t vl);
vuint16mf2_t __riscv_vxor_vx_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                        vuint16mf2_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16m1_t __riscv_vxor_vv_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                      vuint16m1_t vs2, vuint16m1_t vs1,
                                      size_t vl);
vuint16m1_t __riscv_vxor_vx_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                      vuint16m1_t vs2, uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vxor_vv_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                      vuint16m2_t vs2, vuint16m2_t vs1,
                                      size_t vl);
vuint16m2_t __riscv_vxor_vx_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                      vuint16m2_t vs2, uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vxor_vv_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                      vuint16m4_t vs2, vuint16m4_t vs1,
                                      size_t vl);
vuint16m4_t __riscv_vxor_vx_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                      vuint16m4_t vs2, uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vxor_vv_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                      vuint16m8_t vs2, vuint16m8_t vs1,
                                      size_t vl);
vuint16m8_t __riscv_vxor_vx_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                      vuint16m8_t vs2, uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vxor_vv_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                        vuint32mf2_t vs2, vuint32mf2_t vs1,
                                        size_t vl);
vuint32mf2_t __riscv_vxor_vx_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                        vuint32mf2_t vs2, uint32_t rs1,
                                        size_t vl);
vuint32m1_t __riscv_vxor_vv_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                      vuint32m1_t vs2, vuint32m1_t vs1,
                                      size_t vl);
vuint32m1_t __riscv_vxor_vx_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                      vuint32m1_t vs2, uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vxor_vv_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                      vuint32m2_t vs2, vuint32m2_t vs1,
                                      size_t vl);
vuint32m2_t __riscv_vxor_vx_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                      vuint32m2_t vs2, uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vxor_vv_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                      vuint32m4_t vs2, vuint32m4_t vs1,
                                      size_t vl);
vuint32m4_t __riscv_vxor_vx_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                      vuint32m4_t vs2, uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vxor_vv_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                      vuint32m8_t vs2, vuint32m8_t vs1,
                                      size_t vl);
vuint32m8_t __riscv_vxor_vx_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                      vuint32m8_t vs2, uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vxor_vv_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                      vuint64m1_t vs2, vuint64m1_t vs1,
                                      size_t vl);
vuint64m1_t __riscv_vxor_vx_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                      vuint64m1_t vs2, uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vxor_vv_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                      vuint64m2_t vs2, vuint64m2_t vs1,
                                      size_t vl);
vuint64m2_t __riscv_vxor_vx_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                      vuint64m2_t vs2, uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vxor_vv_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                      vuint64m4_t vs2, vuint64m4_t vs1,
                                      size_t vl);
vuint64m4_t __riscv_vxor_vx_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                      vuint64m4_t vs2, uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vxor_vv_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                      vuint64m8_t vs2, vuint64m8_t vs1,
                                      size_t vl);
vuint64m8_t __riscv_vxor_vx_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                      vuint64m8_t vs2, uint64_t rs1, size_t vl);
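The masked _tum forms above combine the mask operand vm with the tail-undisturbed policy: lanes with vm set and index < vl receive the result, tail lanes keep vd, and masked-off lanes are mask-agnostic, so their contents are unspecified afterwards. A minimal, hypothetical sketch built on __riscv_vand_vx_u32m1_tum; the helper name and parameters are illustrative only:

#include <riscv_vector.h>

// Clear "bits" only in the lanes of v whose value exceeds "threshold",
// considering the first n lanes. Tail lanes (index >= n) keep v; lanes that
// fail the comparison are mask-agnostic under _tum, so do not rely on them.
// The _tumu variants in the next group also preserve those masked-off lanes.
static inline vuint32m1_t clear_bits_above(vuint32m1_t v, uint32_t threshold,
                                           uint32_t bits, size_t n) {
  vbool32_t vm = __riscv_vmsgtu_vx_u32m1_b32(v, threshold, n);
  return __riscv_vand_vx_u32m1_tum(vm, v, v, ~bits, n);
}
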
// masked functions (_tumu: tail undisturbed, masked-off elements undisturbed)
vint8mf8_t __riscv_vand_vv_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                      vint8mf8_t vs2, vint8mf8_t vs1,
                                      size_t vl);
vint8mf8_t __riscv_vand_vx_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                      vint8mf8_t vs2, int8_t rs1, size_t vl);
vint8mf4_t __riscv_vand_vv_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                      vint8mf4_t vs2, vint8mf4_t vs1,
                                      size_t vl);
vint8mf4_t __riscv_vand_vx_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                      vint8mf4_t vs2, int8_t rs1, size_t vl);
vint8mf2_t __riscv_vand_vv_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                      vint8mf2_t vs2, vint8mf2_t vs1,
                                      size_t vl);
vint8mf2_t __riscv_vand_vx_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                      vint8mf2_t vs2, int8_t rs1, size_t vl);
vint8m1_t __riscv_vand_vv_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                    vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vand_vx_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                    int8_t rs1, size_t vl);
vint8m2_t __riscv_vand_vv_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                    vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vand_vx_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                    int8_t rs1, size_t vl);
vint8m4_t __riscv_vand_vv_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                    vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vand_vx_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                    int8_t rs1, size_t vl);
vint8m8_t __riscv_vand_vv_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                    vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vand_vx_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                    int8_t rs1, size_t vl);
vint16mf4_t __riscv_vand_vv_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs2, vint16mf4_t vs1,
                                        size_t vl);
vint16mf4_t __riscv_vand_vx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs2, int16_t rs1,
                                        size_t vl);
vint16mf2_t __riscv_vand_vv_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs2, vint16mf2_t vs1,
                                        size_t vl);
vint16mf2_t __riscv_vand_vx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs2, int16_t rs1,
                                        size_t vl);
vint16m1_t __riscv_vand_vv_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs2, vint16m1_t vs1,
                                      size_t vl);
vint16m1_t __riscv_vand_vx_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs2, int16_t rs1, size_t vl);
vint16m2_t __riscv_vand_vv_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs2, vint16m2_t vs1,
                                      size_t vl);
vint16m2_t __riscv_vand_vx_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs2, int16_t rs1, size_t vl);
vint16m4_t __riscv_vand_vv_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs2, vint16m4_t vs1,
                                      size_t vl);
vint16m4_t __riscv_vand_vx_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs2, int16_t rs1, size_t vl);
vint16m8_t __riscv_vand_vv_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs2, vint16m8_t vs1,
                                      size_t vl);
vint16m8_t __riscv_vand_vx_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs2, int16_t rs1, size_t vl);
vint32mf2_t __riscv_vand_vv_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs2, vint32mf2_t vs1,
                                        size_t vl);
vint32mf2_t __riscv_vand_vx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs2, int32_t rs1,
                                        size_t vl);
vint32m1_t __riscv_vand_vv_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs2, vint32m1_t vs1,
                                      size_t vl);
vint32m1_t __riscv_vand_vx_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs2, int32_t rs1, size_t vl);
vint32m2_t __riscv_vand_vv_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs2, vint32m2_t vs1,
                                      size_t vl);
vint32m2_t __riscv_vand_vx_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs2, int32_t rs1, size_t vl);
vint32m4_t __riscv_vand_vv_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs2, vint32m4_t vs1,
                                      size_t vl);
vint32m4_t __riscv_vand_vx_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs2, int32_t rs1, size_t vl);
vint32m8_t __riscv_vand_vv_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs2, vint32m8_t vs1,
                                      size_t vl);
vint32m8_t __riscv_vand_vx_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs2, int32_t rs1, size_t vl);
vint64m1_t __riscv_vand_vv_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs2, vint64m1_t vs1,
                                      size_t vl);
vint64m1_t __riscv_vand_vx_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs2, int64_t rs1, size_t vl);
vint64m2_t __riscv_vand_vv_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs2, vint64m2_t vs1,
                                      size_t vl);
vint64m2_t __riscv_vand_vx_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs2, int64_t rs1, size_t vl);
vint64m4_t __riscv_vand_vv_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs2, vint64m4_t vs1,
                                      size_t vl);
vint64m4_t __riscv_vand_vx_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs2, int64_t rs1, size_t vl);
vint64m8_t __riscv_vand_vv_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs2, vint64m8_t vs1,
                                      size_t vl);
vint64m8_t __riscv_vand_vx_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs2, int64_t rs1, size_t vl);
vint8mf8_t __riscv_vor_vv_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                     vint8mf8_t vs2, vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vor_vx_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                     vint8mf8_t vs2, int8_t rs1, size_t vl);
vint8mf4_t __riscv_vor_vv_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                     vint8mf4_t vs2, vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vor_vx_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                     vint8mf4_t vs2, int8_t rs1, size_t vl);
vint8mf2_t __riscv_vor_vv_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                     vint8mf2_t vs2, vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vor_vx_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                     vint8mf2_t vs2, int8_t rs1, size_t vl);
vint8m1_t __riscv_vor_vv_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                   vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vor_vx_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                   int8_t rs1, size_t vl);
vint8m2_t __riscv_vor_vv_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                   vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vor_vx_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                   int8_t rs1, size_t vl);
vint8m4_t __riscv_vor_vv_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                   vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vor_vx_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                   int8_t rs1, size_t vl);
vint8m8_t __riscv_vor_vv_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                   vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vor_vx_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                   int8_t rs1, size_t vl);
vint16mf4_t __riscv_vor_vv_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs2, vint16mf4_t vs1,
                                       size_t vl);
vint16mf4_t __riscv_vor_vx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs2, int16_t rs1, size_t vl);
vint16mf2_t __riscv_vor_vv_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs2, vint16mf2_t vs1,
                                       size_t vl);
vint16mf2_t __riscv_vor_vx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs2, int16_t rs1, size_t vl);
vint16m1_t __riscv_vor_vv_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs2, vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vor_vx_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs2, int16_t rs1, size_t vl);
vint16m2_t __riscv_vor_vv_i16m2_tumu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                     vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vor_vx_i16m2_tumu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                     int16_t rs1, size_t vl);
vint16m4_t __riscv_vor_vv_i16m4_tumu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                     vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vor_vx_i16m4_tumu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                     int16_t rs1, size_t vl);
vint16m8_t __riscv_vor_vv_i16m8_tumu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                     vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vor_vx_i16m8_tumu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                     int16_t rs1, size_t vl);
vint32mf2_t __riscv_vor_vv_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs2, vint32mf2_t vs1,
                                       size_t vl);
vint32mf2_t __riscv_vor_vx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs2, int32_t rs1, size_t vl);
vint32m1_t __riscv_vor_vv_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs2, vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vor_vx_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs2, int32_t rs1, size_t vl);
vint32m2_t __riscv_vor_vv_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs2, vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vor_vx_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs2, int32_t rs1, size_t vl);
vint32m4_t __riscv_vor_vv_i32m4_tumu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                     vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vor_vx_i32m4_tumu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                     int32_t rs1, size_t vl);
vint32m8_t __riscv_vor_vv_i32m8_tumu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                     vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vor_vx_i32m8_tumu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                     int32_t rs1, size_t vl);
vint64m1_t __riscv_vor_vv_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs2, vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vor_vx_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs2, int64_t rs1, size_t vl);
vint64m2_t __riscv_vor_vv_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs2, vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vor_vx_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs2, int64_t rs1, size_t vl);
vint64m4_t __riscv_vor_vv_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs2, vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vor_vx_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs2, int64_t rs1, size_t vl);
vint64m8_t __riscv_vor_vv_i64m8_tumu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                     vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vor_vx_i64m8_tumu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                     int64_t rs1, size_t vl);
vint8mf8_t __riscv_vxor_vv_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                      vint8mf8_t vs2, vint8mf8_t vs1,
                                      size_t vl);
vint8mf8_t __riscv_vxor_vx_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                      vint8mf8_t vs2, int8_t rs1, size_t vl);
vint8mf4_t __riscv_vxor_vv_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                      vint8mf4_t vs2, vint8mf4_t vs1,
                                      size_t vl);
vint8mf4_t __riscv_vxor_vx_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                      vint8mf4_t vs2, int8_t rs1, size_t vl);
vint8mf2_t __riscv_vxor_vv_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                      vint8mf2_t vs2, vint8mf2_t vs1,
                                      size_t vl);
vint8mf2_t __riscv_vxor_vx_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                      vint8mf2_t vs2, int8_t rs1, size_t vl);
vint8m1_t __riscv_vxor_vv_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                    vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vxor_vx_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                    int8_t rs1, size_t vl);
vint8m2_t __riscv_vxor_vv_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                    vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vxor_vx_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                    int8_t rs1, size_t vl);
vint8m4_t __riscv_vxor_vv_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                    vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vxor_vx_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                    int8_t rs1, size_t vl);
vint8m8_t __riscv_vxor_vv_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                    vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vxor_vx_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                    int8_t rs1, size_t vl);
vint16mf4_t __riscv_vxor_vv_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs2, vint16mf4_t vs1,
                                        size_t vl);
vint16mf4_t __riscv_vxor_vx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs2, int16_t rs1,
                                        size_t vl);
vint16mf2_t __riscv_vxor_vv_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs2, vint16mf2_t vs1,
                                        size_t vl);
vint16mf2_t __riscv_vxor_vx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs2, int16_t rs1,
                                        size_t vl);
vint16m1_t __riscv_vxor_vv_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs2, vint16m1_t vs1,
                                      size_t vl);
vint16m1_t __riscv_vxor_vx_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs2, int16_t rs1, size_t vl);
vint16m2_t __riscv_vxor_vv_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs2, vint16m2_t vs1,
                                      size_t vl);
vint16m2_t __riscv_vxor_vx_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs2, int16_t rs1, size_t vl);
vint16m4_t __riscv_vxor_vv_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs2, vint16m4_t vs1,
                                      size_t vl);
vint16m4_t __riscv_vxor_vx_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs2, int16_t rs1, size_t vl);
vint16m8_t __riscv_vxor_vv_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs2, vint16m8_t vs1,
                                      size_t vl);
vint16m8_t __riscv_vxor_vx_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs2, int16_t rs1, size_t vl);
vint32mf2_t __riscv_vxor_vv_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs2, vint32mf2_t vs1,
                                        size_t vl);
vint32mf2_t __riscv_vxor_vx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs2, int32_t rs1,
                                        size_t vl);
vint32m1_t __riscv_vxor_vv_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs2, vint32m1_t vs1,
                                      size_t vl);
vint32m1_t __riscv_vxor_vx_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs2, int32_t rs1, size_t vl);
vint32m2_t __riscv_vxor_vv_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs2, vint32m2_t vs1,
                                      size_t vl);
vint32m2_t __riscv_vxor_vx_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs2, int32_t rs1, size_t vl);
vint32m4_t __riscv_vxor_vv_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs2, vint32m4_t vs1,
                                      size_t vl);
vint32m4_t __riscv_vxor_vx_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs2, int32_t rs1, size_t vl);
vint32m8_t __riscv_vxor_vv_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs2, vint32m8_t vs1,
                                      size_t vl);
vint32m8_t __riscv_vxor_vx_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs2, int32_t rs1, size_t vl);
vint64m1_t __riscv_vxor_vv_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs2, vint64m1_t vs1,
                                      size_t vl);
vint64m1_t __riscv_vxor_vx_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs2, int64_t rs1, size_t vl);
vint64m2_t __riscv_vxor_vv_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs2, vint64m2_t vs1,
                                      size_t vl);
vint64m2_t __riscv_vxor_vx_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs2, int64_t rs1, size_t vl);
vint64m4_t __riscv_vxor_vv_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs2, vint64m4_t vs1,
                                      size_t vl);
vint64m4_t __riscv_vxor_vx_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs2, int64_t rs1, size_t vl);
vint64m8_t __riscv_vxor_vv_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs2, vint64m8_t vs1,
                                      size_t vl);
vint64m8_t __riscv_vxor_vx_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs2, int64_t rs1, size_t vl);
vuint8mf8_t __riscv_vand_vv_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                       vuint8mf8_t vs2, vuint8mf8_t vs1,
                                       size_t vl);
vuint8mf8_t __riscv_vand_vx_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                       vuint8mf8_t vs2, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vand_vv_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                       vuint8mf4_t vs2, vuint8mf4_t vs1,
                                       size_t vl);
vuint8mf4_t __riscv_vand_vx_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                       vuint8mf4_t vs2, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vand_vv_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                       vuint8mf2_t vs2, vuint8mf2_t vs1,
                                       size_t vl);
vuint8mf2_t __riscv_vand_vx_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                       vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vand_vv_u8m1_tumu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                     vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vand_vx_u8m1_tumu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vand_vv_u8m2_tumu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                     vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vand_vx_u8m2_tumu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vand_vv_u8m4_tumu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                     vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vand_vx_u8m4_tumu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vand_vv_u8m8_tumu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                     vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vand_vx_u8m8_tumu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                     uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vand_vv_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs2, vuint16mf4_t vs1,
                                         size_t vl);
vuint16mf4_t __riscv_vand_vx_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs2, uint16_t rs1,
                                         size_t vl);
vuint16mf2_t __riscv_vand_vv_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs2, vuint16mf2_t vs1,
                                         size_t vl);
vuint16mf2_t __riscv_vand_vx_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs2, uint16_t rs1,
                                         size_t vl);
vuint16m1_t __riscv_vand_vv_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs2, vuint16m1_t vs1,
                                       size_t vl);
vuint16m1_t __riscv_vand_vx_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m2_t __riscv_vand_vv_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs2, vuint16m2_t vs1,
                                       size_t vl);
vuint16m2_t __riscv_vand_vx_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m4_t __riscv_vand_vv_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs2, vuint16m4_t vs1,
                                       size_t vl);
vuint16m4_t __riscv_vand_vx_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m8_t __riscv_vand_vv_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs2, vuint16m8_t vs1,
                                       size_t vl);
vuint16m8_t __riscv_vand_vx_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs2, uint16_t rs1,
                                       size_t vl);
vuint32mf2_t __riscv_vand_vv_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs2, vuint32mf2_t vs1,
                                         size_t vl);
vuint32mf2_t __riscv_vand_vx_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs2, uint32_t rs1,
                                         size_t vl);
vuint32m1_t __riscv_vand_vv_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs2, vuint32m1_t vs1,
                                       size_t vl);
vuint32m1_t __riscv_vand_vx_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m2_t __riscv_vand_vv_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs2, vuint32m2_t vs1,
                                       size_t vl);
vuint32m2_t __riscv_vand_vx_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m4_t __riscv_vand_vv_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs2, vuint32m4_t vs1,
                                       size_t vl);
vuint32m4_t __riscv_vand_vx_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m8_t __riscv_vand_vv_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs2, vuint32m8_t vs1,
                                       size_t vl);
vuint32m8_t __riscv_vand_vx_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs2, uint32_t rs1,
                                       size_t vl);
vuint64m1_t __riscv_vand_vv_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs2, vuint64m1_t vs1,
                                       size_t vl);
vuint64m1_t __riscv_vand_vx_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m2_t __riscv_vand_vv_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs2, vuint64m2_t vs1,
                                       size_t vl);
vuint64m2_t __riscv_vand_vx_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m4_t __riscv_vand_vv_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs2, vuint64m4_t vs1,
                                       size_t vl);
vuint64m4_t __riscv_vand_vx_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m8_t __riscv_vand_vv_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs2, vuint64m8_t vs1,
                                       size_t vl);
vuint64m8_t __riscv_vand_vx_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs2, uint64_t rs1,
                                       size_t vl);
vuint8mf8_t __riscv_vor_vv_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                      vuint8mf8_t vs2, vuint8mf8_t vs1,
                                      size_t vl);
vuint8mf8_t __riscv_vor_vx_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                      vuint8mf8_t vs2, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vor_vv_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                      vuint8mf4_t vs2, vuint8mf4_t vs1,
                                      size_t vl);
vuint8mf4_t __riscv_vor_vx_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                      vuint8mf4_t vs2, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vor_vv_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                      vuint8mf2_t vs2, vuint8mf2_t vs1,
                                      size_t vl);
vuint8mf2_t __riscv_vor_vx_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                      vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vor_vv_u8m1_tumu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                    vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vor_vx_u8m1_tumu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vor_vv_u8m2_tumu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                    vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vor_vx_u8m2_tumu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vor_vv_u8m4_tumu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                    vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vor_vx_u8m4_tumu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vor_vv_u8m8_tumu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                    vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vor_vx_u8m8_tumu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                    uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vor_vv_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                        vuint16mf4_t vs2, vuint16mf4_t vs1,
                                        size_t vl);
vuint16mf4_t __riscv_vor_vx_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                        vuint16mf4_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16mf2_t __riscv_vor_vv_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                        vuint16mf2_t vs2, vuint16mf2_t vs1,
                                        size_t vl);
vuint16mf2_t __riscv_vor_vx_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                        vuint16mf2_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16m1_t __riscv_vor_vv_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                      vuint16m1_t vs2, vuint16m1_t vs1,
                                      size_t vl);
vuint16m1_t __riscv_vor_vx_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                      vuint16m1_t vs2, uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vor_vv_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                      vuint16m2_t vs2, vuint16m2_t vs1,
                                      size_t vl);
vuint16m2_t __riscv_vor_vx_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                      vuint16m2_t vs2, uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vor_vv_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                      vuint16m4_t vs2, vuint16m4_t vs1,
                                      size_t vl);
vuint16m4_t __riscv_vor_vx_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                      vuint16m4_t vs2, uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vor_vv_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                      vuint16m8_t vs2, vuint16m8_t vs1,
                                      size_t vl);
vuint16m8_t __riscv_vor_vx_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                      vuint16m8_t vs2, uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vor_vv_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                        vuint32mf2_t vs2, vuint32mf2_t vs1,
                                        size_t vl);
vuint32mf2_t __riscv_vor_vx_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                        vuint32mf2_t vs2, uint32_t rs1,
                                        size_t vl);
vuint32m1_t __riscv_vor_vv_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                      vuint32m1_t vs2, vuint32m1_t vs1,
                                      size_t vl);
vuint32m1_t __riscv_vor_vx_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                      vuint32m1_t vs2, uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vor_vv_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                      vuint32m2_t vs2, vuint32m2_t vs1,
                                      size_t vl);
vuint32m2_t __riscv_vor_vx_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                      vuint32m2_t vs2, uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vor_vv_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                      vuint32m4_t vs2, vuint32m4_t vs1,
                                      size_t vl);
vuint32m4_t __riscv_vor_vx_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                      vuint32m4_t vs2, uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vor_vv_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                      vuint32m8_t vs2, vuint32m8_t vs1,
                                      size_t vl);
vuint32m8_t __riscv_vor_vx_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                      vuint32m8_t vs2, uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vor_vv_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                      vuint64m1_t vs2, vuint64m1_t vs1,
                                      size_t vl);
vuint64m1_t __riscv_vor_vx_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                      vuint64m1_t vs2, uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vor_vv_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                      vuint64m2_t vs2, vuint64m2_t vs1,
                                      size_t vl);
vuint64m2_t __riscv_vor_vx_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                      vuint64m2_t vs2, uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vor_vv_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                      vuint64m4_t vs2, vuint64m4_t vs1,
                                      size_t vl);
vuint64m4_t __riscv_vor_vx_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                      vuint64m4_t vs2, uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vor_vv_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                      vuint64m8_t vs2, vuint64m8_t vs1,
                                      size_t vl);
vuint64m8_t __riscv_vor_vx_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                      vuint64m8_t vs2, uint64_t rs1, size_t vl);
vuint8mf8_t __riscv_vxor_vv_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                       vuint8mf8_t vs2, vuint8mf8_t vs1,
                                       size_t vl);
vuint8mf8_t __riscv_vxor_vx_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                       vuint8mf8_t vs2, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vxor_vv_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                       vuint8mf4_t vs2, vuint8mf4_t vs1,
                                       size_t vl);
vuint8mf4_t __riscv_vxor_vx_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                       vuint8mf4_t vs2, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vxor_vv_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                       vuint8mf2_t vs2, vuint8mf2_t vs1,
                                       size_t vl);
vuint8mf2_t __riscv_vxor_vx_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                       vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vxor_vv_u8m1_tumu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                     vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vxor_vx_u8m1_tumu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vxor_vv_u8m2_tumu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                     vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vxor_vx_u8m2_tumu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vxor_vv_u8m4_tumu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                     vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vxor_vx_u8m4_tumu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vxor_vv_u8m8_tumu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                     vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vxor_vx_u8m8_tumu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                     uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vxor_vv_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs2, vuint16mf4_t vs1,
                                         size_t vl);
vuint16mf4_t __riscv_vxor_vx_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs2, uint16_t rs1,
                                         size_t vl);
vuint16mf2_t __riscv_vxor_vv_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs2, vuint16mf2_t vs1,
                                         size_t vl);
vuint16mf2_t __riscv_vxor_vx_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs2, uint16_t rs1,
                                         size_t vl);
vuint16m1_t __riscv_vxor_vv_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs2, vuint16m1_t vs1,
                                       size_t vl);
vuint16m1_t __riscv_vxor_vx_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m2_t __riscv_vxor_vv_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs2, vuint16m2_t vs1,
                                       size_t vl);
vuint16m2_t __riscv_vxor_vx_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m4_t __riscv_vxor_vv_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs2, vuint16m4_t vs1,
                                       size_t vl);
vuint16m4_t __riscv_vxor_vx_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m8_t __riscv_vxor_vv_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs2, vuint16m8_t vs1,
                                       size_t vl);
vuint16m8_t __riscv_vxor_vx_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs2, uint16_t rs1,
                                       size_t vl);
vuint32mf2_t __riscv_vxor_vv_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs2, vuint32mf2_t vs1,
                                         size_t vl);
vuint32mf2_t __riscv_vxor_vx_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs2, uint32_t rs1,
                                         size_t vl);
vuint32m1_t __riscv_vxor_vv_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs2, vuint32m1_t vs1,
                                       size_t vl);
vuint32m1_t __riscv_vxor_vx_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m2_t __riscv_vxor_vv_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs2, vuint32m2_t vs1,
                                       size_t vl);
vuint32m2_t __riscv_vxor_vx_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m4_t __riscv_vxor_vv_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs2, vuint32m4_t vs1,
                                       size_t vl);
vuint32m4_t __riscv_vxor_vx_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m8_t __riscv_vxor_vv_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs2, vuint32m8_t vs1,
                                       size_t vl);
vuint32m8_t __riscv_vxor_vx_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs2, uint32_t rs1,
                                       size_t vl);
vuint64m1_t __riscv_vxor_vv_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs2, vuint64m1_t vs1,
                                       size_t vl);
vuint64m1_t __riscv_vxor_vx_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m2_t __riscv_vxor_vv_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs2, vuint64m2_t vs1,
                                       size_t vl);
vuint64m2_t __riscv_vxor_vx_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m4_t __riscv_vxor_vv_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs2, vuint64m4_t vs1,
                                       size_t vl);
vuint64m4_t __riscv_vxor_vx_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m8_t __riscv_vxor_vv_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs2, vuint64m8_t vs1,
                                       size_t vl);
vuint64m8_t __riscv_vxor_vx_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs2, uint64_t rs1,
                                       size_t vl);
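With the _tumu prototypes above, both the tail elements and the masked-off elements of the result keep the values passed in through vd, so a selectively updated register can be stored back with a plain unmasked store. A minimal sketch, again with assumed helper and buffer names:

#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

/* Illustrative sketch: OR `bits` into every negative element of `data`.
 * Masked-off lanes keep their loaded values (mask-undisturbed), so the
 * result is stored back without a mask. */
static void or_into_negatives_i32(int32_t *data, int32_t bits, size_t n) {
  for (size_t i = 0; i < n;) {
    size_t vl = __riscv_vsetvl_e32m1(n - i);
    vint32m1_t vd = __riscv_vle32_v_i32m1(&data[i], vl);
    vbool32_t vm = __riscv_vmslt_vx_i32m1_b32(vd, 0, vl);   /* data[j] < 0 */
    vd = __riscv_vor_vx_i32m1_tumu(vm, vd, vd, bits, vl);
    __riscv_vse32_v_i32m1(&data[i], vd, vl);
    i += vl;
  }
}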
// masked functions (mask-undisturbed policy: _mu suffix)
vint8mf8_t __riscv_vand_vv_i8mf8_mu(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs2,
                                    vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vand_vx_i8mf8_mu(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs2,
                                    int8_t rs1, size_t vl);
vint8mf4_t __riscv_vand_vv_i8mf4_mu(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs2,
                                    vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vand_vx_i8mf4_mu(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs2,
                                    int8_t rs1, size_t vl);
vint8mf2_t __riscv_vand_vv_i8mf2_mu(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs2,
                                    vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vand_vx_i8mf2_mu(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs2,
                                    int8_t rs1, size_t vl);
vint8m1_t __riscv_vand_vv_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                  vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vand_vx_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                  int8_t rs1, size_t vl);
vint8m2_t __riscv_vand_vv_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                  vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vand_vx_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                  int8_t rs1, size_t vl);
vint8m4_t __riscv_vand_vv_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                  vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vand_vx_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                  int8_t rs1, size_t vl);
vint8m8_t __riscv_vand_vv_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                  vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vand_vx_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                  int8_t rs1, size_t vl);
vint16mf4_t __riscv_vand_vv_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                      vint16mf4_t vs2, vint16mf4_t vs1,
                                      size_t vl);
vint16mf4_t __riscv_vand_vx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                      vint16mf4_t vs2, int16_t rs1, size_t vl);
vint16mf2_t __riscv_vand_vv_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                      vint16mf2_t vs2, vint16mf2_t vs1,
                                      size_t vl);
vint16mf2_t __riscv_vand_vx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                      vint16mf2_t vs2, int16_t rs1, size_t vl);
vint16m1_t __riscv_vand_vv_i16m1_mu(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                                    vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vand_vx_i16m1_mu(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                                    int16_t rs1, size_t vl);
vint16m2_t __riscv_vand_vv_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                    vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vand_vx_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                    int16_t rs1, size_t vl);
vint16m4_t __riscv_vand_vv_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                    vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vand_vx_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                    int16_t rs1, size_t vl);
vint16m8_t __riscv_vand_vv_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                    vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vand_vx_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                    int16_t rs1, size_t vl);
vint32mf2_t __riscv_vand_vv_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                      vint32mf2_t vs2, vint32mf2_t vs1,
                                      size_t vl);
vint32mf2_t __riscv_vand_vx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                      vint32mf2_t vs2, int32_t rs1, size_t vl);
vint32m1_t __riscv_vand_vv_i32m1_mu(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                                    vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vand_vx_i32m1_mu(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                                    int32_t rs1, size_t vl);
vint32m2_t __riscv_vand_vv_i32m2_mu(vbool16_t vm, vint32m2_t vd, vint32m2_t vs2,
                                    vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vand_vx_i32m2_mu(vbool16_t vm, vint32m2_t vd, vint32m2_t vs2,
                                    int32_t rs1, size_t vl);
vint32m4_t __riscv_vand_vv_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                    vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vand_vx_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                    int32_t rs1, size_t vl);
vint32m8_t __riscv_vand_vv_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                    vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vand_vx_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                    int32_t rs1, size_t vl);
vint64m1_t __riscv_vand_vv_i64m1_mu(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                                    vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vand_vx_i64m1_mu(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                                    int64_t rs1, size_t vl);
vint64m2_t __riscv_vand_vv_i64m2_mu(vbool32_t vm, vint64m2_t vd, vint64m2_t vs2,
                                    vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vand_vx_i64m2_mu(vbool32_t vm, vint64m2_t vd, vint64m2_t vs2,
                                    int64_t rs1, size_t vl);
vint64m4_t __riscv_vand_vv_i64m4_mu(vbool16_t vm, vint64m4_t vd, vint64m4_t vs2,
                                    vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vand_vx_i64m4_mu(vbool16_t vm, vint64m4_t vd, vint64m4_t vs2,
                                    int64_t rs1, size_t vl);
vint64m8_t __riscv_vand_vv_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                    vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vand_vx_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                    int64_t rs1, size_t vl);
vint8mf8_t __riscv_vor_vv_i8mf8_mu(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs2,
                                   vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vor_vx_i8mf8_mu(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs2,
                                   int8_t rs1, size_t vl);
vint8mf4_t __riscv_vor_vv_i8mf4_mu(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs2,
                                   vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vor_vx_i8mf4_mu(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs2,
                                   int8_t rs1, size_t vl);
vint8mf2_t __riscv_vor_vv_i8mf2_mu(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs2,
                                   vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vor_vx_i8mf2_mu(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs2,
                                   int8_t rs1, size_t vl);
vint8m1_t __riscv_vor_vv_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                 vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vor_vx_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                 int8_t rs1, size_t vl);
vint8m2_t __riscv_vor_vv_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                 vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vor_vx_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                 int8_t rs1, size_t vl);
vint8m4_t __riscv_vor_vv_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                 vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vor_vx_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                 int8_t rs1, size_t vl);
vint8m8_t __riscv_vor_vv_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                 vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vor_vx_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                 int8_t rs1, size_t vl);
vint16mf4_t __riscv_vor_vv_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                     vint16mf4_t vs2, vint16mf4_t vs1,
                                     size_t vl);
vint16mf4_t __riscv_vor_vx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                     vint16mf4_t vs2, int16_t rs1, size_t vl);
vint16mf2_t __riscv_vor_vv_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                     vint16mf2_t vs2, vint16mf2_t vs1,
                                     size_t vl);
vint16mf2_t __riscv_vor_vx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                     vint16mf2_t vs2, int16_t rs1, size_t vl);
vint16m1_t __riscv_vor_vv_i16m1_mu(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                                   vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vor_vx_i16m1_mu(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                                   int16_t rs1, size_t vl);
vint16m2_t __riscv_vor_vv_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                   vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vor_vx_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                   int16_t rs1, size_t vl);
vint16m4_t __riscv_vor_vv_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                   vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vor_vx_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                   int16_t rs1, size_t vl);
vint16m8_t __riscv_vor_vv_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                   vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vor_vx_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                   int16_t rs1, size_t vl);
vint32mf2_t __riscv_vor_vv_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                     vint32mf2_t vs2, vint32mf2_t vs1,
                                     size_t vl);
vint32mf2_t __riscv_vor_vx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                     vint32mf2_t vs2, int32_t rs1, size_t vl);
vint32m1_t __riscv_vor_vv_i32m1_mu(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                                   vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vor_vx_i32m1_mu(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                                   int32_t rs1, size_t vl);
vint32m2_t __riscv_vor_vv_i32m2_mu(vbool16_t vm, vint32m2_t vd, vint32m2_t vs2,
                                   vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vor_vx_i32m2_mu(vbool16_t vm, vint32m2_t vd, vint32m2_t vs2,
                                   int32_t rs1, size_t vl);
vint32m4_t __riscv_vor_vv_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                   vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vor_vx_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                   int32_t rs1, size_t vl);
vint32m8_t __riscv_vor_vv_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                   vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vor_vx_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                   int32_t rs1, size_t vl);
vint64m1_t __riscv_vor_vv_i64m1_mu(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                                   vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vor_vx_i64m1_mu(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                                   int64_t rs1, size_t vl);
vint64m2_t __riscv_vor_vv_i64m2_mu(vbool32_t vm, vint64m2_t vd, vint64m2_t vs2,
                                   vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vor_vx_i64m2_mu(vbool32_t vm, vint64m2_t vd, vint64m2_t vs2,
                                   int64_t rs1, size_t vl);
vint64m4_t __riscv_vor_vv_i64m4_mu(vbool16_t vm, vint64m4_t vd, vint64m4_t vs2,
                                   vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vor_vx_i64m4_mu(vbool16_t vm, vint64m4_t vd, vint64m4_t vs2,
                                   int64_t rs1, size_t vl);
vint64m8_t __riscv_vor_vv_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                   vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vor_vx_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                   int64_t rs1, size_t vl);
vint8mf8_t __riscv_vxor_vv_i8mf8_mu(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs2,
                                    vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vxor_vx_i8mf8_mu(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs2,
                                    int8_t rs1, size_t vl);
vint8mf4_t __riscv_vxor_vv_i8mf4_mu(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs2,
                                    vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vxor_vx_i8mf4_mu(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs2,
                                    int8_t rs1, size_t vl);
vint8mf2_t __riscv_vxor_vv_i8mf2_mu(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs2,
                                    vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vxor_vx_i8mf2_mu(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs2,
                                    int8_t rs1, size_t vl);
vint8m1_t __riscv_vxor_vv_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                  vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vxor_vx_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                  int8_t rs1, size_t vl);
vint8m2_t __riscv_vxor_vv_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                  vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vxor_vx_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                  int8_t rs1, size_t vl);
vint8m4_t __riscv_vxor_vv_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                  vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vxor_vx_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                  int8_t rs1, size_t vl);
vint8m8_t __riscv_vxor_vv_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                  vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vxor_vx_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                  int8_t rs1, size_t vl);
vint16mf4_t __riscv_vxor_vv_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                      vint16mf4_t vs2, vint16mf4_t vs1,
                                      size_t vl);
vint16mf4_t __riscv_vxor_vx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                      vint16mf4_t vs2, int16_t rs1, size_t vl);
vint16mf2_t __riscv_vxor_vv_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                      vint16mf2_t vs2, vint16mf2_t vs1,
                                      size_t vl);
vint16mf2_t __riscv_vxor_vx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                      vint16mf2_t vs2, int16_t rs1, size_t vl);
vint16m1_t __riscv_vxor_vv_i16m1_mu(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                                    vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vxor_vx_i16m1_mu(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                                    int16_t rs1, size_t vl);
vint16m2_t __riscv_vxor_vv_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                    vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vxor_vx_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                    int16_t rs1, size_t vl);
vint16m4_t __riscv_vxor_vv_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                    vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vxor_vx_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                    int16_t rs1, size_t vl);
vint16m8_t __riscv_vxor_vv_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                    vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vxor_vx_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                    int16_t rs1, size_t vl);
vint32mf2_t __riscv_vxor_vv_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                      vint32mf2_t vs2, vint32mf2_t vs1,
                                      size_t vl);
vint32mf2_t __riscv_vxor_vx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                      vint32mf2_t vs2, int32_t rs1, size_t vl);
vint32m1_t __riscv_vxor_vv_i32m1_mu(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                                    vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vxor_vx_i32m1_mu(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                                    int32_t rs1, size_t vl);
vint32m2_t __riscv_vxor_vv_i32m2_mu(vbool16_t vm, vint32m2_t vd, vint32m2_t vs2,
                                    vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vxor_vx_i32m2_mu(vbool16_t vm, vint32m2_t vd, vint32m2_t vs2,
                                    int32_t rs1, size_t vl);
vint32m4_t __riscv_vxor_vv_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                    vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vxor_vx_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                    int32_t rs1, size_t vl);
vint32m8_t __riscv_vxor_vv_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                    vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vxor_vx_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                    int32_t rs1, size_t vl);
vint64m1_t __riscv_vxor_vv_i64m1_mu(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                                    vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vxor_vx_i64m1_mu(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                                    int64_t rs1, size_t vl);
vint64m2_t __riscv_vxor_vv_i64m2_mu(vbool32_t vm, vint64m2_t vd, vint64m2_t vs2,
                                    vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vxor_vx_i64m2_mu(vbool32_t vm, vint64m2_t vd, vint64m2_t vs2,
                                    int64_t rs1, size_t vl);
vint64m4_t __riscv_vxor_vv_i64m4_mu(vbool16_t vm, vint64m4_t vd, vint64m4_t vs2,
                                    vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vxor_vx_i64m4_mu(vbool16_t vm, vint64m4_t vd, vint64m4_t vs2,
                                    int64_t rs1, size_t vl);
vint64m8_t __riscv_vxor_vv_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                    vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vxor_vx_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                    int64_t rs1, size_t vl);
vuint8mf8_t __riscv_vand_vv_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                     vuint8mf8_t vs2, vuint8mf8_t vs1,
                                     size_t vl);
vuint8mf8_t __riscv_vand_vx_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                     vuint8mf8_t vs2, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vand_vv_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                     vuint8mf4_t vs2, vuint8mf4_t vs1,
                                     size_t vl);
vuint8mf4_t __riscv_vand_vx_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                     vuint8mf4_t vs2, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vand_vv_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                     vuint8mf2_t vs2, vuint8mf2_t vs1,
                                     size_t vl);
vuint8mf2_t __riscv_vand_vx_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                     vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vand_vv_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                   vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vand_vx_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                   uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vand_vv_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                   vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vand_vx_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                   uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vand_vv_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                   vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vand_vx_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                   uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vand_vv_u8m8_mu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                   vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vand_vx_u8m8_mu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                   uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vand_vv_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                       vuint16mf4_t vs2, vuint16mf4_t vs1,
                                       size_t vl);
vuint16mf4_t __riscv_vand_vx_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                       vuint16mf4_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16mf2_t __riscv_vand_vv_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                       vuint16mf2_t vs2, vuint16mf2_t vs1,
                                       size_t vl);
vuint16mf2_t __riscv_vand_vx_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                       vuint16mf2_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m1_t __riscv_vand_vv_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                     vuint16m1_t vs2, vuint16m1_t vs1,
                                     size_t vl);
vuint16m1_t __riscv_vand_vx_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                     vuint16m1_t vs2, uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vand_vv_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                     vuint16m2_t vs2, vuint16m2_t vs1,
                                     size_t vl);
vuint16m2_t __riscv_vand_vx_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                     vuint16m2_t vs2, uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vand_vv_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                     vuint16m4_t vs2, vuint16m4_t vs1,
                                     size_t vl);
vuint16m4_t __riscv_vand_vx_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                     vuint16m4_t vs2, uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vand_vv_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                     vuint16m8_t vs2, vuint16m8_t vs1,
                                     size_t vl);
vuint16m8_t __riscv_vand_vx_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                     vuint16m8_t vs2, uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vand_vv_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                       vuint32mf2_t vs2, vuint32mf2_t vs1,
                                       size_t vl);
vuint32mf2_t __riscv_vand_vx_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                       vuint32mf2_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m1_t __riscv_vand_vv_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                     vuint32m1_t vs2, vuint32m1_t vs1,
                                     size_t vl);
vuint32m1_t __riscv_vand_vx_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                     vuint32m1_t vs2, uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vand_vv_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                     vuint32m2_t vs2, vuint32m2_t vs1,
                                     size_t vl);
vuint32m2_t __riscv_vand_vx_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                     vuint32m2_t vs2, uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vand_vv_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                     vuint32m4_t vs2, vuint32m4_t vs1,
                                     size_t vl);
vuint32m4_t __riscv_vand_vx_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                     vuint32m4_t vs2, uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vand_vv_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                     vuint32m8_t vs2, vuint32m8_t vs1,
                                     size_t vl);
vuint32m8_t __riscv_vand_vx_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                     vuint32m8_t vs2, uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vand_vv_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                     vuint64m1_t vs2, vuint64m1_t vs1,
                                     size_t vl);
vuint64m1_t __riscv_vand_vx_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                     vuint64m1_t vs2, uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vand_vv_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                     vuint64m2_t vs2, vuint64m2_t vs1,
                                     size_t vl);
vuint64m2_t __riscv_vand_vx_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                     vuint64m2_t vs2, uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vand_vv_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                     vuint64m4_t vs2, vuint64m4_t vs1,
                                     size_t vl);
vuint64m4_t __riscv_vand_vx_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                     vuint64m4_t vs2, uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vand_vv_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                     vuint64m8_t vs2, vuint64m8_t vs1,
                                     size_t vl);
vuint64m8_t __riscv_vand_vx_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                     vuint64m8_t vs2, uint64_t rs1, size_t vl);
vuint8mf8_t __riscv_vor_vv_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                    vuint8mf8_t vs2, vuint8mf8_t vs1,
                                    size_t vl);
vuint8mf8_t __riscv_vor_vx_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                    vuint8mf8_t vs2, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vor_vv_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                    vuint8mf4_t vs2, vuint8mf4_t vs1,
                                    size_t vl);
vuint8mf4_t __riscv_vor_vx_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                    vuint8mf4_t vs2, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vor_vv_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                    vuint8mf2_t vs2, vuint8mf2_t vs1,
                                    size_t vl);
vuint8mf2_t __riscv_vor_vx_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                    vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vor_vv_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                  vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vor_vx_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                  uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vor_vv_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                  vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vor_vx_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                  uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vor_vv_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                  vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vor_vx_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                  uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vor_vv_u8m8_mu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                  vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vor_vx_u8m8_mu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                  uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vor_vv_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                      vuint16mf4_t vs2, vuint16mf4_t vs1,
                                      size_t vl);
vuint16mf4_t __riscv_vor_vx_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                      vuint16mf4_t vs2, uint16_t rs1,
                                      size_t vl);
vuint16mf2_t __riscv_vor_vv_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                      vuint16mf2_t vs2, vuint16mf2_t vs1,
                                      size_t vl);
vuint16mf2_t __riscv_vor_vx_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                      vuint16mf2_t vs2, uint16_t rs1,
                                      size_t vl);
vuint16m1_t __riscv_vor_vv_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                    vuint16m1_t vs2, vuint16m1_t vs1,
                                    size_t vl);
vuint16m1_t __riscv_vor_vx_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                    vuint16m1_t vs2, uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vor_vv_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                    vuint16m2_t vs2, vuint16m2_t vs1,
                                    size_t vl);
vuint16m2_t __riscv_vor_vx_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                    vuint16m2_t vs2, uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vor_vv_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                    vuint16m4_t vs2, vuint16m4_t vs1,
                                    size_t vl);
vuint16m4_t __riscv_vor_vx_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                    vuint16m4_t vs2, uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vor_vv_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                    vuint16m8_t vs2, vuint16m8_t vs1,
                                    size_t vl);
vuint16m8_t __riscv_vor_vx_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                    vuint16m8_t vs2, uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vor_vv_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                      vuint32mf2_t vs2, vuint32mf2_t vs1,
                                      size_t vl);
vuint32mf2_t __riscv_vor_vx_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                      vuint32mf2_t vs2, uint32_t rs1,
                                      size_t vl);
vuint32m1_t __riscv_vor_vv_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                    vuint32m1_t vs2, vuint32m1_t vs1,
                                    size_t vl);
vuint32m1_t __riscv_vor_vx_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                    vuint32m1_t vs2, uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vor_vv_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                    vuint32m2_t vs2, vuint32m2_t vs1,
                                    size_t vl);
vuint32m2_t __riscv_vor_vx_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                    vuint32m2_t vs2, uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vor_vv_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                    vuint32m4_t vs2, vuint32m4_t vs1,
                                    size_t vl);
vuint32m4_t __riscv_vor_vx_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                    vuint32m4_t vs2, uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vor_vv_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                    vuint32m8_t vs2, vuint32m8_t vs1,
                                    size_t vl);
vuint32m8_t __riscv_vor_vx_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                    vuint32m8_t vs2, uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vor_vv_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                    vuint64m1_t vs2, vuint64m1_t vs1,
                                    size_t vl);
vuint64m1_t __riscv_vor_vx_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                    vuint64m1_t vs2, uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vor_vv_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                    vuint64m2_t vs2, vuint64m2_t vs1,
                                    size_t vl);
vuint64m2_t __riscv_vor_vx_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                    vuint64m2_t vs2, uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vor_vv_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                    vuint64m4_t vs2, vuint64m4_t vs1,
                                    size_t vl);
vuint64m4_t __riscv_vor_vx_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                    vuint64m4_t vs2, uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vor_vv_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                    vuint64m8_t vs2, vuint64m8_t vs1,
                                    size_t vl);
vuint64m8_t __riscv_vor_vx_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                    vuint64m8_t vs2, uint64_t rs1, size_t vl);
vuint8mf8_t __riscv_vxor_vv_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                     vuint8mf8_t vs2, vuint8mf8_t vs1,
                                     size_t vl);
vuint8mf8_t __riscv_vxor_vx_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                     vuint8mf8_t vs2, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vxor_vv_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                     vuint8mf4_t vs2, vuint8mf4_t vs1,
                                     size_t vl);
vuint8mf4_t __riscv_vxor_vx_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                     vuint8mf4_t vs2, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vxor_vv_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                     vuint8mf2_t vs2, vuint8mf2_t vs1,
                                     size_t vl);
vuint8mf2_t __riscv_vxor_vx_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                     vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vxor_vv_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                   vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vxor_vx_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                   uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vxor_vv_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                   vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vxor_vx_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                   uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vxor_vv_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                   vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vxor_vx_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                   uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vxor_vv_u8m8_mu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                   vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vxor_vx_u8m8_mu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                   uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vxor_vv_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                       vuint16mf4_t vs2, vuint16mf4_t vs1,
                                       size_t vl);
vuint16mf4_t __riscv_vxor_vx_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                       vuint16mf4_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16mf2_t __riscv_vxor_vv_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                       vuint16mf2_t vs2, vuint16mf2_t vs1,
                                       size_t vl);
vuint16mf2_t __riscv_vxor_vx_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                       vuint16mf2_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m1_t __riscv_vxor_vv_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                     vuint16m1_t vs2, vuint16m1_t vs1,
                                     size_t vl);
vuint16m1_t __riscv_vxor_vx_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                     vuint16m1_t vs2, uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vxor_vv_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                     vuint16m2_t vs2, vuint16m2_t vs1,
                                     size_t vl);
vuint16m2_t __riscv_vxor_vx_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                     vuint16m2_t vs2, uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vxor_vv_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                     vuint16m4_t vs2, vuint16m4_t vs1,
                                     size_t vl);
vuint16m4_t __riscv_vxor_vx_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                     vuint16m4_t vs2, uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vxor_vv_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                     vuint16m8_t vs2, vuint16m8_t vs1,
                                     size_t vl);
vuint16m8_t __riscv_vxor_vx_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                     vuint16m8_t vs2, uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vxor_vv_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                       vuint32mf2_t vs2, vuint32mf2_t vs1,
                                       size_t vl);
vuint32mf2_t __riscv_vxor_vx_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                       vuint32mf2_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m1_t __riscv_vxor_vv_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                     vuint32m1_t vs2, vuint32m1_t vs1,
                                     size_t vl);
vuint32m1_t __riscv_vxor_vx_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                     vuint32m1_t vs2, uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vxor_vv_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                     vuint32m2_t vs2, vuint32m2_t vs1,
                                     size_t vl);
vuint32m2_t __riscv_vxor_vx_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                     vuint32m2_t vs2, uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vxor_vv_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                     vuint32m4_t vs2, vuint32m4_t vs1,
                                     size_t vl);
vuint32m4_t __riscv_vxor_vx_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                     vuint32m4_t vs2, uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vxor_vv_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                     vuint32m8_t vs2, vuint32m8_t vs1,
                                     size_t vl);
vuint32m8_t __riscv_vxor_vx_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                     vuint32m8_t vs2, uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vxor_vv_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                     vuint64m1_t vs2, vuint64m1_t vs1,
                                     size_t vl);
vuint64m1_t __riscv_vxor_vx_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                     vuint64m1_t vs2, uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vxor_vv_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                     vuint64m2_t vs2, vuint64m2_t vs1,
                                     size_t vl);
vuint64m2_t __riscv_vxor_vx_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                     vuint64m2_t vs2, uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vxor_vv_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                     vuint64m4_t vs2, vuint64m4_t vs1,
                                     size_t vl);
vuint64m4_t __riscv_vxor_vx_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                     vuint64m4_t vs2, uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vxor_vv_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                     vuint64m8_t vs2, vuint64m8_t vs1,
                                     size_t vl);
vuint64m8_t __riscv_vxor_vx_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                     vuint64m8_t vs2, uint64_t rs1, size_t vl);
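
The _mu (mask-undisturbed) variants above write only the active elements; inactive elements keep whatever value is already in vd. Below is a minimal sketch of one way to use this, assuming the usual __riscv_vsetvl_e32m1, __riscv_vle32_v_i32m1, __riscv_vse32_v_i32m1, and __riscv_vmslt_vx_i32m1_b32 intrinsics from the configuration, load/store, and comparison sections of this API: OR a flag bit into only the negative elements of a buffer. Passing the loaded vector as both vd and vs2 lets the inactive lanes pass through unchanged.

#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

// Set a flag bit in every negative element of buf; other elements are left
// untouched because the _mu policy keeps inactive lanes equal to vd.
void or_flag_into_negatives(int32_t *buf, size_t n, int32_t flag) {
  while (n > 0) {
    size_t vl = __riscv_vsetvl_e32m1(n);
    vint32m1_t v = __riscv_vle32_v_i32m1(buf, vl);
    // Active lanes: elements that are negative.
    vbool32_t m = __riscv_vmslt_vx_i32m1_b32(v, 0, vl);
    // vd = v, so inactive lanes pass through; active lanes become v | flag.
    vint32m1_t r = __riscv_vor_vx_i32m1_mu(m, v, v, flag, vl);
    __riscv_vse32_v_i32m1(buf, r, vl);
    buf += vl;
    n -= vl;
  }
}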

Vector Bitwise Unary Logical Intrinsics

vint8mf8_t __riscv_vnot_v_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs, size_t vl);
vint8mf4_t __riscv_vnot_v_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs, size_t vl);
vint8mf2_t __riscv_vnot_v_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs, size_t vl);
vint8m1_t __riscv_vnot_v_i8m1_tu(vint8m1_t vd, vint8m1_t vs, size_t vl);
vint8m2_t __riscv_vnot_v_i8m2_tu(vint8m2_t vd, vint8m2_t vs, size_t vl);
vint8m4_t __riscv_vnot_v_i8m4_tu(vint8m4_t vd, vint8m4_t vs, size_t vl);
vint8m8_t __riscv_vnot_v_i8m8_tu(vint8m8_t vd, vint8m8_t vs, size_t vl);
vint16mf4_t __riscv_vnot_v_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs, size_t vl);
vint16mf2_t __riscv_vnot_v_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs, size_t vl);
vint16m1_t __riscv_vnot_v_i16m1_tu(vint16m1_t vd, vint16m1_t vs, size_t vl);
vint16m2_t __riscv_vnot_v_i16m2_tu(vint16m2_t vd, vint16m2_t vs, size_t vl);
vint16m4_t __riscv_vnot_v_i16m4_tu(vint16m4_t vd, vint16m4_t vs, size_t vl);
vint16m8_t __riscv_vnot_v_i16m8_tu(vint16m8_t vd, vint16m8_t vs, size_t vl);
vint32mf2_t __riscv_vnot_v_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs, size_t vl);
vint32m1_t __riscv_vnot_v_i32m1_tu(vint32m1_t vd, vint32m1_t vs, size_t vl);
vint32m2_t __riscv_vnot_v_i32m2_tu(vint32m2_t vd, vint32m2_t vs, size_t vl);
vint32m4_t __riscv_vnot_v_i32m4_tu(vint32m4_t vd, vint32m4_t vs, size_t vl);
vint32m8_t __riscv_vnot_v_i32m8_tu(vint32m8_t vd, vint32m8_t vs, size_t vl);
vint64m1_t __riscv_vnot_v_i64m1_tu(vint64m1_t vd, vint64m1_t vs, size_t vl);
vint64m2_t __riscv_vnot_v_i64m2_tu(vint64m2_t vd, vint64m2_t vs, size_t vl);
vint64m4_t __riscv_vnot_v_i64m4_tu(vint64m4_t vd, vint64m4_t vs, size_t vl);
vint64m8_t __riscv_vnot_v_i64m8_tu(vint64m8_t vd, vint64m8_t vs, size_t vl);
vuint8mf8_t __riscv_vnot_v_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs, size_t vl);
vuint8mf4_t __riscv_vnot_v_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs, size_t vl);
vuint8mf2_t __riscv_vnot_v_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs, size_t vl);
vuint8m1_t __riscv_vnot_v_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs, size_t vl);
vuint8m2_t __riscv_vnot_v_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs, size_t vl);
vuint8m4_t __riscv_vnot_v_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs, size_t vl);
vuint8m8_t __riscv_vnot_v_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs, size_t vl);
vuint16mf4_t __riscv_vnot_v_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs,
                                      size_t vl);
vuint16mf2_t __riscv_vnot_v_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs,
                                      size_t vl);
vuint16m1_t __riscv_vnot_v_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs, size_t vl);
vuint16m2_t __riscv_vnot_v_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs, size_t vl);
vuint16m4_t __riscv_vnot_v_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs, size_t vl);
vuint16m8_t __riscv_vnot_v_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs, size_t vl);
vuint32mf2_t __riscv_vnot_v_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs,
                                      size_t vl);
vuint32m1_t __riscv_vnot_v_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs, size_t vl);
vuint32m2_t __riscv_vnot_v_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs, size_t vl);
vuint32m4_t __riscv_vnot_v_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs, size_t vl);
vuint32m8_t __riscv_vnot_v_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs, size_t vl);
vuint64m1_t __riscv_vnot_v_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs, size_t vl);
vuint64m2_t __riscv_vnot_v_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs, size_t vl);
vuint64m4_t __riscv_vnot_v_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs, size_t vl);
vuint64m8_t __riscv_vnot_v_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs, size_t vl);
// masked functions
vint8mf8_t __riscv_vnot_v_i8mf8_tum(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs,
                                    size_t vl);
vint8mf4_t __riscv_vnot_v_i8mf4_tum(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs,
                                    size_t vl);
vint8mf2_t __riscv_vnot_v_i8mf2_tum(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs,
                                    size_t vl);
vint8m1_t __riscv_vnot_v_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs,
                                  size_t vl);
vint8m2_t __riscv_vnot_v_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs,
                                  size_t vl);
vint8m4_t __riscv_vnot_v_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs,
                                  size_t vl);
vint8m8_t __riscv_vnot_v_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs,
                                  size_t vl);
vint16mf4_t __riscv_vnot_v_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                      vint16mf4_t vs, size_t vl);
vint16mf2_t __riscv_vnot_v_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                      vint16mf2_t vs, size_t vl);
vint16m1_t __riscv_vnot_v_i16m1_tum(vbool16_t vm, vint16m1_t vd, vint16m1_t vs,
                                    size_t vl);
vint16m2_t __riscv_vnot_v_i16m2_tum(vbool8_t vm, vint16m2_t vd, vint16m2_t vs,
                                    size_t vl);
vint16m4_t __riscv_vnot_v_i16m4_tum(vbool4_t vm, vint16m4_t vd, vint16m4_t vs,
                                    size_t vl);
vint16m8_t __riscv_vnot_v_i16m8_tum(vbool2_t vm, vint16m8_t vd, vint16m8_t vs,
                                    size_t vl);
vint32mf2_t __riscv_vnot_v_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                      vint32mf2_t vs, size_t vl);
vint32m1_t __riscv_vnot_v_i32m1_tum(vbool32_t vm, vint32m1_t vd, vint32m1_t vs,
                                    size_t vl);
vint32m2_t __riscv_vnot_v_i32m2_tum(vbool16_t vm, vint32m2_t vd, vint32m2_t vs,
                                    size_t vl);
vint32m4_t __riscv_vnot_v_i32m4_tum(vbool8_t vm, vint32m4_t vd, vint32m4_t vs,
                                    size_t vl);
vint32m8_t __riscv_vnot_v_i32m8_tum(vbool4_t vm, vint32m8_t vd, vint32m8_t vs,
                                    size_t vl);
vint64m1_t __riscv_vnot_v_i64m1_tum(vbool64_t vm, vint64m1_t vd, vint64m1_t vs,
                                    size_t vl);
vint64m2_t __riscv_vnot_v_i64m2_tum(vbool32_t vm, vint64m2_t vd, vint64m2_t vs,
                                    size_t vl);
vint64m4_t __riscv_vnot_v_i64m4_tum(vbool16_t vm, vint64m4_t vd, vint64m4_t vs,
                                    size_t vl);
vint64m8_t __riscv_vnot_v_i64m8_tum(vbool8_t vm, vint64m8_t vd, vint64m8_t vs,
                                    size_t vl);
vuint8mf8_t __riscv_vnot_v_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                     vuint8mf8_t vs, size_t vl);
vuint8mf4_t __riscv_vnot_v_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                     vuint8mf4_t vs, size_t vl);
vuint8mf2_t __riscv_vnot_v_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                     vuint8mf2_t vs, size_t vl);
vuint8m1_t __riscv_vnot_v_u8m1_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs,
                                   size_t vl);
vuint8m2_t __riscv_vnot_v_u8m2_tum(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs,
                                   size_t vl);
vuint8m4_t __riscv_vnot_v_u8m4_tum(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs,
                                   size_t vl);
vuint8m8_t __riscv_vnot_v_u8m8_tum(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs,
                                   size_t vl);
vuint16mf4_t __riscv_vnot_v_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                       vuint16mf4_t vs, size_t vl);
vuint16mf2_t __riscv_vnot_v_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                       vuint16mf2_t vs, size_t vl);
vuint16m1_t __riscv_vnot_v_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                     vuint16m1_t vs, size_t vl);
vuint16m2_t __riscv_vnot_v_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                     vuint16m2_t vs, size_t vl);
vuint16m4_t __riscv_vnot_v_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                     vuint16m4_t vs, size_t vl);
vuint16m8_t __riscv_vnot_v_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                     vuint16m8_t vs, size_t vl);
vuint32mf2_t __riscv_vnot_v_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                       vuint32mf2_t vs, size_t vl);
vuint32m1_t __riscv_vnot_v_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                     vuint32m1_t vs, size_t vl);
vuint32m2_t __riscv_vnot_v_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                     vuint32m2_t vs, size_t vl);
vuint32m4_t __riscv_vnot_v_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                     vuint32m4_t vs, size_t vl);
vuint32m8_t __riscv_vnot_v_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                     vuint32m8_t vs, size_t vl);
vuint64m1_t __riscv_vnot_v_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                     vuint64m1_t vs, size_t vl);
vuint64m2_t __riscv_vnot_v_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                     vuint64m2_t vs, size_t vl);
vuint64m4_t __riscv_vnot_v_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                     vuint64m4_t vs, size_t vl);
vuint64m8_t __riscv_vnot_v_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                     vuint64m8_t vs, size_t vl);
// masked functions
vint8mf8_t __riscv_vnot_v_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs,
                                     size_t vl);
vint8mf4_t __riscv_vnot_v_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs,
                                     size_t vl);
vint8mf2_t __riscv_vnot_v_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs,
                                     size_t vl);
vint8m1_t __riscv_vnot_v_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs,
                                   size_t vl);
vint8m2_t __riscv_vnot_v_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs,
                                   size_t vl);
vint8m4_t __riscv_vnot_v_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs,
                                   size_t vl);
vint8m8_t __riscv_vnot_v_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs,
                                   size_t vl);
vint16mf4_t __riscv_vnot_v_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs, size_t vl);
vint16mf2_t __riscv_vnot_v_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs, size_t vl);
vint16m1_t __riscv_vnot_v_i16m1_tumu(vbool16_t vm, vint16m1_t vd, vint16m1_t vs,
                                     size_t vl);
vint16m2_t __riscv_vnot_v_i16m2_tumu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs,
                                     size_t vl);
vint16m4_t __riscv_vnot_v_i16m4_tumu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs,
                                     size_t vl);
vint16m8_t __riscv_vnot_v_i16m8_tumu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs,
                                     size_t vl);
vint32mf2_t __riscv_vnot_v_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs, size_t vl);
vint32m1_t __riscv_vnot_v_i32m1_tumu(vbool32_t vm, vint32m1_t vd, vint32m1_t vs,
                                     size_t vl);
vint32m2_t __riscv_vnot_v_i32m2_tumu(vbool16_t vm, vint32m2_t vd, vint32m2_t vs,
                                     size_t vl);
vint32m4_t __riscv_vnot_v_i32m4_tumu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs,
                                     size_t vl);
vint32m8_t __riscv_vnot_v_i32m8_tumu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs,
                                     size_t vl);
vint64m1_t __riscv_vnot_v_i64m1_tumu(vbool64_t vm, vint64m1_t vd, vint64m1_t vs,
                                     size_t vl);
vint64m2_t __riscv_vnot_v_i64m2_tumu(vbool32_t vm, vint64m2_t vd, vint64m2_t vs,
                                     size_t vl);
vint64m4_t __riscv_vnot_v_i64m4_tumu(vbool16_t vm, vint64m4_t vd, vint64m4_t vs,
                                     size_t vl);
vint64m8_t __riscv_vnot_v_i64m8_tumu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs,
                                     size_t vl);
vuint8mf8_t __riscv_vnot_v_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                      vuint8mf8_t vs, size_t vl);
vuint8mf4_t __riscv_vnot_v_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                      vuint8mf4_t vs, size_t vl);
vuint8mf2_t __riscv_vnot_v_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                      vuint8mf2_t vs, size_t vl);
vuint8m1_t __riscv_vnot_v_u8m1_tumu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs,
                                    size_t vl);
vuint8m2_t __riscv_vnot_v_u8m2_tumu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs,
                                    size_t vl);
vuint8m4_t __riscv_vnot_v_u8m4_tumu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs,
                                    size_t vl);
vuint8m8_t __riscv_vnot_v_u8m8_tumu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs,
                                    size_t vl);
vuint16mf4_t __riscv_vnot_v_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                        vuint16mf4_t vs, size_t vl);
vuint16mf2_t __riscv_vnot_v_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                        vuint16mf2_t vs, size_t vl);
vuint16m1_t __riscv_vnot_v_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                      vuint16m1_t vs, size_t vl);
vuint16m2_t __riscv_vnot_v_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                      vuint16m2_t vs, size_t vl);
vuint16m4_t __riscv_vnot_v_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                      vuint16m4_t vs, size_t vl);
vuint16m8_t __riscv_vnot_v_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                      vuint16m8_t vs, size_t vl);
vuint32mf2_t __riscv_vnot_v_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                        vuint32mf2_t vs, size_t vl);
vuint32m1_t __riscv_vnot_v_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                      vuint32m1_t vs, size_t vl);
vuint32m2_t __riscv_vnot_v_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                      vuint32m2_t vs, size_t vl);
vuint32m4_t __riscv_vnot_v_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                      vuint32m4_t vs, size_t vl);
vuint32m8_t __riscv_vnot_v_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                      vuint32m8_t vs, size_t vl);
vuint64m1_t __riscv_vnot_v_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                      vuint64m1_t vs, size_t vl);
vuint64m2_t __riscv_vnot_v_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                      vuint64m2_t vs, size_t vl);
vuint64m4_t __riscv_vnot_v_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                      vuint64m4_t vs, size_t vl);
vuint64m8_t __riscv_vnot_v_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                      vuint64m8_t vs, size_t vl);
// masked functions
vint8mf8_t __riscv_vnot_v_i8mf8_mu(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs,
                                   size_t vl);
vint8mf4_t __riscv_vnot_v_i8mf4_mu(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs,
                                   size_t vl);
vint8mf2_t __riscv_vnot_v_i8mf2_mu(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs,
                                   size_t vl);
vint8m1_t __riscv_vnot_v_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs,
                                 size_t vl);
vint8m2_t __riscv_vnot_v_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs,
                                 size_t vl);
vint8m4_t __riscv_vnot_v_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs,
                                 size_t vl);
vint8m8_t __riscv_vnot_v_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs,
                                 size_t vl);
vint16mf4_t __riscv_vnot_v_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                     vint16mf4_t vs, size_t vl);
vint16mf2_t __riscv_vnot_v_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                     vint16mf2_t vs, size_t vl);
vint16m1_t __riscv_vnot_v_i16m1_mu(vbool16_t vm, vint16m1_t vd, vint16m1_t vs,
                                   size_t vl);
vint16m2_t __riscv_vnot_v_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs,
                                   size_t vl);
vint16m4_t __riscv_vnot_v_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs,
                                   size_t vl);
vint16m8_t __riscv_vnot_v_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs,
                                   size_t vl);
vint32mf2_t __riscv_vnot_v_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                     vint32mf2_t vs, size_t vl);
vint32m1_t __riscv_vnot_v_i32m1_mu(vbool32_t vm, vint32m1_t vd, vint32m1_t vs,
                                   size_t vl);
vint32m2_t __riscv_vnot_v_i32m2_mu(vbool16_t vm, vint32m2_t vd, vint32m2_t vs,
                                   size_t vl);
vint32m4_t __riscv_vnot_v_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs,
                                   size_t vl);
vint32m8_t __riscv_vnot_v_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs,
                                   size_t vl);
vint64m1_t __riscv_vnot_v_i64m1_mu(vbool64_t vm, vint64m1_t vd, vint64m1_t vs,
                                   size_t vl);
vint64m2_t __riscv_vnot_v_i64m2_mu(vbool32_t vm, vint64m2_t vd, vint64m2_t vs,
                                   size_t vl);
vint64m4_t __riscv_vnot_v_i64m4_mu(vbool16_t vm, vint64m4_t vd, vint64m4_t vs,
                                   size_t vl);
vint64m8_t __riscv_vnot_v_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs,
                                   size_t vl);
vuint8mf8_t __riscv_vnot_v_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                    vuint8mf8_t vs, size_t vl);
vuint8mf4_t __riscv_vnot_v_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                    vuint8mf4_t vs, size_t vl);
vuint8mf2_t __riscv_vnot_v_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                    vuint8mf2_t vs, size_t vl);
vuint8m1_t __riscv_vnot_v_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs,
                                  size_t vl);
vuint8m2_t __riscv_vnot_v_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs,
                                  size_t vl);
vuint8m4_t __riscv_vnot_v_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs,
                                  size_t vl);
vuint8m8_t __riscv_vnot_v_u8m8_mu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs,
                                  size_t vl);
vuint16mf4_t __riscv_vnot_v_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                      vuint16mf4_t vs, size_t vl);
vuint16mf2_t __riscv_vnot_v_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                      vuint16mf2_t vs, size_t vl);
vuint16m1_t __riscv_vnot_v_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                    vuint16m1_t vs, size_t vl);
vuint16m2_t __riscv_vnot_v_u16m2_mu(vbool8_t vm, vuint16m2_t vd, vuint16m2_t vs,
                                    size_t vl);
vuint16m4_t __riscv_vnot_v_u16m4_mu(vbool4_t vm, vuint16m4_t vd, vuint16m4_t vs,
                                    size_t vl);
vuint16m8_t __riscv_vnot_v_u16m8_mu(vbool2_t vm, vuint16m8_t vd, vuint16m8_t vs,
                                    size_t vl);
vuint32mf2_t __riscv_vnot_v_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                      vuint32mf2_t vs, size_t vl);
vuint32m1_t __riscv_vnot_v_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                    vuint32m1_t vs, size_t vl);
vuint32m2_t __riscv_vnot_v_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                    vuint32m2_t vs, size_t vl);
vuint32m4_t __riscv_vnot_v_u32m4_mu(vbool8_t vm, vuint32m4_t vd, vuint32m4_t vs,
                                    size_t vl);
vuint32m8_t __riscv_vnot_v_u32m8_mu(vbool4_t vm, vuint32m8_t vd, vuint32m8_t vs,
                                    size_t vl);
vuint64m1_t __riscv_vnot_v_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                    vuint64m1_t vs, size_t vl);
vuint64m2_t __riscv_vnot_v_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                    vuint64m2_t vs, size_t vl);
vuint64m4_t __riscv_vnot_v_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                    vuint64m4_t vs, size_t vl);
vuint64m8_t __riscv_vnot_v_u64m8_mu(vbool8_t vm, vuint64m8_t vd, vuint64m8_t vs,
                                    size_t vl);
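
vnot computes the bitwise complement of each element (it behaves like vxor with an all-ones scalar). Below is a minimal sketch using the mask-undisturbed form, assuming __riscv_vsetvl_e32m1, __riscv_vle32_v_u32m1, __riscv_vse32_v_u32m1, and __riscv_vmseq_vx_u32m1_b32 from other sections of this API: flip the bits of elements equal to a sentinel value and leave all other elements untouched.

#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

// Bitwise-invert every element of buf that equals sentinel; other elements
// are preserved because the _mu policy keeps inactive lanes equal to vd.
void invert_sentinels(uint32_t *buf, size_t n, uint32_t sentinel) {
  while (n > 0) {
    size_t vl = __riscv_vsetvl_e32m1(n);
    vuint32m1_t v = __riscv_vle32_v_u32m1(buf, vl);
    // Active lanes: elements equal to the sentinel.
    vbool32_t m = __riscv_vmseq_vx_u32m1_b32(v, sentinel, vl);
    // vd = v, so inactive lanes pass through; active lanes become ~v.
    vuint32m1_t r = __riscv_vnot_v_u32m1_mu(m, v, v, vl);
    __riscv_vse32_v_u32m1(buf, r, vl);
    buf += vl;
    n -= vl;
  }
}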

Vector Single-Width Bit Shift Intrinsics

vint8mf8_t __riscv_vsll_vv_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2,
                                    vuint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vsll_vx_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2, size_t rs1,
                                    size_t vl);
vint8mf4_t __riscv_vsll_vv_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2,
                                    vuint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vsll_vx_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2, size_t rs1,
                                    size_t vl);
vint8mf2_t __riscv_vsll_vv_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2,
                                    vuint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vsll_vx_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2, size_t rs1,
                                    size_t vl);
vint8m1_t __riscv_vsll_vv_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, vuint8m1_t vs1,
                                  size_t vl);
vint8m1_t __riscv_vsll_vx_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, size_t rs1,
                                  size_t vl);
vint8m2_t __riscv_vsll_vv_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, vuint8m2_t vs1,
                                  size_t vl);
vint8m2_t __riscv_vsll_vx_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, size_t rs1,
                                  size_t vl);
vint8m4_t __riscv_vsll_vv_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, vuint8m4_t vs1,
                                  size_t vl);
vint8m4_t __riscv_vsll_vx_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, size_t rs1,
                                  size_t vl);
vint8m8_t __riscv_vsll_vv_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, vuint8m8_t vs1,
                                  size_t vl);
vint8m8_t __riscv_vsll_vx_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, size_t rs1,
                                  size_t vl);
vint16mf4_t __riscv_vsll_vv_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                      vuint16mf4_t vs1, size_t vl);
vint16mf4_t __riscv_vsll_vx_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                      size_t rs1, size_t vl);
vint16mf2_t __riscv_vsll_vv_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                      vuint16mf2_t vs1, size_t vl);
vint16mf2_t __riscv_vsll_vx_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                      size_t rs1, size_t vl);
vint16m1_t __riscv_vsll_vv_i16m1_tu(vint16m1_t vd, vint16m1_t vs2,
                                    vuint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vsll_vx_i16m1_tu(vint16m1_t vd, vint16m1_t vs2, size_t rs1,
                                    size_t vl);
vint16m2_t __riscv_vsll_vv_i16m2_tu(vint16m2_t vd, vint16m2_t vs2,
                                    vuint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vsll_vx_i16m2_tu(vint16m2_t vd, vint16m2_t vs2, size_t rs1,
                                    size_t vl);
vint16m4_t __riscv_vsll_vv_i16m4_tu(vint16m4_t vd, vint16m4_t vs2,
                                    vuint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vsll_vx_i16m4_tu(vint16m4_t vd, vint16m4_t vs2, size_t rs1,
                                    size_t vl);
vint16m8_t __riscv_vsll_vv_i16m8_tu(vint16m8_t vd, vint16m8_t vs2,
                                    vuint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vsll_vx_i16m8_tu(vint16m8_t vd, vint16m8_t vs2, size_t rs1,
                                    size_t vl);
vint32mf2_t __riscv_vsll_vv_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                      vuint32mf2_t vs1, size_t vl);
vint32mf2_t __riscv_vsll_vx_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                      size_t rs1, size_t vl);
vint32m1_t __riscv_vsll_vv_i32m1_tu(vint32m1_t vd, vint32m1_t vs2,
                                    vuint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vsll_vx_i32m1_tu(vint32m1_t vd, vint32m1_t vs2, size_t rs1,
                                    size_t vl);
vint32m2_t __riscv_vsll_vv_i32m2_tu(vint32m2_t vd, vint32m2_t vs2,
                                    vuint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vsll_vx_i32m2_tu(vint32m2_t vd, vint32m2_t vs2, size_t rs1,
                                    size_t vl);
vint32m4_t __riscv_vsll_vv_i32m4_tu(vint32m4_t vd, vint32m4_t vs2,
                                    vuint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vsll_vx_i32m4_tu(vint32m4_t vd, vint32m4_t vs2, size_t rs1,
                                    size_t vl);
vint32m8_t __riscv_vsll_vv_i32m8_tu(vint32m8_t vd, vint32m8_t vs2,
                                    vuint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vsll_vx_i32m8_tu(vint32m8_t vd, vint32m8_t vs2, size_t rs1,
                                    size_t vl);
vint64m1_t __riscv_vsll_vv_i64m1_tu(vint64m1_t vd, vint64m1_t vs2,
                                    vuint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vsll_vx_i64m1_tu(vint64m1_t vd, vint64m1_t vs2, size_t rs1,
                                    size_t vl);
vint64m2_t __riscv_vsll_vv_i64m2_tu(vint64m2_t vd, vint64m2_t vs2,
                                    vuint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vsll_vx_i64m2_tu(vint64m2_t vd, vint64m2_t vs2, size_t rs1,
                                    size_t vl);
vint64m4_t __riscv_vsll_vv_i64m4_tu(vint64m4_t vd, vint64m4_t vs2,
                                    vuint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vsll_vx_i64m4_tu(vint64m4_t vd, vint64m4_t vs2, size_t rs1,
                                    size_t vl);
vint64m8_t __riscv_vsll_vv_i64m8_tu(vint64m8_t vd, vint64m8_t vs2,
                                    vuint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vsll_vx_i64m8_tu(vint64m8_t vd, vint64m8_t vs2, size_t rs1,
                                    size_t vl);
vint8mf8_t __riscv_vsra_vv_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2,
                                    vuint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vsra_vx_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2, size_t rs1,
                                    size_t vl);
vint8mf4_t __riscv_vsra_vv_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2,
                                    vuint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vsra_vx_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2, size_t rs1,
                                    size_t vl);
vint8mf2_t __riscv_vsra_vv_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2,
                                    vuint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vsra_vx_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2, size_t rs1,
                                    size_t vl);
vint8m1_t __riscv_vsra_vv_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, vuint8m1_t vs1,
                                  size_t vl);
vint8m1_t __riscv_vsra_vx_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, size_t rs1,
                                  size_t vl);
vint8m2_t __riscv_vsra_vv_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, vuint8m2_t vs1,
                                  size_t vl);
vint8m2_t __riscv_vsra_vx_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, size_t rs1,
                                  size_t vl);
vint8m4_t __riscv_vsra_vv_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, vuint8m4_t vs1,
                                  size_t vl);
vint8m4_t __riscv_vsra_vx_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, size_t rs1,
                                  size_t vl);
vint8m8_t __riscv_vsra_vv_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, vuint8m8_t vs1,
                                  size_t vl);
vint8m8_t __riscv_vsra_vx_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, size_t rs1,
                                  size_t vl);
vint16mf4_t __riscv_vsra_vv_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                      vuint16mf4_t vs1, size_t vl);
vint16mf4_t __riscv_vsra_vx_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                      size_t rs1, size_t vl);
vint16mf2_t __riscv_vsra_vv_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                      vuint16mf2_t vs1, size_t vl);
vint16mf2_t __riscv_vsra_vx_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                      size_t rs1, size_t vl);
vint16m1_t __riscv_vsra_vv_i16m1_tu(vint16m1_t vd, vint16m1_t vs2,
                                    vuint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vsra_vx_i16m1_tu(vint16m1_t vd, vint16m1_t vs2, size_t rs1,
                                    size_t vl);
vint16m2_t __riscv_vsra_vv_i16m2_tu(vint16m2_t vd, vint16m2_t vs2,
                                    vuint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vsra_vx_i16m2_tu(vint16m2_t vd, vint16m2_t vs2, size_t rs1,
                                    size_t vl);
vint16m4_t __riscv_vsra_vv_i16m4_tu(vint16m4_t vd, vint16m4_t vs2,
                                    vuint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vsra_vx_i16m4_tu(vint16m4_t vd, vint16m4_t vs2, size_t rs1,
                                    size_t vl);
vint16m8_t __riscv_vsra_vv_i16m8_tu(vint16m8_t vd, vint16m8_t vs2,
                                    vuint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vsra_vx_i16m8_tu(vint16m8_t vd, vint16m8_t vs2, size_t rs1,
                                    size_t vl);
vint32mf2_t __riscv_vsra_vv_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                      vuint32mf2_t vs1, size_t vl);
vint32mf2_t __riscv_vsra_vx_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                      size_t rs1, size_t vl);
vint32m1_t __riscv_vsra_vv_i32m1_tu(vint32m1_t vd, vint32m1_t vs2,
                                    vuint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vsra_vx_i32m1_tu(vint32m1_t vd, vint32m1_t vs2, size_t rs1,
                                    size_t vl);
vint32m2_t __riscv_vsra_vv_i32m2_tu(vint32m2_t vd, vint32m2_t vs2,
                                    vuint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vsra_vx_i32m2_tu(vint32m2_t vd, vint32m2_t vs2, size_t rs1,
                                    size_t vl);
vint32m4_t __riscv_vsra_vv_i32m4_tu(vint32m4_t vd, vint32m4_t vs2,
                                    vuint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vsra_vx_i32m4_tu(vint32m4_t vd, vint32m4_t vs2, size_t rs1,
                                    size_t vl);
vint32m8_t __riscv_vsra_vv_i32m8_tu(vint32m8_t vd, vint32m8_t vs2,
                                    vuint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vsra_vx_i32m8_tu(vint32m8_t vd, vint32m8_t vs2, size_t rs1,
                                    size_t vl);
vint64m1_t __riscv_vsra_vv_i64m1_tu(vint64m1_t vd, vint64m1_t vs2,
                                    vuint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vsra_vx_i64m1_tu(vint64m1_t vd, vint64m1_t vs2, size_t rs1,
                                    size_t vl);
vint64m2_t __riscv_vsra_vv_i64m2_tu(vint64m2_t vd, vint64m2_t vs2,
                                    vuint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vsra_vx_i64m2_tu(vint64m2_t vd, vint64m2_t vs2, size_t rs1,
                                    size_t vl);
vint64m4_t __riscv_vsra_vv_i64m4_tu(vint64m4_t vd, vint64m4_t vs2,
                                    vuint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vsra_vx_i64m4_tu(vint64m4_t vd, vint64m4_t vs2, size_t rs1,
                                    size_t vl);
vint64m8_t __riscv_vsra_vv_i64m8_tu(vint64m8_t vd, vint64m8_t vs2,
                                    vuint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vsra_vx_i64m8_tu(vint64m8_t vd, vint64m8_t vs2, size_t rs1,
                                    size_t vl);
vuint8mf8_t __riscv_vsll_vv_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                     vuint8mf8_t vs1, size_t vl);
vuint8mf8_t __riscv_vsll_vx_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                     size_t rs1, size_t vl);
vuint8mf4_t __riscv_vsll_vv_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                     vuint8mf4_t vs1, size_t vl);
vuint8mf4_t __riscv_vsll_vx_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                     size_t rs1, size_t vl);
vuint8mf2_t __riscv_vsll_vv_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                     vuint8mf2_t vs1, size_t vl);
vuint8mf2_t __riscv_vsll_vx_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                     size_t rs1, size_t vl);
vuint8m1_t __riscv_vsll_vv_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2,
                                   vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vsll_vx_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2, size_t rs1,
                                   size_t vl);
vuint8m2_t __riscv_vsll_vv_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2,
                                   vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vsll_vx_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2, size_t rs1,
                                   size_t vl);
vuint8m4_t __riscv_vsll_vv_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2,
                                   vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vsll_vx_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2, size_t rs1,
                                   size_t vl);
vuint8m8_t __riscv_vsll_vv_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2,
                                   vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vsll_vx_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2, size_t rs1,
                                   size_t vl);
vuint16mf4_t __riscv_vsll_vv_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                       vuint16mf4_t vs1, size_t vl);
vuint16mf4_t __riscv_vsll_vx_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                       size_t rs1, size_t vl);
vuint16mf2_t __riscv_vsll_vv_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                       vuint16mf2_t vs1, size_t vl);
vuint16mf2_t __riscv_vsll_vx_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                       size_t rs1, size_t vl);
vuint16m1_t __riscv_vsll_vv_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                     vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vsll_vx_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                     size_t rs1, size_t vl);
vuint16m2_t __riscv_vsll_vv_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                     vuint16m2_t vs1, size_t vl);
vuint16m2_t __riscv_vsll_vx_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                     size_t rs1, size_t vl);
vuint16m4_t __riscv_vsll_vv_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                     vuint16m4_t vs1, size_t vl);
vuint16m4_t __riscv_vsll_vx_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                     size_t rs1, size_t vl);
vuint16m8_t __riscv_vsll_vv_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                     vuint16m8_t vs1, size_t vl);
vuint16m8_t __riscv_vsll_vx_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                     size_t rs1, size_t vl);
vuint32mf2_t __riscv_vsll_vv_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                       vuint32mf2_t vs1, size_t vl);
vuint32mf2_t __riscv_vsll_vx_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                       size_t rs1, size_t vl);
vuint32m1_t __riscv_vsll_vv_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                     vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vsll_vx_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                     size_t rs1, size_t vl);
vuint32m2_t __riscv_vsll_vv_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                     vuint32m2_t vs1, size_t vl);
vuint32m2_t __riscv_vsll_vx_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                     size_t rs1, size_t vl);
vuint32m4_t __riscv_vsll_vv_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                     vuint32m4_t vs1, size_t vl);
vuint32m4_t __riscv_vsll_vx_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                     size_t rs1, size_t vl);
vuint32m8_t __riscv_vsll_vv_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                     vuint32m8_t vs1, size_t vl);
vuint32m8_t __riscv_vsll_vx_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                     size_t rs1, size_t vl);
vuint64m1_t __riscv_vsll_vv_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                     vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vsll_vx_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                     size_t rs1, size_t vl);
vuint64m2_t __riscv_vsll_vv_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                     vuint64m2_t vs1, size_t vl);
vuint64m2_t __riscv_vsll_vx_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                     size_t rs1, size_t vl);
vuint64m4_t __riscv_vsll_vv_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                     vuint64m4_t vs1, size_t vl);
vuint64m4_t __riscv_vsll_vx_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                     size_t rs1, size_t vl);
vuint64m8_t __riscv_vsll_vv_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                     vuint64m8_t vs1, size_t vl);
vuint64m8_t __riscv_vsll_vx_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                     size_t rs1, size_t vl);
vuint8mf8_t __riscv_vsrl_vv_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                     vuint8mf8_t vs1, size_t vl);
vuint8mf8_t __riscv_vsrl_vx_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                     size_t rs1, size_t vl);
vuint8mf4_t __riscv_vsrl_vv_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                     vuint8mf4_t vs1, size_t vl);
vuint8mf4_t __riscv_vsrl_vx_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                     size_t rs1, size_t vl);
vuint8mf2_t __riscv_vsrl_vv_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                     vuint8mf2_t vs1, size_t vl);
vuint8mf2_t __riscv_vsrl_vx_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                     size_t rs1, size_t vl);
vuint8m1_t __riscv_vsrl_vv_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2,
                                   vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vsrl_vx_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2, size_t rs1,
                                   size_t vl);
vuint8m2_t __riscv_vsrl_vv_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2,
                                   vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vsrl_vx_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2, size_t rs1,
                                   size_t vl);
vuint8m4_t __riscv_vsrl_vv_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2,
                                   vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vsrl_vx_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2, size_t rs1,
                                   size_t vl);
vuint8m8_t __riscv_vsrl_vv_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2,
                                   vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vsrl_vx_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2, size_t rs1,
                                   size_t vl);
vuint16mf4_t __riscv_vsrl_vv_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                       vuint16mf4_t vs1, size_t vl);
vuint16mf4_t __riscv_vsrl_vx_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                       size_t rs1, size_t vl);
vuint16mf2_t __riscv_vsrl_vv_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                       vuint16mf2_t vs1, size_t vl);
vuint16mf2_t __riscv_vsrl_vx_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                       size_t rs1, size_t vl);
vuint16m1_t __riscv_vsrl_vv_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                     vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vsrl_vx_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                     size_t rs1, size_t vl);
vuint16m2_t __riscv_vsrl_vv_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                     vuint16m2_t vs1, size_t vl);
vuint16m2_t __riscv_vsrl_vx_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                     size_t rs1, size_t vl);
vuint16m4_t __riscv_vsrl_vv_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                     vuint16m4_t vs1, size_t vl);
vuint16m4_t __riscv_vsrl_vx_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                     size_t rs1, size_t vl);
vuint16m8_t __riscv_vsrl_vv_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                     vuint16m8_t vs1, size_t vl);
vuint16m8_t __riscv_vsrl_vx_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                     size_t rs1, size_t vl);
vuint32mf2_t __riscv_vsrl_vv_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                       vuint32mf2_t vs1, size_t vl);
vuint32mf2_t __riscv_vsrl_vx_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                       size_t rs1, size_t vl);
vuint32m1_t __riscv_vsrl_vv_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                     vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vsrl_vx_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                     size_t rs1, size_t vl);
vuint32m2_t __riscv_vsrl_vv_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                     vuint32m2_t vs1, size_t vl);
vuint32m2_t __riscv_vsrl_vx_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                     size_t rs1, size_t vl);
vuint32m4_t __riscv_vsrl_vv_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                     vuint32m4_t vs1, size_t vl);
vuint32m4_t __riscv_vsrl_vx_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                     size_t rs1, size_t vl);
vuint32m8_t __riscv_vsrl_vv_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                     vuint32m8_t vs1, size_t vl);
vuint32m8_t __riscv_vsrl_vx_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                     size_t rs1, size_t vl);
vuint64m1_t __riscv_vsrl_vv_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                     vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vsrl_vx_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                     size_t rs1, size_t vl);
vuint64m2_t __riscv_vsrl_vv_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                     vuint64m2_t vs1, size_t vl);
vuint64m2_t __riscv_vsrl_vx_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                     size_t rs1, size_t vl);
vuint64m4_t __riscv_vsrl_vv_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                     vuint64m4_t vs1, size_t vl);
vuint64m4_t __riscv_vsrl_vx_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                     size_t rs1, size_t vl);
vuint64m8_t __riscv_vsrl_vv_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                     vuint64m8_t vs1, size_t vl);
vuint64m8_t __riscv_vsrl_vx_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                     size_t rs1, size_t vl);
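
For context, a minimal sketch of how the unmasked tail-undisturbed (_tu) shift intrinsics listed above might be used. The helper names here are illustrative assumptions and not part of the API; only the __riscv_* calls come from the listing.

#include <riscv_vector.h>

// Illustrative helper (assumed name): arithmetic shift right by 3 on signed
// 32-bit elements. Active elements (index < vl) receive vs2 >> 3; tail
// elements (index >= vl) are copied unchanged from the destination operand vd.
static inline vint32m1_t sra3_i32m1_tu(vint32m1_t vd, vint32m1_t vs2, size_t vl) {
  return __riscv_vsra_vx_i32m1_tu(vd, vs2, 3, vl);
}

// Illustrative helper (assumed name): per-element logical shift left, with the
// shift amounts taken from the unsigned vector vs1 (vsll.vv form), again with
// tail elements preserved from vd.
static inline vuint32m1_t sll_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                       vuint32m1_t vs1, size_t vl) {
  return __riscv_vsll_vv_u32m1_tu(vd, vs2, vs1, vl);
}
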
// masked functions (tail undisturbed, mask agnostic: _tum suffix)
vint8mf8_t __riscv_vsll_vv_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                     vint8mf8_t vs2, vuint8mf8_t vs1,
                                     size_t vl);
vint8mf8_t __riscv_vsll_vx_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                     vint8mf8_t vs2, size_t rs1, size_t vl);
vint8mf4_t __riscv_vsll_vv_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                     vint8mf4_t vs2, vuint8mf4_t vs1,
                                     size_t vl);
vint8mf4_t __riscv_vsll_vx_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                     vint8mf4_t vs2, size_t rs1, size_t vl);
vint8mf2_t __riscv_vsll_vv_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                     vint8mf2_t vs2, vuint8mf2_t vs1,
                                     size_t vl);
vint8mf2_t __riscv_vsll_vx_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                     vint8mf2_t vs2, size_t rs1, size_t vl);
vint8m1_t __riscv_vsll_vv_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                   vuint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vsll_vx_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                   size_t rs1, size_t vl);
vint8m2_t __riscv_vsll_vv_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                   vuint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vsll_vx_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                   size_t rs1, size_t vl);
vint8m4_t __riscv_vsll_vv_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                   vuint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vsll_vx_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                   size_t rs1, size_t vl);
vint8m8_t __riscv_vsll_vv_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                   vuint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vsll_vx_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                   size_t rs1, size_t vl);
vint16mf4_t __riscv_vsll_vv_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs2, vuint16mf4_t vs1,
                                       size_t vl);
vint16mf4_t __riscv_vsll_vx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs2, size_t rs1, size_t vl);
vint16mf2_t __riscv_vsll_vv_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs2, vuint16mf2_t vs1,
                                       size_t vl);
vint16mf2_t __riscv_vsll_vx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs2, size_t rs1, size_t vl);
vint16m1_t __riscv_vsll_vv_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs2, vuint16m1_t vs1,
                                     size_t vl);
vint16m1_t __riscv_vsll_vx_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs2, size_t rs1, size_t vl);
vint16m2_t __riscv_vsll_vv_i16m2_tum(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                     vuint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vsll_vx_i16m2_tum(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                     size_t rs1, size_t vl);
vint16m4_t __riscv_vsll_vv_i16m4_tum(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                     vuint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vsll_vx_i16m4_tum(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                     size_t rs1, size_t vl);
vint16m8_t __riscv_vsll_vv_i16m8_tum(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                     vuint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vsll_vx_i16m8_tum(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                     size_t rs1, size_t vl);
vint32mf2_t __riscv_vsll_vv_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs2, vuint32mf2_t vs1,
                                       size_t vl);
vint32mf2_t __riscv_vsll_vx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs2, size_t rs1, size_t vl);
vint32m1_t __riscv_vsll_vv_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs2, vuint32m1_t vs1,
                                     size_t vl);
vint32m1_t __riscv_vsll_vx_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs2, size_t rs1, size_t vl);
vint32m2_t __riscv_vsll_vv_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs2, vuint32m2_t vs1,
                                     size_t vl);
vint32m2_t __riscv_vsll_vx_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs2, size_t rs1, size_t vl);
vint32m4_t __riscv_vsll_vv_i32m4_tum(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                     vuint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vsll_vx_i32m4_tum(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                     size_t rs1, size_t vl);
vint32m8_t __riscv_vsll_vv_i32m8_tum(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                     vuint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vsll_vx_i32m8_tum(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                     size_t rs1, size_t vl);
vint64m1_t __riscv_vsll_vv_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs2, vuint64m1_t vs1,
                                     size_t vl);
vint64m1_t __riscv_vsll_vx_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs2, size_t rs1, size_t vl);
vint64m2_t __riscv_vsll_vv_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs2, vuint64m2_t vs1,
                                     size_t vl);
vint64m2_t __riscv_vsll_vx_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs2, size_t rs1, size_t vl);
vint64m4_t __riscv_vsll_vv_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs2, vuint64m4_t vs1,
                                     size_t vl);
vint64m4_t __riscv_vsll_vx_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs2, size_t rs1, size_t vl);
vint64m8_t __riscv_vsll_vv_i64m8_tum(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                     vuint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vsll_vx_i64m8_tum(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                     size_t rs1, size_t vl);
vint8mf8_t __riscv_vsra_vv_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                     vint8mf8_t vs2, vuint8mf8_t vs1,
                                     size_t vl);
vint8mf8_t __riscv_vsra_vx_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                     vint8mf8_t vs2, size_t rs1, size_t vl);
vint8mf4_t __riscv_vsra_vv_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                     vint8mf4_t vs2, vuint8mf4_t vs1,
                                     size_t vl);
vint8mf4_t __riscv_vsra_vx_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                     vint8mf4_t vs2, size_t rs1, size_t vl);
vint8mf2_t __riscv_vsra_vv_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                     vint8mf2_t vs2, vuint8mf2_t vs1,
                                     size_t vl);
vint8mf2_t __riscv_vsra_vx_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                     vint8mf2_t vs2, size_t rs1, size_t vl);
vint8m1_t __riscv_vsra_vv_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                   vuint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vsra_vx_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                   size_t rs1, size_t vl);
vint8m2_t __riscv_vsra_vv_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                   vuint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vsra_vx_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                   size_t rs1, size_t vl);
vint8m4_t __riscv_vsra_vv_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                   vuint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vsra_vx_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                   size_t rs1, size_t vl);
vint8m8_t __riscv_vsra_vv_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                   vuint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vsra_vx_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                   size_t rs1, size_t vl);
vint16mf4_t __riscv_vsra_vv_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs2, vuint16mf4_t vs1,
                                       size_t vl);
vint16mf4_t __riscv_vsra_vx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs2, size_t rs1, size_t vl);
vint16mf2_t __riscv_vsra_vv_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs2, vuint16mf2_t vs1,
                                       size_t vl);
vint16mf2_t __riscv_vsra_vx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs2, size_t rs1, size_t vl);
vint16m1_t __riscv_vsra_vv_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs2, vuint16m1_t vs1,
                                     size_t vl);
vint16m1_t __riscv_vsra_vx_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs2, size_t rs1, size_t vl);
vint16m2_t __riscv_vsra_vv_i16m2_tum(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                     vuint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vsra_vx_i16m2_tum(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                     size_t rs1, size_t vl);
vint16m4_t __riscv_vsra_vv_i16m4_tum(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                     vuint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vsra_vx_i16m4_tum(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                     size_t rs1, size_t vl);
vint16m8_t __riscv_vsra_vv_i16m8_tum(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                     vuint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vsra_vx_i16m8_tum(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                     size_t rs1, size_t vl);
vint32mf2_t __riscv_vsra_vv_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs2, vuint32mf2_t vs1,
                                       size_t vl);
vint32mf2_t __riscv_vsra_vx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs2, size_t rs1, size_t vl);
vint32m1_t __riscv_vsra_vv_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs2, vuint32m1_t vs1,
                                     size_t vl);
vint32m1_t __riscv_vsra_vx_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs2, size_t rs1, size_t vl);
vint32m2_t __riscv_vsra_vv_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs2, vuint32m2_t vs1,
                                     size_t vl);
vint32m2_t __riscv_vsra_vx_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs2, size_t rs1, size_t vl);
vint32m4_t __riscv_vsra_vv_i32m4_tum(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                     vuint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vsra_vx_i32m4_tum(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                     size_t rs1, size_t vl);
vint32m8_t __riscv_vsra_vv_i32m8_tum(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                     vuint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vsra_vx_i32m8_tum(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                     size_t rs1, size_t vl);
vint64m1_t __riscv_vsra_vv_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs2, vuint64m1_t vs1,
                                     size_t vl);
vint64m1_t __riscv_vsra_vx_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs2, size_t rs1, size_t vl);
vint64m2_t __riscv_vsra_vv_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs2, vuint64m2_t vs1,
                                     size_t vl);
vint64m2_t __riscv_vsra_vx_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs2, size_t rs1, size_t vl);
vint64m4_t __riscv_vsra_vv_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs2, vuint64m4_t vs1,
                                     size_t vl);
vint64m4_t __riscv_vsra_vx_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs2, size_t rs1, size_t vl);
vint64m8_t __riscv_vsra_vv_i64m8_tum(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                     vuint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vsra_vx_i64m8_tum(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                     size_t rs1, size_t vl);
vuint8mf8_t __riscv_vsll_vv_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                      vuint8mf8_t vs2, vuint8mf8_t vs1,
                                      size_t vl);
vuint8mf8_t __riscv_vsll_vx_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                      vuint8mf8_t vs2, size_t rs1, size_t vl);
vuint8mf4_t __riscv_vsll_vv_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                      vuint8mf4_t vs2, vuint8mf4_t vs1,
                                      size_t vl);
vuint8mf4_t __riscv_vsll_vx_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                      vuint8mf4_t vs2, size_t rs1, size_t vl);
vuint8mf2_t __riscv_vsll_vv_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                      vuint8mf2_t vs2, vuint8mf2_t vs1,
                                      size_t vl);
vuint8mf2_t __riscv_vsll_vx_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                      vuint8mf2_t vs2, size_t rs1, size_t vl);
vuint8m1_t __riscv_vsll_vv_u8m1_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                    vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vsll_vx_u8m1_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                    size_t rs1, size_t vl);
vuint8m2_t __riscv_vsll_vv_u8m2_tum(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                    vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vsll_vx_u8m2_tum(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                    size_t rs1, size_t vl);
vuint8m4_t __riscv_vsll_vv_u8m4_tum(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                    vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vsll_vx_u8m4_tum(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                    size_t rs1, size_t vl);
vuint8m8_t __riscv_vsll_vv_u8m8_tum(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                    vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vsll_vx_u8m8_tum(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                    size_t rs1, size_t vl);
vuint16mf4_t __riscv_vsll_vv_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                        vuint16mf4_t vs2, vuint16mf4_t vs1,
                                        size_t vl);
vuint16mf4_t __riscv_vsll_vx_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                        vuint16mf4_t vs2, size_t rs1,
                                        size_t vl);
vuint16mf2_t __riscv_vsll_vv_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                        vuint16mf2_t vs2, vuint16mf2_t vs1,
                                        size_t vl);
vuint16mf2_t __riscv_vsll_vx_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                        vuint16mf2_t vs2, size_t rs1,
                                        size_t vl);
vuint16m1_t __riscv_vsll_vv_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                      vuint16m1_t vs2, vuint16m1_t vs1,
                                      size_t vl);
vuint16m1_t __riscv_vsll_vx_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                      vuint16m1_t vs2, size_t rs1, size_t vl);
vuint16m2_t __riscv_vsll_vv_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                      vuint16m2_t vs2, vuint16m2_t vs1,
                                      size_t vl);
vuint16m2_t __riscv_vsll_vx_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                      vuint16m2_t vs2, size_t rs1, size_t vl);
vuint16m4_t __riscv_vsll_vv_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                      vuint16m4_t vs2, vuint16m4_t vs1,
                                      size_t vl);
vuint16m4_t __riscv_vsll_vx_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                      vuint16m4_t vs2, size_t rs1, size_t vl);
vuint16m8_t __riscv_vsll_vv_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                      vuint16m8_t vs2, vuint16m8_t vs1,
                                      size_t vl);
vuint16m8_t __riscv_vsll_vx_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                      vuint16m8_t vs2, size_t rs1, size_t vl);
vuint32mf2_t __riscv_vsll_vv_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                        vuint32mf2_t vs2, vuint32mf2_t vs1,
                                        size_t vl);
vuint32mf2_t __riscv_vsll_vx_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                        vuint32mf2_t vs2, size_t rs1,
                                        size_t vl);
vuint32m1_t __riscv_vsll_vv_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                      vuint32m1_t vs2, vuint32m1_t vs1,
                                      size_t vl);
vuint32m1_t __riscv_vsll_vx_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                      vuint32m1_t vs2, size_t rs1, size_t vl);
vuint32m2_t __riscv_vsll_vv_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                      vuint32m2_t vs2, vuint32m2_t vs1,
                                      size_t vl);
vuint32m2_t __riscv_vsll_vx_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                      vuint32m2_t vs2, size_t rs1, size_t vl);
vuint32m4_t __riscv_vsll_vv_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                      vuint32m4_t vs2, vuint32m4_t vs1,
                                      size_t vl);
vuint32m4_t __riscv_vsll_vx_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                      vuint32m4_t vs2, size_t rs1, size_t vl);
vuint32m8_t __riscv_vsll_vv_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                      vuint32m8_t vs2, vuint32m8_t vs1,
                                      size_t vl);
vuint32m8_t __riscv_vsll_vx_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                      vuint32m8_t vs2, size_t rs1, size_t vl);
vuint64m1_t __riscv_vsll_vv_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                      vuint64m1_t vs2, vuint64m1_t vs1,
                                      size_t vl);
vuint64m1_t __riscv_vsll_vx_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                      vuint64m1_t vs2, size_t rs1, size_t vl);
vuint64m2_t __riscv_vsll_vv_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                      vuint64m2_t vs2, vuint64m2_t vs1,
                                      size_t vl);
vuint64m2_t __riscv_vsll_vx_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                      vuint64m2_t vs2, size_t rs1, size_t vl);
vuint64m4_t __riscv_vsll_vv_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                      vuint64m4_t vs2, vuint64m4_t vs1,
                                      size_t vl);
vuint64m4_t __riscv_vsll_vx_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                      vuint64m4_t vs2, size_t rs1, size_t vl);
vuint64m8_t __riscv_vsll_vv_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                      vuint64m8_t vs2, vuint64m8_t vs1,
                                      size_t vl);
vuint64m8_t __riscv_vsll_vx_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                      vuint64m8_t vs2, size_t rs1, size_t vl);
vuint8mf8_t __riscv_vsrl_vv_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                      vuint8mf8_t vs2, vuint8mf8_t vs1,
                                      size_t vl);
vuint8mf8_t __riscv_vsrl_vx_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                      vuint8mf8_t vs2, size_t rs1, size_t vl);
vuint8mf4_t __riscv_vsrl_vv_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                      vuint8mf4_t vs2, vuint8mf4_t vs1,
                                      size_t vl);
vuint8mf4_t __riscv_vsrl_vx_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                      vuint8mf4_t vs2, size_t rs1, size_t vl);
vuint8mf2_t __riscv_vsrl_vv_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                      vuint8mf2_t vs2, vuint8mf2_t vs1,
                                      size_t vl);
vuint8mf2_t __riscv_vsrl_vx_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                      vuint8mf2_t vs2, size_t rs1, size_t vl);
vuint8m1_t __riscv_vsrl_vv_u8m1_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                    vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vsrl_vx_u8m1_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                    size_t rs1, size_t vl);
vuint8m2_t __riscv_vsrl_vv_u8m2_tum(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                    vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vsrl_vx_u8m2_tum(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                    size_t rs1, size_t vl);
vuint8m4_t __riscv_vsrl_vv_u8m4_tum(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                    vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vsrl_vx_u8m4_tum(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                    size_t rs1, size_t vl);
vuint8m8_t __riscv_vsrl_vv_u8m8_tum(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                    vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vsrl_vx_u8m8_tum(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                    size_t rs1, size_t vl);
vuint16mf4_t __riscv_vsrl_vv_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                        vuint16mf4_t vs2, vuint16mf4_t vs1,
                                        size_t vl);
vuint16mf4_t __riscv_vsrl_vx_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                        vuint16mf4_t vs2, size_t rs1,
                                        size_t vl);
vuint16mf2_t __riscv_vsrl_vv_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                        vuint16mf2_t vs2, vuint16mf2_t vs1,
                                        size_t vl);
vuint16mf2_t __riscv_vsrl_vx_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                        vuint16mf2_t vs2, size_t rs1,
                                        size_t vl);
vuint16m1_t __riscv_vsrl_vv_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                      vuint16m1_t vs2, vuint16m1_t vs1,
                                      size_t vl);
vuint16m1_t __riscv_vsrl_vx_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                      vuint16m1_t vs2, size_t rs1, size_t vl);
vuint16m2_t __riscv_vsrl_vv_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                      vuint16m2_t vs2, vuint16m2_t vs1,
                                      size_t vl);
vuint16m2_t __riscv_vsrl_vx_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                      vuint16m2_t vs2, size_t rs1, size_t vl);
vuint16m4_t __riscv_vsrl_vv_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                      vuint16m4_t vs2, vuint16m4_t vs1,
                                      size_t vl);
vuint16m4_t __riscv_vsrl_vx_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                      vuint16m4_t vs2, size_t rs1, size_t vl);
vuint16m8_t __riscv_vsrl_vv_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                      vuint16m8_t vs2, vuint16m8_t vs1,
                                      size_t vl);
vuint16m8_t __riscv_vsrl_vx_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                      vuint16m8_t vs2, size_t rs1, size_t vl);
vuint32mf2_t __riscv_vsrl_vv_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                        vuint32mf2_t vs2, vuint32mf2_t vs1,
                                        size_t vl);
vuint32mf2_t __riscv_vsrl_vx_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                        vuint32mf2_t vs2, size_t rs1,
                                        size_t vl);
vuint32m1_t __riscv_vsrl_vv_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                      vuint32m1_t vs2, vuint32m1_t vs1,
                                      size_t vl);
vuint32m1_t __riscv_vsrl_vx_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                      vuint32m1_t vs2, size_t rs1, size_t vl);
vuint32m2_t __riscv_vsrl_vv_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                      vuint32m2_t vs2, vuint32m2_t vs1,
                                      size_t vl);
vuint32m2_t __riscv_vsrl_vx_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                      vuint32m2_t vs2, size_t rs1, size_t vl);
vuint32m4_t __riscv_vsrl_vv_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                      vuint32m4_t vs2, vuint32m4_t vs1,
                                      size_t vl);
vuint32m4_t __riscv_vsrl_vx_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                      vuint32m4_t vs2, size_t rs1, size_t vl);
vuint32m8_t __riscv_vsrl_vv_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                      vuint32m8_t vs2, vuint32m8_t vs1,
                                      size_t vl);
vuint32m8_t __riscv_vsrl_vx_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                      vuint32m8_t vs2, size_t rs1, size_t vl);
vuint64m1_t __riscv_vsrl_vv_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                      vuint64m1_t vs2, vuint64m1_t vs1,
                                      size_t vl);
vuint64m1_t __riscv_vsrl_vx_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                      vuint64m1_t vs2, size_t rs1, size_t vl);
vuint64m2_t __riscv_vsrl_vv_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                      vuint64m2_t vs2, vuint64m2_t vs1,
                                      size_t vl);
vuint64m2_t __riscv_vsrl_vx_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                      vuint64m2_t vs2, size_t rs1, size_t vl);
vuint64m4_t __riscv_vsrl_vv_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                      vuint64m4_t vs2, vuint64m4_t vs1,
                                      size_t vl);
vuint64m4_t __riscv_vsrl_vx_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                      vuint64m4_t vs2, size_t rs1, size_t vl);
vuint64m8_t __riscv_vsrl_vv_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                      vuint64m8_t vs2, vuint64m8_t vs1,
                                      size_t vl);
vuint64m8_t __riscv_vsrl_vx_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                      vuint64m8_t vs2, size_t rs1, size_t vl);
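
Similarly, a minimal sketch for the masked tail-undisturbed (_tum) variants above. The helper name is an illustrative assumption; the __riscv_vsrl_vx_u32m1_tum call and its signature come from the listing.

#include <riscv_vector.h>

// Illustrative helper (assumed name): logical right shift of unsigned 32-bit
// elements by `shamt`, applied only where the mask vm is set. Under the _tum
// policy, tail elements (index >= vl) keep the values already in vd, while
// masked-off elements follow the mask-agnostic policy.
static inline vuint32m1_t srl_masked_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                               vuint32m1_t vs2, size_t shamt,
                                               size_t vl) {
  return __riscv_vsrl_vx_u32m1_tum(vm, vd, vs2, shamt, vl);
}
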
// masked functions (tail undisturbed, mask undisturbed: _tumu suffix)
vint8mf8_t __riscv_vsll_vv_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                      vint8mf8_t vs2, vuint8mf8_t vs1,
                                      size_t vl);
vint8mf8_t __riscv_vsll_vx_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                      vint8mf8_t vs2, size_t rs1, size_t vl);
vint8mf4_t __riscv_vsll_vv_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                      vint8mf4_t vs2, vuint8mf4_t vs1,
                                      size_t vl);
vint8mf4_t __riscv_vsll_vx_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                      vint8mf4_t vs2, size_t rs1, size_t vl);
vint8mf2_t __riscv_vsll_vv_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                      vint8mf2_t vs2, vuint8mf2_t vs1,
                                      size_t vl);
vint8mf2_t __riscv_vsll_vx_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                      vint8mf2_t vs2, size_t rs1, size_t vl);
vint8m1_t __riscv_vsll_vv_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                    vuint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vsll_vx_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                    size_t rs1, size_t vl);
vint8m2_t __riscv_vsll_vv_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                    vuint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vsll_vx_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                    size_t rs1, size_t vl);
vint8m4_t __riscv_vsll_vv_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                    vuint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vsll_vx_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                    size_t rs1, size_t vl);
vint8m8_t __riscv_vsll_vv_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                    vuint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vsll_vx_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                    size_t rs1, size_t vl);
vint16mf4_t __riscv_vsll_vv_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs2, vuint16mf4_t vs1,
                                        size_t vl);
vint16mf4_t __riscv_vsll_vx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs2, size_t rs1, size_t vl);
vint16mf2_t __riscv_vsll_vv_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs2, vuint16mf2_t vs1,
                                        size_t vl);
vint16mf2_t __riscv_vsll_vx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs2, size_t rs1, size_t vl);
vint16m1_t __riscv_vsll_vv_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs2, vuint16m1_t vs1,
                                      size_t vl);
vint16m1_t __riscv_vsll_vx_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs2, size_t rs1, size_t vl);
vint16m2_t __riscv_vsll_vv_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs2, vuint16m2_t vs1,
                                      size_t vl);
vint16m2_t __riscv_vsll_vx_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs2, size_t rs1, size_t vl);
vint16m4_t __riscv_vsll_vv_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs2, vuint16m4_t vs1,
                                      size_t vl);
vint16m4_t __riscv_vsll_vx_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs2, size_t rs1, size_t vl);
vint16m8_t __riscv_vsll_vv_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs2, vuint16m8_t vs1,
                                      size_t vl);
vint16m8_t __riscv_vsll_vx_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs2, size_t rs1, size_t vl);
vint32mf2_t __riscv_vsll_vv_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs2, vuint32mf2_t vs1,
                                        size_t vl);
vint32mf2_t __riscv_vsll_vx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs2, size_t rs1, size_t vl);
vint32m1_t __riscv_vsll_vv_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs2, vuint32m1_t vs1,
                                      size_t vl);
vint32m1_t __riscv_vsll_vx_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs2, size_t rs1, size_t vl);
vint32m2_t __riscv_vsll_vv_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs2, vuint32m2_t vs1,
                                      size_t vl);
vint32m2_t __riscv_vsll_vx_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs2, size_t rs1, size_t vl);
vint32m4_t __riscv_vsll_vv_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs2, vuint32m4_t vs1,
                                      size_t vl);
vint32m4_t __riscv_vsll_vx_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs2, size_t rs1, size_t vl);
vint32m8_t __riscv_vsll_vv_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs2, vuint32m8_t vs1,
                                      size_t vl);
vint32m8_t __riscv_vsll_vx_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs2, size_t rs1, size_t vl);
vint64m1_t __riscv_vsll_vv_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs2, vuint64m1_t vs1,
                                      size_t vl);
vint64m1_t __riscv_vsll_vx_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs2, size_t rs1, size_t vl);
vint64m2_t __riscv_vsll_vv_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs2, vuint64m2_t vs1,
                                      size_t vl);
vint64m2_t __riscv_vsll_vx_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs2, size_t rs1, size_t vl);
vint64m4_t __riscv_vsll_vv_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs2, vuint64m4_t vs1,
                                      size_t vl);
vint64m4_t __riscv_vsll_vx_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs2, size_t rs1, size_t vl);
vint64m8_t __riscv_vsll_vv_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs2, vuint64m8_t vs1,
                                      size_t vl);
vint64m8_t __riscv_vsll_vx_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs2, size_t rs1, size_t vl);
vint8mf8_t __riscv_vsra_vv_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                      vint8mf8_t vs2, vuint8mf8_t vs1,
                                      size_t vl);
vint8mf8_t __riscv_vsra_vx_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                      vint8mf8_t vs2, size_t rs1, size_t vl);
vint8mf4_t __riscv_vsra_vv_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                      vint8mf4_t vs2, vuint8mf4_t vs1,
                                      size_t vl);
vint8mf4_t __riscv_vsra_vx_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                      vint8mf4_t vs2, size_t rs1, size_t vl);
vint8mf2_t __riscv_vsra_vv_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                      vint8mf2_t vs2, vuint8mf2_t vs1,
                                      size_t vl);
vint8mf2_t __riscv_vsra_vx_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                      vint8mf2_t vs2, size_t rs1, size_t vl);
vint8m1_t __riscv_vsra_vv_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                    vuint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vsra_vx_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                    size_t rs1, size_t vl);
vint8m2_t __riscv_vsra_vv_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                    vuint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vsra_vx_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                    size_t rs1, size_t vl);
vint8m4_t __riscv_vsra_vv_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                    vuint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vsra_vx_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                    size_t rs1, size_t vl);
vint8m8_t __riscv_vsra_vv_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                    vuint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vsra_vx_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                    size_t rs1, size_t vl);
vint16mf4_t __riscv_vsra_vv_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs2, vuint16mf4_t vs1,
                                        size_t vl);
vint16mf4_t __riscv_vsra_vx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs2, size_t rs1, size_t vl);
vint16mf2_t __riscv_vsra_vv_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs2, vuint16mf2_t vs1,
                                        size_t vl);
vint16mf2_t __riscv_vsra_vx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs2, size_t rs1, size_t vl);
vint16m1_t __riscv_vsra_vv_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs2, vuint16m1_t vs1,
                                      size_t vl);
vint16m1_t __riscv_vsra_vx_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs2, size_t rs1, size_t vl);
vint16m2_t __riscv_vsra_vv_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs2, vuint16m2_t vs1,
                                      size_t vl);
vint16m2_t __riscv_vsra_vx_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs2, size_t rs1, size_t vl);
vint16m4_t __riscv_vsra_vv_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs2, vuint16m4_t vs1,
                                      size_t vl);
vint16m4_t __riscv_vsra_vx_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs2, size_t rs1, size_t vl);
vint16m8_t __riscv_vsra_vv_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs2, vuint16m8_t vs1,
                                      size_t vl);
vint16m8_t __riscv_vsra_vx_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs2, size_t rs1, size_t vl);
vint32mf2_t __riscv_vsra_vv_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs2, vuint32mf2_t vs1,
                                        size_t vl);
vint32mf2_t __riscv_vsra_vx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs2, size_t rs1, size_t vl);
vint32m1_t __riscv_vsra_vv_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs2, vuint32m1_t vs1,
                                      size_t vl);
vint32m1_t __riscv_vsra_vx_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs2, size_t rs1, size_t vl);
vint32m2_t __riscv_vsra_vv_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs2, vuint32m2_t vs1,
                                      size_t vl);
vint32m2_t __riscv_vsra_vx_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs2, size_t rs1, size_t vl);
vint32m4_t __riscv_vsra_vv_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs2, vuint32m4_t vs1,
                                      size_t vl);
vint32m4_t __riscv_vsra_vx_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs2, size_t rs1, size_t vl);
vint32m8_t __riscv_vsra_vv_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs2, vuint32m8_t vs1,
                                      size_t vl);
vint32m8_t __riscv_vsra_vx_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs2, size_t rs1, size_t vl);
vint64m1_t __riscv_vsra_vv_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs2, vuint64m1_t vs1,
                                      size_t vl);
vint64m1_t __riscv_vsra_vx_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs2, size_t rs1, size_t vl);
vint64m2_t __riscv_vsra_vv_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs2, vuint64m2_t vs1,
                                      size_t vl);
vint64m2_t __riscv_vsra_vx_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs2, size_t rs1, size_t vl);
vint64m4_t __riscv_vsra_vv_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs2, vuint64m4_t vs1,
                                      size_t vl);
vint64m4_t __riscv_vsra_vx_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs2, size_t rs1, size_t vl);
vint64m8_t __riscv_vsra_vv_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs2, vuint64m8_t vs1,
                                      size_t vl);
vint64m8_t __riscv_vsra_vx_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs2, size_t rs1, size_t vl);
vuint8mf8_t __riscv_vsll_vv_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                       vuint8mf8_t vs2, vuint8mf8_t vs1,
                                       size_t vl);
vuint8mf8_t __riscv_vsll_vx_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                       vuint8mf8_t vs2, size_t rs1, size_t vl);
vuint8mf4_t __riscv_vsll_vv_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                       vuint8mf4_t vs2, vuint8mf4_t vs1,
                                       size_t vl);
vuint8mf4_t __riscv_vsll_vx_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                       vuint8mf4_t vs2, size_t rs1, size_t vl);
vuint8mf2_t __riscv_vsll_vv_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                       vuint8mf2_t vs2, vuint8mf2_t vs1,
                                       size_t vl);
vuint8mf2_t __riscv_vsll_vx_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                       vuint8mf2_t vs2, size_t rs1, size_t vl);
vuint8m1_t __riscv_vsll_vv_u8m1_tumu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                     vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vsll_vx_u8m1_tumu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                     size_t rs1, size_t vl);
vuint8m2_t __riscv_vsll_vv_u8m2_tumu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                     vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vsll_vx_u8m2_tumu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                     size_t rs1, size_t vl);
vuint8m4_t __riscv_vsll_vv_u8m4_tumu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                     vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vsll_vx_u8m4_tumu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                     size_t rs1, size_t vl);
vuint8m8_t __riscv_vsll_vv_u8m8_tumu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                     vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vsll_vx_u8m8_tumu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                     size_t rs1, size_t vl);
vuint16mf4_t __riscv_vsll_vv_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs2, vuint16mf4_t vs1,
                                         size_t vl);
vuint16mf4_t __riscv_vsll_vx_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs2, size_t rs1,
                                         size_t vl);
vuint16mf2_t __riscv_vsll_vv_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs2, vuint16mf2_t vs1,
                                         size_t vl);
vuint16mf2_t __riscv_vsll_vx_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs2, size_t rs1,
                                         size_t vl);
vuint16m1_t __riscv_vsll_vv_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs2, vuint16m1_t vs1,
                                       size_t vl);
vuint16m1_t __riscv_vsll_vx_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs2, size_t rs1, size_t vl);
vuint16m2_t __riscv_vsll_vv_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs2, vuint16m2_t vs1,
                                       size_t vl);
vuint16m2_t __riscv_vsll_vx_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs2, size_t rs1, size_t vl);
vuint16m4_t __riscv_vsll_vv_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs2, vuint16m4_t vs1,
                                       size_t vl);
vuint16m4_t __riscv_vsll_vx_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs2, size_t rs1, size_t vl);
vuint16m8_t __riscv_vsll_vv_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs2, vuint16m8_t vs1,
                                       size_t vl);
vuint16m8_t __riscv_vsll_vx_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs2, size_t rs1, size_t vl);
vuint32mf2_t __riscv_vsll_vv_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs2, vuint32mf2_t vs1,
                                         size_t vl);
vuint32mf2_t __riscv_vsll_vx_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs2, size_t rs1,
                                         size_t vl);
vuint32m1_t __riscv_vsll_vv_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs2, vuint32m1_t vs1,
                                       size_t vl);
vuint32m1_t __riscv_vsll_vx_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs2, size_t rs1, size_t vl);
vuint32m2_t __riscv_vsll_vv_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs2, vuint32m2_t vs1,
                                       size_t vl);
vuint32m2_t __riscv_vsll_vx_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs2, size_t rs1, size_t vl);
vuint32m4_t __riscv_vsll_vv_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs2, vuint32m4_t vs1,
                                       size_t vl);
vuint32m4_t __riscv_vsll_vx_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs2, size_t rs1, size_t vl);
vuint32m8_t __riscv_vsll_vv_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs2, vuint32m8_t vs1,
                                       size_t vl);
vuint32m8_t __riscv_vsll_vx_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs2, size_t rs1, size_t vl);
vuint64m1_t __riscv_vsll_vv_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs2, vuint64m1_t vs1,
                                       size_t vl);
vuint64m1_t __riscv_vsll_vx_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs2, size_t rs1, size_t vl);
vuint64m2_t __riscv_vsll_vv_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs2, vuint64m2_t vs1,
                                       size_t vl);
vuint64m2_t __riscv_vsll_vx_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs2, size_t rs1, size_t vl);
vuint64m4_t __riscv_vsll_vv_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs2, vuint64m4_t vs1,
                                       size_t vl);
vuint64m4_t __riscv_vsll_vx_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs2, size_t rs1, size_t vl);
vuint64m8_t __riscv_vsll_vv_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs2, vuint64m8_t vs1,
                                       size_t vl);
vuint64m8_t __riscv_vsll_vx_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs2, size_t rs1, size_t vl);
vuint8mf8_t __riscv_vsrl_vv_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                       vuint8mf8_t vs2, vuint8mf8_t vs1,
                                       size_t vl);
vuint8mf8_t __riscv_vsrl_vx_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                       vuint8mf8_t vs2, size_t rs1, size_t vl);
vuint8mf4_t __riscv_vsrl_vv_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                       vuint8mf4_t vs2, vuint8mf4_t vs1,
                                       size_t vl);
vuint8mf4_t __riscv_vsrl_vx_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                       vuint8mf4_t vs2, size_t rs1, size_t vl);
vuint8mf2_t __riscv_vsrl_vv_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                       vuint8mf2_t vs2, vuint8mf2_t vs1,
                                       size_t vl);
vuint8mf2_t __riscv_vsrl_vx_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                       vuint8mf2_t vs2, size_t rs1, size_t vl);
vuint8m1_t __riscv_vsrl_vv_u8m1_tumu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                     vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vsrl_vx_u8m1_tumu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                     size_t rs1, size_t vl);
vuint8m2_t __riscv_vsrl_vv_u8m2_tumu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                     vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vsrl_vx_u8m2_tumu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                     size_t rs1, size_t vl);
vuint8m4_t __riscv_vsrl_vv_u8m4_tumu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                     vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vsrl_vx_u8m4_tumu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                     size_t rs1, size_t vl);
vuint8m8_t __riscv_vsrl_vv_u8m8_tumu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                     vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vsrl_vx_u8m8_tumu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                     size_t rs1, size_t vl);
vuint16mf4_t __riscv_vsrl_vv_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs2, vuint16mf4_t vs1,
                                         size_t vl);
vuint16mf4_t __riscv_vsrl_vx_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs2, size_t rs1,
                                         size_t vl);
vuint16mf2_t __riscv_vsrl_vv_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs2, vuint16mf2_t vs1,
                                         size_t vl);
vuint16mf2_t __riscv_vsrl_vx_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs2, size_t rs1,
                                         size_t vl);
vuint16m1_t __riscv_vsrl_vv_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs2, vuint16m1_t vs1,
                                       size_t vl);
vuint16m1_t __riscv_vsrl_vx_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs2, size_t rs1, size_t vl);
vuint16m2_t __riscv_vsrl_vv_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs2, vuint16m2_t vs1,
                                       size_t vl);
vuint16m2_t __riscv_vsrl_vx_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs2, size_t rs1, size_t vl);
vuint16m4_t __riscv_vsrl_vv_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs2, vuint16m4_t vs1,
                                       size_t vl);
vuint16m4_t __riscv_vsrl_vx_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs2, size_t rs1, size_t vl);
vuint16m8_t __riscv_vsrl_vv_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs2, vuint16m8_t vs1,
                                       size_t vl);
vuint16m8_t __riscv_vsrl_vx_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs2, size_t rs1, size_t vl);
vuint32mf2_t __riscv_vsrl_vv_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs2, vuint32mf2_t vs1,
                                         size_t vl);
vuint32mf2_t __riscv_vsrl_vx_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs2, size_t rs1,
                                         size_t vl);
vuint32m1_t __riscv_vsrl_vv_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs2, vuint32m1_t vs1,
                                       size_t vl);
vuint32m1_t __riscv_vsrl_vx_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs2, size_t rs1, size_t vl);
vuint32m2_t __riscv_vsrl_vv_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs2, vuint32m2_t vs1,
                                       size_t vl);
vuint32m2_t __riscv_vsrl_vx_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs2, size_t rs1, size_t vl);
vuint32m4_t __riscv_vsrl_vv_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs2, vuint32m4_t vs1,
                                       size_t vl);
vuint32m4_t __riscv_vsrl_vx_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs2, size_t rs1, size_t vl);
vuint32m8_t __riscv_vsrl_vv_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs2, vuint32m8_t vs1,
                                       size_t vl);
vuint32m8_t __riscv_vsrl_vx_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs2, size_t rs1, size_t vl);
vuint64m1_t __riscv_vsrl_vv_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs2, vuint64m1_t vs1,
                                       size_t vl);
vuint64m1_t __riscv_vsrl_vx_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs2, size_t rs1, size_t vl);
vuint64m2_t __riscv_vsrl_vv_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs2, vuint64m2_t vs1,
                                       size_t vl);
vuint64m2_t __riscv_vsrl_vx_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs2, size_t rs1, size_t vl);
vuint64m4_t __riscv_vsrl_vv_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs2, vuint64m4_t vs1,
                                       size_t vl);
vuint64m4_t __riscv_vsrl_vx_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs2, size_t rs1, size_t vl);
vuint64m8_t __riscv_vsrl_vv_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs2, vuint64m8_t vs1,
                                       size_t vl);
vuint64m8_t __riscv_vsrl_vx_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs2, size_t rs1, size_t vl);
// masked functions
vint8mf8_t __riscv_vsll_vv_i8mf8_mu(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs2,
                                    vuint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vsll_vx_i8mf8_mu(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs2,
                                    size_t rs1, size_t vl);
vint8mf4_t __riscv_vsll_vv_i8mf4_mu(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs2,
                                    vuint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vsll_vx_i8mf4_mu(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs2,
                                    size_t rs1, size_t vl);
vint8mf2_t __riscv_vsll_vv_i8mf2_mu(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs2,
                                    vuint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vsll_vx_i8mf2_mu(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs2,
                                    size_t rs1, size_t vl);
vint8m1_t __riscv_vsll_vv_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                  vuint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vsll_vx_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                  size_t rs1, size_t vl);
vint8m2_t __riscv_vsll_vv_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                  vuint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vsll_vx_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                  size_t rs1, size_t vl);
vint8m4_t __riscv_vsll_vv_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                  vuint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vsll_vx_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                  size_t rs1, size_t vl);
vint8m8_t __riscv_vsll_vv_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                  vuint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vsll_vx_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                  size_t rs1, size_t vl);
vint16mf4_t __riscv_vsll_vv_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                      vint16mf4_t vs2, vuint16mf4_t vs1,
                                      size_t vl);
vint16mf4_t __riscv_vsll_vx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                      vint16mf4_t vs2, size_t rs1, size_t vl);
vint16mf2_t __riscv_vsll_vv_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                      vint16mf2_t vs2, vuint16mf2_t vs1,
                                      size_t vl);
vint16mf2_t __riscv_vsll_vx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                      vint16mf2_t vs2, size_t rs1, size_t vl);
vint16m1_t __riscv_vsll_vv_i16m1_mu(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                                    vuint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vsll_vx_i16m1_mu(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                                    size_t rs1, size_t vl);
vint16m2_t __riscv_vsll_vv_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                    vuint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vsll_vx_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                    size_t rs1, size_t vl);
vint16m4_t __riscv_vsll_vv_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                    vuint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vsll_vx_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                    size_t rs1, size_t vl);
vint16m8_t __riscv_vsll_vv_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                    vuint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vsll_vx_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                    size_t rs1, size_t vl);
vint32mf2_t __riscv_vsll_vv_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                      vint32mf2_t vs2, vuint32mf2_t vs1,
                                      size_t vl);
vint32mf2_t __riscv_vsll_vx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                      vint32mf2_t vs2, size_t rs1, size_t vl);
vint32m1_t __riscv_vsll_vv_i32m1_mu(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                                    vuint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vsll_vx_i32m1_mu(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                                    size_t rs1, size_t vl);
vint32m2_t __riscv_vsll_vv_i32m2_mu(vbool16_t vm, vint32m2_t vd, vint32m2_t vs2,
                                    vuint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vsll_vx_i32m2_mu(vbool16_t vm, vint32m2_t vd, vint32m2_t vs2,
                                    size_t rs1, size_t vl);
vint32m4_t __riscv_vsll_vv_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                    vuint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vsll_vx_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                    size_t rs1, size_t vl);
vint32m8_t __riscv_vsll_vv_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                    vuint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vsll_vx_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                    size_t rs1, size_t vl);
vint64m1_t __riscv_vsll_vv_i64m1_mu(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                                    vuint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vsll_vx_i64m1_mu(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                                    size_t rs1, size_t vl);
vint64m2_t __riscv_vsll_vv_i64m2_mu(vbool32_t vm, vint64m2_t vd, vint64m2_t vs2,
                                    vuint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vsll_vx_i64m2_mu(vbool32_t vm, vint64m2_t vd, vint64m2_t vs2,
                                    size_t rs1, size_t vl);
vint64m4_t __riscv_vsll_vv_i64m4_mu(vbool16_t vm, vint64m4_t vd, vint64m4_t vs2,
                                    vuint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vsll_vx_i64m4_mu(vbool16_t vm, vint64m4_t vd, vint64m4_t vs2,
                                    size_t rs1, size_t vl);
vint64m8_t __riscv_vsll_vv_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                    vuint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vsll_vx_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                    size_t rs1, size_t vl);
vint8mf8_t __riscv_vsra_vv_i8mf8_mu(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs2,
                                    vuint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vsra_vx_i8mf8_mu(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs2,
                                    size_t rs1, size_t vl);
vint8mf4_t __riscv_vsra_vv_i8mf4_mu(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs2,
                                    vuint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vsra_vx_i8mf4_mu(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs2,
                                    size_t rs1, size_t vl);
vint8mf2_t __riscv_vsra_vv_i8mf2_mu(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs2,
                                    vuint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vsra_vx_i8mf2_mu(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs2,
                                    size_t rs1, size_t vl);
vint8m1_t __riscv_vsra_vv_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                  vuint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vsra_vx_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                  size_t rs1, size_t vl);
vint8m2_t __riscv_vsra_vv_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                  vuint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vsra_vx_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                  size_t rs1, size_t vl);
vint8m4_t __riscv_vsra_vv_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                  vuint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vsra_vx_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                  size_t rs1, size_t vl);
vint8m8_t __riscv_vsra_vv_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                  vuint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vsra_vx_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                  size_t rs1, size_t vl);
vint16mf4_t __riscv_vsra_vv_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                      vint16mf4_t vs2, vuint16mf4_t vs1,
                                      size_t vl);
vint16mf4_t __riscv_vsra_vx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                      vint16mf4_t vs2, size_t rs1, size_t vl);
vint16mf2_t __riscv_vsra_vv_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                      vint16mf2_t vs2, vuint16mf2_t vs1,
                                      size_t vl);
vint16mf2_t __riscv_vsra_vx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                      vint16mf2_t vs2, size_t rs1, size_t vl);
vint16m1_t __riscv_vsra_vv_i16m1_mu(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                                    vuint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vsra_vx_i16m1_mu(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                                    size_t rs1, size_t vl);
vint16m2_t __riscv_vsra_vv_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                    vuint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vsra_vx_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                    size_t rs1, size_t vl);
vint16m4_t __riscv_vsra_vv_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                    vuint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vsra_vx_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                    size_t rs1, size_t vl);
vint16m8_t __riscv_vsra_vv_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                    vuint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vsra_vx_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                    size_t rs1, size_t vl);
vint32mf2_t __riscv_vsra_vv_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                      vint32mf2_t vs2, vuint32mf2_t vs1,
                                      size_t vl);
vint32mf2_t __riscv_vsra_vx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                      vint32mf2_t vs2, size_t rs1, size_t vl);
vint32m1_t __riscv_vsra_vv_i32m1_mu(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                                    vuint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vsra_vx_i32m1_mu(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                                    size_t rs1, size_t vl);
vint32m2_t __riscv_vsra_vv_i32m2_mu(vbool16_t vm, vint32m2_t vd, vint32m2_t vs2,
                                    vuint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vsra_vx_i32m2_mu(vbool16_t vm, vint32m2_t vd, vint32m2_t vs2,
                                    size_t rs1, size_t vl);
vint32m4_t __riscv_vsra_vv_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                    vuint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vsra_vx_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                    size_t rs1, size_t vl);
vint32m8_t __riscv_vsra_vv_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                    vuint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vsra_vx_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                    size_t rs1, size_t vl);
vint64m1_t __riscv_vsra_vv_i64m1_mu(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                                    vuint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vsra_vx_i64m1_mu(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                                    size_t rs1, size_t vl);
vint64m2_t __riscv_vsra_vv_i64m2_mu(vbool32_t vm, vint64m2_t vd, vint64m2_t vs2,
                                    vuint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vsra_vx_i64m2_mu(vbool32_t vm, vint64m2_t vd, vint64m2_t vs2,
                                    size_t rs1, size_t vl);
vint64m4_t __riscv_vsra_vv_i64m4_mu(vbool16_t vm, vint64m4_t vd, vint64m4_t vs2,
                                    vuint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vsra_vx_i64m4_mu(vbool16_t vm, vint64m4_t vd, vint64m4_t vs2,
                                    size_t rs1, size_t vl);
vint64m8_t __riscv_vsra_vv_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                    vuint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vsra_vx_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                    size_t rs1, size_t vl);
vuint8mf8_t __riscv_vsll_vv_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                     vuint8mf8_t vs2, vuint8mf8_t vs1,
                                     size_t vl);
vuint8mf8_t __riscv_vsll_vx_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                     vuint8mf8_t vs2, size_t rs1, size_t vl);
vuint8mf4_t __riscv_vsll_vv_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                     vuint8mf4_t vs2, vuint8mf4_t vs1,
                                     size_t vl);
vuint8mf4_t __riscv_vsll_vx_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                     vuint8mf4_t vs2, size_t rs1, size_t vl);
vuint8mf2_t __riscv_vsll_vv_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                     vuint8mf2_t vs2, vuint8mf2_t vs1,
                                     size_t vl);
vuint8mf2_t __riscv_vsll_vx_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                     vuint8mf2_t vs2, size_t rs1, size_t vl);
vuint8m1_t __riscv_vsll_vv_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                   vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vsll_vx_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                   size_t rs1, size_t vl);
vuint8m2_t __riscv_vsll_vv_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                   vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vsll_vx_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                   size_t rs1, size_t vl);
vuint8m4_t __riscv_vsll_vv_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                   vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vsll_vx_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                   size_t rs1, size_t vl);
vuint8m8_t __riscv_vsll_vv_u8m8_mu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                   vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vsll_vx_u8m8_mu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                   size_t rs1, size_t vl);
vuint16mf4_t __riscv_vsll_vv_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                       vuint16mf4_t vs2, vuint16mf4_t vs1,
                                       size_t vl);
vuint16mf4_t __riscv_vsll_vx_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                       vuint16mf4_t vs2, size_t rs1, size_t vl);
vuint16mf2_t __riscv_vsll_vv_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                       vuint16mf2_t vs2, vuint16mf2_t vs1,
                                       size_t vl);
vuint16mf2_t __riscv_vsll_vx_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                       vuint16mf2_t vs2, size_t rs1, size_t vl);
vuint16m1_t __riscv_vsll_vv_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                     vuint16m1_t vs2, vuint16m1_t vs1,
                                     size_t vl);
vuint16m1_t __riscv_vsll_vx_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                     vuint16m1_t vs2, size_t rs1, size_t vl);
vuint16m2_t __riscv_vsll_vv_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                     vuint16m2_t vs2, vuint16m2_t vs1,
                                     size_t vl);
vuint16m2_t __riscv_vsll_vx_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                     vuint16m2_t vs2, size_t rs1, size_t vl);
vuint16m4_t __riscv_vsll_vv_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                     vuint16m4_t vs2, vuint16m4_t vs1,
                                     size_t vl);
vuint16m4_t __riscv_vsll_vx_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                     vuint16m4_t vs2, size_t rs1, size_t vl);
vuint16m8_t __riscv_vsll_vv_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                     vuint16m8_t vs2, vuint16m8_t vs1,
                                     size_t vl);
vuint16m8_t __riscv_vsll_vx_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                     vuint16m8_t vs2, size_t rs1, size_t vl);
vuint32mf2_t __riscv_vsll_vv_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                       vuint32mf2_t vs2, vuint32mf2_t vs1,
                                       size_t vl);
vuint32mf2_t __riscv_vsll_vx_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                       vuint32mf2_t vs2, size_t rs1, size_t vl);
vuint32m1_t __riscv_vsll_vv_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                     vuint32m1_t vs2, vuint32m1_t vs1,
                                     size_t vl);
vuint32m1_t __riscv_vsll_vx_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                     vuint32m1_t vs2, size_t rs1, size_t vl);
vuint32m2_t __riscv_vsll_vv_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                     vuint32m2_t vs2, vuint32m2_t vs1,
                                     size_t vl);
vuint32m2_t __riscv_vsll_vx_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                     vuint32m2_t vs2, size_t rs1, size_t vl);
vuint32m4_t __riscv_vsll_vv_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                     vuint32m4_t vs2, vuint32m4_t vs1,
                                     size_t vl);
vuint32m4_t __riscv_vsll_vx_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                     vuint32m4_t vs2, size_t rs1, size_t vl);
vuint32m8_t __riscv_vsll_vv_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                     vuint32m8_t vs2, vuint32m8_t vs1,
                                     size_t vl);
vuint32m8_t __riscv_vsll_vx_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                     vuint32m8_t vs2, size_t rs1, size_t vl);
vuint64m1_t __riscv_vsll_vv_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                     vuint64m1_t vs2, vuint64m1_t vs1,
                                     size_t vl);
vuint64m1_t __riscv_vsll_vx_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                     vuint64m1_t vs2, size_t rs1, size_t vl);
vuint64m2_t __riscv_vsll_vv_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                     vuint64m2_t vs2, vuint64m2_t vs1,
                                     size_t vl);
vuint64m2_t __riscv_vsll_vx_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                     vuint64m2_t vs2, size_t rs1, size_t vl);
vuint64m4_t __riscv_vsll_vv_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                     vuint64m4_t vs2, vuint64m4_t vs1,
                                     size_t vl);
vuint64m4_t __riscv_vsll_vx_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                     vuint64m4_t vs2, size_t rs1, size_t vl);
vuint64m8_t __riscv_vsll_vv_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                     vuint64m8_t vs2, vuint64m8_t vs1,
                                     size_t vl);
vuint64m8_t __riscv_vsll_vx_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                     vuint64m8_t vs2, size_t rs1, size_t vl);
vuint8mf8_t __riscv_vsrl_vv_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                     vuint8mf8_t vs2, vuint8mf8_t vs1,
                                     size_t vl);
vuint8mf8_t __riscv_vsrl_vx_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                     vuint8mf8_t vs2, size_t rs1, size_t vl);
vuint8mf4_t __riscv_vsrl_vv_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                     vuint8mf4_t vs2, vuint8mf4_t vs1,
                                     size_t vl);
vuint8mf4_t __riscv_vsrl_vx_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                     vuint8mf4_t vs2, size_t rs1, size_t vl);
vuint8mf2_t __riscv_vsrl_vv_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                     vuint8mf2_t vs2, vuint8mf2_t vs1,
                                     size_t vl);
vuint8mf2_t __riscv_vsrl_vx_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                     vuint8mf2_t vs2, size_t rs1, size_t vl);
vuint8m1_t __riscv_vsrl_vv_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                   vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vsrl_vx_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                   size_t rs1, size_t vl);
vuint8m2_t __riscv_vsrl_vv_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                   vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vsrl_vx_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                   size_t rs1, size_t vl);
vuint8m4_t __riscv_vsrl_vv_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                   vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vsrl_vx_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                   size_t rs1, size_t vl);
vuint8m8_t __riscv_vsrl_vv_u8m8_mu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                   vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vsrl_vx_u8m8_mu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                   size_t rs1, size_t vl);
vuint16mf4_t __riscv_vsrl_vv_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                       vuint16mf4_t vs2, vuint16mf4_t vs1,
                                       size_t vl);
vuint16mf4_t __riscv_vsrl_vx_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                       vuint16mf4_t vs2, size_t rs1, size_t vl);
vuint16mf2_t __riscv_vsrl_vv_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                       vuint16mf2_t vs2, vuint16mf2_t vs1,
                                       size_t vl);
vuint16mf2_t __riscv_vsrl_vx_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                       vuint16mf2_t vs2, size_t rs1, size_t vl);
vuint16m1_t __riscv_vsrl_vv_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                     vuint16m1_t vs2, vuint16m1_t vs1,
                                     size_t vl);
vuint16m1_t __riscv_vsrl_vx_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                     vuint16m1_t vs2, size_t rs1, size_t vl);
vuint16m2_t __riscv_vsrl_vv_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                     vuint16m2_t vs2, vuint16m2_t vs1,
                                     size_t vl);
vuint16m2_t __riscv_vsrl_vx_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                     vuint16m2_t vs2, size_t rs1, size_t vl);
vuint16m4_t __riscv_vsrl_vv_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                     vuint16m4_t vs2, vuint16m4_t vs1,
                                     size_t vl);
vuint16m4_t __riscv_vsrl_vx_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                     vuint16m4_t vs2, size_t rs1, size_t vl);
vuint16m8_t __riscv_vsrl_vv_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                     vuint16m8_t vs2, vuint16m8_t vs1,
                                     size_t vl);
vuint16m8_t __riscv_vsrl_vx_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                     vuint16m8_t vs2, size_t rs1, size_t vl);
vuint32mf2_t __riscv_vsrl_vv_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                       vuint32mf2_t vs2, vuint32mf2_t vs1,
                                       size_t vl);
vuint32mf2_t __riscv_vsrl_vx_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                       vuint32mf2_t vs2, size_t rs1, size_t vl);
vuint32m1_t __riscv_vsrl_vv_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                     vuint32m1_t vs2, vuint32m1_t vs1,
                                     size_t vl);
vuint32m1_t __riscv_vsrl_vx_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                     vuint32m1_t vs2, size_t rs1, size_t vl);
vuint32m2_t __riscv_vsrl_vv_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                     vuint32m2_t vs2, vuint32m2_t vs1,
                                     size_t vl);
vuint32m2_t __riscv_vsrl_vx_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                     vuint32m2_t vs2, size_t rs1, size_t vl);
vuint32m4_t __riscv_vsrl_vv_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                     vuint32m4_t vs2, vuint32m4_t vs1,
                                     size_t vl);
vuint32m4_t __riscv_vsrl_vx_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                     vuint32m4_t vs2, size_t rs1, size_t vl);
vuint32m8_t __riscv_vsrl_vv_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                     vuint32m8_t vs2, vuint32m8_t vs1,
                                     size_t vl);
vuint32m8_t __riscv_vsrl_vx_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                     vuint32m8_t vs2, size_t rs1, size_t vl);
vuint64m1_t __riscv_vsrl_vv_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                     vuint64m1_t vs2, vuint64m1_t vs1,
                                     size_t vl);
vuint64m1_t __riscv_vsrl_vx_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                     vuint64m1_t vs2, size_t rs1, size_t vl);
vuint64m2_t __riscv_vsrl_vv_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                     vuint64m2_t vs2, vuint64m2_t vs1,
                                     size_t vl);
vuint64m2_t __riscv_vsrl_vx_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                     vuint64m2_t vs2, size_t rs1, size_t vl);
vuint64m4_t __riscv_vsrl_vv_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                     vuint64m4_t vs2, vuint64m4_t vs1,
                                     size_t vl);
vuint64m4_t __riscv_vsrl_vx_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                     vuint64m4_t vs2, size_t rs1, size_t vl);
vuint64m8_t __riscv_vsrl_vv_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                     vuint64m8_t vs2, vuint64m8_t vs1,
                                     size_t vl);
vuint64m8_t __riscv_vsrl_vx_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                     vuint64m8_t vs2, size_t rs1, size_t vl);
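
As a usage sketch (not part of the listing): the masked, mask-undisturbed (_mu) shift variants take their inactive-element values from vd, so a shift can be applied to selected lanes only. The sketch below arithmetically right-shifts just the negative elements of a buffer, assuming the vsetvl, load/store, and mask-compare intrinsics (__riscv_vsetvl_e32m1, __riscv_vle32_v_i32m1, __riscv_vse32_v_i32m1, __riscv_vmslt_vx_i32m1_b32) from other sections of this document.

#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

// Arithmetic right shift applied only to the negative elements of src;
// non-negative elements pass through unchanged because the _mu variant
// takes inactive elements from vd (here the original values).
void vsra_negative_only(int32_t *dst, const int32_t *src, size_t n,
                        size_t shamt) {
  for (size_t i = 0; i < n;) {
    size_t vl = __riscv_vsetvl_e32m1(n - i);
    vint32m1_t v = __riscv_vle32_v_i32m1(src + i, vl);
    vbool32_t neg = __riscv_vmslt_vx_i32m1_b32(v, 0, vl);   // mask of negative lanes
    vint32m1_t r = __riscv_vsra_vx_i32m1_mu(neg, v, v, shamt, vl);
    __riscv_vse32_v_i32m1(dst + i, r, vl);
    i += vl;
  }
}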

Vector Narrowing Integer Right Shift Intrinsics
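
The narrowing shifts take 2*SEW-wide elements in vs2 and produce SEW-wide results. A minimal sketch of rescaling 32-bit fixed-point values down to 16 bits with the tail-undisturbed (_tu) vnsra intrinsic listed below; __riscv_vsetvl_e32m2, __riscv_vle32_v_i32m2, __riscv_vmv_v_x_i16m1, and __riscv_vse16_v_i16m1 are assumed from other sections of this document.

#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

// Narrow 32-bit fixed-point values to 16 bits with an arithmetic right
// shift. The _tu form keeps the elements of vd past vl; a zero splat is
// used here so the tail of the result register is well defined.
void vnsra_narrow(int16_t *dst, const int32_t *src, size_t n, size_t shamt) {
  for (size_t i = 0; i < n;) {
    size_t vl = __riscv_vsetvl_e32m2(n - i);
    vint32m2_t wide = __riscv_vle32_v_i32m2(src + i, vl);
    vint16m1_t zero = __riscv_vmv_v_x_i16m1(0, vl);
    vint16m1_t out = __riscv_vnsra_wx_i16m1_tu(zero, wide, shamt, vl);
    __riscv_vse16_v_i16m1(dst + i, out, vl);
    i += vl;
  }
}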

vint8mf8_t __riscv_vnsra_wv_i8mf8_tu(vint8mf8_t vd, vint16mf4_t vs2,
                                     vuint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vnsra_wx_i8mf8_tu(vint8mf8_t vd, vint16mf4_t vs2, size_t rs1,
                                     size_t vl);
vint8mf4_t __riscv_vnsra_wv_i8mf4_tu(vint8mf4_t vd, vint16mf2_t vs2,
                                     vuint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vnsra_wx_i8mf4_tu(vint8mf4_t vd, vint16mf2_t vs2, size_t rs1,
                                     size_t vl);
vint8mf2_t __riscv_vnsra_wv_i8mf2_tu(vint8mf2_t vd, vint16m1_t vs2,
                                     vuint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vnsra_wx_i8mf2_tu(vint8mf2_t vd, vint16m1_t vs2, size_t rs1,
                                     size_t vl);
vint8m1_t __riscv_vnsra_wv_i8m1_tu(vint8m1_t vd, vint16m2_t vs2, vuint8m1_t vs1,
                                   size_t vl);
vint8m1_t __riscv_vnsra_wx_i8m1_tu(vint8m1_t vd, vint16m2_t vs2, size_t rs1,
                                   size_t vl);
vint8m2_t __riscv_vnsra_wv_i8m2_tu(vint8m2_t vd, vint16m4_t vs2, vuint8m2_t vs1,
                                   size_t vl);
vint8m2_t __riscv_vnsra_wx_i8m2_tu(vint8m2_t vd, vint16m4_t vs2, size_t rs1,
                                   size_t vl);
vint8m4_t __riscv_vnsra_wv_i8m4_tu(vint8m4_t vd, vint16m8_t vs2, vuint8m4_t vs1,
                                   size_t vl);
vint8m4_t __riscv_vnsra_wx_i8m4_tu(vint8m4_t vd, vint16m8_t vs2, size_t rs1,
                                   size_t vl);
vint16mf4_t __riscv_vnsra_wv_i16mf4_tu(vint16mf4_t vd, vint32mf2_t vs2,
                                       vuint16mf4_t vs1, size_t vl);
vint16mf4_t __riscv_vnsra_wx_i16mf4_tu(vint16mf4_t vd, vint32mf2_t vs2,
                                       size_t rs1, size_t vl);
vint16mf2_t __riscv_vnsra_wv_i16mf2_tu(vint16mf2_t vd, vint32m1_t vs2,
                                       vuint16mf2_t vs1, size_t vl);
vint16mf2_t __riscv_vnsra_wx_i16mf2_tu(vint16mf2_t vd, vint32m1_t vs2,
                                       size_t rs1, size_t vl);
vint16m1_t __riscv_vnsra_wv_i16m1_tu(vint16m1_t vd, vint32m2_t vs2,
                                     vuint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vnsra_wx_i16m1_tu(vint16m1_t vd, vint32m2_t vs2, size_t rs1,
                                     size_t vl);
vint16m2_t __riscv_vnsra_wv_i16m2_tu(vint16m2_t vd, vint32m4_t vs2,
                                     vuint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vnsra_wx_i16m2_tu(vint16m2_t vd, vint32m4_t vs2, size_t rs1,
                                     size_t vl);
vint16m4_t __riscv_vnsra_wv_i16m4_tu(vint16m4_t vd, vint32m8_t vs2,
                                     vuint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vnsra_wx_i16m4_tu(vint16m4_t vd, vint32m8_t vs2, size_t rs1,
                                     size_t vl);
vint32mf2_t __riscv_vnsra_wv_i32mf2_tu(vint32mf2_t vd, vint64m1_t vs2,
                                       vuint32mf2_t vs1, size_t vl);
vint32mf2_t __riscv_vnsra_wx_i32mf2_tu(vint32mf2_t vd, vint64m1_t vs2,
                                       size_t rs1, size_t vl);
vint32m1_t __riscv_vnsra_wv_i32m1_tu(vint32m1_t vd, vint64m2_t vs2,
                                     vuint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vnsra_wx_i32m1_tu(vint32m1_t vd, vint64m2_t vs2, size_t rs1,
                                     size_t vl);
vint32m2_t __riscv_vnsra_wv_i32m2_tu(vint32m2_t vd, vint64m4_t vs2,
                                     vuint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vnsra_wx_i32m2_tu(vint32m2_t vd, vint64m4_t vs2, size_t rs1,
                                     size_t vl);
vint32m4_t __riscv_vnsra_wv_i32m4_tu(vint32m4_t vd, vint64m8_t vs2,
                                     vuint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vnsra_wx_i32m4_tu(vint32m4_t vd, vint64m8_t vs2, size_t rs1,
                                     size_t vl);
vuint8mf8_t __riscv_vnsrl_wv_u8mf8_tu(vuint8mf8_t vd, vuint16mf4_t vs2,
                                      vuint8mf8_t vs1, size_t vl);
vuint8mf8_t __riscv_vnsrl_wx_u8mf8_tu(vuint8mf8_t vd, vuint16mf4_t vs2,
                                      size_t rs1, size_t vl);
vuint8mf4_t __riscv_vnsrl_wv_u8mf4_tu(vuint8mf4_t vd, vuint16mf2_t vs2,
                                      vuint8mf4_t vs1, size_t vl);
vuint8mf4_t __riscv_vnsrl_wx_u8mf4_tu(vuint8mf4_t vd, vuint16mf2_t vs2,
                                      size_t rs1, size_t vl);
vuint8mf2_t __riscv_vnsrl_wv_u8mf2_tu(vuint8mf2_t vd, vuint16m1_t vs2,
                                      vuint8mf2_t vs1, size_t vl);
vuint8mf2_t __riscv_vnsrl_wx_u8mf2_tu(vuint8mf2_t vd, vuint16m1_t vs2,
                                      size_t rs1, size_t vl);
vuint8m1_t __riscv_vnsrl_wv_u8m1_tu(vuint8m1_t vd, vuint16m2_t vs2,
                                    vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vnsrl_wx_u8m1_tu(vuint8m1_t vd, vuint16m2_t vs2, size_t rs1,
                                    size_t vl);
vuint8m2_t __riscv_vnsrl_wv_u8m2_tu(vuint8m2_t vd, vuint16m4_t vs2,
                                    vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vnsrl_wx_u8m2_tu(vuint8m2_t vd, vuint16m4_t vs2, size_t rs1,
                                    size_t vl);
vuint8m4_t __riscv_vnsrl_wv_u8m4_tu(vuint8m4_t vd, vuint16m8_t vs2,
                                    vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vnsrl_wx_u8m4_tu(vuint8m4_t vd, vuint16m8_t vs2, size_t rs1,
                                    size_t vl);
vuint16mf4_t __riscv_vnsrl_wv_u16mf4_tu(vuint16mf4_t vd, vuint32mf2_t vs2,
                                        vuint16mf4_t vs1, size_t vl);
vuint16mf4_t __riscv_vnsrl_wx_u16mf4_tu(vuint16mf4_t vd, vuint32mf2_t vs2,
                                        size_t rs1, size_t vl);
vuint16mf2_t __riscv_vnsrl_wv_u16mf2_tu(vuint16mf2_t vd, vuint32m1_t vs2,
                                        vuint16mf2_t vs1, size_t vl);
vuint16mf2_t __riscv_vnsrl_wx_u16mf2_tu(vuint16mf2_t vd, vuint32m1_t vs2,
                                        size_t rs1, size_t vl);
vuint16m1_t __riscv_vnsrl_wv_u16m1_tu(vuint16m1_t vd, vuint32m2_t vs2,
                                      vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vnsrl_wx_u16m1_tu(vuint16m1_t vd, vuint32m2_t vs2,
                                      size_t rs1, size_t vl);
vuint16m2_t __riscv_vnsrl_wv_u16m2_tu(vuint16m2_t vd, vuint32m4_t vs2,
                                      vuint16m2_t vs1, size_t vl);
vuint16m2_t __riscv_vnsrl_wx_u16m2_tu(vuint16m2_t vd, vuint32m4_t vs2,
                                      size_t rs1, size_t vl);
vuint16m4_t __riscv_vnsrl_wv_u16m4_tu(vuint16m4_t vd, vuint32m8_t vs2,
                                      vuint16m4_t vs1, size_t vl);
vuint16m4_t __riscv_vnsrl_wx_u16m4_tu(vuint16m4_t vd, vuint32m8_t vs2,
                                      size_t rs1, size_t vl);
vuint32mf2_t __riscv_vnsrl_wv_u32mf2_tu(vuint32mf2_t vd, vuint64m1_t vs2,
                                        vuint32mf2_t vs1, size_t vl);
vuint32mf2_t __riscv_vnsrl_wx_u32mf2_tu(vuint32mf2_t vd, vuint64m1_t vs2,
                                        size_t rs1, size_t vl);
vuint32m1_t __riscv_vnsrl_wv_u32m1_tu(vuint32m1_t vd, vuint64m2_t vs2,
                                      vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vnsrl_wx_u32m1_tu(vuint32m1_t vd, vuint64m2_t vs2,
                                      size_t rs1, size_t vl);
vuint32m2_t __riscv_vnsrl_wv_u32m2_tu(vuint32m2_t vd, vuint64m4_t vs2,
                                      vuint32m2_t vs1, size_t vl);
vuint32m2_t __riscv_vnsrl_wx_u32m2_tu(vuint32m2_t vd, vuint64m4_t vs2,
                                      size_t rs1, size_t vl);
vuint32m4_t __riscv_vnsrl_wv_u32m4_tu(vuint32m4_t vd, vuint64m8_t vs2,
                                      vuint32m4_t vs1, size_t vl);
vuint32m4_t __riscv_vnsrl_wx_u32m4_tu(vuint32m4_t vd, vuint64m8_t vs2,
                                      size_t rs1, size_t vl);
// masked functions
vint8mf8_t __riscv_vnsra_wv_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                      vint16mf4_t vs2, vuint8mf8_t vs1,
                                      size_t vl);
vint8mf8_t __riscv_vnsra_wx_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                      vint16mf4_t vs2, size_t rs1, size_t vl);
vint8mf4_t __riscv_vnsra_wv_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                      vint16mf2_t vs2, vuint8mf4_t vs1,
                                      size_t vl);
vint8mf4_t __riscv_vnsra_wx_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                      vint16mf2_t vs2, size_t rs1, size_t vl);
vint8mf2_t __riscv_vnsra_wv_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                      vint16m1_t vs2, vuint8mf2_t vs1,
                                      size_t vl);
vint8mf2_t __riscv_vnsra_wx_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                      vint16m1_t vs2, size_t rs1, size_t vl);
vint8m1_t __riscv_vnsra_wv_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint16m2_t vs2,
                                    vuint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vnsra_wx_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint16m2_t vs2,
                                    size_t rs1, size_t vl);
vint8m2_t __riscv_vnsra_wv_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint16m4_t vs2,
                                    vuint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vnsra_wx_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint16m4_t vs2,
                                    size_t rs1, size_t vl);
vint8m4_t __riscv_vnsra_wv_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint16m8_t vs2,
                                    vuint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vnsra_wx_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint16m8_t vs2,
                                    size_t rs1, size_t vl);
vint16mf4_t __riscv_vnsra_wv_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                        vint32mf2_t vs2, vuint16mf4_t vs1,
                                        size_t vl);
vint16mf4_t __riscv_vnsra_wx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                        vint32mf2_t vs2, size_t rs1, size_t vl);
vint16mf2_t __riscv_vnsra_wv_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                        vint32m1_t vs2, vuint16mf2_t vs1,
                                        size_t vl);
vint16mf2_t __riscv_vnsra_wx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                        vint32m1_t vs2, size_t rs1, size_t vl);
vint16m1_t __riscv_vnsra_wv_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                      vint32m2_t vs2, vuint16m1_t vs1,
                                      size_t vl);
vint16m1_t __riscv_vnsra_wx_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                      vint32m2_t vs2, size_t rs1, size_t vl);
vint16m2_t __riscv_vnsra_wv_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                      vint32m4_t vs2, vuint16m2_t vs1,
                                      size_t vl);
vint16m2_t __riscv_vnsra_wx_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                      vint32m4_t vs2, size_t rs1, size_t vl);
vint16m4_t __riscv_vnsra_wv_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                      vint32m8_t vs2, vuint16m4_t vs1,
                                      size_t vl);
vint16m4_t __riscv_vnsra_wx_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                      vint32m8_t vs2, size_t rs1, size_t vl);
vint32mf2_t __riscv_vnsra_wv_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                        vint64m1_t vs2, vuint32mf2_t vs1,
                                        size_t vl);
vint32mf2_t __riscv_vnsra_wx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                        vint64m1_t vs2, size_t rs1, size_t vl);
vint32m1_t __riscv_vnsra_wv_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                      vint64m2_t vs2, vuint32m1_t vs1,
                                      size_t vl);
vint32m1_t __riscv_vnsra_wx_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                      vint64m2_t vs2, size_t rs1, size_t vl);
vint32m2_t __riscv_vnsra_wv_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                      vint64m4_t vs2, vuint32m2_t vs1,
                                      size_t vl);
vint32m2_t __riscv_vnsra_wx_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                      vint64m4_t vs2, size_t rs1, size_t vl);
vint32m4_t __riscv_vnsra_wv_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                      vint64m8_t vs2, vuint32m4_t vs1,
                                      size_t vl);
vint32m4_t __riscv_vnsra_wx_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                      vint64m8_t vs2, size_t rs1, size_t vl);
vuint8mf8_t __riscv_vnsrl_wv_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                       vuint16mf4_t vs2, vuint8mf8_t vs1,
                                       size_t vl);
vuint8mf8_t __riscv_vnsrl_wx_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                       vuint16mf4_t vs2, size_t rs1, size_t vl);
vuint8mf4_t __riscv_vnsrl_wv_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                       vuint16mf2_t vs2, vuint8mf4_t vs1,
                                       size_t vl);
vuint8mf4_t __riscv_vnsrl_wx_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                       vuint16mf2_t vs2, size_t rs1, size_t vl);
vuint8mf2_t __riscv_vnsrl_wv_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                       vuint16m1_t vs2, vuint8mf2_t vs1,
                                       size_t vl);
vuint8mf2_t __riscv_vnsrl_wx_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                       vuint16m1_t vs2, size_t rs1, size_t vl);
vuint8m1_t __riscv_vnsrl_wv_u8m1_tum(vbool8_t vm, vuint8m1_t vd,
                                     vuint16m2_t vs2, vuint8m1_t vs1,
                                     size_t vl);
vuint8m1_t __riscv_vnsrl_wx_u8m1_tum(vbool8_t vm, vuint8m1_t vd,
                                     vuint16m2_t vs2, size_t rs1, size_t vl);
vuint8m2_t __riscv_vnsrl_wv_u8m2_tum(vbool4_t vm, vuint8m2_t vd,
                                     vuint16m4_t vs2, vuint8m2_t vs1,
                                     size_t vl);
vuint8m2_t __riscv_vnsrl_wx_u8m2_tum(vbool4_t vm, vuint8m2_t vd,
                                     vuint16m4_t vs2, size_t rs1, size_t vl);
vuint8m4_t __riscv_vnsrl_wv_u8m4_tum(vbool2_t vm, vuint8m4_t vd,
                                     vuint16m8_t vs2, vuint8m4_t vs1,
                                     size_t vl);
vuint8m4_t __riscv_vnsrl_wx_u8m4_tum(vbool2_t vm, vuint8m4_t vd,
                                     vuint16m8_t vs2, size_t rs1, size_t vl);
vuint16mf4_t __riscv_vnsrl_wv_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                         vuint32mf2_t vs2, vuint16mf4_t vs1,
                                         size_t vl);
vuint16mf4_t __riscv_vnsrl_wx_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                         vuint32mf2_t vs2, size_t rs1,
                                         size_t vl);
vuint16mf2_t __riscv_vnsrl_wv_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                         vuint32m1_t vs2, vuint16mf2_t vs1,
                                         size_t vl);
vuint16mf2_t __riscv_vnsrl_wx_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                         vuint32m1_t vs2, size_t rs1,
                                         size_t vl);
vuint16m1_t __riscv_vnsrl_wv_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                       vuint32m2_t vs2, vuint16m1_t vs1,
                                       size_t vl);
vuint16m1_t __riscv_vnsrl_wx_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                       vuint32m2_t vs2, size_t rs1, size_t vl);
vuint16m2_t __riscv_vnsrl_wv_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                       vuint32m4_t vs2, vuint16m2_t vs1,
                                       size_t vl);
vuint16m2_t __riscv_vnsrl_wx_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                       vuint32m4_t vs2, size_t rs1, size_t vl);
vuint16m4_t __riscv_vnsrl_wv_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                       vuint32m8_t vs2, vuint16m4_t vs1,
                                       size_t vl);
vuint16m4_t __riscv_vnsrl_wx_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                       vuint32m8_t vs2, size_t rs1, size_t vl);
vuint32mf2_t __riscv_vnsrl_wv_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                         vuint64m1_t vs2, vuint32mf2_t vs1,
                                         size_t vl);
vuint32mf2_t __riscv_vnsrl_wx_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                         vuint64m1_t vs2, size_t rs1,
                                         size_t vl);
vuint32m1_t __riscv_vnsrl_wv_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                       vuint64m2_t vs2, vuint32m1_t vs1,
                                       size_t vl);
vuint32m1_t __riscv_vnsrl_wx_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                       vuint64m2_t vs2, size_t rs1, size_t vl);
vuint32m2_t __riscv_vnsrl_wv_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                       vuint64m4_t vs2, vuint32m2_t vs1,
                                       size_t vl);
vuint32m2_t __riscv_vnsrl_wx_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                       vuint64m4_t vs2, size_t rs1, size_t vl);
vuint32m4_t __riscv_vnsrl_wv_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                       vuint64m8_t vs2, vuint32m4_t vs1,
                                       size_t vl);
vuint32m4_t __riscv_vnsrl_wx_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                       vuint64m8_t vs2, size_t rs1, size_t vl);
// masked functions
vint8mf8_t __riscv_vnsra_wv_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                       vint16mf4_t vs2, vuint8mf8_t vs1,
                                       size_t vl);
vint8mf8_t __riscv_vnsra_wx_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                       vint16mf4_t vs2, size_t rs1, size_t vl);
vint8mf4_t __riscv_vnsra_wv_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                       vint16mf2_t vs2, vuint8mf4_t vs1,
                                       size_t vl);
vint8mf4_t __riscv_vnsra_wx_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                       vint16mf2_t vs2, size_t rs1, size_t vl);
vint8mf2_t __riscv_vnsra_wv_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                       vint16m1_t vs2, vuint8mf2_t vs1,
                                       size_t vl);
vint8mf2_t __riscv_vnsra_wx_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                       vint16m1_t vs2, size_t rs1, size_t vl);
vint8m1_t __riscv_vnsra_wv_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint16m2_t vs2,
                                     vuint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vnsra_wx_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint16m2_t vs2,
                                     size_t rs1, size_t vl);
vint8m2_t __riscv_vnsra_wv_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint16m4_t vs2,
                                     vuint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vnsra_wx_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint16m4_t vs2,
                                     size_t rs1, size_t vl);
vint8m4_t __riscv_vnsra_wv_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint16m8_t vs2,
                                     vuint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vnsra_wx_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint16m8_t vs2,
                                     size_t rs1, size_t vl);
vint16mf4_t __riscv_vnsra_wv_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                         vint32mf2_t vs2, vuint16mf4_t vs1,
                                         size_t vl);
vint16mf4_t __riscv_vnsra_wx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                         vint32mf2_t vs2, size_t rs1,
                                         size_t vl);
vint16mf2_t __riscv_vnsra_wv_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                         vint32m1_t vs2, vuint16mf2_t vs1,
                                         size_t vl);
vint16mf2_t __riscv_vnsra_wx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                         vint32m1_t vs2, size_t rs1, size_t vl);
vint16m1_t __riscv_vnsra_wv_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                       vint32m2_t vs2, vuint16m1_t vs1,
                                       size_t vl);
vint16m1_t __riscv_vnsra_wx_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                       vint32m2_t vs2, size_t rs1, size_t vl);
vint16m2_t __riscv_vnsra_wv_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                       vint32m4_t vs2, vuint16m2_t vs1,
                                       size_t vl);
vint16m2_t __riscv_vnsra_wx_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                       vint32m4_t vs2, size_t rs1, size_t vl);
vint16m4_t __riscv_vnsra_wv_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                       vint32m8_t vs2, vuint16m4_t vs1,
                                       size_t vl);
vint16m4_t __riscv_vnsra_wx_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                       vint32m8_t vs2, size_t rs1, size_t vl);
vint32mf2_t __riscv_vnsra_wv_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                         vint64m1_t vs2, vuint32mf2_t vs1,
                                         size_t vl);
vint32mf2_t __riscv_vnsra_wx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                         vint64m1_t vs2, size_t rs1, size_t vl);
vint32m1_t __riscv_vnsra_wv_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                       vint64m2_t vs2, vuint32m1_t vs1,
                                       size_t vl);
vint32m1_t __riscv_vnsra_wx_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                       vint64m2_t vs2, size_t rs1, size_t vl);
vint32m2_t __riscv_vnsra_wv_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                       vint64m4_t vs2, vuint32m2_t vs1,
                                       size_t vl);
vint32m2_t __riscv_vnsra_wx_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                       vint64m4_t vs2, size_t rs1, size_t vl);
vint32m4_t __riscv_vnsra_wv_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                       vint64m8_t vs2, vuint32m4_t vs1,
                                       size_t vl);
vint32m4_t __riscv_vnsra_wx_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                       vint64m8_t vs2, size_t rs1, size_t vl);
vuint8mf8_t __riscv_vnsrl_wv_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                        vuint16mf4_t vs2, vuint8mf8_t vs1,
                                        size_t vl);
vuint8mf8_t __riscv_vnsrl_wx_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                        vuint16mf4_t vs2, size_t rs1,
                                        size_t vl);
vuint8mf4_t __riscv_vnsrl_wv_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                        vuint16mf2_t vs2, vuint8mf4_t vs1,
                                        size_t vl);
vuint8mf4_t __riscv_vnsrl_wx_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                        vuint16mf2_t vs2, size_t rs1,
                                        size_t vl);
vuint8mf2_t __riscv_vnsrl_wv_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                        vuint16m1_t vs2, vuint8mf2_t vs1,
                                        size_t vl);
vuint8mf2_t __riscv_vnsrl_wx_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                        vuint16m1_t vs2, size_t rs1, size_t vl);
vuint8m1_t __riscv_vnsrl_wv_u8m1_tumu(vbool8_t vm, vuint8m1_t vd,
                                      vuint16m2_t vs2, vuint8m1_t vs1,
                                      size_t vl);
vuint8m1_t __riscv_vnsrl_wx_u8m1_tumu(vbool8_t vm, vuint8m1_t vd,
                                      vuint16m2_t vs2, size_t rs1, size_t vl);
vuint8m2_t __riscv_vnsrl_wv_u8m2_tumu(vbool4_t vm, vuint8m2_t vd,
                                      vuint16m4_t vs2, vuint8m2_t vs1,
                                      size_t vl);
vuint8m2_t __riscv_vnsrl_wx_u8m2_tumu(vbool4_t vm, vuint8m2_t vd,
                                      vuint16m4_t vs2, size_t rs1, size_t vl);
vuint8m4_t __riscv_vnsrl_wv_u8m4_tumu(vbool2_t vm, vuint8m4_t vd,
                                      vuint16m8_t vs2, vuint8m4_t vs1,
                                      size_t vl);
vuint8m4_t __riscv_vnsrl_wx_u8m4_tumu(vbool2_t vm, vuint8m4_t vd,
                                      vuint16m8_t vs2, size_t rs1, size_t vl);
vuint16mf4_t __riscv_vnsrl_wv_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                          vuint32mf2_t vs2, vuint16mf4_t vs1,
                                          size_t vl);
vuint16mf4_t __riscv_vnsrl_wx_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                          vuint32mf2_t vs2, size_t rs1,
                                          size_t vl);
vuint16mf2_t __riscv_vnsrl_wv_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                          vuint32m1_t vs2, vuint16mf2_t vs1,
                                          size_t vl);
vuint16mf2_t __riscv_vnsrl_wx_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                          vuint32m1_t vs2, size_t rs1,
                                          size_t vl);
vuint16m1_t __riscv_vnsrl_wv_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                        vuint32m2_t vs2, vuint16m1_t vs1,
                                        size_t vl);
vuint16m1_t __riscv_vnsrl_wx_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                        vuint32m2_t vs2, size_t rs1, size_t vl);
vuint16m2_t __riscv_vnsrl_wv_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                        vuint32m4_t vs2, vuint16m2_t vs1,
                                        size_t vl);
vuint16m2_t __riscv_vnsrl_wx_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                        vuint32m4_t vs2, size_t rs1, size_t vl);
vuint16m4_t __riscv_vnsrl_wv_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                        vuint32m8_t vs2, vuint16m4_t vs1,
                                        size_t vl);
vuint16m4_t __riscv_vnsrl_wx_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                        vuint32m8_t vs2, size_t rs1, size_t vl);
vuint32mf2_t __riscv_vnsrl_wv_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                          vuint64m1_t vs2, vuint32mf2_t vs1,
                                          size_t vl);
vuint32mf2_t __riscv_vnsrl_wx_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                          vuint64m1_t vs2, size_t rs1,
                                          size_t vl);
vuint32m1_t __riscv_vnsrl_wv_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                        vuint64m2_t vs2, vuint32m1_t vs1,
                                        size_t vl);
vuint32m1_t __riscv_vnsrl_wx_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                        vuint64m2_t vs2, size_t rs1, size_t vl);
vuint32m2_t __riscv_vnsrl_wv_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                        vuint64m4_t vs2, vuint32m2_t vs1,
                                        size_t vl);
vuint32m2_t __riscv_vnsrl_wx_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                        vuint64m4_t vs2, size_t rs1, size_t vl);
vuint32m4_t __riscv_vnsrl_wv_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                        vuint64m8_t vs2, vuint32m4_t vs1,
                                        size_t vl);
vuint32m4_t __riscv_vnsrl_wx_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                        vuint64m8_t vs2, size_t rs1, size_t vl);
// masked functions
vint8mf8_t __riscv_vnsra_wv_i8mf8_mu(vbool64_t vm, vint8mf8_t vd,
                                     vint16mf4_t vs2, vuint8mf8_t vs1,
                                     size_t vl);
vint8mf8_t __riscv_vnsra_wx_i8mf8_mu(vbool64_t vm, vint8mf8_t vd,
                                     vint16mf4_t vs2, size_t rs1, size_t vl);
vint8mf4_t __riscv_vnsra_wv_i8mf4_mu(vbool32_t vm, vint8mf4_t vd,
                                     vint16mf2_t vs2, vuint8mf4_t vs1,
                                     size_t vl);
vint8mf4_t __riscv_vnsra_wx_i8mf4_mu(vbool32_t vm, vint8mf4_t vd,
                                     vint16mf2_t vs2, size_t rs1, size_t vl);
vint8mf2_t __riscv_vnsra_wv_i8mf2_mu(vbool16_t vm, vint8mf2_t vd,
                                     vint16m1_t vs2, vuint8mf2_t vs1,
                                     size_t vl);
vint8mf2_t __riscv_vnsra_wx_i8mf2_mu(vbool16_t vm, vint8mf2_t vd,
                                     vint16m1_t vs2, size_t rs1, size_t vl);
vint8m1_t __riscv_vnsra_wv_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint16m2_t vs2,
                                   vuint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vnsra_wx_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint16m2_t vs2,
                                   size_t rs1, size_t vl);
vint8m2_t __riscv_vnsra_wv_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint16m4_t vs2,
                                   vuint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vnsra_wx_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint16m4_t vs2,
                                   size_t rs1, size_t vl);
vint8m4_t __riscv_vnsra_wv_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint16m8_t vs2,
                                   vuint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vnsra_wx_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint16m8_t vs2,
                                   size_t rs1, size_t vl);
vint16mf4_t __riscv_vnsra_wv_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                       vint32mf2_t vs2, vuint16mf4_t vs1,
                                       size_t vl);
vint16mf4_t __riscv_vnsra_wx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                       vint32mf2_t vs2, size_t rs1, size_t vl);
vint16mf2_t __riscv_vnsra_wv_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                       vint32m1_t vs2, vuint16mf2_t vs1,
                                       size_t vl);
vint16mf2_t __riscv_vnsra_wx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                       vint32m1_t vs2, size_t rs1, size_t vl);
vint16m1_t __riscv_vnsra_wv_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                     vint32m2_t vs2, vuint16m1_t vs1,
                                     size_t vl);
vint16m1_t __riscv_vnsra_wx_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                     vint32m2_t vs2, size_t rs1, size_t vl);
vint16m2_t __riscv_vnsra_wv_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint32m4_t vs2,
                                     vuint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vnsra_wx_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint32m4_t vs2,
                                     size_t rs1, size_t vl);
vint16m4_t __riscv_vnsra_wv_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint32m8_t vs2,
                                     vuint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vnsra_wx_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint32m8_t vs2,
                                     size_t rs1, size_t vl);
vint32mf2_t __riscv_vnsra_wv_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                       vint64m1_t vs2, vuint32mf2_t vs1,
                                       size_t vl);
vint32mf2_t __riscv_vnsra_wx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                       vint64m1_t vs2, size_t rs1, size_t vl);
vint32m1_t __riscv_vnsra_wv_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                     vint64m2_t vs2, vuint32m1_t vs1,
                                     size_t vl);
vint32m1_t __riscv_vnsra_wx_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                     vint64m2_t vs2, size_t rs1, size_t vl);
vint32m2_t __riscv_vnsra_wv_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                     vint64m4_t vs2, vuint32m2_t vs1,
                                     size_t vl);
vint32m2_t __riscv_vnsra_wx_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                     vint64m4_t vs2, size_t rs1, size_t vl);
vint32m4_t __riscv_vnsra_wv_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint64m8_t vs2,
                                     vuint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vnsra_wx_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint64m8_t vs2,
                                     size_t rs1, size_t vl);
vuint8mf8_t __riscv_vnsrl_wv_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                      vuint16mf4_t vs2, vuint8mf8_t vs1,
                                      size_t vl);
vuint8mf8_t __riscv_vnsrl_wx_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                      vuint16mf4_t vs2, size_t rs1, size_t vl);
vuint8mf4_t __riscv_vnsrl_wv_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                      vuint16mf2_t vs2, vuint8mf4_t vs1,
                                      size_t vl);
vuint8mf4_t __riscv_vnsrl_wx_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                      vuint16mf2_t vs2, size_t rs1, size_t vl);
vuint8mf2_t __riscv_vnsrl_wv_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                      vuint16m1_t vs2, vuint8mf2_t vs1,
                                      size_t vl);
vuint8mf2_t __riscv_vnsrl_wx_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                      vuint16m1_t vs2, size_t rs1, size_t vl);
vuint8m1_t __riscv_vnsrl_wv_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint16m2_t vs2,
                                    vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vnsrl_wx_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint16m2_t vs2,
                                    size_t rs1, size_t vl);
vuint8m2_t __riscv_vnsrl_wv_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint16m4_t vs2,
                                    vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vnsrl_wx_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint16m4_t vs2,
                                    size_t rs1, size_t vl);
vuint8m4_t __riscv_vnsrl_wv_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint16m8_t vs2,
                                    vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vnsrl_wx_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint16m8_t vs2,
                                    size_t rs1, size_t vl);
vuint16mf4_t __riscv_vnsrl_wv_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                        vuint32mf2_t vs2, vuint16mf4_t vs1,
                                        size_t vl);
vuint16mf4_t __riscv_vnsrl_wx_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                        vuint32mf2_t vs2, size_t rs1,
                                        size_t vl);
vuint16mf2_t __riscv_vnsrl_wv_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                        vuint32m1_t vs2, vuint16mf2_t vs1,
                                        size_t vl);
vuint16mf2_t __riscv_vnsrl_wx_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                        vuint32m1_t vs2, size_t rs1, size_t vl);
vuint16m1_t __riscv_vnsrl_wv_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                      vuint32m2_t vs2, vuint16m1_t vs1,
                                      size_t vl);
vuint16m1_t __riscv_vnsrl_wx_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                      vuint32m2_t vs2, size_t rs1, size_t vl);
vuint16m2_t __riscv_vnsrl_wv_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                      vuint32m4_t vs2, vuint16m2_t vs1,
                                      size_t vl);
vuint16m2_t __riscv_vnsrl_wx_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                      vuint32m4_t vs2, size_t rs1, size_t vl);
vuint16m4_t __riscv_vnsrl_wv_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                      vuint32m8_t vs2, vuint16m4_t vs1,
                                      size_t vl);
vuint16m4_t __riscv_vnsrl_wx_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                      vuint32m8_t vs2, size_t rs1, size_t vl);
vuint32mf2_t __riscv_vnsrl_wv_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                        vuint64m1_t vs2, vuint32mf2_t vs1,
                                        size_t vl);
vuint32mf2_t __riscv_vnsrl_wx_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                        vuint64m1_t vs2, size_t rs1, size_t vl);
vuint32m1_t __riscv_vnsrl_wv_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                      vuint64m2_t vs2, vuint32m1_t vs1,
                                      size_t vl);
vuint32m1_t __riscv_vnsrl_wx_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                      vuint64m2_t vs2, size_t rs1, size_t vl);
vuint32m2_t __riscv_vnsrl_wv_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                      vuint64m4_t vs2, vuint32m2_t vs1,
                                      size_t vl);
vuint32m2_t __riscv_vnsrl_wx_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                      vuint64m4_t vs2, size_t rs1, size_t vl);
vuint32m4_t __riscv_vnsrl_wv_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                      vuint64m8_t vs2, vuint32m4_t vs1,
                                      size_t vl);
vuint32m4_t __riscv_vnsrl_wx_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                      vuint64m8_t vs2, size_t rs1, size_t vl);

Vector Integer Narrowing Intrinsics

vint8mf8_t __riscv_vncvt_x_x_w_i8mf8_tu(vint8mf8_t vd, vint16mf4_t vs2,
                                        size_t vl);
vint8mf4_t __riscv_vncvt_x_x_w_i8mf4_tu(vint8mf4_t vd, vint16mf2_t vs2,
                                        size_t vl);
vint8mf2_t __riscv_vncvt_x_x_w_i8mf2_tu(vint8mf2_t vd, vint16m1_t vs2,
                                        size_t vl);
vint8m1_t __riscv_vncvt_x_x_w_i8m1_tu(vint8m1_t vd, vint16m2_t vs2, size_t vl);
vint8m2_t __riscv_vncvt_x_x_w_i8m2_tu(vint8m2_t vd, vint16m4_t vs2, size_t vl);
vint8m4_t __riscv_vncvt_x_x_w_i8m4_tu(vint8m4_t vd, vint16m8_t vs2, size_t vl);
vuint8mf8_t __riscv_vncvt_x_x_w_u8mf8_tu(vuint8mf8_t vd, vuint16mf4_t vs2,
                                         size_t vl);
vuint8mf4_t __riscv_vncvt_x_x_w_u8mf4_tu(vuint8mf4_t vd, vuint16mf2_t vs2,
                                         size_t vl);
vuint8mf2_t __riscv_vncvt_x_x_w_u8mf2_tu(vuint8mf2_t vd, vuint16m1_t vs2,
                                         size_t vl);
vuint8m1_t __riscv_vncvt_x_x_w_u8m1_tu(vuint8m1_t vd, vuint16m2_t vs2,
                                       size_t vl);
vuint8m2_t __riscv_vncvt_x_x_w_u8m2_tu(vuint8m2_t vd, vuint16m4_t vs2,
                                       size_t vl);
vuint8m4_t __riscv_vncvt_x_x_w_u8m4_tu(vuint8m4_t vd, vuint16m8_t vs2,
                                       size_t vl);
vint16mf4_t __riscv_vncvt_x_x_w_i16mf4_tu(vint16mf4_t vd, vint32mf2_t vs2,
                                          size_t vl);
vint16mf2_t __riscv_vncvt_x_x_w_i16mf2_tu(vint16mf2_t vd, vint32m1_t vs2,
                                          size_t vl);
vint16m1_t __riscv_vncvt_x_x_w_i16m1_tu(vint16m1_t vd, vint32m2_t vs2,
                                        size_t vl);
vint16m2_t __riscv_vncvt_x_x_w_i16m2_tu(vint16m2_t vd, vint32m4_t vs2,
                                        size_t vl);
vint16m4_t __riscv_vncvt_x_x_w_i16m4_tu(vint16m4_t vd, vint32m8_t vs2,
                                        size_t vl);
vuint16mf4_t __riscv_vncvt_x_x_w_u16mf4_tu(vuint16mf4_t vd, vuint32mf2_t vs2,
                                           size_t vl);
vuint16mf2_t __riscv_vncvt_x_x_w_u16mf2_tu(vuint16mf2_t vd, vuint32m1_t vs2,
                                           size_t vl);
vuint16m1_t __riscv_vncvt_x_x_w_u16m1_tu(vuint16m1_t vd, vuint32m2_t vs2,
                                         size_t vl);
vuint16m2_t __riscv_vncvt_x_x_w_u16m2_tu(vuint16m2_t vd, vuint32m4_t vs2,
                                         size_t vl);
vuint16m4_t __riscv_vncvt_x_x_w_u16m4_tu(vuint16m4_t vd, vuint32m8_t vs2,
                                         size_t vl);
vint32mf2_t __riscv_vncvt_x_x_w_i32mf2_tu(vint32mf2_t vd, vint64m1_t vs2,
                                          size_t vl);
vint32m1_t __riscv_vncvt_x_x_w_i32m1_tu(vint32m1_t vd, vint64m2_t vs2,
                                        size_t vl);
vint32m2_t __riscv_vncvt_x_x_w_i32m2_tu(vint32m2_t vd, vint64m4_t vs2,
                                        size_t vl);
vint32m4_t __riscv_vncvt_x_x_w_i32m4_tu(vint32m4_t vd, vint64m8_t vs2,
                                        size_t vl);
vuint32mf2_t __riscv_vncvt_x_x_w_u32mf2_tu(vuint32mf2_t vd, vuint64m1_t vs2,
                                           size_t vl);
vuint32m1_t __riscv_vncvt_x_x_w_u32m1_tu(vuint32m1_t vd, vuint64m2_t vs2,
                                         size_t vl);
vuint32m2_t __riscv_vncvt_x_x_w_u32m2_tu(vuint32m2_t vd, vuint64m4_t vs2,
                                         size_t vl);
vuint32m4_t __riscv_vncvt_x_x_w_u32m4_tu(vuint32m4_t vd, vuint64m8_t vs2,
                                         size_t vl);
// masked functions
vint8mf8_t __riscv_vncvt_x_x_w_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                         vint16mf4_t vs2, size_t vl);
vint8mf4_t __riscv_vncvt_x_x_w_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                         vint16mf2_t vs2, size_t vl);
vint8mf2_t __riscv_vncvt_x_x_w_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                         vint16m1_t vs2, size_t vl);
vint8m1_t __riscv_vncvt_x_x_w_i8m1_tum(vbool8_t vm, vint8m1_t vd,
                                       vint16m2_t vs2, size_t vl);
vint8m2_t __riscv_vncvt_x_x_w_i8m2_tum(vbool4_t vm, vint8m2_t vd,
                                       vint16m4_t vs2, size_t vl);
vint8m4_t __riscv_vncvt_x_x_w_i8m4_tum(vbool2_t vm, vint8m4_t vd,
                                       vint16m8_t vs2, size_t vl);
vuint8mf8_t __riscv_vncvt_x_x_w_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                          vuint16mf4_t vs2, size_t vl);
vuint8mf4_t __riscv_vncvt_x_x_w_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                          vuint16mf2_t vs2, size_t vl);
vuint8mf2_t __riscv_vncvt_x_x_w_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                          vuint16m1_t vs2, size_t vl);
vuint8m1_t __riscv_vncvt_x_x_w_u8m1_tum(vbool8_t vm, vuint8m1_t vd,
                                        vuint16m2_t vs2, size_t vl);
vuint8m2_t __riscv_vncvt_x_x_w_u8m2_tum(vbool4_t vm, vuint8m2_t vd,
                                        vuint16m4_t vs2, size_t vl);
vuint8m4_t __riscv_vncvt_x_x_w_u8m4_tum(vbool2_t vm, vuint8m4_t vd,
                                        vuint16m8_t vs2, size_t vl);
vint16mf4_t __riscv_vncvt_x_x_w_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                           vint32mf2_t vs2, size_t vl);
vint16mf2_t __riscv_vncvt_x_x_w_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                           vint32m1_t vs2, size_t vl);
vint16m1_t __riscv_vncvt_x_x_w_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                         vint32m2_t vs2, size_t vl);
vint16m2_t __riscv_vncvt_x_x_w_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                         vint32m4_t vs2, size_t vl);
vint16m4_t __riscv_vncvt_x_x_w_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                         vint32m8_t vs2, size_t vl);
vuint16mf4_t __riscv_vncvt_x_x_w_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                            vuint32mf2_t vs2, size_t vl);
vuint16mf2_t __riscv_vncvt_x_x_w_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                            vuint32m1_t vs2, size_t vl);
vuint16m1_t __riscv_vncvt_x_x_w_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                          vuint32m2_t vs2, size_t vl);
vuint16m2_t __riscv_vncvt_x_x_w_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                          vuint32m4_t vs2, size_t vl);
vuint16m4_t __riscv_vncvt_x_x_w_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                          vuint32m8_t vs2, size_t vl);
vint32mf2_t __riscv_vncvt_x_x_w_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                           vint64m1_t vs2, size_t vl);
vint32m1_t __riscv_vncvt_x_x_w_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                         vint64m2_t vs2, size_t vl);
vint32m2_t __riscv_vncvt_x_x_w_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                         vint64m4_t vs2, size_t vl);
vint32m4_t __riscv_vncvt_x_x_w_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                         vint64m8_t vs2, size_t vl);
vuint32mf2_t __riscv_vncvt_x_x_w_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                            vuint64m1_t vs2, size_t vl);
vuint32m1_t __riscv_vncvt_x_x_w_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                          vuint64m2_t vs2, size_t vl);
vuint32m2_t __riscv_vncvt_x_x_w_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                          vuint64m4_t vs2, size_t vl);
vuint32m4_t __riscv_vncvt_x_x_w_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                          vuint64m8_t vs2, size_t vl);
// masked functions
vint8mf8_t __riscv_vncvt_x_x_w_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                          vint16mf4_t vs2, size_t vl);
vint8mf4_t __riscv_vncvt_x_x_w_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                          vint16mf2_t vs2, size_t vl);
vint8mf2_t __riscv_vncvt_x_x_w_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                          vint16m1_t vs2, size_t vl);
vint8m1_t __riscv_vncvt_x_x_w_i8m1_tumu(vbool8_t vm, vint8m1_t vd,
                                        vint16m2_t vs2, size_t vl);
vint8m2_t __riscv_vncvt_x_x_w_i8m2_tumu(vbool4_t vm, vint8m2_t vd,
                                        vint16m4_t vs2, size_t vl);
vint8m4_t __riscv_vncvt_x_x_w_i8m4_tumu(vbool2_t vm, vint8m4_t vd,
                                        vint16m8_t vs2, size_t vl);
vuint8mf8_t __riscv_vncvt_x_x_w_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                           vuint16mf4_t vs2, size_t vl);
vuint8mf4_t __riscv_vncvt_x_x_w_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                           vuint16mf2_t vs2, size_t vl);
vuint8mf2_t __riscv_vncvt_x_x_w_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                           vuint16m1_t vs2, size_t vl);
vuint8m1_t __riscv_vncvt_x_x_w_u8m1_tumu(vbool8_t vm, vuint8m1_t vd,
                                         vuint16m2_t vs2, size_t vl);
vuint8m2_t __riscv_vncvt_x_x_w_u8m2_tumu(vbool4_t vm, vuint8m2_t vd,
                                         vuint16m4_t vs2, size_t vl);
vuint8m4_t __riscv_vncvt_x_x_w_u8m4_tumu(vbool2_t vm, vuint8m4_t vd,
                                         vuint16m8_t vs2, size_t vl);
vint16mf4_t __riscv_vncvt_x_x_w_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                            vint32mf2_t vs2, size_t vl);
vint16mf2_t __riscv_vncvt_x_x_w_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                            vint32m1_t vs2, size_t vl);
vint16m1_t __riscv_vncvt_x_x_w_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                          vint32m2_t vs2, size_t vl);
vint16m2_t __riscv_vncvt_x_x_w_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                          vint32m4_t vs2, size_t vl);
vint16m4_t __riscv_vncvt_x_x_w_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                          vint32m8_t vs2, size_t vl);
vuint16mf4_t __riscv_vncvt_x_x_w_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                             vuint32mf2_t vs2, size_t vl);
vuint16mf2_t __riscv_vncvt_x_x_w_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                             vuint32m1_t vs2, size_t vl);
vuint16m1_t __riscv_vncvt_x_x_w_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                           vuint32m2_t vs2, size_t vl);
vuint16m2_t __riscv_vncvt_x_x_w_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                           vuint32m4_t vs2, size_t vl);
vuint16m4_t __riscv_vncvt_x_x_w_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                           vuint32m8_t vs2, size_t vl);
vint32mf2_t __riscv_vncvt_x_x_w_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                            vint64m1_t vs2, size_t vl);
vint32m1_t __riscv_vncvt_x_x_w_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                          vint64m2_t vs2, size_t vl);
vint32m2_t __riscv_vncvt_x_x_w_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                          vint64m4_t vs2, size_t vl);
vint32m4_t __riscv_vncvt_x_x_w_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                          vint64m8_t vs2, size_t vl);
vuint32mf2_t __riscv_vncvt_x_x_w_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                             vuint64m1_t vs2, size_t vl);
vuint32m1_t __riscv_vncvt_x_x_w_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                           vuint64m2_t vs2, size_t vl);
vuint32m2_t __riscv_vncvt_x_x_w_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                           vuint64m4_t vs2, size_t vl);
vuint32m4_t __riscv_vncvt_x_x_w_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                           vuint64m8_t vs2, size_t vl);
// masked functions
vint8mf8_t __riscv_vncvt_x_x_w_i8mf8_mu(vbool64_t vm, vint8mf8_t vd,
                                        vint16mf4_t vs2, size_t vl);
vint8mf4_t __riscv_vncvt_x_x_w_i8mf4_mu(vbool32_t vm, vint8mf4_t vd,
                                        vint16mf2_t vs2, size_t vl);
vint8mf2_t __riscv_vncvt_x_x_w_i8mf2_mu(vbool16_t vm, vint8mf2_t vd,
                                        vint16m1_t vs2, size_t vl);
vint8m1_t __riscv_vncvt_x_x_w_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint16m2_t vs2,
                                      size_t vl);
vint8m2_t __riscv_vncvt_x_x_w_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint16m4_t vs2,
                                      size_t vl);
vint8m4_t __riscv_vncvt_x_x_w_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint16m8_t vs2,
                                      size_t vl);
vuint8mf8_t __riscv_vncvt_x_x_w_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                         vuint16mf4_t vs2, size_t vl);
vuint8mf4_t __riscv_vncvt_x_x_w_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                         vuint16mf2_t vs2, size_t vl);
vuint8mf2_t __riscv_vncvt_x_x_w_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                         vuint16m1_t vs2, size_t vl);
vuint8m1_t __riscv_vncvt_x_x_w_u8m1_mu(vbool8_t vm, vuint8m1_t vd,
                                       vuint16m2_t vs2, size_t vl);
vuint8m2_t __riscv_vncvt_x_x_w_u8m2_mu(vbool4_t vm, vuint8m2_t vd,
                                       vuint16m4_t vs2, size_t vl);
vuint8m4_t __riscv_vncvt_x_x_w_u8m4_mu(vbool2_t vm, vuint8m4_t vd,
                                       vuint16m8_t vs2, size_t vl);
vint16mf4_t __riscv_vncvt_x_x_w_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                          vint32mf2_t vs2, size_t vl);
vint16mf2_t __riscv_vncvt_x_x_w_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                          vint32m1_t vs2, size_t vl);
vint16m1_t __riscv_vncvt_x_x_w_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                        vint32m2_t vs2, size_t vl);
vint16m2_t __riscv_vncvt_x_x_w_i16m2_mu(vbool8_t vm, vint16m2_t vd,
                                        vint32m4_t vs2, size_t vl);
vint16m4_t __riscv_vncvt_x_x_w_i16m4_mu(vbool4_t vm, vint16m4_t vd,
                                        vint32m8_t vs2, size_t vl);
vuint16mf4_t __riscv_vncvt_x_x_w_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                           vuint32mf2_t vs2, size_t vl);
vuint16mf2_t __riscv_vncvt_x_x_w_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                           vuint32m1_t vs2, size_t vl);
vuint16m1_t __riscv_vncvt_x_x_w_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                         vuint32m2_t vs2, size_t vl);
vuint16m2_t __riscv_vncvt_x_x_w_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                         vuint32m4_t vs2, size_t vl);
vuint16m4_t __riscv_vncvt_x_x_w_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                         vuint32m8_t vs2, size_t vl);
vint32mf2_t __riscv_vncvt_x_x_w_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                          vint64m1_t vs2, size_t vl);
vint32m1_t __riscv_vncvt_x_x_w_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                        vint64m2_t vs2, size_t vl);
vint32m2_t __riscv_vncvt_x_x_w_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                        vint64m4_t vs2, size_t vl);
vint32m4_t __riscv_vncvt_x_x_w_i32m4_mu(vbool8_t vm, vint32m4_t vd,
                                        vint64m8_t vs2, size_t vl);
vuint32mf2_t __riscv_vncvt_x_x_w_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                           vuint64m1_t vs2, size_t vl);
vuint32m1_t __riscv_vncvt_x_x_w_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                         vuint64m2_t vs2, size_t vl);
vuint32m2_t __riscv_vncvt_x_x_w_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                         vuint64m4_t vs2, size_t vl);
vuint32m4_t __riscv_vncvt_x_x_w_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                         vuint64m8_t vs2, size_t vl);

Vector Integer Compare Intrinsics

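The masked (_mu) compare intrinsics listed below recompute each destination mask bit only where the governing mask vm is active; inactive bits keep their previous value from vd. A minimal sketch, assuming the standard <riscv_vector.h> load intrinsic and an unmasked vmslt compare to build the governing mask:

#include <riscv_vector.h>
#include <stdint.h>
#include <stddef.h>

// Flag elements equal to `key`, but only among elements that are
// negative; bits previously set in `prev` for the other elements are
// preserved (mask-undisturbed, _mu policy).
vbool32_t eq_key_among_negatives(const int32_t *src, vbool32_t prev,
                                 int32_t key, size_t vl) {
  vint32m1_t v = __riscv_vle32_v_i32m1(src, vl);
  // Governing mask: elements strictly less than zero (unmasked compare).
  vbool32_t neg = __riscv_vmslt_vx_i32m1_b32(v, 0, vl);
  // Masked compare from the listing below: only bits where `neg` is set
  // are recomputed; the rest keep their value from `prev`.
  return __riscv_vmseq_vx_i32m1_b32_mu(neg, prev, v, key, vl);
}
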
// masked functions
vbool64_t __riscv_vmseq_vv_i8mf8_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vint8mf8_t vs2, vint8mf8_t vs1,
                                        size_t vl);
vbool64_t __riscv_vmseq_vx_i8mf8_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vint8mf8_t vs2, int8_t rs1, size_t vl);
vbool32_t __riscv_vmseq_vv_i8mf4_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint8mf4_t vs2, vint8mf4_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmseq_vx_i8mf4_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint8mf4_t vs2, int8_t rs1, size_t vl);
vbool16_t __riscv_vmseq_vv_i8mf2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint8mf2_t vs2, vint8mf2_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmseq_vx_i8mf2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint8mf2_t vs2, int8_t rs1, size_t vl);
vbool8_t __riscv_vmseq_vv_i8m1_b8_mu(vbool8_t vm, vbool8_t vd, vint8m1_t vs2,
                                     vint8m1_t vs1, size_t vl);
vbool8_t __riscv_vmseq_vx_i8m1_b8_mu(vbool8_t vm, vbool8_t vd, vint8m1_t vs2,
                                     int8_t rs1, size_t vl);
vbool4_t __riscv_vmseq_vv_i8m2_b4_mu(vbool4_t vm, vbool4_t vd, vint8m2_t vs2,
                                     vint8m2_t vs1, size_t vl);
vbool4_t __riscv_vmseq_vx_i8m2_b4_mu(vbool4_t vm, vbool4_t vd, vint8m2_t vs2,
                                     int8_t rs1, size_t vl);
vbool2_t __riscv_vmseq_vv_i8m4_b2_mu(vbool2_t vm, vbool2_t vd, vint8m4_t vs2,
                                     vint8m4_t vs1, size_t vl);
vbool2_t __riscv_vmseq_vx_i8m4_b2_mu(vbool2_t vm, vbool2_t vd, vint8m4_t vs2,
                                     int8_t rs1, size_t vl);
vbool1_t __riscv_vmseq_vv_i8m8_b1_mu(vbool1_t vm, vbool1_t vd, vint8m8_t vs2,
                                     vint8m8_t vs1, size_t vl);
vbool1_t __riscv_vmseq_vx_i8m8_b1_mu(vbool1_t vm, vbool1_t vd, vint8m8_t vs2,
                                     int8_t rs1, size_t vl);
vbool64_t __riscv_vmseq_vv_i16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vint16mf4_t vs2, vint16mf4_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmseq_vx_i16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vint16mf4_t vs2, int16_t rs1,
                                         size_t vl);
vbool32_t __riscv_vmseq_vv_i16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vint16mf2_t vs2, vint16mf2_t vs1,
                                         size_t vl);
vbool32_t __riscv_vmseq_vx_i16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vint16mf2_t vs2, int16_t rs1,
                                         size_t vl);
vbool16_t __riscv_vmseq_vv_i16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint16m1_t vs2, vint16m1_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmseq_vx_i16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint16m1_t vs2, int16_t rs1, size_t vl);
vbool8_t __riscv_vmseq_vv_i16m2_b8_mu(vbool8_t vm, vbool8_t vd, vint16m2_t vs2,
                                      vint16m2_t vs1, size_t vl);
vbool8_t __riscv_vmseq_vx_i16m2_b8_mu(vbool8_t vm, vbool8_t vd, vint16m2_t vs2,
                                      int16_t rs1, size_t vl);
vbool4_t __riscv_vmseq_vv_i16m4_b4_mu(vbool4_t vm, vbool4_t vd, vint16m4_t vs2,
                                      vint16m4_t vs1, size_t vl);
vbool4_t __riscv_vmseq_vx_i16m4_b4_mu(vbool4_t vm, vbool4_t vd, vint16m4_t vs2,
                                      int16_t rs1, size_t vl);
vbool2_t __riscv_vmseq_vv_i16m8_b2_mu(vbool2_t vm, vbool2_t vd, vint16m8_t vs2,
                                      vint16m8_t vs1, size_t vl);
vbool2_t __riscv_vmseq_vx_i16m8_b2_mu(vbool2_t vm, vbool2_t vd, vint16m8_t vs2,
                                      int16_t rs1, size_t vl);
vbool64_t __riscv_vmseq_vv_i32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vint32mf2_t vs2, vint32mf2_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmseq_vx_i32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vint32mf2_t vs2, int32_t rs1,
                                         size_t vl);
vbool32_t __riscv_vmseq_vv_i32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint32m1_t vs2, vint32m1_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmseq_vx_i32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint32m1_t vs2, int32_t rs1, size_t vl);
vbool16_t __riscv_vmseq_vv_i32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint32m2_t vs2, vint32m2_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmseq_vx_i32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint32m2_t vs2, int32_t rs1, size_t vl);
vbool8_t __riscv_vmseq_vv_i32m4_b8_mu(vbool8_t vm, vbool8_t vd, vint32m4_t vs2,
                                      vint32m4_t vs1, size_t vl);
vbool8_t __riscv_vmseq_vx_i32m4_b8_mu(vbool8_t vm, vbool8_t vd, vint32m4_t vs2,
                                      int32_t rs1, size_t vl);
vbool4_t __riscv_vmseq_vv_i32m8_b4_mu(vbool4_t vm, vbool4_t vd, vint32m8_t vs2,
                                      vint32m8_t vs1, size_t vl);
vbool4_t __riscv_vmseq_vx_i32m8_b4_mu(vbool4_t vm, vbool4_t vd, vint32m8_t vs2,
                                      int32_t rs1, size_t vl);
vbool64_t __riscv_vmseq_vv_i64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vint64m1_t vs2, vint64m1_t vs1,
                                        size_t vl);
vbool64_t __riscv_vmseq_vx_i64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vint64m1_t vs2, int64_t rs1, size_t vl);
vbool32_t __riscv_vmseq_vv_i64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint64m2_t vs2, vint64m2_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmseq_vx_i64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint64m2_t vs2, int64_t rs1, size_t vl);
vbool16_t __riscv_vmseq_vv_i64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint64m4_t vs2, vint64m4_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmseq_vx_i64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint64m4_t vs2, int64_t rs1, size_t vl);
vbool8_t __riscv_vmseq_vv_i64m8_b8_mu(vbool8_t vm, vbool8_t vd, vint64m8_t vs2,
                                      vint64m8_t vs1, size_t vl);
vbool8_t __riscv_vmseq_vx_i64m8_b8_mu(vbool8_t vm, vbool8_t vd, vint64m8_t vs2,
                                      int64_t rs1, size_t vl);
vbool64_t __riscv_vmsne_vv_i8mf8_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vint8mf8_t vs2, vint8mf8_t vs1,
                                        size_t vl);
vbool64_t __riscv_vmsne_vx_i8mf8_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vint8mf8_t vs2, int8_t rs1, size_t vl);
vbool32_t __riscv_vmsne_vv_i8mf4_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint8mf4_t vs2, vint8mf4_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmsne_vx_i8mf4_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint8mf4_t vs2, int8_t rs1, size_t vl);
vbool16_t __riscv_vmsne_vv_i8mf2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint8mf2_t vs2, vint8mf2_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmsne_vx_i8mf2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint8mf2_t vs2, int8_t rs1, size_t vl);
vbool8_t __riscv_vmsne_vv_i8m1_b8_mu(vbool8_t vm, vbool8_t vd, vint8m1_t vs2,
                                     vint8m1_t vs1, size_t vl);
vbool8_t __riscv_vmsne_vx_i8m1_b8_mu(vbool8_t vm, vbool8_t vd, vint8m1_t vs2,
                                     int8_t rs1, size_t vl);
vbool4_t __riscv_vmsne_vv_i8m2_b4_mu(vbool4_t vm, vbool4_t vd, vint8m2_t vs2,
                                     vint8m2_t vs1, size_t vl);
vbool4_t __riscv_vmsne_vx_i8m2_b4_mu(vbool4_t vm, vbool4_t vd, vint8m2_t vs2,
                                     int8_t rs1, size_t vl);
vbool2_t __riscv_vmsne_vv_i8m4_b2_mu(vbool2_t vm, vbool2_t vd, vint8m4_t vs2,
                                     vint8m4_t vs1, size_t vl);
vbool2_t __riscv_vmsne_vx_i8m4_b2_mu(vbool2_t vm, vbool2_t vd, vint8m4_t vs2,
                                     int8_t rs1, size_t vl);
vbool1_t __riscv_vmsne_vv_i8m8_b1_mu(vbool1_t vm, vbool1_t vd, vint8m8_t vs2,
                                     vint8m8_t vs1, size_t vl);
vbool1_t __riscv_vmsne_vx_i8m8_b1_mu(vbool1_t vm, vbool1_t vd, vint8m8_t vs2,
                                     int8_t rs1, size_t vl);
vbool64_t __riscv_vmsne_vv_i16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vint16mf4_t vs2, vint16mf4_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmsne_vx_i16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vint16mf4_t vs2, int16_t rs1,
                                         size_t vl);
vbool32_t __riscv_vmsne_vv_i16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vint16mf2_t vs2, vint16mf2_t vs1,
                                         size_t vl);
vbool32_t __riscv_vmsne_vx_i16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vint16mf2_t vs2, int16_t rs1,
                                         size_t vl);
vbool16_t __riscv_vmsne_vv_i16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint16m1_t vs2, vint16m1_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmsne_vx_i16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint16m1_t vs2, int16_t rs1, size_t vl);
vbool8_t __riscv_vmsne_vv_i16m2_b8_mu(vbool8_t vm, vbool8_t vd, vint16m2_t vs2,
                                      vint16m2_t vs1, size_t vl);
vbool8_t __riscv_vmsne_vx_i16m2_b8_mu(vbool8_t vm, vbool8_t vd, vint16m2_t vs2,
                                      int16_t rs1, size_t vl);
vbool4_t __riscv_vmsne_vv_i16m4_b4_mu(vbool4_t vm, vbool4_t vd, vint16m4_t vs2,
                                      vint16m4_t vs1, size_t vl);
vbool4_t __riscv_vmsne_vx_i16m4_b4_mu(vbool4_t vm, vbool4_t vd, vint16m4_t vs2,
                                      int16_t rs1, size_t vl);
vbool2_t __riscv_vmsne_vv_i16m8_b2_mu(vbool2_t vm, vbool2_t vd, vint16m8_t vs2,
                                      vint16m8_t vs1, size_t vl);
vbool2_t __riscv_vmsne_vx_i16m8_b2_mu(vbool2_t vm, vbool2_t vd, vint16m8_t vs2,
                                      int16_t rs1, size_t vl);
vbool64_t __riscv_vmsne_vv_i32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vint32mf2_t vs2, vint32mf2_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmsne_vx_i32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vint32mf2_t vs2, int32_t rs1,
                                         size_t vl);
vbool32_t __riscv_vmsne_vv_i32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint32m1_t vs2, vint32m1_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmsne_vx_i32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint32m1_t vs2, int32_t rs1, size_t vl);
vbool16_t __riscv_vmsne_vv_i32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint32m2_t vs2, vint32m2_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmsne_vx_i32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint32m2_t vs2, int32_t rs1, size_t vl);
vbool8_t __riscv_vmsne_vv_i32m4_b8_mu(vbool8_t vm, vbool8_t vd, vint32m4_t vs2,
                                      vint32m4_t vs1, size_t vl);
vbool8_t __riscv_vmsne_vx_i32m4_b8_mu(vbool8_t vm, vbool8_t vd, vint32m4_t vs2,
                                      int32_t rs1, size_t vl);
vbool4_t __riscv_vmsne_vv_i32m8_b4_mu(vbool4_t vm, vbool4_t vd, vint32m8_t vs2,
                                      vint32m8_t vs1, size_t vl);
vbool4_t __riscv_vmsne_vx_i32m8_b4_mu(vbool4_t vm, vbool4_t vd, vint32m8_t vs2,
                                      int32_t rs1, size_t vl);
vbool64_t __riscv_vmsne_vv_i64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vint64m1_t vs2, vint64m1_t vs1,
                                        size_t vl);
vbool64_t __riscv_vmsne_vx_i64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vint64m1_t vs2, int64_t rs1, size_t vl);
vbool32_t __riscv_vmsne_vv_i64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint64m2_t vs2, vint64m2_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmsne_vx_i64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint64m2_t vs2, int64_t rs1, size_t vl);
vbool16_t __riscv_vmsne_vv_i64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint64m4_t vs2, vint64m4_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmsne_vx_i64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint64m4_t vs2, int64_t rs1, size_t vl);
vbool8_t __riscv_vmsne_vv_i64m8_b8_mu(vbool8_t vm, vbool8_t vd, vint64m8_t vs2,
                                      vint64m8_t vs1, size_t vl);
vbool8_t __riscv_vmsne_vx_i64m8_b8_mu(vbool8_t vm, vbool8_t vd, vint64m8_t vs2,
                                      int64_t rs1, size_t vl);
vbool64_t __riscv_vmslt_vv_i8mf8_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vint8mf8_t vs2, vint8mf8_t vs1,
                                        size_t vl);
vbool64_t __riscv_vmslt_vx_i8mf8_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vint8mf8_t vs2, int8_t rs1, size_t vl);
vbool32_t __riscv_vmslt_vv_i8mf4_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint8mf4_t vs2, vint8mf4_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmslt_vx_i8mf4_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint8mf4_t vs2, int8_t rs1, size_t vl);
vbool16_t __riscv_vmslt_vv_i8mf2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint8mf2_t vs2, vint8mf2_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmslt_vx_i8mf2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint8mf2_t vs2, int8_t rs1, size_t vl);
vbool8_t __riscv_vmslt_vv_i8m1_b8_mu(vbool8_t vm, vbool8_t vd, vint8m1_t vs2,
                                     vint8m1_t vs1, size_t vl);
vbool8_t __riscv_vmslt_vx_i8m1_b8_mu(vbool8_t vm, vbool8_t vd, vint8m1_t vs2,
                                     int8_t rs1, size_t vl);
vbool4_t __riscv_vmslt_vv_i8m2_b4_mu(vbool4_t vm, vbool4_t vd, vint8m2_t vs2,
                                     vint8m2_t vs1, size_t vl);
vbool4_t __riscv_vmslt_vx_i8m2_b4_mu(vbool4_t vm, vbool4_t vd, vint8m2_t vs2,
                                     int8_t rs1, size_t vl);
vbool2_t __riscv_vmslt_vv_i8m4_b2_mu(vbool2_t vm, vbool2_t vd, vint8m4_t vs2,
                                     vint8m4_t vs1, size_t vl);
vbool2_t __riscv_vmslt_vx_i8m4_b2_mu(vbool2_t vm, vbool2_t vd, vint8m4_t vs2,
                                     int8_t rs1, size_t vl);
vbool1_t __riscv_vmslt_vv_i8m8_b1_mu(vbool1_t vm, vbool1_t vd, vint8m8_t vs2,
                                     vint8m8_t vs1, size_t vl);
vbool1_t __riscv_vmslt_vx_i8m8_b1_mu(vbool1_t vm, vbool1_t vd, vint8m8_t vs2,
                                     int8_t rs1, size_t vl);
vbool64_t __riscv_vmslt_vv_i16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vint16mf4_t vs2, vint16mf4_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmslt_vx_i16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vint16mf4_t vs2, int16_t rs1,
                                         size_t vl);
vbool32_t __riscv_vmslt_vv_i16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vint16mf2_t vs2, vint16mf2_t vs1,
                                         size_t vl);
vbool32_t __riscv_vmslt_vx_i16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vint16mf2_t vs2, int16_t rs1,
                                         size_t vl);
vbool16_t __riscv_vmslt_vv_i16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint16m1_t vs2, vint16m1_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmslt_vx_i16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint16m1_t vs2, int16_t rs1, size_t vl);
vbool8_t __riscv_vmslt_vv_i16m2_b8_mu(vbool8_t vm, vbool8_t vd, vint16m2_t vs2,
                                      vint16m2_t vs1, size_t vl);
vbool8_t __riscv_vmslt_vx_i16m2_b8_mu(vbool8_t vm, vbool8_t vd, vint16m2_t vs2,
                                      int16_t rs1, size_t vl);
vbool4_t __riscv_vmslt_vv_i16m4_b4_mu(vbool4_t vm, vbool4_t vd, vint16m4_t vs2,
                                      vint16m4_t vs1, size_t vl);
vbool4_t __riscv_vmslt_vx_i16m4_b4_mu(vbool4_t vm, vbool4_t vd, vint16m4_t vs2,
                                      int16_t rs1, size_t vl);
vbool2_t __riscv_vmslt_vv_i16m8_b2_mu(vbool2_t vm, vbool2_t vd, vint16m8_t vs2,
                                      vint16m8_t vs1, size_t vl);
vbool2_t __riscv_vmslt_vx_i16m8_b2_mu(vbool2_t vm, vbool2_t vd, vint16m8_t vs2,
                                      int16_t rs1, size_t vl);
vbool64_t __riscv_vmslt_vv_i32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vint32mf2_t vs2, vint32mf2_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmslt_vx_i32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vint32mf2_t vs2, int32_t rs1,
                                         size_t vl);
vbool32_t __riscv_vmslt_vv_i32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint32m1_t vs2, vint32m1_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmslt_vx_i32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint32m1_t vs2, int32_t rs1, size_t vl);
vbool16_t __riscv_vmslt_vv_i32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint32m2_t vs2, vint32m2_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmslt_vx_i32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint32m2_t vs2, int32_t rs1, size_t vl);
vbool8_t __riscv_vmslt_vv_i32m4_b8_mu(vbool8_t vm, vbool8_t vd, vint32m4_t vs2,
                                      vint32m4_t vs1, size_t vl);
vbool8_t __riscv_vmslt_vx_i32m4_b8_mu(vbool8_t vm, vbool8_t vd, vint32m4_t vs2,
                                      int32_t rs1, size_t vl);
vbool4_t __riscv_vmslt_vv_i32m8_b4_mu(vbool4_t vm, vbool4_t vd, vint32m8_t vs2,
                                      vint32m8_t vs1, size_t vl);
vbool4_t __riscv_vmslt_vx_i32m8_b4_mu(vbool4_t vm, vbool4_t vd, vint32m8_t vs2,
                                      int32_t rs1, size_t vl);
vbool64_t __riscv_vmslt_vv_i64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vint64m1_t vs2, vint64m1_t vs1,
                                        size_t vl);
vbool64_t __riscv_vmslt_vx_i64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vint64m1_t vs2, int64_t rs1, size_t vl);
vbool32_t __riscv_vmslt_vv_i64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint64m2_t vs2, vint64m2_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmslt_vx_i64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint64m2_t vs2, int64_t rs1, size_t vl);
vbool16_t __riscv_vmslt_vv_i64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint64m4_t vs2, vint64m4_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmslt_vx_i64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint64m4_t vs2, int64_t rs1, size_t vl);
vbool8_t __riscv_vmslt_vv_i64m8_b8_mu(vbool8_t vm, vbool8_t vd, vint64m8_t vs2,
                                      vint64m8_t vs1, size_t vl);
vbool8_t __riscv_vmslt_vx_i64m8_b8_mu(vbool8_t vm, vbool8_t vd, vint64m8_t vs2,
                                      int64_t rs1, size_t vl);
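
The prototypes above all take a mask vm, an existing mask register vd, and an
element count vl; with the "_mu" (mask-undisturbed) policy, destination bits
whose mask bit in vm is clear keep whatever value vd already held. A minimal,
non-normative sketch, assuming a toolchain with the vector extension enabled
and <riscv_vector.h> available, wrapping one of the vmslt forms listed above:

#include <riscv_vector.h>

// Flag negative 8-bit elements of vs2 where vm is set; bits where vm is
// clear keep their previous value from vd (mask-undisturbed policy).
static vbool8_t flag_negative_mu(vbool8_t vm, vbool8_t vd, vint8m1_t vs2,
                                 size_t vl) {
  return __riscv_vmslt_vx_i8m1_b8_mu(vm, vd, vs2, 0, vl);
}
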
vbool64_t __riscv_vmsle_vv_i8mf8_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vint8mf8_t vs2, vint8mf8_t vs1,
                                        size_t vl);
vbool64_t __riscv_vmsle_vx_i8mf8_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vint8mf8_t vs2, int8_t rs1, size_t vl);
vbool32_t __riscv_vmsle_vv_i8mf4_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint8mf4_t vs2, vint8mf4_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmsle_vx_i8mf4_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint8mf4_t vs2, int8_t rs1, size_t vl);
vbool16_t __riscv_vmsle_vv_i8mf2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint8mf2_t vs2, vint8mf2_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmsle_vx_i8mf2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint8mf2_t vs2, int8_t rs1, size_t vl);
vbool8_t __riscv_vmsle_vv_i8m1_b8_mu(vbool8_t vm, vbool8_t vd, vint8m1_t vs2,
                                     vint8m1_t vs1, size_t vl);
vbool8_t __riscv_vmsle_vx_i8m1_b8_mu(vbool8_t vm, vbool8_t vd, vint8m1_t vs2,
                                     int8_t rs1, size_t vl);
vbool4_t __riscv_vmsle_vv_i8m2_b4_mu(vbool4_t vm, vbool4_t vd, vint8m2_t vs2,
                                     vint8m2_t vs1, size_t vl);
vbool4_t __riscv_vmsle_vx_i8m2_b4_mu(vbool4_t vm, vbool4_t vd, vint8m2_t vs2,
                                     int8_t rs1, size_t vl);
vbool2_t __riscv_vmsle_vv_i8m4_b2_mu(vbool2_t vm, vbool2_t vd, vint8m4_t vs2,
                                     vint8m4_t vs1, size_t vl);
vbool2_t __riscv_vmsle_vx_i8m4_b2_mu(vbool2_t vm, vbool2_t vd, vint8m4_t vs2,
                                     int8_t rs1, size_t vl);
vbool1_t __riscv_vmsle_vv_i8m8_b1_mu(vbool1_t vm, vbool1_t vd, vint8m8_t vs2,
                                     vint8m8_t vs1, size_t vl);
vbool1_t __riscv_vmsle_vx_i8m8_b1_mu(vbool1_t vm, vbool1_t vd, vint8m8_t vs2,
                                     int8_t rs1, size_t vl);
vbool64_t __riscv_vmsle_vv_i16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vint16mf4_t vs2, vint16mf4_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmsle_vx_i16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vint16mf4_t vs2, int16_t rs1,
                                         size_t vl);
vbool32_t __riscv_vmsle_vv_i16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vint16mf2_t vs2, vint16mf2_t vs1,
                                         size_t vl);
vbool32_t __riscv_vmsle_vx_i16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vint16mf2_t vs2, int16_t rs1,
                                         size_t vl);
vbool16_t __riscv_vmsle_vv_i16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint16m1_t vs2, vint16m1_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmsle_vx_i16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint16m1_t vs2, int16_t rs1, size_t vl);
vbool8_t __riscv_vmsle_vv_i16m2_b8_mu(vbool8_t vm, vbool8_t vd, vint16m2_t vs2,
                                      vint16m2_t vs1, size_t vl);
vbool8_t __riscv_vmsle_vx_i16m2_b8_mu(vbool8_t vm, vbool8_t vd, vint16m2_t vs2,
                                      int16_t rs1, size_t vl);
vbool4_t __riscv_vmsle_vv_i16m4_b4_mu(vbool4_t vm, vbool4_t vd, vint16m4_t vs2,
                                      vint16m4_t vs1, size_t vl);
vbool4_t __riscv_vmsle_vx_i16m4_b4_mu(vbool4_t vm, vbool4_t vd, vint16m4_t vs2,
                                      int16_t rs1, size_t vl);
vbool2_t __riscv_vmsle_vv_i16m8_b2_mu(vbool2_t vm, vbool2_t vd, vint16m8_t vs2,
                                      vint16m8_t vs1, size_t vl);
vbool2_t __riscv_vmsle_vx_i16m8_b2_mu(vbool2_t vm, vbool2_t vd, vint16m8_t vs2,
                                      int16_t rs1, size_t vl);
vbool64_t __riscv_vmsle_vv_i32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vint32mf2_t vs2, vint32mf2_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmsle_vx_i32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vint32mf2_t vs2, int32_t rs1,
                                         size_t vl);
vbool32_t __riscv_vmsle_vv_i32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint32m1_t vs2, vint32m1_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmsle_vx_i32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint32m1_t vs2, int32_t rs1, size_t vl);
vbool16_t __riscv_vmsle_vv_i32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint32m2_t vs2, vint32m2_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmsle_vx_i32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint32m2_t vs2, int32_t rs1, size_t vl);
vbool8_t __riscv_vmsle_vv_i32m4_b8_mu(vbool8_t vm, vbool8_t vd, vint32m4_t vs2,
                                      vint32m4_t vs1, size_t vl);
vbool8_t __riscv_vmsle_vx_i32m4_b8_mu(vbool8_t vm, vbool8_t vd, vint32m4_t vs2,
                                      int32_t rs1, size_t vl);
vbool4_t __riscv_vmsle_vv_i32m8_b4_mu(vbool4_t vm, vbool4_t vd, vint32m8_t vs2,
                                      vint32m8_t vs1, size_t vl);
vbool4_t __riscv_vmsle_vx_i32m8_b4_mu(vbool4_t vm, vbool4_t vd, vint32m8_t vs2,
                                      int32_t rs1, size_t vl);
vbool64_t __riscv_vmsle_vv_i64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vint64m1_t vs2, vint64m1_t vs1,
                                        size_t vl);
vbool64_t __riscv_vmsle_vx_i64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vint64m1_t vs2, int64_t rs1, size_t vl);
vbool32_t __riscv_vmsle_vv_i64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint64m2_t vs2, vint64m2_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmsle_vx_i64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint64m2_t vs2, int64_t rs1, size_t vl);
vbool16_t __riscv_vmsle_vv_i64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint64m4_t vs2, vint64m4_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmsle_vx_i64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint64m4_t vs2, int64_t rs1, size_t vl);
vbool8_t __riscv_vmsle_vv_i64m8_b8_mu(vbool8_t vm, vbool8_t vd, vint64m8_t vs2,
                                      vint64m8_t vs1, size_t vl);
vbool8_t __riscv_vmsle_vx_i64m8_b8_mu(vbool8_t vm, vbool8_t vd, vint64m8_t vs2,
                                      int64_t rs1, size_t vl);
vbool64_t __riscv_vmsgt_vv_i8mf8_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vint8mf8_t vs2, vint8mf8_t vs1,
                                        size_t vl);
vbool64_t __riscv_vmsgt_vx_i8mf8_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vint8mf8_t vs2, int8_t rs1, size_t vl);
vbool32_t __riscv_vmsgt_vv_i8mf4_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint8mf4_t vs2, vint8mf4_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmsgt_vx_i8mf4_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint8mf4_t vs2, int8_t rs1, size_t vl);
vbool16_t __riscv_vmsgt_vv_i8mf2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint8mf2_t vs2, vint8mf2_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmsgt_vx_i8mf2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint8mf2_t vs2, int8_t rs1, size_t vl);
vbool8_t __riscv_vmsgt_vv_i8m1_b8_mu(vbool8_t vm, vbool8_t vd, vint8m1_t vs2,
                                     vint8m1_t vs1, size_t vl);
vbool8_t __riscv_vmsgt_vx_i8m1_b8_mu(vbool8_t vm, vbool8_t vd, vint8m1_t vs2,
                                     int8_t rs1, size_t vl);
vbool4_t __riscv_vmsgt_vv_i8m2_b4_mu(vbool4_t vm, vbool4_t vd, vint8m2_t vs2,
                                     vint8m2_t vs1, size_t vl);
vbool4_t __riscv_vmsgt_vx_i8m2_b4_mu(vbool4_t vm, vbool4_t vd, vint8m2_t vs2,
                                     int8_t rs1, size_t vl);
vbool2_t __riscv_vmsgt_vv_i8m4_b2_mu(vbool2_t vm, vbool2_t vd, vint8m4_t vs2,
                                     vint8m4_t vs1, size_t vl);
vbool2_t __riscv_vmsgt_vx_i8m4_b2_mu(vbool2_t vm, vbool2_t vd, vint8m4_t vs2,
                                     int8_t rs1, size_t vl);
vbool1_t __riscv_vmsgt_vv_i8m8_b1_mu(vbool1_t vm, vbool1_t vd, vint8m8_t vs2,
                                     vint8m8_t vs1, size_t vl);
vbool1_t __riscv_vmsgt_vx_i8m8_b1_mu(vbool1_t vm, vbool1_t vd, vint8m8_t vs2,
                                     int8_t rs1, size_t vl);
vbool64_t __riscv_vmsgt_vv_i16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vint16mf4_t vs2, vint16mf4_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmsgt_vx_i16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vint16mf4_t vs2, int16_t rs1,
                                         size_t vl);
vbool32_t __riscv_vmsgt_vv_i16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vint16mf2_t vs2, vint16mf2_t vs1,
                                         size_t vl);
vbool32_t __riscv_vmsgt_vx_i16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vint16mf2_t vs2, int16_t rs1,
                                         size_t vl);
vbool16_t __riscv_vmsgt_vv_i16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint16m1_t vs2, vint16m1_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmsgt_vx_i16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint16m1_t vs2, int16_t rs1, size_t vl);
vbool8_t __riscv_vmsgt_vv_i16m2_b8_mu(vbool8_t vm, vbool8_t vd, vint16m2_t vs2,
                                      vint16m2_t vs1, size_t vl);
vbool8_t __riscv_vmsgt_vx_i16m2_b8_mu(vbool8_t vm, vbool8_t vd, vint16m2_t vs2,
                                      int16_t rs1, size_t vl);
vbool4_t __riscv_vmsgt_vv_i16m4_b4_mu(vbool4_t vm, vbool4_t vd, vint16m4_t vs2,
                                      vint16m4_t vs1, size_t vl);
vbool4_t __riscv_vmsgt_vx_i16m4_b4_mu(vbool4_t vm, vbool4_t vd, vint16m4_t vs2,
                                      int16_t rs1, size_t vl);
vbool2_t __riscv_vmsgt_vv_i16m8_b2_mu(vbool2_t vm, vbool2_t vd, vint16m8_t vs2,
                                      vint16m8_t vs1, size_t vl);
vbool2_t __riscv_vmsgt_vx_i16m8_b2_mu(vbool2_t vm, vbool2_t vd, vint16m8_t vs2,
                                      int16_t rs1, size_t vl);
vbool64_t __riscv_vmsgt_vv_i32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vint32mf2_t vs2, vint32mf2_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmsgt_vx_i32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vint32mf2_t vs2, int32_t rs1,
                                         size_t vl);
vbool32_t __riscv_vmsgt_vv_i32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint32m1_t vs2, vint32m1_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmsgt_vx_i32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint32m1_t vs2, int32_t rs1, size_t vl);
vbool16_t __riscv_vmsgt_vv_i32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint32m2_t vs2, vint32m2_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmsgt_vx_i32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint32m2_t vs2, int32_t rs1, size_t vl);
vbool8_t __riscv_vmsgt_vv_i32m4_b8_mu(vbool8_t vm, vbool8_t vd, vint32m4_t vs2,
                                      vint32m4_t vs1, size_t vl);
vbool8_t __riscv_vmsgt_vx_i32m4_b8_mu(vbool8_t vm, vbool8_t vd, vint32m4_t vs2,
                                      int32_t rs1, size_t vl);
vbool4_t __riscv_vmsgt_vv_i32m8_b4_mu(vbool4_t vm, vbool4_t vd, vint32m8_t vs2,
                                      vint32m8_t vs1, size_t vl);
vbool4_t __riscv_vmsgt_vx_i32m8_b4_mu(vbool4_t vm, vbool4_t vd, vint32m8_t vs2,
                                      int32_t rs1, size_t vl);
vbool64_t __riscv_vmsgt_vv_i64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vint64m1_t vs2, vint64m1_t vs1,
                                        size_t vl);
vbool64_t __riscv_vmsgt_vx_i64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vint64m1_t vs2, int64_t rs1, size_t vl);
vbool32_t __riscv_vmsgt_vv_i64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint64m2_t vs2, vint64m2_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmsgt_vx_i64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint64m2_t vs2, int64_t rs1, size_t vl);
vbool16_t __riscv_vmsgt_vv_i64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint64m4_t vs2, vint64m4_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmsgt_vx_i64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint64m4_t vs2, int64_t rs1, size_t vl);
vbool8_t __riscv_vmsgt_vv_i64m8_b8_mu(vbool8_t vm, vbool8_t vd, vint64m8_t vs2,
                                      vint64m8_t vs1, size_t vl);
vbool8_t __riscv_vmsgt_vx_i64m8_b8_mu(vbool8_t vm, vbool8_t vd, vint64m8_t vs2,
                                      int64_t rs1, size_t vl);
vbool64_t __riscv_vmsge_vv_i8mf8_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vint8mf8_t vs2, vint8mf8_t vs1,
                                        size_t vl);
vbool64_t __riscv_vmsge_vx_i8mf8_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vint8mf8_t vs2, int8_t rs1, size_t vl);
vbool32_t __riscv_vmsge_vv_i8mf4_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint8mf4_t vs2, vint8mf4_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmsge_vx_i8mf4_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint8mf4_t vs2, int8_t rs1, size_t vl);
vbool16_t __riscv_vmsge_vv_i8mf2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint8mf2_t vs2, vint8mf2_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmsge_vx_i8mf2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint8mf2_t vs2, int8_t rs1, size_t vl);
vbool8_t __riscv_vmsge_vv_i8m1_b8_mu(vbool8_t vm, vbool8_t vd, vint8m1_t vs2,
                                     vint8m1_t vs1, size_t vl);
vbool8_t __riscv_vmsge_vx_i8m1_b8_mu(vbool8_t vm, vbool8_t vd, vint8m1_t vs2,
                                     int8_t rs1, size_t vl);
vbool4_t __riscv_vmsge_vv_i8m2_b4_mu(vbool4_t vm, vbool4_t vd, vint8m2_t vs2,
                                     vint8m2_t vs1, size_t vl);
vbool4_t __riscv_vmsge_vx_i8m2_b4_mu(vbool4_t vm, vbool4_t vd, vint8m2_t vs2,
                                     int8_t rs1, size_t vl);
vbool2_t __riscv_vmsge_vv_i8m4_b2_mu(vbool2_t vm, vbool2_t vd, vint8m4_t vs2,
                                     vint8m4_t vs1, size_t vl);
vbool2_t __riscv_vmsge_vx_i8m4_b2_mu(vbool2_t vm, vbool2_t vd, vint8m4_t vs2,
                                     int8_t rs1, size_t vl);
vbool1_t __riscv_vmsge_vv_i8m8_b1_mu(vbool1_t vm, vbool1_t vd, vint8m8_t vs2,
                                     vint8m8_t vs1, size_t vl);
vbool1_t __riscv_vmsge_vx_i8m8_b1_mu(vbool1_t vm, vbool1_t vd, vint8m8_t vs2,
                                     int8_t rs1, size_t vl);
vbool64_t __riscv_vmsge_vv_i16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vint16mf4_t vs2, vint16mf4_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmsge_vx_i16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vint16mf4_t vs2, int16_t rs1,
                                         size_t vl);
vbool32_t __riscv_vmsge_vv_i16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vint16mf2_t vs2, vint16mf2_t vs1,
                                         size_t vl);
vbool32_t __riscv_vmsge_vx_i16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vint16mf2_t vs2, int16_t rs1,
                                         size_t vl);
vbool16_t __riscv_vmsge_vv_i16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint16m1_t vs2, vint16m1_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmsge_vx_i16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint16m1_t vs2, int16_t rs1, size_t vl);
vbool8_t __riscv_vmsge_vv_i16m2_b8_mu(vbool8_t vm, vbool8_t vd, vint16m2_t vs2,
                                      vint16m2_t vs1, size_t vl);
vbool8_t __riscv_vmsge_vx_i16m2_b8_mu(vbool8_t vm, vbool8_t vd, vint16m2_t vs2,
                                      int16_t rs1, size_t vl);
vbool4_t __riscv_vmsge_vv_i16m4_b4_mu(vbool4_t vm, vbool4_t vd, vint16m4_t vs2,
                                      vint16m4_t vs1, size_t vl);
vbool4_t __riscv_vmsge_vx_i16m4_b4_mu(vbool4_t vm, vbool4_t vd, vint16m4_t vs2,
                                      int16_t rs1, size_t vl);
vbool2_t __riscv_vmsge_vv_i16m8_b2_mu(vbool2_t vm, vbool2_t vd, vint16m8_t vs2,
                                      vint16m8_t vs1, size_t vl);
vbool2_t __riscv_vmsge_vx_i16m8_b2_mu(vbool2_t vm, vbool2_t vd, vint16m8_t vs2,
                                      int16_t rs1, size_t vl);
vbool64_t __riscv_vmsge_vv_i32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vint32mf2_t vs2, vint32mf2_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmsge_vx_i32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vint32mf2_t vs2, int32_t rs1,
                                         size_t vl);
vbool32_t __riscv_vmsge_vv_i32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint32m1_t vs2, vint32m1_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmsge_vx_i32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint32m1_t vs2, int32_t rs1, size_t vl);
vbool16_t __riscv_vmsge_vv_i32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint32m2_t vs2, vint32m2_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmsge_vx_i32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint32m2_t vs2, int32_t rs1, size_t vl);
vbool8_t __riscv_vmsge_vv_i32m4_b8_mu(vbool8_t vm, vbool8_t vd, vint32m4_t vs2,
                                      vint32m4_t vs1, size_t vl);
vbool8_t __riscv_vmsge_vx_i32m4_b8_mu(vbool8_t vm, vbool8_t vd, vint32m4_t vs2,
                                      int32_t rs1, size_t vl);
vbool4_t __riscv_vmsge_vv_i32m8_b4_mu(vbool4_t vm, vbool4_t vd, vint32m8_t vs2,
                                      vint32m8_t vs1, size_t vl);
vbool4_t __riscv_vmsge_vx_i32m8_b4_mu(vbool4_t vm, vbool4_t vd, vint32m8_t vs2,
                                      int32_t rs1, size_t vl);
vbool64_t __riscv_vmsge_vv_i64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vint64m1_t vs2, vint64m1_t vs1,
                                        size_t vl);
vbool64_t __riscv_vmsge_vx_i64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vint64m1_t vs2, int64_t rs1, size_t vl);
vbool32_t __riscv_vmsge_vv_i64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint64m2_t vs2, vint64m2_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmsge_vx_i64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vint64m2_t vs2, int64_t rs1, size_t vl);
vbool16_t __riscv_vmsge_vv_i64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint64m4_t vs2, vint64m4_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmsge_vx_i64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vint64m4_t vs2, int64_t rs1, size_t vl);
vbool8_t __riscv_vmsge_vv_i64m8_b8_mu(vbool8_t vm, vbool8_t vd, vint64m8_t vs2,
                                      vint64m8_t vs1, size_t vl);
vbool8_t __riscv_vmsge_vx_i64m8_b8_mu(vbool8_t vm, vbool8_t vd, vint64m8_t vs2,
                                      int64_t rs1, size_t vl);
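
The vmsge forms above complete the signed comparisons; note that the scalar
(vx) greater-or-equal variants are typically synthesized by the compiler
rather than mapping to a single instruction. A minimal sketch, under the same
assumptions as the earlier example, with an illustrative threshold parameter:

#include <riscv_vector.h>
#include <stdint.h>

// Under mask vm, flag 32-bit elements that are >= threshold; unmasked
// destination bits are left as they were in vd.
static vbool32_t flag_at_least_mu(vbool32_t vm, vbool32_t vd, vint32m1_t vs2,
                                  int32_t threshold, size_t vl) {
  return __riscv_vmsge_vx_i32m1_b32_mu(vm, vd, vs2, threshold, vl);
}
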
vbool64_t __riscv_vmseq_vv_u8mf8_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vuint8mf8_t vs2, vuint8mf8_t vs1,
                                        size_t vl);
vbool64_t __riscv_vmseq_vx_u8mf8_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vuint8mf8_t vs2, uint8_t rs1,
                                        size_t vl);
vbool32_t __riscv_vmseq_vv_u8mf4_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vuint8mf4_t vs2, vuint8mf4_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmseq_vx_u8mf4_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vuint8mf4_t vs2, uint8_t rs1,
                                        size_t vl);
vbool16_t __riscv_vmseq_vv_u8mf2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vuint8mf2_t vs2, vuint8mf2_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmseq_vx_u8mf2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vuint8mf2_t vs2, uint8_t rs1,
                                        size_t vl);
vbool8_t __riscv_vmseq_vv_u8m1_b8_mu(vbool8_t vm, vbool8_t vd, vuint8m1_t vs2,
                                     vuint8m1_t vs1, size_t vl);
vbool8_t __riscv_vmseq_vx_u8m1_b8_mu(vbool8_t vm, vbool8_t vd, vuint8m1_t vs2,
                                     uint8_t rs1, size_t vl);
vbool4_t __riscv_vmseq_vv_u8m2_b4_mu(vbool4_t vm, vbool4_t vd, vuint8m2_t vs2,
                                     vuint8m2_t vs1, size_t vl);
vbool4_t __riscv_vmseq_vx_u8m2_b4_mu(vbool4_t vm, vbool4_t vd, vuint8m2_t vs2,
                                     uint8_t rs1, size_t vl);
vbool2_t __riscv_vmseq_vv_u8m4_b2_mu(vbool2_t vm, vbool2_t vd, vuint8m4_t vs2,
                                     vuint8m4_t vs1, size_t vl);
vbool2_t __riscv_vmseq_vx_u8m4_b2_mu(vbool2_t vm, vbool2_t vd, vuint8m4_t vs2,
                                     uint8_t rs1, size_t vl);
vbool1_t __riscv_vmseq_vv_u8m8_b1_mu(vbool1_t vm, vbool1_t vd, vuint8m8_t vs2,
                                     vuint8m8_t vs1, size_t vl);
vbool1_t __riscv_vmseq_vx_u8m8_b1_mu(vbool1_t vm, vbool1_t vd, vuint8m8_t vs2,
                                     uint8_t rs1, size_t vl);
vbool64_t __riscv_vmseq_vv_u16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vuint16mf4_t vs2, vuint16mf4_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmseq_vx_u16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vuint16mf4_t vs2, uint16_t rs1,
                                         size_t vl);
vbool32_t __riscv_vmseq_vv_u16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vuint16mf2_t vs2, vuint16mf2_t vs1,
                                         size_t vl);
vbool32_t __riscv_vmseq_vx_u16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vuint16mf2_t vs2, uint16_t rs1,
                                         size_t vl);
vbool16_t __riscv_vmseq_vv_u16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vuint16m1_t vs2, vuint16m1_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmseq_vx_u16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vuint16m1_t vs2, uint16_t rs1,
                                        size_t vl);
vbool8_t __riscv_vmseq_vv_u16m2_b8_mu(vbool8_t vm, vbool8_t vd, vuint16m2_t vs2,
                                      vuint16m2_t vs1, size_t vl);
vbool8_t __riscv_vmseq_vx_u16m2_b8_mu(vbool8_t vm, vbool8_t vd, vuint16m2_t vs2,
                                      uint16_t rs1, size_t vl);
vbool4_t __riscv_vmseq_vv_u16m4_b4_mu(vbool4_t vm, vbool4_t vd, vuint16m4_t vs2,
                                      vuint16m4_t vs1, size_t vl);
vbool4_t __riscv_vmseq_vx_u16m4_b4_mu(vbool4_t vm, vbool4_t vd, vuint16m4_t vs2,
                                      uint16_t rs1, size_t vl);
vbool2_t __riscv_vmseq_vv_u16m8_b2_mu(vbool2_t vm, vbool2_t vd, vuint16m8_t vs2,
                                      vuint16m8_t vs1, size_t vl);
vbool2_t __riscv_vmseq_vx_u16m8_b2_mu(vbool2_t vm, vbool2_t vd, vuint16m8_t vs2,
                                      uint16_t rs1, size_t vl);
vbool64_t __riscv_vmseq_vv_u32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vuint32mf2_t vs2, vuint32mf2_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmseq_vx_u32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vuint32mf2_t vs2, uint32_t rs1,
                                         size_t vl);
vbool32_t __riscv_vmseq_vv_u32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vuint32m1_t vs2, vuint32m1_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmseq_vx_u32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vuint32m1_t vs2, uint32_t rs1,
                                        size_t vl);
vbool16_t __riscv_vmseq_vv_u32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vuint32m2_t vs2, vuint32m2_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmseq_vx_u32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vuint32m2_t vs2, uint32_t rs1,
                                        size_t vl);
vbool8_t __riscv_vmseq_vv_u32m4_b8_mu(vbool8_t vm, vbool8_t vd, vuint32m4_t vs2,
                                      vuint32m4_t vs1, size_t vl);
vbool8_t __riscv_vmseq_vx_u32m4_b8_mu(vbool8_t vm, vbool8_t vd, vuint32m4_t vs2,
                                      uint32_t rs1, size_t vl);
vbool4_t __riscv_vmseq_vv_u32m8_b4_mu(vbool4_t vm, vbool4_t vd, vuint32m8_t vs2,
                                      vuint32m8_t vs1, size_t vl);
vbool4_t __riscv_vmseq_vx_u32m8_b4_mu(vbool4_t vm, vbool4_t vd, vuint32m8_t vs2,
                                      uint32_t rs1, size_t vl);
vbool64_t __riscv_vmseq_vv_u64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vuint64m1_t vs2, vuint64m1_t vs1,
                                        size_t vl);
vbool64_t __riscv_vmseq_vx_u64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vuint64m1_t vs2, uint64_t rs1,
                                        size_t vl);
vbool32_t __riscv_vmseq_vv_u64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vuint64m2_t vs2, vuint64m2_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmseq_vx_u64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vuint64m2_t vs2, uint64_t rs1,
                                        size_t vl);
vbool16_t __riscv_vmseq_vv_u64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vuint64m4_t vs2, vuint64m4_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmseq_vx_u64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vuint64m4_t vs2, uint64_t rs1,
                                        size_t vl);
vbool8_t __riscv_vmseq_vv_u64m8_b8_mu(vbool8_t vm, vbool8_t vd, vuint64m8_t vs2,
                                      vuint64m8_t vs1, size_t vl);
vbool8_t __riscv_vmseq_vx_u64m8_b8_mu(vbool8_t vm, vbool8_t vd, vuint64m8_t vs2,
                                      uint64_t rs1, size_t vl);
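
The unsigned equality forms can be combined with the mask utility intrinsics
to scan memory. The following strip-mined loop is illustrative only (buffer
and parameter names are assumptions, not part of the listing); it uses
__riscv_vmseq_vx_u8m1_b8_mu from the group above together with
__riscv_vfirst_m_b8 to locate the first matching byte:

#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

// Return the index of the first occurrence of needle in buf, or (size_t)-1
// if it does not occur. An all-ones mask makes the _mu policy a no-op here.
static size_t find_byte(const uint8_t *buf, size_t n, uint8_t needle) {
  for (size_t i = 0; i < n;) {
    size_t vl = __riscv_vsetvl_e8m1(n - i);
    vuint8m1_t v = __riscv_vle8_v_u8m1(buf + i, vl);
    vbool8_t all = __riscv_vmset_m_b8(vl);
    vbool8_t eq = __riscv_vmseq_vx_u8m1_b8_mu(all, all, v, needle, vl);
    long hit = __riscv_vfirst_m_b8(eq, vl);
    if (hit >= 0)
      return i + (size_t)hit;
    i += vl;
  }
  return (size_t)-1;
}
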
vbool64_t __riscv_vmsne_vv_u8mf8_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vuint8mf8_t vs2, vuint8mf8_t vs1,
                                        size_t vl);
vbool64_t __riscv_vmsne_vx_u8mf8_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vuint8mf8_t vs2, uint8_t rs1,
                                        size_t vl);
vbool32_t __riscv_vmsne_vv_u8mf4_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vuint8mf4_t vs2, vuint8mf4_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmsne_vx_u8mf4_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vuint8mf4_t vs2, uint8_t rs1,
                                        size_t vl);
vbool16_t __riscv_vmsne_vv_u8mf2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vuint8mf2_t vs2, vuint8mf2_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmsne_vx_u8mf2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vuint8mf2_t vs2, uint8_t rs1,
                                        size_t vl);
vbool8_t __riscv_vmsne_vv_u8m1_b8_mu(vbool8_t vm, vbool8_t vd, vuint8m1_t vs2,
                                     vuint8m1_t vs1, size_t vl);
vbool8_t __riscv_vmsne_vx_u8m1_b8_mu(vbool8_t vm, vbool8_t vd, vuint8m1_t vs2,
                                     uint8_t rs1, size_t vl);
vbool4_t __riscv_vmsne_vv_u8m2_b4_mu(vbool4_t vm, vbool4_t vd, vuint8m2_t vs2,
                                     vuint8m2_t vs1, size_t vl);
vbool4_t __riscv_vmsne_vx_u8m2_b4_mu(vbool4_t vm, vbool4_t vd, vuint8m2_t vs2,
                                     uint8_t rs1, size_t vl);
vbool2_t __riscv_vmsne_vv_u8m4_b2_mu(vbool2_t vm, vbool2_t vd, vuint8m4_t vs2,
                                     vuint8m4_t vs1, size_t vl);
vbool2_t __riscv_vmsne_vx_u8m4_b2_mu(vbool2_t vm, vbool2_t vd, vuint8m4_t vs2,
                                     uint8_t rs1, size_t vl);
vbool1_t __riscv_vmsne_vv_u8m8_b1_mu(vbool1_t vm, vbool1_t vd, vuint8m8_t vs2,
                                     vuint8m8_t vs1, size_t vl);
vbool1_t __riscv_vmsne_vx_u8m8_b1_mu(vbool1_t vm, vbool1_t vd, vuint8m8_t vs2,
                                     uint8_t rs1, size_t vl);
vbool64_t __riscv_vmsne_vv_u16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vuint16mf4_t vs2, vuint16mf4_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmsne_vx_u16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vuint16mf4_t vs2, uint16_t rs1,
                                         size_t vl);
vbool32_t __riscv_vmsne_vv_u16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vuint16mf2_t vs2, vuint16mf2_t vs1,
                                         size_t vl);
vbool32_t __riscv_vmsne_vx_u16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vuint16mf2_t vs2, uint16_t rs1,
                                         size_t vl);
vbool16_t __riscv_vmsne_vv_u16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vuint16m1_t vs2, vuint16m1_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmsne_vx_u16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vuint16m1_t vs2, uint16_t rs1,
                                        size_t vl);
vbool8_t __riscv_vmsne_vv_u16m2_b8_mu(vbool8_t vm, vbool8_t vd, vuint16m2_t vs2,
                                      vuint16m2_t vs1, size_t vl);
vbool8_t __riscv_vmsne_vx_u16m2_b8_mu(vbool8_t vm, vbool8_t vd, vuint16m2_t vs2,
                                      uint16_t rs1, size_t vl);
vbool4_t __riscv_vmsne_vv_u16m4_b4_mu(vbool4_t vm, vbool4_t vd, vuint16m4_t vs2,
                                      vuint16m4_t vs1, size_t vl);
vbool4_t __riscv_vmsne_vx_u16m4_b4_mu(vbool4_t vm, vbool4_t vd, vuint16m4_t vs2,
                                      uint16_t rs1, size_t vl);
vbool2_t __riscv_vmsne_vv_u16m8_b2_mu(vbool2_t vm, vbool2_t vd, vuint16m8_t vs2,
                                      vuint16m8_t vs1, size_t vl);
vbool2_t __riscv_vmsne_vx_u16m8_b2_mu(vbool2_t vm, vbool2_t vd, vuint16m8_t vs2,
                                      uint16_t rs1, size_t vl);
vbool64_t __riscv_vmsne_vv_u32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vuint32mf2_t vs2, vuint32mf2_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmsne_vx_u32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vuint32mf2_t vs2, uint32_t rs1,
                                         size_t vl);
vbool32_t __riscv_vmsne_vv_u32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vuint32m1_t vs2, vuint32m1_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmsne_vx_u32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vuint32m1_t vs2, uint32_t rs1,
                                        size_t vl);
vbool16_t __riscv_vmsne_vv_u32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vuint32m2_t vs2, vuint32m2_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmsne_vx_u32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vuint32m2_t vs2, uint32_t rs1,
                                        size_t vl);
vbool8_t __riscv_vmsne_vv_u32m4_b8_mu(vbool8_t vm, vbool8_t vd, vuint32m4_t vs2,
                                      vuint32m4_t vs1, size_t vl);
vbool8_t __riscv_vmsne_vx_u32m4_b8_mu(vbool8_t vm, vbool8_t vd, vuint32m4_t vs2,
                                      uint32_t rs1, size_t vl);
vbool4_t __riscv_vmsne_vv_u32m8_b4_mu(vbool4_t vm, vbool4_t vd, vuint32m8_t vs2,
                                      vuint32m8_t vs1, size_t vl);
vbool4_t __riscv_vmsne_vx_u32m8_b4_mu(vbool4_t vm, vbool4_t vd, vuint32m8_t vs2,
                                      uint32_t rs1, size_t vl);
vbool64_t __riscv_vmsne_vv_u64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vuint64m1_t vs2, vuint64m1_t vs1,
                                        size_t vl);
vbool64_t __riscv_vmsne_vx_u64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vuint64m1_t vs2, uint64_t rs1,
                                        size_t vl);
vbool32_t __riscv_vmsne_vv_u64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vuint64m2_t vs2, vuint64m2_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmsne_vx_u64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vuint64m2_t vs2, uint64_t rs1,
                                        size_t vl);
vbool16_t __riscv_vmsne_vv_u64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vuint64m4_t vs2, vuint64m4_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmsne_vx_u64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vuint64m4_t vs2, uint64_t rs1,
                                        size_t vl);
vbool8_t __riscv_vmsne_vv_u64m8_b8_mu(vbool8_t vm, vbool8_t vd, vuint64m8_t vs2,
                                      vuint64m8_t vs1, size_t vl);
vbool8_t __riscv_vmsne_vx_u64m8_b8_mu(vbool8_t vm, vbool8_t vd, vuint64m8_t vs2,
                                      uint64_t rs1, size_t vl);
vbool64_t __riscv_vmsltu_vv_u8mf8_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vuint8mf8_t vs2, vuint8mf8_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmsltu_vx_u8mf8_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vuint8mf8_t vs2, uint8_t rs1,
                                         size_t vl);
vbool32_t __riscv_vmsltu_vv_u8mf4_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vuint8mf4_t vs2, vuint8mf4_t vs1,
                                         size_t vl);
vbool32_t __riscv_vmsltu_vx_u8mf4_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vuint8mf4_t vs2, uint8_t rs1,
                                         size_t vl);
vbool16_t __riscv_vmsltu_vv_u8mf2_b16_mu(vbool16_t vm, vbool16_t vd,
                                         vuint8mf2_t vs2, vuint8mf2_t vs1,
                                         size_t vl);
vbool16_t __riscv_vmsltu_vx_u8mf2_b16_mu(vbool16_t vm, vbool16_t vd,
                                         vuint8mf2_t vs2, uint8_t rs1,
                                         size_t vl);
vbool8_t __riscv_vmsltu_vv_u8m1_b8_mu(vbool8_t vm, vbool8_t vd, vuint8m1_t vs2,
                                      vuint8m1_t vs1, size_t vl);
vbool8_t __riscv_vmsltu_vx_u8m1_b8_mu(vbool8_t vm, vbool8_t vd, vuint8m1_t vs2,
                                      uint8_t rs1, size_t vl);
vbool4_t __riscv_vmsltu_vv_u8m2_b4_mu(vbool4_t vm, vbool4_t vd, vuint8m2_t vs2,
                                      vuint8m2_t vs1, size_t vl);
vbool4_t __riscv_vmsltu_vx_u8m2_b4_mu(vbool4_t vm, vbool4_t vd, vuint8m2_t vs2,
                                      uint8_t rs1, size_t vl);
vbool2_t __riscv_vmsltu_vv_u8m4_b2_mu(vbool2_t vm, vbool2_t vd, vuint8m4_t vs2,
                                      vuint8m4_t vs1, size_t vl);
vbool2_t __riscv_vmsltu_vx_u8m4_b2_mu(vbool2_t vm, vbool2_t vd, vuint8m4_t vs2,
                                      uint8_t rs1, size_t vl);
vbool1_t __riscv_vmsltu_vv_u8m8_b1_mu(vbool1_t vm, vbool1_t vd, vuint8m8_t vs2,
                                      vuint8m8_t vs1, size_t vl);
vbool1_t __riscv_vmsltu_vx_u8m8_b1_mu(vbool1_t vm, vbool1_t vd, vuint8m8_t vs2,
                                      uint8_t rs1, size_t vl);
vbool64_t __riscv_vmsltu_vv_u16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                          vuint16mf4_t vs2, vuint16mf4_t vs1,
                                          size_t vl);
vbool64_t __riscv_vmsltu_vx_u16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                          vuint16mf4_t vs2, uint16_t rs1,
                                          size_t vl);
vbool32_t __riscv_vmsltu_vv_u16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                          vuint16mf2_t vs2, vuint16mf2_t vs1,
                                          size_t vl);
vbool32_t __riscv_vmsltu_vx_u16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                          vuint16mf2_t vs2, uint16_t rs1,
                                          size_t vl);
vbool16_t __riscv_vmsltu_vv_u16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                         vuint16m1_t vs2, vuint16m1_t vs1,
                                         size_t vl);
vbool16_t __riscv_vmsltu_vx_u16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                         vuint16m1_t vs2, uint16_t rs1,
                                         size_t vl);
vbool8_t __riscv_vmsltu_vv_u16m2_b8_mu(vbool8_t vm, vbool8_t vd,
                                       vuint16m2_t vs2, vuint16m2_t vs1,
                                       size_t vl);
vbool8_t __riscv_vmsltu_vx_u16m2_b8_mu(vbool8_t vm, vbool8_t vd,
                                       vuint16m2_t vs2, uint16_t rs1,
                                       size_t vl);
vbool4_t __riscv_vmsltu_vv_u16m4_b4_mu(vbool4_t vm, vbool4_t vd,
                                       vuint16m4_t vs2, vuint16m4_t vs1,
                                       size_t vl);
vbool4_t __riscv_vmsltu_vx_u16m4_b4_mu(vbool4_t vm, vbool4_t vd,
                                       vuint16m4_t vs2, uint16_t rs1,
                                       size_t vl);
vbool2_t __riscv_vmsltu_vv_u16m8_b2_mu(vbool2_t vm, vbool2_t vd,
                                       vuint16m8_t vs2, vuint16m8_t vs1,
                                       size_t vl);
vbool2_t __riscv_vmsltu_vx_u16m8_b2_mu(vbool2_t vm, vbool2_t vd,
                                       vuint16m8_t vs2, uint16_t rs1,
                                       size_t vl);
vbool64_t __riscv_vmsltu_vv_u32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                          vuint32mf2_t vs2, vuint32mf2_t vs1,
                                          size_t vl);
vbool64_t __riscv_vmsltu_vx_u32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                          vuint32mf2_t vs2, uint32_t rs1,
                                          size_t vl);
vbool32_t __riscv_vmsltu_vv_u32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vuint32m1_t vs2, vuint32m1_t vs1,
                                         size_t vl);
vbool32_t __riscv_vmsltu_vx_u32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vuint32m1_t vs2, uint32_t rs1,
                                         size_t vl);
vbool16_t __riscv_vmsltu_vv_u32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                         vuint32m2_t vs2, vuint32m2_t vs1,
                                         size_t vl);
vbool16_t __riscv_vmsltu_vx_u32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                         vuint32m2_t vs2, uint32_t rs1,
                                         size_t vl);
vbool8_t __riscv_vmsltu_vv_u32m4_b8_mu(vbool8_t vm, vbool8_t vd,
                                       vuint32m4_t vs2, vuint32m4_t vs1,
                                       size_t vl);
vbool8_t __riscv_vmsltu_vx_u32m4_b8_mu(vbool8_t vm, vbool8_t vd,
                                       vuint32m4_t vs2, uint32_t rs1,
                                       size_t vl);
vbool4_t __riscv_vmsltu_vv_u32m8_b4_mu(vbool4_t vm, vbool4_t vd,
                                       vuint32m8_t vs2, vuint32m8_t vs1,
                                       size_t vl);
vbool4_t __riscv_vmsltu_vx_u32m8_b4_mu(vbool4_t vm, vbool4_t vd,
                                       vuint32m8_t vs2, uint32_t rs1,
                                       size_t vl);
vbool64_t __riscv_vmsltu_vv_u64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vuint64m1_t vs2, vuint64m1_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmsltu_vx_u64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vuint64m1_t vs2, uint64_t rs1,
                                         size_t vl);
vbool32_t __riscv_vmsltu_vv_u64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vuint64m2_t vs2, vuint64m2_t vs1,
                                         size_t vl);
vbool32_t __riscv_vmsltu_vx_u64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vuint64m2_t vs2, uint64_t rs1,
                                         size_t vl);
vbool16_t __riscv_vmsltu_vv_u64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                         vuint64m4_t vs2, vuint64m4_t vs1,
                                         size_t vl);
vbool16_t __riscv_vmsltu_vx_u64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                         vuint64m4_t vs2, uint64_t rs1,
                                         size_t vl);
vbool8_t __riscv_vmsltu_vv_u64m8_b8_mu(vbool8_t vm, vbool8_t vd,
                                       vuint64m8_t vs2, vuint64m8_t vs1,
                                       size_t vl);
vbool8_t __riscv_vmsltu_vx_u64m8_b8_mu(vbool8_t vm, vbool8_t vd,
                                       vuint64m8_t vs2, uint64_t rs1,
                                       size_t vl);
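
vmsltu, like the other u-suffixed compares, interprets both operands as
unsigned, so 0xFFFFFFFF compares as the largest 32-bit value rather than as
-1. A minimal sketch of one of the scalar forms above, with an illustrative
bound parameter:

#include <riscv_vector.h>
#include <stdint.h>

// Under mask vm, flag 32-bit elements strictly below an unsigned bound;
// bits where vm is clear keep their previous value from vd.
static vbool32_t flag_below_mu(vbool32_t vm, vbool32_t vd, vuint32m1_t vs2,
                               uint32_t bound, size_t vl) {
  return __riscv_vmsltu_vx_u32m1_b32_mu(vm, vd, vs2, bound, vl);
}
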
vbool64_t __riscv_vmsleu_vv_u8mf8_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vuint8mf8_t vs2, vuint8mf8_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmsleu_vx_u8mf8_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vuint8mf8_t vs2, uint8_t rs1,
                                         size_t vl);
vbool32_t __riscv_vmsleu_vv_u8mf4_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vuint8mf4_t vs2, vuint8mf4_t vs1,
                                         size_t vl);
vbool32_t __riscv_vmsleu_vx_u8mf4_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vuint8mf4_t vs2, uint8_t rs1,
                                         size_t vl);
vbool16_t __riscv_vmsleu_vv_u8mf2_b16_mu(vbool16_t vm, vbool16_t vd,
                                         vuint8mf2_t vs2, vuint8mf2_t vs1,
                                         size_t vl);
vbool16_t __riscv_vmsleu_vx_u8mf2_b16_mu(vbool16_t vm, vbool16_t vd,
                                         vuint8mf2_t vs2, uint8_t rs1,
                                         size_t vl);
vbool8_t __riscv_vmsleu_vv_u8m1_b8_mu(vbool8_t vm, vbool8_t vd, vuint8m1_t vs2,
                                      vuint8m1_t vs1, size_t vl);
vbool8_t __riscv_vmsleu_vx_u8m1_b8_mu(vbool8_t vm, vbool8_t vd, vuint8m1_t vs2,
                                      uint8_t rs1, size_t vl);
vbool4_t __riscv_vmsleu_vv_u8m2_b4_mu(vbool4_t vm, vbool4_t vd, vuint8m2_t vs2,
                                      vuint8m2_t vs1, size_t vl);
vbool4_t __riscv_vmsleu_vx_u8m2_b4_mu(vbool4_t vm, vbool4_t vd, vuint8m2_t vs2,
                                      uint8_t rs1, size_t vl);
vbool2_t __riscv_vmsleu_vv_u8m4_b2_mu(vbool2_t vm, vbool2_t vd, vuint8m4_t vs2,
                                      vuint8m4_t vs1, size_t vl);
vbool2_t __riscv_vmsleu_vx_u8m4_b2_mu(vbool2_t vm, vbool2_t vd, vuint8m4_t vs2,
                                      uint8_t rs1, size_t vl);
vbool1_t __riscv_vmsleu_vv_u8m8_b1_mu(vbool1_t vm, vbool1_t vd, vuint8m8_t vs2,
                                      vuint8m8_t vs1, size_t vl);
vbool1_t __riscv_vmsleu_vx_u8m8_b1_mu(vbool1_t vm, vbool1_t vd, vuint8m8_t vs2,
                                      uint8_t rs1, size_t vl);
vbool64_t __riscv_vmsleu_vv_u16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                          vuint16mf4_t vs2, vuint16mf4_t vs1,
                                          size_t vl);
vbool64_t __riscv_vmsleu_vx_u16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                          vuint16mf4_t vs2, uint16_t rs1,
                                          size_t vl);
vbool32_t __riscv_vmsleu_vv_u16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                          vuint16mf2_t vs2, vuint16mf2_t vs1,
                                          size_t vl);
vbool32_t __riscv_vmsleu_vx_u16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                          vuint16mf2_t vs2, uint16_t rs1,
                                          size_t vl);
vbool16_t __riscv_vmsleu_vv_u16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                         vuint16m1_t vs2, vuint16m1_t vs1,
                                         size_t vl);
vbool16_t __riscv_vmsleu_vx_u16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                         vuint16m1_t vs2, uint16_t rs1,
                                         size_t vl);
vbool8_t __riscv_vmsleu_vv_u16m2_b8_mu(vbool8_t vm, vbool8_t vd,
                                       vuint16m2_t vs2, vuint16m2_t vs1,
                                       size_t vl);
vbool8_t __riscv_vmsleu_vx_u16m2_b8_mu(vbool8_t vm, vbool8_t vd,
                                       vuint16m2_t vs2, uint16_t rs1,
                                       size_t vl);
vbool4_t __riscv_vmsleu_vv_u16m4_b4_mu(vbool4_t vm, vbool4_t vd,
                                       vuint16m4_t vs2, vuint16m4_t vs1,
                                       size_t vl);
vbool4_t __riscv_vmsleu_vx_u16m4_b4_mu(vbool4_t vm, vbool4_t vd,
                                       vuint16m4_t vs2, uint16_t rs1,
                                       size_t vl);
vbool2_t __riscv_vmsleu_vv_u16m8_b2_mu(vbool2_t vm, vbool2_t vd,
                                       vuint16m8_t vs2, vuint16m8_t vs1,
                                       size_t vl);
vbool2_t __riscv_vmsleu_vx_u16m8_b2_mu(vbool2_t vm, vbool2_t vd,
                                       vuint16m8_t vs2, uint16_t rs1,
                                       size_t vl);
vbool64_t __riscv_vmsleu_vv_u32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                          vuint32mf2_t vs2, vuint32mf2_t vs1,
                                          size_t vl);
vbool64_t __riscv_vmsleu_vx_u32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                          vuint32mf2_t vs2, uint32_t rs1,
                                          size_t vl);
vbool32_t __riscv_vmsleu_vv_u32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vuint32m1_t vs2, vuint32m1_t vs1,
                                         size_t vl);
vbool32_t __riscv_vmsleu_vx_u32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vuint32m1_t vs2, uint32_t rs1,
                                         size_t vl);
vbool16_t __riscv_vmsleu_vv_u32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                         vuint32m2_t vs2, vuint32m2_t vs1,
                                         size_t vl);
vbool16_t __riscv_vmsleu_vx_u32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                         vuint32m2_t vs2, uint32_t rs1,
                                         size_t vl);
vbool8_t __riscv_vmsleu_vv_u32m4_b8_mu(vbool8_t vm, vbool8_t vd,
                                       vuint32m4_t vs2, vuint32m4_t vs1,
                                       size_t vl);
vbool8_t __riscv_vmsleu_vx_u32m4_b8_mu(vbool8_t vm, vbool8_t vd,
                                       vuint32m4_t vs2, uint32_t rs1,
                                       size_t vl);
vbool4_t __riscv_vmsleu_vv_u32m8_b4_mu(vbool4_t vm, vbool4_t vd,
                                       vuint32m8_t vs2, vuint32m8_t vs1,
                                       size_t vl);
vbool4_t __riscv_vmsleu_vx_u32m8_b4_mu(vbool4_t vm, vbool4_t vd,
                                       vuint32m8_t vs2, uint32_t rs1,
                                       size_t vl);
vbool64_t __riscv_vmsleu_vv_u64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vuint64m1_t vs2, vuint64m1_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmsleu_vx_u64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vuint64m1_t vs2, uint64_t rs1,
                                         size_t vl);
vbool32_t __riscv_vmsleu_vv_u64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vuint64m2_t vs2, vuint64m2_t vs1,
                                         size_t vl);
vbool32_t __riscv_vmsleu_vx_u64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vuint64m2_t vs2, uint64_t rs1,
                                         size_t vl);
vbool16_t __riscv_vmsleu_vv_u64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                         vuint64m4_t vs2, vuint64m4_t vs1,
                                         size_t vl);
vbool16_t __riscv_vmsleu_vx_u64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                         vuint64m4_t vs2, uint64_t rs1,
                                         size_t vl);
vbool8_t __riscv_vmsleu_vv_u64m8_b8_mu(vbool8_t vm, vbool8_t vd,
                                       vuint64m8_t vs2, vuint64m8_t vs1,
                                       size_t vl);
vbool8_t __riscv_vmsleu_vx_u64m8_b8_mu(vbool8_t vm, vbool8_t vd,
                                       vuint64m8_t vs2, uint64_t rs1,
                                       size_t vl);
vbool64_t __riscv_vmsgtu_vv_u8mf8_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vuint8mf8_t vs2, vuint8mf8_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmsgtu_vx_u8mf8_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vuint8mf8_t vs2, uint8_t rs1,
                                         size_t vl);
vbool32_t __riscv_vmsgtu_vv_u8mf4_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vuint8mf4_t vs2, vuint8mf4_t vs1,
                                         size_t vl);
vbool32_t __riscv_vmsgtu_vx_u8mf4_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vuint8mf4_t vs2, uint8_t rs1,
                                         size_t vl);
vbool16_t __riscv_vmsgtu_vv_u8mf2_b16_mu(vbool16_t vm, vbool16_t vd,
                                         vuint8mf2_t vs2, vuint8mf2_t vs1,
                                         size_t vl);
vbool16_t __riscv_vmsgtu_vx_u8mf2_b16_mu(vbool16_t vm, vbool16_t vd,
                                         vuint8mf2_t vs2, uint8_t rs1,
                                         size_t vl);
vbool8_t __riscv_vmsgtu_vv_u8m1_b8_mu(vbool8_t vm, vbool8_t vd, vuint8m1_t vs2,
                                      vuint8m1_t vs1, size_t vl);
vbool8_t __riscv_vmsgtu_vx_u8m1_b8_mu(vbool8_t vm, vbool8_t vd, vuint8m1_t vs2,
                                      uint8_t rs1, size_t vl);
vbool4_t __riscv_vmsgtu_vv_u8m2_b4_mu(vbool4_t vm, vbool4_t vd, vuint8m2_t vs2,
                                      vuint8m2_t vs1, size_t vl);
vbool4_t __riscv_vmsgtu_vx_u8m2_b4_mu(vbool4_t vm, vbool4_t vd, vuint8m2_t vs2,
                                      uint8_t rs1, size_t vl);
vbool2_t __riscv_vmsgtu_vv_u8m4_b2_mu(vbool2_t vm, vbool2_t vd, vuint8m4_t vs2,
                                      vuint8m4_t vs1, size_t vl);
vbool2_t __riscv_vmsgtu_vx_u8m4_b2_mu(vbool2_t vm, vbool2_t vd, vuint8m4_t vs2,
                                      uint8_t rs1, size_t vl);
vbool1_t __riscv_vmsgtu_vv_u8m8_b1_mu(vbool1_t vm, vbool1_t vd, vuint8m8_t vs2,
                                      vuint8m8_t vs1, size_t vl);
vbool1_t __riscv_vmsgtu_vx_u8m8_b1_mu(vbool1_t vm, vbool1_t vd, vuint8m8_t vs2,
                                      uint8_t rs1, size_t vl);
vbool64_t __riscv_vmsgtu_vv_u16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                          vuint16mf4_t vs2, vuint16mf4_t vs1,
                                          size_t vl);
vbool64_t __riscv_vmsgtu_vx_u16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                          vuint16mf4_t vs2, uint16_t rs1,
                                          size_t vl);
vbool32_t __riscv_vmsgtu_vv_u16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                          vuint16mf2_t vs2, vuint16mf2_t vs1,
                                          size_t vl);
vbool32_t __riscv_vmsgtu_vx_u16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                          vuint16mf2_t vs2, uint16_t rs1,
                                          size_t vl);
vbool16_t __riscv_vmsgtu_vv_u16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                         vuint16m1_t vs2, vuint16m1_t vs1,
                                         size_t vl);
vbool16_t __riscv_vmsgtu_vx_u16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                         vuint16m1_t vs2, uint16_t rs1,
                                         size_t vl);
vbool8_t __riscv_vmsgtu_vv_u16m2_b8_mu(vbool8_t vm, vbool8_t vd,
                                       vuint16m2_t vs2, vuint16m2_t vs1,
                                       size_t vl);
vbool8_t __riscv_vmsgtu_vx_u16m2_b8_mu(vbool8_t vm, vbool8_t vd,
                                       vuint16m2_t vs2, uint16_t rs1,
                                       size_t vl);
vbool4_t __riscv_vmsgtu_vv_u16m4_b4_mu(vbool4_t vm, vbool4_t vd,
                                       vuint16m4_t vs2, vuint16m4_t vs1,
                                       size_t vl);
vbool4_t __riscv_vmsgtu_vx_u16m4_b4_mu(vbool4_t vm, vbool4_t vd,
                                       vuint16m4_t vs2, uint16_t rs1,
                                       size_t vl);
vbool2_t __riscv_vmsgtu_vv_u16m8_b2_mu(vbool2_t vm, vbool2_t vd,
                                       vuint16m8_t vs2, vuint16m8_t vs1,
                                       size_t vl);
vbool2_t __riscv_vmsgtu_vx_u16m8_b2_mu(vbool2_t vm, vbool2_t vd,
                                       vuint16m8_t vs2, uint16_t rs1,
                                       size_t vl);
vbool64_t __riscv_vmsgtu_vv_u32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                          vuint32mf2_t vs2, vuint32mf2_t vs1,
                                          size_t vl);
vbool64_t __riscv_vmsgtu_vx_u32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                          vuint32mf2_t vs2, uint32_t rs1,
                                          size_t vl);
vbool32_t __riscv_vmsgtu_vv_u32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vuint32m1_t vs2, vuint32m1_t vs1,
                                         size_t vl);
vbool32_t __riscv_vmsgtu_vx_u32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vuint32m1_t vs2, uint32_t rs1,
                                         size_t vl);
vbool16_t __riscv_vmsgtu_vv_u32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                         vuint32m2_t vs2, vuint32m2_t vs1,
                                         size_t vl);
vbool16_t __riscv_vmsgtu_vx_u32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                         vuint32m2_t vs2, uint32_t rs1,
                                         size_t vl);
vbool8_t __riscv_vmsgtu_vv_u32m4_b8_mu(vbool8_t vm, vbool8_t vd,
                                       vuint32m4_t vs2, vuint32m4_t vs1,
                                       size_t vl);
vbool8_t __riscv_vmsgtu_vx_u32m4_b8_mu(vbool8_t vm, vbool8_t vd,
                                       vuint32m4_t vs2, uint32_t rs1,
                                       size_t vl);
vbool4_t __riscv_vmsgtu_vv_u32m8_b4_mu(vbool4_t vm, vbool4_t vd,
                                       vuint32m8_t vs2, vuint32m8_t vs1,
                                       size_t vl);
vbool4_t __riscv_vmsgtu_vx_u32m8_b4_mu(vbool4_t vm, vbool4_t vd,
                                       vuint32m8_t vs2, uint32_t rs1,
                                       size_t vl);
vbool64_t __riscv_vmsgtu_vv_u64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vuint64m1_t vs2, vuint64m1_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmsgtu_vx_u64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vuint64m1_t vs2, uint64_t rs1,
                                         size_t vl);
vbool32_t __riscv_vmsgtu_vv_u64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vuint64m2_t vs2, vuint64m2_t vs1,
                                         size_t vl);
vbool32_t __riscv_vmsgtu_vx_u64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vuint64m2_t vs2, uint64_t rs1,
                                         size_t vl);
vbool16_t __riscv_vmsgtu_vv_u64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                         vuint64m4_t vs2, vuint64m4_t vs1,
                                         size_t vl);
vbool16_t __riscv_vmsgtu_vx_u64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                         vuint64m4_t vs2, uint64_t rs1,
                                         size_t vl);
vbool8_t __riscv_vmsgtu_vv_u64m8_b8_mu(vbool8_t vm, vbool8_t vd,
                                       vuint64m8_t vs2, vuint64m8_t vs1,
                                       size_t vl);
vbool8_t __riscv_vmsgtu_vx_u64m8_b8_mu(vbool8_t vm, vbool8_t vd,
                                       vuint64m8_t vs2, uint64_t rs1,
                                       size_t vl);
vbool64_t __riscv_vmsgeu_vv_u8mf8_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vuint8mf8_t vs2, vuint8mf8_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmsgeu_vx_u8mf8_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vuint8mf8_t vs2, uint8_t rs1,
                                         size_t vl);
vbool32_t __riscv_vmsgeu_vv_u8mf4_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vuint8mf4_t vs2, vuint8mf4_t vs1,
                                         size_t vl);
vbool32_t __riscv_vmsgeu_vx_u8mf4_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vuint8mf4_t vs2, uint8_t rs1,
                                         size_t vl);
vbool16_t __riscv_vmsgeu_vv_u8mf2_b16_mu(vbool16_t vm, vbool16_t vd,
                                         vuint8mf2_t vs2, vuint8mf2_t vs1,
                                         size_t vl);
vbool16_t __riscv_vmsgeu_vx_u8mf2_b16_mu(vbool16_t vm, vbool16_t vd,
                                         vuint8mf2_t vs2, uint8_t rs1,
                                         size_t vl);
vbool8_t __riscv_vmsgeu_vv_u8m1_b8_mu(vbool8_t vm, vbool8_t vd, vuint8m1_t vs2,
                                      vuint8m1_t vs1, size_t vl);
vbool8_t __riscv_vmsgeu_vx_u8m1_b8_mu(vbool8_t vm, vbool8_t vd, vuint8m1_t vs2,
                                      uint8_t rs1, size_t vl);
vbool4_t __riscv_vmsgeu_vv_u8m2_b4_mu(vbool4_t vm, vbool4_t vd, vuint8m2_t vs2,
                                      vuint8m2_t vs1, size_t vl);
vbool4_t __riscv_vmsgeu_vx_u8m2_b4_mu(vbool4_t vm, vbool4_t vd, vuint8m2_t vs2,
                                      uint8_t rs1, size_t vl);
vbool2_t __riscv_vmsgeu_vv_u8m4_b2_mu(vbool2_t vm, vbool2_t vd, vuint8m4_t vs2,
                                      vuint8m4_t vs1, size_t vl);
vbool2_t __riscv_vmsgeu_vx_u8m4_b2_mu(vbool2_t vm, vbool2_t vd, vuint8m4_t vs2,
                                      uint8_t rs1, size_t vl);
vbool1_t __riscv_vmsgeu_vv_u8m8_b1_mu(vbool1_t vm, vbool1_t vd, vuint8m8_t vs2,
                                      vuint8m8_t vs1, size_t vl);
vbool1_t __riscv_vmsgeu_vx_u8m8_b1_mu(vbool1_t vm, vbool1_t vd, vuint8m8_t vs2,
                                      uint8_t rs1, size_t vl);
vbool64_t __riscv_vmsgeu_vv_u16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                          vuint16mf4_t vs2, vuint16mf4_t vs1,
                                          size_t vl);
vbool64_t __riscv_vmsgeu_vx_u16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                          vuint16mf4_t vs2, uint16_t rs1,
                                          size_t vl);
vbool32_t __riscv_vmsgeu_vv_u16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                          vuint16mf2_t vs2, vuint16mf2_t vs1,
                                          size_t vl);
vbool32_t __riscv_vmsgeu_vx_u16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                          vuint16mf2_t vs2, uint16_t rs1,
                                          size_t vl);
vbool16_t __riscv_vmsgeu_vv_u16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                         vuint16m1_t vs2, vuint16m1_t vs1,
                                         size_t vl);
vbool16_t __riscv_vmsgeu_vx_u16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                         vuint16m1_t vs2, uint16_t rs1,
                                         size_t vl);
vbool8_t __riscv_vmsgeu_vv_u16m2_b8_mu(vbool8_t vm, vbool8_t vd,
                                       vuint16m2_t vs2, vuint16m2_t vs1,
                                       size_t vl);
vbool8_t __riscv_vmsgeu_vx_u16m2_b8_mu(vbool8_t vm, vbool8_t vd,
                                       vuint16m2_t vs2, uint16_t rs1,
                                       size_t vl);
vbool4_t __riscv_vmsgeu_vv_u16m4_b4_mu(vbool4_t vm, vbool4_t vd,
                                       vuint16m4_t vs2, vuint16m4_t vs1,
                                       size_t vl);
vbool4_t __riscv_vmsgeu_vx_u16m4_b4_mu(vbool4_t vm, vbool4_t vd,
                                       vuint16m4_t vs2, uint16_t rs1,
                                       size_t vl);
vbool2_t __riscv_vmsgeu_vv_u16m8_b2_mu(vbool2_t vm, vbool2_t vd,
                                       vuint16m8_t vs2, vuint16m8_t vs1,
                                       size_t vl);
vbool2_t __riscv_vmsgeu_vx_u16m8_b2_mu(vbool2_t vm, vbool2_t vd,
                                       vuint16m8_t vs2, uint16_t rs1,
                                       size_t vl);
vbool64_t __riscv_vmsgeu_vv_u32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                          vuint32mf2_t vs2, vuint32mf2_t vs1,
                                          size_t vl);
vbool64_t __riscv_vmsgeu_vx_u32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                          vuint32mf2_t vs2, uint32_t rs1,
                                          size_t vl);
vbool32_t __riscv_vmsgeu_vv_u32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vuint32m1_t vs2, vuint32m1_t vs1,
                                         size_t vl);
vbool32_t __riscv_vmsgeu_vx_u32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vuint32m1_t vs2, uint32_t rs1,
                                         size_t vl);
vbool16_t __riscv_vmsgeu_vv_u32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                         vuint32m2_t vs2, vuint32m2_t vs1,
                                         size_t vl);
vbool16_t __riscv_vmsgeu_vx_u32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                         vuint32m2_t vs2, uint32_t rs1,
                                         size_t vl);
vbool8_t __riscv_vmsgeu_vv_u32m4_b8_mu(vbool8_t vm, vbool8_t vd,
                                       vuint32m4_t vs2, vuint32m4_t vs1,
                                       size_t vl);
vbool8_t __riscv_vmsgeu_vx_u32m4_b8_mu(vbool8_t vm, vbool8_t vd,
                                       vuint32m4_t vs2, uint32_t rs1,
                                       size_t vl);
vbool4_t __riscv_vmsgeu_vv_u32m8_b4_mu(vbool4_t vm, vbool4_t vd,
                                       vuint32m8_t vs2, vuint32m8_t vs1,
                                       size_t vl);
vbool4_t __riscv_vmsgeu_vx_u32m8_b4_mu(vbool4_t vm, vbool4_t vd,
                                       vuint32m8_t vs2, uint32_t rs1,
                                       size_t vl);
vbool64_t __riscv_vmsgeu_vv_u64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vuint64m1_t vs2, vuint64m1_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmsgeu_vx_u64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vuint64m1_t vs2, uint64_t rs1,
                                         size_t vl);
vbool32_t __riscv_vmsgeu_vv_u64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vuint64m2_t vs2, vuint64m2_t vs1,
                                         size_t vl);
vbool32_t __riscv_vmsgeu_vx_u64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vuint64m2_t vs2, uint64_t rs1,
                                         size_t vl);
vbool16_t __riscv_vmsgeu_vv_u64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                         vuint64m4_t vs2, vuint64m4_t vs1,
                                         size_t vl);
vbool16_t __riscv_vmsgeu_vx_u64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                         vuint64m4_t vs2, uint64_t rs1,
                                         size_t vl);
vbool8_t __riscv_vmsgeu_vv_u64m8_b8_mu(vbool8_t vm, vbool8_t vd,
                                       vuint64m8_t vs2, vuint64m8_t vs1,
                                       size_t vl);
vbool8_t __riscv_vmsgeu_vx_u64m8_b8_mu(vbool8_t vm, vbool8_t vd,
                                       vuint64m8_t vs2, uint64_t rs1,
                                       size_t vl);

Vector Integer Min/Max Intrinsics

vint8mf8_t __riscv_vmin_vv_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2,
                                    vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vmin_vx_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2, int8_t rs1,
                                    size_t vl);
vint8mf4_t __riscv_vmin_vv_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2,
                                    vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vmin_vx_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2, int8_t rs1,
                                    size_t vl);
vint8mf2_t __riscv_vmin_vv_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2,
                                    vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vmin_vx_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2, int8_t rs1,
                                    size_t vl);
vint8m1_t __riscv_vmin_vv_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, vint8m1_t vs1,
                                  size_t vl);
vint8m1_t __riscv_vmin_vx_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, int8_t rs1,
                                  size_t vl);
vint8m2_t __riscv_vmin_vv_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, vint8m2_t vs1,
                                  size_t vl);
vint8m2_t __riscv_vmin_vx_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, int8_t rs1,
                                  size_t vl);
vint8m4_t __riscv_vmin_vv_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, vint8m4_t vs1,
                                  size_t vl);
vint8m4_t __riscv_vmin_vx_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, int8_t rs1,
                                  size_t vl);
vint8m8_t __riscv_vmin_vv_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, vint8m8_t vs1,
                                  size_t vl);
vint8m8_t __riscv_vmin_vx_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, int8_t rs1,
                                  size_t vl);
vint16mf4_t __riscv_vmin_vv_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                      vint16mf4_t vs1, size_t vl);
vint16mf4_t __riscv_vmin_vx_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                      int16_t rs1, size_t vl);
vint16mf2_t __riscv_vmin_vv_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                      vint16mf2_t vs1, size_t vl);
vint16mf2_t __riscv_vmin_vx_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                      int16_t rs1, size_t vl);
vint16m1_t __riscv_vmin_vv_i16m1_tu(vint16m1_t vd, vint16m1_t vs2,
                                    vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vmin_vx_i16m1_tu(vint16m1_t vd, vint16m1_t vs2, int16_t rs1,
                                    size_t vl);
vint16m2_t __riscv_vmin_vv_i16m2_tu(vint16m2_t vd, vint16m2_t vs2,
                                    vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vmin_vx_i16m2_tu(vint16m2_t vd, vint16m2_t vs2, int16_t rs1,
                                    size_t vl);
vint16m4_t __riscv_vmin_vv_i16m4_tu(vint16m4_t vd, vint16m4_t vs2,
                                    vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vmin_vx_i16m4_tu(vint16m4_t vd, vint16m4_t vs2, int16_t rs1,
                                    size_t vl);
vint16m8_t __riscv_vmin_vv_i16m8_tu(vint16m8_t vd, vint16m8_t vs2,
                                    vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vmin_vx_i16m8_tu(vint16m8_t vd, vint16m8_t vs2, int16_t rs1,
                                    size_t vl);
vint32mf2_t __riscv_vmin_vv_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                      vint32mf2_t vs1, size_t vl);
vint32mf2_t __riscv_vmin_vx_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                      int32_t rs1, size_t vl);
vint32m1_t __riscv_vmin_vv_i32m1_tu(vint32m1_t vd, vint32m1_t vs2,
                                    vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vmin_vx_i32m1_tu(vint32m1_t vd, vint32m1_t vs2, int32_t rs1,
                                    size_t vl);
vint32m2_t __riscv_vmin_vv_i32m2_tu(vint32m2_t vd, vint32m2_t vs2,
                                    vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vmin_vx_i32m2_tu(vint32m2_t vd, vint32m2_t vs2, int32_t rs1,
                                    size_t vl);
vint32m4_t __riscv_vmin_vv_i32m4_tu(vint32m4_t vd, vint32m4_t vs2,
                                    vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vmin_vx_i32m4_tu(vint32m4_t vd, vint32m4_t vs2, int32_t rs1,
                                    size_t vl);
vint32m8_t __riscv_vmin_vv_i32m8_tu(vint32m8_t vd, vint32m8_t vs2,
                                    vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vmin_vx_i32m8_tu(vint32m8_t vd, vint32m8_t vs2, int32_t rs1,
                                    size_t vl);
vint64m1_t __riscv_vmin_vv_i64m1_tu(vint64m1_t vd, vint64m1_t vs2,
                                    vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vmin_vx_i64m1_tu(vint64m1_t vd, vint64m1_t vs2, int64_t rs1,
                                    size_t vl);
vint64m2_t __riscv_vmin_vv_i64m2_tu(vint64m2_t vd, vint64m2_t vs2,
                                    vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vmin_vx_i64m2_tu(vint64m2_t vd, vint64m2_t vs2, int64_t rs1,
                                    size_t vl);
vint64m4_t __riscv_vmin_vv_i64m4_tu(vint64m4_t vd, vint64m4_t vs2,
                                    vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vmin_vx_i64m4_tu(vint64m4_t vd, vint64m4_t vs2, int64_t rs1,
                                    size_t vl);
vint64m8_t __riscv_vmin_vv_i64m8_tu(vint64m8_t vd, vint64m8_t vs2,
                                    vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vmin_vx_i64m8_tu(vint64m8_t vd, vint64m8_t vs2, int64_t rs1,
                                    size_t vl);
vint8mf8_t __riscv_vmax_vv_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2,
                                    vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vmax_vx_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2, int8_t rs1,
                                    size_t vl);
vint8mf4_t __riscv_vmax_vv_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2,
                                    vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vmax_vx_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2, int8_t rs1,
                                    size_t vl);
vint8mf2_t __riscv_vmax_vv_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2,
                                    vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vmax_vx_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2, int8_t rs1,
                                    size_t vl);
vint8m1_t __riscv_vmax_vv_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, vint8m1_t vs1,
                                  size_t vl);
vint8m1_t __riscv_vmax_vx_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, int8_t rs1,
                                  size_t vl);
vint8m2_t __riscv_vmax_vv_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, vint8m2_t vs1,
                                  size_t vl);
vint8m2_t __riscv_vmax_vx_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, int8_t rs1,
                                  size_t vl);
vint8m4_t __riscv_vmax_vv_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, vint8m4_t vs1,
                                  size_t vl);
vint8m4_t __riscv_vmax_vx_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, int8_t rs1,
                                  size_t vl);
vint8m8_t __riscv_vmax_vv_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, vint8m8_t vs1,
                                  size_t vl);
vint8m8_t __riscv_vmax_vx_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, int8_t rs1,
                                  size_t vl);
vint16mf4_t __riscv_vmax_vv_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                      vint16mf4_t vs1, size_t vl);
vint16mf4_t __riscv_vmax_vx_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                      int16_t rs1, size_t vl);
vint16mf2_t __riscv_vmax_vv_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                      vint16mf2_t vs1, size_t vl);
vint16mf2_t __riscv_vmax_vx_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                      int16_t rs1, size_t vl);
vint16m1_t __riscv_vmax_vv_i16m1_tu(vint16m1_t vd, vint16m1_t vs2,
                                    vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vmax_vx_i16m1_tu(vint16m1_t vd, vint16m1_t vs2, int16_t rs1,
                                    size_t vl);
vint16m2_t __riscv_vmax_vv_i16m2_tu(vint16m2_t vd, vint16m2_t vs2,
                                    vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vmax_vx_i16m2_tu(vint16m2_t vd, vint16m2_t vs2, int16_t rs1,
                                    size_t vl);
vint16m4_t __riscv_vmax_vv_i16m4_tu(vint16m4_t vd, vint16m4_t vs2,
                                    vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vmax_vx_i16m4_tu(vint16m4_t vd, vint16m4_t vs2, int16_t rs1,
                                    size_t vl);
vint16m8_t __riscv_vmax_vv_i16m8_tu(vint16m8_t vd, vint16m8_t vs2,
                                    vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vmax_vx_i16m8_tu(vint16m8_t vd, vint16m8_t vs2, int16_t rs1,
                                    size_t vl);
vint32mf2_t __riscv_vmax_vv_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                      vint32mf2_t vs1, size_t vl);
vint32mf2_t __riscv_vmax_vx_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                      int32_t rs1, size_t vl);
vint32m1_t __riscv_vmax_vv_i32m1_tu(vint32m1_t vd, vint32m1_t vs2,
                                    vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vmax_vx_i32m1_tu(vint32m1_t vd, vint32m1_t vs2, int32_t rs1,
                                    size_t vl);
vint32m2_t __riscv_vmax_vv_i32m2_tu(vint32m2_t vd, vint32m2_t vs2,
                                    vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vmax_vx_i32m2_tu(vint32m2_t vd, vint32m2_t vs2, int32_t rs1,
                                    size_t vl);
vint32m4_t __riscv_vmax_vv_i32m4_tu(vint32m4_t vd, vint32m4_t vs2,
                                    vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vmax_vx_i32m4_tu(vint32m4_t vd, vint32m4_t vs2, int32_t rs1,
                                    size_t vl);
vint32m8_t __riscv_vmax_vv_i32m8_tu(vint32m8_t vd, vint32m8_t vs2,
                                    vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vmax_vx_i32m8_tu(vint32m8_t vd, vint32m8_t vs2, int32_t rs1,
                                    size_t vl);
vint64m1_t __riscv_vmax_vv_i64m1_tu(vint64m1_t vd, vint64m1_t vs2,
                                    vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vmax_vx_i64m1_tu(vint64m1_t vd, vint64m1_t vs2, int64_t rs1,
                                    size_t vl);
vint64m2_t __riscv_vmax_vv_i64m2_tu(vint64m2_t vd, vint64m2_t vs2,
                                    vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vmax_vx_i64m2_tu(vint64m2_t vd, vint64m2_t vs2, int64_t rs1,
                                    size_t vl);
vint64m4_t __riscv_vmax_vv_i64m4_tu(vint64m4_t vd, vint64m4_t vs2,
                                    vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vmax_vx_i64m4_tu(vint64m4_t vd, vint64m4_t vs2, int64_t rs1,
                                    size_t vl);
vint64m8_t __riscv_vmax_vv_i64m8_tu(vint64m8_t vd, vint64m8_t vs2,
                                    vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vmax_vx_i64m8_tu(vint64m8_t vd, vint64m8_t vs2, int64_t rs1,
                                    size_t vl);
vuint8mf8_t __riscv_vminu_vv_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                      vuint8mf8_t vs1, size_t vl);
vuint8mf8_t __riscv_vminu_vx_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                      uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vminu_vv_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                      vuint8mf4_t vs1, size_t vl);
vuint8mf4_t __riscv_vminu_vx_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                      uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vminu_vv_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                      vuint8mf2_t vs1, size_t vl);
vuint8mf2_t __riscv_vminu_vx_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                      uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vminu_vv_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2,
                                    vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vminu_vx_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2, uint8_t rs1,
                                    size_t vl);
vuint8m2_t __riscv_vminu_vv_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2,
                                    vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vminu_vx_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2, uint8_t rs1,
                                    size_t vl);
vuint8m4_t __riscv_vminu_vv_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2,
                                    vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vminu_vx_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2, uint8_t rs1,
                                    size_t vl);
vuint8m8_t __riscv_vminu_vv_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2,
                                    vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vminu_vx_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2, uint8_t rs1,
                                    size_t vl);
vuint16mf4_t __riscv_vminu_vv_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                        vuint16mf4_t vs1, size_t vl);
vuint16mf4_t __riscv_vminu_vx_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                        uint16_t rs1, size_t vl);
vuint16mf2_t __riscv_vminu_vv_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                        vuint16mf2_t vs1, size_t vl);
vuint16mf2_t __riscv_vminu_vx_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                        uint16_t rs1, size_t vl);
vuint16m1_t __riscv_vminu_vv_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                      vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vminu_vx_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                      uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vminu_vv_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                      vuint16m2_t vs1, size_t vl);
vuint16m2_t __riscv_vminu_vx_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                      uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vminu_vv_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                      vuint16m4_t vs1, size_t vl);
vuint16m4_t __riscv_vminu_vx_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                      uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vminu_vv_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                      vuint16m8_t vs1, size_t vl);
vuint16m8_t __riscv_vminu_vx_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                      uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vminu_vv_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                        vuint32mf2_t vs1, size_t vl);
vuint32mf2_t __riscv_vminu_vx_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                        uint32_t rs1, size_t vl);
vuint32m1_t __riscv_vminu_vv_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                      vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vminu_vx_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                      uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vminu_vv_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                      vuint32m2_t vs1, size_t vl);
vuint32m2_t __riscv_vminu_vx_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                      uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vminu_vv_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                      vuint32m4_t vs1, size_t vl);
vuint32m4_t __riscv_vminu_vx_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                      uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vminu_vv_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                      vuint32m8_t vs1, size_t vl);
vuint32m8_t __riscv_vminu_vx_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                      uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vminu_vv_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                      vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vminu_vx_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                      uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vminu_vv_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                      vuint64m2_t vs1, size_t vl);
vuint64m2_t __riscv_vminu_vx_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                      uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vminu_vv_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                      vuint64m4_t vs1, size_t vl);
vuint64m4_t __riscv_vminu_vx_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                      uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vminu_vv_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                      vuint64m8_t vs1, size_t vl);
vuint64m8_t __riscv_vminu_vx_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                      uint64_t rs1, size_t vl);
vuint8mf8_t __riscv_vmaxu_vv_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                      vuint8mf8_t vs1, size_t vl);
vuint8mf8_t __riscv_vmaxu_vx_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                      uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vmaxu_vv_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                      vuint8mf4_t vs1, size_t vl);
vuint8mf4_t __riscv_vmaxu_vx_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                      uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vmaxu_vv_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                      vuint8mf2_t vs1, size_t vl);
vuint8mf2_t __riscv_vmaxu_vx_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                      uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vmaxu_vv_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2,
                                    vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vmaxu_vx_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2, uint8_t rs1,
                                    size_t vl);
vuint8m2_t __riscv_vmaxu_vv_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2,
                                    vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vmaxu_vx_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2, uint8_t rs1,
                                    size_t vl);
vuint8m4_t __riscv_vmaxu_vv_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2,
                                    vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vmaxu_vx_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2, uint8_t rs1,
                                    size_t vl);
vuint8m8_t __riscv_vmaxu_vv_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2,
                                    vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vmaxu_vx_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2, uint8_t rs1,
                                    size_t vl);
vuint16mf4_t __riscv_vmaxu_vv_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                        vuint16mf4_t vs1, size_t vl);
vuint16mf4_t __riscv_vmaxu_vx_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                        uint16_t rs1, size_t vl);
vuint16mf2_t __riscv_vmaxu_vv_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                        vuint16mf2_t vs1, size_t vl);
vuint16mf2_t __riscv_vmaxu_vx_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                        uint16_t rs1, size_t vl);
vuint16m1_t __riscv_vmaxu_vv_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                      vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vmaxu_vx_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                      uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vmaxu_vv_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                      vuint16m2_t vs1, size_t vl);
vuint16m2_t __riscv_vmaxu_vx_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                      uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vmaxu_vv_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                      vuint16m4_t vs1, size_t vl);
vuint16m4_t __riscv_vmaxu_vx_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                      uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vmaxu_vv_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                      vuint16m8_t vs1, size_t vl);
vuint16m8_t __riscv_vmaxu_vx_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                      uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vmaxu_vv_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                        vuint32mf2_t vs1, size_t vl);
vuint32mf2_t __riscv_vmaxu_vx_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                        uint32_t rs1, size_t vl);
vuint32m1_t __riscv_vmaxu_vv_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                      vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vmaxu_vx_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                      uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vmaxu_vv_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                      vuint32m2_t vs1, size_t vl);
vuint32m2_t __riscv_vmaxu_vx_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                      uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vmaxu_vv_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                      vuint32m4_t vs1, size_t vl);
vuint32m4_t __riscv_vmaxu_vx_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                      uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vmaxu_vv_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                      vuint32m8_t vs1, size_t vl);
vuint32m8_t __riscv_vmaxu_vx_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                      uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vmaxu_vv_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                      vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vmaxu_vx_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                      uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vmaxu_vv_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                      vuint64m2_t vs1, size_t vl);
vuint64m2_t __riscv_vmaxu_vx_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                      uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vmaxu_vv_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                      vuint64m4_t vs1, size_t vl);
vuint64m4_t __riscv_vmaxu_vx_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                      uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vmaxu_vv_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                      vuint64m8_t vs1, size_t vl);
vuint64m8_t __riscv_vmaxu_vx_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                      uint64_t rs1, size_t vl);
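
The _tu (tail-undisturbed) min/max variants above compute the first vl elements and copy the tail elements (indices >= vl) from vd instead of leaving them agnostic. A short illustrative sketch that clamps a vector to [lo, hi] with vmax followed by vmin, assuming <riscv_vector.h>; the wrapper name clamp_i32m1_tu is hypothetical and not part of the listing:

#include <riscv_vector.h>

// Sketch: clamp the first vl elements of vs2 into [lo, hi].
// Both _tu calls take vd as the tail source, so the result's tail
// elements are preserved from vd.
vint32m1_t clamp_i32m1_tu(vint32m1_t vd, vint32m1_t vs2, int32_t lo,
                          int32_t hi, size_t vl) {
  vint32m1_t t = __riscv_vmax_vx_i32m1_tu(vd, vs2, lo, vl);  // max(vs2, lo)
  return __riscv_vmin_vx_i32m1_tu(vd, t, hi, vl);            // min(t, hi)
}
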
// masked functions
vint8mf8_t __riscv_vmin_vv_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                     vint8mf8_t vs2, vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vmin_vx_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                     vint8mf8_t vs2, int8_t rs1, size_t vl);
vint8mf4_t __riscv_vmin_vv_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                     vint8mf4_t vs2, vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vmin_vx_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                     vint8mf4_t vs2, int8_t rs1, size_t vl);
vint8mf2_t __riscv_vmin_vv_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                     vint8mf2_t vs2, vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vmin_vx_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                     vint8mf2_t vs2, int8_t rs1, size_t vl);
vint8m1_t __riscv_vmin_vv_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                   vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vmin_vx_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                   int8_t rs1, size_t vl);
vint8m2_t __riscv_vmin_vv_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                   vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vmin_vx_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                   int8_t rs1, size_t vl);
vint8m4_t __riscv_vmin_vv_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                   vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vmin_vx_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                   int8_t rs1, size_t vl);
vint8m8_t __riscv_vmin_vv_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                   vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vmin_vx_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                   int8_t rs1, size_t vl);
vint16mf4_t __riscv_vmin_vv_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs2, vint16mf4_t vs1,
                                       size_t vl);
vint16mf4_t __riscv_vmin_vx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs2, int16_t rs1, size_t vl);
vint16mf2_t __riscv_vmin_vv_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs2, vint16mf2_t vs1,
                                       size_t vl);
vint16mf2_t __riscv_vmin_vx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs2, int16_t rs1, size_t vl);
vint16m1_t __riscv_vmin_vv_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs2, vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vmin_vx_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs2, int16_t rs1, size_t vl);
vint16m2_t __riscv_vmin_vv_i16m2_tum(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                     vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vmin_vx_i16m2_tum(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                     int16_t rs1, size_t vl);
vint16m4_t __riscv_vmin_vv_i16m4_tum(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                     vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vmin_vx_i16m4_tum(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                     int16_t rs1, size_t vl);
vint16m8_t __riscv_vmin_vv_i16m8_tum(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                     vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vmin_vx_i16m8_tum(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                     int16_t rs1, size_t vl);
vint32mf2_t __riscv_vmin_vv_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs2, vint32mf2_t vs1,
                                       size_t vl);
vint32mf2_t __riscv_vmin_vx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs2, int32_t rs1, size_t vl);
vint32m1_t __riscv_vmin_vv_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs2, vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vmin_vx_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs2, int32_t rs1, size_t vl);
vint32m2_t __riscv_vmin_vv_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs2, vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vmin_vx_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs2, int32_t rs1, size_t vl);
vint32m4_t __riscv_vmin_vv_i32m4_tum(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                     vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vmin_vx_i32m4_tum(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                     int32_t rs1, size_t vl);
vint32m8_t __riscv_vmin_vv_i32m8_tum(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                     vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vmin_vx_i32m8_tum(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                     int32_t rs1, size_t vl);
vint64m1_t __riscv_vmin_vv_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs2, vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vmin_vx_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs2, int64_t rs1, size_t vl);
vint64m2_t __riscv_vmin_vv_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs2, vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vmin_vx_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs2, int64_t rs1, size_t vl);
vint64m4_t __riscv_vmin_vv_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs2, vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vmin_vx_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs2, int64_t rs1, size_t vl);
vint64m8_t __riscv_vmin_vv_i64m8_tum(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                     vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vmin_vx_i64m8_tum(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                     int64_t rs1, size_t vl);
vint8mf8_t __riscv_vmax_vv_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                     vint8mf8_t vs2, vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vmax_vx_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                     vint8mf8_t vs2, int8_t rs1, size_t vl);
vint8mf4_t __riscv_vmax_vv_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                     vint8mf4_t vs2, vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vmax_vx_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                     vint8mf4_t vs2, int8_t rs1, size_t vl);
vint8mf2_t __riscv_vmax_vv_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                     vint8mf2_t vs2, vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vmax_vx_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                     vint8mf2_t vs2, int8_t rs1, size_t vl);
vint8m1_t __riscv_vmax_vv_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                   vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vmax_vx_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                   int8_t rs1, size_t vl);
vint8m2_t __riscv_vmax_vv_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                   vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vmax_vx_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                   int8_t rs1, size_t vl);
vint8m4_t __riscv_vmax_vv_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                   vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vmax_vx_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                   int8_t rs1, size_t vl);
vint8m8_t __riscv_vmax_vv_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                   vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vmax_vx_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                   int8_t rs1, size_t vl);
vint16mf4_t __riscv_vmax_vv_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs2, vint16mf4_t vs1,
                                       size_t vl);
vint16mf4_t __riscv_vmax_vx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs2, int16_t rs1, size_t vl);
vint16mf2_t __riscv_vmax_vv_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs2, vint16mf2_t vs1,
                                       size_t vl);
vint16mf2_t __riscv_vmax_vx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs2, int16_t rs1, size_t vl);
vint16m1_t __riscv_vmax_vv_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs2, vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vmax_vx_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs2, int16_t rs1, size_t vl);
vint16m2_t __riscv_vmax_vv_i16m2_tum(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                     vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vmax_vx_i16m2_tum(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                     int16_t rs1, size_t vl);
vint16m4_t __riscv_vmax_vv_i16m4_tum(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                     vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vmax_vx_i16m4_tum(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                     int16_t rs1, size_t vl);
vint16m8_t __riscv_vmax_vv_i16m8_tum(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                     vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vmax_vx_i16m8_tum(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                     int16_t rs1, size_t vl);
vint32mf2_t __riscv_vmax_vv_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs2, vint32mf2_t vs1,
                                       size_t vl);
vint32mf2_t __riscv_vmax_vx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs2, int32_t rs1, size_t vl);
vint32m1_t __riscv_vmax_vv_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs2, vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vmax_vx_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs2, int32_t rs1, size_t vl);
vint32m2_t __riscv_vmax_vv_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs2, vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vmax_vx_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs2, int32_t rs1, size_t vl);
vint32m4_t __riscv_vmax_vv_i32m4_tum(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                     vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vmax_vx_i32m4_tum(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                     int32_t rs1, size_t vl);
vint32m8_t __riscv_vmax_vv_i32m8_tum(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                     vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vmax_vx_i32m8_tum(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                     int32_t rs1, size_t vl);
vint64m1_t __riscv_vmax_vv_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs2, vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vmax_vx_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs2, int64_t rs1, size_t vl);
vint64m2_t __riscv_vmax_vv_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs2, vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vmax_vx_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs2, int64_t rs1, size_t vl);
vint64m4_t __riscv_vmax_vv_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs2, vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vmax_vx_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs2, int64_t rs1, size_t vl);
vint64m8_t __riscv_vmax_vv_i64m8_tum(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                     vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vmax_vx_i64m8_tum(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                     int64_t rs1, size_t vl);
vuint8mf8_t __riscv_vminu_vv_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                       vuint8mf8_t vs2, vuint8mf8_t vs1,
                                       size_t vl);
vuint8mf8_t __riscv_vminu_vx_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                       vuint8mf8_t vs2, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vminu_vv_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                       vuint8mf4_t vs2, vuint8mf4_t vs1,
                                       size_t vl);
vuint8mf4_t __riscv_vminu_vx_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                       vuint8mf4_t vs2, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vminu_vv_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                       vuint8mf2_t vs2, vuint8mf2_t vs1,
                                       size_t vl);
vuint8mf2_t __riscv_vminu_vx_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                       vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vminu_vv_u8m1_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                     vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vminu_vx_u8m1_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vminu_vv_u8m2_tum(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                     vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vminu_vx_u8m2_tum(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vminu_vv_u8m4_tum(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                     vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vminu_vx_u8m4_tum(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vminu_vv_u8m8_tum(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                     vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vminu_vx_u8m8_tum(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                     uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vminu_vv_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs2, vuint16mf4_t vs1,
                                         size_t vl);
vuint16mf4_t __riscv_vminu_vx_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs2, uint16_t rs1,
                                         size_t vl);
vuint16mf2_t __riscv_vminu_vv_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs2, vuint16mf2_t vs1,
                                         size_t vl);
vuint16mf2_t __riscv_vminu_vx_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs2, uint16_t rs1,
                                         size_t vl);
vuint16m1_t __riscv_vminu_vv_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs2, vuint16m1_t vs1,
                                       size_t vl);
vuint16m1_t __riscv_vminu_vx_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m2_t __riscv_vminu_vv_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs2, vuint16m2_t vs1,
                                       size_t vl);
vuint16m2_t __riscv_vminu_vx_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m4_t __riscv_vminu_vv_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs2, vuint16m4_t vs1,
                                       size_t vl);
vuint16m4_t __riscv_vminu_vx_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m8_t __riscv_vminu_vv_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs2, vuint16m8_t vs1,
                                       size_t vl);
vuint16m8_t __riscv_vminu_vx_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs2, uint16_t rs1,
                                       size_t vl);
vuint32mf2_t __riscv_vminu_vv_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs2, vuint32mf2_t vs1,
                                         size_t vl);
vuint32mf2_t __riscv_vminu_vx_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs2, uint32_t rs1,
                                         size_t vl);
vuint32m1_t __riscv_vminu_vv_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs2, vuint32m1_t vs1,
                                       size_t vl);
vuint32m1_t __riscv_vminu_vx_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m2_t __riscv_vminu_vv_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs2, vuint32m2_t vs1,
                                       size_t vl);
vuint32m2_t __riscv_vminu_vx_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m4_t __riscv_vminu_vv_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs2, vuint32m4_t vs1,
                                       size_t vl);
vuint32m4_t __riscv_vminu_vx_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m8_t __riscv_vminu_vv_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs2, vuint32m8_t vs1,
                                       size_t vl);
vuint32m8_t __riscv_vminu_vx_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs2, uint32_t rs1,
                                       size_t vl);
vuint64m1_t __riscv_vminu_vv_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs2, vuint64m1_t vs1,
                                       size_t vl);
vuint64m1_t __riscv_vminu_vx_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m2_t __riscv_vminu_vv_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs2, vuint64m2_t vs1,
                                       size_t vl);
vuint64m2_t __riscv_vminu_vx_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m4_t __riscv_vminu_vv_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs2, vuint64m4_t vs1,
                                       size_t vl);
vuint64m4_t __riscv_vminu_vx_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m8_t __riscv_vminu_vv_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs2, vuint64m8_t vs1,
                                       size_t vl);
vuint64m8_t __riscv_vminu_vx_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs2, uint64_t rs1,
                                       size_t vl);
vuint8mf8_t __riscv_vmaxu_vv_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                       vuint8mf8_t vs2, vuint8mf8_t vs1,
                                       size_t vl);
vuint8mf8_t __riscv_vmaxu_vx_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                       vuint8mf8_t vs2, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vmaxu_vv_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                       vuint8mf4_t vs2, vuint8mf4_t vs1,
                                       size_t vl);
vuint8mf4_t __riscv_vmaxu_vx_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                       vuint8mf4_t vs2, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vmaxu_vv_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                       vuint8mf2_t vs2, vuint8mf2_t vs1,
                                       size_t vl);
vuint8mf2_t __riscv_vmaxu_vx_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                       vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vmaxu_vv_u8m1_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                     vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vmaxu_vx_u8m1_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vmaxu_vv_u8m2_tum(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                     vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vmaxu_vx_u8m2_tum(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vmaxu_vv_u8m4_tum(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                     vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vmaxu_vx_u8m4_tum(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vmaxu_vv_u8m8_tum(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                     vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vmaxu_vx_u8m8_tum(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                     uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vmaxu_vv_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs2, vuint16mf4_t vs1,
                                         size_t vl);
vuint16mf4_t __riscv_vmaxu_vx_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs2, uint16_t rs1,
                                         size_t vl);
vuint16mf2_t __riscv_vmaxu_vv_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs2, vuint16mf2_t vs1,
                                         size_t vl);
vuint16mf2_t __riscv_vmaxu_vx_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs2, uint16_t rs1,
                                         size_t vl);
vuint16m1_t __riscv_vmaxu_vv_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs2, vuint16m1_t vs1,
                                       size_t vl);
vuint16m1_t __riscv_vmaxu_vx_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m2_t __riscv_vmaxu_vv_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs2, vuint16m2_t vs1,
                                       size_t vl);
vuint16m2_t __riscv_vmaxu_vx_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m4_t __riscv_vmaxu_vv_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs2, vuint16m4_t vs1,
                                       size_t vl);
vuint16m4_t __riscv_vmaxu_vx_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m8_t __riscv_vmaxu_vv_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs2, vuint16m8_t vs1,
                                       size_t vl);
vuint16m8_t __riscv_vmaxu_vx_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs2, uint16_t rs1,
                                       size_t vl);
vuint32mf2_t __riscv_vmaxu_vv_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs2, vuint32mf2_t vs1,
                                         size_t vl);
vuint32mf2_t __riscv_vmaxu_vx_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs2, uint32_t rs1,
                                         size_t vl);
vuint32m1_t __riscv_vmaxu_vv_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs2, vuint32m1_t vs1,
                                       size_t vl);
vuint32m1_t __riscv_vmaxu_vx_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m2_t __riscv_vmaxu_vv_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs2, vuint32m2_t vs1,
                                       size_t vl);
vuint32m2_t __riscv_vmaxu_vx_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m4_t __riscv_vmaxu_vv_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs2, vuint32m4_t vs1,
                                       size_t vl);
vuint32m4_t __riscv_vmaxu_vx_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m8_t __riscv_vmaxu_vv_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs2, vuint32m8_t vs1,
                                       size_t vl);
vuint32m8_t __riscv_vmaxu_vx_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs2, uint32_t rs1,
                                       size_t vl);
vuint64m1_t __riscv_vmaxu_vv_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs2, vuint64m1_t vs1,
                                       size_t vl);
vuint64m1_t __riscv_vmaxu_vx_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m2_t __riscv_vmaxu_vv_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs2, vuint64m2_t vs1,
                                       size_t vl);
vuint64m2_t __riscv_vmaxu_vx_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m4_t __riscv_vmaxu_vv_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs2, vuint64m4_t vs1,
                                       size_t vl);
vuint64m4_t __riscv_vmaxu_vx_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m8_t __riscv_vmaxu_vv_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs2, vuint64m8_t vs1,
                                       size_t vl);
vuint64m8_t __riscv_vmaxu_vx_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs2, uint64_t rs1,
                                       size_t vl);
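// Illustrative sketch only (not part of the generated listing): one way to
// call the masked, tail-undisturbed (_tum) form of vminu. With _tum the tail
// elements (index >= vl) of the result keep the values of vd, while masked-off
// body elements are mask-agnostic, so this sketch writes results back with a
// masked store and never reads the inactive lanes. The function and array
// names and the bound value are hypothetical; only intrinsics from
// <riscv_vector.h> are used.
#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

static void clamp_selected(uint32_t *data, size_t n, uint32_t bound) {
  for (size_t i = 0; i < n;) {
    size_t vl = __riscv_vsetvl_e32m1(n - i);
    vuint32m1_t v = __riscv_vle32_v_u32m1(&data[i], vl);
    // Select the lanes that exceed the bound ...
    vbool32_t vm = __riscv_vmsgtu_vx_u32m1_b32(v, bound, vl);
    // ... and clamp only those lanes; vd = v supplies the tail values.
    vuint32m1_t r = __riscv_vminu_vx_u32m1_tum(vm, v, v, bound, vl);
    // Masked store: only the clamped (active) lanes are written back.
    __riscv_vse32_v_u32m1_m(vm, &data[i], r, vl);
    i += vl;
  }
}
// The same clamp could be done with the unmasked vminu; the mask here only
// illustrates the _tum calling convention (vm, vd, vs2, rs1, vl).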
// masked functions (tail undisturbed, mask undisturbed: _tumu variants)
vint8mf8_t __riscv_vmin_vv_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                      vint8mf8_t vs2, vint8mf8_t vs1,
                                      size_t vl);
vint8mf8_t __riscv_vmin_vx_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                      vint8mf8_t vs2, int8_t rs1, size_t vl);
vint8mf4_t __riscv_vmin_vv_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                      vint8mf4_t vs2, vint8mf4_t vs1,
                                      size_t vl);
vint8mf4_t __riscv_vmin_vx_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                      vint8mf4_t vs2, int8_t rs1, size_t vl);
vint8mf2_t __riscv_vmin_vv_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                      vint8mf2_t vs2, vint8mf2_t vs1,
                                      size_t vl);
vint8mf2_t __riscv_vmin_vx_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                      vint8mf2_t vs2, int8_t rs1, size_t vl);
vint8m1_t __riscv_vmin_vv_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                    vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vmin_vx_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                    int8_t rs1, size_t vl);
vint8m2_t __riscv_vmin_vv_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                    vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vmin_vx_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                    int8_t rs1, size_t vl);
vint8m4_t __riscv_vmin_vv_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                    vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vmin_vx_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                    int8_t rs1, size_t vl);
vint8m8_t __riscv_vmin_vv_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                    vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vmin_vx_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                    int8_t rs1, size_t vl);
vint16mf4_t __riscv_vmin_vv_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs2, vint16mf4_t vs1,
                                        size_t vl);
vint16mf4_t __riscv_vmin_vx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs2, int16_t rs1,
                                        size_t vl);
vint16mf2_t __riscv_vmin_vv_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs2, vint16mf2_t vs1,
                                        size_t vl);
vint16mf2_t __riscv_vmin_vx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs2, int16_t rs1,
                                        size_t vl);
vint16m1_t __riscv_vmin_vv_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs2, vint16m1_t vs1,
                                      size_t vl);
vint16m1_t __riscv_vmin_vx_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs2, int16_t rs1, size_t vl);
vint16m2_t __riscv_vmin_vv_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs2, vint16m2_t vs1,
                                      size_t vl);
vint16m2_t __riscv_vmin_vx_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs2, int16_t rs1, size_t vl);
vint16m4_t __riscv_vmin_vv_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs2, vint16m4_t vs1,
                                      size_t vl);
vint16m4_t __riscv_vmin_vx_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs2, int16_t rs1, size_t vl);
vint16m8_t __riscv_vmin_vv_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs2, vint16m8_t vs1,
                                      size_t vl);
vint16m8_t __riscv_vmin_vx_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs2, int16_t rs1, size_t vl);
vint32mf2_t __riscv_vmin_vv_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs2, vint32mf2_t vs1,
                                        size_t vl);
vint32mf2_t __riscv_vmin_vx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs2, int32_t rs1,
                                        size_t vl);
vint32m1_t __riscv_vmin_vv_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs2, vint32m1_t vs1,
                                      size_t vl);
vint32m1_t __riscv_vmin_vx_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs2, int32_t rs1, size_t vl);
vint32m2_t __riscv_vmin_vv_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs2, vint32m2_t vs1,
                                      size_t vl);
vint32m2_t __riscv_vmin_vx_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs2, int32_t rs1, size_t vl);
vint32m4_t __riscv_vmin_vv_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs2, vint32m4_t vs1,
                                      size_t vl);
vint32m4_t __riscv_vmin_vx_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs2, int32_t rs1, size_t vl);
vint32m8_t __riscv_vmin_vv_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs2, vint32m8_t vs1,
                                      size_t vl);
vint32m8_t __riscv_vmin_vx_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs2, int32_t rs1, size_t vl);
vint64m1_t __riscv_vmin_vv_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs2, vint64m1_t vs1,
                                      size_t vl);
vint64m1_t __riscv_vmin_vx_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs2, int64_t rs1, size_t vl);
vint64m2_t __riscv_vmin_vv_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs2, vint64m2_t vs1,
                                      size_t vl);
vint64m2_t __riscv_vmin_vx_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs2, int64_t rs1, size_t vl);
vint64m4_t __riscv_vmin_vv_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs2, vint64m4_t vs1,
                                      size_t vl);
vint64m4_t __riscv_vmin_vx_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs2, int64_t rs1, size_t vl);
vint64m8_t __riscv_vmin_vv_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs2, vint64m8_t vs1,
                                      size_t vl);
vint64m8_t __riscv_vmin_vx_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs2, int64_t rs1, size_t vl);
vint8mf8_t __riscv_vmax_vv_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                      vint8mf8_t vs2, vint8mf8_t vs1,
                                      size_t vl);
vint8mf8_t __riscv_vmax_vx_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                      vint8mf8_t vs2, int8_t rs1, size_t vl);
vint8mf4_t __riscv_vmax_vv_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                      vint8mf4_t vs2, vint8mf4_t vs1,
                                      size_t vl);
vint8mf4_t __riscv_vmax_vx_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                      vint8mf4_t vs2, int8_t rs1, size_t vl);
vint8mf2_t __riscv_vmax_vv_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                      vint8mf2_t vs2, vint8mf2_t vs1,
                                      size_t vl);
vint8mf2_t __riscv_vmax_vx_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                      vint8mf2_t vs2, int8_t rs1, size_t vl);
vint8m1_t __riscv_vmax_vv_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                    vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vmax_vx_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                    int8_t rs1, size_t vl);
vint8m2_t __riscv_vmax_vv_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                    vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vmax_vx_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                    int8_t rs1, size_t vl);
vint8m4_t __riscv_vmax_vv_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                    vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vmax_vx_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                    int8_t rs1, size_t vl);
vint8m8_t __riscv_vmax_vv_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                    vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vmax_vx_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                    int8_t rs1, size_t vl);
vint16mf4_t __riscv_vmax_vv_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs2, vint16mf4_t vs1,
                                        size_t vl);
vint16mf4_t __riscv_vmax_vx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs2, int16_t rs1,
                                        size_t vl);
vint16mf2_t __riscv_vmax_vv_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs2, vint16mf2_t vs1,
                                        size_t vl);
vint16mf2_t __riscv_vmax_vx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs2, int16_t rs1,
                                        size_t vl);
vint16m1_t __riscv_vmax_vv_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs2, vint16m1_t vs1,
                                      size_t vl);
vint16m1_t __riscv_vmax_vx_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs2, int16_t rs1, size_t vl);
vint16m2_t __riscv_vmax_vv_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs2, vint16m2_t vs1,
                                      size_t vl);
vint16m2_t __riscv_vmax_vx_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs2, int16_t rs1, size_t vl);
vint16m4_t __riscv_vmax_vv_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs2, vint16m4_t vs1,
                                      size_t vl);
vint16m4_t __riscv_vmax_vx_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs2, int16_t rs1, size_t vl);
vint16m8_t __riscv_vmax_vv_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs2, vint16m8_t vs1,
                                      size_t vl);
vint16m8_t __riscv_vmax_vx_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs2, int16_t rs1, size_t vl);
vint32mf2_t __riscv_vmax_vv_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs2, vint32mf2_t vs1,
                                        size_t vl);
vint32mf2_t __riscv_vmax_vx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs2, int32_t rs1,
                                        size_t vl);
vint32m1_t __riscv_vmax_vv_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs2, vint32m1_t vs1,
                                      size_t vl);
vint32m1_t __riscv_vmax_vx_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs2, int32_t rs1, size_t vl);
vint32m2_t __riscv_vmax_vv_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs2, vint32m2_t vs1,
                                      size_t vl);
vint32m2_t __riscv_vmax_vx_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs2, int32_t rs1, size_t vl);
vint32m4_t __riscv_vmax_vv_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs2, vint32m4_t vs1,
                                      size_t vl);
vint32m4_t __riscv_vmax_vx_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs2, int32_t rs1, size_t vl);
vint32m8_t __riscv_vmax_vv_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs2, vint32m8_t vs1,
                                      size_t vl);
vint32m8_t __riscv_vmax_vx_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs2, int32_t rs1, size_t vl);
vint64m1_t __riscv_vmax_vv_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs2, vint64m1_t vs1,
                                      size_t vl);
vint64m1_t __riscv_vmax_vx_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs2, int64_t rs1, size_t vl);
vint64m2_t __riscv_vmax_vv_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs2, vint64m2_t vs1,
                                      size_t vl);
vint64m2_t __riscv_vmax_vx_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs2, int64_t rs1, size_t vl);
vint64m4_t __riscv_vmax_vv_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs2, vint64m4_t vs1,
                                      size_t vl);
vint64m4_t __riscv_vmax_vx_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs2, int64_t rs1, size_t vl);
vint64m8_t __riscv_vmax_vv_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs2, vint64m8_t vs1,
                                      size_t vl);
vint64m8_t __riscv_vmax_vx_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs2, int64_t rs1, size_t vl);
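// Illustrative sketch only: applying a signed lower bound with the
// vector-scalar _tumu form of vmax. Only lanes selected by vm are raised to
// the bound; deselected and tail lanes keep their previous values from vd.
// The function and parameter names are hypothetical.
#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

static vint32m1_t floor_selected(vbool32_t vm, vint32m1_t prev, vint32m1_t vs2,
                                 int32_t lower_bound, size_t vl) {
  // Active lanes become max(vs2[i], lower_bound); inactive and tail lanes
  // keep the corresponding element of prev (the vd operand).
  return __riscv_vmax_vx_i32m1_tumu(vm, prev, vs2, lower_bound, vl);
}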
vuint8mf8_t __riscv_vminu_vv_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                        vuint8mf8_t vs2, vuint8mf8_t vs1,
                                        size_t vl);
vuint8mf8_t __riscv_vminu_vx_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                        vuint8mf8_t vs2, uint8_t rs1,
                                        size_t vl);
vuint8mf4_t __riscv_vminu_vv_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                        vuint8mf4_t vs2, vuint8mf4_t vs1,
                                        size_t vl);
vuint8mf4_t __riscv_vminu_vx_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                        vuint8mf4_t vs2, uint8_t rs1,
                                        size_t vl);
vuint8mf2_t __riscv_vminu_vv_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                        vuint8mf2_t vs2, vuint8mf2_t vs1,
                                        size_t vl);
vuint8mf2_t __riscv_vminu_vx_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                        vuint8mf2_t vs2, uint8_t rs1,
                                        size_t vl);
vuint8m1_t __riscv_vminu_vv_u8m1_tumu(vbool8_t vm, vuint8m1_t vd,
                                      vuint8m1_t vs2, vuint8m1_t vs1,
                                      size_t vl);
vuint8m1_t __riscv_vminu_vx_u8m1_tumu(vbool8_t vm, vuint8m1_t vd,
                                      vuint8m1_t vs2, uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vminu_vv_u8m2_tumu(vbool4_t vm, vuint8m2_t vd,
                                      vuint8m2_t vs2, vuint8m2_t vs1,
                                      size_t vl);
vuint8m2_t __riscv_vminu_vx_u8m2_tumu(vbool4_t vm, vuint8m2_t vd,
                                      vuint8m2_t vs2, uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vminu_vv_u8m4_tumu(vbool2_t vm, vuint8m4_t vd,
                                      vuint8m4_t vs2, vuint8m4_t vs1,
                                      size_t vl);
vuint8m4_t __riscv_vminu_vx_u8m4_tumu(vbool2_t vm, vuint8m4_t vd,
                                      vuint8m4_t vs2, uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vminu_vv_u8m8_tumu(vbool1_t vm, vuint8m8_t vd,
                                      vuint8m8_t vs2, vuint8m8_t vs1,
                                      size_t vl);
vuint8m8_t __riscv_vminu_vx_u8m8_tumu(vbool1_t vm, vuint8m8_t vd,
                                      vuint8m8_t vs2, uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vminu_vv_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                          vuint16mf4_t vs2, vuint16mf4_t vs1,
                                          size_t vl);
vuint16mf4_t __riscv_vminu_vx_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                          vuint16mf4_t vs2, uint16_t rs1,
                                          size_t vl);
vuint16mf2_t __riscv_vminu_vv_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                          vuint16mf2_t vs2, vuint16mf2_t vs1,
                                          size_t vl);
vuint16mf2_t __riscv_vminu_vx_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                          vuint16mf2_t vs2, uint16_t rs1,
                                          size_t vl);
vuint16m1_t __riscv_vminu_vv_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                        vuint16m1_t vs2, vuint16m1_t vs1,
                                        size_t vl);
vuint16m1_t __riscv_vminu_vx_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                        vuint16m1_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16m2_t __riscv_vminu_vv_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                        vuint16m2_t vs2, vuint16m2_t vs1,
                                        size_t vl);
vuint16m2_t __riscv_vminu_vx_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                        vuint16m2_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16m4_t __riscv_vminu_vv_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                        vuint16m4_t vs2, vuint16m4_t vs1,
                                        size_t vl);
vuint16m4_t __riscv_vminu_vx_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                        vuint16m4_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16m8_t __riscv_vminu_vv_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                        vuint16m8_t vs2, vuint16m8_t vs1,
                                        size_t vl);
vuint16m8_t __riscv_vminu_vx_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                        vuint16m8_t vs2, uint16_t rs1,
                                        size_t vl);
vuint32mf2_t __riscv_vminu_vv_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                          vuint32mf2_t vs2, vuint32mf2_t vs1,
                                          size_t vl);
vuint32mf2_t __riscv_vminu_vx_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                          vuint32mf2_t vs2, uint32_t rs1,
                                          size_t vl);
vuint32m1_t __riscv_vminu_vv_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                        vuint32m1_t vs2, vuint32m1_t vs1,
                                        size_t vl);
vuint32m1_t __riscv_vminu_vx_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                        vuint32m1_t vs2, uint32_t rs1,
                                        size_t vl);
vuint32m2_t __riscv_vminu_vv_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                        vuint32m2_t vs2, vuint32m2_t vs1,
                                        size_t vl);
vuint32m2_t __riscv_vminu_vx_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                        vuint32m2_t vs2, uint32_t rs1,
                                        size_t vl);
vuint32m4_t __riscv_vminu_vv_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                        vuint32m4_t vs2, vuint32m4_t vs1,
                                        size_t vl);
vuint32m4_t __riscv_vminu_vx_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                        vuint32m4_t vs2, uint32_t rs1,
                                        size_t vl);
vuint32m8_t __riscv_vminu_vv_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                        vuint32m8_t vs2, vuint32m8_t vs1,
                                        size_t vl);
vuint32m8_t __riscv_vminu_vx_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                        vuint32m8_t vs2, uint32_t rs1,
                                        size_t vl);
vuint64m1_t __riscv_vminu_vv_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                        vuint64m1_t vs2, vuint64m1_t vs1,
                                        size_t vl);
vuint64m1_t __riscv_vminu_vx_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                        vuint64m1_t vs2, uint64_t rs1,
                                        size_t vl);
vuint64m2_t __riscv_vminu_vv_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                        vuint64m2_t vs2, vuint64m2_t vs1,
                                        size_t vl);
vuint64m2_t __riscv_vminu_vx_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                        vuint64m2_t vs2, uint64_t rs1,
                                        size_t vl);
vuint64m4_t __riscv_vminu_vv_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                        vuint64m4_t vs2, vuint64m4_t vs1,
                                        size_t vl);
vuint64m4_t __riscv_vminu_vx_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                        vuint64m4_t vs2, uint64_t rs1,
                                        size_t vl);
vuint64m8_t __riscv_vminu_vv_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                        vuint64m8_t vs2, vuint64m8_t vs1,
                                        size_t vl);
vuint64m8_t __riscv_vminu_vx_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                        vuint64m8_t vs2, uint64_t rs1,
                                        size_t vl);
vuint8mf8_t __riscv_vmaxu_vv_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                        vuint8mf8_t vs2, vuint8mf8_t vs1,
                                        size_t vl);
vuint8mf8_t __riscv_vmaxu_vx_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                        vuint8mf8_t vs2, uint8_t rs1,
                                        size_t vl);
vuint8mf4_t __riscv_vmaxu_vv_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                        vuint8mf4_t vs2, vuint8mf4_t vs1,
                                        size_t vl);
vuint8mf4_t __riscv_vmaxu_vx_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                        vuint8mf4_t vs2, uint8_t rs1,
                                        size_t vl);
vuint8mf2_t __riscv_vmaxu_vv_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                        vuint8mf2_t vs2, vuint8mf2_t vs1,
                                        size_t vl);
vuint8mf2_t __riscv_vmaxu_vx_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                        vuint8mf2_t vs2, uint8_t rs1,
                                        size_t vl);
vuint8m1_t __riscv_vmaxu_vv_u8m1_tumu(vbool8_t vm, vuint8m1_t vd,
                                      vuint8m1_t vs2, vuint8m1_t vs1,
                                      size_t vl);
vuint8m1_t __riscv_vmaxu_vx_u8m1_tumu(vbool8_t vm, vuint8m1_t vd,
                                      vuint8m1_t vs2, uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vmaxu_vv_u8m2_tumu(vbool4_t vm, vuint8m2_t vd,
                                      vuint8m2_t vs2, vuint8m2_t vs1,
                                      size_t vl);
vuint8m2_t __riscv_vmaxu_vx_u8m2_tumu(vbool4_t vm, vuint8m2_t vd,
                                      vuint8m2_t vs2, uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vmaxu_vv_u8m4_tumu(vbool2_t vm, vuint8m4_t vd,
                                      vuint8m4_t vs2, vuint8m4_t vs1,
                                      size_t vl);
vuint8m4_t __riscv_vmaxu_vx_u8m4_tumu(vbool2_t vm, vuint8m4_t vd,
                                      vuint8m4_t vs2, uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vmaxu_vv_u8m8_tumu(vbool1_t vm, vuint8m8_t vd,
                                      vuint8m8_t vs2, vuint8m8_t vs1,
                                      size_t vl);
vuint8m8_t __riscv_vmaxu_vx_u8m8_tumu(vbool1_t vm, vuint8m8_t vd,
                                      vuint8m8_t vs2, uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vmaxu_vv_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                          vuint16mf4_t vs2, vuint16mf4_t vs1,
                                          size_t vl);
vuint16mf4_t __riscv_vmaxu_vx_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                          vuint16mf4_t vs2, uint16_t rs1,
                                          size_t vl);
vuint16mf2_t __riscv_vmaxu_vv_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                          vuint16mf2_t vs2, vuint16mf2_t vs1,
                                          size_t vl);
vuint16mf2_t __riscv_vmaxu_vx_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                          vuint16mf2_t vs2, uint16_t rs1,
                                          size_t vl);
vuint16m1_t __riscv_vmaxu_vv_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                        vuint16m1_t vs2, vuint16m1_t vs1,
                                        size_t vl);
vuint16m1_t __riscv_vmaxu_vx_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                        vuint16m1_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16m2_t __riscv_vmaxu_vv_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                        vuint16m2_t vs2, vuint16m2_t vs1,
                                        size_t vl);
vuint16m2_t __riscv_vmaxu_vx_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                        vuint16m2_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16m4_t __riscv_vmaxu_vv_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                        vuint16m4_t vs2, vuint16m4_t vs1,
                                        size_t vl);
vuint16m4_t __riscv_vmaxu_vx_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                        vuint16m4_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16m8_t __riscv_vmaxu_vv_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                        vuint16m8_t vs2, vuint16m8_t vs1,
                                        size_t vl);
vuint16m8_t __riscv_vmaxu_vx_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                        vuint16m8_t vs2, uint16_t rs1,
                                        size_t vl);
vuint32mf2_t __riscv_vmaxu_vv_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                          vuint32mf2_t vs2, vuint32mf2_t vs1,
                                          size_t vl);
vuint32mf2_t __riscv_vmaxu_vx_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                          vuint32mf2_t vs2, uint32_t rs1,
                                          size_t vl);
vuint32m1_t __riscv_vmaxu_vv_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                        vuint32m1_t vs2, vuint32m1_t vs1,
                                        size_t vl);
vuint32m1_t __riscv_vmaxu_vx_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                        vuint32m1_t vs2, uint32_t rs1,
                                        size_t vl);
vuint32m2_t __riscv_vmaxu_vv_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                        vuint32m2_t vs2, vuint32m2_t vs1,
                                        size_t vl);
vuint32m2_t __riscv_vmaxu_vx_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                        vuint32m2_t vs2, uint32_t rs1,
                                        size_t vl);
vuint32m4_t __riscv_vmaxu_vv_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                        vuint32m4_t vs2, vuint32m4_t vs1,
                                        size_t vl);
vuint32m4_t __riscv_vmaxu_vx_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                        vuint32m4_t vs2, uint32_t rs1,
                                        size_t vl);
vuint32m8_t __riscv_vmaxu_vv_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                        vuint32m8_t vs2, vuint32m8_t vs1,
                                        size_t vl);
vuint32m8_t __riscv_vmaxu_vx_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                        vuint32m8_t vs2, uint32_t rs1,
                                        size_t vl);
vuint64m1_t __riscv_vmaxu_vv_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                        vuint64m1_t vs2, vuint64m1_t vs1,
                                        size_t vl);
vuint64m1_t __riscv_vmaxu_vx_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                        vuint64m1_t vs2, uint64_t rs1,
                                        size_t vl);
vuint64m2_t __riscv_vmaxu_vv_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                        vuint64m2_t vs2, vuint64m2_t vs1,
                                        size_t vl);
vuint64m2_t __riscv_vmaxu_vx_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                        vuint64m2_t vs2, uint64_t rs1,
                                        size_t vl);
vuint64m4_t __riscv_vmaxu_vv_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                        vuint64m4_t vs2, vuint64m4_t vs1,
                                        size_t vl);
vuint64m4_t __riscv_vmaxu_vx_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                        vuint64m4_t vs2, uint64_t rs1,
                                        size_t vl);
vuint64m8_t __riscv_vmaxu_vv_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                        vuint64m8_t vs2, vuint64m8_t vs1,
                                        size_t vl);
vuint64m8_t __riscv_vmaxu_vx_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                        vuint64m8_t vs2, uint64_t rs1,
                                        size_t vl);
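// Illustrative sketch only: the _tumu variants keep both tail elements and
// masked-off body elements from vd, which suits read-modify-write updates.
// Here a per-lane running maximum acc is updated only for lanes whose flag in
// valid is nonzero; all other lanes of acc are left untouched. The function,
// array, and parameter names are hypothetical, and vl is assumed not to exceed
// VLMAX for e32, m1.
#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

static vuint32m1_t update_running_max(vuint32m1_t acc, const uint32_t *sample,
                                      const uint8_t *valid, size_t vl) {
  // Load the new samples and the per-lane validity flags (same vl, same
  // SEW/LMUL ratio, so both produce a vbool32_t-compatible mask layout).
  vuint32m1_t v = __riscv_vle32_v_u32m1(sample, vl);
  vuint8mf4_t f = __riscv_vle8_v_u8mf4(valid, vl);
  // Lanes with a nonzero flag participate in the update.
  vbool32_t vm = __riscv_vmsne_vx_u8mf4_b32(f, 0, vl);
  // Active lanes become max(acc, v); masked-off and tail lanes keep their
  // previous values from acc (the vd operand).
  return __riscv_vmaxu_vv_u32m1_tumu(vm, acc, acc, v, vl);
}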
// masked functions (mask undisturbed: _mu variants)
vint8mf8_t __riscv_vmin_vv_i8mf8_mu(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs2,
                                    vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vmin_vx_i8mf8_mu(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs2,
                                    int8_t rs1, size_t vl);
vint8mf4_t __riscv_vmin_vv_i8mf4_mu(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs2,
                                    vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vmin_vx_i8mf4_mu(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs2,
                                    int8_t rs1, size_t vl);
vint8mf2_t __riscv_vmin_vv_i8mf2_mu(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs2,
                                    vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vmin_vx_i8mf2_mu(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs2,
                                    int8_t rs1, size_t vl);
vint8m1_t __riscv_vmin_vv_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                  vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vmin_vx_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                  int8_t rs1, size_t vl);
vint8m2_t __riscv_vmin_vv_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                  vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vmin_vx_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                  int8_t rs1, size_t vl);
vint8m4_t __riscv_vmin_vv_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                  vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vmin_vx_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                  int8_t rs1, size_t vl);
vint8m8_t __riscv_vmin_vv_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                  vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vmin_vx_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                  int8_t rs1, size_t vl);
vint16mf4_t __riscv_vmin_vv_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                      vint16mf4_t vs2, vint16mf4_t vs1,
                                      size_t vl);
vint16mf4_t __riscv_vmin_vx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                      vint16mf4_t vs2, int16_t rs1, size_t vl);
vint16mf2_t __riscv_vmin_vv_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                      vint16mf2_t vs2, vint16mf2_t vs1,
                                      size_t vl);
vint16mf2_t __riscv_vmin_vx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                      vint16mf2_t vs2, int16_t rs1, size_t vl);
vint16m1_t __riscv_vmin_vv_i16m1_mu(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                                    vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vmin_vx_i16m1_mu(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                                    int16_t rs1, size_t vl);
vint16m2_t __riscv_vmin_vv_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                    vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vmin_vx_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                    int16_t rs1, size_t vl);
vint16m4_t __riscv_vmin_vv_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                    vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vmin_vx_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                    int16_t rs1, size_t vl);
vint16m8_t __riscv_vmin_vv_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                    vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vmin_vx_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                    int16_t rs1, size_t vl);
vint32mf2_t __riscv_vmin_vv_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                      vint32mf2_t vs2, vint32mf2_t vs1,
                                      size_t vl);
vint32mf2_t __riscv_vmin_vx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                      vint32mf2_t vs2, int32_t rs1, size_t vl);
vint32m1_t __riscv_vmin_vv_i32m1_mu(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                                    vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vmin_vx_i32m1_mu(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                                    int32_t rs1, size_t vl);
vint32m2_t __riscv_vmin_vv_i32m2_mu(vbool16_t vm, vint32m2_t vd, vint32m2_t vs2,
                                    vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vmin_vx_i32m2_mu(vbool16_t vm, vint32m2_t vd, vint32m2_t vs2,
                                    int32_t rs1, size_t vl);
vint32m4_t __riscv_vmin_vv_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                    vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vmin_vx_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                    int32_t rs1, size_t vl);
vint32m8_t __riscv_vmin_vv_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                    vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vmin_vx_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                    int32_t rs1, size_t vl);
vint64m1_t __riscv_vmin_vv_i64m1_mu(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                                    vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vmin_vx_i64m1_mu(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                                    int64_t rs1, size_t vl);
vint64m2_t __riscv_vmin_vv_i64m2_mu(vbool32_t vm, vint64m2_t vd, vint64m2_t vs2,
                                    vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vmin_vx_i64m2_mu(vbool32_t vm, vint64m2_t vd, vint64m2_t vs2,
                                    int64_t rs1, size_t vl);
vint64m4_t __riscv_vmin_vv_i64m4_mu(vbool16_t vm, vint64m4_t vd, vint64m4_t vs2,
                                    vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vmin_vx_i64m4_mu(vbool16_t vm, vint64m4_t vd, vint64m4_t vs2,
                                    int64_t rs1, size_t vl);
vint64m8_t __riscv_vmin_vv_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                    vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vmin_vx_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                    int64_t rs1, size_t vl);
vint8mf8_t __riscv_vmax_vv_i8mf8_mu(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs2,
                                    vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vmax_vx_i8mf8_mu(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs2,
                                    int8_t rs1, size_t vl);
vint8mf4_t __riscv_vmax_vv_i8mf4_mu(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs2,
                                    vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vmax_vx_i8mf4_mu(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs2,
                                    int8_t rs1, size_t vl);
vint8mf2_t __riscv_vmax_vv_i8mf2_mu(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs2,
                                    vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vmax_vx_i8mf2_mu(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs2,
                                    int8_t rs1, size_t vl);
vint8m1_t __riscv_vmax_vv_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                  vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vmax_vx_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                  int8_t rs1, size_t vl);
vint8m2_t __riscv_vmax_vv_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                  vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vmax_vx_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                  int8_t rs1, size_t vl);
vint8m4_t __riscv_vmax_vv_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                  vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vmax_vx_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                  int8_t rs1, size_t vl);
vint8m8_t __riscv_vmax_vv_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                  vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vmax_vx_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                  int8_t rs1, size_t vl);
vint16mf4_t __riscv_vmax_vv_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                      vint16mf4_t vs2, vint16mf4_t vs1,
                                      size_t vl);
vint16mf4_t __riscv_vmax_vx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                      vint16mf4_t vs2, int16_t rs1, size_t vl);
vint16mf2_t __riscv_vmax_vv_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                      vint16mf2_t vs2, vint16mf2_t vs1,
                                      size_t vl);
vint16mf2_t __riscv_vmax_vx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                      vint16mf2_t vs2, int16_t rs1, size_t vl);
vint16m1_t __riscv_vmax_vv_i16m1_mu(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                                    vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vmax_vx_i16m1_mu(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                                    int16_t rs1, size_t vl);
vint16m2_t __riscv_vmax_vv_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                    vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vmax_vx_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                    int16_t rs1, size_t vl);
vint16m4_t __riscv_vmax_vv_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                    vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vmax_vx_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                    int16_t rs1, size_t vl);
vint16m8_t __riscv_vmax_vv_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                    vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vmax_vx_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                    int16_t rs1, size_t vl);
vint32mf2_t __riscv_vmax_vv_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                      vint32mf2_t vs2, vint32mf2_t vs1,
                                      size_t vl);
vint32mf2_t __riscv_vmax_vx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                      vint32mf2_t vs2, int32_t rs1, size_t vl);
vint32m1_t __riscv_vmax_vv_i32m1_mu(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                                    vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vmax_vx_i32m1_mu(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                                    int32_t rs1, size_t vl);
vint32m2_t __riscv_vmax_vv_i32m2_mu(vbool16_t vm, vint32m2_t vd, vint32m2_t vs2,
                                    vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vmax_vx_i32m2_mu(vbool16_t vm, vint32m2_t vd, vint32m2_t vs2,
                                    int32_t rs1, size_t vl);
vint32m4_t __riscv_vmax_vv_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                    vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vmax_vx_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                    int32_t rs1, size_t vl);
vint32m8_t __riscv_vmax_vv_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                    vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vmax_vx_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                    int32_t rs1, size_t vl);
vint64m1_t __riscv_vmax_vv_i64m1_mu(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                                    vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vmax_vx_i64m1_mu(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                                    int64_t rs1, size_t vl);
vint64m2_t __riscv_vmax_vv_i64m2_mu(vbool32_t vm, vint64m2_t vd, vint64m2_t vs2,
                                    vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vmax_vx_i64m2_mu(vbool32_t vm, vint64m2_t vd, vint64m2_t vs2,
                                    int64_t rs1, size_t vl);
vint64m4_t __riscv_vmax_vv_i64m4_mu(vbool16_t vm, vint64m4_t vd, vint64m4_t vs2,
                                    vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vmax_vx_i64m4_mu(vbool16_t vm, vint64m4_t vd, vint64m4_t vs2,
                                    int64_t rs1, size_t vl);
vint64m8_t __riscv_vmax_vv_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                    vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vmax_vx_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                    int64_t rs1, size_t vl);
vuint8mf8_t __riscv_vminu_vv_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                      vuint8mf8_t vs2, vuint8mf8_t vs1,
                                      size_t vl);
vuint8mf8_t __riscv_vminu_vx_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                      vuint8mf8_t vs2, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vminu_vv_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                      vuint8mf4_t vs2, vuint8mf4_t vs1,
                                      size_t vl);
vuint8mf4_t __riscv_vminu_vx_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                      vuint8mf4_t vs2, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vminu_vv_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                      vuint8mf2_t vs2, vuint8mf2_t vs1,
                                      size_t vl);
vuint8mf2_t __riscv_vminu_vx_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                      vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vminu_vv_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                    vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vminu_vx_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vminu_vv_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                    vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vminu_vx_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vminu_vv_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                    vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vminu_vx_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vminu_vv_u8m8_mu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                    vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vminu_vx_u8m8_mu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                    uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vminu_vv_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                        vuint16mf4_t vs2, vuint16mf4_t vs1,
                                        size_t vl);
vuint16mf4_t __riscv_vminu_vx_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                        vuint16mf4_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16mf2_t __riscv_vminu_vv_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                        vuint16mf2_t vs2, vuint16mf2_t vs1,
                                        size_t vl);
vuint16mf2_t __riscv_vminu_vx_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                        vuint16mf2_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16m1_t __riscv_vminu_vv_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                      vuint16m1_t vs2, vuint16m1_t vs1,
                                      size_t vl);
vuint16m1_t __riscv_vminu_vx_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                      vuint16m1_t vs2, uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vminu_vv_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                      vuint16m2_t vs2, vuint16m2_t vs1,
                                      size_t vl);
vuint16m2_t __riscv_vminu_vx_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                      vuint16m2_t vs2, uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vminu_vv_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                      vuint16m4_t vs2, vuint16m4_t vs1,
                                      size_t vl);
vuint16m4_t __riscv_vminu_vx_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                      vuint16m4_t vs2, uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vminu_vv_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                      vuint16m8_t vs2, vuint16m8_t vs1,
                                      size_t vl);
vuint16m8_t __riscv_vminu_vx_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                      vuint16m8_t vs2, uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vminu_vv_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                        vuint32mf2_t vs2, vuint32mf2_t vs1,
                                        size_t vl);
vuint32mf2_t __riscv_vminu_vx_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                        vuint32mf2_t vs2, uint32_t rs1,
                                        size_t vl);
vuint32m1_t __riscv_vminu_vv_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                      vuint32m1_t vs2, vuint32m1_t vs1,
                                      size_t vl);
vuint32m1_t __riscv_vminu_vx_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                      vuint32m1_t vs2, uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vminu_vv_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                      vuint32m2_t vs2, vuint32m2_t vs1,
                                      size_t vl);
vuint32m2_t __riscv_vminu_vx_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                      vuint32m2_t vs2, uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vminu_vv_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                      vuint32m4_t vs2, vuint32m4_t vs1,
                                      size_t vl);
vuint32m4_t __riscv_vminu_vx_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                      vuint32m4_t vs2, uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vminu_vv_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                      vuint32m8_t vs2, vuint32m8_t vs1,
                                      size_t vl);
vuint32m8_t __riscv_vminu_vx_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                      vuint32m8_t vs2, uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vminu_vv_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                      vuint64m1_t vs2, vuint64m1_t vs1,
                                      size_t vl);
vuint64m1_t __riscv_vminu_vx_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                      vuint64m1_t vs2, uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vminu_vv_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                      vuint64m2_t vs2, vuint64m2_t vs1,
                                      size_t vl);
vuint64m2_t __riscv_vminu_vx_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                      vuint64m2_t vs2, uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vminu_vv_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                      vuint64m4_t vs2, vuint64m4_t vs1,
                                      size_t vl);
vuint64m4_t __riscv_vminu_vx_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                      vuint64m4_t vs2, uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vminu_vv_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                      vuint64m8_t vs2, vuint64m8_t vs1,
                                      size_t vl);
vuint64m8_t __riscv_vminu_vx_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                      vuint64m8_t vs2, uint64_t rs1, size_t vl);
vuint8mf8_t __riscv_vmaxu_vv_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                      vuint8mf8_t vs2, vuint8mf8_t vs1,
                                      size_t vl);
vuint8mf8_t __riscv_vmaxu_vx_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                      vuint8mf8_t vs2, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vmaxu_vv_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                      vuint8mf4_t vs2, vuint8mf4_t vs1,
                                      size_t vl);
vuint8mf4_t __riscv_vmaxu_vx_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                      vuint8mf4_t vs2, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vmaxu_vv_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                      vuint8mf2_t vs2, vuint8mf2_t vs1,
                                      size_t vl);
vuint8mf2_t __riscv_vmaxu_vx_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                      vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vmaxu_vv_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                    vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vmaxu_vx_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vmaxu_vv_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                    vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vmaxu_vx_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vmaxu_vv_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                    vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vmaxu_vx_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vmaxu_vv_u8m8_mu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                    vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vmaxu_vx_u8m8_mu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                    uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vmaxu_vv_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                        vuint16mf4_t vs2, vuint16mf4_t vs1,
                                        size_t vl);
vuint16mf4_t __riscv_vmaxu_vx_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                        vuint16mf4_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16mf2_t __riscv_vmaxu_vv_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                        vuint16mf2_t vs2, vuint16mf2_t vs1,
                                        size_t vl);
vuint16mf2_t __riscv_vmaxu_vx_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                        vuint16mf2_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16m1_t __riscv_vmaxu_vv_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                      vuint16m1_t vs2, vuint16m1_t vs1,
                                      size_t vl);
vuint16m1_t __riscv_vmaxu_vx_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                      vuint16m1_t vs2, uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vmaxu_vv_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                      vuint16m2_t vs2, vuint16m2_t vs1,
                                      size_t vl);
vuint16m2_t __riscv_vmaxu_vx_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                      vuint16m2_t vs2, uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vmaxu_vv_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                      vuint16m4_t vs2, vuint16m4_t vs1,
                                      size_t vl);
vuint16m4_t __riscv_vmaxu_vx_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                      vuint16m4_t vs2, uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vmaxu_vv_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                      vuint16m8_t vs2, vuint16m8_t vs1,
                                      size_t vl);
vuint16m8_t __riscv_vmaxu_vx_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                      vuint16m8_t vs2, uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vmaxu_vv_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                        vuint32mf2_t vs2, vuint32mf2_t vs1,
                                        size_t vl);
vuint32mf2_t __riscv_vmaxu_vx_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                        vuint32mf2_t vs2, uint32_t rs1,
                                        size_t vl);
vuint32m1_t __riscv_vmaxu_vv_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                      vuint32m1_t vs2, vuint32m1_t vs1,
                                      size_t vl);
vuint32m1_t __riscv_vmaxu_vx_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                      vuint32m1_t vs2, uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vmaxu_vv_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                      vuint32m2_t vs2, vuint32m2_t vs1,
                                      size_t vl);
vuint32m2_t __riscv_vmaxu_vx_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                      vuint32m2_t vs2, uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vmaxu_vv_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                      vuint32m4_t vs2, vuint32m4_t vs1,
                                      size_t vl);
vuint32m4_t __riscv_vmaxu_vx_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                      vuint32m4_t vs2, uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vmaxu_vv_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                      vuint32m8_t vs2, vuint32m8_t vs1,
                                      size_t vl);
vuint32m8_t __riscv_vmaxu_vx_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                      vuint32m8_t vs2, uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vmaxu_vv_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                      vuint64m1_t vs2, vuint64m1_t vs1,
                                      size_t vl);
vuint64m1_t __riscv_vmaxu_vx_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                      vuint64m1_t vs2, uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vmaxu_vv_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                      vuint64m2_t vs2, vuint64m2_t vs1,
                                      size_t vl);
vuint64m2_t __riscv_vmaxu_vx_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                      vuint64m2_t vs2, uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vmaxu_vv_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                      vuint64m4_t vs2, vuint64m4_t vs1,
                                      size_t vl);
vuint64m4_t __riscv_vmaxu_vx_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                      vuint64m4_t vs2, uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vmaxu_vv_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                      vuint64m8_t vs2, vuint64m8_t vs1,
                                      size_t vl);
vuint64m8_t __riscv_vmaxu_vx_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                      vuint64m8_t vs2, uint64_t rs1, size_t vl);

Vector Single-Width Integer Multiply Intrinsics

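These intrinsics compute element-wise products: vmul returns the low half of the product, vmulh/vmulhu the high half of the signed/unsigned widened product, and vmulhsu the high half of a signed-by-unsigned product. A minimal sketch (not part of the listing) of combining the low and high halves with the tail-undisturbed (_tu) policy follows; it assumes <riscv_vector.h>, and the helper name mul_full_i32m1 is hypothetical. Elements past vl keep whatever the destination operands already contained, as the _tu policy specifies.

#include <riscv_vector.h>

// Compute both halves of a signed 32x32 -> 64-bit product, per element.
void mul_full_i32m1(vint32m1_t *lo, vint32m1_t *hi,
                    vint32m1_t vs2, vint32m1_t vs1, size_t vl) {
  *lo = __riscv_vmul_vv_i32m1_tu(*lo, vs2, vs1, vl);   // low 32 bits of product
  *hi = __riscv_vmulh_vv_i32m1_tu(*hi, vs2, vs1, vl);  // high 32 bits of product
}
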
vint8mf8_t __riscv_vmul_vv_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2,
                                    vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vmul_vx_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2, int8_t rs1,
                                    size_t vl);
vint8mf4_t __riscv_vmul_vv_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2,
                                    vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vmul_vx_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2, int8_t rs1,
                                    size_t vl);
vint8mf2_t __riscv_vmul_vv_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2,
                                    vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vmul_vx_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2, int8_t rs1,
                                    size_t vl);
vint8m1_t __riscv_vmul_vv_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, vint8m1_t vs1,
                                  size_t vl);
vint8m1_t __riscv_vmul_vx_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, int8_t rs1,
                                  size_t vl);
vint8m2_t __riscv_vmul_vv_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, vint8m2_t vs1,
                                  size_t vl);
vint8m2_t __riscv_vmul_vx_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, int8_t rs1,
                                  size_t vl);
vint8m4_t __riscv_vmul_vv_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, vint8m4_t vs1,
                                  size_t vl);
vint8m4_t __riscv_vmul_vx_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, int8_t rs1,
                                  size_t vl);
vint8m8_t __riscv_vmul_vv_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, vint8m8_t vs1,
                                  size_t vl);
vint8m8_t __riscv_vmul_vx_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, int8_t rs1,
                                  size_t vl);
vint16mf4_t __riscv_vmul_vv_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                      vint16mf4_t vs1, size_t vl);
vint16mf4_t __riscv_vmul_vx_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                      int16_t rs1, size_t vl);
vint16mf2_t __riscv_vmul_vv_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                      vint16mf2_t vs1, size_t vl);
vint16mf2_t __riscv_vmul_vx_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                      int16_t rs1, size_t vl);
vint16m1_t __riscv_vmul_vv_i16m1_tu(vint16m1_t vd, vint16m1_t vs2,
                                    vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vmul_vx_i16m1_tu(vint16m1_t vd, vint16m1_t vs2, int16_t rs1,
                                    size_t vl);
vint16m2_t __riscv_vmul_vv_i16m2_tu(vint16m2_t vd, vint16m2_t vs2,
                                    vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vmul_vx_i16m2_tu(vint16m2_t vd, vint16m2_t vs2, int16_t rs1,
                                    size_t vl);
vint16m4_t __riscv_vmul_vv_i16m4_tu(vint16m4_t vd, vint16m4_t vs2,
                                    vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vmul_vx_i16m4_tu(vint16m4_t vd, vint16m4_t vs2, int16_t rs1,
                                    size_t vl);
vint16m8_t __riscv_vmul_vv_i16m8_tu(vint16m8_t vd, vint16m8_t vs2,
                                    vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vmul_vx_i16m8_tu(vint16m8_t vd, vint16m8_t vs2, int16_t rs1,
                                    size_t vl);
vint32mf2_t __riscv_vmul_vv_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                      vint32mf2_t vs1, size_t vl);
vint32mf2_t __riscv_vmul_vx_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                      int32_t rs1, size_t vl);
vint32m1_t __riscv_vmul_vv_i32m1_tu(vint32m1_t vd, vint32m1_t vs2,
                                    vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vmul_vx_i32m1_tu(vint32m1_t vd, vint32m1_t vs2, int32_t rs1,
                                    size_t vl);
vint32m2_t __riscv_vmul_vv_i32m2_tu(vint32m2_t vd, vint32m2_t vs2,
                                    vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vmul_vx_i32m2_tu(vint32m2_t vd, vint32m2_t vs2, int32_t rs1,
                                    size_t vl);
vint32m4_t __riscv_vmul_vv_i32m4_tu(vint32m4_t vd, vint32m4_t vs2,
                                    vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vmul_vx_i32m4_tu(vint32m4_t vd, vint32m4_t vs2, int32_t rs1,
                                    size_t vl);
vint32m8_t __riscv_vmul_vv_i32m8_tu(vint32m8_t vd, vint32m8_t vs2,
                                    vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vmul_vx_i32m8_tu(vint32m8_t vd, vint32m8_t vs2, int32_t rs1,
                                    size_t vl);
vint64m1_t __riscv_vmul_vv_i64m1_tu(vint64m1_t vd, vint64m1_t vs2,
                                    vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vmul_vx_i64m1_tu(vint64m1_t vd, vint64m1_t vs2, int64_t rs1,
                                    size_t vl);
vint64m2_t __riscv_vmul_vv_i64m2_tu(vint64m2_t vd, vint64m2_t vs2,
                                    vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vmul_vx_i64m2_tu(vint64m2_t vd, vint64m2_t vs2, int64_t rs1,
                                    size_t vl);
vint64m4_t __riscv_vmul_vv_i64m4_tu(vint64m4_t vd, vint64m4_t vs2,
                                    vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vmul_vx_i64m4_tu(vint64m4_t vd, vint64m4_t vs2, int64_t rs1,
                                    size_t vl);
vint64m8_t __riscv_vmul_vv_i64m8_tu(vint64m8_t vd, vint64m8_t vs2,
                                    vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vmul_vx_i64m8_tu(vint64m8_t vd, vint64m8_t vs2, int64_t rs1,
                                    size_t vl);
vint8mf8_t __riscv_vmulh_vv_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2,
                                     vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vmulh_vx_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2, int8_t rs1,
                                     size_t vl);
vint8mf4_t __riscv_vmulh_vv_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2,
                                     vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vmulh_vx_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2, int8_t rs1,
                                     size_t vl);
vint8mf2_t __riscv_vmulh_vv_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2,
                                     vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vmulh_vx_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2, int8_t rs1,
                                     size_t vl);
vint8m1_t __riscv_vmulh_vv_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, vint8m1_t vs1,
                                   size_t vl);
vint8m1_t __riscv_vmulh_vx_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, int8_t rs1,
                                   size_t vl);
vint8m2_t __riscv_vmulh_vv_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, vint8m2_t vs1,
                                   size_t vl);
vint8m2_t __riscv_vmulh_vx_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, int8_t rs1,
                                   size_t vl);
vint8m4_t __riscv_vmulh_vv_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, vint8m4_t vs1,
                                   size_t vl);
vint8m4_t __riscv_vmulh_vx_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, int8_t rs1,
                                   size_t vl);
vint8m8_t __riscv_vmulh_vv_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, vint8m8_t vs1,
                                   size_t vl);
vint8m8_t __riscv_vmulh_vx_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, int8_t rs1,
                                   size_t vl);
vint16mf4_t __riscv_vmulh_vv_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                       vint16mf4_t vs1, size_t vl);
vint16mf4_t __riscv_vmulh_vx_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                       int16_t rs1, size_t vl);
vint16mf2_t __riscv_vmulh_vv_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                       vint16mf2_t vs1, size_t vl);
vint16mf2_t __riscv_vmulh_vx_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                       int16_t rs1, size_t vl);
vint16m1_t __riscv_vmulh_vv_i16m1_tu(vint16m1_t vd, vint16m1_t vs2,
                                     vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vmulh_vx_i16m1_tu(vint16m1_t vd, vint16m1_t vs2, int16_t rs1,
                                     size_t vl);
vint16m2_t __riscv_vmulh_vv_i16m2_tu(vint16m2_t vd, vint16m2_t vs2,
                                     vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vmulh_vx_i16m2_tu(vint16m2_t vd, vint16m2_t vs2, int16_t rs1,
                                     size_t vl);
vint16m4_t __riscv_vmulh_vv_i16m4_tu(vint16m4_t vd, vint16m4_t vs2,
                                     vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vmulh_vx_i16m4_tu(vint16m4_t vd, vint16m4_t vs2, int16_t rs1,
                                     size_t vl);
vint16m8_t __riscv_vmulh_vv_i16m8_tu(vint16m8_t vd, vint16m8_t vs2,
                                     vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vmulh_vx_i16m8_tu(vint16m8_t vd, vint16m8_t vs2, int16_t rs1,
                                     size_t vl);
vint32mf2_t __riscv_vmulh_vv_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                       vint32mf2_t vs1, size_t vl);
vint32mf2_t __riscv_vmulh_vx_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                       int32_t rs1, size_t vl);
vint32m1_t __riscv_vmulh_vv_i32m1_tu(vint32m1_t vd, vint32m1_t vs2,
                                     vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vmulh_vx_i32m1_tu(vint32m1_t vd, vint32m1_t vs2, int32_t rs1,
                                     size_t vl);
vint32m2_t __riscv_vmulh_vv_i32m2_tu(vint32m2_t vd, vint32m2_t vs2,
                                     vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vmulh_vx_i32m2_tu(vint32m2_t vd, vint32m2_t vs2, int32_t rs1,
                                     size_t vl);
vint32m4_t __riscv_vmulh_vv_i32m4_tu(vint32m4_t vd, vint32m4_t vs2,
                                     vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vmulh_vx_i32m4_tu(vint32m4_t vd, vint32m4_t vs2, int32_t rs1,
                                     size_t vl);
vint32m8_t __riscv_vmulh_vv_i32m8_tu(vint32m8_t vd, vint32m8_t vs2,
                                     vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vmulh_vx_i32m8_tu(vint32m8_t vd, vint32m8_t vs2, int32_t rs1,
                                     size_t vl);
vint64m1_t __riscv_vmulh_vv_i64m1_tu(vint64m1_t vd, vint64m1_t vs2,
                                     vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vmulh_vx_i64m1_tu(vint64m1_t vd, vint64m1_t vs2, int64_t rs1,
                                     size_t vl);
vint64m2_t __riscv_vmulh_vv_i64m2_tu(vint64m2_t vd, vint64m2_t vs2,
                                     vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vmulh_vx_i64m2_tu(vint64m2_t vd, vint64m2_t vs2, int64_t rs1,
                                     size_t vl);
vint64m4_t __riscv_vmulh_vv_i64m4_tu(vint64m4_t vd, vint64m4_t vs2,
                                     vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vmulh_vx_i64m4_tu(vint64m4_t vd, vint64m4_t vs2, int64_t rs1,
                                     size_t vl);
vint64m8_t __riscv_vmulh_vv_i64m8_tu(vint64m8_t vd, vint64m8_t vs2,
                                     vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vmulh_vx_i64m8_tu(vint64m8_t vd, vint64m8_t vs2, int64_t rs1,
                                     size_t vl);
vint8mf8_t __riscv_vmulhsu_vv_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2,
                                       vuint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vmulhsu_vx_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2,
                                       uint8_t rs1, size_t vl);
vint8mf4_t __riscv_vmulhsu_vv_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2,
                                       vuint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vmulhsu_vx_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2,
                                       uint8_t rs1, size_t vl);
vint8mf2_t __riscv_vmulhsu_vv_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2,
                                       vuint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vmulhsu_vx_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2,
                                       uint8_t rs1, size_t vl);
vint8m1_t __riscv_vmulhsu_vv_i8m1_tu(vint8m1_t vd, vint8m1_t vs2,
                                     vuint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vmulhsu_vx_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, uint8_t rs1,
                                     size_t vl);
vint8m2_t __riscv_vmulhsu_vv_i8m2_tu(vint8m2_t vd, vint8m2_t vs2,
                                     vuint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vmulhsu_vx_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, uint8_t rs1,
                                     size_t vl);
vint8m4_t __riscv_vmulhsu_vv_i8m4_tu(vint8m4_t vd, vint8m4_t vs2,
                                     vuint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vmulhsu_vx_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, uint8_t rs1,
                                     size_t vl);
vint8m8_t __riscv_vmulhsu_vv_i8m8_tu(vint8m8_t vd, vint8m8_t vs2,
                                     vuint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vmulhsu_vx_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, uint8_t rs1,
                                     size_t vl);
vint16mf4_t __riscv_vmulhsu_vv_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                         vuint16mf4_t vs1, size_t vl);
vint16mf4_t __riscv_vmulhsu_vx_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                         uint16_t rs1, size_t vl);
vint16mf2_t __riscv_vmulhsu_vv_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                         vuint16mf2_t vs1, size_t vl);
vint16mf2_t __riscv_vmulhsu_vx_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                         uint16_t rs1, size_t vl);
vint16m1_t __riscv_vmulhsu_vv_i16m1_tu(vint16m1_t vd, vint16m1_t vs2,
                                       vuint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vmulhsu_vx_i16m1_tu(vint16m1_t vd, vint16m1_t vs2,
                                       uint16_t rs1, size_t vl);
vint16m2_t __riscv_vmulhsu_vv_i16m2_tu(vint16m2_t vd, vint16m2_t vs2,
                                       vuint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vmulhsu_vx_i16m2_tu(vint16m2_t vd, vint16m2_t vs2,
                                       uint16_t rs1, size_t vl);
vint16m4_t __riscv_vmulhsu_vv_i16m4_tu(vint16m4_t vd, vint16m4_t vs2,
                                       vuint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vmulhsu_vx_i16m4_tu(vint16m4_t vd, vint16m4_t vs2,
                                       uint16_t rs1, size_t vl);
vint16m8_t __riscv_vmulhsu_vv_i16m8_tu(vint16m8_t vd, vint16m8_t vs2,
                                       vuint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vmulhsu_vx_i16m8_tu(vint16m8_t vd, vint16m8_t vs2,
                                       uint16_t rs1, size_t vl);
vint32mf2_t __riscv_vmulhsu_vv_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                         vuint32mf2_t vs1, size_t vl);
vint32mf2_t __riscv_vmulhsu_vx_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                         uint32_t rs1, size_t vl);
vint32m1_t __riscv_vmulhsu_vv_i32m1_tu(vint32m1_t vd, vint32m1_t vs2,
                                       vuint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vmulhsu_vx_i32m1_tu(vint32m1_t vd, vint32m1_t vs2,
                                       uint32_t rs1, size_t vl);
vint32m2_t __riscv_vmulhsu_vv_i32m2_tu(vint32m2_t vd, vint32m2_t vs2,
                                       vuint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vmulhsu_vx_i32m2_tu(vint32m2_t vd, vint32m2_t vs2,
                                       uint32_t rs1, size_t vl);
vint32m4_t __riscv_vmulhsu_vv_i32m4_tu(vint32m4_t vd, vint32m4_t vs2,
                                       vuint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vmulhsu_vx_i32m4_tu(vint32m4_t vd, vint32m4_t vs2,
                                       uint32_t rs1, size_t vl);
vint32m8_t __riscv_vmulhsu_vv_i32m8_tu(vint32m8_t vd, vint32m8_t vs2,
                                       vuint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vmulhsu_vx_i32m8_tu(vint32m8_t vd, vint32m8_t vs2,
                                       uint32_t rs1, size_t vl);
vint64m1_t __riscv_vmulhsu_vv_i64m1_tu(vint64m1_t vd, vint64m1_t vs2,
                                       vuint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vmulhsu_vx_i64m1_tu(vint64m1_t vd, vint64m1_t vs2,
                                       uint64_t rs1, size_t vl);
vint64m2_t __riscv_vmulhsu_vv_i64m2_tu(vint64m2_t vd, vint64m2_t vs2,
                                       vuint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vmulhsu_vx_i64m2_tu(vint64m2_t vd, vint64m2_t vs2,
                                       uint64_t rs1, size_t vl);
vint64m4_t __riscv_vmulhsu_vv_i64m4_tu(vint64m4_t vd, vint64m4_t vs2,
                                       vuint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vmulhsu_vx_i64m4_tu(vint64m4_t vd, vint64m4_t vs2,
                                       uint64_t rs1, size_t vl);
vint64m8_t __riscv_vmulhsu_vv_i64m8_tu(vint64m8_t vd, vint64m8_t vs2,
                                       vuint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vmulhsu_vx_i64m8_tu(vint64m8_t vd, vint64m8_t vs2,
                                       uint64_t rs1, size_t vl);
vuint8mf8_t __riscv_vmul_vv_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                     vuint8mf8_t vs1, size_t vl);
vuint8mf8_t __riscv_vmul_vx_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vmul_vv_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                     vuint8mf4_t vs1, size_t vl);
vuint8mf4_t __riscv_vmul_vx_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vmul_vv_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                     vuint8mf2_t vs1, size_t vl);
vuint8mf2_t __riscv_vmul_vx_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vmul_vv_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2,
                                   vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vmul_vx_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2, uint8_t rs1,
                                   size_t vl);
vuint8m2_t __riscv_vmul_vv_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2,
                                   vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vmul_vx_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2, uint8_t rs1,
                                   size_t vl);
vuint8m4_t __riscv_vmul_vv_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2,
                                   vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vmul_vx_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2, uint8_t rs1,
                                   size_t vl);
vuint8m8_t __riscv_vmul_vv_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2,
                                   vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vmul_vx_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2, uint8_t rs1,
                                   size_t vl);
vuint16mf4_t __riscv_vmul_vv_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                       vuint16mf4_t vs1, size_t vl);
vuint16mf4_t __riscv_vmul_vx_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                       uint16_t rs1, size_t vl);
vuint16mf2_t __riscv_vmul_vv_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                       vuint16mf2_t vs1, size_t vl);
vuint16mf2_t __riscv_vmul_vx_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                       uint16_t rs1, size_t vl);
vuint16m1_t __riscv_vmul_vv_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                     vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vmul_vx_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                     uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vmul_vv_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                     vuint16m2_t vs1, size_t vl);
vuint16m2_t __riscv_vmul_vx_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                     uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vmul_vv_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                     vuint16m4_t vs1, size_t vl);
vuint16m4_t __riscv_vmul_vx_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                     uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vmul_vv_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                     vuint16m8_t vs1, size_t vl);
vuint16m8_t __riscv_vmul_vx_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                     uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vmul_vv_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                       vuint32mf2_t vs1, size_t vl);
vuint32mf2_t __riscv_vmul_vx_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                       uint32_t rs1, size_t vl);
vuint32m1_t __riscv_vmul_vv_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                     vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vmul_vx_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                     uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vmul_vv_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                     vuint32m2_t vs1, size_t vl);
vuint32m2_t __riscv_vmul_vx_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                     uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vmul_vv_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                     vuint32m4_t vs1, size_t vl);
vuint32m4_t __riscv_vmul_vx_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                     uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vmul_vv_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                     vuint32m8_t vs1, size_t vl);
vuint32m8_t __riscv_vmul_vx_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                     uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vmul_vv_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                     vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vmul_vx_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                     uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vmul_vv_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                     vuint64m2_t vs1, size_t vl);
vuint64m2_t __riscv_vmul_vx_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                     uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vmul_vv_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                     vuint64m4_t vs1, size_t vl);
vuint64m4_t __riscv_vmul_vx_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                     uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vmul_vv_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                     vuint64m8_t vs1, size_t vl);
vuint64m8_t __riscv_vmul_vx_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                     uint64_t rs1, size_t vl);
vuint8mf8_t __riscv_vmulhu_vv_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                       vuint8mf8_t vs1, size_t vl);
vuint8mf8_t __riscv_vmulhu_vx_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                       uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vmulhu_vv_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                       vuint8mf4_t vs1, size_t vl);
vuint8mf4_t __riscv_vmulhu_vx_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                       uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vmulhu_vv_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                       vuint8mf2_t vs1, size_t vl);
vuint8mf2_t __riscv_vmulhu_vx_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                       uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vmulhu_vv_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2,
                                     vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vmulhu_vx_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2, uint8_t rs1,
                                     size_t vl);
vuint8m2_t __riscv_vmulhu_vv_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2,
                                     vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vmulhu_vx_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2, uint8_t rs1,
                                     size_t vl);
vuint8m4_t __riscv_vmulhu_vv_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2,
                                     vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vmulhu_vx_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2, uint8_t rs1,
                                     size_t vl);
vuint8m8_t __riscv_vmulhu_vv_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2,
                                     vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vmulhu_vx_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2, uint8_t rs1,
                                     size_t vl);
vuint16mf4_t __riscv_vmulhu_vv_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                         vuint16mf4_t vs1, size_t vl);
vuint16mf4_t __riscv_vmulhu_vx_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                         uint16_t rs1, size_t vl);
vuint16mf2_t __riscv_vmulhu_vv_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                         vuint16mf2_t vs1, size_t vl);
vuint16mf2_t __riscv_vmulhu_vx_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                         uint16_t rs1, size_t vl);
vuint16m1_t __riscv_vmulhu_vv_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                       vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vmulhu_vx_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                       uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vmulhu_vv_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                       vuint16m2_t vs1, size_t vl);
vuint16m2_t __riscv_vmulhu_vx_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                       uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vmulhu_vv_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                       vuint16m4_t vs1, size_t vl);
vuint16m4_t __riscv_vmulhu_vx_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                       uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vmulhu_vv_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                       vuint16m8_t vs1, size_t vl);
vuint16m8_t __riscv_vmulhu_vx_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                       uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vmulhu_vv_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                         vuint32mf2_t vs1, size_t vl);
vuint32mf2_t __riscv_vmulhu_vx_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                         uint32_t rs1, size_t vl);
vuint32m1_t __riscv_vmulhu_vv_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                       vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vmulhu_vx_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                       uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vmulhu_vv_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                       vuint32m2_t vs1, size_t vl);
vuint32m2_t __riscv_vmulhu_vx_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                       uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vmulhu_vv_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                       vuint32m4_t vs1, size_t vl);
vuint32m4_t __riscv_vmulhu_vx_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                       uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vmulhu_vv_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                       vuint32m8_t vs1, size_t vl);
vuint32m8_t __riscv_vmulhu_vx_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                       uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vmulhu_vv_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                       vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vmulhu_vx_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                       uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vmulhu_vv_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                       vuint64m2_t vs1, size_t vl);
vuint64m2_t __riscv_vmulhu_vx_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                       uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vmulhu_vv_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                       vuint64m4_t vs1, size_t vl);
vuint64m4_t __riscv_vmulhu_vx_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                       uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vmulhu_vv_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                       vuint64m8_t vs1, size_t vl);
vuint64m8_t __riscv_vmulhu_vx_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                       uint64_t rs1, size_t vl);
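
A minimal sketch (not part of the listing) of the less common vmulhsu form, which multiplies signed vs2 by unsigned vs1/rs1 and returns the upper half of the widened product. It assumes <riscv_vector.h>; the helper name high_signed_by_unsigned is hypothetical.

#include <riscv_vector.h>

// Upper 64 bits of signed(vs2[i]) * unsigned(rs1), tail kept undisturbed.
vint64m1_t high_signed_by_unsigned(vint64m1_t vd, vint64m1_t vs2,
                                   uint64_t rs1, size_t vl) {
  return __riscv_vmulhsu_vx_i64m1_tu(vd, vs2, rs1, vl);
}
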
// masked functions
vint8mf8_t __riscv_vmul_vv_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                     vint8mf8_t vs2, vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vmul_vx_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                     vint8mf8_t vs2, int8_t rs1, size_t vl);
vint8mf4_t __riscv_vmul_vv_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                     vint8mf4_t vs2, vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vmul_vx_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                     vint8mf4_t vs2, int8_t rs1, size_t vl);
vint8mf2_t __riscv_vmul_vv_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                     vint8mf2_t vs2, vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vmul_vx_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                     vint8mf2_t vs2, int8_t rs1, size_t vl);
vint8m1_t __riscv_vmul_vv_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                   vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vmul_vx_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                   int8_t rs1, size_t vl);
vint8m2_t __riscv_vmul_vv_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                   vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vmul_vx_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                   int8_t rs1, size_t vl);
vint8m4_t __riscv_vmul_vv_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                   vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vmul_vx_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                   int8_t rs1, size_t vl);
vint8m8_t __riscv_vmul_vv_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                   vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vmul_vx_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                   int8_t rs1, size_t vl);
vint16mf4_t __riscv_vmul_vv_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs2, vint16mf4_t vs1,
                                       size_t vl);
vint16mf4_t __riscv_vmul_vx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs2, int16_t rs1, size_t vl);
vint16mf2_t __riscv_vmul_vv_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs2, vint16mf2_t vs1,
                                       size_t vl);
vint16mf2_t __riscv_vmul_vx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs2, int16_t rs1, size_t vl);
vint16m1_t __riscv_vmul_vv_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs2, vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vmul_vx_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs2, int16_t rs1, size_t vl);
vint16m2_t __riscv_vmul_vv_i16m2_tum(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                     vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vmul_vx_i16m2_tum(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                     int16_t rs1, size_t vl);
vint16m4_t __riscv_vmul_vv_i16m4_tum(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                     vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vmul_vx_i16m4_tum(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                     int16_t rs1, size_t vl);
vint16m8_t __riscv_vmul_vv_i16m8_tum(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                     vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vmul_vx_i16m8_tum(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                     int16_t rs1, size_t vl);
vint32mf2_t __riscv_vmul_vv_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs2, vint32mf2_t vs1,
                                       size_t vl);
vint32mf2_t __riscv_vmul_vx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs2, int32_t rs1, size_t vl);
vint32m1_t __riscv_vmul_vv_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs2, vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vmul_vx_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs2, int32_t rs1, size_t vl);
vint32m2_t __riscv_vmul_vv_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs2, vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vmul_vx_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs2, int32_t rs1, size_t vl);
vint32m4_t __riscv_vmul_vv_i32m4_tum(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                     vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vmul_vx_i32m4_tum(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                     int32_t rs1, size_t vl);
vint32m8_t __riscv_vmul_vv_i32m8_tum(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                     vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vmul_vx_i32m8_tum(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                     int32_t rs1, size_t vl);
vint64m1_t __riscv_vmul_vv_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs2, vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vmul_vx_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs2, int64_t rs1, size_t vl);
vint64m2_t __riscv_vmul_vv_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs2, vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vmul_vx_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs2, int64_t rs1, size_t vl);
vint64m4_t __riscv_vmul_vv_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs2, vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vmul_vx_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs2, int64_t rs1, size_t vl);
vint64m8_t __riscv_vmul_vv_i64m8_tum(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                     vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vmul_vx_i64m8_tum(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                     int64_t rs1, size_t vl);
vint8mf8_t __riscv_vmulh_vv_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                      vint8mf8_t vs2, vint8mf8_t vs1,
                                      size_t vl);
vint8mf8_t __riscv_vmulh_vx_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                      vint8mf8_t vs2, int8_t rs1, size_t vl);
vint8mf4_t __riscv_vmulh_vv_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                      vint8mf4_t vs2, vint8mf4_t vs1,
                                      size_t vl);
vint8mf4_t __riscv_vmulh_vx_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                      vint8mf4_t vs2, int8_t rs1, size_t vl);
vint8mf2_t __riscv_vmulh_vv_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                      vint8mf2_t vs2, vint8mf2_t vs1,
                                      size_t vl);
vint8mf2_t __riscv_vmulh_vx_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                      vint8mf2_t vs2, int8_t rs1, size_t vl);
vint8m1_t __riscv_vmulh_vv_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                    vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vmulh_vx_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                    int8_t rs1, size_t vl);
vint8m2_t __riscv_vmulh_vv_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                    vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vmulh_vx_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                    int8_t rs1, size_t vl);
vint8m4_t __riscv_vmulh_vv_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                    vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vmulh_vx_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                    int8_t rs1, size_t vl);
vint8m8_t __riscv_vmulh_vv_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                    vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vmulh_vx_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                    int8_t rs1, size_t vl);
vint16mf4_t __riscv_vmulh_vv_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs2, vint16mf4_t vs1,
                                        size_t vl);
vint16mf4_t __riscv_vmulh_vx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs2, int16_t rs1,
                                        size_t vl);
vint16mf2_t __riscv_vmulh_vv_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs2, vint16mf2_t vs1,
                                        size_t vl);
vint16mf2_t __riscv_vmulh_vx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs2, int16_t rs1,
                                        size_t vl);
vint16m1_t __riscv_vmulh_vv_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs2, vint16m1_t vs1,
                                      size_t vl);
vint16m1_t __riscv_vmulh_vx_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs2, int16_t rs1, size_t vl);
vint16m2_t __riscv_vmulh_vv_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs2, vint16m2_t vs1,
                                      size_t vl);
vint16m2_t __riscv_vmulh_vx_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs2, int16_t rs1, size_t vl);
vint16m4_t __riscv_vmulh_vv_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs2, vint16m4_t vs1,
                                      size_t vl);
vint16m4_t __riscv_vmulh_vx_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs2, int16_t rs1, size_t vl);
vint16m8_t __riscv_vmulh_vv_i16m8_tum(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs2, vint16m8_t vs1,
                                      size_t vl);
vint16m8_t __riscv_vmulh_vx_i16m8_tum(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs2, int16_t rs1, size_t vl);
vint32mf2_t __riscv_vmulh_vv_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs2, vint32mf2_t vs1,
                                        size_t vl);
vint32mf2_t __riscv_vmulh_vx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs2, int32_t rs1,
                                        size_t vl);
vint32m1_t __riscv_vmulh_vv_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs2, vint32m1_t vs1,
                                      size_t vl);
vint32m1_t __riscv_vmulh_vx_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs2, int32_t rs1, size_t vl);
vint32m2_t __riscv_vmulh_vv_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs2, vint32m2_t vs1,
                                      size_t vl);
vint32m2_t __riscv_vmulh_vx_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs2, int32_t rs1, size_t vl);
vint32m4_t __riscv_vmulh_vv_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs2, vint32m4_t vs1,
                                      size_t vl);
vint32m4_t __riscv_vmulh_vx_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs2, int32_t rs1, size_t vl);
vint32m8_t __riscv_vmulh_vv_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs2, vint32m8_t vs1,
                                      size_t vl);
vint32m8_t __riscv_vmulh_vx_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs2, int32_t rs1, size_t vl);
vint64m1_t __riscv_vmulh_vv_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs2, vint64m1_t vs1,
                                      size_t vl);
vint64m1_t __riscv_vmulh_vx_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs2, int64_t rs1, size_t vl);
vint64m2_t __riscv_vmulh_vv_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs2, vint64m2_t vs1,
                                      size_t vl);
vint64m2_t __riscv_vmulh_vx_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs2, int64_t rs1, size_t vl);
vint64m4_t __riscv_vmulh_vv_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs2, vint64m4_t vs1,
                                      size_t vl);
vint64m4_t __riscv_vmulh_vx_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs2, int64_t rs1, size_t vl);
vint64m8_t __riscv_vmulh_vv_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs2, vint64m8_t vs1,
                                      size_t vl);
vint64m8_t __riscv_vmulh_vx_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs2, int64_t rs1, size_t vl);
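// --- usage sketch (not part of the listing) ----------------------------------
// vmulh returns the high SEW bits of the 2*SEW-bit signed product; with 32-bit
// elements it computes ((int64_t)a[i] * b[i]) >> 32.  The _tum variants take
// the tail lanes (indices >= vl) of the result from vd and mask the body with
// vm; inactive lanes are mask-agnostic, so this sketch writes results back
// with a masked store.  A hypothetical example, not part of the API: names
// such as mulh_where_positive are illustrative only.
#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

static void mulh_where_positive(const int32_t *a, const int32_t *b,
                                int32_t *out, size_t n) {
  for (size_t vl; n > 0; n -= vl, a += vl, b += vl, out += vl) {
    vl = __riscv_vsetvl_e32m1(n);
    vint32m1_t va = __riscv_vle32_v_i32m1(a, vl);
    vint32m1_t vb = __riscv_vle32_v_i32m1(b, vl);
    vint32m1_t vd = __riscv_vle32_v_i32m1(out, vl);  // merge operand for _tum
    vbool32_t vm = __riscv_vmsgt_vx_i32m1_b32(va, 0, vl);  // only where a > 0
    vint32m1_t hi = __riscv_vmulh_vv_i32m1_tum(vm, vd, va, vb, vl);
    __riscv_vse32_v_i32m1_m(vm, out, hi, vl);  // store active lanes only
  }
}
// ------------------------------------------------------------------------------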
vint8mf8_t __riscv_vmulhsu_vv_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                        vint8mf8_t vs2, vuint8mf8_t vs1,
                                        size_t vl);
vint8mf8_t __riscv_vmulhsu_vx_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                        vint8mf8_t vs2, uint8_t rs1, size_t vl);
vint8mf4_t __riscv_vmulhsu_vv_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                        vint8mf4_t vs2, vuint8mf4_t vs1,
                                        size_t vl);
vint8mf4_t __riscv_vmulhsu_vx_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                        vint8mf4_t vs2, uint8_t rs1, size_t vl);
vint8mf2_t __riscv_vmulhsu_vv_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                        vint8mf2_t vs2, vuint8mf2_t vs1,
                                        size_t vl);
vint8mf2_t __riscv_vmulhsu_vx_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                        vint8mf2_t vs2, uint8_t rs1, size_t vl);
vint8m1_t __riscv_vmulhsu_vv_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                      vuint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vmulhsu_vx_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                      uint8_t rs1, size_t vl);
vint8m2_t __riscv_vmulhsu_vv_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                      vuint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vmulhsu_vx_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                      uint8_t rs1, size_t vl);
vint8m4_t __riscv_vmulhsu_vv_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                      vuint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vmulhsu_vx_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                      uint8_t rs1, size_t vl);
vint8m8_t __riscv_vmulhsu_vv_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                      vuint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vmulhsu_vx_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                      uint8_t rs1, size_t vl);
vint16mf4_t __riscv_vmulhsu_vv_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                          vint16mf4_t vs2, vuint16mf4_t vs1,
                                          size_t vl);
vint16mf4_t __riscv_vmulhsu_vx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                          vint16mf4_t vs2, uint16_t rs1,
                                          size_t vl);
vint16mf2_t __riscv_vmulhsu_vv_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                          vint16mf2_t vs2, vuint16mf2_t vs1,
                                          size_t vl);
vint16mf2_t __riscv_vmulhsu_vx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                          vint16mf2_t vs2, uint16_t rs1,
                                          size_t vl);
vint16m1_t __riscv_vmulhsu_vv_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                        vint16m1_t vs2, vuint16m1_t vs1,
                                        size_t vl);
vint16m1_t __riscv_vmulhsu_vx_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                        vint16m1_t vs2, uint16_t rs1,
                                        size_t vl);
vint16m2_t __riscv_vmulhsu_vv_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                        vint16m2_t vs2, vuint16m2_t vs1,
                                        size_t vl);
vint16m2_t __riscv_vmulhsu_vx_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                        vint16m2_t vs2, uint16_t rs1,
                                        size_t vl);
vint16m4_t __riscv_vmulhsu_vv_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                        vint16m4_t vs2, vuint16m4_t vs1,
                                        size_t vl);
vint16m4_t __riscv_vmulhsu_vx_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                        vint16m4_t vs2, uint16_t rs1,
                                        size_t vl);
vint16m8_t __riscv_vmulhsu_vv_i16m8_tum(vbool2_t vm, vint16m8_t vd,
                                        vint16m8_t vs2, vuint16m8_t vs1,
                                        size_t vl);
vint16m8_t __riscv_vmulhsu_vx_i16m8_tum(vbool2_t vm, vint16m8_t vd,
                                        vint16m8_t vs2, uint16_t rs1,
                                        size_t vl);
vint32mf2_t __riscv_vmulhsu_vv_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                          vint32mf2_t vs2, vuint32mf2_t vs1,
                                          size_t vl);
vint32mf2_t __riscv_vmulhsu_vx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                          vint32mf2_t vs2, uint32_t rs1,
                                          size_t vl);
vint32m1_t __riscv_vmulhsu_vv_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                        vint32m1_t vs2, vuint32m1_t vs1,
                                        size_t vl);
vint32m1_t __riscv_vmulhsu_vx_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                        vint32m1_t vs2, uint32_t rs1,
                                        size_t vl);
vint32m2_t __riscv_vmulhsu_vv_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                        vint32m2_t vs2, vuint32m2_t vs1,
                                        size_t vl);
vint32m2_t __riscv_vmulhsu_vx_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                        vint32m2_t vs2, uint32_t rs1,
                                        size_t vl);
vint32m4_t __riscv_vmulhsu_vv_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                        vint32m4_t vs2, vuint32m4_t vs1,
                                        size_t vl);
vint32m4_t __riscv_vmulhsu_vx_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                        vint32m4_t vs2, uint32_t rs1,
                                        size_t vl);
vint32m8_t __riscv_vmulhsu_vv_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                        vint32m8_t vs2, vuint32m8_t vs1,
                                        size_t vl);
vint32m8_t __riscv_vmulhsu_vx_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                        vint32m8_t vs2, uint32_t rs1,
                                        size_t vl);
vint64m1_t __riscv_vmulhsu_vv_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                        vint64m1_t vs2, vuint64m1_t vs1,
                                        size_t vl);
vint64m1_t __riscv_vmulhsu_vx_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                        vint64m1_t vs2, uint64_t rs1,
                                        size_t vl);
vint64m2_t __riscv_vmulhsu_vv_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                        vint64m2_t vs2, vuint64m2_t vs1,
                                        size_t vl);
vint64m2_t __riscv_vmulhsu_vx_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                        vint64m2_t vs2, uint64_t rs1,
                                        size_t vl);
vint64m4_t __riscv_vmulhsu_vv_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                        vint64m4_t vs2, vuint64m4_t vs1,
                                        size_t vl);
vint64m4_t __riscv_vmulhsu_vx_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                        vint64m4_t vs2, uint64_t rs1,
                                        size_t vl);
vint64m8_t __riscv_vmulhsu_vv_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                        vint64m8_t vs2, vuint64m8_t vs1,
                                        size_t vl);
vint64m8_t __riscv_vmulhsu_vx_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                        vint64m8_t vs2, uint64_t rs1,
                                        size_t vl);
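// --- usage sketch (not part of the listing) ----------------------------------
// vmulhsu multiplies the signed vs2 operand by the unsigned vs1/rs1 operand
// and keeps the high SEW bits of the full-width product, which is why the
// scalar of the _vx form below is a uint32_t.  A hypothetical helper, assuming
// the #include lines from the first sketch above.
static inline vint32m1_t scale_hi_by_unsigned(vbool32_t vm, vint32m1_t vd,
                                              vint32m1_t vs2, uint32_t scale,
                                              size_t vl) {
  // Active lanes become ((int64_t)vs2[i] * (int64_t)scale) >> 32; tail lanes
  // keep the values already in vd (_tum policy).
  return __riscv_vmulhsu_vx_i32m1_tum(vm, vd, vs2, scale, vl);
}
// ------------------------------------------------------------------------------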
vuint8mf8_t __riscv_vmul_vv_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                      vuint8mf8_t vs2, vuint8mf8_t vs1,
                                      size_t vl);
vuint8mf8_t __riscv_vmul_vx_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                      vuint8mf8_t vs2, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vmul_vv_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                      vuint8mf4_t vs2, vuint8mf4_t vs1,
                                      size_t vl);
vuint8mf4_t __riscv_vmul_vx_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                      vuint8mf4_t vs2, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vmul_vv_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                      vuint8mf2_t vs2, vuint8mf2_t vs1,
                                      size_t vl);
vuint8mf2_t __riscv_vmul_vx_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                      vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vmul_vv_u8m1_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                    vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vmul_vx_u8m1_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vmul_vv_u8m2_tum(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                    vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vmul_vx_u8m2_tum(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vmul_vv_u8m4_tum(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                    vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vmul_vx_u8m4_tum(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vmul_vv_u8m8_tum(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                    vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vmul_vx_u8m8_tum(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                    uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vmul_vv_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                        vuint16mf4_t vs2, vuint16mf4_t vs1,
                                        size_t vl);
vuint16mf4_t __riscv_vmul_vx_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                        vuint16mf4_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16mf2_t __riscv_vmul_vv_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                        vuint16mf2_t vs2, vuint16mf2_t vs1,
                                        size_t vl);
vuint16mf2_t __riscv_vmul_vx_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                        vuint16mf2_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16m1_t __riscv_vmul_vv_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                      vuint16m1_t vs2, vuint16m1_t vs1,
                                      size_t vl);
vuint16m1_t __riscv_vmul_vx_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                      vuint16m1_t vs2, uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vmul_vv_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                      vuint16m2_t vs2, vuint16m2_t vs1,
                                      size_t vl);
vuint16m2_t __riscv_vmul_vx_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                      vuint16m2_t vs2, uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vmul_vv_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                      vuint16m4_t vs2, vuint16m4_t vs1,
                                      size_t vl);
vuint16m4_t __riscv_vmul_vx_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                      vuint16m4_t vs2, uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vmul_vv_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                      vuint16m8_t vs2, vuint16m8_t vs1,
                                      size_t vl);
vuint16m8_t __riscv_vmul_vx_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                      vuint16m8_t vs2, uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vmul_vv_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                        vuint32mf2_t vs2, vuint32mf2_t vs1,
                                        size_t vl);
vuint32mf2_t __riscv_vmul_vx_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                        vuint32mf2_t vs2, uint32_t rs1,
                                        size_t vl);
vuint32m1_t __riscv_vmul_vv_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                      vuint32m1_t vs2, vuint32m1_t vs1,
                                      size_t vl);
vuint32m1_t __riscv_vmul_vx_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                      vuint32m1_t vs2, uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vmul_vv_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                      vuint32m2_t vs2, vuint32m2_t vs1,
                                      size_t vl);
vuint32m2_t __riscv_vmul_vx_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                      vuint32m2_t vs2, uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vmul_vv_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                      vuint32m4_t vs2, vuint32m4_t vs1,
                                      size_t vl);
vuint32m4_t __riscv_vmul_vx_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                      vuint32m4_t vs2, uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vmul_vv_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                      vuint32m8_t vs2, vuint32m8_t vs1,
                                      size_t vl);
vuint32m8_t __riscv_vmul_vx_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                      vuint32m8_t vs2, uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vmul_vv_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                      vuint64m1_t vs2, vuint64m1_t vs1,
                                      size_t vl);
vuint64m1_t __riscv_vmul_vx_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                      vuint64m1_t vs2, uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vmul_vv_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                      vuint64m2_t vs2, vuint64m2_t vs1,
                                      size_t vl);
vuint64m2_t __riscv_vmul_vx_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                      vuint64m2_t vs2, uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vmul_vv_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                      vuint64m4_t vs2, vuint64m4_t vs1,
                                      size_t vl);
vuint64m4_t __riscv_vmul_vx_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                      vuint64m4_t vs2, uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vmul_vv_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                      vuint64m8_t vs2, vuint64m8_t vs1,
                                      size_t vl);
vuint64m8_t __riscv_vmul_vx_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                      vuint64m8_t vs2, uint64_t rs1, size_t vl);
vuint8mf8_t __riscv_vmulhu_vv_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                        vuint8mf8_t vs2, vuint8mf8_t vs1,
                                        size_t vl);
vuint8mf8_t __riscv_vmulhu_vx_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                        vuint8mf8_t vs2, uint8_t rs1,
                                        size_t vl);
vuint8mf4_t __riscv_vmulhu_vv_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                        vuint8mf4_t vs2, vuint8mf4_t vs1,
                                        size_t vl);
vuint8mf4_t __riscv_vmulhu_vx_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                        vuint8mf4_t vs2, uint8_t rs1,
                                        size_t vl);
vuint8mf2_t __riscv_vmulhu_vv_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                        vuint8mf2_t vs2, vuint8mf2_t vs1,
                                        size_t vl);
vuint8mf2_t __riscv_vmulhu_vx_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                        vuint8mf2_t vs2, uint8_t rs1,
                                        size_t vl);
vuint8m1_t __riscv_vmulhu_vv_u8m1_tum(vbool8_t vm, vuint8m1_t vd,
                                      vuint8m1_t vs2, vuint8m1_t vs1,
                                      size_t vl);
vuint8m1_t __riscv_vmulhu_vx_u8m1_tum(vbool8_t vm, vuint8m1_t vd,
                                      vuint8m1_t vs2, uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vmulhu_vv_u8m2_tum(vbool4_t vm, vuint8m2_t vd,
                                      vuint8m2_t vs2, vuint8m2_t vs1,
                                      size_t vl);
vuint8m2_t __riscv_vmulhu_vx_u8m2_tum(vbool4_t vm, vuint8m2_t vd,
                                      vuint8m2_t vs2, uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vmulhu_vv_u8m4_tum(vbool2_t vm, vuint8m4_t vd,
                                      vuint8m4_t vs2, vuint8m4_t vs1,
                                      size_t vl);
vuint8m4_t __riscv_vmulhu_vx_u8m4_tum(vbool2_t vm, vuint8m4_t vd,
                                      vuint8m4_t vs2, uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vmulhu_vv_u8m8_tum(vbool1_t vm, vuint8m8_t vd,
                                      vuint8m8_t vs2, vuint8m8_t vs1,
                                      size_t vl);
vuint8m8_t __riscv_vmulhu_vx_u8m8_tum(vbool1_t vm, vuint8m8_t vd,
                                      vuint8m8_t vs2, uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vmulhu_vv_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                          vuint16mf4_t vs2, vuint16mf4_t vs1,
                                          size_t vl);
vuint16mf4_t __riscv_vmulhu_vx_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                          vuint16mf4_t vs2, uint16_t rs1,
                                          size_t vl);
vuint16mf2_t __riscv_vmulhu_vv_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                          vuint16mf2_t vs2, vuint16mf2_t vs1,
                                          size_t vl);
vuint16mf2_t __riscv_vmulhu_vx_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                          vuint16mf2_t vs2, uint16_t rs1,
                                          size_t vl);
vuint16m1_t __riscv_vmulhu_vv_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                        vuint16m1_t vs2, vuint16m1_t vs1,
                                        size_t vl);
vuint16m1_t __riscv_vmulhu_vx_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                        vuint16m1_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16m2_t __riscv_vmulhu_vv_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                        vuint16m2_t vs2, vuint16m2_t vs1,
                                        size_t vl);
vuint16m2_t __riscv_vmulhu_vx_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                        vuint16m2_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16m4_t __riscv_vmulhu_vv_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                        vuint16m4_t vs2, vuint16m4_t vs1,
                                        size_t vl);
vuint16m4_t __riscv_vmulhu_vx_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                        vuint16m4_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16m8_t __riscv_vmulhu_vv_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                        vuint16m8_t vs2, vuint16m8_t vs1,
                                        size_t vl);
vuint16m8_t __riscv_vmulhu_vx_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                        vuint16m8_t vs2, uint16_t rs1,
                                        size_t vl);
vuint32mf2_t __riscv_vmulhu_vv_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                          vuint32mf2_t vs2, vuint32mf2_t vs1,
                                          size_t vl);
vuint32mf2_t __riscv_vmulhu_vx_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                          vuint32mf2_t vs2, uint32_t rs1,
                                          size_t vl);
vuint32m1_t __riscv_vmulhu_vv_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                        vuint32m1_t vs2, vuint32m1_t vs1,
                                        size_t vl);
vuint32m1_t __riscv_vmulhu_vx_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                        vuint32m1_t vs2, uint32_t rs1,
                                        size_t vl);
vuint32m2_t __riscv_vmulhu_vv_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                        vuint32m2_t vs2, vuint32m2_t vs1,
                                        size_t vl);
vuint32m2_t __riscv_vmulhu_vx_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                        vuint32m2_t vs2, uint32_t rs1,
                                        size_t vl);
vuint32m4_t __riscv_vmulhu_vv_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                        vuint32m4_t vs2, vuint32m4_t vs1,
                                        size_t vl);
vuint32m4_t __riscv_vmulhu_vx_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                        vuint32m4_t vs2, uint32_t rs1,
                                        size_t vl);
vuint32m8_t __riscv_vmulhu_vv_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                        vuint32m8_t vs2, vuint32m8_t vs1,
                                        size_t vl);
vuint32m8_t __riscv_vmulhu_vx_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                        vuint32m8_t vs2, uint32_t rs1,
                                        size_t vl);
vuint64m1_t __riscv_vmulhu_vv_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                        vuint64m1_t vs2, vuint64m1_t vs1,
                                        size_t vl);
vuint64m1_t __riscv_vmulhu_vx_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                        vuint64m1_t vs2, uint64_t rs1,
                                        size_t vl);
vuint64m2_t __riscv_vmulhu_vv_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                        vuint64m2_t vs2, vuint64m2_t vs1,
                                        size_t vl);
vuint64m2_t __riscv_vmulhu_vx_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                        vuint64m2_t vs2, uint64_t rs1,
                                        size_t vl);
vuint64m4_t __riscv_vmulhu_vv_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                        vuint64m4_t vs2, vuint64m4_t vs1,
                                        size_t vl);
vuint64m4_t __riscv_vmulhu_vx_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                        vuint64m4_t vs2, uint64_t rs1,
                                        size_t vl);
vuint64m8_t __riscv_vmulhu_vv_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                        vuint64m8_t vs2, vuint64m8_t vs1,
                                        size_t vl);
vuint64m8_t __riscv_vmulhu_vx_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                        vuint64m8_t vs2, uint64_t rs1,
                                        size_t vl);
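// --- usage sketch (not part of the listing) ----------------------------------
// vmul keeps the low SEW bits of the product and vmulhu the high SEW bits of
// the unsigned product, so the pair reconstructs the full 2*SEW-bit result.
// For brevity this hypothetical sketch uses the plain (non-policy) forms; the
// _tum variants listed here perform the same operation and additionally take
// the mask vm and merge destination vd.  Assumes the #include lines from the
// first sketch above.
static void full_umul32_by_scalar(const uint32_t *a, uint32_t c, uint32_t *lo,
                                  uint32_t *hi, size_t n) {
  for (size_t vl; n > 0; n -= vl, a += vl, lo += vl, hi += vl) {
    vl = __riscv_vsetvl_e32m1(n);
    vuint32m1_t va = __riscv_vle32_v_u32m1(a, vl);
    vuint32m1_t vlo = __riscv_vmul_vx_u32m1(va, c, vl);    // low 32 bits
    vuint32m1_t vhi = __riscv_vmulhu_vx_u32m1(va, c, vl);  // high 32 bits
    __riscv_vse32_v_u32m1(lo, vlo, vl);
    __riscv_vse32_v_u32m1(hi, vhi, vl);
  }
}
// ------------------------------------------------------------------------------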
// masked functions (tail undisturbed, mask undisturbed: _tumu)
vint8mf8_t __riscv_vmul_vv_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                      vint8mf8_t vs2, vint8mf8_t vs1,
                                      size_t vl);
vint8mf8_t __riscv_vmul_vx_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                      vint8mf8_t vs2, int8_t rs1, size_t vl);
vint8mf4_t __riscv_vmul_vv_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                      vint8mf4_t vs2, vint8mf4_t vs1,
                                      size_t vl);
vint8mf4_t __riscv_vmul_vx_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                      vint8mf4_t vs2, int8_t rs1, size_t vl);
vint8mf2_t __riscv_vmul_vv_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                      vint8mf2_t vs2, vint8mf2_t vs1,
                                      size_t vl);
vint8mf2_t __riscv_vmul_vx_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                      vint8mf2_t vs2, int8_t rs1, size_t vl);
vint8m1_t __riscv_vmul_vv_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                    vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vmul_vx_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                    int8_t rs1, size_t vl);
vint8m2_t __riscv_vmul_vv_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                    vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vmul_vx_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                    int8_t rs1, size_t vl);
vint8m4_t __riscv_vmul_vv_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                    vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vmul_vx_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                    int8_t rs1, size_t vl);
vint8m8_t __riscv_vmul_vv_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                    vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vmul_vx_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                    int8_t rs1, size_t vl);
vint16mf4_t __riscv_vmul_vv_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs2, vint16mf4_t vs1,
                                        size_t vl);
vint16mf4_t __riscv_vmul_vx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs2, int16_t rs1,
                                        size_t vl);
vint16mf2_t __riscv_vmul_vv_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs2, vint16mf2_t vs1,
                                        size_t vl);
vint16mf2_t __riscv_vmul_vx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs2, int16_t rs1,
                                        size_t vl);
vint16m1_t __riscv_vmul_vv_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs2, vint16m1_t vs1,
                                      size_t vl);
vint16m1_t __riscv_vmul_vx_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs2, int16_t rs1, size_t vl);
vint16m2_t __riscv_vmul_vv_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs2, vint16m2_t vs1,
                                      size_t vl);
vint16m2_t __riscv_vmul_vx_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs2, int16_t rs1, size_t vl);
vint16m4_t __riscv_vmul_vv_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs2, vint16m4_t vs1,
                                      size_t vl);
vint16m4_t __riscv_vmul_vx_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs2, int16_t rs1, size_t vl);
vint16m8_t __riscv_vmul_vv_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs2, vint16m8_t vs1,
                                      size_t vl);
vint16m8_t __riscv_vmul_vx_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs2, int16_t rs1, size_t vl);
vint32mf2_t __riscv_vmul_vv_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs2, vint32mf2_t vs1,
                                        size_t vl);
vint32mf2_t __riscv_vmul_vx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs2, int32_t rs1,
                                        size_t vl);
vint32m1_t __riscv_vmul_vv_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs2, vint32m1_t vs1,
                                      size_t vl);
vint32m1_t __riscv_vmul_vx_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs2, int32_t rs1, size_t vl);
vint32m2_t __riscv_vmul_vv_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs2, vint32m2_t vs1,
                                      size_t vl);
vint32m2_t __riscv_vmul_vx_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs2, int32_t rs1, size_t vl);
vint32m4_t __riscv_vmul_vv_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs2, vint32m4_t vs1,
                                      size_t vl);
vint32m4_t __riscv_vmul_vx_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs2, int32_t rs1, size_t vl);
vint32m8_t __riscv_vmul_vv_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs2, vint32m8_t vs1,
                                      size_t vl);
vint32m8_t __riscv_vmul_vx_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs2, int32_t rs1, size_t vl);
vint64m1_t __riscv_vmul_vv_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs2, vint64m1_t vs1,
                                      size_t vl);
vint64m1_t __riscv_vmul_vx_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs2, int64_t rs1, size_t vl);
vint64m2_t __riscv_vmul_vv_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs2, vint64m2_t vs1,
                                      size_t vl);
vint64m2_t __riscv_vmul_vx_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs2, int64_t rs1, size_t vl);
vint64m4_t __riscv_vmul_vv_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs2, vint64m4_t vs1,
                                      size_t vl);
vint64m4_t __riscv_vmul_vx_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs2, int64_t rs1, size_t vl);
vint64m8_t __riscv_vmul_vv_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs2, vint64m8_t vs1,
                                      size_t vl);
vint64m8_t __riscv_vmul_vx_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs2, int64_t rs1, size_t vl);
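// --- usage sketch (not part of the listing) ----------------------------------
// In the _tumu variants both the tail lanes (indices >= vl) and the inactive
// (masked-off) body lanes keep their values from vd, which makes them a good
// fit for conditional in-place updates.  Hypothetical sketch, assuming the
// #include lines from the first sketch above: double x[i] only where w[i] is
// nonzero and leave every other element of x untouched.
static void double_where_nonzero(int32_t *x, const int32_t *w, size_t n) {
  for (size_t vl; n > 0; n -= vl, x += vl, w += vl) {
    vl = __riscv_vsetvl_e32m1(n);
    vint32m1_t vx = __riscv_vle32_v_i32m1(x, vl);
    vint32m1_t vw = __riscv_vle32_v_i32m1(w, vl);
    vbool32_t vm = __riscv_vmsne_vx_i32m1_b32(vw, 0, vl);
    // Active lanes become x[i] * 2; inactive lanes keep vd (the original vx).
    vint32m1_t vr = __riscv_vmul_vx_i32m1_tumu(vm, vx, vx, 2, vl);
    __riscv_vse32_v_i32m1(x, vr, vl);
  }
}
// ------------------------------------------------------------------------------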
vint8mf8_t __riscv_vmulh_vv_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                       vint8mf8_t vs2, vint8mf8_t vs1,
                                       size_t vl);
vint8mf8_t __riscv_vmulh_vx_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                       vint8mf8_t vs2, int8_t rs1, size_t vl);
vint8mf4_t __riscv_vmulh_vv_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                       vint8mf4_t vs2, vint8mf4_t vs1,
                                       size_t vl);
vint8mf4_t __riscv_vmulh_vx_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                       vint8mf4_t vs2, int8_t rs1, size_t vl);
vint8mf2_t __riscv_vmulh_vv_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                       vint8mf2_t vs2, vint8mf2_t vs1,
                                       size_t vl);
vint8mf2_t __riscv_vmulh_vx_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                       vint8mf2_t vs2, int8_t rs1, size_t vl);
vint8m1_t __riscv_vmulh_vv_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                     vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vmulh_vx_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                     int8_t rs1, size_t vl);
vint8m2_t __riscv_vmulh_vv_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                     vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vmulh_vx_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                     int8_t rs1, size_t vl);
vint8m4_t __riscv_vmulh_vv_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                     vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vmulh_vx_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                     int8_t rs1, size_t vl);
vint8m8_t __riscv_vmulh_vv_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                     vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vmulh_vx_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                     int8_t rs1, size_t vl);
vint16mf4_t __riscv_vmulh_vv_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                         vint16mf4_t vs2, vint16mf4_t vs1,
                                         size_t vl);
vint16mf4_t __riscv_vmulh_vx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                         vint16mf4_t vs2, int16_t rs1,
                                         size_t vl);
vint16mf2_t __riscv_vmulh_vv_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                         vint16mf2_t vs2, vint16mf2_t vs1,
                                         size_t vl);
vint16mf2_t __riscv_vmulh_vx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                         vint16mf2_t vs2, int16_t rs1,
                                         size_t vl);
vint16m1_t __riscv_vmulh_vv_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                       vint16m1_t vs2, vint16m1_t vs1,
                                       size_t vl);
vint16m1_t __riscv_vmulh_vx_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                       vint16m1_t vs2, int16_t rs1, size_t vl);
vint16m2_t __riscv_vmulh_vv_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                       vint16m2_t vs2, vint16m2_t vs1,
                                       size_t vl);
vint16m2_t __riscv_vmulh_vx_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                       vint16m2_t vs2, int16_t rs1, size_t vl);
vint16m4_t __riscv_vmulh_vv_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                       vint16m4_t vs2, vint16m4_t vs1,
                                       size_t vl);
vint16m4_t __riscv_vmulh_vx_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                       vint16m4_t vs2, int16_t rs1, size_t vl);
vint16m8_t __riscv_vmulh_vv_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                       vint16m8_t vs2, vint16m8_t vs1,
                                       size_t vl);
vint16m8_t __riscv_vmulh_vx_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                       vint16m8_t vs2, int16_t rs1, size_t vl);
vint32mf2_t __riscv_vmulh_vv_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                         vint32mf2_t vs2, vint32mf2_t vs1,
                                         size_t vl);
vint32mf2_t __riscv_vmulh_vx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                         vint32mf2_t vs2, int32_t rs1,
                                         size_t vl);
vint32m1_t __riscv_vmulh_vv_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                       vint32m1_t vs2, vint32m1_t vs1,
                                       size_t vl);
vint32m1_t __riscv_vmulh_vx_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                       vint32m1_t vs2, int32_t rs1, size_t vl);
vint32m2_t __riscv_vmulh_vv_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                       vint32m2_t vs2, vint32m2_t vs1,
                                       size_t vl);
vint32m2_t __riscv_vmulh_vx_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                       vint32m2_t vs2, int32_t rs1, size_t vl);
vint32m4_t __riscv_vmulh_vv_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                       vint32m4_t vs2, vint32m4_t vs1,
                                       size_t vl);
vint32m4_t __riscv_vmulh_vx_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                       vint32m4_t vs2, int32_t rs1, size_t vl);
vint32m8_t __riscv_vmulh_vv_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                       vint32m8_t vs2, vint32m8_t vs1,
                                       size_t vl);
vint32m8_t __riscv_vmulh_vx_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                       vint32m8_t vs2, int32_t rs1, size_t vl);
vint64m1_t __riscv_vmulh_vv_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                       vint64m1_t vs2, vint64m1_t vs1,
                                       size_t vl);
vint64m1_t __riscv_vmulh_vx_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                       vint64m1_t vs2, int64_t rs1, size_t vl);
vint64m2_t __riscv_vmulh_vv_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                       vint64m2_t vs2, vint64m2_t vs1,
                                       size_t vl);
vint64m2_t __riscv_vmulh_vx_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                       vint64m2_t vs2, int64_t rs1, size_t vl);
vint64m4_t __riscv_vmulh_vv_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                       vint64m4_t vs2, vint64m4_t vs1,
                                       size_t vl);
vint64m4_t __riscv_vmulh_vx_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                       vint64m4_t vs2, int64_t rs1, size_t vl);
vint64m8_t __riscv_vmulh_vv_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                       vint64m8_t vs2, vint64m8_t vs1,
                                       size_t vl);
vint64m8_t __riscv_vmulh_vx_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                       vint64m8_t vs2, int64_t rs1, size_t vl);
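// --- usage sketch (not part of the listing) ----------------------------------
// The _vx forms take a single scalar operand, which is convenient for applying
// a fixed gain: with 32-bit elements, vmulh_vx yields ((int64_t)x[i] * gain)
// >> 32.  Hypothetical sketch, assuming the #include lines from the first
// sketch above; lanes whose input is zero are skipped and keep the previous
// output value because of the mask-undisturbed (_tumu) policy.
static void apply_gain_hi(const int32_t *x, int32_t gain, int32_t *out,
                          size_t n) {
  for (size_t vl; n > 0; n -= vl, x += vl, out += vl) {
    vl = __riscv_vsetvl_e32m1(n);
    vint32m1_t vx = __riscv_vle32_v_i32m1(x, vl);
    vint32m1_t vd = __riscv_vle32_v_i32m1(out, vl);  // previous output values
    vbool32_t vm = __riscv_vmsne_vx_i32m1_b32(vx, 0, vl);
    vint32m1_t vr = __riscv_vmulh_vx_i32m1_tumu(vm, vd, vx, gain, vl);
    __riscv_vse32_v_i32m1(out, vr, vl);
  }
}
// ------------------------------------------------------------------------------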
vint8mf8_t __riscv_vmulhsu_vv_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                         vint8mf8_t vs2, vuint8mf8_t vs1,
                                         size_t vl);
vint8mf8_t __riscv_vmulhsu_vx_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                         vint8mf8_t vs2, uint8_t rs1,
                                         size_t vl);
vint8mf4_t __riscv_vmulhsu_vv_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                         vint8mf4_t vs2, vuint8mf4_t vs1,
                                         size_t vl);
vint8mf4_t __riscv_vmulhsu_vx_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                         vint8mf4_t vs2, uint8_t rs1,
                                         size_t vl);
vint8mf2_t __riscv_vmulhsu_vv_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                         vint8mf2_t vs2, vuint8mf2_t vs1,
                                         size_t vl);
vint8mf2_t __riscv_vmulhsu_vx_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                         vint8mf2_t vs2, uint8_t rs1,
                                         size_t vl);
vint8m1_t __riscv_vmulhsu_vv_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                       vuint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vmulhsu_vx_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                       uint8_t rs1, size_t vl);
vint8m2_t __riscv_vmulhsu_vv_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                       vuint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vmulhsu_vx_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                       uint8_t rs1, size_t vl);
vint8m4_t __riscv_vmulhsu_vv_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                       vuint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vmulhsu_vx_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                       uint8_t rs1, size_t vl);
vint8m8_t __riscv_vmulhsu_vv_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                       vuint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vmulhsu_vx_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                       uint8_t rs1, size_t vl);
vint16mf4_t __riscv_vmulhsu_vv_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                           vint16mf4_t vs2, vuint16mf4_t vs1,
                                           size_t vl);
vint16mf4_t __riscv_vmulhsu_vx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                           vint16mf4_t vs2, uint16_t rs1,
                                           size_t vl);
vint16mf2_t __riscv_vmulhsu_vv_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                           vint16mf2_t vs2, vuint16mf2_t vs1,
                                           size_t vl);
vint16mf2_t __riscv_vmulhsu_vx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                           vint16mf2_t vs2, uint16_t rs1,
                                           size_t vl);
vint16m1_t __riscv_vmulhsu_vv_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                         vint16m1_t vs2, vuint16m1_t vs1,
                                         size_t vl);
vint16m1_t __riscv_vmulhsu_vx_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                         vint16m1_t vs2, uint16_t rs1,
                                         size_t vl);
vint16m2_t __riscv_vmulhsu_vv_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                         vint16m2_t vs2, vuint16m2_t vs1,
                                         size_t vl);
vint16m2_t __riscv_vmulhsu_vx_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                         vint16m2_t vs2, uint16_t rs1,
                                         size_t vl);
vint16m4_t __riscv_vmulhsu_vv_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                         vint16m4_t vs2, vuint16m4_t vs1,
                                         size_t vl);
vint16m4_t __riscv_vmulhsu_vx_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                         vint16m4_t vs2, uint16_t rs1,
                                         size_t vl);
vint16m8_t __riscv_vmulhsu_vv_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                         vint16m8_t vs2, vuint16m8_t vs1,
                                         size_t vl);
vint16m8_t __riscv_vmulhsu_vx_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                         vint16m8_t vs2, uint16_t rs1,
                                         size_t vl);
vint32mf2_t __riscv_vmulhsu_vv_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                           vint32mf2_t vs2, vuint32mf2_t vs1,
                                           size_t vl);
vint32mf2_t __riscv_vmulhsu_vx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                           vint32mf2_t vs2, uint32_t rs1,
                                           size_t vl);
vint32m1_t __riscv_vmulhsu_vv_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                         vint32m1_t vs2, vuint32m1_t vs1,
                                         size_t vl);
vint32m1_t __riscv_vmulhsu_vx_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                         vint32m1_t vs2, uint32_t rs1,
                                         size_t vl);
vint32m2_t __riscv_vmulhsu_vv_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                         vint32m2_t vs2, vuint32m2_t vs1,
                                         size_t vl);
vint32m2_t __riscv_vmulhsu_vx_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                         vint32m2_t vs2, uint32_t rs1,
                                         size_t vl);
vint32m4_t __riscv_vmulhsu_vv_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                         vint32m4_t vs2, vuint32m4_t vs1,
                                         size_t vl);
vint32m4_t __riscv_vmulhsu_vx_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                         vint32m4_t vs2, uint32_t rs1,
                                         size_t vl);
vint32m8_t __riscv_vmulhsu_vv_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                         vint32m8_t vs2, vuint32m8_t vs1,
                                         size_t vl);
vint32m8_t __riscv_vmulhsu_vx_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                         vint32m8_t vs2, uint32_t rs1,
                                         size_t vl);
vint64m1_t __riscv_vmulhsu_vv_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                         vint64m1_t vs2, vuint64m1_t vs1,
                                         size_t vl);
vint64m1_t __riscv_vmulhsu_vx_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                         vint64m1_t vs2, uint64_t rs1,
                                         size_t vl);
vint64m2_t __riscv_vmulhsu_vv_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                         vint64m2_t vs2, vuint64m2_t vs1,
                                         size_t vl);
vint64m2_t __riscv_vmulhsu_vx_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                         vint64m2_t vs2, uint64_t rs1,
                                         size_t vl);
vint64m4_t __riscv_vmulhsu_vv_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                         vint64m4_t vs2, vuint64m4_t vs1,
                                         size_t vl);
vint64m4_t __riscv_vmulhsu_vx_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                         vint64m4_t vs2, uint64_t rs1,
                                         size_t vl);
vint64m8_t __riscv_vmulhsu_vv_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                         vint64m8_t vs2, vuint64m8_t vs1,
                                         size_t vl);
vint64m8_t __riscv_vmulhsu_vx_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                         vint64m8_t vs2, uint64_t rs1,
                                         size_t vl);
vuint8mf8_t __riscv_vmul_vv_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                       vuint8mf8_t vs2, vuint8mf8_t vs1,
                                       size_t vl);
vuint8mf8_t __riscv_vmul_vx_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                       vuint8mf8_t vs2, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vmul_vv_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                       vuint8mf4_t vs2, vuint8mf4_t vs1,
                                       size_t vl);
vuint8mf4_t __riscv_vmul_vx_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                       vuint8mf4_t vs2, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vmul_vv_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                       vuint8mf2_t vs2, vuint8mf2_t vs1,
                                       size_t vl);
vuint8mf2_t __riscv_vmul_vx_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                       vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vmul_vv_u8m1_tumu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                     vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vmul_vx_u8m1_tumu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vmul_vv_u8m2_tumu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                     vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vmul_vx_u8m2_tumu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vmul_vv_u8m4_tumu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                     vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vmul_vx_u8m4_tumu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vmul_vv_u8m8_tumu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                     vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vmul_vx_u8m8_tumu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                     uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vmul_vv_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs2, vuint16mf4_t vs1,
                                         size_t vl);
vuint16mf4_t __riscv_vmul_vx_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs2, uint16_t rs1,
                                         size_t vl);
vuint16mf2_t __riscv_vmul_vv_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs2, vuint16mf2_t vs1,
                                         size_t vl);
vuint16mf2_t __riscv_vmul_vx_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs2, uint16_t rs1,
                                         size_t vl);
vuint16m1_t __riscv_vmul_vv_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs2, vuint16m1_t vs1,
                                       size_t vl);
vuint16m1_t __riscv_vmul_vx_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m2_t __riscv_vmul_vv_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs2, vuint16m2_t vs1,
                                       size_t vl);
vuint16m2_t __riscv_vmul_vx_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m4_t __riscv_vmul_vv_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs2, vuint16m4_t vs1,
                                       size_t vl);
vuint16m4_t __riscv_vmul_vx_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m8_t __riscv_vmul_vv_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs2, vuint16m8_t vs1,
                                       size_t vl);
vuint16m8_t __riscv_vmul_vx_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs2, uint16_t rs1,
                                       size_t vl);
vuint32mf2_t __riscv_vmul_vv_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs2, vuint32mf2_t vs1,
                                         size_t vl);
vuint32mf2_t __riscv_vmul_vx_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs2, uint32_t rs1,
                                         size_t vl);
vuint32m1_t __riscv_vmul_vv_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs2, vuint32m1_t vs1,
                                       size_t vl);
vuint32m1_t __riscv_vmul_vx_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m2_t __riscv_vmul_vv_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs2, vuint32m2_t vs1,
                                       size_t vl);
vuint32m2_t __riscv_vmul_vx_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m4_t __riscv_vmul_vv_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs2, vuint32m4_t vs1,
                                       size_t vl);
vuint32m4_t __riscv_vmul_vx_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m8_t __riscv_vmul_vv_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs2, vuint32m8_t vs1,
                                       size_t vl);
vuint32m8_t __riscv_vmul_vx_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs2, uint32_t rs1,
                                       size_t vl);
vuint64m1_t __riscv_vmul_vv_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs2, vuint64m1_t vs1,
                                       size_t vl);
vuint64m1_t __riscv_vmul_vx_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m2_t __riscv_vmul_vv_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs2, vuint64m2_t vs1,
                                       size_t vl);
vuint64m2_t __riscv_vmul_vx_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m4_t __riscv_vmul_vv_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs2, vuint64m4_t vs1,
                                       size_t vl);
vuint64m4_t __riscv_vmul_vx_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m8_t __riscv_vmul_vv_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs2, vuint64m8_t vs1,
                                       size_t vl);
vuint64m8_t __riscv_vmul_vx_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs2, uint64_t rs1,
                                       size_t vl);
vuint8mf8_t __riscv_vmulhu_vv_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                         vuint8mf8_t vs2, vuint8mf8_t vs1,
                                         size_t vl);
vuint8mf8_t __riscv_vmulhu_vx_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                         vuint8mf8_t vs2, uint8_t rs1,
                                         size_t vl);
vuint8mf4_t __riscv_vmulhu_vv_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                         vuint8mf4_t vs2, vuint8mf4_t vs1,
                                         size_t vl);
vuint8mf4_t __riscv_vmulhu_vx_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                         vuint8mf4_t vs2, uint8_t rs1,
                                         size_t vl);
vuint8mf2_t __riscv_vmulhu_vv_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                         vuint8mf2_t vs2, vuint8mf2_t vs1,
                                         size_t vl);
vuint8mf2_t __riscv_vmulhu_vx_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                         vuint8mf2_t vs2, uint8_t rs1,
                                         size_t vl);
vuint8m1_t __riscv_vmulhu_vv_u8m1_tumu(vbool8_t vm, vuint8m1_t vd,
                                       vuint8m1_t vs2, vuint8m1_t vs1,
                                       size_t vl);
vuint8m1_t __riscv_vmulhu_vx_u8m1_tumu(vbool8_t vm, vuint8m1_t vd,
                                       vuint8m1_t vs2, uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vmulhu_vv_u8m2_tumu(vbool4_t vm, vuint8m2_t vd,
                                       vuint8m2_t vs2, vuint8m2_t vs1,
                                       size_t vl);
vuint8m2_t __riscv_vmulhu_vx_u8m2_tumu(vbool4_t vm, vuint8m2_t vd,
                                       vuint8m2_t vs2, uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vmulhu_vv_u8m4_tumu(vbool2_t vm, vuint8m4_t vd,
                                       vuint8m4_t vs2, vuint8m4_t vs1,
                                       size_t vl);
vuint8m4_t __riscv_vmulhu_vx_u8m4_tumu(vbool2_t vm, vuint8m4_t vd,
                                       vuint8m4_t vs2, uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vmulhu_vv_u8m8_tumu(vbool1_t vm, vuint8m8_t vd,
                                       vuint8m8_t vs2, vuint8m8_t vs1,
                                       size_t vl);
vuint8m8_t __riscv_vmulhu_vx_u8m8_tumu(vbool1_t vm, vuint8m8_t vd,
                                       vuint8m8_t vs2, uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vmulhu_vv_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                           vuint16mf4_t vs2, vuint16mf4_t vs1,
                                           size_t vl);
vuint16mf4_t __riscv_vmulhu_vx_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                           vuint16mf4_t vs2, uint16_t rs1,
                                           size_t vl);
vuint16mf2_t __riscv_vmulhu_vv_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                           vuint16mf2_t vs2, vuint16mf2_t vs1,
                                           size_t vl);
vuint16mf2_t __riscv_vmulhu_vx_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                           vuint16mf2_t vs2, uint16_t rs1,
                                           size_t vl);
vuint16m1_t __riscv_vmulhu_vv_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                         vuint16m1_t vs2, vuint16m1_t vs1,
                                         size_t vl);
vuint16m1_t __riscv_vmulhu_vx_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                         vuint16m1_t vs2, uint16_t rs1,
                                         size_t vl);
vuint16m2_t __riscv_vmulhu_vv_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                         vuint16m2_t vs2, vuint16m2_t vs1,
                                         size_t vl);
vuint16m2_t __riscv_vmulhu_vx_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                         vuint16m2_t vs2, uint16_t rs1,
                                         size_t vl);
vuint16m4_t __riscv_vmulhu_vv_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                         vuint16m4_t vs2, vuint16m4_t vs1,
                                         size_t vl);
vuint16m4_t __riscv_vmulhu_vx_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                         vuint16m4_t vs2, uint16_t rs1,
                                         size_t vl);
vuint16m8_t __riscv_vmulhu_vv_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                         vuint16m8_t vs2, vuint16m8_t vs1,
                                         size_t vl);
vuint16m8_t __riscv_vmulhu_vx_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                         vuint16m8_t vs2, uint16_t rs1,
                                         size_t vl);
vuint32mf2_t __riscv_vmulhu_vv_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                           vuint32mf2_t vs2, vuint32mf2_t vs1,
                                           size_t vl);
vuint32mf2_t __riscv_vmulhu_vx_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                           vuint32mf2_t vs2, uint32_t rs1,
                                           size_t vl);
vuint32m1_t __riscv_vmulhu_vv_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                         vuint32m1_t vs2, vuint32m1_t vs1,
                                         size_t vl);
vuint32m1_t __riscv_vmulhu_vx_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                         vuint32m1_t vs2, uint32_t rs1,
                                         size_t vl);
vuint32m2_t __riscv_vmulhu_vv_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                         vuint32m2_t vs2, vuint32m2_t vs1,
                                         size_t vl);
vuint32m2_t __riscv_vmulhu_vx_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                         vuint32m2_t vs2, uint32_t rs1,
                                         size_t vl);
vuint32m4_t __riscv_vmulhu_vv_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                         vuint32m4_t vs2, vuint32m4_t vs1,
                                         size_t vl);
vuint32m4_t __riscv_vmulhu_vx_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                         vuint32m4_t vs2, uint32_t rs1,
                                         size_t vl);
vuint32m8_t __riscv_vmulhu_vv_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                         vuint32m8_t vs2, vuint32m8_t vs1,
                                         size_t vl);
vuint32m8_t __riscv_vmulhu_vx_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                         vuint32m8_t vs2, uint32_t rs1,
                                         size_t vl);
vuint64m1_t __riscv_vmulhu_vv_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                         vuint64m1_t vs2, vuint64m1_t vs1,
                                         size_t vl);
vuint64m1_t __riscv_vmulhu_vx_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                         vuint64m1_t vs2, uint64_t rs1,
                                         size_t vl);
vuint64m2_t __riscv_vmulhu_vv_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                         vuint64m2_t vs2, vuint64m2_t vs1,
                                         size_t vl);
vuint64m2_t __riscv_vmulhu_vx_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                         vuint64m2_t vs2, uint64_t rs1,
                                         size_t vl);
vuint64m4_t __riscv_vmulhu_vv_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                         vuint64m4_t vs2, vuint64m4_t vs1,
                                         size_t vl);
vuint64m4_t __riscv_vmulhu_vx_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                         vuint64m4_t vs2, uint64_t rs1,
                                         size_t vl);
vuint64m8_t __riscv_vmulhu_vv_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                         vuint64m8_t vs2, vuint64m8_t vs1,
                                         size_t vl);
vuint64m8_t __riscv_vmulhu_vx_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                         vuint64m8_t vs2, uint64_t rs1,
                                         size_t vl);
// masked functions
vint8mf8_t __riscv_vmul_vv_i8mf8_mu(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs2,
                                    vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vmul_vx_i8mf8_mu(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs2,
                                    int8_t rs1, size_t vl);
vint8mf4_t __riscv_vmul_vv_i8mf4_mu(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs2,
                                    vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vmul_vx_i8mf4_mu(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs2,
                                    int8_t rs1, size_t vl);
vint8mf2_t __riscv_vmul_vv_i8mf2_mu(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs2,
                                    vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vmul_vx_i8mf2_mu(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs2,
                                    int8_t rs1, size_t vl);
vint8m1_t __riscv_vmul_vv_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                  vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vmul_vx_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                  int8_t rs1, size_t vl);
vint8m2_t __riscv_vmul_vv_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                  vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vmul_vx_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                  int8_t rs1, size_t vl);
vint8m4_t __riscv_vmul_vv_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                  vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vmul_vx_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                  int8_t rs1, size_t vl);
vint8m8_t __riscv_vmul_vv_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                  vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vmul_vx_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                  int8_t rs1, size_t vl);
vint16mf4_t __riscv_vmul_vv_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                      vint16mf4_t vs2, vint16mf4_t vs1,
                                      size_t vl);
vint16mf4_t __riscv_vmul_vx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                      vint16mf4_t vs2, int16_t rs1, size_t vl);
vint16mf2_t __riscv_vmul_vv_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                      vint16mf2_t vs2, vint16mf2_t vs1,
                                      size_t vl);
vint16mf2_t __riscv_vmul_vx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                      vint16mf2_t vs2, int16_t rs1, size_t vl);
vint16m1_t __riscv_vmul_vv_i16m1_mu(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                                    vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vmul_vx_i16m1_mu(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                                    int16_t rs1, size_t vl);
vint16m2_t __riscv_vmul_vv_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                    vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vmul_vx_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                    int16_t rs1, size_t vl);
vint16m4_t __riscv_vmul_vv_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                    vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vmul_vx_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                    int16_t rs1, size_t vl);
vint16m8_t __riscv_vmul_vv_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                    vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vmul_vx_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                    int16_t rs1, size_t vl);
vint32mf2_t __riscv_vmul_vv_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                      vint32mf2_t vs2, vint32mf2_t vs1,
                                      size_t vl);
vint32mf2_t __riscv_vmul_vx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                      vint32mf2_t vs2, int32_t rs1, size_t vl);
vint32m1_t __riscv_vmul_vv_i32m1_mu(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                                    vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vmul_vx_i32m1_mu(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                                    int32_t rs1, size_t vl);
vint32m2_t __riscv_vmul_vv_i32m2_mu(vbool16_t vm, vint32m2_t vd, vint32m2_t vs2,
                                    vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vmul_vx_i32m2_mu(vbool16_t vm, vint32m2_t vd, vint32m2_t vs2,
                                    int32_t rs1, size_t vl);
vint32m4_t __riscv_vmul_vv_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                    vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vmul_vx_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                    int32_t rs1, size_t vl);
vint32m8_t __riscv_vmul_vv_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                    vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vmul_vx_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                    int32_t rs1, size_t vl);
vint64m1_t __riscv_vmul_vv_i64m1_mu(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                                    vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vmul_vx_i64m1_mu(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                                    int64_t rs1, size_t vl);
vint64m2_t __riscv_vmul_vv_i64m2_mu(vbool32_t vm, vint64m2_t vd, vint64m2_t vs2,
                                    vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vmul_vx_i64m2_mu(vbool32_t vm, vint64m2_t vd, vint64m2_t vs2,
                                    int64_t rs1, size_t vl);
vint64m4_t __riscv_vmul_vv_i64m4_mu(vbool16_t vm, vint64m4_t vd, vint64m4_t vs2,
                                    vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vmul_vx_i64m4_mu(vbool16_t vm, vint64m4_t vd, vint64m4_t vs2,
                                    int64_t rs1, size_t vl);
vint64m8_t __riscv_vmul_vv_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                    vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vmul_vx_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                    int64_t rs1, size_t vl);
vint8mf8_t __riscv_vmulh_vv_i8mf8_mu(vbool64_t vm, vint8mf8_t vd,
                                     vint8mf8_t vs2, vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vmulh_vx_i8mf8_mu(vbool64_t vm, vint8mf8_t vd,
                                     vint8mf8_t vs2, int8_t rs1, size_t vl);
vint8mf4_t __riscv_vmulh_vv_i8mf4_mu(vbool32_t vm, vint8mf4_t vd,
                                     vint8mf4_t vs2, vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vmulh_vx_i8mf4_mu(vbool32_t vm, vint8mf4_t vd,
                                     vint8mf4_t vs2, int8_t rs1, size_t vl);
vint8mf2_t __riscv_vmulh_vv_i8mf2_mu(vbool16_t vm, vint8mf2_t vd,
                                     vint8mf2_t vs2, vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vmulh_vx_i8mf2_mu(vbool16_t vm, vint8mf2_t vd,
                                     vint8mf2_t vs2, int8_t rs1, size_t vl);
vint8m1_t __riscv_vmulh_vv_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                   vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vmulh_vx_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                   int8_t rs1, size_t vl);
vint8m2_t __riscv_vmulh_vv_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                   vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vmulh_vx_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                   int8_t rs1, size_t vl);
vint8m4_t __riscv_vmulh_vv_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                   vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vmulh_vx_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                   int8_t rs1, size_t vl);
vint8m8_t __riscv_vmulh_vv_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                   vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vmulh_vx_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                   int8_t rs1, size_t vl);
vint16mf4_t __riscv_vmulh_vv_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs2, vint16mf4_t vs1,
                                       size_t vl);
vint16mf4_t __riscv_vmulh_vx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs2, int16_t rs1, size_t vl);
vint16mf2_t __riscv_vmulh_vv_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs2, vint16mf2_t vs1,
                                       size_t vl);
vint16mf2_t __riscv_vmulh_vx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs2, int16_t rs1, size_t vl);
vint16m1_t __riscv_vmulh_vv_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs2, vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vmulh_vx_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs2, int16_t rs1, size_t vl);
vint16m2_t __riscv_vmulh_vv_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                     vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vmulh_vx_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                     int16_t rs1, size_t vl);
vint16m4_t __riscv_vmulh_vv_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                     vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vmulh_vx_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                     int16_t rs1, size_t vl);
vint16m8_t __riscv_vmulh_vv_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                     vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vmulh_vx_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                     int16_t rs1, size_t vl);
vint32mf2_t __riscv_vmulh_vv_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs2, vint32mf2_t vs1,
                                       size_t vl);
vint32mf2_t __riscv_vmulh_vx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs2, int32_t rs1, size_t vl);
vint32m1_t __riscv_vmulh_vv_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs2, vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vmulh_vx_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs2, int32_t rs1, size_t vl);
vint32m2_t __riscv_vmulh_vv_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs2, vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vmulh_vx_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs2, int32_t rs1, size_t vl);
vint32m4_t __riscv_vmulh_vv_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                     vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vmulh_vx_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                     int32_t rs1, size_t vl);
vint32m8_t __riscv_vmulh_vv_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                     vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vmulh_vx_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                     int32_t rs1, size_t vl);
vint64m1_t __riscv_vmulh_vv_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs2, vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vmulh_vx_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs2, int64_t rs1, size_t vl);
vint64m2_t __riscv_vmulh_vv_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs2, vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vmulh_vx_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs2, int64_t rs1, size_t vl);
vint64m4_t __riscv_vmulh_vv_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs2, vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vmulh_vx_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs2, int64_t rs1, size_t vl);
vint64m8_t __riscv_vmulh_vv_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                     vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vmulh_vx_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                     int64_t rs1, size_t vl);
vint8mf8_t __riscv_vmulhsu_vv_i8mf8_mu(vbool64_t vm, vint8mf8_t vd,
                                       vint8mf8_t vs2, vuint8mf8_t vs1,
                                       size_t vl);
vint8mf8_t __riscv_vmulhsu_vx_i8mf8_mu(vbool64_t vm, vint8mf8_t vd,
                                       vint8mf8_t vs2, uint8_t rs1, size_t vl);
vint8mf4_t __riscv_vmulhsu_vv_i8mf4_mu(vbool32_t vm, vint8mf4_t vd,
                                       vint8mf4_t vs2, vuint8mf4_t vs1,
                                       size_t vl);
vint8mf4_t __riscv_vmulhsu_vx_i8mf4_mu(vbool32_t vm, vint8mf4_t vd,
                                       vint8mf4_t vs2, uint8_t rs1, size_t vl);
vint8mf2_t __riscv_vmulhsu_vv_i8mf2_mu(vbool16_t vm, vint8mf2_t vd,
                                       vint8mf2_t vs2, vuint8mf2_t vs1,
                                       size_t vl);
vint8mf2_t __riscv_vmulhsu_vx_i8mf2_mu(vbool16_t vm, vint8mf2_t vd,
                                       vint8mf2_t vs2, uint8_t rs1, size_t vl);
vint8m1_t __riscv_vmulhsu_vv_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                     vuint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vmulhsu_vx_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                     uint8_t rs1, size_t vl);
vint8m2_t __riscv_vmulhsu_vv_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                     vuint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vmulhsu_vx_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                     uint8_t rs1, size_t vl);
vint8m4_t __riscv_vmulhsu_vv_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                     vuint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vmulhsu_vx_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                     uint8_t rs1, size_t vl);
vint8m8_t __riscv_vmulhsu_vv_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                     vuint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vmulhsu_vx_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                     uint8_t rs1, size_t vl);
vint16mf4_t __riscv_vmulhsu_vv_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                         vint16mf4_t vs2, vuint16mf4_t vs1,
                                         size_t vl);
vint16mf4_t __riscv_vmulhsu_vx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                         vint16mf4_t vs2, uint16_t rs1,
                                         size_t vl);
vint16mf2_t __riscv_vmulhsu_vv_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                         vint16mf2_t vs2, vuint16mf2_t vs1,
                                         size_t vl);
vint16mf2_t __riscv_vmulhsu_vx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                         vint16mf2_t vs2, uint16_t rs1,
                                         size_t vl);
vint16m1_t __riscv_vmulhsu_vv_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                       vint16m1_t vs2, vuint16m1_t vs1,
                                       size_t vl);
vint16m1_t __riscv_vmulhsu_vx_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                       vint16m1_t vs2, uint16_t rs1, size_t vl);
vint16m2_t __riscv_vmulhsu_vv_i16m2_mu(vbool8_t vm, vint16m2_t vd,
                                       vint16m2_t vs2, vuint16m2_t vs1,
                                       size_t vl);
vint16m2_t __riscv_vmulhsu_vx_i16m2_mu(vbool8_t vm, vint16m2_t vd,
                                       vint16m2_t vs2, uint16_t rs1, size_t vl);
vint16m4_t __riscv_vmulhsu_vv_i16m4_mu(vbool4_t vm, vint16m4_t vd,
                                       vint16m4_t vs2, vuint16m4_t vs1,
                                       size_t vl);
vint16m4_t __riscv_vmulhsu_vx_i16m4_mu(vbool4_t vm, vint16m4_t vd,
                                       vint16m4_t vs2, uint16_t rs1, size_t vl);
vint16m8_t __riscv_vmulhsu_vv_i16m8_mu(vbool2_t vm, vint16m8_t vd,
                                       vint16m8_t vs2, vuint16m8_t vs1,
                                       size_t vl);
vint16m8_t __riscv_vmulhsu_vx_i16m8_mu(vbool2_t vm, vint16m8_t vd,
                                       vint16m8_t vs2, uint16_t rs1, size_t vl);
vint32mf2_t __riscv_vmulhsu_vv_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                         vint32mf2_t vs2, vuint32mf2_t vs1,
                                         size_t vl);
vint32mf2_t __riscv_vmulhsu_vx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                         vint32mf2_t vs2, uint32_t rs1,
                                         size_t vl);
vint32m1_t __riscv_vmulhsu_vv_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                       vint32m1_t vs2, vuint32m1_t vs1,
                                       size_t vl);
vint32m1_t __riscv_vmulhsu_vx_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                       vint32m1_t vs2, uint32_t rs1, size_t vl);
vint32m2_t __riscv_vmulhsu_vv_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                       vint32m2_t vs2, vuint32m2_t vs1,
                                       size_t vl);
vint32m2_t __riscv_vmulhsu_vx_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                       vint32m2_t vs2, uint32_t rs1, size_t vl);
vint32m4_t __riscv_vmulhsu_vv_i32m4_mu(vbool8_t vm, vint32m4_t vd,
                                       vint32m4_t vs2, vuint32m4_t vs1,
                                       size_t vl);
vint32m4_t __riscv_vmulhsu_vx_i32m4_mu(vbool8_t vm, vint32m4_t vd,
                                       vint32m4_t vs2, uint32_t rs1, size_t vl);
vint32m8_t __riscv_vmulhsu_vv_i32m8_mu(vbool4_t vm, vint32m8_t vd,
                                       vint32m8_t vs2, vuint32m8_t vs1,
                                       size_t vl);
vint32m8_t __riscv_vmulhsu_vx_i32m8_mu(vbool4_t vm, vint32m8_t vd,
                                       vint32m8_t vs2, uint32_t rs1, size_t vl);
vint64m1_t __riscv_vmulhsu_vv_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                       vint64m1_t vs2, vuint64m1_t vs1,
                                       size_t vl);
vint64m1_t __riscv_vmulhsu_vx_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                       vint64m1_t vs2, uint64_t rs1, size_t vl);
vint64m2_t __riscv_vmulhsu_vv_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                       vint64m2_t vs2, vuint64m2_t vs1,
                                       size_t vl);
vint64m2_t __riscv_vmulhsu_vx_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                       vint64m2_t vs2, uint64_t rs1, size_t vl);
vint64m4_t __riscv_vmulhsu_vv_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                       vint64m4_t vs2, vuint64m4_t vs1,
                                       size_t vl);
vint64m4_t __riscv_vmulhsu_vx_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                       vint64m4_t vs2, uint64_t rs1, size_t vl);
vint64m8_t __riscv_vmulhsu_vv_i64m8_mu(vbool8_t vm, vint64m8_t vd,
                                       vint64m8_t vs2, vuint64m8_t vs1,
                                       size_t vl);
vint64m8_t __riscv_vmulhsu_vx_i64m8_mu(vbool8_t vm, vint64m8_t vd,
                                       vint64m8_t vs2, uint64_t rs1, size_t vl);
vuint8mf8_t __riscv_vmul_vv_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                     vuint8mf8_t vs2, vuint8mf8_t vs1,
                                     size_t vl);
vuint8mf8_t __riscv_vmul_vx_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                     vuint8mf8_t vs2, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vmul_vv_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                     vuint8mf4_t vs2, vuint8mf4_t vs1,
                                     size_t vl);
vuint8mf4_t __riscv_vmul_vx_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                     vuint8mf4_t vs2, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vmul_vv_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                     vuint8mf2_t vs2, vuint8mf2_t vs1,
                                     size_t vl);
vuint8mf2_t __riscv_vmul_vx_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                     vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vmul_vv_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                   vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vmul_vx_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                   uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vmul_vv_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                   vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vmul_vx_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                   uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vmul_vv_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                   vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vmul_vx_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                   uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vmul_vv_u8m8_mu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                   vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vmul_vx_u8m8_mu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                   uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vmul_vv_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                       vuint16mf4_t vs2, vuint16mf4_t vs1,
                                       size_t vl);
vuint16mf4_t __riscv_vmul_vx_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                       vuint16mf4_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16mf2_t __riscv_vmul_vv_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                       vuint16mf2_t vs2, vuint16mf2_t vs1,
                                       size_t vl);
vuint16mf2_t __riscv_vmul_vx_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                       vuint16mf2_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m1_t __riscv_vmul_vv_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                     vuint16m1_t vs2, vuint16m1_t vs1,
                                     size_t vl);
vuint16m1_t __riscv_vmul_vx_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                     vuint16m1_t vs2, uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vmul_vv_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                     vuint16m2_t vs2, vuint16m2_t vs1,
                                     size_t vl);
vuint16m2_t __riscv_vmul_vx_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                     vuint16m2_t vs2, uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vmul_vv_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                     vuint16m4_t vs2, vuint16m4_t vs1,
                                     size_t vl);
vuint16m4_t __riscv_vmul_vx_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                     vuint16m4_t vs2, uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vmul_vv_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                     vuint16m8_t vs2, vuint16m8_t vs1,
                                     size_t vl);
vuint16m8_t __riscv_vmul_vx_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                     vuint16m8_t vs2, uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vmul_vv_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                       vuint32mf2_t vs2, vuint32mf2_t vs1,
                                       size_t vl);
vuint32mf2_t __riscv_vmul_vx_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                       vuint32mf2_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m1_t __riscv_vmul_vv_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                     vuint32m1_t vs2, vuint32m1_t vs1,
                                     size_t vl);
vuint32m1_t __riscv_vmul_vx_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                     vuint32m1_t vs2, uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vmul_vv_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                     vuint32m2_t vs2, vuint32m2_t vs1,
                                     size_t vl);
vuint32m2_t __riscv_vmul_vx_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                     vuint32m2_t vs2, uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vmul_vv_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                     vuint32m4_t vs2, vuint32m4_t vs1,
                                     size_t vl);
vuint32m4_t __riscv_vmul_vx_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                     vuint32m4_t vs2, uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vmul_vv_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                     vuint32m8_t vs2, vuint32m8_t vs1,
                                     size_t vl);
vuint32m8_t __riscv_vmul_vx_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                     vuint32m8_t vs2, uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vmul_vv_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                     vuint64m1_t vs2, vuint64m1_t vs1,
                                     size_t vl);
vuint64m1_t __riscv_vmul_vx_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                     vuint64m1_t vs2, uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vmul_vv_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                     vuint64m2_t vs2, vuint64m2_t vs1,
                                     size_t vl);
vuint64m2_t __riscv_vmul_vx_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                     vuint64m2_t vs2, uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vmul_vv_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                     vuint64m4_t vs2, vuint64m4_t vs1,
                                     size_t vl);
vuint64m4_t __riscv_vmul_vx_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                     vuint64m4_t vs2, uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vmul_vv_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                     vuint64m8_t vs2, vuint64m8_t vs1,
                                     size_t vl);
vuint64m8_t __riscv_vmul_vx_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                     vuint64m8_t vs2, uint64_t rs1, size_t vl);
vuint8mf8_t __riscv_vmulhu_vv_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                       vuint8mf8_t vs2, vuint8mf8_t vs1,
                                       size_t vl);
vuint8mf8_t __riscv_vmulhu_vx_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                       vuint8mf8_t vs2, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vmulhu_vv_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                       vuint8mf4_t vs2, vuint8mf4_t vs1,
                                       size_t vl);
vuint8mf4_t __riscv_vmulhu_vx_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                       vuint8mf4_t vs2, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vmulhu_vv_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                       vuint8mf2_t vs2, vuint8mf2_t vs1,
                                       size_t vl);
vuint8mf2_t __riscv_vmulhu_vx_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                       vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vmulhu_vv_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                     vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vmulhu_vx_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vmulhu_vv_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                     vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vmulhu_vx_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vmulhu_vv_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                     vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vmulhu_vx_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vmulhu_vv_u8m8_mu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                     vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vmulhu_vx_u8m8_mu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                     uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vmulhu_vv_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs2, vuint16mf4_t vs1,
                                         size_t vl);
vuint16mf4_t __riscv_vmulhu_vx_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs2, uint16_t rs1,
                                         size_t vl);
vuint16mf2_t __riscv_vmulhu_vv_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs2, vuint16mf2_t vs1,
                                         size_t vl);
vuint16mf2_t __riscv_vmulhu_vx_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs2, uint16_t rs1,
                                         size_t vl);
vuint16m1_t __riscv_vmulhu_vv_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs2, vuint16m1_t vs1,
                                       size_t vl);
vuint16m1_t __riscv_vmulhu_vx_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m2_t __riscv_vmulhu_vv_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs2, vuint16m2_t vs1,
                                       size_t vl);
vuint16m2_t __riscv_vmulhu_vx_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m4_t __riscv_vmulhu_vv_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs2, vuint16m4_t vs1,
                                       size_t vl);
vuint16m4_t __riscv_vmulhu_vx_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m8_t __riscv_vmulhu_vv_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs2, vuint16m8_t vs1,
                                       size_t vl);
vuint16m8_t __riscv_vmulhu_vx_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs2, uint16_t rs1,
                                       size_t vl);
vuint32mf2_t __riscv_vmulhu_vv_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs2, vuint32mf2_t vs1,
                                         size_t vl);
vuint32mf2_t __riscv_vmulhu_vx_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs2, uint32_t rs1,
                                         size_t vl);
vuint32m1_t __riscv_vmulhu_vv_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs2, vuint32m1_t vs1,
                                       size_t vl);
vuint32m1_t __riscv_vmulhu_vx_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m2_t __riscv_vmulhu_vv_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs2, vuint32m2_t vs1,
                                       size_t vl);
vuint32m2_t __riscv_vmulhu_vx_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m4_t __riscv_vmulhu_vv_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs2, vuint32m4_t vs1,
                                       size_t vl);
vuint32m4_t __riscv_vmulhu_vx_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m8_t __riscv_vmulhu_vv_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs2, vuint32m8_t vs1,
                                       size_t vl);
vuint32m8_t __riscv_vmulhu_vx_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs2, uint32_t rs1,
                                       size_t vl);
vuint64m1_t __riscv_vmulhu_vv_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs2, vuint64m1_t vs1,
                                       size_t vl);
vuint64m1_t __riscv_vmulhu_vx_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m2_t __riscv_vmulhu_vv_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs2, vuint64m2_t vs1,
                                       size_t vl);
vuint64m2_t __riscv_vmulhu_vx_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m4_t __riscv_vmulhu_vv_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs2, vuint64m4_t vs1,
                                       size_t vl);
vuint64m4_t __riscv_vmulhu_vx_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m8_t __riscv_vmulhu_vv_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs2, vuint64m8_t vs1,
                                       size_t vl);
vuint64m8_t __riscv_vmulhu_vx_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs2, uint64_t rs1,
                                       size_t vl);
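
A short usage sketch of the masked multiply-high variants above (illustrative only; the helper name, the lane-selection scheme, and the constants are assumptions, not part of the intrinsic specification). It scales only even-indexed lanes of a u16 vector by a scalar, keeping the high half of the 16x16->32-bit product, while the "mu" (mask-undisturbed) policy leaves the odd lanes of the destination unchanged.

#include <riscv_vector.h>

// Hypothetical helper: even lanes receive the high half of src * k,
// odd lanes keep the previous contents of 'acc' (mask-undisturbed policy).
vuint16m1_t scale_even_lanes_hi(vuint16m1_t acc, vuint16m1_t src, uint16_t k,
                                size_t vl) {
  // Build a mask selecting even lane indices: (vid & 1) == 0.
  vuint16m1_t idx = __riscv_vid_v_u16m1(vl);
  vbool16_t even = __riscv_vmseq_vx_u16m1_b16(
      __riscv_vand_vx_u16m1(idx, 1, vl), 0, vl);
  // Masked high-half multiply; inactive lanes of 'acc' are left undisturbed.
  return __riscv_vmulhu_vx_u16m1_mu(even, acc, src, k, vl);
}

The same pattern applies to the _tumu variants, which additionally keep tail lanes of the destination undisturbed rather than leaving them agnostic.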

Vector Integer Divide Intrinsics
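
Before the listing, a brief usage sketch (the helper name, buffers, and loop structure are illustrative assumptions). These intrinsics perform truncating division and, as with the scalar M extension, division by zero does not trap: the quotient becomes all ones and the remainder equals the dividend. The sketch computes an elementwise quotient and remainder with the tail-undisturbed (_tu) variants in a strip-mined loop.

#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

// Hypothetical helper: q[i] = a[i] / b[i], r[i] = a[i] % b[i] for i < n.
void div_rem_i32(const int32_t *a, const int32_t *b, int32_t *q, int32_t *r,
                 size_t n) {
  // Destination operands for the _tu variants; tail lanes keep these values.
  vint32m1_t vq = __riscv_vmv_v_x_i32m1(0, __riscv_vsetvlmax_e32m1());
  vint32m1_t vr = vq;
  for (size_t i = 0; i < n;) {
    size_t vl = __riscv_vsetvl_e32m1(n - i);
    vint32m1_t va = __riscv_vle32_v_i32m1(a + i, vl);
    vint32m1_t vb = __riscv_vle32_v_i32m1(b + i, vl);
    // Truncating division; x / 0 yields -1 and x % 0 yields x, without trapping.
    vq = __riscv_vdiv_vv_i32m1_tu(vq, va, vb, vl);
    vr = __riscv_vrem_vv_i32m1_tu(vr, va, vb, vl);
    __riscv_vse32_v_i32m1(q + i, vq, vl);
    __riscv_vse32_v_i32m1(r + i, vr, vl);
    i += vl;
  }
}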

vint8mf8_t __riscv_vdiv_vv_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2,
                                    vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vdiv_vx_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2, int8_t rs1,
                                    size_t vl);
vint8mf4_t __riscv_vdiv_vv_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2,
                                    vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vdiv_vx_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2, int8_t rs1,
                                    size_t vl);
vint8mf2_t __riscv_vdiv_vv_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2,
                                    vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vdiv_vx_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2, int8_t rs1,
                                    size_t vl);
vint8m1_t __riscv_vdiv_vv_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, vint8m1_t vs1,
                                  size_t vl);
vint8m1_t __riscv_vdiv_vx_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, int8_t rs1,
                                  size_t vl);
vint8m2_t __riscv_vdiv_vv_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, vint8m2_t vs1,
                                  size_t vl);
vint8m2_t __riscv_vdiv_vx_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, int8_t rs1,
                                  size_t vl);
vint8m4_t __riscv_vdiv_vv_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, vint8m4_t vs1,
                                  size_t vl);
vint8m4_t __riscv_vdiv_vx_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, int8_t rs1,
                                  size_t vl);
vint8m8_t __riscv_vdiv_vv_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, vint8m8_t vs1,
                                  size_t vl);
vint8m8_t __riscv_vdiv_vx_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, int8_t rs1,
                                  size_t vl);
vint16mf4_t __riscv_vdiv_vv_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                      vint16mf4_t vs1, size_t vl);
vint16mf4_t __riscv_vdiv_vx_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                      int16_t rs1, size_t vl);
vint16mf2_t __riscv_vdiv_vv_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                      vint16mf2_t vs1, size_t vl);
vint16mf2_t __riscv_vdiv_vx_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                      int16_t rs1, size_t vl);
vint16m1_t __riscv_vdiv_vv_i16m1_tu(vint16m1_t vd, vint16m1_t vs2,
                                    vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vdiv_vx_i16m1_tu(vint16m1_t vd, vint16m1_t vs2, int16_t rs1,
                                    size_t vl);
vint16m2_t __riscv_vdiv_vv_i16m2_tu(vint16m2_t vd, vint16m2_t vs2,
                                    vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vdiv_vx_i16m2_tu(vint16m2_t vd, vint16m2_t vs2, int16_t rs1,
                                    size_t vl);
vint16m4_t __riscv_vdiv_vv_i16m4_tu(vint16m4_t vd, vint16m4_t vs2,
                                    vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vdiv_vx_i16m4_tu(vint16m4_t vd, vint16m4_t vs2, int16_t rs1,
                                    size_t vl);
vint16m8_t __riscv_vdiv_vv_i16m8_tu(vint16m8_t vd, vint16m8_t vs2,
                                    vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vdiv_vx_i16m8_tu(vint16m8_t vd, vint16m8_t vs2, int16_t rs1,
                                    size_t vl);
vint32mf2_t __riscv_vdiv_vv_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                      vint32mf2_t vs1, size_t vl);
vint32mf2_t __riscv_vdiv_vx_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                      int32_t rs1, size_t vl);
vint32m1_t __riscv_vdiv_vv_i32m1_tu(vint32m1_t vd, vint32m1_t vs2,
                                    vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vdiv_vx_i32m1_tu(vint32m1_t vd, vint32m1_t vs2, int32_t rs1,
                                    size_t vl);
vint32m2_t __riscv_vdiv_vv_i32m2_tu(vint32m2_t vd, vint32m2_t vs2,
                                    vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vdiv_vx_i32m2_tu(vint32m2_t vd, vint32m2_t vs2, int32_t rs1,
                                    size_t vl);
vint32m4_t __riscv_vdiv_vv_i32m4_tu(vint32m4_t vd, vint32m4_t vs2,
                                    vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vdiv_vx_i32m4_tu(vint32m4_t vd, vint32m4_t vs2, int32_t rs1,
                                    size_t vl);
vint32m8_t __riscv_vdiv_vv_i32m8_tu(vint32m8_t vd, vint32m8_t vs2,
                                    vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vdiv_vx_i32m8_tu(vint32m8_t vd, vint32m8_t vs2, int32_t rs1,
                                    size_t vl);
vint64m1_t __riscv_vdiv_vv_i64m1_tu(vint64m1_t vd, vint64m1_t vs2,
                                    vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vdiv_vx_i64m1_tu(vint64m1_t vd, vint64m1_t vs2, int64_t rs1,
                                    size_t vl);
vint64m2_t __riscv_vdiv_vv_i64m2_tu(vint64m2_t vd, vint64m2_t vs2,
                                    vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vdiv_vx_i64m2_tu(vint64m2_t vd, vint64m2_t vs2, int64_t rs1,
                                    size_t vl);
vint64m4_t __riscv_vdiv_vv_i64m4_tu(vint64m4_t vd, vint64m4_t vs2,
                                    vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vdiv_vx_i64m4_tu(vint64m4_t vd, vint64m4_t vs2, int64_t rs1,
                                    size_t vl);
vint64m8_t __riscv_vdiv_vv_i64m8_tu(vint64m8_t vd, vint64m8_t vs2,
                                    vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vdiv_vx_i64m8_tu(vint64m8_t vd, vint64m8_t vs2, int64_t rs1,
                                    size_t vl);
vint8mf8_t __riscv_vrem_vv_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2,
                                    vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vrem_vx_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2, int8_t rs1,
                                    size_t vl);
vint8mf4_t __riscv_vrem_vv_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2,
                                    vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vrem_vx_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2, int8_t rs1,
                                    size_t vl);
vint8mf2_t __riscv_vrem_vv_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2,
                                    vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vrem_vx_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2, int8_t rs1,
                                    size_t vl);
vint8m1_t __riscv_vrem_vv_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, vint8m1_t vs1,
                                  size_t vl);
vint8m1_t __riscv_vrem_vx_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, int8_t rs1,
                                  size_t vl);
vint8m2_t __riscv_vrem_vv_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, vint8m2_t vs1,
                                  size_t vl);
vint8m2_t __riscv_vrem_vx_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, int8_t rs1,
                                  size_t vl);
vint8m4_t __riscv_vrem_vv_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, vint8m4_t vs1,
                                  size_t vl);
vint8m4_t __riscv_vrem_vx_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, int8_t rs1,
                                  size_t vl);
vint8m8_t __riscv_vrem_vv_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, vint8m8_t vs1,
                                  size_t vl);
vint8m8_t __riscv_vrem_vx_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, int8_t rs1,
                                  size_t vl);
vint16mf4_t __riscv_vrem_vv_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                      vint16mf4_t vs1, size_t vl);
vint16mf4_t __riscv_vrem_vx_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                      int16_t rs1, size_t vl);
vint16mf2_t __riscv_vrem_vv_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                      vint16mf2_t vs1, size_t vl);
vint16mf2_t __riscv_vrem_vx_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                      int16_t rs1, size_t vl);
vint16m1_t __riscv_vrem_vv_i16m1_tu(vint16m1_t vd, vint16m1_t vs2,
                                    vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vrem_vx_i16m1_tu(vint16m1_t vd, vint16m1_t vs2, int16_t rs1,
                                    size_t vl);
vint16m2_t __riscv_vrem_vv_i16m2_tu(vint16m2_t vd, vint16m2_t vs2,
                                    vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vrem_vx_i16m2_tu(vint16m2_t vd, vint16m2_t vs2, int16_t rs1,
                                    size_t vl);
vint16m4_t __riscv_vrem_vv_i16m4_tu(vint16m4_t vd, vint16m4_t vs2,
                                    vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vrem_vx_i16m4_tu(vint16m4_t vd, vint16m4_t vs2, int16_t rs1,
                                    size_t vl);
vint16m8_t __riscv_vrem_vv_i16m8_tu(vint16m8_t vd, vint16m8_t vs2,
                                    vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vrem_vx_i16m8_tu(vint16m8_t vd, vint16m8_t vs2, int16_t rs1,
                                    size_t vl);
vint32mf2_t __riscv_vrem_vv_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                      vint32mf2_t vs1, size_t vl);
vint32mf2_t __riscv_vrem_vx_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                      int32_t rs1, size_t vl);
vint32m1_t __riscv_vrem_vv_i32m1_tu(vint32m1_t vd, vint32m1_t vs2,
                                    vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vrem_vx_i32m1_tu(vint32m1_t vd, vint32m1_t vs2, int32_t rs1,
                                    size_t vl);
vint32m2_t __riscv_vrem_vv_i32m2_tu(vint32m2_t vd, vint32m2_t vs2,
                                    vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vrem_vx_i32m2_tu(vint32m2_t vd, vint32m2_t vs2, int32_t rs1,
                                    size_t vl);
vint32m4_t __riscv_vrem_vv_i32m4_tu(vint32m4_t vd, vint32m4_t vs2,
                                    vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vrem_vx_i32m4_tu(vint32m4_t vd, vint32m4_t vs2, int32_t rs1,
                                    size_t vl);
vint32m8_t __riscv_vrem_vv_i32m8_tu(vint32m8_t vd, vint32m8_t vs2,
                                    vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vrem_vx_i32m8_tu(vint32m8_t vd, vint32m8_t vs2, int32_t rs1,
                                    size_t vl);
vint64m1_t __riscv_vrem_vv_i64m1_tu(vint64m1_t vd, vint64m1_t vs2,
                                    vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vrem_vx_i64m1_tu(vint64m1_t vd, vint64m1_t vs2, int64_t rs1,
                                    size_t vl);
vint64m2_t __riscv_vrem_vv_i64m2_tu(vint64m2_t vd, vint64m2_t vs2,
                                    vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vrem_vx_i64m2_tu(vint64m2_t vd, vint64m2_t vs2, int64_t rs1,
                                    size_t vl);
vint64m4_t __riscv_vrem_vv_i64m4_tu(vint64m4_t vd, vint64m4_t vs2,
                                    vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vrem_vx_i64m4_tu(vint64m4_t vd, vint64m4_t vs2, int64_t rs1,
                                    size_t vl);
vint64m8_t __riscv_vrem_vv_i64m8_tu(vint64m8_t vd, vint64m8_t vs2,
                                    vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vrem_vx_i64m8_tu(vint64m8_t vd, vint64m8_t vs2, int64_t rs1,
                                    size_t vl);
vuint8mf8_t __riscv_vdivu_vv_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                      vuint8mf8_t vs1, size_t vl);
vuint8mf8_t __riscv_vdivu_vx_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                      uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vdivu_vv_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                      vuint8mf4_t vs1, size_t vl);
vuint8mf4_t __riscv_vdivu_vx_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                      uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vdivu_vv_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                      vuint8mf2_t vs1, size_t vl);
vuint8mf2_t __riscv_vdivu_vx_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                      uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vdivu_vv_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2,
                                    vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vdivu_vx_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2, uint8_t rs1,
                                    size_t vl);
vuint8m2_t __riscv_vdivu_vv_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2,
                                    vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vdivu_vx_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2, uint8_t rs1,
                                    size_t vl);
vuint8m4_t __riscv_vdivu_vv_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2,
                                    vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vdivu_vx_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2, uint8_t rs1,
                                    size_t vl);
vuint8m8_t __riscv_vdivu_vv_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2,
                                    vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vdivu_vx_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2, uint8_t rs1,
                                    size_t vl);
vuint16mf4_t __riscv_vdivu_vv_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                        vuint16mf4_t vs1, size_t vl);
vuint16mf4_t __riscv_vdivu_vx_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                        uint16_t rs1, size_t vl);
vuint16mf2_t __riscv_vdivu_vv_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                        vuint16mf2_t vs1, size_t vl);
vuint16mf2_t __riscv_vdivu_vx_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                        uint16_t rs1, size_t vl);
vuint16m1_t __riscv_vdivu_vv_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                      vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vdivu_vx_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                      uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vdivu_vv_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                      vuint16m2_t vs1, size_t vl);
vuint16m2_t __riscv_vdivu_vx_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                      uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vdivu_vv_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                      vuint16m4_t vs1, size_t vl);
vuint16m4_t __riscv_vdivu_vx_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                      uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vdivu_vv_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                      vuint16m8_t vs1, size_t vl);
vuint16m8_t __riscv_vdivu_vx_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                      uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vdivu_vv_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                        vuint32mf2_t vs1, size_t vl);
vuint32mf2_t __riscv_vdivu_vx_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                        uint32_t rs1, size_t vl);
vuint32m1_t __riscv_vdivu_vv_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                      vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vdivu_vx_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                      uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vdivu_vv_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                      vuint32m2_t vs1, size_t vl);
vuint32m2_t __riscv_vdivu_vx_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                      uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vdivu_vv_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                      vuint32m4_t vs1, size_t vl);
vuint32m4_t __riscv_vdivu_vx_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                      uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vdivu_vv_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                      vuint32m8_t vs1, size_t vl);
vuint32m8_t __riscv_vdivu_vx_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                      uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vdivu_vv_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                      vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vdivu_vx_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                      uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vdivu_vv_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                      vuint64m2_t vs1, size_t vl);
vuint64m2_t __riscv_vdivu_vx_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                      uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vdivu_vv_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                      vuint64m4_t vs1, size_t vl);
vuint64m4_t __riscv_vdivu_vx_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                      uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vdivu_vv_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                      vuint64m8_t vs1, size_t vl);
vuint64m8_t __riscv_vdivu_vx_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                      uint64_t rs1, size_t vl);
vuint8mf8_t __riscv_vremu_vv_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                      vuint8mf8_t vs1, size_t vl);
vuint8mf8_t __riscv_vremu_vx_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                      uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vremu_vv_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                      vuint8mf4_t vs1, size_t vl);
vuint8mf4_t __riscv_vremu_vx_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                      uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vremu_vv_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                      vuint8mf2_t vs1, size_t vl);
vuint8mf2_t __riscv_vremu_vx_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                      uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vremu_vv_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2,
                                    vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vremu_vx_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2, uint8_t rs1,
                                    size_t vl);
vuint8m2_t __riscv_vremu_vv_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2,
                                    vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vremu_vx_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2, uint8_t rs1,
                                    size_t vl);
vuint8m4_t __riscv_vremu_vv_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2,
                                    vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vremu_vx_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2, uint8_t rs1,
                                    size_t vl);
vuint8m8_t __riscv_vremu_vv_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2,
                                    vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vremu_vx_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2, uint8_t rs1,
                                    size_t vl);
vuint16mf4_t __riscv_vremu_vv_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                        vuint16mf4_t vs1, size_t vl);
vuint16mf4_t __riscv_vremu_vx_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                        uint16_t rs1, size_t vl);
vuint16mf2_t __riscv_vremu_vv_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                        vuint16mf2_t vs1, size_t vl);
vuint16mf2_t __riscv_vremu_vx_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                        uint16_t rs1, size_t vl);
vuint16m1_t __riscv_vremu_vv_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                      vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vremu_vx_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                      uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vremu_vv_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                      vuint16m2_t vs1, size_t vl);
vuint16m2_t __riscv_vremu_vx_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                      uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vremu_vv_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                      vuint16m4_t vs1, size_t vl);
vuint16m4_t __riscv_vremu_vx_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                      uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vremu_vv_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                      vuint16m8_t vs1, size_t vl);
vuint16m8_t __riscv_vremu_vx_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                      uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vremu_vv_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                        vuint32mf2_t vs1, size_t vl);
vuint32mf2_t __riscv_vremu_vx_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                        uint32_t rs1, size_t vl);
vuint32m1_t __riscv_vremu_vv_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                      vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vremu_vx_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                      uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vremu_vv_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                      vuint32m2_t vs1, size_t vl);
vuint32m2_t __riscv_vremu_vx_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                      uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vremu_vv_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                      vuint32m4_t vs1, size_t vl);
vuint32m4_t __riscv_vremu_vx_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                      uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vremu_vv_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                      vuint32m8_t vs1, size_t vl);
vuint32m8_t __riscv_vremu_vx_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                      uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vremu_vv_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                      vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vremu_vx_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                      uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vremu_vv_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                      vuint64m2_t vs1, size_t vl);
vuint64m2_t __riscv_vremu_vx_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                      uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vremu_vv_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                      vuint64m4_t vs1, size_t vl);
vuint64m4_t __riscv_vremu_vx_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                      uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vremu_vv_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                      vuint64m8_t vs1, size_t vl);
vuint64m8_t __riscv_vremu_vx_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                      uint64_t rs1, size_t vl);
// masked functions
vint8mf8_t __riscv_vdiv_vv_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                     vint8mf8_t vs2, vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vdiv_vx_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                     vint8mf8_t vs2, int8_t rs1, size_t vl);
vint8mf4_t __riscv_vdiv_vv_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                     vint8mf4_t vs2, vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vdiv_vx_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                     vint8mf4_t vs2, int8_t rs1, size_t vl);
vint8mf2_t __riscv_vdiv_vv_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                     vint8mf2_t vs2, vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vdiv_vx_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                     vint8mf2_t vs2, int8_t rs1, size_t vl);
vint8m1_t __riscv_vdiv_vv_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                   vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vdiv_vx_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                   int8_t rs1, size_t vl);
vint8m2_t __riscv_vdiv_vv_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                   vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vdiv_vx_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                   int8_t rs1, size_t vl);
vint8m4_t __riscv_vdiv_vv_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                   vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vdiv_vx_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                   int8_t rs1, size_t vl);
vint8m8_t __riscv_vdiv_vv_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                   vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vdiv_vx_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                   int8_t rs1, size_t vl);
vint16mf4_t __riscv_vdiv_vv_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs2, vint16mf4_t vs1,
                                       size_t vl);
vint16mf4_t __riscv_vdiv_vx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs2, int16_t rs1, size_t vl);
vint16mf2_t __riscv_vdiv_vv_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs2, vint16mf2_t vs1,
                                       size_t vl);
vint16mf2_t __riscv_vdiv_vx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs2, int16_t rs1, size_t vl);
vint16m1_t __riscv_vdiv_vv_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs2, vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vdiv_vx_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs2, int16_t rs1, size_t vl);
vint16m2_t __riscv_vdiv_vv_i16m2_tum(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                     vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vdiv_vx_i16m2_tum(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                     int16_t rs1, size_t vl);
vint16m4_t __riscv_vdiv_vv_i16m4_tum(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                     vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vdiv_vx_i16m4_tum(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                     int16_t rs1, size_t vl);
vint16m8_t __riscv_vdiv_vv_i16m8_tum(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                     vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vdiv_vx_i16m8_tum(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                     int16_t rs1, size_t vl);
vint32mf2_t __riscv_vdiv_vv_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs2, vint32mf2_t vs1,
                                       size_t vl);
vint32mf2_t __riscv_vdiv_vx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs2, int32_t rs1, size_t vl);
vint32m1_t __riscv_vdiv_vv_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs2, vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vdiv_vx_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs2, int32_t rs1, size_t vl);
vint32m2_t __riscv_vdiv_vv_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs2, vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vdiv_vx_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs2, int32_t rs1, size_t vl);
vint32m4_t __riscv_vdiv_vv_i32m4_tum(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                     vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vdiv_vx_i32m4_tum(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                     int32_t rs1, size_t vl);
vint32m8_t __riscv_vdiv_vv_i32m8_tum(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                     vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vdiv_vx_i32m8_tum(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                     int32_t rs1, size_t vl);
vint64m1_t __riscv_vdiv_vv_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs2, vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vdiv_vx_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs2, int64_t rs1, size_t vl);
vint64m2_t __riscv_vdiv_vv_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs2, vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vdiv_vx_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs2, int64_t rs1, size_t vl);
vint64m4_t __riscv_vdiv_vv_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs2, vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vdiv_vx_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs2, int64_t rs1, size_t vl);
vint64m8_t __riscv_vdiv_vv_i64m8_tum(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                     vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vdiv_vx_i64m8_tum(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                     int64_t rs1, size_t vl);
vint8mf8_t __riscv_vrem_vv_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                     vint8mf8_t vs2, vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vrem_vx_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                     vint8mf8_t vs2, int8_t rs1, size_t vl);
vint8mf4_t __riscv_vrem_vv_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                     vint8mf4_t vs2, vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vrem_vx_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                     vint8mf4_t vs2, int8_t rs1, size_t vl);
vint8mf2_t __riscv_vrem_vv_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                     vint8mf2_t vs2, vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vrem_vx_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                     vint8mf2_t vs2, int8_t rs1, size_t vl);
vint8m1_t __riscv_vrem_vv_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                   vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vrem_vx_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                   int8_t rs1, size_t vl);
vint8m2_t __riscv_vrem_vv_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                   vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vrem_vx_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                   int8_t rs1, size_t vl);
vint8m4_t __riscv_vrem_vv_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                   vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vrem_vx_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                   int8_t rs1, size_t vl);
vint8m8_t __riscv_vrem_vv_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                   vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vrem_vx_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                   int8_t rs1, size_t vl);
vint16mf4_t __riscv_vrem_vv_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs2, vint16mf4_t vs1,
                                       size_t vl);
vint16mf4_t __riscv_vrem_vx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs2, int16_t rs1, size_t vl);
vint16mf2_t __riscv_vrem_vv_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs2, vint16mf2_t vs1,
                                       size_t vl);
vint16mf2_t __riscv_vrem_vx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs2, int16_t rs1, size_t vl);
vint16m1_t __riscv_vrem_vv_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs2, vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vrem_vx_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs2, int16_t rs1, size_t vl);
vint16m2_t __riscv_vrem_vv_i16m2_tum(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                     vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vrem_vx_i16m2_tum(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                     int16_t rs1, size_t vl);
vint16m4_t __riscv_vrem_vv_i16m4_tum(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                     vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vrem_vx_i16m4_tum(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                     int16_t rs1, size_t vl);
vint16m8_t __riscv_vrem_vv_i16m8_tum(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                     vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vrem_vx_i16m8_tum(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                     int16_t rs1, size_t vl);
vint32mf2_t __riscv_vrem_vv_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs2, vint32mf2_t vs1,
                                       size_t vl);
vint32mf2_t __riscv_vrem_vx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs2, int32_t rs1, size_t vl);
vint32m1_t __riscv_vrem_vv_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs2, vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vrem_vx_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs2, int32_t rs1, size_t vl);
vint32m2_t __riscv_vrem_vv_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs2, vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vrem_vx_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs2, int32_t rs1, size_t vl);
vint32m4_t __riscv_vrem_vv_i32m4_tum(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                     vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vrem_vx_i32m4_tum(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                     int32_t rs1, size_t vl);
vint32m8_t __riscv_vrem_vv_i32m8_tum(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                     vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vrem_vx_i32m8_tum(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                     int32_t rs1, size_t vl);
vint64m1_t __riscv_vrem_vv_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs2, vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vrem_vx_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs2, int64_t rs1, size_t vl);
vint64m2_t __riscv_vrem_vv_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs2, vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vrem_vx_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs2, int64_t rs1, size_t vl);
vint64m4_t __riscv_vrem_vv_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs2, vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vrem_vx_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs2, int64_t rs1, size_t vl);
vint64m8_t __riscv_vrem_vv_i64m8_tum(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                     vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vrem_vx_i64m8_tum(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                     int64_t rs1, size_t vl);
vuint8mf8_t __riscv_vdivu_vv_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                       vuint8mf8_t vs2, vuint8mf8_t vs1,
                                       size_t vl);
vuint8mf8_t __riscv_vdivu_vx_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                       vuint8mf8_t vs2, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vdivu_vv_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                       vuint8mf4_t vs2, vuint8mf4_t vs1,
                                       size_t vl);
vuint8mf4_t __riscv_vdivu_vx_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                       vuint8mf4_t vs2, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vdivu_vv_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                       vuint8mf2_t vs2, vuint8mf2_t vs1,
                                       size_t vl);
vuint8mf2_t __riscv_vdivu_vx_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                       vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vdivu_vv_u8m1_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                     vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vdivu_vx_u8m1_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vdivu_vv_u8m2_tum(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                     vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vdivu_vx_u8m2_tum(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vdivu_vv_u8m4_tum(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                     vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vdivu_vx_u8m4_tum(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vdivu_vv_u8m8_tum(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                     vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vdivu_vx_u8m8_tum(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                     uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vdivu_vv_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs2, vuint16mf4_t vs1,
                                         size_t vl);
vuint16mf4_t __riscv_vdivu_vx_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs2, uint16_t rs1,
                                         size_t vl);
vuint16mf2_t __riscv_vdivu_vv_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs2, vuint16mf2_t vs1,
                                         size_t vl);
vuint16mf2_t __riscv_vdivu_vx_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs2, uint16_t rs1,
                                         size_t vl);
vuint16m1_t __riscv_vdivu_vv_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs2, vuint16m1_t vs1,
                                       size_t vl);
vuint16m1_t __riscv_vdivu_vx_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m2_t __riscv_vdivu_vv_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs2, vuint16m2_t vs1,
                                       size_t vl);
vuint16m2_t __riscv_vdivu_vx_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m4_t __riscv_vdivu_vv_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs2, vuint16m4_t vs1,
                                       size_t vl);
vuint16m4_t __riscv_vdivu_vx_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m8_t __riscv_vdivu_vv_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs2, vuint16m8_t vs1,
                                       size_t vl);
vuint16m8_t __riscv_vdivu_vx_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs2, uint16_t rs1,
                                       size_t vl);
vuint32mf2_t __riscv_vdivu_vv_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs2, vuint32mf2_t vs1,
                                         size_t vl);
vuint32mf2_t __riscv_vdivu_vx_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs2, uint32_t rs1,
                                         size_t vl);
vuint32m1_t __riscv_vdivu_vv_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs2, vuint32m1_t vs1,
                                       size_t vl);
vuint32m1_t __riscv_vdivu_vx_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m2_t __riscv_vdivu_vv_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs2, vuint32m2_t vs1,
                                       size_t vl);
vuint32m2_t __riscv_vdivu_vx_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m4_t __riscv_vdivu_vv_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs2, vuint32m4_t vs1,
                                       size_t vl);
vuint32m4_t __riscv_vdivu_vx_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m8_t __riscv_vdivu_vv_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs2, vuint32m8_t vs1,
                                       size_t vl);
vuint32m8_t __riscv_vdivu_vx_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs2, uint32_t rs1,
                                       size_t vl);
vuint64m1_t __riscv_vdivu_vv_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs2, vuint64m1_t vs1,
                                       size_t vl);
vuint64m1_t __riscv_vdivu_vx_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m2_t __riscv_vdivu_vv_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs2, vuint64m2_t vs1,
                                       size_t vl);
vuint64m2_t __riscv_vdivu_vx_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m4_t __riscv_vdivu_vv_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs2, vuint64m4_t vs1,
                                       size_t vl);
vuint64m4_t __riscv_vdivu_vx_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m8_t __riscv_vdivu_vv_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs2, vuint64m8_t vs1,
                                       size_t vl);
vuint64m8_t __riscv_vdivu_vx_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs2, uint64_t rs1,
                                       size_t vl);
vuint8mf8_t __riscv_vremu_vv_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                       vuint8mf8_t vs2, vuint8mf8_t vs1,
                                       size_t vl);
vuint8mf8_t __riscv_vremu_vx_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                       vuint8mf8_t vs2, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vremu_vv_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                       vuint8mf4_t vs2, vuint8mf4_t vs1,
                                       size_t vl);
vuint8mf4_t __riscv_vremu_vx_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                       vuint8mf4_t vs2, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vremu_vv_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                       vuint8mf2_t vs2, vuint8mf2_t vs1,
                                       size_t vl);
vuint8mf2_t __riscv_vremu_vx_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                       vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vremu_vv_u8m1_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                     vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vremu_vx_u8m1_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vremu_vv_u8m2_tum(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                     vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vremu_vx_u8m2_tum(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vremu_vv_u8m4_tum(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                     vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vremu_vx_u8m4_tum(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                     uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vremu_vv_u8m8_tum(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                     vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vremu_vx_u8m8_tum(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                     uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vremu_vv_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs2, vuint16mf4_t vs1,
                                         size_t vl);
vuint16mf4_t __riscv_vremu_vx_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs2, uint16_t rs1,
                                         size_t vl);
vuint16mf2_t __riscv_vremu_vv_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs2, vuint16mf2_t vs1,
                                         size_t vl);
vuint16mf2_t __riscv_vremu_vx_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs2, uint16_t rs1,
                                         size_t vl);
vuint16m1_t __riscv_vremu_vv_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs2, vuint16m1_t vs1,
                                       size_t vl);
vuint16m1_t __riscv_vremu_vx_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m2_t __riscv_vremu_vv_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs2, vuint16m2_t vs1,
                                       size_t vl);
vuint16m2_t __riscv_vremu_vx_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m4_t __riscv_vremu_vv_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs2, vuint16m4_t vs1,
                                       size_t vl);
vuint16m4_t __riscv_vremu_vx_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs2, uint16_t rs1,
                                       size_t vl);
vuint16m8_t __riscv_vremu_vv_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs2, vuint16m8_t vs1,
                                       size_t vl);
vuint16m8_t __riscv_vremu_vx_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs2, uint16_t rs1,
                                       size_t vl);
vuint32mf2_t __riscv_vremu_vv_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs2, vuint32mf2_t vs1,
                                         size_t vl);
vuint32mf2_t __riscv_vremu_vx_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs2, uint32_t rs1,
                                         size_t vl);
vuint32m1_t __riscv_vremu_vv_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs2, vuint32m1_t vs1,
                                       size_t vl);
vuint32m1_t __riscv_vremu_vx_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m2_t __riscv_vremu_vv_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs2, vuint32m2_t vs1,
                                       size_t vl);
vuint32m2_t __riscv_vremu_vx_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m4_t __riscv_vremu_vv_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs2, vuint32m4_t vs1,
                                       size_t vl);
vuint32m4_t __riscv_vremu_vx_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs2, uint32_t rs1,
                                       size_t vl);
vuint32m8_t __riscv_vremu_vv_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs2, vuint32m8_t vs1,
                                       size_t vl);
vuint32m8_t __riscv_vremu_vx_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs2, uint32_t rs1,
                                       size_t vl);
vuint64m1_t __riscv_vremu_vv_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs2, vuint64m1_t vs1,
                                       size_t vl);
vuint64m1_t __riscv_vremu_vx_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m2_t __riscv_vremu_vv_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs2, vuint64m2_t vs1,
                                       size_t vl);
vuint64m2_t __riscv_vremu_vx_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m4_t __riscv_vremu_vv_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs2, vuint64m4_t vs1,
                                       size_t vl);
vuint64m4_t __riscv_vremu_vx_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs2, uint64_t rs1,
                                       size_t vl);
vuint64m8_t __riscv_vremu_vv_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs2, vuint64m8_t vs1,
                                       size_t vl);
vuint64m8_t __riscv_vremu_vx_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs2, uint64_t rs1,
                                       size_t vl);
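// Example (not part of the generated listing): a sketch of the masked,
// tail-undisturbed (_tum) remainder intrinsics above, assuming
// <riscv_vector.h>; the function and buffer names are hypothetical.  The mask
// selects lanes with a non-zero divisor; because _tum uses the mask-agnostic
// policy, masked-off lanes of the result are unspecified, so a masked store is
// used to leave rem[] untouched there (the _tumu variants listed below take
// masked-off elements from vd instead).  Tail lanes at indices >= vl are taken
// from the vd operand.
#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

void remu_nonzero_tum(uint32_t *rem, const uint32_t *a, const uint32_t *b,
                      size_t n) {
  for (size_t i = 0; i < n;) {
    size_t vl = __riscv_vsetvl_e32m2(n - i);
    vuint32m2_t va = __riscv_vle32_v_u32m2(a + i, vl);      // dividends (vs2)
    vuint32m2_t vb = __riscv_vle32_v_u32m2(b + i, vl);      // divisors (vs1)
    vuint32m2_t vd = __riscv_vle32_v_u32m2(rem + i, vl);    // passthrough (vd)
    vbool16_t nz = __riscv_vmsne_vx_u32m2_b16(vb, 0, vl);   // active where b[i] != 0
    vuint32m2_t vr = __riscv_vremu_vv_u32m2_tum(nz, vd, va, vb, vl);
    __riscv_vse32_v_u32m2_m(nz, rem + i, vr, vl);           // store active lanes only
    i += vl;
  }
}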
// masked functions
vint8mf8_t __riscv_vdiv_vv_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                      vint8mf8_t vs2, vint8mf8_t vs1,
                                      size_t vl);
vint8mf8_t __riscv_vdiv_vx_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                      vint8mf8_t vs2, int8_t rs1, size_t vl);
vint8mf4_t __riscv_vdiv_vv_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                      vint8mf4_t vs2, vint8mf4_t vs1,
                                      size_t vl);
vint8mf4_t __riscv_vdiv_vx_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                      vint8mf4_t vs2, int8_t rs1, size_t vl);
vint8mf2_t __riscv_vdiv_vv_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                      vint8mf2_t vs2, vint8mf2_t vs1,
                                      size_t vl);
vint8mf2_t __riscv_vdiv_vx_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                      vint8mf2_t vs2, int8_t rs1, size_t vl);
vint8m1_t __riscv_vdiv_vv_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                    vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vdiv_vx_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                    int8_t rs1, size_t vl);
vint8m2_t __riscv_vdiv_vv_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                    vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vdiv_vx_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                    int8_t rs1, size_t vl);
vint8m4_t __riscv_vdiv_vv_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                    vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vdiv_vx_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                    int8_t rs1, size_t vl);
vint8m8_t __riscv_vdiv_vv_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                    vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vdiv_vx_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                    int8_t rs1, size_t vl);
vint16mf4_t __riscv_vdiv_vv_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs2, vint16mf4_t vs1,
                                        size_t vl);
vint16mf4_t __riscv_vdiv_vx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs2, int16_t rs1,
                                        size_t vl);
vint16mf2_t __riscv_vdiv_vv_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs2, vint16mf2_t vs1,
                                        size_t vl);
vint16mf2_t __riscv_vdiv_vx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs2, int16_t rs1,
                                        size_t vl);
vint16m1_t __riscv_vdiv_vv_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs2, vint16m1_t vs1,
                                      size_t vl);
vint16m1_t __riscv_vdiv_vx_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs2, int16_t rs1, size_t vl);
vint16m2_t __riscv_vdiv_vv_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs2, vint16m2_t vs1,
                                      size_t vl);
vint16m2_t __riscv_vdiv_vx_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs2, int16_t rs1, size_t vl);
vint16m4_t __riscv_vdiv_vv_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs2, vint16m4_t vs1,
                                      size_t vl);
vint16m4_t __riscv_vdiv_vx_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs2, int16_t rs1, size_t vl);
vint16m8_t __riscv_vdiv_vv_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs2, vint16m8_t vs1,
                                      size_t vl);
vint16m8_t __riscv_vdiv_vx_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs2, int16_t rs1, size_t vl);
vint32mf2_t __riscv_vdiv_vv_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs2, vint32mf2_t vs1,
                                        size_t vl);
vint32mf2_t __riscv_vdiv_vx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs2, int32_t rs1,
                                        size_t vl);
vint32m1_t __riscv_vdiv_vv_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs2, vint32m1_t vs1,
                                      size_t vl);
vint32m1_t __riscv_vdiv_vx_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs2, int32_t rs1, size_t vl);
vint32m2_t __riscv_vdiv_vv_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs2, vint32m2_t vs1,
                                      size_t vl);
vint32m2_t __riscv_vdiv_vx_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs2, int32_t rs1, size_t vl);
vint32m4_t __riscv_vdiv_vv_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs2, vint32m4_t vs1,
                                      size_t vl);
vint32m4_t __riscv_vdiv_vx_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs2, int32_t rs1, size_t vl);
vint32m8_t __riscv_vdiv_vv_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs2, vint32m8_t vs1,
                                      size_t vl);
vint32m8_t __riscv_vdiv_vx_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs2, int32_t rs1, size_t vl);
vint64m1_t __riscv_vdiv_vv_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs2, vint64m1_t vs1,
                                      size_t vl);
vint64m1_t __riscv_vdiv_vx_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs2, int64_t rs1, size_t vl);
vint64m2_t __riscv_vdiv_vv_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs2, vint64m2_t vs1,
                                      size_t vl);
vint64m2_t __riscv_vdiv_vx_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs2, int64_t rs1, size_t vl);
vint64m4_t __riscv_vdiv_vv_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs2, vint64m4_t vs1,
                                      size_t vl);
vint64m4_t __riscv_vdiv_vx_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs2, int64_t rs1, size_t vl);
vint64m8_t __riscv_vdiv_vv_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs2, vint64m8_t vs1,
                                      size_t vl);
vint64m8_t __riscv_vdiv_vx_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs2, int64_t rs1, size_t vl);
vint8mf8_t __riscv_vrem_vv_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                      vint8mf8_t vs2, vint8mf8_t vs1,
                                      size_t vl);
vint8mf8_t __riscv_vrem_vx_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                      vint8mf8_t vs2, int8_t rs1, size_t vl);
vint8mf4_t __riscv_vrem_vv_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                      vint8mf4_t vs2, vint8mf4_t vs1,
                                      size_t vl);
vint8mf4_t __riscv_vrem_vx_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                      vint8mf4_t vs2, int8_t rs1, size_t vl);
vint8mf2_t __riscv_vrem_vv_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                      vint8mf2_t vs2, vint8mf2_t vs1,
                                      size_t vl);
vint8mf2_t __riscv_vrem_vx_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                      vint8mf2_t vs2, int8_t rs1, size_t vl);
vint8m1_t __riscv_vrem_vv_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                    vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vrem_vx_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                    int8_t rs1, size_t vl);
vint8m2_t __riscv_vrem_vv_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                    vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vrem_vx_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                    int8_t rs1, size_t vl);
vint8m4_t __riscv_vrem_vv_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                    vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vrem_vx_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                    int8_t rs1, size_t vl);
vint8m8_t __riscv_vrem_vv_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                    vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vrem_vx_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                    int8_t rs1, size_t vl);
vint16mf4_t __riscv_vrem_vv_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs2, vint16mf4_t vs1,
                                        size_t vl);
vint16mf4_t __riscv_vrem_vx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs2, int16_t rs1,
                                        size_t vl);
vint16mf2_t __riscv_vrem_vv_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs2, vint16mf2_t vs1,
                                        size_t vl);
vint16mf2_t __riscv_vrem_vx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs2, int16_t rs1,
                                        size_t vl);
vint16m1_t __riscv_vrem_vv_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs2, vint16m1_t vs1,
                                      size_t vl);
vint16m1_t __riscv_vrem_vx_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs2, int16_t rs1, size_t vl);
vint16m2_t __riscv_vrem_vv_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs2, vint16m2_t vs1,
                                      size_t vl);
vint16m2_t __riscv_vrem_vx_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs2, int16_t rs1, size_t vl);
vint16m4_t __riscv_vrem_vv_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs2, vint16m4_t vs1,
                                      size_t vl);
vint16m4_t __riscv_vrem_vx_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs2, int16_t rs1, size_t vl);
vint16m8_t __riscv_vrem_vv_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs2, vint16m8_t vs1,
                                      size_t vl);
vint16m8_t __riscv_vrem_vx_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs2, int16_t rs1, size_t vl);
vint32mf2_t __riscv_vrem_vv_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs2, vint32mf2_t vs1,
                                        size_t vl);
vint32mf2_t __riscv_vrem_vx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs2, int32_t rs1,
                                        size_t vl);
vint32m1_t __riscv_vrem_vv_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs2, vint32m1_t vs1,
                                      size_t vl);
vint32m1_t __riscv_vrem_vx_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs2, int32_t rs1, size_t vl);
vint32m2_t __riscv_vrem_vv_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs2, vint32m2_t vs1,
                                      size_t vl);
vint32m2_t __riscv_vrem_vx_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs2, int32_t rs1, size_t vl);
vint32m4_t __riscv_vrem_vv_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs2, vint32m4_t vs1,
                                      size_t vl);
vint32m4_t __riscv_vrem_vx_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs2, int32_t rs1, size_t vl);
vint32m8_t __riscv_vrem_vv_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs2, vint32m8_t vs1,
                                      size_t vl);
vint32m8_t __riscv_vrem_vx_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs2, int32_t rs1, size_t vl);
vint64m1_t __riscv_vrem_vv_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs2, vint64m1_t vs1,
                                      size_t vl);
vint64m1_t __riscv_vrem_vx_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs2, int64_t rs1, size_t vl);
vint64m2_t __riscv_vrem_vv_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs2, vint64m2_t vs1,
                                      size_t vl);
vint64m2_t __riscv_vrem_vx_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs2, int64_t rs1, size_t vl);
vint64m4_t __riscv_vrem_vv_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs2, vint64m4_t vs1,
                                      size_t vl);
vint64m4_t __riscv_vrem_vx_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs2, int64_t rs1, size_t vl);
vint64m8_t __riscv_vrem_vv_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs2, vint64m8_t vs1,
                                      size_t vl);
vint64m8_t __riscv_vrem_vx_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs2, int64_t rs1, size_t vl);
vuint8mf8_t __riscv_vdivu_vv_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                        vuint8mf8_t vs2, vuint8mf8_t vs1,
                                        size_t vl);
vuint8mf8_t __riscv_vdivu_vx_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                        vuint8mf8_t vs2, uint8_t rs1,
                                        size_t vl);
vuint8mf4_t __riscv_vdivu_vv_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                        vuint8mf4_t vs2, vuint8mf4_t vs1,
                                        size_t vl);
vuint8mf4_t __riscv_vdivu_vx_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                        vuint8mf4_t vs2, uint8_t rs1,
                                        size_t vl);
vuint8mf2_t __riscv_vdivu_vv_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                        vuint8mf2_t vs2, vuint8mf2_t vs1,
                                        size_t vl);
vuint8mf2_t __riscv_vdivu_vx_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                        vuint8mf2_t vs2, uint8_t rs1,
                                        size_t vl);
vuint8m1_t __riscv_vdivu_vv_u8m1_tumu(vbool8_t vm, vuint8m1_t vd,
                                      vuint8m1_t vs2, vuint8m1_t vs1,
                                      size_t vl);
vuint8m1_t __riscv_vdivu_vx_u8m1_tumu(vbool8_t vm, vuint8m1_t vd,
                                      vuint8m1_t vs2, uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vdivu_vv_u8m2_tumu(vbool4_t vm, vuint8m2_t vd,
                                      vuint8m2_t vs2, vuint8m2_t vs1,
                                      size_t vl);
vuint8m2_t __riscv_vdivu_vx_u8m2_tumu(vbool4_t vm, vuint8m2_t vd,
                                      vuint8m2_t vs2, uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vdivu_vv_u8m4_tumu(vbool2_t vm, vuint8m4_t vd,
                                      vuint8m4_t vs2, vuint8m4_t vs1,
                                      size_t vl);
vuint8m4_t __riscv_vdivu_vx_u8m4_tumu(vbool2_t vm, vuint8m4_t vd,
                                      vuint8m4_t vs2, uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vdivu_vv_u8m8_tumu(vbool1_t vm, vuint8m8_t vd,
                                      vuint8m8_t vs2, vuint8m8_t vs1,
                                      size_t vl);
vuint8m8_t __riscv_vdivu_vx_u8m8_tumu(vbool1_t vm, vuint8m8_t vd,
                                      vuint8m8_t vs2, uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vdivu_vv_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                          vuint16mf4_t vs2, vuint16mf4_t vs1,
                                          size_t vl);
vuint16mf4_t __riscv_vdivu_vx_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                          vuint16mf4_t vs2, uint16_t rs1,
                                          size_t vl);
vuint16mf2_t __riscv_vdivu_vv_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                          vuint16mf2_t vs2, vuint16mf2_t vs1,
                                          size_t vl);
vuint16mf2_t __riscv_vdivu_vx_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                          vuint16mf2_t vs2, uint16_t rs1,
                                          size_t vl);
vuint16m1_t __riscv_vdivu_vv_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                        vuint16m1_t vs2, vuint16m1_t vs1,
                                        size_t vl);
vuint16m1_t __riscv_vdivu_vx_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                        vuint16m1_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16m2_t __riscv_vdivu_vv_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                        vuint16m2_t vs2, vuint16m2_t vs1,
                                        size_t vl);
vuint16m2_t __riscv_vdivu_vx_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                        vuint16m2_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16m4_t __riscv_vdivu_vv_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                        vuint16m4_t vs2, vuint16m4_t vs1,
                                        size_t vl);
vuint16m4_t __riscv_vdivu_vx_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                        vuint16m4_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16m8_t __riscv_vdivu_vv_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                        vuint16m8_t vs2, vuint16m8_t vs1,
                                        size_t vl);
vuint16m8_t __riscv_vdivu_vx_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                        vuint16m8_t vs2, uint16_t rs1,
                                        size_t vl);
vuint32mf2_t __riscv_vdivu_vv_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                          vuint32mf2_t vs2, vuint32mf2_t vs1,
                                          size_t vl);
vuint32mf2_t __riscv_vdivu_vx_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                          vuint32mf2_t vs2, uint32_t rs1,
                                          size_t vl);
vuint32m1_t __riscv_vdivu_vv_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                        vuint32m1_t vs2, vuint32m1_t vs1,
                                        size_t vl);
vuint32m1_t __riscv_vdivu_vx_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                        vuint32m1_t vs2, uint32_t rs1,
                                        size_t vl);
vuint32m2_t __riscv_vdivu_vv_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                        vuint32m2_t vs2, vuint32m2_t vs1,
                                        size_t vl);
vuint32m2_t __riscv_vdivu_vx_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                        vuint32m2_t vs2, uint32_t rs1,
                                        size_t vl);
vuint32m4_t __riscv_vdivu_vv_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                        vuint32m4_t vs2, vuint32m4_t vs1,
                                        size_t vl);
vuint32m4_t __riscv_vdivu_vx_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                        vuint32m4_t vs2, uint32_t rs1,
                                        size_t vl);
vuint32m8_t __riscv_vdivu_vv_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                        vuint32m8_t vs2, vuint32m8_t vs1,
                                        size_t vl);
vuint32m8_t __riscv_vdivu_vx_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                        vuint32m8_t vs2, uint32_t rs1,
                                        size_t vl);
vuint64m1_t __riscv_vdivu_vv_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                        vuint64m1_t vs2, vuint64m1_t vs1,
                                        size_t vl);
vuint64m1_t __riscv_vdivu_vx_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                        vuint64m1_t vs2, uint64_t rs1,
                                        size_t vl);
vuint64m2_t __riscv_vdivu_vv_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                        vuint64m2_t vs2, vuint64m2_t vs1,
                                        size_t vl);
vuint64m2_t __riscv_vdivu_vx_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                        vuint64m2_t vs2, uint64_t rs1,
                                        size_t vl);
vuint64m4_t __riscv_vdivu_vv_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                        vuint64m4_t vs2, vuint64m4_t vs1,
                                        size_t vl);
vuint64m4_t __riscv_vdivu_vx_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                        vuint64m4_t vs2, uint64_t rs1,
                                        size_t vl);
vuint64m8_t __riscv_vdivu_vv_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                        vuint64m8_t vs2, vuint64m8_t vs1,
                                        size_t vl);
vuint64m8_t __riscv_vdivu_vx_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                        vuint64m8_t vs2, uint64_t rs1,
                                        size_t vl);
vuint8mf8_t __riscv_vremu_vv_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                        vuint8mf8_t vs2, vuint8mf8_t vs1,
                                        size_t vl);
vuint8mf8_t __riscv_vremu_vx_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                        vuint8mf8_t vs2, uint8_t rs1,
                                        size_t vl);
vuint8mf4_t __riscv_vremu_vv_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                        vuint8mf4_t vs2, vuint8mf4_t vs1,
                                        size_t vl);
vuint8mf4_t __riscv_vremu_vx_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                        vuint8mf4_t vs2, uint8_t rs1,
                                        size_t vl);
vuint8mf2_t __riscv_vremu_vv_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                        vuint8mf2_t vs2, vuint8mf2_t vs1,
                                        size_t vl);
vuint8mf2_t __riscv_vremu_vx_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                        vuint8mf2_t vs2, uint8_t rs1,
                                        size_t vl);
vuint8m1_t __riscv_vremu_vv_u8m1_tumu(vbool8_t vm, vuint8m1_t vd,
                                      vuint8m1_t vs2, vuint8m1_t vs1,
                                      size_t vl);
vuint8m1_t __riscv_vremu_vx_u8m1_tumu(vbool8_t vm, vuint8m1_t vd,
                                      vuint8m1_t vs2, uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vremu_vv_u8m2_tumu(vbool4_t vm, vuint8m2_t vd,
                                      vuint8m2_t vs2, vuint8m2_t vs1,
                                      size_t vl);
vuint8m2_t __riscv_vremu_vx_u8m2_tumu(vbool4_t vm, vuint8m2_t vd,
                                      vuint8m2_t vs2, uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vremu_vv_u8m4_tumu(vbool2_t vm, vuint8m4_t vd,
                                      vuint8m4_t vs2, vuint8m4_t vs1,
                                      size_t vl);
vuint8m4_t __riscv_vremu_vx_u8m4_tumu(vbool2_t vm, vuint8m4_t vd,
                                      vuint8m4_t vs2, uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vremu_vv_u8m8_tumu(vbool1_t vm, vuint8m8_t vd,
                                      vuint8m8_t vs2, vuint8m8_t vs1,
                                      size_t vl);
vuint8m8_t __riscv_vremu_vx_u8m8_tumu(vbool1_t vm, vuint8m8_t vd,
                                      vuint8m8_t vs2, uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vremu_vv_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                          vuint16mf4_t vs2, vuint16mf4_t vs1,
                                          size_t vl);
vuint16mf4_t __riscv_vremu_vx_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                          vuint16mf4_t vs2, uint16_t rs1,
                                          size_t vl);
vuint16mf2_t __riscv_vremu_vv_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                          vuint16mf2_t vs2, vuint16mf2_t vs1,
                                          size_t vl);
vuint16mf2_t __riscv_vremu_vx_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                          vuint16mf2_t vs2, uint16_t rs1,
                                          size_t vl);
vuint16m1_t __riscv_vremu_vv_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                        vuint16m1_t vs2, vuint16m1_t vs1,
                                        size_t vl);
vuint16m1_t __riscv_vremu_vx_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                        vuint16m1_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16m2_t __riscv_vremu_vv_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                        vuint16m2_t vs2, vuint16m2_t vs1,
                                        size_t vl);
vuint16m2_t __riscv_vremu_vx_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                        vuint16m2_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16m4_t __riscv_vremu_vv_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                        vuint16m4_t vs2, vuint16m4_t vs1,
                                        size_t vl);
vuint16m4_t __riscv_vremu_vx_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                        vuint16m4_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16m8_t __riscv_vremu_vv_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                        vuint16m8_t vs2, vuint16m8_t vs1,
                                        size_t vl);
vuint16m8_t __riscv_vremu_vx_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                        vuint16m8_t vs2, uint16_t rs1,
                                        size_t vl);
vuint32mf2_t __riscv_vremu_vv_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                          vuint32mf2_t vs2, vuint32mf2_t vs1,
                                          size_t vl);
vuint32mf2_t __riscv_vremu_vx_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                          vuint32mf2_t vs2, uint32_t rs1,
                                          size_t vl);
vuint32m1_t __riscv_vremu_vv_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                        vuint32m1_t vs2, vuint32m1_t vs1,
                                        size_t vl);
vuint32m1_t __riscv_vremu_vx_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                        vuint32m1_t vs2, uint32_t rs1,
                                        size_t vl);
vuint32m2_t __riscv_vremu_vv_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                        vuint32m2_t vs2, vuint32m2_t vs1,
                                        size_t vl);
vuint32m2_t __riscv_vremu_vx_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                        vuint32m2_t vs2, uint32_t rs1,
                                        size_t vl);
vuint32m4_t __riscv_vremu_vv_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                        vuint32m4_t vs2, vuint32m4_t vs1,
                                        size_t vl);
vuint32m4_t __riscv_vremu_vx_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                        vuint32m4_t vs2, uint32_t rs1,
                                        size_t vl);
vuint32m8_t __riscv_vremu_vv_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                        vuint32m8_t vs2, vuint32m8_t vs1,
                                        size_t vl);
vuint32m8_t __riscv_vremu_vx_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                        vuint32m8_t vs2, uint32_t rs1,
                                        size_t vl);
vuint64m1_t __riscv_vremu_vv_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                        vuint64m1_t vs2, vuint64m1_t vs1,
                                        size_t vl);
vuint64m1_t __riscv_vremu_vx_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                        vuint64m1_t vs2, uint64_t rs1,
                                        size_t vl);
vuint64m2_t __riscv_vremu_vv_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                        vuint64m2_t vs2, vuint64m2_t vs1,
                                        size_t vl);
vuint64m2_t __riscv_vremu_vx_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                        vuint64m2_t vs2, uint64_t rs1,
                                        size_t vl);
vuint64m4_t __riscv_vremu_vv_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                        vuint64m4_t vs2, vuint64m4_t vs1,
                                        size_t vl);
vuint64m4_t __riscv_vremu_vx_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                        vuint64m4_t vs2, uint64_t rs1,
                                        size_t vl);
vuint64m8_t __riscv_vremu_vv_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                        vuint64m8_t vs2, vuint64m8_t vs1,
                                        size_t vl);
vuint64m8_t __riscv_vremu_vx_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                        vuint64m8_t vs2, uint64_t rs1,
                                        size_t vl);
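
A minimal usage sketch for the "_tumu" variants above, assuming the standard
<riscv_vector.h> header and the mask-compare intrinsic
__riscv_vmsne_vx_u32m1_b32 from the integer comparison intrinsics: lanes whose
divisor is zero are masked off, so both they and the tail past vl keep the
value already held in the destination operand.

#include <riscv_vector.h>

// Divide num by den element-wise, but only where den is non-zero; all other
// lanes (masked-off and tail) retain dst's previous contents (tumu policy).
vuint32m1_t divide_nonzero_tumu(vuint32m1_t dst, vuint32m1_t num,
                                vuint32m1_t den, size_t vl) {
  vbool32_t nonzero = __riscv_vmsne_vx_u32m1_b32(den, 0, vl);
  return __riscv_vdivu_vv_u32m1_tumu(nonzero, dst, num, den, vl);
}
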
// masked functions
vint8mf8_t __riscv_vdiv_vv_i8mf8_mu(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs2,
                                    vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vdiv_vx_i8mf8_mu(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs2,
                                    int8_t rs1, size_t vl);
vint8mf4_t __riscv_vdiv_vv_i8mf4_mu(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs2,
                                    vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vdiv_vx_i8mf4_mu(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs2,
                                    int8_t rs1, size_t vl);
vint8mf2_t __riscv_vdiv_vv_i8mf2_mu(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs2,
                                    vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vdiv_vx_i8mf2_mu(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs2,
                                    int8_t rs1, size_t vl);
vint8m1_t __riscv_vdiv_vv_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                  vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vdiv_vx_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                  int8_t rs1, size_t vl);
vint8m2_t __riscv_vdiv_vv_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                  vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vdiv_vx_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                  int8_t rs1, size_t vl);
vint8m4_t __riscv_vdiv_vv_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                  vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vdiv_vx_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                  int8_t rs1, size_t vl);
vint8m8_t __riscv_vdiv_vv_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                  vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vdiv_vx_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                  int8_t rs1, size_t vl);
vint16mf4_t __riscv_vdiv_vv_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                      vint16mf4_t vs2, vint16mf4_t vs1,
                                      size_t vl);
vint16mf4_t __riscv_vdiv_vx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                      vint16mf4_t vs2, int16_t rs1, size_t vl);
vint16mf2_t __riscv_vdiv_vv_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                      vint16mf2_t vs2, vint16mf2_t vs1,
                                      size_t vl);
vint16mf2_t __riscv_vdiv_vx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                      vint16mf2_t vs2, int16_t rs1, size_t vl);
vint16m1_t __riscv_vdiv_vv_i16m1_mu(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                                    vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vdiv_vx_i16m1_mu(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                                    int16_t rs1, size_t vl);
vint16m2_t __riscv_vdiv_vv_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                    vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vdiv_vx_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                    int16_t rs1, size_t vl);
vint16m4_t __riscv_vdiv_vv_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                    vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vdiv_vx_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                    int16_t rs1, size_t vl);
vint16m8_t __riscv_vdiv_vv_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                    vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vdiv_vx_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                    int16_t rs1, size_t vl);
vint32mf2_t __riscv_vdiv_vv_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                      vint32mf2_t vs2, vint32mf2_t vs1,
                                      size_t vl);
vint32mf2_t __riscv_vdiv_vx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                      vint32mf2_t vs2, int32_t rs1, size_t vl);
vint32m1_t __riscv_vdiv_vv_i32m1_mu(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                                    vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vdiv_vx_i32m1_mu(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                                    int32_t rs1, size_t vl);
vint32m2_t __riscv_vdiv_vv_i32m2_mu(vbool16_t vm, vint32m2_t vd, vint32m2_t vs2,
                                    vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vdiv_vx_i32m2_mu(vbool16_t vm, vint32m2_t vd, vint32m2_t vs2,
                                    int32_t rs1, size_t vl);
vint32m4_t __riscv_vdiv_vv_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                    vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vdiv_vx_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                    int32_t rs1, size_t vl);
vint32m8_t __riscv_vdiv_vv_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                    vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vdiv_vx_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                    int32_t rs1, size_t vl);
vint64m1_t __riscv_vdiv_vv_i64m1_mu(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                                    vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vdiv_vx_i64m1_mu(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                                    int64_t rs1, size_t vl);
vint64m2_t __riscv_vdiv_vv_i64m2_mu(vbool32_t vm, vint64m2_t vd, vint64m2_t vs2,
                                    vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vdiv_vx_i64m2_mu(vbool32_t vm, vint64m2_t vd, vint64m2_t vs2,
                                    int64_t rs1, size_t vl);
vint64m4_t __riscv_vdiv_vv_i64m4_mu(vbool16_t vm, vint64m4_t vd, vint64m4_t vs2,
                                    vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vdiv_vx_i64m4_mu(vbool16_t vm, vint64m4_t vd, vint64m4_t vs2,
                                    int64_t rs1, size_t vl);
vint64m8_t __riscv_vdiv_vv_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                    vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vdiv_vx_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                    int64_t rs1, size_t vl);
vint8mf8_t __riscv_vrem_vv_i8mf8_mu(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs2,
                                    vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vrem_vx_i8mf8_mu(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs2,
                                    int8_t rs1, size_t vl);
vint8mf4_t __riscv_vrem_vv_i8mf4_mu(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs2,
                                    vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vrem_vx_i8mf4_mu(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs2,
                                    int8_t rs1, size_t vl);
vint8mf2_t __riscv_vrem_vv_i8mf2_mu(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs2,
                                    vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vrem_vx_i8mf2_mu(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs2,
                                    int8_t rs1, size_t vl);
vint8m1_t __riscv_vrem_vv_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                  vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vrem_vx_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                  int8_t rs1, size_t vl);
vint8m2_t __riscv_vrem_vv_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                  vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vrem_vx_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                  int8_t rs1, size_t vl);
vint8m4_t __riscv_vrem_vv_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                  vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vrem_vx_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                  int8_t rs1, size_t vl);
vint8m8_t __riscv_vrem_vv_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                  vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vrem_vx_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                  int8_t rs1, size_t vl);
vint16mf4_t __riscv_vrem_vv_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                      vint16mf4_t vs2, vint16mf4_t vs1,
                                      size_t vl);
vint16mf4_t __riscv_vrem_vx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                      vint16mf4_t vs2, int16_t rs1, size_t vl);
vint16mf2_t __riscv_vrem_vv_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                      vint16mf2_t vs2, vint16mf2_t vs1,
                                      size_t vl);
vint16mf2_t __riscv_vrem_vx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                      vint16mf2_t vs2, int16_t rs1, size_t vl);
vint16m1_t __riscv_vrem_vv_i16m1_mu(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                                    vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vrem_vx_i16m1_mu(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                                    int16_t rs1, size_t vl);
vint16m2_t __riscv_vrem_vv_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                    vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vrem_vx_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                                    int16_t rs1, size_t vl);
vint16m4_t __riscv_vrem_vv_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                    vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vrem_vx_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                                    int16_t rs1, size_t vl);
vint16m8_t __riscv_vrem_vv_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                    vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vrem_vx_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                                    int16_t rs1, size_t vl);
vint32mf2_t __riscv_vrem_vv_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                      vint32mf2_t vs2, vint32mf2_t vs1,
                                      size_t vl);
vint32mf2_t __riscv_vrem_vx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                      vint32mf2_t vs2, int32_t rs1, size_t vl);
vint32m1_t __riscv_vrem_vv_i32m1_mu(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                                    vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vrem_vx_i32m1_mu(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                                    int32_t rs1, size_t vl);
vint32m2_t __riscv_vrem_vv_i32m2_mu(vbool16_t vm, vint32m2_t vd, vint32m2_t vs2,
                                    vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vrem_vx_i32m2_mu(vbool16_t vm, vint32m2_t vd, vint32m2_t vs2,
                                    int32_t rs1, size_t vl);
vint32m4_t __riscv_vrem_vv_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                    vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vrem_vx_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                                    int32_t rs1, size_t vl);
vint32m8_t __riscv_vrem_vv_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                    vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vrem_vx_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                                    int32_t rs1, size_t vl);
vint64m1_t __riscv_vrem_vv_i64m1_mu(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                                    vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vrem_vx_i64m1_mu(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                                    int64_t rs1, size_t vl);
vint64m2_t __riscv_vrem_vv_i64m2_mu(vbool32_t vm, vint64m2_t vd, vint64m2_t vs2,
                                    vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vrem_vx_i64m2_mu(vbool32_t vm, vint64m2_t vd, vint64m2_t vs2,
                                    int64_t rs1, size_t vl);
vint64m4_t __riscv_vrem_vv_i64m4_mu(vbool16_t vm, vint64m4_t vd, vint64m4_t vs2,
                                    vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vrem_vx_i64m4_mu(vbool16_t vm, vint64m4_t vd, vint64m4_t vs2,
                                    int64_t rs1, size_t vl);
vint64m8_t __riscv_vrem_vv_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                    vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vrem_vx_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                                    int64_t rs1, size_t vl);
vuint8mf8_t __riscv_vdivu_vv_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                      vuint8mf8_t vs2, vuint8mf8_t vs1,
                                      size_t vl);
vuint8mf8_t __riscv_vdivu_vx_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                      vuint8mf8_t vs2, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vdivu_vv_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                      vuint8mf4_t vs2, vuint8mf4_t vs1,
                                      size_t vl);
vuint8mf4_t __riscv_vdivu_vx_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                      vuint8mf4_t vs2, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vdivu_vv_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                      vuint8mf2_t vs2, vuint8mf2_t vs1,
                                      size_t vl);
vuint8mf2_t __riscv_vdivu_vx_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                      vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vdivu_vv_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                    vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vdivu_vx_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vdivu_vv_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                    vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vdivu_vx_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vdivu_vv_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                    vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vdivu_vx_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vdivu_vv_u8m8_mu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                    vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vdivu_vx_u8m8_mu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                    uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vdivu_vv_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                        vuint16mf4_t vs2, vuint16mf4_t vs1,
                                        size_t vl);
vuint16mf4_t __riscv_vdivu_vx_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                        vuint16mf4_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16mf2_t __riscv_vdivu_vv_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                        vuint16mf2_t vs2, vuint16mf2_t vs1,
                                        size_t vl);
vuint16mf2_t __riscv_vdivu_vx_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                        vuint16mf2_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16m1_t __riscv_vdivu_vv_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                      vuint16m1_t vs2, vuint16m1_t vs1,
                                      size_t vl);
vuint16m1_t __riscv_vdivu_vx_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                      vuint16m1_t vs2, uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vdivu_vv_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                      vuint16m2_t vs2, vuint16m2_t vs1,
                                      size_t vl);
vuint16m2_t __riscv_vdivu_vx_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                      vuint16m2_t vs2, uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vdivu_vv_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                      vuint16m4_t vs2, vuint16m4_t vs1,
                                      size_t vl);
vuint16m4_t __riscv_vdivu_vx_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                      vuint16m4_t vs2, uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vdivu_vv_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                      vuint16m8_t vs2, vuint16m8_t vs1,
                                      size_t vl);
vuint16m8_t __riscv_vdivu_vx_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                      vuint16m8_t vs2, uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vdivu_vv_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                        vuint32mf2_t vs2, vuint32mf2_t vs1,
                                        size_t vl);
vuint32mf2_t __riscv_vdivu_vx_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                        vuint32mf2_t vs2, uint32_t rs1,
                                        size_t vl);
vuint32m1_t __riscv_vdivu_vv_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                      vuint32m1_t vs2, vuint32m1_t vs1,
                                      size_t vl);
vuint32m1_t __riscv_vdivu_vx_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                      vuint32m1_t vs2, uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vdivu_vv_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                      vuint32m2_t vs2, vuint32m2_t vs1,
                                      size_t vl);
vuint32m2_t __riscv_vdivu_vx_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                      vuint32m2_t vs2, uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vdivu_vv_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                      vuint32m4_t vs2, vuint32m4_t vs1,
                                      size_t vl);
vuint32m4_t __riscv_vdivu_vx_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                      vuint32m4_t vs2, uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vdivu_vv_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                      vuint32m8_t vs2, vuint32m8_t vs1,
                                      size_t vl);
vuint32m8_t __riscv_vdivu_vx_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                      vuint32m8_t vs2, uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vdivu_vv_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                      vuint64m1_t vs2, vuint64m1_t vs1,
                                      size_t vl);
vuint64m1_t __riscv_vdivu_vx_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                      vuint64m1_t vs2, uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vdivu_vv_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                      vuint64m2_t vs2, vuint64m2_t vs1,
                                      size_t vl);
vuint64m2_t __riscv_vdivu_vx_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                      vuint64m2_t vs2, uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vdivu_vv_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                      vuint64m4_t vs2, vuint64m4_t vs1,
                                      size_t vl);
vuint64m4_t __riscv_vdivu_vx_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                      vuint64m4_t vs2, uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vdivu_vv_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                      vuint64m8_t vs2, vuint64m8_t vs1,
                                      size_t vl);
vuint64m8_t __riscv_vdivu_vx_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                      vuint64m8_t vs2, uint64_t rs1, size_t vl);
vuint8mf8_t __riscv_vremu_vv_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                      vuint8mf8_t vs2, vuint8mf8_t vs1,
                                      size_t vl);
vuint8mf8_t __riscv_vremu_vx_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                      vuint8mf8_t vs2, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vremu_vv_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                      vuint8mf4_t vs2, vuint8mf4_t vs1,
                                      size_t vl);
vuint8mf4_t __riscv_vremu_vx_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                      vuint8mf4_t vs2, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vremu_vv_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                      vuint8mf2_t vs2, vuint8mf2_t vs1,
                                      size_t vl);
vuint8mf2_t __riscv_vremu_vx_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                      vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vremu_vv_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                    vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vremu_vx_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vremu_vv_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                    vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vremu_vx_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vremu_vv_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                    vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vremu_vx_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                                    uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vremu_vv_u8m8_mu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                    vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vremu_vx_u8m8_mu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                                    uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vremu_vv_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                        vuint16mf4_t vs2, vuint16mf4_t vs1,
                                        size_t vl);
vuint16mf4_t __riscv_vremu_vx_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                        vuint16mf4_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16mf2_t __riscv_vremu_vv_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                        vuint16mf2_t vs2, vuint16mf2_t vs1,
                                        size_t vl);
vuint16mf2_t __riscv_vremu_vx_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                        vuint16mf2_t vs2, uint16_t rs1,
                                        size_t vl);
vuint16m1_t __riscv_vremu_vv_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                      vuint16m1_t vs2, vuint16m1_t vs1,
                                      size_t vl);
vuint16m1_t __riscv_vremu_vx_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                      vuint16m1_t vs2, uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vremu_vv_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                      vuint16m2_t vs2, vuint16m2_t vs1,
                                      size_t vl);
vuint16m2_t __riscv_vremu_vx_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                      vuint16m2_t vs2, uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vremu_vv_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                      vuint16m4_t vs2, vuint16m4_t vs1,
                                      size_t vl);
vuint16m4_t __riscv_vremu_vx_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                      vuint16m4_t vs2, uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vremu_vv_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                      vuint16m8_t vs2, vuint16m8_t vs1,
                                      size_t vl);
vuint16m8_t __riscv_vremu_vx_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                      vuint16m8_t vs2, uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vremu_vv_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                        vuint32mf2_t vs2, vuint32mf2_t vs1,
                                        size_t vl);
vuint32mf2_t __riscv_vremu_vx_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                        vuint32mf2_t vs2, uint32_t rs1,
                                        size_t vl);
vuint32m1_t __riscv_vremu_vv_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                      vuint32m1_t vs2, vuint32m1_t vs1,
                                      size_t vl);
vuint32m1_t __riscv_vremu_vx_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                      vuint32m1_t vs2, uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vremu_vv_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                      vuint32m2_t vs2, vuint32m2_t vs1,
                                      size_t vl);
vuint32m2_t __riscv_vremu_vx_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                      vuint32m2_t vs2, uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vremu_vv_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                      vuint32m4_t vs2, vuint32m4_t vs1,
                                      size_t vl);
vuint32m4_t __riscv_vremu_vx_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                      vuint32m4_t vs2, uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vremu_vv_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                      vuint32m8_t vs2, vuint32m8_t vs1,
                                      size_t vl);
vuint32m8_t __riscv_vremu_vx_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                      vuint32m8_t vs2, uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vremu_vv_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                      vuint64m1_t vs2, vuint64m1_t vs1,
                                      size_t vl);
vuint64m1_t __riscv_vremu_vx_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                      vuint64m1_t vs2, uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vremu_vv_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                      vuint64m2_t vs2, vuint64m2_t vs1,
                                      size_t vl);
vuint64m2_t __riscv_vremu_vx_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                      vuint64m2_t vs2, uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vremu_vv_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                      vuint64m4_t vs2, vuint64m4_t vs1,
                                      size_t vl);
vuint64m4_t __riscv_vremu_vx_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                      vuint64m4_t vs2, uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vremu_vv_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                      vuint64m8_t vs2, vuint64m8_t vs1,
                                      size_t vl);
vuint64m8_t __riscv_vremu_vx_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                      vuint64m8_t vs2, uint64_t rs1, size_t vl);
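
As a minimal sketch of the "_mu" (mask-undisturbed) variants above, assuming
only <riscv_vector.h>: the remainder is computed for active lanes, masked-off
lanes keep the old destination value, and the tail follows the default
tail-agnostic policy.

#include <riscv_vector.h>

// Signed remainder by a scalar, written only where the mask is set.
vint32m1_t rem_where_valid_mu(vbool32_t valid, vint32m1_t old, vint32m1_t a,
                              int32_t b, size_t vl) {
  return __riscv_vrem_vx_i32m1_mu(valid, old, a, b, vl);
}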

Vector Widening Integer Multiply Intrinsics
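
A minimal sketch (assuming <riscv_vector.h>) of the tail-undisturbed widening
multiply intrinsics listed below: the element width doubles (SEW 8 to 16) and
the register group doubles (m1 to m2) in the result, while elements past vl
keep vd's previous contents.

#include <riscv_vector.h>

// Full-precision 8 x 8 -> 16-bit signed product; tail elements of vd preserved.
vint16m2_t widen_mul_keep_tail(vint16m2_t vd, vint8m1_t a, vint8m1_t b,
                               size_t vl) {
  return __riscv_vwmul_vv_i16m2_tu(vd, a, b, vl);
}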

vint16mf4_t __riscv_vwmul_vv_i16mf4_tu(vint16mf4_t vd, vint8mf8_t vs2,
                                       vint8mf8_t vs1, size_t vl);
vint16mf4_t __riscv_vwmul_vx_i16mf4_tu(vint16mf4_t vd, vint8mf8_t vs2,
                                       int8_t rs1, size_t vl);
vint16mf2_t __riscv_vwmul_vv_i16mf2_tu(vint16mf2_t vd, vint8mf4_t vs2,
                                       vint8mf4_t vs1, size_t vl);
vint16mf2_t __riscv_vwmul_vx_i16mf2_tu(vint16mf2_t vd, vint8mf4_t vs2,
                                       int8_t rs1, size_t vl);
vint16m1_t __riscv_vwmul_vv_i16m1_tu(vint16m1_t vd, vint8mf2_t vs2,
                                     vint8mf2_t vs1, size_t vl);
vint16m1_t __riscv_vwmul_vx_i16m1_tu(vint16m1_t vd, vint8mf2_t vs2, int8_t rs1,
                                     size_t vl);
vint16m2_t __riscv_vwmul_vv_i16m2_tu(vint16m2_t vd, vint8m1_t vs2,
                                     vint8m1_t vs1, size_t vl);
vint16m2_t __riscv_vwmul_vx_i16m2_tu(vint16m2_t vd, vint8m1_t vs2, int8_t rs1,
                                     size_t vl);
vint16m4_t __riscv_vwmul_vv_i16m4_tu(vint16m4_t vd, vint8m2_t vs2,
                                     vint8m2_t vs1, size_t vl);
vint16m4_t __riscv_vwmul_vx_i16m4_tu(vint16m4_t vd, vint8m2_t vs2, int8_t rs1,
                                     size_t vl);
vint16m8_t __riscv_vwmul_vv_i16m8_tu(vint16m8_t vd, vint8m4_t vs2,
                                     vint8m4_t vs1, size_t vl);
vint16m8_t __riscv_vwmul_vx_i16m8_tu(vint16m8_t vd, vint8m4_t vs2, int8_t rs1,
                                     size_t vl);
vint32mf2_t __riscv_vwmul_vv_i32mf2_tu(vint32mf2_t vd, vint16mf4_t vs2,
                                       vint16mf4_t vs1, size_t vl);
vint32mf2_t __riscv_vwmul_vx_i32mf2_tu(vint32mf2_t vd, vint16mf4_t vs2,
                                       int16_t rs1, size_t vl);
vint32m1_t __riscv_vwmul_vv_i32m1_tu(vint32m1_t vd, vint16mf2_t vs2,
                                     vint16mf2_t vs1, size_t vl);
vint32m1_t __riscv_vwmul_vx_i32m1_tu(vint32m1_t vd, vint16mf2_t vs2,
                                     int16_t rs1, size_t vl);
vint32m2_t __riscv_vwmul_vv_i32m2_tu(vint32m2_t vd, vint16m1_t vs2,
                                     vint16m1_t vs1, size_t vl);
vint32m2_t __riscv_vwmul_vx_i32m2_tu(vint32m2_t vd, vint16m1_t vs2, int16_t rs1,
                                     size_t vl);
vint32m4_t __riscv_vwmul_vv_i32m4_tu(vint32m4_t vd, vint16m2_t vs2,
                                     vint16m2_t vs1, size_t vl);
vint32m4_t __riscv_vwmul_vx_i32m4_tu(vint32m4_t vd, vint16m2_t vs2, int16_t rs1,
                                     size_t vl);
vint32m8_t __riscv_vwmul_vv_i32m8_tu(vint32m8_t vd, vint16m4_t vs2,
                                     vint16m4_t vs1, size_t vl);
vint32m8_t __riscv_vwmul_vx_i32m8_tu(vint32m8_t vd, vint16m4_t vs2, int16_t rs1,
                                     size_t vl);
vint64m1_t __riscv_vwmul_vv_i64m1_tu(vint64m1_t vd, vint32mf2_t vs2,
                                     vint32mf2_t vs1, size_t vl);
vint64m1_t __riscv_vwmul_vx_i64m1_tu(vint64m1_t vd, vint32mf2_t vs2,
                                     int32_t rs1, size_t vl);
vint64m2_t __riscv_vwmul_vv_i64m2_tu(vint64m2_t vd, vint32m1_t vs2,
                                     vint32m1_t vs1, size_t vl);
vint64m2_t __riscv_vwmul_vx_i64m2_tu(vint64m2_t vd, vint32m1_t vs2, int32_t rs1,
                                     size_t vl);
vint64m4_t __riscv_vwmul_vv_i64m4_tu(vint64m4_t vd, vint32m2_t vs2,
                                     vint32m2_t vs1, size_t vl);
vint64m4_t __riscv_vwmul_vx_i64m4_tu(vint64m4_t vd, vint32m2_t vs2, int32_t rs1,
                                     size_t vl);
vint64m8_t __riscv_vwmul_vv_i64m8_tu(vint64m8_t vd, vint32m4_t vs2,
                                     vint32m4_t vs1, size_t vl);
vint64m8_t __riscv_vwmul_vx_i64m8_tu(vint64m8_t vd, vint32m4_t vs2, int32_t rs1,
                                     size_t vl);
vint16mf4_t __riscv_vwmulsu_vv_i16mf4_tu(vint16mf4_t vd, vint8mf8_t vs2,
                                         vuint8mf8_t vs1, size_t vl);
vint16mf4_t __riscv_vwmulsu_vx_i16mf4_tu(vint16mf4_t vd, vint8mf8_t vs2,
                                         uint8_t rs1, size_t vl);
vint16mf2_t __riscv_vwmulsu_vv_i16mf2_tu(vint16mf2_t vd, vint8mf4_t vs2,
                                         vuint8mf4_t vs1, size_t vl);
vint16mf2_t __riscv_vwmulsu_vx_i16mf2_tu(vint16mf2_t vd, vint8mf4_t vs2,
                                         uint8_t rs1, size_t vl);
vint16m1_t __riscv_vwmulsu_vv_i16m1_tu(vint16m1_t vd, vint8mf2_t vs2,
                                       vuint8mf2_t vs1, size_t vl);
vint16m1_t __riscv_vwmulsu_vx_i16m1_tu(vint16m1_t vd, vint8mf2_t vs2,
                                       uint8_t rs1, size_t vl);
vint16m2_t __riscv_vwmulsu_vv_i16m2_tu(vint16m2_t vd, vint8m1_t vs2,
                                       vuint8m1_t vs1, size_t vl);
vint16m2_t __riscv_vwmulsu_vx_i16m2_tu(vint16m2_t vd, vint8m1_t vs2,
                                       uint8_t rs1, size_t vl);
vint16m4_t __riscv_vwmulsu_vv_i16m4_tu(vint16m4_t vd, vint8m2_t vs2,
                                       vuint8m2_t vs1, size_t vl);
vint16m4_t __riscv_vwmulsu_vx_i16m4_tu(vint16m4_t vd, vint8m2_t vs2,
                                       uint8_t rs1, size_t vl);
vint16m8_t __riscv_vwmulsu_vv_i16m8_tu(vint16m8_t vd, vint8m4_t vs2,
                                       vuint8m4_t vs1, size_t vl);
vint16m8_t __riscv_vwmulsu_vx_i16m8_tu(vint16m8_t vd, vint8m4_t vs2,
                                       uint8_t rs1, size_t vl);
vint32mf2_t __riscv_vwmulsu_vv_i32mf2_tu(vint32mf2_t vd, vint16mf4_t vs2,
                                         vuint16mf4_t vs1, size_t vl);
vint32mf2_t __riscv_vwmulsu_vx_i32mf2_tu(vint32mf2_t vd, vint16mf4_t vs2,
                                         uint16_t rs1, size_t vl);
vint32m1_t __riscv_vwmulsu_vv_i32m1_tu(vint32m1_t vd, vint16mf2_t vs2,
                                       vuint16mf2_t vs1, size_t vl);
vint32m1_t __riscv_vwmulsu_vx_i32m1_tu(vint32m1_t vd, vint16mf2_t vs2,
                                       uint16_t rs1, size_t vl);
vint32m2_t __riscv_vwmulsu_vv_i32m2_tu(vint32m2_t vd, vint16m1_t vs2,
                                       vuint16m1_t vs1, size_t vl);
vint32m2_t __riscv_vwmulsu_vx_i32m2_tu(vint32m2_t vd, vint16m1_t vs2,
                                       uint16_t rs1, size_t vl);
vint32m4_t __riscv_vwmulsu_vv_i32m4_tu(vint32m4_t vd, vint16m2_t vs2,
                                       vuint16m2_t vs1, size_t vl);
vint32m4_t __riscv_vwmulsu_vx_i32m4_tu(vint32m4_t vd, vint16m2_t vs2,
                                       uint16_t rs1, size_t vl);
vint32m8_t __riscv_vwmulsu_vv_i32m8_tu(vint32m8_t vd, vint16m4_t vs2,
                                       vuint16m4_t vs1, size_t vl);
vint32m8_t __riscv_vwmulsu_vx_i32m8_tu(vint32m8_t vd, vint16m4_t vs2,
                                       uint16_t rs1, size_t vl);
vint64m1_t __riscv_vwmulsu_vv_i64m1_tu(vint64m1_t vd, vint32mf2_t vs2,
                                       vuint32mf2_t vs1, size_t vl);
vint64m1_t __riscv_vwmulsu_vx_i64m1_tu(vint64m1_t vd, vint32mf2_t vs2,
                                       uint32_t rs1, size_t vl);
vint64m2_t __riscv_vwmulsu_vv_i64m2_tu(vint64m2_t vd, vint32m1_t vs2,
                                       vuint32m1_t vs1, size_t vl);
vint64m2_t __riscv_vwmulsu_vx_i64m2_tu(vint64m2_t vd, vint32m1_t vs2,
                                       uint32_t rs1, size_t vl);
vint64m4_t __riscv_vwmulsu_vv_i64m4_tu(vint64m4_t vd, vint32m2_t vs2,
                                       vuint32m2_t vs1, size_t vl);
vint64m4_t __riscv_vwmulsu_vx_i64m4_tu(vint64m4_t vd, vint32m2_t vs2,
                                       uint32_t rs1, size_t vl);
vint64m8_t __riscv_vwmulsu_vv_i64m8_tu(vint64m8_t vd, vint32m4_t vs2,
                                       vuint32m4_t vs1, size_t vl);
vint64m8_t __riscv_vwmulsu_vx_i64m8_tu(vint64m8_t vd, vint32m4_t vs2,
                                       uint32_t rs1, size_t vl);
vuint16mf4_t __riscv_vwmulu_vv_u16mf4_tu(vuint16mf4_t vd, vuint8mf8_t vs2,
                                         vuint8mf8_t vs1, size_t vl);
vuint16mf4_t __riscv_vwmulu_vx_u16mf4_tu(vuint16mf4_t vd, vuint8mf8_t vs2,
                                         uint8_t rs1, size_t vl);
vuint16mf2_t __riscv_vwmulu_vv_u16mf2_tu(vuint16mf2_t vd, vuint8mf4_t vs2,
                                         vuint8mf4_t vs1, size_t vl);
vuint16mf2_t __riscv_vwmulu_vx_u16mf2_tu(vuint16mf2_t vd, vuint8mf4_t vs2,
                                         uint8_t rs1, size_t vl);
vuint16m1_t __riscv_vwmulu_vv_u16m1_tu(vuint16m1_t vd, vuint8mf2_t vs2,
                                       vuint8mf2_t vs1, size_t vl);
vuint16m1_t __riscv_vwmulu_vx_u16m1_tu(vuint16m1_t vd, vuint8mf2_t vs2,
                                       uint8_t rs1, size_t vl);
vuint16m2_t __riscv_vwmulu_vv_u16m2_tu(vuint16m2_t vd, vuint8m1_t vs2,
                                       vuint8m1_t vs1, size_t vl);
vuint16m2_t __riscv_vwmulu_vx_u16m2_tu(vuint16m2_t vd, vuint8m1_t vs2,
                                       uint8_t rs1, size_t vl);
vuint16m4_t __riscv_vwmulu_vv_u16m4_tu(vuint16m4_t vd, vuint8m2_t vs2,
                                       vuint8m2_t vs1, size_t vl);
vuint16m4_t __riscv_vwmulu_vx_u16m4_tu(vuint16m4_t vd, vuint8m2_t vs2,
                                       uint8_t rs1, size_t vl);
vuint16m8_t __riscv_vwmulu_vv_u16m8_tu(vuint16m8_t vd, vuint8m4_t vs2,
                                       vuint8m4_t vs1, size_t vl);
vuint16m8_t __riscv_vwmulu_vx_u16m8_tu(vuint16m8_t vd, vuint8m4_t vs2,
                                       uint8_t rs1, size_t vl);
vuint32mf2_t __riscv_vwmulu_vv_u32mf2_tu(vuint32mf2_t vd, vuint16mf4_t vs2,
                                         vuint16mf4_t vs1, size_t vl);
vuint32mf2_t __riscv_vwmulu_vx_u32mf2_tu(vuint32mf2_t vd, vuint16mf4_t vs2,
                                         uint16_t rs1, size_t vl);
vuint32m1_t __riscv_vwmulu_vv_u32m1_tu(vuint32m1_t vd, vuint16mf2_t vs2,
                                       vuint16mf2_t vs1, size_t vl);
vuint32m1_t __riscv_vwmulu_vx_u32m1_tu(vuint32m1_t vd, vuint16mf2_t vs2,
                                       uint16_t rs1, size_t vl);
vuint32m2_t __riscv_vwmulu_vv_u32m2_tu(vuint32m2_t vd, vuint16m1_t vs2,
                                       vuint16m1_t vs1, size_t vl);
vuint32m2_t __riscv_vwmulu_vx_u32m2_tu(vuint32m2_t vd, vuint16m1_t vs2,
                                       uint16_t rs1, size_t vl);
vuint32m4_t __riscv_vwmulu_vv_u32m4_tu(vuint32m4_t vd, vuint16m2_t vs2,
                                       vuint16m2_t vs1, size_t vl);
vuint32m4_t __riscv_vwmulu_vx_u32m4_tu(vuint32m4_t vd, vuint16m2_t vs2,
                                       uint16_t rs1, size_t vl);
vuint32m8_t __riscv_vwmulu_vv_u32m8_tu(vuint32m8_t vd, vuint16m4_t vs2,
                                       vuint16m4_t vs1, size_t vl);
vuint32m8_t __riscv_vwmulu_vx_u32m8_tu(vuint32m8_t vd, vuint16m4_t vs2,
                                       uint16_t rs1, size_t vl);
vuint64m1_t __riscv_vwmulu_vv_u64m1_tu(vuint64m1_t vd, vuint32mf2_t vs2,
                                       vuint32mf2_t vs1, size_t vl);
vuint64m1_t __riscv_vwmulu_vx_u64m1_tu(vuint64m1_t vd, vuint32mf2_t vs2,
                                       uint32_t rs1, size_t vl);
vuint64m2_t __riscv_vwmulu_vv_u64m2_tu(vuint64m2_t vd, vuint32m1_t vs2,
                                       vuint32m1_t vs1, size_t vl);
vuint64m2_t __riscv_vwmulu_vx_u64m2_tu(vuint64m2_t vd, vuint32m1_t vs2,
                                       uint32_t rs1, size_t vl);
vuint64m4_t __riscv_vwmulu_vv_u64m4_tu(vuint64m4_t vd, vuint32m2_t vs2,
                                       vuint32m2_t vs1, size_t vl);
vuint64m4_t __riscv_vwmulu_vx_u64m4_tu(vuint64m4_t vd, vuint32m2_t vs2,
                                       uint32_t rs1, size_t vl);
vuint64m8_t __riscv_vwmulu_vv_u64m8_tu(vuint64m8_t vd, vuint32m4_t vs2,
                                       vuint32m4_t vs1, size_t vl);
vuint64m8_t __riscv_vwmulu_vx_u64m8_tu(vuint64m8_t vd, vuint32m4_t vs2,
                                       uint32_t rs1, size_t vl);
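
The three flavours above differ only in operand signedness: vwmul is signed x
signed, vwmulsu is signed x unsigned, and vwmulu is unsigned x unsigned. A
minimal sketch (assuming <riscv_vector.h>) of the signed-by-unsigned form with
a scalar operand:

#include <riscv_vector.h>

// Multiply signed 16-bit elements by an unsigned 16-bit scalar, producing a
// signed 32-bit result at doubled LMUL; tail elements of vd are preserved.
vint32m2_t scale_signed_by_unsigned_tu(vint32m2_t vd, vint16m1_t a, uint16_t s,
                                       size_t vl) {
  return __riscv_vwmulsu_vx_i32m2_tu(vd, a, s, vl);
}
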
// masked functions
vint16mf4_t __riscv_vwmul_vv_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                        vint8mf8_t vs2, vint8mf8_t vs1,
                                        size_t vl);
vint16mf4_t __riscv_vwmul_vx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                        vint8mf8_t vs2, int8_t rs1, size_t vl);
vint16mf2_t __riscv_vwmul_vv_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                        vint8mf4_t vs2, vint8mf4_t vs1,
                                        size_t vl);
vint16mf2_t __riscv_vwmul_vx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                        vint8mf4_t vs2, int8_t rs1, size_t vl);
vint16m1_t __riscv_vwmul_vv_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                      vint8mf2_t vs2, vint8mf2_t vs1,
                                      size_t vl);
vint16m1_t __riscv_vwmul_vx_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                      vint8mf2_t vs2, int8_t rs1, size_t vl);
vint16m2_t __riscv_vwmul_vv_i16m2_tum(vbool8_t vm, vint16m2_t vd, vint8m1_t vs2,
                                      vint8m1_t vs1, size_t vl);
vint16m2_t __riscv_vwmul_vx_i16m2_tum(vbool8_t vm, vint16m2_t vd, vint8m1_t vs2,
                                      int8_t rs1, size_t vl);
vint16m4_t __riscv_vwmul_vv_i16m4_tum(vbool4_t vm, vint16m4_t vd, vint8m2_t vs2,
                                      vint8m2_t vs1, size_t vl);
vint16m4_t __riscv_vwmul_vx_i16m4_tum(vbool4_t vm, vint16m4_t vd, vint8m2_t vs2,
                                      int8_t rs1, size_t vl);
vint16m8_t __riscv_vwmul_vv_i16m8_tum(vbool2_t vm, vint16m8_t vd, vint8m4_t vs2,
                                      vint8m4_t vs1, size_t vl);
vint16m8_t __riscv_vwmul_vx_i16m8_tum(vbool2_t vm, vint16m8_t vd, vint8m4_t vs2,
                                      int8_t rs1, size_t vl);
vint32mf2_t __riscv_vwmul_vv_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                        vint16mf4_t vs2, vint16mf4_t vs1,
                                        size_t vl);
vint32mf2_t __riscv_vwmul_vx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                        vint16mf4_t vs2, int16_t rs1,
                                        size_t vl);
vint32m1_t __riscv_vwmul_vv_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                      vint16mf2_t vs2, vint16mf2_t vs1,
                                      size_t vl);
vint32m1_t __riscv_vwmul_vx_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                      vint16mf2_t vs2, int16_t rs1, size_t vl);
vint32m2_t __riscv_vwmul_vv_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                      vint16m1_t vs2, vint16m1_t vs1,
                                      size_t vl);
vint32m2_t __riscv_vwmul_vx_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                      vint16m1_t vs2, int16_t rs1, size_t vl);
vint32m4_t __riscv_vwmul_vv_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                      vint16m2_t vs2, vint16m2_t vs1,
                                      size_t vl);
vint32m4_t __riscv_vwmul_vx_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                      vint16m2_t vs2, int16_t rs1, size_t vl);
vint32m8_t __riscv_vwmul_vv_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                      vint16m4_t vs2, vint16m4_t vs1,
                                      size_t vl);
vint32m8_t __riscv_vwmul_vx_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                      vint16m4_t vs2, int16_t rs1, size_t vl);
vint64m1_t __riscv_vwmul_vv_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                      vint32mf2_t vs2, vint32mf2_t vs1,
                                      size_t vl);
vint64m1_t __riscv_vwmul_vx_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                      vint32mf2_t vs2, int32_t rs1, size_t vl);
vint64m2_t __riscv_vwmul_vv_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                      vint32m1_t vs2, vint32m1_t vs1,
                                      size_t vl);
vint64m2_t __riscv_vwmul_vx_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                      vint32m1_t vs2, int32_t rs1, size_t vl);
vint64m4_t __riscv_vwmul_vv_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                      vint32m2_t vs2, vint32m2_t vs1,
                                      size_t vl);
vint64m4_t __riscv_vwmul_vx_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                      vint32m2_t vs2, int32_t rs1, size_t vl);
vint64m8_t __riscv_vwmul_vv_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                      vint32m4_t vs2, vint32m4_t vs1,
                                      size_t vl);
vint64m8_t __riscv_vwmul_vx_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                      vint32m4_t vs2, int32_t rs1, size_t vl);
vint16mf4_t __riscv_vwmulsu_vv_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                          vint8mf8_t vs2, vuint8mf8_t vs1,
                                          size_t vl);
vint16mf4_t __riscv_vwmulsu_vx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                          vint8mf8_t vs2, uint8_t rs1,
                                          size_t vl);
vint16mf2_t __riscv_vwmulsu_vv_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                          vint8mf4_t vs2, vuint8mf4_t vs1,
                                          size_t vl);
vint16mf2_t __riscv_vwmulsu_vx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                          vint8mf4_t vs2, uint8_t rs1,
                                          size_t vl);
vint16m1_t __riscv_vwmulsu_vv_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                        vint8mf2_t vs2, vuint8mf2_t vs1,
                                        size_t vl);
vint16m1_t __riscv_vwmulsu_vx_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                        vint8mf2_t vs2, uint8_t rs1, size_t vl);
vint16m2_t __riscv_vwmulsu_vv_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                        vint8m1_t vs2, vuint8m1_t vs1,
                                        size_t vl);
vint16m2_t __riscv_vwmulsu_vx_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                        vint8m1_t vs2, uint8_t rs1, size_t vl);
vint16m4_t __riscv_vwmulsu_vv_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                        vint8m2_t vs2, vuint8m2_t vs1,
                                        size_t vl);
vint16m4_t __riscv_vwmulsu_vx_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                        vint8m2_t vs2, uint8_t rs1, size_t vl);
vint16m8_t __riscv_vwmulsu_vv_i16m8_tum(vbool2_t vm, vint16m8_t vd,
                                        vint8m4_t vs2, vuint8m4_t vs1,
                                        size_t vl);
vint16m8_t __riscv_vwmulsu_vx_i16m8_tum(vbool2_t vm, vint16m8_t vd,
                                        vint8m4_t vs2, uint8_t rs1, size_t vl);
vint32mf2_t __riscv_vwmulsu_vv_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                          vint16mf4_t vs2, vuint16mf4_t vs1,
                                          size_t vl);
vint32mf2_t __riscv_vwmulsu_vx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                          vint16mf4_t vs2, uint16_t rs1,
                                          size_t vl);
vint32m1_t __riscv_vwmulsu_vv_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                        vint16mf2_t vs2, vuint16mf2_t vs1,
                                        size_t vl);
vint32m1_t __riscv_vwmulsu_vx_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                        vint16mf2_t vs2, uint16_t rs1,
                                        size_t vl);
vint32m2_t __riscv_vwmulsu_vv_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                        vint16m1_t vs2, vuint16m1_t vs1,
                                        size_t vl);
vint32m2_t __riscv_vwmulsu_vx_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                        vint16m1_t vs2, uint16_t rs1,
                                        size_t vl);
vint32m4_t __riscv_vwmulsu_vv_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                        vint16m2_t vs2, vuint16m2_t vs1,
                                        size_t vl);
vint32m4_t __riscv_vwmulsu_vx_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                        vint16m2_t vs2, uint16_t rs1,
                                        size_t vl);
vint32m8_t __riscv_vwmulsu_vv_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                        vint16m4_t vs2, vuint16m4_t vs1,
                                        size_t vl);
vint32m8_t __riscv_vwmulsu_vx_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                        vint16m4_t vs2, uint16_t rs1,
                                        size_t vl);
vint64m1_t __riscv_vwmulsu_vv_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                        vint32mf2_t vs2, vuint32mf2_t vs1,
                                        size_t vl);
vint64m1_t __riscv_vwmulsu_vx_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                        vint32mf2_t vs2, uint32_t rs1,
                                        size_t vl);
vint64m2_t __riscv_vwmulsu_vv_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                        vint32m1_t vs2, vuint32m1_t vs1,
                                        size_t vl);
vint64m2_t __riscv_vwmulsu_vx_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                        vint32m1_t vs2, uint32_t rs1,
                                        size_t vl);
vint64m4_t __riscv_vwmulsu_vv_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                        vint32m2_t vs2, vuint32m2_t vs1,
                                        size_t vl);
vint64m4_t __riscv_vwmulsu_vx_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                        vint32m2_t vs2, uint32_t rs1,
                                        size_t vl);
vint64m8_t __riscv_vwmulsu_vv_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                        vint32m4_t vs2, vuint32m4_t vs1,
                                        size_t vl);
vint64m8_t __riscv_vwmulsu_vx_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                        vint32m4_t vs2, uint32_t rs1,
                                        size_t vl);
vuint16mf4_t __riscv_vwmulu_vv_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                          vuint8mf8_t vs2, vuint8mf8_t vs1,
                                          size_t vl);
vuint16mf4_t __riscv_vwmulu_vx_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                          vuint8mf8_t vs2, uint8_t rs1,
                                          size_t vl);
vuint16mf2_t __riscv_vwmulu_vv_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                          vuint8mf4_t vs2, vuint8mf4_t vs1,
                                          size_t vl);
vuint16mf2_t __riscv_vwmulu_vx_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                          vuint8mf4_t vs2, uint8_t rs1,
                                          size_t vl);
vuint16m1_t __riscv_vwmulu_vv_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                        vuint8mf2_t vs2, vuint8mf2_t vs1,
                                        size_t vl);
vuint16m1_t __riscv_vwmulu_vx_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                        vuint8mf2_t vs2, uint8_t rs1,
                                        size_t vl);
vuint16m2_t __riscv_vwmulu_vv_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                        vuint8m1_t vs2, vuint8m1_t vs1,
                                        size_t vl);
vuint16m2_t __riscv_vwmulu_vx_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                        vuint8m1_t vs2, uint8_t rs1, size_t vl);
vuint16m4_t __riscv_vwmulu_vv_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                        vuint8m2_t vs2, vuint8m2_t vs1,
                                        size_t vl);
vuint16m4_t __riscv_vwmulu_vx_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                        vuint8m2_t vs2, uint8_t rs1, size_t vl);
vuint16m8_t __riscv_vwmulu_vv_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                        vuint8m4_t vs2, vuint8m4_t vs1,
                                        size_t vl);
vuint16m8_t __riscv_vwmulu_vx_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                        vuint8m4_t vs2, uint8_t rs1, size_t vl);
vuint32mf2_t __riscv_vwmulu_vv_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                          vuint16mf4_t vs2, vuint16mf4_t vs1,
                                          size_t vl);
vuint32mf2_t __riscv_vwmulu_vx_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                          vuint16mf4_t vs2, uint16_t rs1,
                                          size_t vl);
vuint32m1_t __riscv_vwmulu_vv_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                        vuint16mf2_t vs2, vuint16mf2_t vs1,
                                        size_t vl);
vuint32m1_t __riscv_vwmulu_vx_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                        vuint16mf2_t vs2, uint16_t rs1,
                                        size_t vl);
vuint32m2_t __riscv_vwmulu_vv_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                        vuint16m1_t vs2, vuint16m1_t vs1,
                                        size_t vl);
vuint32m2_t __riscv_vwmulu_vx_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                        vuint16m1_t vs2, uint16_t rs1,
                                        size_t vl);
vuint32m4_t __riscv_vwmulu_vv_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                        vuint16m2_t vs2, vuint16m2_t vs1,
                                        size_t vl);
vuint32m4_t __riscv_vwmulu_vx_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                        vuint16m2_t vs2, uint16_t rs1,
                                        size_t vl);
vuint32m8_t __riscv_vwmulu_vv_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                        vuint16m4_t vs2, vuint16m4_t vs1,
                                        size_t vl);
vuint32m8_t __riscv_vwmulu_vx_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                        vuint16m4_t vs2, uint16_t rs1,
                                        size_t vl);
vuint64m1_t __riscv_vwmulu_vv_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                        vuint32mf2_t vs2, vuint32mf2_t vs1,
                                        size_t vl);
vuint64m1_t __riscv_vwmulu_vx_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                        vuint32mf2_t vs2, uint32_t rs1,
                                        size_t vl);
vuint64m2_t __riscv_vwmulu_vv_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                        vuint32m1_t vs2, vuint32m1_t vs1,
                                        size_t vl);
vuint64m2_t __riscv_vwmulu_vx_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                        vuint32m1_t vs2, uint32_t rs1,
                                        size_t vl);
vuint64m4_t __riscv_vwmulu_vv_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                        vuint32m2_t vs2, vuint32m2_t vs1,
                                        size_t vl);
vuint64m4_t __riscv_vwmulu_vx_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                        vuint32m2_t vs2, uint32_t rs1,
                                        size_t vl);
vuint64m8_t __riscv_vwmulu_vv_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                        vuint32m4_t vs2, vuint32m4_t vs1,
                                        size_t vl);
vuint64m8_t __riscv_vwmulu_vx_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                        vuint32m4_t vs2, uint32_t rs1,
                                        size_t vl);
// masked functions (tail undisturbed, mask undisturbed: _tumu variants)
vint16mf4_t __riscv_vwmul_vv_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                         vint8mf8_t vs2, vint8mf8_t vs1,
                                         size_t vl);
vint16mf4_t __riscv_vwmul_vx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                         vint8mf8_t vs2, int8_t rs1, size_t vl);
vint16mf2_t __riscv_vwmul_vv_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                         vint8mf4_t vs2, vint8mf4_t vs1,
                                         size_t vl);
vint16mf2_t __riscv_vwmul_vx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                         vint8mf4_t vs2, int8_t rs1, size_t vl);
vint16m1_t __riscv_vwmul_vv_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                       vint8mf2_t vs2, vint8mf2_t vs1,
                                       size_t vl);
vint16m1_t __riscv_vwmul_vx_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                       vint8mf2_t vs2, int8_t rs1, size_t vl);
vint16m2_t __riscv_vwmul_vv_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                       vint8m1_t vs2, vint8m1_t vs1, size_t vl);
vint16m2_t __riscv_vwmul_vx_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                       vint8m1_t vs2, int8_t rs1, size_t vl);
vint16m4_t __riscv_vwmul_vv_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                       vint8m2_t vs2, vint8m2_t vs1, size_t vl);
vint16m4_t __riscv_vwmul_vx_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                       vint8m2_t vs2, int8_t rs1, size_t vl);
vint16m8_t __riscv_vwmul_vv_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                       vint8m4_t vs2, vint8m4_t vs1, size_t vl);
vint16m8_t __riscv_vwmul_vx_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                       vint8m4_t vs2, int8_t rs1, size_t vl);
vint32mf2_t __riscv_vwmul_vv_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                         vint16mf4_t vs2, vint16mf4_t vs1,
                                         size_t vl);
vint32mf2_t __riscv_vwmul_vx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                         vint16mf4_t vs2, int16_t rs1,
                                         size_t vl);
vint32m1_t __riscv_vwmul_vv_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                       vint16mf2_t vs2, vint16mf2_t vs1,
                                       size_t vl);
vint32m1_t __riscv_vwmul_vx_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                       vint16mf2_t vs2, int16_t rs1, size_t vl);
vint32m2_t __riscv_vwmul_vv_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                       vint16m1_t vs2, vint16m1_t vs1,
                                       size_t vl);
vint32m2_t __riscv_vwmul_vx_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                       vint16m1_t vs2, int16_t rs1, size_t vl);
vint32m4_t __riscv_vwmul_vv_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                       vint16m2_t vs2, vint16m2_t vs1,
                                       size_t vl);
vint32m4_t __riscv_vwmul_vx_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                       vint16m2_t vs2, int16_t rs1, size_t vl);
vint32m8_t __riscv_vwmul_vv_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                       vint16m4_t vs2, vint16m4_t vs1,
                                       size_t vl);
vint32m8_t __riscv_vwmul_vx_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                       vint16m4_t vs2, int16_t rs1, size_t vl);
vint64m1_t __riscv_vwmul_vv_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                       vint32mf2_t vs2, vint32mf2_t vs1,
                                       size_t vl);
vint64m1_t __riscv_vwmul_vx_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                       vint32mf2_t vs2, int32_t rs1, size_t vl);
vint64m2_t __riscv_vwmul_vv_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                       vint32m1_t vs2, vint32m1_t vs1,
                                       size_t vl);
vint64m2_t __riscv_vwmul_vx_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                       vint32m1_t vs2, int32_t rs1, size_t vl);
vint64m4_t __riscv_vwmul_vv_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                       vint32m2_t vs2, vint32m2_t vs1,
                                       size_t vl);
vint64m4_t __riscv_vwmul_vx_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                       vint32m2_t vs2, int32_t rs1, size_t vl);
vint64m8_t __riscv_vwmul_vv_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                       vint32m4_t vs2, vint32m4_t vs1,
                                       size_t vl);
vint64m8_t __riscv_vwmul_vx_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                       vint32m4_t vs2, int32_t rs1, size_t vl);
vint16mf4_t __riscv_vwmulsu_vv_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                           vint8mf8_t vs2, vuint8mf8_t vs1,
                                           size_t vl);
vint16mf4_t __riscv_vwmulsu_vx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                           vint8mf8_t vs2, uint8_t rs1,
                                           size_t vl);
vint16mf2_t __riscv_vwmulsu_vv_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                           vint8mf4_t vs2, vuint8mf4_t vs1,
                                           size_t vl);
vint16mf2_t __riscv_vwmulsu_vx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                           vint8mf4_t vs2, uint8_t rs1,
                                           size_t vl);
vint16m1_t __riscv_vwmulsu_vv_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                         vint8mf2_t vs2, vuint8mf2_t vs1,
                                         size_t vl);
vint16m1_t __riscv_vwmulsu_vx_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                         vint8mf2_t vs2, uint8_t rs1,
                                         size_t vl);
vint16m2_t __riscv_vwmulsu_vv_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                         vint8m1_t vs2, vuint8m1_t vs1,
                                         size_t vl);
vint16m2_t __riscv_vwmulsu_vx_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                         vint8m1_t vs2, uint8_t rs1, size_t vl);
vint16m4_t __riscv_vwmulsu_vv_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                         vint8m2_t vs2, vuint8m2_t vs1,
                                         size_t vl);
vint16m4_t __riscv_vwmulsu_vx_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                         vint8m2_t vs2, uint8_t rs1, size_t vl);
vint16m8_t __riscv_vwmulsu_vv_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                         vint8m4_t vs2, vuint8m4_t vs1,
                                         size_t vl);
vint16m8_t __riscv_vwmulsu_vx_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                         vint8m4_t vs2, uint8_t rs1, size_t vl);
vint32mf2_t __riscv_vwmulsu_vv_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                           vint16mf4_t vs2, vuint16mf4_t vs1,
                                           size_t vl);
vint32mf2_t __riscv_vwmulsu_vx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                           vint16mf4_t vs2, uint16_t rs1,
                                           size_t vl);
vint32m1_t __riscv_vwmulsu_vv_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                         vint16mf2_t vs2, vuint16mf2_t vs1,
                                         size_t vl);
vint32m1_t __riscv_vwmulsu_vx_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                         vint16mf2_t vs2, uint16_t rs1,
                                         size_t vl);
vint32m2_t __riscv_vwmulsu_vv_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                         vint16m1_t vs2, vuint16m1_t vs1,
                                         size_t vl);
vint32m2_t __riscv_vwmulsu_vx_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                         vint16m1_t vs2, uint16_t rs1,
                                         size_t vl);
vint32m4_t __riscv_vwmulsu_vv_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                         vint16m2_t vs2, vuint16m2_t vs1,
                                         size_t vl);
vint32m4_t __riscv_vwmulsu_vx_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                         vint16m2_t vs2, uint16_t rs1,
                                         size_t vl);
vint32m8_t __riscv_vwmulsu_vv_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                         vint16m4_t vs2, vuint16m4_t vs1,
                                         size_t vl);
vint32m8_t __riscv_vwmulsu_vx_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                         vint16m4_t vs2, uint16_t rs1,
                                         size_t vl);
vint64m1_t __riscv_vwmulsu_vv_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                         vint32mf2_t vs2, vuint32mf2_t vs1,
                                         size_t vl);
vint64m1_t __riscv_vwmulsu_vx_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                         vint32mf2_t vs2, uint32_t rs1,
                                         size_t vl);
vint64m2_t __riscv_vwmulsu_vv_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                         vint32m1_t vs2, vuint32m1_t vs1,
                                         size_t vl);
vint64m2_t __riscv_vwmulsu_vx_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                         vint32m1_t vs2, uint32_t rs1,
                                         size_t vl);
vint64m4_t __riscv_vwmulsu_vv_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                         vint32m2_t vs2, vuint32m2_t vs1,
                                         size_t vl);
vint64m4_t __riscv_vwmulsu_vx_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                         vint32m2_t vs2, uint32_t rs1,
                                         size_t vl);
vint64m8_t __riscv_vwmulsu_vv_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                         vint32m4_t vs2, vuint32m4_t vs1,
                                         size_t vl);
vint64m8_t __riscv_vwmulsu_vx_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                         vint32m4_t vs2, uint32_t rs1,
                                         size_t vl);
vuint16mf4_t __riscv_vwmulu_vv_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                           vuint8mf8_t vs2, vuint8mf8_t vs1,
                                           size_t vl);
vuint16mf4_t __riscv_vwmulu_vx_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                           vuint8mf8_t vs2, uint8_t rs1,
                                           size_t vl);
vuint16mf2_t __riscv_vwmulu_vv_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                           vuint8mf4_t vs2, vuint8mf4_t vs1,
                                           size_t vl);
vuint16mf2_t __riscv_vwmulu_vx_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                           vuint8mf4_t vs2, uint8_t rs1,
                                           size_t vl);
vuint16m1_t __riscv_vwmulu_vv_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                         vuint8mf2_t vs2, vuint8mf2_t vs1,
                                         size_t vl);
vuint16m1_t __riscv_vwmulu_vx_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                         vuint8mf2_t vs2, uint8_t rs1,
                                         size_t vl);
vuint16m2_t __riscv_vwmulu_vv_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                         vuint8m1_t vs2, vuint8m1_t vs1,
                                         size_t vl);
vuint16m2_t __riscv_vwmulu_vx_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                         vuint8m1_t vs2, uint8_t rs1,
                                         size_t vl);
vuint16m4_t __riscv_vwmulu_vv_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                         vuint8m2_t vs2, vuint8m2_t vs1,
                                         size_t vl);
vuint16m4_t __riscv_vwmulu_vx_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                         vuint8m2_t vs2, uint8_t rs1,
                                         size_t vl);
vuint16m8_t __riscv_vwmulu_vv_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                         vuint8m4_t vs2, vuint8m4_t vs1,
                                         size_t vl);
vuint16m8_t __riscv_vwmulu_vx_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                         vuint8m4_t vs2, uint8_t rs1,
                                         size_t vl);
vuint32mf2_t __riscv_vwmulu_vv_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                           vuint16mf4_t vs2, vuint16mf4_t vs1,
                                           size_t vl);
vuint32mf2_t __riscv_vwmulu_vx_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                           vuint16mf4_t vs2, uint16_t rs1,
                                           size_t vl);
vuint32m1_t __riscv_vwmulu_vv_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                         vuint16mf2_t vs2, vuint16mf2_t vs1,
                                         size_t vl);
vuint32m1_t __riscv_vwmulu_vx_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                         vuint16mf2_t vs2, uint16_t rs1,
                                         size_t vl);
vuint32m2_t __riscv_vwmulu_vv_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                         vuint16m1_t vs2, vuint16m1_t vs1,
                                         size_t vl);
vuint32m2_t __riscv_vwmulu_vx_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                         vuint16m1_t vs2, uint16_t rs1,
                                         size_t vl);
vuint32m4_t __riscv_vwmulu_vv_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                         vuint16m2_t vs2, vuint16m2_t vs1,
                                         size_t vl);
vuint32m4_t __riscv_vwmulu_vx_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                         vuint16m2_t vs2, uint16_t rs1,
                                         size_t vl);
vuint32m8_t __riscv_vwmulu_vv_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                         vuint16m4_t vs2, vuint16m4_t vs1,
                                         size_t vl);
vuint32m8_t __riscv_vwmulu_vx_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                         vuint16m4_t vs2, uint16_t rs1,
                                         size_t vl);
vuint64m1_t __riscv_vwmulu_vv_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                         vuint32mf2_t vs2, vuint32mf2_t vs1,
                                         size_t vl);
vuint64m1_t __riscv_vwmulu_vx_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                         vuint32mf2_t vs2, uint32_t rs1,
                                         size_t vl);
vuint64m2_t __riscv_vwmulu_vv_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                         vuint32m1_t vs2, vuint32m1_t vs1,
                                         size_t vl);
vuint64m2_t __riscv_vwmulu_vx_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                         vuint32m1_t vs2, uint32_t rs1,
                                         size_t vl);
vuint64m4_t __riscv_vwmulu_vv_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                         vuint32m2_t vs2, vuint32m2_t vs1,
                                         size_t vl);
vuint64m4_t __riscv_vwmulu_vx_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                         vuint32m2_t vs2, uint32_t rs1,
                                         size_t vl);
vuint64m8_t __riscv_vwmulu_vv_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                         vuint32m4_t vs2, vuint32m4_t vs1,
                                         size_t vl);
vuint64m8_t __riscv_vwmulu_vx_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                         vuint32m4_t vs2, uint32_t rs1,
                                         size_t vl);
// masked functions (mask undisturbed: _mu variants)
vint16mf4_t __riscv_vwmul_vv_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                       vint8mf8_t vs2, vint8mf8_t vs1,
                                       size_t vl);
vint16mf4_t __riscv_vwmul_vx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                       vint8mf8_t vs2, int8_t rs1, size_t vl);
vint16mf2_t __riscv_vwmul_vv_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                       vint8mf4_t vs2, vint8mf4_t vs1,
                                       size_t vl);
vint16mf2_t __riscv_vwmul_vx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                       vint8mf4_t vs2, int8_t rs1, size_t vl);
vint16m1_t __riscv_vwmul_vv_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                     vint8mf2_t vs2, vint8mf2_t vs1, size_t vl);
vint16m1_t __riscv_vwmul_vx_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                     vint8mf2_t vs2, int8_t rs1, size_t vl);
vint16m2_t __riscv_vwmul_vv_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint8m1_t vs2,
                                     vint8m1_t vs1, size_t vl);
vint16m2_t __riscv_vwmul_vx_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint8m1_t vs2,
                                     int8_t rs1, size_t vl);
vint16m4_t __riscv_vwmul_vv_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint8m2_t vs2,
                                     vint8m2_t vs1, size_t vl);
vint16m4_t __riscv_vwmul_vx_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint8m2_t vs2,
                                     int8_t rs1, size_t vl);
vint16m8_t __riscv_vwmul_vv_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint8m4_t vs2,
                                     vint8m4_t vs1, size_t vl);
vint16m8_t __riscv_vwmul_vx_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint8m4_t vs2,
                                     int8_t rs1, size_t vl);
vint32mf2_t __riscv_vwmul_vv_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                       vint16mf4_t vs2, vint16mf4_t vs1,
                                       size_t vl);
vint32mf2_t __riscv_vwmul_vx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                       vint16mf4_t vs2, int16_t rs1, size_t vl);
vint32m1_t __riscv_vwmul_vv_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                     vint16mf2_t vs2, vint16mf2_t vs1,
                                     size_t vl);
vint32m1_t __riscv_vwmul_vx_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                     vint16mf2_t vs2, int16_t rs1, size_t vl);
vint32m2_t __riscv_vwmul_vv_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                     vint16m1_t vs2, vint16m1_t vs1, size_t vl);
vint32m2_t __riscv_vwmul_vx_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                     vint16m1_t vs2, int16_t rs1, size_t vl);
vint32m4_t __riscv_vwmul_vv_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint16m2_t vs2,
                                     vint16m2_t vs1, size_t vl);
vint32m4_t __riscv_vwmul_vx_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint16m2_t vs2,
                                     int16_t rs1, size_t vl);
vint32m8_t __riscv_vwmul_vv_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint16m4_t vs2,
                                     vint16m4_t vs1, size_t vl);
vint32m8_t __riscv_vwmul_vx_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint16m4_t vs2,
                                     int16_t rs1, size_t vl);
vint64m1_t __riscv_vwmul_vv_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                     vint32mf2_t vs2, vint32mf2_t vs1,
                                     size_t vl);
vint64m1_t __riscv_vwmul_vx_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                     vint32mf2_t vs2, int32_t rs1, size_t vl);
vint64m2_t __riscv_vwmul_vv_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                     vint32m1_t vs2, vint32m1_t vs1, size_t vl);
vint64m2_t __riscv_vwmul_vx_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                     vint32m1_t vs2, int32_t rs1, size_t vl);
vint64m4_t __riscv_vwmul_vv_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                     vint32m2_t vs2, vint32m2_t vs1, size_t vl);
vint64m4_t __riscv_vwmul_vx_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                     vint32m2_t vs2, int32_t rs1, size_t vl);
vint64m8_t __riscv_vwmul_vv_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint32m4_t vs2,
                                     vint32m4_t vs1, size_t vl);
vint64m8_t __riscv_vwmul_vx_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint32m4_t vs2,
                                     int32_t rs1, size_t vl);
vint16mf4_t __riscv_vwmulsu_vv_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                         vint8mf8_t vs2, vuint8mf8_t vs1,
                                         size_t vl);
vint16mf4_t __riscv_vwmulsu_vx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                         vint8mf8_t vs2, uint8_t rs1,
                                         size_t vl);
vint16mf2_t __riscv_vwmulsu_vv_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                         vint8mf4_t vs2, vuint8mf4_t vs1,
                                         size_t vl);
vint16mf2_t __riscv_vwmulsu_vx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                         vint8mf4_t vs2, uint8_t rs1,
                                         size_t vl);
vint16m1_t __riscv_vwmulsu_vv_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                       vint8mf2_t vs2, vuint8mf2_t vs1,
                                       size_t vl);
vint16m1_t __riscv_vwmulsu_vx_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                       vint8mf2_t vs2, uint8_t rs1, size_t vl);
vint16m2_t __riscv_vwmulsu_vv_i16m2_mu(vbool8_t vm, vint16m2_t vd,
                                       vint8m1_t vs2, vuint8m1_t vs1,
                                       size_t vl);
vint16m2_t __riscv_vwmulsu_vx_i16m2_mu(vbool8_t vm, vint16m2_t vd,
                                       vint8m1_t vs2, uint8_t rs1, size_t vl);
vint16m4_t __riscv_vwmulsu_vv_i16m4_mu(vbool4_t vm, vint16m4_t vd,
                                       vint8m2_t vs2, vuint8m2_t vs1,
                                       size_t vl);
vint16m4_t __riscv_vwmulsu_vx_i16m4_mu(vbool4_t vm, vint16m4_t vd,
                                       vint8m2_t vs2, uint8_t rs1, size_t vl);
vint16m8_t __riscv_vwmulsu_vv_i16m8_mu(vbool2_t vm, vint16m8_t vd,
                                       vint8m4_t vs2, vuint8m4_t vs1,
                                       size_t vl);
vint16m8_t __riscv_vwmulsu_vx_i16m8_mu(vbool2_t vm, vint16m8_t vd,
                                       vint8m4_t vs2, uint8_t rs1, size_t vl);
vint32mf2_t __riscv_vwmulsu_vv_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                         vint16mf4_t vs2, vuint16mf4_t vs1,
                                         size_t vl);
vint32mf2_t __riscv_vwmulsu_vx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                         vint16mf4_t vs2, uint16_t rs1,
                                         size_t vl);
vint32m1_t __riscv_vwmulsu_vv_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                       vint16mf2_t vs2, vuint16mf2_t vs1,
                                       size_t vl);
vint32m1_t __riscv_vwmulsu_vx_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                       vint16mf2_t vs2, uint16_t rs1,
                                       size_t vl);
vint32m2_t __riscv_vwmulsu_vv_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                       vint16m1_t vs2, vuint16m1_t vs1,
                                       size_t vl);
vint32m2_t __riscv_vwmulsu_vx_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                       vint16m1_t vs2, uint16_t rs1, size_t vl);
vint32m4_t __riscv_vwmulsu_vv_i32m4_mu(vbool8_t vm, vint32m4_t vd,
                                       vint16m2_t vs2, vuint16m2_t vs1,
                                       size_t vl);
vint32m4_t __riscv_vwmulsu_vx_i32m4_mu(vbool8_t vm, vint32m4_t vd,
                                       vint16m2_t vs2, uint16_t rs1, size_t vl);
vint32m8_t __riscv_vwmulsu_vv_i32m8_mu(vbool4_t vm, vint32m8_t vd,
                                       vint16m4_t vs2, vuint16m4_t vs1,
                                       size_t vl);
vint32m8_t __riscv_vwmulsu_vx_i32m8_mu(vbool4_t vm, vint32m8_t vd,
                                       vint16m4_t vs2, uint16_t rs1, size_t vl);
vint64m1_t __riscv_vwmulsu_vv_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                       vint32mf2_t vs2, vuint32mf2_t vs1,
                                       size_t vl);
vint64m1_t __riscv_vwmulsu_vx_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                       vint32mf2_t vs2, uint32_t rs1,
                                       size_t vl);
vint64m2_t __riscv_vwmulsu_vv_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                       vint32m1_t vs2, vuint32m1_t vs1,
                                       size_t vl);
vint64m2_t __riscv_vwmulsu_vx_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                       vint32m1_t vs2, uint32_t rs1, size_t vl);
vint64m4_t __riscv_vwmulsu_vv_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                       vint32m2_t vs2, vuint32m2_t vs1,
                                       size_t vl);
vint64m4_t __riscv_vwmulsu_vx_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                       vint32m2_t vs2, uint32_t rs1, size_t vl);
vint64m8_t __riscv_vwmulsu_vv_i64m8_mu(vbool8_t vm, vint64m8_t vd,
                                       vint32m4_t vs2, vuint32m4_t vs1,
                                       size_t vl);
vint64m8_t __riscv_vwmulsu_vx_i64m8_mu(vbool8_t vm, vint64m8_t vd,
                                       vint32m4_t vs2, uint32_t rs1, size_t vl);
vuint16mf4_t __riscv_vwmulu_vv_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                         vuint8mf8_t vs2, vuint8mf8_t vs1,
                                         size_t vl);
vuint16mf4_t __riscv_vwmulu_vx_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                         vuint8mf8_t vs2, uint8_t rs1,
                                         size_t vl);
vuint16mf2_t __riscv_vwmulu_vv_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                         vuint8mf4_t vs2, vuint8mf4_t vs1,
                                         size_t vl);
vuint16mf2_t __riscv_vwmulu_vx_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                         vuint8mf4_t vs2, uint8_t rs1,
                                         size_t vl);
vuint16m1_t __riscv_vwmulu_vv_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                       vuint8mf2_t vs2, vuint8mf2_t vs1,
                                       size_t vl);
vuint16m1_t __riscv_vwmulu_vx_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                       vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint16m2_t __riscv_vwmulu_vv_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                       vuint8m1_t vs2, vuint8m1_t vs1,
                                       size_t vl);
vuint16m2_t __riscv_vwmulu_vx_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                       vuint8m1_t vs2, uint8_t rs1, size_t vl);
vuint16m4_t __riscv_vwmulu_vv_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                       vuint8m2_t vs2, vuint8m2_t vs1,
                                       size_t vl);
vuint16m4_t __riscv_vwmulu_vx_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                       vuint8m2_t vs2, uint8_t rs1, size_t vl);
vuint16m8_t __riscv_vwmulu_vv_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                       vuint8m4_t vs2, vuint8m4_t vs1,
                                       size_t vl);
vuint16m8_t __riscv_vwmulu_vx_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                       vuint8m4_t vs2, uint8_t rs1, size_t vl);
vuint32mf2_t __riscv_vwmulu_vv_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                         vuint16mf4_t vs2, vuint16mf4_t vs1,
                                         size_t vl);
vuint32mf2_t __riscv_vwmulu_vx_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                         vuint16mf4_t vs2, uint16_t rs1,
                                         size_t vl);
vuint32m1_t __riscv_vwmulu_vv_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                       vuint16mf2_t vs2, vuint16mf2_t vs1,
                                       size_t vl);
vuint32m1_t __riscv_vwmulu_vx_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                       vuint16mf2_t vs2, uint16_t rs1,
                                       size_t vl);
vuint32m2_t __riscv_vwmulu_vv_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                       vuint16m1_t vs2, vuint16m1_t vs1,
                                       size_t vl);
vuint32m2_t __riscv_vwmulu_vx_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                       vuint16m1_t vs2, uint16_t rs1,
                                       size_t vl);
vuint32m4_t __riscv_vwmulu_vv_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                       vuint16m2_t vs2, vuint16m2_t vs1,
                                       size_t vl);
vuint32m4_t __riscv_vwmulu_vx_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                       vuint16m2_t vs2, uint16_t rs1,
                                       size_t vl);
vuint32m8_t __riscv_vwmulu_vv_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                       vuint16m4_t vs2, vuint16m4_t vs1,
                                       size_t vl);
vuint32m8_t __riscv_vwmulu_vx_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                       vuint16m4_t vs2, uint16_t rs1,
                                       size_t vl);
vuint64m1_t __riscv_vwmulu_vv_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                       vuint32mf2_t vs2, vuint32mf2_t vs1,
                                       size_t vl);
vuint64m1_t __riscv_vwmulu_vx_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                       vuint32mf2_t vs2, uint32_t rs1,
                                       size_t vl);
vuint64m2_t __riscv_vwmulu_vv_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                       vuint32m1_t vs2, vuint32m1_t vs1,
                                       size_t vl);
vuint64m2_t __riscv_vwmulu_vx_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                       vuint32m1_t vs2, uint32_t rs1,
                                       size_t vl);
vuint64m4_t __riscv_vwmulu_vv_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                       vuint32m2_t vs2, vuint32m2_t vs1,
                                       size_t vl);
vuint64m4_t __riscv_vwmulu_vx_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                       vuint32m2_t vs2, uint32_t rs1,
                                       size_t vl);
vuint64m8_t __riscv_vwmulu_vv_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                       vuint32m4_t vs2, vuint32m4_t vs1,
                                       size_t vl);
vuint64m8_t __riscv_vwmulu_vx_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                       vuint32m4_t vs2, uint32_t rs1,
                                       size_t vl);
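
A brief usage sketch (not part of the listing above): the masked, tail-undisturbed
variant of the widening multiply can be driven by a comparison-generated mask so
that only selected elements of the 32-bit accumulator are overwritten. The helper
intrinsics used here (__riscv_vsetvl_e16m1, __riscv_vle16_v_i16m1,
__riscv_vle32_v_i32m2, __riscv_vmslt_vx_i16m1_b16, __riscv_vse32_v_i32m2) are
assumed from the load/store and comparison sections of the intrinsic API rather
than from this listing.

#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

/* acc[i] = (int32_t)a[i] * b[i] wherever a[i] < 0; all other elements of acc,
 * including tail elements, keep their previous values (_tum policy). */
void widening_mul_where_negative(const int16_t *a, const int16_t *b,
                                 int32_t *acc, size_t n) {
  for (size_t i = 0; i < n;) {
    size_t vl = __riscv_vsetvl_e16m1(n - i);
    vint16m1_t va = __riscv_vle16_v_i16m1(a + i, vl);
    vint16m1_t vb = __riscv_vle16_v_i16m1(b + i, vl);
    vint32m2_t vd = __riscv_vle32_v_i32m2(acc + i, vl);   /* previous destination */
    vbool16_t vm = __riscv_vmslt_vx_i16m1_b16(va, 0, vl); /* mask: a[i] < 0 */
    vd = __riscv_vwmul_vv_i32m2_tum(vm, vd, va, vb, vl);
    __riscv_vse32_v_i32m2(acc + i, vd, vl);
    i += vl;
  }
}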

Vector Single-Width Integer Multiply-Add Intrinsics
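
As a short illustration under the same conventions, vmacc computes
vd[i] = vs1[i] * vs2[i] + vd[i]; the tail-undisturbed (_tu) form below leaves any
tail elements of the accumulator unchanged. The __riscv_vsetvl_e32m1,
__riscv_vle32_v_i32m1, and __riscv_vse32_v_i32m1 helpers are assumed from the
memory-access portions of the intrinsic API; this is a sketch, not a normative
part of the listing.

#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

/* acc[i] += a[i] * b[i] for the first vl elements of each strip; tail elements
 * of acc are left undisturbed by the _tu policy. */
void multiply_accumulate_i32(const int32_t *a, const int32_t *b,
                             int32_t *acc, size_t n) {
  for (size_t i = 0; i < n;) {
    size_t vl = __riscv_vsetvl_e32m1(n - i);
    vint32m1_t vs1 = __riscv_vle32_v_i32m1(a + i, vl);
    vint32m1_t vs2 = __riscv_vle32_v_i32m1(b + i, vl);
    vint32m1_t vd  = __riscv_vle32_v_i32m1(acc + i, vl);
    vd = __riscv_vmacc_vv_i32m1_tu(vd, vs1, vs2, vl);  /* vd = vs1 * vs2 + vd */
    __riscv_vse32_v_i32m1(acc + i, vd, vl);
    i += vl;
  }
}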

vint8mf8_t __riscv_vmacc_vv_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs1,
                                     vint8mf8_t vs2, size_t vl);
vint8mf8_t __riscv_vmacc_vx_i8mf8_tu(vint8mf8_t vd, int8_t rs1, vint8mf8_t vs2,
                                     size_t vl);
vint8mf4_t __riscv_vmacc_vv_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs1,
                                     vint8mf4_t vs2, size_t vl);
vint8mf4_t __riscv_vmacc_vx_i8mf4_tu(vint8mf4_t vd, int8_t rs1, vint8mf4_t vs2,
                                     size_t vl);
vint8mf2_t __riscv_vmacc_vv_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs1,
                                     vint8mf2_t vs2, size_t vl);
vint8mf2_t __riscv_vmacc_vx_i8mf2_tu(vint8mf2_t vd, int8_t rs1, vint8mf2_t vs2,
                                     size_t vl);
vint8m1_t __riscv_vmacc_vv_i8m1_tu(vint8m1_t vd, vint8m1_t vs1, vint8m1_t vs2,
                                   size_t vl);
vint8m1_t __riscv_vmacc_vx_i8m1_tu(vint8m1_t vd, int8_t rs1, vint8m1_t vs2,
                                   size_t vl);
vint8m2_t __riscv_vmacc_vv_i8m2_tu(vint8m2_t vd, vint8m2_t vs1, vint8m2_t vs2,
                                   size_t vl);
vint8m2_t __riscv_vmacc_vx_i8m2_tu(vint8m2_t vd, int8_t rs1, vint8m2_t vs2,
                                   size_t vl);
vint8m4_t __riscv_vmacc_vv_i8m4_tu(vint8m4_t vd, vint8m4_t vs1, vint8m4_t vs2,
                                   size_t vl);
vint8m4_t __riscv_vmacc_vx_i8m4_tu(vint8m4_t vd, int8_t rs1, vint8m4_t vs2,
                                   size_t vl);
vint8m8_t __riscv_vmacc_vv_i8m8_tu(vint8m8_t vd, vint8m8_t vs1, vint8m8_t vs2,
                                   size_t vl);
vint8m8_t __riscv_vmacc_vx_i8m8_tu(vint8m8_t vd, int8_t rs1, vint8m8_t vs2,
                                   size_t vl);
vint16mf4_t __riscv_vmacc_vv_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs1,
                                       vint16mf4_t vs2, size_t vl);
vint16mf4_t __riscv_vmacc_vx_i16mf4_tu(vint16mf4_t vd, int16_t rs1,
                                       vint16mf4_t vs2, size_t vl);
vint16mf2_t __riscv_vmacc_vv_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs1,
                                       vint16mf2_t vs2, size_t vl);
vint16mf2_t __riscv_vmacc_vx_i16mf2_tu(vint16mf2_t vd, int16_t rs1,
                                       vint16mf2_t vs2, size_t vl);
vint16m1_t __riscv_vmacc_vv_i16m1_tu(vint16m1_t vd, vint16m1_t vs1,
                                     vint16m1_t vs2, size_t vl);
vint16m1_t __riscv_vmacc_vx_i16m1_tu(vint16m1_t vd, int16_t rs1, vint16m1_t vs2,
                                     size_t vl);
vint16m2_t __riscv_vmacc_vv_i16m2_tu(vint16m2_t vd, vint16m2_t vs1,
                                     vint16m2_t vs2, size_t vl);
vint16m2_t __riscv_vmacc_vx_i16m2_tu(vint16m2_t vd, int16_t rs1, vint16m2_t vs2,
                                     size_t vl);
vint16m4_t __riscv_vmacc_vv_i16m4_tu(vint16m4_t vd, vint16m4_t vs1,
                                     vint16m4_t vs2, size_t vl);
vint16m4_t __riscv_vmacc_vx_i16m4_tu(vint16m4_t vd, int16_t rs1, vint16m4_t vs2,
                                     size_t vl);
vint16m8_t __riscv_vmacc_vv_i16m8_tu(vint16m8_t vd, vint16m8_t vs1,
                                     vint16m8_t vs2, size_t vl);
vint16m8_t __riscv_vmacc_vx_i16m8_tu(vint16m8_t vd, int16_t rs1, vint16m8_t vs2,
                                     size_t vl);
vint32mf2_t __riscv_vmacc_vv_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs1,
                                       vint32mf2_t vs2, size_t vl);
vint32mf2_t __riscv_vmacc_vx_i32mf2_tu(vint32mf2_t vd, int32_t rs1,
                                       vint32mf2_t vs2, size_t vl);
vint32m1_t __riscv_vmacc_vv_i32m1_tu(vint32m1_t vd, vint32m1_t vs1,
                                     vint32m1_t vs2, size_t vl);
vint32m1_t __riscv_vmacc_vx_i32m1_tu(vint32m1_t vd, int32_t rs1, vint32m1_t vs2,
                                     size_t vl);
vint32m2_t __riscv_vmacc_vv_i32m2_tu(vint32m2_t vd, vint32m2_t vs1,
                                     vint32m2_t vs2, size_t vl);
vint32m2_t __riscv_vmacc_vx_i32m2_tu(vint32m2_t vd, int32_t rs1, vint32m2_t vs2,
                                     size_t vl);
vint32m4_t __riscv_vmacc_vv_i32m4_tu(vint32m4_t vd, vint32m4_t vs1,
                                     vint32m4_t vs2, size_t vl);
vint32m4_t __riscv_vmacc_vx_i32m4_tu(vint32m4_t vd, int32_t rs1, vint32m4_t vs2,
                                     size_t vl);
vint32m8_t __riscv_vmacc_vv_i32m8_tu(vint32m8_t vd, vint32m8_t vs1,
                                     vint32m8_t vs2, size_t vl);
vint32m8_t __riscv_vmacc_vx_i32m8_tu(vint32m8_t vd, int32_t rs1, vint32m8_t vs2,
                                     size_t vl);
vint64m1_t __riscv_vmacc_vv_i64m1_tu(vint64m1_t vd, vint64m1_t vs1,
                                     vint64m1_t vs2, size_t vl);
vint64m1_t __riscv_vmacc_vx_i64m1_tu(vint64m1_t vd, int64_t rs1, vint64m1_t vs2,
                                     size_t vl);
vint64m2_t __riscv_vmacc_vv_i64m2_tu(vint64m2_t vd, vint64m2_t vs1,
                                     vint64m2_t vs2, size_t vl);
vint64m2_t __riscv_vmacc_vx_i64m2_tu(vint64m2_t vd, int64_t rs1, vint64m2_t vs2,
                                     size_t vl);
vint64m4_t __riscv_vmacc_vv_i64m4_tu(vint64m4_t vd, vint64m4_t vs1,
                                     vint64m4_t vs2, size_t vl);
vint64m4_t __riscv_vmacc_vx_i64m4_tu(vint64m4_t vd, int64_t rs1, vint64m4_t vs2,
                                     size_t vl);
vint64m8_t __riscv_vmacc_vv_i64m8_tu(vint64m8_t vd, vint64m8_t vs1,
                                     vint64m8_t vs2, size_t vl);
vint64m8_t __riscv_vmacc_vx_i64m8_tu(vint64m8_t vd, int64_t rs1, vint64m8_t vs2,
                                     size_t vl);
vint8mf8_t __riscv_vnmsac_vv_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs1,
                                      vint8mf8_t vs2, size_t vl);
vint8mf8_t __riscv_vnmsac_vx_i8mf8_tu(vint8mf8_t vd, int8_t rs1, vint8mf8_t vs2,
                                      size_t vl);
vint8mf4_t __riscv_vnmsac_vv_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs1,
                                      vint8mf4_t vs2, size_t vl);
vint8mf4_t __riscv_vnmsac_vx_i8mf4_tu(vint8mf4_t vd, int8_t rs1, vint8mf4_t vs2,
                                      size_t vl);
vint8mf2_t __riscv_vnmsac_vv_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs1,
                                      vint8mf2_t vs2, size_t vl);
vint8mf2_t __riscv_vnmsac_vx_i8mf2_tu(vint8mf2_t vd, int8_t rs1, vint8mf2_t vs2,
                                      size_t vl);
vint8m1_t __riscv_vnmsac_vv_i8m1_tu(vint8m1_t vd, vint8m1_t vs1, vint8m1_t vs2,
                                    size_t vl);
vint8m1_t __riscv_vnmsac_vx_i8m1_tu(vint8m1_t vd, int8_t rs1, vint8m1_t vs2,
                                    size_t vl);
vint8m2_t __riscv_vnmsac_vv_i8m2_tu(vint8m2_t vd, vint8m2_t vs1, vint8m2_t vs2,
                                    size_t vl);
vint8m2_t __riscv_vnmsac_vx_i8m2_tu(vint8m2_t vd, int8_t rs1, vint8m2_t vs2,
                                    size_t vl);
vint8m4_t __riscv_vnmsac_vv_i8m4_tu(vint8m4_t vd, vint8m4_t vs1, vint8m4_t vs2,
                                    size_t vl);
vint8m4_t __riscv_vnmsac_vx_i8m4_tu(vint8m4_t vd, int8_t rs1, vint8m4_t vs2,
                                    size_t vl);
vint8m8_t __riscv_vnmsac_vv_i8m8_tu(vint8m8_t vd, vint8m8_t vs1, vint8m8_t vs2,
                                    size_t vl);
vint8m8_t __riscv_vnmsac_vx_i8m8_tu(vint8m8_t vd, int8_t rs1, vint8m8_t vs2,
                                    size_t vl);
vint16mf4_t __riscv_vnmsac_vv_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs1,
                                        vint16mf4_t vs2, size_t vl);
vint16mf4_t __riscv_vnmsac_vx_i16mf4_tu(vint16mf4_t vd, int16_t rs1,
                                        vint16mf4_t vs2, size_t vl);
vint16mf2_t __riscv_vnmsac_vv_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs1,
                                        vint16mf2_t vs2, size_t vl);
vint16mf2_t __riscv_vnmsac_vx_i16mf2_tu(vint16mf2_t vd, int16_t rs1,
                                        vint16mf2_t vs2, size_t vl);
vint16m1_t __riscv_vnmsac_vv_i16m1_tu(vint16m1_t vd, vint16m1_t vs1,
                                      vint16m1_t vs2, size_t vl);
vint16m1_t __riscv_vnmsac_vx_i16m1_tu(vint16m1_t vd, int16_t rs1,
                                      vint16m1_t vs2, size_t vl);
vint16m2_t __riscv_vnmsac_vv_i16m2_tu(vint16m2_t vd, vint16m2_t vs1,
                                      vint16m2_t vs2, size_t vl);
vint16m2_t __riscv_vnmsac_vx_i16m2_tu(vint16m2_t vd, int16_t rs1,
                                      vint16m2_t vs2, size_t vl);
vint16m4_t __riscv_vnmsac_vv_i16m4_tu(vint16m4_t vd, vint16m4_t vs1,
                                      vint16m4_t vs2, size_t vl);
vint16m4_t __riscv_vnmsac_vx_i16m4_tu(vint16m4_t vd, int16_t rs1,
                                      vint16m4_t vs2, size_t vl);
vint16m8_t __riscv_vnmsac_vv_i16m8_tu(vint16m8_t vd, vint16m8_t vs1,
                                      vint16m8_t vs2, size_t vl);
vint16m8_t __riscv_vnmsac_vx_i16m8_tu(vint16m8_t vd, int16_t rs1,
                                      vint16m8_t vs2, size_t vl);
vint32mf2_t __riscv_vnmsac_vv_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs1,
                                        vint32mf2_t vs2, size_t vl);
vint32mf2_t __riscv_vnmsac_vx_i32mf2_tu(vint32mf2_t vd, int32_t rs1,
                                        vint32mf2_t vs2, size_t vl);
vint32m1_t __riscv_vnmsac_vv_i32m1_tu(vint32m1_t vd, vint32m1_t vs1,
                                      vint32m1_t vs2, size_t vl);
vint32m1_t __riscv_vnmsac_vx_i32m1_tu(vint32m1_t vd, int32_t rs1,
                                      vint32m1_t vs2, size_t vl);
vint32m2_t __riscv_vnmsac_vv_i32m2_tu(vint32m2_t vd, vint32m2_t vs1,
                                      vint32m2_t vs2, size_t vl);
vint32m2_t __riscv_vnmsac_vx_i32m2_tu(vint32m2_t vd, int32_t rs1,
                                      vint32m2_t vs2, size_t vl);
vint32m4_t __riscv_vnmsac_vv_i32m4_tu(vint32m4_t vd, vint32m4_t vs1,
                                      vint32m4_t vs2, size_t vl);
vint32m4_t __riscv_vnmsac_vx_i32m4_tu(vint32m4_t vd, int32_t rs1,
                                      vint32m4_t vs2, size_t vl);
vint32m8_t __riscv_vnmsac_vv_i32m8_tu(vint32m8_t vd, vint32m8_t vs1,
                                      vint32m8_t vs2, size_t vl);
vint32m8_t __riscv_vnmsac_vx_i32m8_tu(vint32m8_t vd, int32_t rs1,
                                      vint32m8_t vs2, size_t vl);
vint64m1_t __riscv_vnmsac_vv_i64m1_tu(vint64m1_t vd, vint64m1_t vs1,
                                      vint64m1_t vs2, size_t vl);
vint64m1_t __riscv_vnmsac_vx_i64m1_tu(vint64m1_t vd, int64_t rs1,
                                      vint64m1_t vs2, size_t vl);
vint64m2_t __riscv_vnmsac_vv_i64m2_tu(vint64m2_t vd, vint64m2_t vs1,
                                      vint64m2_t vs2, size_t vl);
vint64m2_t __riscv_vnmsac_vx_i64m2_tu(vint64m2_t vd, int64_t rs1,
                                      vint64m2_t vs2, size_t vl);
vint64m4_t __riscv_vnmsac_vv_i64m4_tu(vint64m4_t vd, vint64m4_t vs1,
                                      vint64m4_t vs2, size_t vl);
vint64m4_t __riscv_vnmsac_vx_i64m4_tu(vint64m4_t vd, int64_t rs1,
                                      vint64m4_t vs2, size_t vl);
vint64m8_t __riscv_vnmsac_vv_i64m8_tu(vint64m8_t vd, vint64m8_t vs1,
                                      vint64m8_t vs2, size_t vl);
vint64m8_t __riscv_vnmsac_vx_i64m8_tu(vint64m8_t vd, int64_t rs1,
                                      vint64m8_t vs2, size_t vl);
vint8mf8_t __riscv_vmadd_vv_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs1,
                                     vint8mf8_t vs2, size_t vl);
vint8mf8_t __riscv_vmadd_vx_i8mf8_tu(vint8mf8_t vd, int8_t rs1, vint8mf8_t vs2,
                                     size_t vl);
vint8mf4_t __riscv_vmadd_vv_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs1,
                                     vint8mf4_t vs2, size_t vl);
vint8mf4_t __riscv_vmadd_vx_i8mf4_tu(vint8mf4_t vd, int8_t rs1, vint8mf4_t vs2,
                                     size_t vl);
vint8mf2_t __riscv_vmadd_vv_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs1,
                                     vint8mf2_t vs2, size_t vl);
vint8mf2_t __riscv_vmadd_vx_i8mf2_tu(vint8mf2_t vd, int8_t rs1, vint8mf2_t vs2,
                                     size_t vl);
vint8m1_t __riscv_vmadd_vv_i8m1_tu(vint8m1_t vd, vint8m1_t vs1, vint8m1_t vs2,
                                   size_t vl);
vint8m1_t __riscv_vmadd_vx_i8m1_tu(vint8m1_t vd, int8_t rs1, vint8m1_t vs2,
                                   size_t vl);
vint8m2_t __riscv_vmadd_vv_i8m2_tu(vint8m2_t vd, vint8m2_t vs1, vint8m2_t vs2,
                                   size_t vl);
vint8m2_t __riscv_vmadd_vx_i8m2_tu(vint8m2_t vd, int8_t rs1, vint8m2_t vs2,
                                   size_t vl);
vint8m4_t __riscv_vmadd_vv_i8m4_tu(vint8m4_t vd, vint8m4_t vs1, vint8m4_t vs2,
                                   size_t vl);
vint8m4_t __riscv_vmadd_vx_i8m4_tu(vint8m4_t vd, int8_t rs1, vint8m4_t vs2,
                                   size_t vl);
vint8m8_t __riscv_vmadd_vv_i8m8_tu(vint8m8_t vd, vint8m8_t vs1, vint8m8_t vs2,
                                   size_t vl);
vint8m8_t __riscv_vmadd_vx_i8m8_tu(vint8m8_t vd, int8_t rs1, vint8m8_t vs2,
                                   size_t vl);
vint16mf4_t __riscv_vmadd_vv_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs1,
                                       vint16mf4_t vs2, size_t vl);
vint16mf4_t __riscv_vmadd_vx_i16mf4_tu(vint16mf4_t vd, int16_t rs1,
                                       vint16mf4_t vs2, size_t vl);
vint16mf2_t __riscv_vmadd_vv_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs1,
                                       vint16mf2_t vs2, size_t vl);
vint16mf2_t __riscv_vmadd_vx_i16mf2_tu(vint16mf2_t vd, int16_t rs1,
                                       vint16mf2_t vs2, size_t vl);
vint16m1_t __riscv_vmadd_vv_i16m1_tu(vint16m1_t vd, vint16m1_t vs1,
                                     vint16m1_t vs2, size_t vl);
vint16m1_t __riscv_vmadd_vx_i16m1_tu(vint16m1_t vd, int16_t rs1, vint16m1_t vs2,
                                     size_t vl);
vint16m2_t __riscv_vmadd_vv_i16m2_tu(vint16m2_t vd, vint16m2_t vs1,
                                     vint16m2_t vs2, size_t vl);
vint16m2_t __riscv_vmadd_vx_i16m2_tu(vint16m2_t vd, int16_t rs1, vint16m2_t vs2,
                                     size_t vl);
vint16m4_t __riscv_vmadd_vv_i16m4_tu(vint16m4_t vd, vint16m4_t vs1,
                                     vint16m4_t vs2, size_t vl);
vint16m4_t __riscv_vmadd_vx_i16m4_tu(vint16m4_t vd, int16_t rs1, vint16m4_t vs2,
                                     size_t vl);
vint16m8_t __riscv_vmadd_vv_i16m8_tu(vint16m8_t vd, vint16m8_t vs1,
                                     vint16m8_t vs2, size_t vl);
vint16m8_t __riscv_vmadd_vx_i16m8_tu(vint16m8_t vd, int16_t rs1, vint16m8_t vs2,
                                     size_t vl);
vint32mf2_t __riscv_vmadd_vv_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs1,
                                       vint32mf2_t vs2, size_t vl);
vint32mf2_t __riscv_vmadd_vx_i32mf2_tu(vint32mf2_t vd, int32_t rs1,
                                       vint32mf2_t vs2, size_t vl);
vint32m1_t __riscv_vmadd_vv_i32m1_tu(vint32m1_t vd, vint32m1_t vs1,
                                     vint32m1_t vs2, size_t vl);
vint32m1_t __riscv_vmadd_vx_i32m1_tu(vint32m1_t vd, int32_t rs1, vint32m1_t vs2,
                                     size_t vl);
vint32m2_t __riscv_vmadd_vv_i32m2_tu(vint32m2_t vd, vint32m2_t vs1,
                                     vint32m2_t vs2, size_t vl);
vint32m2_t __riscv_vmadd_vx_i32m2_tu(vint32m2_t vd, int32_t rs1, vint32m2_t vs2,
                                     size_t vl);
vint32m4_t __riscv_vmadd_vv_i32m4_tu(vint32m4_t vd, vint32m4_t vs1,
                                     vint32m4_t vs2, size_t vl);
vint32m4_t __riscv_vmadd_vx_i32m4_tu(vint32m4_t vd, int32_t rs1, vint32m4_t vs2,
                                     size_t vl);
vint32m8_t __riscv_vmadd_vv_i32m8_tu(vint32m8_t vd, vint32m8_t vs1,
                                     vint32m8_t vs2, size_t vl);
vint32m8_t __riscv_vmadd_vx_i32m8_tu(vint32m8_t vd, int32_t rs1, vint32m8_t vs2,
                                     size_t vl);
vint64m1_t __riscv_vmadd_vv_i64m1_tu(vint64m1_t vd, vint64m1_t vs1,
                                     vint64m1_t vs2, size_t vl);
vint64m1_t __riscv_vmadd_vx_i64m1_tu(vint64m1_t vd, int64_t rs1, vint64m1_t vs2,
                                     size_t vl);
vint64m2_t __riscv_vmadd_vv_i64m2_tu(vint64m2_t vd, vint64m2_t vs1,
                                     vint64m2_t vs2, size_t vl);
vint64m2_t __riscv_vmadd_vx_i64m2_tu(vint64m2_t vd, int64_t rs1, vint64m2_t vs2,
                                     size_t vl);
vint64m4_t __riscv_vmadd_vv_i64m4_tu(vint64m4_t vd, vint64m4_t vs1,
                                     vint64m4_t vs2, size_t vl);
vint64m4_t __riscv_vmadd_vx_i64m4_tu(vint64m4_t vd, int64_t rs1, vint64m4_t vs2,
                                     size_t vl);
vint64m8_t __riscv_vmadd_vv_i64m8_tu(vint64m8_t vd, vint64m8_t vs1,
                                     vint64m8_t vs2, size_t vl);
vint64m8_t __riscv_vmadd_vx_i64m8_tu(vint64m8_t vd, int64_t rs1, vint64m8_t vs2,
                                     size_t vl);
vint8mf8_t __riscv_vnmsub_vv_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs1,
                                      vint8mf8_t vs2, size_t vl);
vint8mf8_t __riscv_vnmsub_vx_i8mf8_tu(vint8mf8_t vd, int8_t rs1, vint8mf8_t vs2,
                                      size_t vl);
vint8mf4_t __riscv_vnmsub_vv_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs1,
                                      vint8mf4_t vs2, size_t vl);
vint8mf4_t __riscv_vnmsub_vx_i8mf4_tu(vint8mf4_t vd, int8_t rs1, vint8mf4_t vs2,
                                      size_t vl);
vint8mf2_t __riscv_vnmsub_vv_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs1,
                                      vint8mf2_t vs2, size_t vl);
vint8mf2_t __riscv_vnmsub_vx_i8mf2_tu(vint8mf2_t vd, int8_t rs1, vint8mf2_t vs2,
                                      size_t vl);
vint8m1_t __riscv_vnmsub_vv_i8m1_tu(vint8m1_t vd, vint8m1_t vs1, vint8m1_t vs2,
                                    size_t vl);
vint8m1_t __riscv_vnmsub_vx_i8m1_tu(vint8m1_t vd, int8_t rs1, vint8m1_t vs2,
                                    size_t vl);
vint8m2_t __riscv_vnmsub_vv_i8m2_tu(vint8m2_t vd, vint8m2_t vs1, vint8m2_t vs2,
                                    size_t vl);
vint8m2_t __riscv_vnmsub_vx_i8m2_tu(vint8m2_t vd, int8_t rs1, vint8m2_t vs2,
                                    size_t vl);
vint8m4_t __riscv_vnmsub_vv_i8m4_tu(vint8m4_t vd, vint8m4_t vs1, vint8m4_t vs2,
                                    size_t vl);
vint8m4_t __riscv_vnmsub_vx_i8m4_tu(vint8m4_t vd, int8_t rs1, vint8m4_t vs2,
                                    size_t vl);
vint8m8_t __riscv_vnmsub_vv_i8m8_tu(vint8m8_t vd, vint8m8_t vs1, vint8m8_t vs2,
                                    size_t vl);
vint8m8_t __riscv_vnmsub_vx_i8m8_tu(vint8m8_t vd, int8_t rs1, vint8m8_t vs2,
                                    size_t vl);
vint16mf4_t __riscv_vnmsub_vv_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs1,
                                        vint16mf4_t vs2, size_t vl);
vint16mf4_t __riscv_vnmsub_vx_i16mf4_tu(vint16mf4_t vd, int16_t rs1,
                                        vint16mf4_t vs2, size_t vl);
vint16mf2_t __riscv_vnmsub_vv_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs1,
                                        vint16mf2_t vs2, size_t vl);
vint16mf2_t __riscv_vnmsub_vx_i16mf2_tu(vint16mf2_t vd, int16_t rs1,
                                        vint16mf2_t vs2, size_t vl);
vint16m1_t __riscv_vnmsub_vv_i16m1_tu(vint16m1_t vd, vint16m1_t vs1,
                                      vint16m1_t vs2, size_t vl);
vint16m1_t __riscv_vnmsub_vx_i16m1_tu(vint16m1_t vd, int16_t rs1,
                                      vint16m1_t vs2, size_t vl);
vint16m2_t __riscv_vnmsub_vv_i16m2_tu(vint16m2_t vd, vint16m2_t vs1,
                                      vint16m2_t vs2, size_t vl);
vint16m2_t __riscv_vnmsub_vx_i16m2_tu(vint16m2_t vd, int16_t rs1,
                                      vint16m2_t vs2, size_t vl);
vint16m4_t __riscv_vnmsub_vv_i16m4_tu(vint16m4_t vd, vint16m4_t vs1,
                                      vint16m4_t vs2, size_t vl);
vint16m4_t __riscv_vnmsub_vx_i16m4_tu(vint16m4_t vd, int16_t rs1,
                                      vint16m4_t vs2, size_t vl);
vint16m8_t __riscv_vnmsub_vv_i16m8_tu(vint16m8_t vd, vint16m8_t vs1,
                                      vint16m8_t vs2, size_t vl);
vint16m8_t __riscv_vnmsub_vx_i16m8_tu(vint16m8_t vd, int16_t rs1,
                                      vint16m8_t vs2, size_t vl);
vint32mf2_t __riscv_vnmsub_vv_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs1,
                                        vint32mf2_t vs2, size_t vl);
vint32mf2_t __riscv_vnmsub_vx_i32mf2_tu(vint32mf2_t vd, int32_t rs1,
                                        vint32mf2_t vs2, size_t vl);
vint32m1_t __riscv_vnmsub_vv_i32m1_tu(vint32m1_t vd, vint32m1_t vs1,
                                      vint32m1_t vs2, size_t vl);
vint32m1_t __riscv_vnmsub_vx_i32m1_tu(vint32m1_t vd, int32_t rs1,
                                      vint32m1_t vs2, size_t vl);
vint32m2_t __riscv_vnmsub_vv_i32m2_tu(vint32m2_t vd, vint32m2_t vs1,
                                      vint32m2_t vs2, size_t vl);
vint32m2_t __riscv_vnmsub_vx_i32m2_tu(vint32m2_t vd, int32_t rs1,
                                      vint32m2_t vs2, size_t vl);
vint32m4_t __riscv_vnmsub_vv_i32m4_tu(vint32m4_t vd, vint32m4_t vs1,
                                      vint32m4_t vs2, size_t vl);
vint32m4_t __riscv_vnmsub_vx_i32m4_tu(vint32m4_t vd, int32_t rs1,
                                      vint32m4_t vs2, size_t vl);
vint32m8_t __riscv_vnmsub_vv_i32m8_tu(vint32m8_t vd, vint32m8_t vs1,
                                      vint32m8_t vs2, size_t vl);
vint32m8_t __riscv_vnmsub_vx_i32m8_tu(vint32m8_t vd, int32_t rs1,
                                      vint32m8_t vs2, size_t vl);
vint64m1_t __riscv_vnmsub_vv_i64m1_tu(vint64m1_t vd, vint64m1_t vs1,
                                      vint64m1_t vs2, size_t vl);
vint64m1_t __riscv_vnmsub_vx_i64m1_tu(vint64m1_t vd, int64_t rs1,
                                      vint64m1_t vs2, size_t vl);
vint64m2_t __riscv_vnmsub_vv_i64m2_tu(vint64m2_t vd, vint64m2_t vs1,
                                      vint64m2_t vs2, size_t vl);
vint64m2_t __riscv_vnmsub_vx_i64m2_tu(vint64m2_t vd, int64_t rs1,
                                      vint64m2_t vs2, size_t vl);
vint64m4_t __riscv_vnmsub_vv_i64m4_tu(vint64m4_t vd, vint64m4_t vs1,
                                      vint64m4_t vs2, size_t vl);
vint64m4_t __riscv_vnmsub_vx_i64m4_tu(vint64m4_t vd, int64_t rs1,
                                      vint64m4_t vs2, size_t vl);
vint64m8_t __riscv_vnmsub_vv_i64m8_tu(vint64m8_t vd, vint64m8_t vs1,
                                      vint64m8_t vs2, size_t vl);
vint64m8_t __riscv_vnmsub_vx_i64m8_tu(vint64m8_t vd, int64_t rs1,
                                      vint64m8_t vs2, size_t vl);
vuint8mf8_t __riscv_vmacc_vv_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs1,
                                      vuint8mf8_t vs2, size_t vl);
vuint8mf8_t __riscv_vmacc_vx_u8mf8_tu(vuint8mf8_t vd, uint8_t rs1,
                                      vuint8mf8_t vs2, size_t vl);
vuint8mf4_t __riscv_vmacc_vv_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs1,
                                      vuint8mf4_t vs2, size_t vl);
vuint8mf4_t __riscv_vmacc_vx_u8mf4_tu(vuint8mf4_t vd, uint8_t rs1,
                                      vuint8mf4_t vs2, size_t vl);
vuint8mf2_t __riscv_vmacc_vv_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs1,
                                      vuint8mf2_t vs2, size_t vl);
vuint8mf2_t __riscv_vmacc_vx_u8mf2_tu(vuint8mf2_t vd, uint8_t rs1,
                                      vuint8mf2_t vs2, size_t vl);
vuint8m1_t __riscv_vmacc_vv_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs1,
                                    vuint8m1_t vs2, size_t vl);
vuint8m1_t __riscv_vmacc_vx_u8m1_tu(vuint8m1_t vd, uint8_t rs1, vuint8m1_t vs2,
                                    size_t vl);
vuint8m2_t __riscv_vmacc_vv_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs1,
                                    vuint8m2_t vs2, size_t vl);
vuint8m2_t __riscv_vmacc_vx_u8m2_tu(vuint8m2_t vd, uint8_t rs1, vuint8m2_t vs2,
                                    size_t vl);
vuint8m4_t __riscv_vmacc_vv_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs1,
                                    vuint8m4_t vs2, size_t vl);
vuint8m4_t __riscv_vmacc_vx_u8m4_tu(vuint8m4_t vd, uint8_t rs1, vuint8m4_t vs2,
                                    size_t vl);
vuint8m8_t __riscv_vmacc_vv_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs1,
                                    vuint8m8_t vs2, size_t vl);
vuint8m8_t __riscv_vmacc_vx_u8m8_tu(vuint8m8_t vd, uint8_t rs1, vuint8m8_t vs2,
                                    size_t vl);
vuint16mf4_t __riscv_vmacc_vv_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs1,
                                        vuint16mf4_t vs2, size_t vl);
vuint16mf4_t __riscv_vmacc_vx_u16mf4_tu(vuint16mf4_t vd, uint16_t rs1,
                                        vuint16mf4_t vs2, size_t vl);
vuint16mf2_t __riscv_vmacc_vv_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs1,
                                        vuint16mf2_t vs2, size_t vl);
vuint16mf2_t __riscv_vmacc_vx_u16mf2_tu(vuint16mf2_t vd, uint16_t rs1,
                                        vuint16mf2_t vs2, size_t vl);
vuint16m1_t __riscv_vmacc_vv_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs1,
                                      vuint16m1_t vs2, size_t vl);
vuint16m1_t __riscv_vmacc_vx_u16m1_tu(vuint16m1_t vd, uint16_t rs1,
                                      vuint16m1_t vs2, size_t vl);
vuint16m2_t __riscv_vmacc_vv_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs1,
                                      vuint16m2_t vs2, size_t vl);
vuint16m2_t __riscv_vmacc_vx_u16m2_tu(vuint16m2_t vd, uint16_t rs1,
                                      vuint16m2_t vs2, size_t vl);
vuint16m4_t __riscv_vmacc_vv_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs1,
                                      vuint16m4_t vs2, size_t vl);
vuint16m4_t __riscv_vmacc_vx_u16m4_tu(vuint16m4_t vd, uint16_t rs1,
                                      vuint16m4_t vs2, size_t vl);
vuint16m8_t __riscv_vmacc_vv_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs1,
                                      vuint16m8_t vs2, size_t vl);
vuint16m8_t __riscv_vmacc_vx_u16m8_tu(vuint16m8_t vd, uint16_t rs1,
                                      vuint16m8_t vs2, size_t vl);
vuint32mf2_t __riscv_vmacc_vv_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs1,
                                        vuint32mf2_t vs2, size_t vl);
vuint32mf2_t __riscv_vmacc_vx_u32mf2_tu(vuint32mf2_t vd, uint32_t rs1,
                                        vuint32mf2_t vs2, size_t vl);
vuint32m1_t __riscv_vmacc_vv_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs1,
                                      vuint32m1_t vs2, size_t vl);
vuint32m1_t __riscv_vmacc_vx_u32m1_tu(vuint32m1_t vd, uint32_t rs1,
                                      vuint32m1_t vs2, size_t vl);
vuint32m2_t __riscv_vmacc_vv_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs1,
                                      vuint32m2_t vs2, size_t vl);
vuint32m2_t __riscv_vmacc_vx_u32m2_tu(vuint32m2_t vd, uint32_t rs1,
                                      vuint32m2_t vs2, size_t vl);
vuint32m4_t __riscv_vmacc_vv_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs1,
                                      vuint32m4_t vs2, size_t vl);
vuint32m4_t __riscv_vmacc_vx_u32m4_tu(vuint32m4_t vd, uint32_t rs1,
                                      vuint32m4_t vs2, size_t vl);
vuint32m8_t __riscv_vmacc_vv_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs1,
                                      vuint32m8_t vs2, size_t vl);
vuint32m8_t __riscv_vmacc_vx_u32m8_tu(vuint32m8_t vd, uint32_t rs1,
                                      vuint32m8_t vs2, size_t vl);
vuint64m1_t __riscv_vmacc_vv_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs1,
                                      vuint64m1_t vs2, size_t vl);
vuint64m1_t __riscv_vmacc_vx_u64m1_tu(vuint64m1_t vd, uint64_t rs1,
                                      vuint64m1_t vs2, size_t vl);
vuint64m2_t __riscv_vmacc_vv_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs1,
                                      vuint64m2_t vs2, size_t vl);
vuint64m2_t __riscv_vmacc_vx_u64m2_tu(vuint64m2_t vd, uint64_t rs1,
                                      vuint64m2_t vs2, size_t vl);
vuint64m4_t __riscv_vmacc_vv_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs1,
                                      vuint64m4_t vs2, size_t vl);
vuint64m4_t __riscv_vmacc_vx_u64m4_tu(vuint64m4_t vd, uint64_t rs1,
                                      vuint64m4_t vs2, size_t vl);
vuint64m8_t __riscv_vmacc_vv_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs1,
                                      vuint64m8_t vs2, size_t vl);
vuint64m8_t __riscv_vmacc_vx_u64m8_tu(vuint64m8_t vd, uint64_t rs1,
                                      vuint64m8_t vs2, size_t vl);
vuint8mf8_t __riscv_vnmsac_vv_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs1,
                                       vuint8mf8_t vs2, size_t vl);
vuint8mf8_t __riscv_vnmsac_vx_u8mf8_tu(vuint8mf8_t vd, uint8_t rs1,
                                       vuint8mf8_t vs2, size_t vl);
vuint8mf4_t __riscv_vnmsac_vv_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs1,
                                       vuint8mf4_t vs2, size_t vl);
vuint8mf4_t __riscv_vnmsac_vx_u8mf4_tu(vuint8mf4_t vd, uint8_t rs1,
                                       vuint8mf4_t vs2, size_t vl);
vuint8mf2_t __riscv_vnmsac_vv_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs1,
                                       vuint8mf2_t vs2, size_t vl);
vuint8mf2_t __riscv_vnmsac_vx_u8mf2_tu(vuint8mf2_t vd, uint8_t rs1,
                                       vuint8mf2_t vs2, size_t vl);
vuint8m1_t __riscv_vnmsac_vv_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs1,
                                     vuint8m1_t vs2, size_t vl);
vuint8m1_t __riscv_vnmsac_vx_u8m1_tu(vuint8m1_t vd, uint8_t rs1, vuint8m1_t vs2,
                                     size_t vl);
vuint8m2_t __riscv_vnmsac_vv_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs1,
                                     vuint8m2_t vs2, size_t vl);
vuint8m2_t __riscv_vnmsac_vx_u8m2_tu(vuint8m2_t vd, uint8_t rs1, vuint8m2_t vs2,
                                     size_t vl);
vuint8m4_t __riscv_vnmsac_vv_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs1,
                                     vuint8m4_t vs2, size_t vl);
vuint8m4_t __riscv_vnmsac_vx_u8m4_tu(vuint8m4_t vd, uint8_t rs1, vuint8m4_t vs2,
                                     size_t vl);
vuint8m8_t __riscv_vnmsac_vv_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs1,
                                     vuint8m8_t vs2, size_t vl);
vuint8m8_t __riscv_vnmsac_vx_u8m8_tu(vuint8m8_t vd, uint8_t rs1, vuint8m8_t vs2,
                                     size_t vl);
vuint16mf4_t __riscv_vnmsac_vv_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs1,
                                         vuint16mf4_t vs2, size_t vl);
vuint16mf4_t __riscv_vnmsac_vx_u16mf4_tu(vuint16mf4_t vd, uint16_t rs1,
                                         vuint16mf4_t vs2, size_t vl);
vuint16mf2_t __riscv_vnmsac_vv_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs1,
                                         vuint16mf2_t vs2, size_t vl);
vuint16mf2_t __riscv_vnmsac_vx_u16mf2_tu(vuint16mf2_t vd, uint16_t rs1,
                                         vuint16mf2_t vs2, size_t vl);
vuint16m1_t __riscv_vnmsac_vv_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs1,
                                       vuint16m1_t vs2, size_t vl);
vuint16m1_t __riscv_vnmsac_vx_u16m1_tu(vuint16m1_t vd, uint16_t rs1,
                                       vuint16m1_t vs2, size_t vl);
vuint16m2_t __riscv_vnmsac_vv_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs1,
                                       vuint16m2_t vs2, size_t vl);
vuint16m2_t __riscv_vnmsac_vx_u16m2_tu(vuint16m2_t vd, uint16_t rs1,
                                       vuint16m2_t vs2, size_t vl);
vuint16m4_t __riscv_vnmsac_vv_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs1,
                                       vuint16m4_t vs2, size_t vl);
vuint16m4_t __riscv_vnmsac_vx_u16m4_tu(vuint16m4_t vd, uint16_t rs1,
                                       vuint16m4_t vs2, size_t vl);
vuint16m8_t __riscv_vnmsac_vv_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs1,
                                       vuint16m8_t vs2, size_t vl);
vuint16m8_t __riscv_vnmsac_vx_u16m8_tu(vuint16m8_t vd, uint16_t rs1,
                                       vuint16m8_t vs2, size_t vl);
vuint32mf2_t __riscv_vnmsac_vv_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs1,
                                         vuint32mf2_t vs2, size_t vl);
vuint32mf2_t __riscv_vnmsac_vx_u32mf2_tu(vuint32mf2_t vd, uint32_t rs1,
                                         vuint32mf2_t vs2, size_t vl);
vuint32m1_t __riscv_vnmsac_vv_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs1,
                                       vuint32m1_t vs2, size_t vl);
vuint32m1_t __riscv_vnmsac_vx_u32m1_tu(vuint32m1_t vd, uint32_t rs1,
                                       vuint32m1_t vs2, size_t vl);
vuint32m2_t __riscv_vnmsac_vv_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs1,
                                       vuint32m2_t vs2, size_t vl);
vuint32m2_t __riscv_vnmsac_vx_u32m2_tu(vuint32m2_t vd, uint32_t rs1,
                                       vuint32m2_t vs2, size_t vl);
vuint32m4_t __riscv_vnmsac_vv_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs1,
                                       vuint32m4_t vs2, size_t vl);
vuint32m4_t __riscv_vnmsac_vx_u32m4_tu(vuint32m4_t vd, uint32_t rs1,
                                       vuint32m4_t vs2, size_t vl);
vuint32m8_t __riscv_vnmsac_vv_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs1,
                                       vuint32m8_t vs2, size_t vl);
vuint32m8_t __riscv_vnmsac_vx_u32m8_tu(vuint32m8_t vd, uint32_t rs1,
                                       vuint32m8_t vs2, size_t vl);
vuint64m1_t __riscv_vnmsac_vv_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs1,
                                       vuint64m1_t vs2, size_t vl);
vuint64m1_t __riscv_vnmsac_vx_u64m1_tu(vuint64m1_t vd, uint64_t rs1,
                                       vuint64m1_t vs2, size_t vl);
vuint64m2_t __riscv_vnmsac_vv_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs1,
                                       vuint64m2_t vs2, size_t vl);
vuint64m2_t __riscv_vnmsac_vx_u64m2_tu(vuint64m2_t vd, uint64_t rs1,
                                       vuint64m2_t vs2, size_t vl);
vuint64m4_t __riscv_vnmsac_vv_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs1,
                                       vuint64m4_t vs2, size_t vl);
vuint64m4_t __riscv_vnmsac_vx_u64m4_tu(vuint64m4_t vd, uint64_t rs1,
                                       vuint64m4_t vs2, size_t vl);
vuint64m8_t __riscv_vnmsac_vv_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs1,
                                       vuint64m8_t vs2, size_t vl);
vuint64m8_t __riscv_vnmsac_vx_u64m8_tu(vuint64m8_t vd, uint64_t rs1,
                                       vuint64m8_t vs2, size_t vl);
vuint8mf8_t __riscv_vmadd_vv_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs1,
                                      vuint8mf8_t vs2, size_t vl);
vuint8mf8_t __riscv_vmadd_vx_u8mf8_tu(vuint8mf8_t vd, uint8_t rs1,
                                      vuint8mf8_t vs2, size_t vl);
vuint8mf4_t __riscv_vmadd_vv_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs1,
                                      vuint8mf4_t vs2, size_t vl);
vuint8mf4_t __riscv_vmadd_vx_u8mf4_tu(vuint8mf4_t vd, uint8_t rs1,
                                      vuint8mf4_t vs2, size_t vl);
vuint8mf2_t __riscv_vmadd_vv_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs1,
                                      vuint8mf2_t vs2, size_t vl);
vuint8mf2_t __riscv_vmadd_vx_u8mf2_tu(vuint8mf2_t vd, uint8_t rs1,
                                      vuint8mf2_t vs2, size_t vl);
vuint8m1_t __riscv_vmadd_vv_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs1,
                                    vuint8m1_t vs2, size_t vl);
vuint8m1_t __riscv_vmadd_vx_u8m1_tu(vuint8m1_t vd, uint8_t rs1, vuint8m1_t vs2,
                                    size_t vl);
vuint8m2_t __riscv_vmadd_vv_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs1,
                                    vuint8m2_t vs2, size_t vl);
vuint8m2_t __riscv_vmadd_vx_u8m2_tu(vuint8m2_t vd, uint8_t rs1, vuint8m2_t vs2,
                                    size_t vl);
vuint8m4_t __riscv_vmadd_vv_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs1,
                                    vuint8m4_t vs2, size_t vl);
vuint8m4_t __riscv_vmadd_vx_u8m4_tu(vuint8m4_t vd, uint8_t rs1, vuint8m4_t vs2,
                                    size_t vl);
vuint8m8_t __riscv_vmadd_vv_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs1,
                                    vuint8m8_t vs2, size_t vl);
vuint8m8_t __riscv_vmadd_vx_u8m8_tu(vuint8m8_t vd, uint8_t rs1, vuint8m8_t vs2,
                                    size_t vl);
vuint16mf4_t __riscv_vmadd_vv_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs1,
                                        vuint16mf4_t vs2, size_t vl);
vuint16mf4_t __riscv_vmadd_vx_u16mf4_tu(vuint16mf4_t vd, uint16_t rs1,
                                        vuint16mf4_t vs2, size_t vl);
vuint16mf2_t __riscv_vmadd_vv_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs1,
                                        vuint16mf2_t vs2, size_t vl);
vuint16mf2_t __riscv_vmadd_vx_u16mf2_tu(vuint16mf2_t vd, uint16_t rs1,
                                        vuint16mf2_t vs2, size_t vl);
vuint16m1_t __riscv_vmadd_vv_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs1,
                                      vuint16m1_t vs2, size_t vl);
vuint16m1_t __riscv_vmadd_vx_u16m1_tu(vuint16m1_t vd, uint16_t rs1,
                                      vuint16m1_t vs2, size_t vl);
vuint16m2_t __riscv_vmadd_vv_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs1,
                                      vuint16m2_t vs2, size_t vl);
vuint16m2_t __riscv_vmadd_vx_u16m2_tu(vuint16m2_t vd, uint16_t rs1,
                                      vuint16m2_t vs2, size_t vl);
vuint16m4_t __riscv_vmadd_vv_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs1,
                                      vuint16m4_t vs2, size_t vl);
vuint16m4_t __riscv_vmadd_vx_u16m4_tu(vuint16m4_t vd, uint16_t rs1,
                                      vuint16m4_t vs2, size_t vl);
vuint16m8_t __riscv_vmadd_vv_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs1,
                                      vuint16m8_t vs2, size_t vl);
vuint16m8_t __riscv_vmadd_vx_u16m8_tu(vuint16m8_t vd, uint16_t rs1,
                                      vuint16m8_t vs2, size_t vl);
vuint32mf2_t __riscv_vmadd_vv_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs1,
                                        vuint32mf2_t vs2, size_t vl);
vuint32mf2_t __riscv_vmadd_vx_u32mf2_tu(vuint32mf2_t vd, uint32_t rs1,
                                        vuint32mf2_t vs2, size_t vl);
vuint32m1_t __riscv_vmadd_vv_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs1,
                                      vuint32m1_t vs2, size_t vl);
vuint32m1_t __riscv_vmadd_vx_u32m1_tu(vuint32m1_t vd, uint32_t rs1,
                                      vuint32m1_t vs2, size_t vl);
vuint32m2_t __riscv_vmadd_vv_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs1,
                                      vuint32m2_t vs2, size_t vl);
vuint32m2_t __riscv_vmadd_vx_u32m2_tu(vuint32m2_t vd, uint32_t rs1,
                                      vuint32m2_t vs2, size_t vl);
vuint32m4_t __riscv_vmadd_vv_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs1,
                                      vuint32m4_t vs2, size_t vl);
vuint32m4_t __riscv_vmadd_vx_u32m4_tu(vuint32m4_t vd, uint32_t rs1,
                                      vuint32m4_t vs2, size_t vl);
vuint32m8_t __riscv_vmadd_vv_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs1,
                                      vuint32m8_t vs2, size_t vl);
vuint32m8_t __riscv_vmadd_vx_u32m8_tu(vuint32m8_t vd, uint32_t rs1,
                                      vuint32m8_t vs2, size_t vl);
vuint64m1_t __riscv_vmadd_vv_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs1,
                                      vuint64m1_t vs2, size_t vl);
vuint64m1_t __riscv_vmadd_vx_u64m1_tu(vuint64m1_t vd, uint64_t rs1,
                                      vuint64m1_t vs2, size_t vl);
vuint64m2_t __riscv_vmadd_vv_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs1,
                                      vuint64m2_t vs2, size_t vl);
vuint64m2_t __riscv_vmadd_vx_u64m2_tu(vuint64m2_t vd, uint64_t rs1,
                                      vuint64m2_t vs2, size_t vl);
vuint64m4_t __riscv_vmadd_vv_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs1,
                                      vuint64m4_t vs2, size_t vl);
vuint64m4_t __riscv_vmadd_vx_u64m4_tu(vuint64m4_t vd, uint64_t rs1,
                                      vuint64m4_t vs2, size_t vl);
vuint64m8_t __riscv_vmadd_vv_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs1,
                                      vuint64m8_t vs2, size_t vl);
vuint64m8_t __riscv_vmadd_vx_u64m8_tu(vuint64m8_t vd, uint64_t rs1,
                                      vuint64m8_t vs2, size_t vl);
vuint8mf8_t __riscv_vnmsub_vv_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs1,
                                       vuint8mf8_t vs2, size_t vl);
vuint8mf8_t __riscv_vnmsub_vx_u8mf8_tu(vuint8mf8_t vd, uint8_t rs1,
                                       vuint8mf8_t vs2, size_t vl);
vuint8mf4_t __riscv_vnmsub_vv_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs1,
                                       vuint8mf4_t vs2, size_t vl);
vuint8mf4_t __riscv_vnmsub_vx_u8mf4_tu(vuint8mf4_t vd, uint8_t rs1,
                                       vuint8mf4_t vs2, size_t vl);
vuint8mf2_t __riscv_vnmsub_vv_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs1,
                                       vuint8mf2_t vs2, size_t vl);
vuint8mf2_t __riscv_vnmsub_vx_u8mf2_tu(vuint8mf2_t vd, uint8_t rs1,
                                       vuint8mf2_t vs2, size_t vl);
vuint8m1_t __riscv_vnmsub_vv_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs1,
                                     vuint8m1_t vs2, size_t vl);
vuint8m1_t __riscv_vnmsub_vx_u8m1_tu(vuint8m1_t vd, uint8_t rs1, vuint8m1_t vs2,
                                     size_t vl);
vuint8m2_t __riscv_vnmsub_vv_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs1,
                                     vuint8m2_t vs2, size_t vl);
vuint8m2_t __riscv_vnmsub_vx_u8m2_tu(vuint8m2_t vd, uint8_t rs1, vuint8m2_t vs2,
                                     size_t vl);
vuint8m4_t __riscv_vnmsub_vv_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs1,
                                     vuint8m4_t vs2, size_t vl);
vuint8m4_t __riscv_vnmsub_vx_u8m4_tu(vuint8m4_t vd, uint8_t rs1, vuint8m4_t vs2,
                                     size_t vl);
vuint8m8_t __riscv_vnmsub_vv_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs1,
                                     vuint8m8_t vs2, size_t vl);
vuint8m8_t __riscv_vnmsub_vx_u8m8_tu(vuint8m8_t vd, uint8_t rs1, vuint8m8_t vs2,
                                     size_t vl);
vuint16mf4_t __riscv_vnmsub_vv_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs1,
                                         vuint16mf4_t vs2, size_t vl);
vuint16mf4_t __riscv_vnmsub_vx_u16mf4_tu(vuint16mf4_t vd, uint16_t rs1,
                                         vuint16mf4_t vs2, size_t vl);
vuint16mf2_t __riscv_vnmsub_vv_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs1,
                                         vuint16mf2_t vs2, size_t vl);
vuint16mf2_t __riscv_vnmsub_vx_u16mf2_tu(vuint16mf2_t vd, uint16_t rs1,
                                         vuint16mf2_t vs2, size_t vl);
vuint16m1_t __riscv_vnmsub_vv_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs1,
                                       vuint16m1_t vs2, size_t vl);
vuint16m1_t __riscv_vnmsub_vx_u16m1_tu(vuint16m1_t vd, uint16_t rs1,
                                       vuint16m1_t vs2, size_t vl);
vuint16m2_t __riscv_vnmsub_vv_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs1,
                                       vuint16m2_t vs2, size_t vl);
vuint16m2_t __riscv_vnmsub_vx_u16m2_tu(vuint16m2_t vd, uint16_t rs1,
                                       vuint16m2_t vs2, size_t vl);
vuint16m4_t __riscv_vnmsub_vv_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs1,
                                       vuint16m4_t vs2, size_t vl);
vuint16m4_t __riscv_vnmsub_vx_u16m4_tu(vuint16m4_t vd, uint16_t rs1,
                                       vuint16m4_t vs2, size_t vl);
vuint16m8_t __riscv_vnmsub_vv_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs1,
                                       vuint16m8_t vs2, size_t vl);
vuint16m8_t __riscv_vnmsub_vx_u16m8_tu(vuint16m8_t vd, uint16_t rs1,
                                       vuint16m8_t vs2, size_t vl);
vuint32mf2_t __riscv_vnmsub_vv_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs1,
                                         vuint32mf2_t vs2, size_t vl);
vuint32mf2_t __riscv_vnmsub_vx_u32mf2_tu(vuint32mf2_t vd, uint32_t rs1,
                                         vuint32mf2_t vs2, size_t vl);
vuint32m1_t __riscv_vnmsub_vv_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs1,
                                       vuint32m1_t vs2, size_t vl);
vuint32m1_t __riscv_vnmsub_vx_u32m1_tu(vuint32m1_t vd, uint32_t rs1,
                                       vuint32m1_t vs2, size_t vl);
vuint32m2_t __riscv_vnmsub_vv_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs1,
                                       vuint32m2_t vs2, size_t vl);
vuint32m2_t __riscv_vnmsub_vx_u32m2_tu(vuint32m2_t vd, uint32_t rs1,
                                       vuint32m2_t vs2, size_t vl);
vuint32m4_t __riscv_vnmsub_vv_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs1,
                                       vuint32m4_t vs2, size_t vl);
vuint32m4_t __riscv_vnmsub_vx_u32m4_tu(vuint32m4_t vd, uint32_t rs1,
                                       vuint32m4_t vs2, size_t vl);
vuint32m8_t __riscv_vnmsub_vv_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs1,
                                       vuint32m8_t vs2, size_t vl);
vuint32m8_t __riscv_vnmsub_vx_u32m8_tu(vuint32m8_t vd, uint32_t rs1,
                                       vuint32m8_t vs2, size_t vl);
vuint64m1_t __riscv_vnmsub_vv_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs1,
                                       vuint64m1_t vs2, size_t vl);
vuint64m1_t __riscv_vnmsub_vx_u64m1_tu(vuint64m1_t vd, uint64_t rs1,
                                       vuint64m1_t vs2, size_t vl);
vuint64m2_t __riscv_vnmsub_vv_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs1,
                                       vuint64m2_t vs2, size_t vl);
vuint64m2_t __riscv_vnmsub_vx_u64m2_tu(vuint64m2_t vd, uint64_t rs1,
                                       vuint64m2_t vs2, size_t vl);
vuint64m4_t __riscv_vnmsub_vv_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs1,
                                       vuint64m4_t vs2, size_t vl);
vuint64m4_t __riscv_vnmsub_vx_u64m4_tu(vuint64m4_t vd, uint64_t rs1,
                                       vuint64m4_t vs2, size_t vl);
vuint64m8_t __riscv_vnmsub_vv_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs1,
                                       vuint64m8_t vs2, size_t vl);
vuint64m8_t __riscv_vnmsub_vx_u64m8_tu(vuint64m8_t vd, uint64_t rs1,
                                       vuint64m8_t vs2, size_t vl);
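
For reference, the element-wise operations performed by the four single-width multiply-add intrinsics listed above are: vmacc computes vd[i] = (vs1[i] * vs2[i]) + vd[i], vnmsac computes vd[i] = -(vs1[i] * vs2[i]) + vd[i], vmadd computes vd[i] = (vs1[i] * vd[i]) + vs2[i], and vnmsub computes vd[i] = -(vs1[i] * vd[i]) + vs2[i]. The sketch below is a minimal, illustrative use of one _tu variant in a strip-mined dot product; the helper name dot_i32 and the surrounding loads, reduction, and loop structure are assumptions for illustration only and are not part of this listing. The tail-undisturbed policy keeps elements of the accumulator past vl intact on the final, shorter iteration.

#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

// Illustrative sketch (not part of the intrinsic listing): sum of element-wise
// products, keeping a vector accumulator live across iterations. The _tu policy
// matters on the last, shorter iteration: tail elements of vacc, which still
// hold partial sums from earlier iterations, must stay undisturbed.
static int32_t dot_i32(const int32_t *a, const int32_t *b, size_t n) {
  size_t vlmax = __riscv_vsetvlmax_e32m1();
  vint32m1_t vacc = __riscv_vmv_v_x_i32m1(0, vlmax);      // zero the accumulator
  while (n > 0) {
    size_t vl = __riscv_vsetvl_e32m1(n);                  // elements this iteration
    vint32m1_t vs1 = __riscv_vle32_v_i32m1(a, vl);
    vint32m1_t vs2 = __riscv_vle32_v_i32m1(b, vl);
    // vacc[i] = vs1[i] * vs2[i] + vacc[i]; elements past vl are left undisturbed
    vacc = __riscv_vmacc_vv_i32m1_tu(vacc, vs1, vs2, vl);
    a += vl; b += vl; n -= vl;
  }
  vint32m1_t vzero = __riscv_vmv_v_x_i32m1(0, vlmax);
  vint32m1_t vsum = __riscv_vredsum_vs_i32m1_i32m1(vacc, vzero, vlmax);
  return __riscv_vmv_x_s_i32m1_i32(vsum);                 // scalar total
}

The masked _tum variants that follow take an additional mask operand vm ahead of vd and perform the same element-wise operation only for the active (unmasked) elements.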
// masked functions
vint8mf8_t __riscv_vmacc_vv_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                      vint8mf8_t vs1, vint8mf8_t vs2,
                                      size_t vl);
vint8mf8_t __riscv_vmacc_vx_i8mf8_tum(vbool64_t vm, vint8mf8_t vd, int8_t rs1,
                                      vint8mf8_t vs2, size_t vl);
vint8mf4_t __riscv_vmacc_vv_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                      vint8mf4_t vs1, vint8mf4_t vs2,
                                      size_t vl);
vint8mf4_t __riscv_vmacc_vx_i8mf4_tum(vbool32_t vm, vint8mf4_t vd, int8_t rs1,
                                      vint8mf4_t vs2, size_t vl);
vint8mf2_t __riscv_vmacc_vv_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                      vint8mf2_t vs1, vint8mf2_t vs2,
                                      size_t vl);
vint8mf2_t __riscv_vmacc_vx_i8mf2_tum(vbool16_t vm, vint8mf2_t vd, int8_t rs1,
                                      vint8mf2_t vs2, size_t vl);
vint8m1_t __riscv_vmacc_vv_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs1,
                                    vint8m1_t vs2, size_t vl);
vint8m1_t __riscv_vmacc_vx_i8m1_tum(vbool8_t vm, vint8m1_t vd, int8_t rs1,
                                    vint8m1_t vs2, size_t vl);
vint8m2_t __riscv_vmacc_vv_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs1,
                                    vint8m2_t vs2, size_t vl);
vint8m2_t __riscv_vmacc_vx_i8m2_tum(vbool4_t vm, vint8m2_t vd, int8_t rs1,
                                    vint8m2_t vs2, size_t vl);
vint8m4_t __riscv_vmacc_vv_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs1,
                                    vint8m4_t vs2, size_t vl);
vint8m4_t __riscv_vmacc_vx_i8m4_tum(vbool2_t vm, vint8m4_t vd, int8_t rs1,
                                    vint8m4_t vs2, size_t vl);
vint8m8_t __riscv_vmacc_vv_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs1,
                                    vint8m8_t vs2, size_t vl);
vint8m8_t __riscv_vmacc_vx_i8m8_tum(vbool1_t vm, vint8m8_t vd, int8_t rs1,
                                    vint8m8_t vs2, size_t vl);
vint16mf4_t __riscv_vmacc_vv_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs1, vint16mf4_t vs2,
                                        size_t vl);
vint16mf4_t __riscv_vmacc_vx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                        int16_t rs1, vint16mf4_t vs2,
                                        size_t vl);
vint16mf2_t __riscv_vmacc_vv_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs1, vint16mf2_t vs2,
                                        size_t vl);
vint16mf2_t __riscv_vmacc_vx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                        int16_t rs1, vint16mf2_t vs2,
                                        size_t vl);
vint16m1_t __riscv_vmacc_vv_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs1, vint16m1_t vs2,
                                      size_t vl);
vint16m1_t __riscv_vmacc_vx_i16m1_tum(vbool16_t vm, vint16m1_t vd, int16_t rs1,
                                      vint16m1_t vs2, size_t vl);
vint16m2_t __riscv_vmacc_vv_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs1, vint16m2_t vs2,
                                      size_t vl);
vint16m2_t __riscv_vmacc_vx_i16m2_tum(vbool8_t vm, vint16m2_t vd, int16_t rs1,
                                      vint16m2_t vs2, size_t vl);
vint16m4_t __riscv_vmacc_vv_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs1, vint16m4_t vs2,
                                      size_t vl);
vint16m4_t __riscv_vmacc_vx_i16m4_tum(vbool4_t vm, vint16m4_t vd, int16_t rs1,
                                      vint16m4_t vs2, size_t vl);
vint16m8_t __riscv_vmacc_vv_i16m8_tum(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs1, vint16m8_t vs2,
                                      size_t vl);
vint16m8_t __riscv_vmacc_vx_i16m8_tum(vbool2_t vm, vint16m8_t vd, int16_t rs1,
                                      vint16m8_t vs2, size_t vl);
vint32mf2_t __riscv_vmacc_vv_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs1, vint32mf2_t vs2,
                                        size_t vl);
vint32mf2_t __riscv_vmacc_vx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                        int32_t rs1, vint32mf2_t vs2,
                                        size_t vl);
vint32m1_t __riscv_vmacc_vv_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs1, vint32m1_t vs2,
                                      size_t vl);
vint32m1_t __riscv_vmacc_vx_i32m1_tum(vbool32_t vm, vint32m1_t vd, int32_t rs1,
                                      vint32m1_t vs2, size_t vl);
vint32m2_t __riscv_vmacc_vv_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs1, vint32m2_t vs2,
                                      size_t vl);
vint32m2_t __riscv_vmacc_vx_i32m2_tum(vbool16_t vm, vint32m2_t vd, int32_t rs1,
                                      vint32m2_t vs2, size_t vl);
vint32m4_t __riscv_vmacc_vv_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs1, vint32m4_t vs2,
                                      size_t vl);
vint32m4_t __riscv_vmacc_vx_i32m4_tum(vbool8_t vm, vint32m4_t vd, int32_t rs1,
                                      vint32m4_t vs2, size_t vl);
vint32m8_t __riscv_vmacc_vv_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs1, vint32m8_t vs2,
                                      size_t vl);
vint32m8_t __riscv_vmacc_vx_i32m8_tum(vbool4_t vm, vint32m8_t vd, int32_t rs1,
                                      vint32m8_t vs2, size_t vl);
vint64m1_t __riscv_vmacc_vv_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs1, vint64m1_t vs2,
                                      size_t vl);
vint64m1_t __riscv_vmacc_vx_i64m1_tum(vbool64_t vm, vint64m1_t vd, int64_t rs1,
                                      vint64m1_t vs2, size_t vl);
vint64m2_t __riscv_vmacc_vv_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs1, vint64m2_t vs2,
                                      size_t vl);
vint64m2_t __riscv_vmacc_vx_i64m2_tum(vbool32_t vm, vint64m2_t vd, int64_t rs1,
                                      vint64m2_t vs2, size_t vl);
vint64m4_t __riscv_vmacc_vv_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs1, vint64m4_t vs2,
                                      size_t vl);
vint64m4_t __riscv_vmacc_vx_i64m4_tum(vbool16_t vm, vint64m4_t vd, int64_t rs1,
                                      vint64m4_t vs2, size_t vl);
vint64m8_t __riscv_vmacc_vv_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs1, vint64m8_t vs2,
                                      size_t vl);
vint64m8_t __riscv_vmacc_vx_i64m8_tum(vbool8_t vm, vint64m8_t vd, int64_t rs1,
                                      vint64m8_t vs2, size_t vl);
vint8mf8_t __riscv_vnmsac_vv_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                       vint8mf8_t vs1, vint8mf8_t vs2,
                                       size_t vl);
vint8mf8_t __riscv_vnmsac_vx_i8mf8_tum(vbool64_t vm, vint8mf8_t vd, int8_t rs1,
                                       vint8mf8_t vs2, size_t vl);
vint8mf4_t __riscv_vnmsac_vv_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                       vint8mf4_t vs1, vint8mf4_t vs2,
                                       size_t vl);
vint8mf4_t __riscv_vnmsac_vx_i8mf4_tum(vbool32_t vm, vint8mf4_t vd, int8_t rs1,
                                       vint8mf4_t vs2, size_t vl);
vint8mf2_t __riscv_vnmsac_vv_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                       vint8mf2_t vs1, vint8mf2_t vs2,
                                       size_t vl);
vint8mf2_t __riscv_vnmsac_vx_i8mf2_tum(vbool16_t vm, vint8mf2_t vd, int8_t rs1,
                                       vint8mf2_t vs2, size_t vl);
vint8m1_t __riscv_vnmsac_vv_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs1,
                                     vint8m1_t vs2, size_t vl);
vint8m1_t __riscv_vnmsac_vx_i8m1_tum(vbool8_t vm, vint8m1_t vd, int8_t rs1,
                                     vint8m1_t vs2, size_t vl);
vint8m2_t __riscv_vnmsac_vv_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs1,
                                     vint8m2_t vs2, size_t vl);
vint8m2_t __riscv_vnmsac_vx_i8m2_tum(vbool4_t vm, vint8m2_t vd, int8_t rs1,
                                     vint8m2_t vs2, size_t vl);
vint8m4_t __riscv_vnmsac_vv_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs1,
                                     vint8m4_t vs2, size_t vl);
vint8m4_t __riscv_vnmsac_vx_i8m4_tum(vbool2_t vm, vint8m4_t vd, int8_t rs1,
                                     vint8m4_t vs2, size_t vl);
vint8m8_t __riscv_vnmsac_vv_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs1,
                                     vint8m8_t vs2, size_t vl);
vint8m8_t __riscv_vnmsac_vx_i8m8_tum(vbool1_t vm, vint8m8_t vd, int8_t rs1,
                                     vint8m8_t vs2, size_t vl);
vint16mf4_t __riscv_vnmsac_vv_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                         vint16mf4_t vs1, vint16mf4_t vs2,
                                         size_t vl);
vint16mf4_t __riscv_vnmsac_vx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                         int16_t rs1, vint16mf4_t vs2,
                                         size_t vl);
vint16mf2_t __riscv_vnmsac_vv_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                         vint16mf2_t vs1, vint16mf2_t vs2,
                                         size_t vl);
vint16mf2_t __riscv_vnmsac_vx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                         int16_t rs1, vint16mf2_t vs2,
                                         size_t vl);
vint16m1_t __riscv_vnmsac_vv_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                       vint16m1_t vs1, vint16m1_t vs2,
                                       size_t vl);
vint16m1_t __riscv_vnmsac_vx_i16m1_tum(vbool16_t vm, vint16m1_t vd, int16_t rs1,
                                       vint16m1_t vs2, size_t vl);
vint16m2_t __riscv_vnmsac_vv_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                       vint16m2_t vs1, vint16m2_t vs2,
                                       size_t vl);
vint16m2_t __riscv_vnmsac_vx_i16m2_tum(vbool8_t vm, vint16m2_t vd, int16_t rs1,
                                       vint16m2_t vs2, size_t vl);
vint16m4_t __riscv_vnmsac_vv_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                       vint16m4_t vs1, vint16m4_t vs2,
                                       size_t vl);
vint16m4_t __riscv_vnmsac_vx_i16m4_tum(vbool4_t vm, vint16m4_t vd, int16_t rs1,
                                       vint16m4_t vs2, size_t vl);
vint16m8_t __riscv_vnmsac_vv_i16m8_tum(vbool2_t vm, vint16m8_t vd,
                                       vint16m8_t vs1, vint16m8_t vs2,
                                       size_t vl);
vint16m8_t __riscv_vnmsac_vx_i16m8_tum(vbool2_t vm, vint16m8_t vd, int16_t rs1,
                                       vint16m8_t vs2, size_t vl);
vint32mf2_t __riscv_vnmsac_vv_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                         vint32mf2_t vs1, vint32mf2_t vs2,
                                         size_t vl);
vint32mf2_t __riscv_vnmsac_vx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                         int32_t rs1, vint32mf2_t vs2,
                                         size_t vl);
vint32m1_t __riscv_vnmsac_vv_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                       vint32m1_t vs1, vint32m1_t vs2,
                                       size_t vl);
vint32m1_t __riscv_vnmsac_vx_i32m1_tum(vbool32_t vm, vint32m1_t vd, int32_t rs1,
                                       vint32m1_t vs2, size_t vl);
vint32m2_t __riscv_vnmsac_vv_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                       vint32m2_t vs1, vint32m2_t vs2,
                                       size_t vl);
vint32m2_t __riscv_vnmsac_vx_i32m2_tum(vbool16_t vm, vint32m2_t vd, int32_t rs1,
                                       vint32m2_t vs2, size_t vl);
vint32m4_t __riscv_vnmsac_vv_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                       vint32m4_t vs1, vint32m4_t vs2,
                                       size_t vl);
vint32m4_t __riscv_vnmsac_vx_i32m4_tum(vbool8_t vm, vint32m4_t vd, int32_t rs1,
                                       vint32m4_t vs2, size_t vl);
vint32m8_t __riscv_vnmsac_vv_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                       vint32m8_t vs1, vint32m8_t vs2,
                                       size_t vl);
vint32m8_t __riscv_vnmsac_vx_i32m8_tum(vbool4_t vm, vint32m8_t vd, int32_t rs1,
                                       vint32m8_t vs2, size_t vl);
vint64m1_t __riscv_vnmsac_vv_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                       vint64m1_t vs1, vint64m1_t vs2,
                                       size_t vl);
vint64m1_t __riscv_vnmsac_vx_i64m1_tum(vbool64_t vm, vint64m1_t vd, int64_t rs1,
                                       vint64m1_t vs2, size_t vl);
vint64m2_t __riscv_vnmsac_vv_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                       vint64m2_t vs1, vint64m2_t vs2,
                                       size_t vl);
vint64m2_t __riscv_vnmsac_vx_i64m2_tum(vbool32_t vm, vint64m2_t vd, int64_t rs1,
                                       vint64m2_t vs2, size_t vl);
vint64m4_t __riscv_vnmsac_vv_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                       vint64m4_t vs1, vint64m4_t vs2,
                                       size_t vl);
vint64m4_t __riscv_vnmsac_vx_i64m4_tum(vbool16_t vm, vint64m4_t vd, int64_t rs1,
                                       vint64m4_t vs2, size_t vl);
vint64m8_t __riscv_vnmsac_vv_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                       vint64m8_t vs1, vint64m8_t vs2,
                                       size_t vl);
vint64m8_t __riscv_vnmsac_vx_i64m8_tum(vbool8_t vm, vint64m8_t vd, int64_t rs1,
                                       vint64m8_t vs2, size_t vl);
vint8mf8_t __riscv_vmadd_vv_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                      vint8mf8_t vs1, vint8mf8_t vs2,
                                      size_t vl);
vint8mf8_t __riscv_vmadd_vx_i8mf8_tum(vbool64_t vm, vint8mf8_t vd, int8_t rs1,
                                      vint8mf8_t vs2, size_t vl);
vint8mf4_t __riscv_vmadd_vv_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                      vint8mf4_t vs1, vint8mf4_t vs2,
                                      size_t vl);
vint8mf4_t __riscv_vmadd_vx_i8mf4_tum(vbool32_t vm, vint8mf4_t vd, int8_t rs1,
                                      vint8mf4_t vs2, size_t vl);
vint8mf2_t __riscv_vmadd_vv_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                      vint8mf2_t vs1, vint8mf2_t vs2,
                                      size_t vl);
vint8mf2_t __riscv_vmadd_vx_i8mf2_tum(vbool16_t vm, vint8mf2_t vd, int8_t rs1,
                                      vint8mf2_t vs2, size_t vl);
vint8m1_t __riscv_vmadd_vv_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs1,
                                    vint8m1_t vs2, size_t vl);
vint8m1_t __riscv_vmadd_vx_i8m1_tum(vbool8_t vm, vint8m1_t vd, int8_t rs1,
                                    vint8m1_t vs2, size_t vl);
vint8m2_t __riscv_vmadd_vv_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs1,
                                    vint8m2_t vs2, size_t vl);
vint8m2_t __riscv_vmadd_vx_i8m2_tum(vbool4_t vm, vint8m2_t vd, int8_t rs1,
                                    vint8m2_t vs2, size_t vl);
vint8m4_t __riscv_vmadd_vv_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs1,
                                    vint8m4_t vs2, size_t vl);
vint8m4_t __riscv_vmadd_vx_i8m4_tum(vbool2_t vm, vint8m4_t vd, int8_t rs1,
                                    vint8m4_t vs2, size_t vl);
vint8m8_t __riscv_vmadd_vv_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs1,
                                    vint8m8_t vs2, size_t vl);
vint8m8_t __riscv_vmadd_vx_i8m8_tum(vbool1_t vm, vint8m8_t vd, int8_t rs1,
                                    vint8m8_t vs2, size_t vl);
vint16mf4_t __riscv_vmadd_vv_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs1, vint16mf4_t vs2,
                                        size_t vl);
vint16mf4_t __riscv_vmadd_vx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                        int16_t rs1, vint16mf4_t vs2,
                                        size_t vl);
vint16mf2_t __riscv_vmadd_vv_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs1, vint16mf2_t vs2,
                                        size_t vl);
vint16mf2_t __riscv_vmadd_vx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                        int16_t rs1, vint16mf2_t vs2,
                                        size_t vl);
vint16m1_t __riscv_vmadd_vv_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs1, vint16m1_t vs2,
                                      size_t vl);
vint16m1_t __riscv_vmadd_vx_i16m1_tum(vbool16_t vm, vint16m1_t vd, int16_t rs1,
                                      vint16m1_t vs2, size_t vl);
vint16m2_t __riscv_vmadd_vv_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs1, vint16m2_t vs2,
                                      size_t vl);
vint16m2_t __riscv_vmadd_vx_i16m2_tum(vbool8_t vm, vint16m2_t vd, int16_t rs1,
                                      vint16m2_t vs2, size_t vl);
vint16m4_t __riscv_vmadd_vv_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs1, vint16m4_t vs2,
                                      size_t vl);
vint16m4_t __riscv_vmadd_vx_i16m4_tum(vbool4_t vm, vint16m4_t vd, int16_t rs1,
                                      vint16m4_t vs2, size_t vl);
vint16m8_t __riscv_vmadd_vv_i16m8_tum(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs1, vint16m8_t vs2,
                                      size_t vl);
vint16m8_t __riscv_vmadd_vx_i16m8_tum(vbool2_t vm, vint16m8_t vd, int16_t rs1,
                                      vint16m8_t vs2, size_t vl);
vint32mf2_t __riscv_vmadd_vv_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs1, vint32mf2_t vs2,
                                        size_t vl);
vint32mf2_t __riscv_vmadd_vx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                        int32_t rs1, vint32mf2_t vs2,
                                        size_t vl);
vint32m1_t __riscv_vmadd_vv_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs1, vint32m1_t vs2,
                                      size_t vl);
vint32m1_t __riscv_vmadd_vx_i32m1_tum(vbool32_t vm, vint32m1_t vd, int32_t rs1,
                                      vint32m1_t vs2, size_t vl);
vint32m2_t __riscv_vmadd_vv_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs1, vint32m2_t vs2,
                                      size_t vl);
vint32m2_t __riscv_vmadd_vx_i32m2_tum(vbool16_t vm, vint32m2_t vd, int32_t rs1,
                                      vint32m2_t vs2, size_t vl);
vint32m4_t __riscv_vmadd_vv_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs1, vint32m4_t vs2,
                                      size_t vl);
vint32m4_t __riscv_vmadd_vx_i32m4_tum(vbool8_t vm, vint32m4_t vd, int32_t rs1,
                                      vint32m4_t vs2, size_t vl);
vint32m8_t __riscv_vmadd_vv_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs1, vint32m8_t vs2,
                                      size_t vl);
vint32m8_t __riscv_vmadd_vx_i32m8_tum(vbool4_t vm, vint32m8_t vd, int32_t rs1,
                                      vint32m8_t vs2, size_t vl);
vint64m1_t __riscv_vmadd_vv_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs1, vint64m1_t vs2,
                                      size_t vl);
vint64m1_t __riscv_vmadd_vx_i64m1_tum(vbool64_t vm, vint64m1_t vd, int64_t rs1,
                                      vint64m1_t vs2, size_t vl);
vint64m2_t __riscv_vmadd_vv_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs1, vint64m2_t vs2,
                                      size_t vl);
vint64m2_t __riscv_vmadd_vx_i64m2_tum(vbool32_t vm, vint64m2_t vd, int64_t rs1,
                                      vint64m2_t vs2, size_t vl);
vint64m4_t __riscv_vmadd_vv_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs1, vint64m4_t vs2,
                                      size_t vl);
vint64m4_t __riscv_vmadd_vx_i64m4_tum(vbool16_t vm, vint64m4_t vd, int64_t rs1,
                                      vint64m4_t vs2, size_t vl);
vint64m8_t __riscv_vmadd_vv_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs1, vint64m8_t vs2,
                                      size_t vl);
vint64m8_t __riscv_vmadd_vx_i64m8_tum(vbool8_t vm, vint64m8_t vd, int64_t rs1,
                                      vint64m8_t vs2, size_t vl);
vint8mf8_t __riscv_vnmsub_vv_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                       vint8mf8_t vs1, vint8mf8_t vs2,
                                       size_t vl);
vint8mf8_t __riscv_vnmsub_vx_i8mf8_tum(vbool64_t vm, vint8mf8_t vd, int8_t rs1,
                                       vint8mf8_t vs2, size_t vl);
vint8mf4_t __riscv_vnmsub_vv_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                       vint8mf4_t vs1, vint8mf4_t vs2,
                                       size_t vl);
vint8mf4_t __riscv_vnmsub_vx_i8mf4_tum(vbool32_t vm, vint8mf4_t vd, int8_t rs1,
                                       vint8mf4_t vs2, size_t vl);
vint8mf2_t __riscv_vnmsub_vv_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                       vint8mf2_t vs1, vint8mf2_t vs2,
                                       size_t vl);
vint8mf2_t __riscv_vnmsub_vx_i8mf2_tum(vbool16_t vm, vint8mf2_t vd, int8_t rs1,
                                       vint8mf2_t vs2, size_t vl);
vint8m1_t __riscv_vnmsub_vv_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs1,
                                     vint8m1_t vs2, size_t vl);
vint8m1_t __riscv_vnmsub_vx_i8m1_tum(vbool8_t vm, vint8m1_t vd, int8_t rs1,
                                     vint8m1_t vs2, size_t vl);
vint8m2_t __riscv_vnmsub_vv_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs1,
                                     vint8m2_t vs2, size_t vl);
vint8m2_t __riscv_vnmsub_vx_i8m2_tum(vbool4_t vm, vint8m2_t vd, int8_t rs1,
                                     vint8m2_t vs2, size_t vl);
vint8m4_t __riscv_vnmsub_vv_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs1,
                                     vint8m4_t vs2, size_t vl);
vint8m4_t __riscv_vnmsub_vx_i8m4_tum(vbool2_t vm, vint8m4_t vd, int8_t rs1,
                                     vint8m4_t vs2, size_t vl);
vint8m8_t __riscv_vnmsub_vv_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs1,
                                     vint8m8_t vs2, size_t vl);
vint8m8_t __riscv_vnmsub_vx_i8m8_tum(vbool1_t vm, vint8m8_t vd, int8_t rs1,
                                     vint8m8_t vs2, size_t vl);
vint16mf4_t __riscv_vnmsub_vv_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                         vint16mf4_t vs1, vint16mf4_t vs2,
                                         size_t vl);
vint16mf4_t __riscv_vnmsub_vx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                         int16_t rs1, vint16mf4_t vs2,
                                         size_t vl);
vint16mf2_t __riscv_vnmsub_vv_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                         vint16mf2_t vs1, vint16mf2_t vs2,
                                         size_t vl);
vint16mf2_t __riscv_vnmsub_vx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                         int16_t rs1, vint16mf2_t vs2,
                                         size_t vl);
vint16m1_t __riscv_vnmsub_vv_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                       vint16m1_t vs1, vint16m1_t vs2,
                                       size_t vl);
vint16m1_t __riscv_vnmsub_vx_i16m1_tum(vbool16_t vm, vint16m1_t vd, int16_t rs1,
                                       vint16m1_t vs2, size_t vl);
vint16m2_t __riscv_vnmsub_vv_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                       vint16m2_t vs1, vint16m2_t vs2,
                                       size_t vl);
vint16m2_t __riscv_vnmsub_vx_i16m2_tum(vbool8_t vm, vint16m2_t vd, int16_t rs1,
                                       vint16m2_t vs2, size_t vl);
vint16m4_t __riscv_vnmsub_vv_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                       vint16m4_t vs1, vint16m4_t vs2,
                                       size_t vl);
vint16m4_t __riscv_vnmsub_vx_i16m4_tum(vbool4_t vm, vint16m4_t vd, int16_t rs1,
                                       vint16m4_t vs2, size_t vl);
vint16m8_t __riscv_vnmsub_vv_i16m8_tum(vbool2_t vm, vint16m8_t vd,
                                       vint16m8_t vs1, vint16m8_t vs2,
                                       size_t vl);
vint16m8_t __riscv_vnmsub_vx_i16m8_tum(vbool2_t vm, vint16m8_t vd, int16_t rs1,
                                       vint16m8_t vs2, size_t vl);
vint32mf2_t __riscv_vnmsub_vv_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                         vint32mf2_t vs1, vint32mf2_t vs2,
                                         size_t vl);
vint32mf2_t __riscv_vnmsub_vx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                         int32_t rs1, vint32mf2_t vs2,
                                         size_t vl);
vint32m1_t __riscv_vnmsub_vv_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                       vint32m1_t vs1, vint32m1_t vs2,
                                       size_t vl);
vint32m1_t __riscv_vnmsub_vx_i32m1_tum(vbool32_t vm, vint32m1_t vd, int32_t rs1,
                                       vint32m1_t vs2, size_t vl);
vint32m2_t __riscv_vnmsub_vv_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                       vint32m2_t vs1, vint32m2_t vs2,
                                       size_t vl);
vint32m2_t __riscv_vnmsub_vx_i32m2_tum(vbool16_t vm, vint32m2_t vd, int32_t rs1,
                                       vint32m2_t vs2, size_t vl);
vint32m4_t __riscv_vnmsub_vv_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                       vint32m4_t vs1, vint32m4_t vs2,
                                       size_t vl);
vint32m4_t __riscv_vnmsub_vx_i32m4_tum(vbool8_t vm, vint32m4_t vd, int32_t rs1,
                                       vint32m4_t vs2, size_t vl);
vint32m8_t __riscv_vnmsub_vv_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                       vint32m8_t vs1, vint32m8_t vs2,
                                       size_t vl);
vint32m8_t __riscv_vnmsub_vx_i32m8_tum(vbool4_t vm, vint32m8_t vd, int32_t rs1,
                                       vint32m8_t vs2, size_t vl);
vint64m1_t __riscv_vnmsub_vv_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                       vint64m1_t vs1, vint64m1_t vs2,
                                       size_t vl);
vint64m1_t __riscv_vnmsub_vx_i64m1_tum(vbool64_t vm, vint64m1_t vd, int64_t rs1,
                                       vint64m1_t vs2, size_t vl);
vint64m2_t __riscv_vnmsub_vv_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                       vint64m2_t vs1, vint64m2_t vs2,
                                       size_t vl);
vint64m2_t __riscv_vnmsub_vx_i64m2_tum(vbool32_t vm, vint64m2_t vd, int64_t rs1,
                                       vint64m2_t vs2, size_t vl);
vint64m4_t __riscv_vnmsub_vv_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                       vint64m4_t vs1, vint64m4_t vs2,
                                       size_t vl);
vint64m4_t __riscv_vnmsub_vx_i64m4_tum(vbool16_t vm, vint64m4_t vd, int64_t rs1,
                                       vint64m4_t vs2, size_t vl);
vint64m8_t __riscv_vnmsub_vv_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                       vint64m8_t vs1, vint64m8_t vs2,
                                       size_t vl);
vint64m8_t __riscv_vnmsub_vx_i64m8_tum(vbool8_t vm, vint64m8_t vd, int64_t rs1,
                                       vint64m8_t vs2, size_t vl);
vuint8mf8_t __riscv_vmacc_vv_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                       vuint8mf8_t vs1, vuint8mf8_t vs2,
                                       size_t vl);
vuint8mf8_t __riscv_vmacc_vx_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                       uint8_t rs1, vuint8mf8_t vs2, size_t vl);
vuint8mf4_t __riscv_vmacc_vv_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                       vuint8mf4_t vs1, vuint8mf4_t vs2,
                                       size_t vl);
vuint8mf4_t __riscv_vmacc_vx_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                       uint8_t rs1, vuint8mf4_t vs2, size_t vl);
vuint8mf2_t __riscv_vmacc_vv_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                       vuint8mf2_t vs1, vuint8mf2_t vs2,
                                       size_t vl);
vuint8mf2_t __riscv_vmacc_vx_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                       uint8_t rs1, vuint8mf2_t vs2, size_t vl);
vuint8m1_t __riscv_vmacc_vv_u8m1_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs1,
                                     vuint8m1_t vs2, size_t vl);
vuint8m1_t __riscv_vmacc_vx_u8m1_tum(vbool8_t vm, vuint8m1_t vd, uint8_t rs1,
                                     vuint8m1_t vs2, size_t vl);
vuint8m2_t __riscv_vmacc_vv_u8m2_tum(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs1,
                                     vuint8m2_t vs2, size_t vl);
vuint8m2_t __riscv_vmacc_vx_u8m2_tum(vbool4_t vm, vuint8m2_t vd, uint8_t rs1,
                                     vuint8m2_t vs2, size_t vl);
vuint8m4_t __riscv_vmacc_vv_u8m4_tum(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs1,
                                     vuint8m4_t vs2, size_t vl);
vuint8m4_t __riscv_vmacc_vx_u8m4_tum(vbool2_t vm, vuint8m4_t vd, uint8_t rs1,
                                     vuint8m4_t vs2, size_t vl);
vuint8m8_t __riscv_vmacc_vv_u8m8_tum(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs1,
                                     vuint8m8_t vs2, size_t vl);
vuint8m8_t __riscv_vmacc_vx_u8m8_tum(vbool1_t vm, vuint8m8_t vd, uint8_t rs1,
                                     vuint8m8_t vs2, size_t vl);
vuint16mf4_t __riscv_vmacc_vv_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs1, vuint16mf4_t vs2,
                                         size_t vl);
vuint16mf4_t __riscv_vmacc_vx_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                         uint16_t rs1, vuint16mf4_t vs2,
                                         size_t vl);
vuint16mf2_t __riscv_vmacc_vv_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs1, vuint16mf2_t vs2,
                                         size_t vl);
vuint16mf2_t __riscv_vmacc_vx_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                         uint16_t rs1, vuint16mf2_t vs2,
                                         size_t vl);
vuint16m1_t __riscv_vmacc_vv_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs1, vuint16m1_t vs2,
                                       size_t vl);
vuint16m1_t __riscv_vmacc_vx_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                       uint16_t rs1, vuint16m1_t vs2,
                                       size_t vl);
vuint16m2_t __riscv_vmacc_vv_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs1, vuint16m2_t vs2,
                                       size_t vl);
vuint16m2_t __riscv_vmacc_vx_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                       uint16_t rs1, vuint16m2_t vs2,
                                       size_t vl);
vuint16m4_t __riscv_vmacc_vv_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs1, vuint16m4_t vs2,
                                       size_t vl);
vuint16m4_t __riscv_vmacc_vx_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                       uint16_t rs1, vuint16m4_t vs2,
                                       size_t vl);
vuint16m8_t __riscv_vmacc_vv_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs1, vuint16m8_t vs2,
                                       size_t vl);
vuint16m8_t __riscv_vmacc_vx_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                       uint16_t rs1, vuint16m8_t vs2,
                                       size_t vl);
vuint32mf2_t __riscv_vmacc_vv_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs1, vuint32mf2_t vs2,
                                         size_t vl);
vuint32mf2_t __riscv_vmacc_vx_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                         uint32_t rs1, vuint32mf2_t vs2,
                                         size_t vl);
vuint32m1_t __riscv_vmacc_vv_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs1, vuint32m1_t vs2,
                                       size_t vl);
vuint32m1_t __riscv_vmacc_vx_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                       uint32_t rs1, vuint32m1_t vs2,
                                       size_t vl);
vuint32m2_t __riscv_vmacc_vv_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs1, vuint32m2_t vs2,
                                       size_t vl);
vuint32m2_t __riscv_vmacc_vx_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                       uint32_t rs1, vuint32m2_t vs2,
                                       size_t vl);
vuint32m4_t __riscv_vmacc_vv_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs1, vuint32m4_t vs2,
                                       size_t vl);
vuint32m4_t __riscv_vmacc_vx_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                       uint32_t rs1, vuint32m4_t vs2,
                                       size_t vl);
vuint32m8_t __riscv_vmacc_vv_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs1, vuint32m8_t vs2,
                                       size_t vl);
vuint32m8_t __riscv_vmacc_vx_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                       uint32_t rs1, vuint32m8_t vs2,
                                       size_t vl);
vuint64m1_t __riscv_vmacc_vv_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs1, vuint64m1_t vs2,
                                       size_t vl);
vuint64m1_t __riscv_vmacc_vx_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                       uint64_t rs1, vuint64m1_t vs2,
                                       size_t vl);
vuint64m2_t __riscv_vmacc_vv_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs1, vuint64m2_t vs2,
                                       size_t vl);
vuint64m2_t __riscv_vmacc_vx_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                       uint64_t rs1, vuint64m2_t vs2,
                                       size_t vl);
vuint64m4_t __riscv_vmacc_vv_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs1, vuint64m4_t vs2,
                                       size_t vl);
vuint64m4_t __riscv_vmacc_vx_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                       uint64_t rs1, vuint64m4_t vs2,
                                       size_t vl);
vuint64m8_t __riscv_vmacc_vv_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs1, vuint64m8_t vs2,
                                       size_t vl);
vuint64m8_t __riscv_vmacc_vx_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                       uint64_t rs1, vuint64m8_t vs2,
                                       size_t vl);
vuint8mf8_t __riscv_vnmsac_vv_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                        vuint8mf8_t vs1, vuint8mf8_t vs2,
                                        size_t vl);
vuint8mf8_t __riscv_vnmsac_vx_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                        uint8_t rs1, vuint8mf8_t vs2,
                                        size_t vl);
vuint8mf4_t __riscv_vnmsac_vv_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                        vuint8mf4_t vs1, vuint8mf4_t vs2,
                                        size_t vl);
vuint8mf4_t __riscv_vnmsac_vx_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                        uint8_t rs1, vuint8mf4_t vs2,
                                        size_t vl);
vuint8mf2_t __riscv_vnmsac_vv_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                        vuint8mf2_t vs1, vuint8mf2_t vs2,
                                        size_t vl);
vuint8mf2_t __riscv_vnmsac_vx_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                        uint8_t rs1, vuint8mf2_t vs2,
                                        size_t vl);
vuint8m1_t __riscv_vnmsac_vv_u8m1_tum(vbool8_t vm, vuint8m1_t vd,
                                      vuint8m1_t vs1, vuint8m1_t vs2,
                                      size_t vl);
vuint8m1_t __riscv_vnmsac_vx_u8m1_tum(vbool8_t vm, vuint8m1_t vd, uint8_t rs1,
                                      vuint8m1_t vs2, size_t vl);
vuint8m2_t __riscv_vnmsac_vv_u8m2_tum(vbool4_t vm, vuint8m2_t vd,
                                      vuint8m2_t vs1, vuint8m2_t vs2,
                                      size_t vl);
vuint8m2_t __riscv_vnmsac_vx_u8m2_tum(vbool4_t vm, vuint8m2_t vd, uint8_t rs1,
                                      vuint8m2_t vs2, size_t vl);
vuint8m4_t __riscv_vnmsac_vv_u8m4_tum(vbool2_t vm, vuint8m4_t vd,
                                      vuint8m4_t vs1, vuint8m4_t vs2,
                                      size_t vl);
vuint8m4_t __riscv_vnmsac_vx_u8m4_tum(vbool2_t vm, vuint8m4_t vd, uint8_t rs1,
                                      vuint8m4_t vs2, size_t vl);
vuint8m8_t __riscv_vnmsac_vv_u8m8_tum(vbool1_t vm, vuint8m8_t vd,
                                      vuint8m8_t vs1, vuint8m8_t vs2,
                                      size_t vl);
vuint8m8_t __riscv_vnmsac_vx_u8m8_tum(vbool1_t vm, vuint8m8_t vd, uint8_t rs1,
                                      vuint8m8_t vs2, size_t vl);
vuint16mf4_t __riscv_vnmsac_vv_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                          vuint16mf4_t vs1, vuint16mf4_t vs2,
                                          size_t vl);
vuint16mf4_t __riscv_vnmsac_vx_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                          uint16_t rs1, vuint16mf4_t vs2,
                                          size_t vl);
vuint16mf2_t __riscv_vnmsac_vv_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                          vuint16mf2_t vs1, vuint16mf2_t vs2,
                                          size_t vl);
vuint16mf2_t __riscv_vnmsac_vx_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                          uint16_t rs1, vuint16mf2_t vs2,
                                          size_t vl);
vuint16m1_t __riscv_vnmsac_vv_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                        vuint16m1_t vs1, vuint16m1_t vs2,
                                        size_t vl);
vuint16m1_t __riscv_vnmsac_vx_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                        uint16_t rs1, vuint16m1_t vs2,
                                        size_t vl);
vuint16m2_t __riscv_vnmsac_vv_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                        vuint16m2_t vs1, vuint16m2_t vs2,
                                        size_t vl);
vuint16m2_t __riscv_vnmsac_vx_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                        uint16_t rs1, vuint16m2_t vs2,
                                        size_t vl);
vuint16m4_t __riscv_vnmsac_vv_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                        vuint16m4_t vs1, vuint16m4_t vs2,
                                        size_t vl);
vuint16m4_t __riscv_vnmsac_vx_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                        uint16_t rs1, vuint16m4_t vs2,
                                        size_t vl);
vuint16m8_t __riscv_vnmsac_vv_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                        vuint16m8_t vs1, vuint16m8_t vs2,
                                        size_t vl);
vuint16m8_t __riscv_vnmsac_vx_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                        uint16_t rs1, vuint16m8_t vs2,
                                        size_t vl);
vuint32mf2_t __riscv_vnmsac_vv_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                          vuint32mf2_t vs1, vuint32mf2_t vs2,
                                          size_t vl);
vuint32mf2_t __riscv_vnmsac_vx_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                          uint32_t rs1, vuint32mf2_t vs2,
                                          size_t vl);
vuint32m1_t __riscv_vnmsac_vv_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                        vuint32m1_t vs1, vuint32m1_t vs2,
                                        size_t vl);
vuint32m1_t __riscv_vnmsac_vx_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                        uint32_t rs1, vuint32m1_t vs2,
                                        size_t vl);
vuint32m2_t __riscv_vnmsac_vv_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                        vuint32m2_t vs1, vuint32m2_t vs2,
                                        size_t vl);
vuint32m2_t __riscv_vnmsac_vx_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                        uint32_t rs1, vuint32m2_t vs2,
                                        size_t vl);
vuint32m4_t __riscv_vnmsac_vv_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                        vuint32m4_t vs1, vuint32m4_t vs2,
                                        size_t vl);
vuint32m4_t __riscv_vnmsac_vx_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                        uint32_t rs1, vuint32m4_t vs2,
                                        size_t vl);
vuint32m8_t __riscv_vnmsac_vv_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                        vuint32m8_t vs1, vuint32m8_t vs2,
                                        size_t vl);
vuint32m8_t __riscv_vnmsac_vx_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                        uint32_t rs1, vuint32m8_t vs2,
                                        size_t vl);
vuint64m1_t __riscv_vnmsac_vv_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                        vuint64m1_t vs1, vuint64m1_t vs2,
                                        size_t vl);
vuint64m1_t __riscv_vnmsac_vx_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                        uint64_t rs1, vuint64m1_t vs2,
                                        size_t vl);
vuint64m2_t __riscv_vnmsac_vv_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                        vuint64m2_t vs1, vuint64m2_t vs2,
                                        size_t vl);
vuint64m2_t __riscv_vnmsac_vx_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                        uint64_t rs1, vuint64m2_t vs2,
                                        size_t vl);
vuint64m4_t __riscv_vnmsac_vv_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                        vuint64m4_t vs1, vuint64m4_t vs2,
                                        size_t vl);
vuint64m4_t __riscv_vnmsac_vx_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                        uint64_t rs1, vuint64m4_t vs2,
                                        size_t vl);
vuint64m8_t __riscv_vnmsac_vv_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                        vuint64m8_t vs1, vuint64m8_t vs2,
                                        size_t vl);
vuint64m8_t __riscv_vnmsac_vx_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                        uint64_t rs1, vuint64m8_t vs2,
                                        size_t vl);
vuint8mf8_t __riscv_vmadd_vv_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                       vuint8mf8_t vs1, vuint8mf8_t vs2,
                                       size_t vl);
vuint8mf8_t __riscv_vmadd_vx_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                       uint8_t rs1, vuint8mf8_t vs2, size_t vl);
vuint8mf4_t __riscv_vmadd_vv_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                       vuint8mf4_t vs1, vuint8mf4_t vs2,
                                       size_t vl);
vuint8mf4_t __riscv_vmadd_vx_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                       uint8_t rs1, vuint8mf4_t vs2, size_t vl);
vuint8mf2_t __riscv_vmadd_vv_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                       vuint8mf2_t vs1, vuint8mf2_t vs2,
                                       size_t vl);
vuint8mf2_t __riscv_vmadd_vx_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                       uint8_t rs1, vuint8mf2_t vs2, size_t vl);
vuint8m1_t __riscv_vmadd_vv_u8m1_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs1,
                                     vuint8m1_t vs2, size_t vl);
vuint8m1_t __riscv_vmadd_vx_u8m1_tum(vbool8_t vm, vuint8m1_t vd, uint8_t rs1,
                                     vuint8m1_t vs2, size_t vl);
vuint8m2_t __riscv_vmadd_vv_u8m2_tum(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs1,
                                     vuint8m2_t vs2, size_t vl);
vuint8m2_t __riscv_vmadd_vx_u8m2_tum(vbool4_t vm, vuint8m2_t vd, uint8_t rs1,
                                     vuint8m2_t vs2, size_t vl);
vuint8m4_t __riscv_vmadd_vv_u8m4_tum(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs1,
                                     vuint8m4_t vs2, size_t vl);
vuint8m4_t __riscv_vmadd_vx_u8m4_tum(vbool2_t vm, vuint8m4_t vd, uint8_t rs1,
                                     vuint8m4_t vs2, size_t vl);
vuint8m8_t __riscv_vmadd_vv_u8m8_tum(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs1,
                                     vuint8m8_t vs2, size_t vl);
vuint8m8_t __riscv_vmadd_vx_u8m8_tum(vbool1_t vm, vuint8m8_t vd, uint8_t rs1,
                                     vuint8m8_t vs2, size_t vl);
vuint16mf4_t __riscv_vmadd_vv_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs1, vuint16mf4_t vs2,
                                         size_t vl);
vuint16mf4_t __riscv_vmadd_vx_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                         uint16_t rs1, vuint16mf4_t vs2,
                                         size_t vl);
vuint16mf2_t __riscv_vmadd_vv_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs1, vuint16mf2_t vs2,
                                         size_t vl);
vuint16mf2_t __riscv_vmadd_vx_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                         uint16_t rs1, vuint16mf2_t vs2,
                                         size_t vl);
vuint16m1_t __riscv_vmadd_vv_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs1, vuint16m1_t vs2,
                                       size_t vl);
vuint16m1_t __riscv_vmadd_vx_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                       uint16_t rs1, vuint16m1_t vs2,
                                       size_t vl);
vuint16m2_t __riscv_vmadd_vv_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs1, vuint16m2_t vs2,
                                       size_t vl);
vuint16m2_t __riscv_vmadd_vx_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                       uint16_t rs1, vuint16m2_t vs2,
                                       size_t vl);
vuint16m4_t __riscv_vmadd_vv_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs1, vuint16m4_t vs2,
                                       size_t vl);
vuint16m4_t __riscv_vmadd_vx_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                       uint16_t rs1, vuint16m4_t vs2,
                                       size_t vl);
vuint16m8_t __riscv_vmadd_vv_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs1, vuint16m8_t vs2,
                                       size_t vl);
vuint16m8_t __riscv_vmadd_vx_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                       uint16_t rs1, vuint16m8_t vs2,
                                       size_t vl);
vuint32mf2_t __riscv_vmadd_vv_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs1, vuint32mf2_t vs2,
                                         size_t vl);
vuint32mf2_t __riscv_vmadd_vx_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                         uint32_t rs1, vuint32mf2_t vs2,
                                         size_t vl);
vuint32m1_t __riscv_vmadd_vv_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs1, vuint32m1_t vs2,
                                       size_t vl);
vuint32m1_t __riscv_vmadd_vx_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                       uint32_t rs1, vuint32m1_t vs2,
                                       size_t vl);
vuint32m2_t __riscv_vmadd_vv_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs1, vuint32m2_t vs2,
                                       size_t vl);
vuint32m2_t __riscv_vmadd_vx_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                       uint32_t rs1, vuint32m2_t vs2,
                                       size_t vl);
vuint32m4_t __riscv_vmadd_vv_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs1, vuint32m4_t vs2,
                                       size_t vl);
vuint32m4_t __riscv_vmadd_vx_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                       uint32_t rs1, vuint32m4_t vs2,
                                       size_t vl);
vuint32m8_t __riscv_vmadd_vv_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs1, vuint32m8_t vs2,
                                       size_t vl);
vuint32m8_t __riscv_vmadd_vx_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                       uint32_t rs1, vuint32m8_t vs2,
                                       size_t vl);
vuint64m1_t __riscv_vmadd_vv_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs1, vuint64m1_t vs2,
                                       size_t vl);
vuint64m1_t __riscv_vmadd_vx_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                       uint64_t rs1, vuint64m1_t vs2,
                                       size_t vl);
vuint64m2_t __riscv_vmadd_vv_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs1, vuint64m2_t vs2,
                                       size_t vl);
vuint64m2_t __riscv_vmadd_vx_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                       uint64_t rs1, vuint64m2_t vs2,
                                       size_t vl);
vuint64m4_t __riscv_vmadd_vv_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs1, vuint64m4_t vs2,
                                       size_t vl);
vuint64m4_t __riscv_vmadd_vx_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                       uint64_t rs1, vuint64m4_t vs2,
                                       size_t vl);
vuint64m8_t __riscv_vmadd_vv_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs1, vuint64m8_t vs2,
                                       size_t vl);
vuint64m8_t __riscv_vmadd_vx_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                       uint64_t rs1, vuint64m8_t vs2,
                                       size_t vl);
vuint8mf8_t __riscv_vnmsub_vv_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                        vuint8mf8_t vs1, vuint8mf8_t vs2,
                                        size_t vl);
vuint8mf8_t __riscv_vnmsub_vx_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                        uint8_t rs1, vuint8mf8_t vs2,
                                        size_t vl);
vuint8mf4_t __riscv_vnmsub_vv_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                        vuint8mf4_t vs1, vuint8mf4_t vs2,
                                        size_t vl);
vuint8mf4_t __riscv_vnmsub_vx_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                        uint8_t rs1, vuint8mf4_t vs2,
                                        size_t vl);
vuint8mf2_t __riscv_vnmsub_vv_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                        vuint8mf2_t vs1, vuint8mf2_t vs2,
                                        size_t vl);
vuint8mf2_t __riscv_vnmsub_vx_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                        uint8_t rs1, vuint8mf2_t vs2,
                                        size_t vl);
vuint8m1_t __riscv_vnmsub_vv_u8m1_tum(vbool8_t vm, vuint8m1_t vd,
                                      vuint8m1_t vs1, vuint8m1_t vs2,
                                      size_t vl);
vuint8m1_t __riscv_vnmsub_vx_u8m1_tum(vbool8_t vm, vuint8m1_t vd, uint8_t rs1,
                                      vuint8m1_t vs2, size_t vl);
vuint8m2_t __riscv_vnmsub_vv_u8m2_tum(vbool4_t vm, vuint8m2_t vd,
                                      vuint8m2_t vs1, vuint8m2_t vs2,
                                      size_t vl);
vuint8m2_t __riscv_vnmsub_vx_u8m2_tum(vbool4_t vm, vuint8m2_t vd, uint8_t rs1,
                                      vuint8m2_t vs2, size_t vl);
vuint8m4_t __riscv_vnmsub_vv_u8m4_tum(vbool2_t vm, vuint8m4_t vd,
                                      vuint8m4_t vs1, vuint8m4_t vs2,
                                      size_t vl);
vuint8m4_t __riscv_vnmsub_vx_u8m4_tum(vbool2_t vm, vuint8m4_t vd, uint8_t rs1,
                                      vuint8m4_t vs2, size_t vl);
vuint8m8_t __riscv_vnmsub_vv_u8m8_tum(vbool1_t vm, vuint8m8_t vd,
                                      vuint8m8_t vs1, vuint8m8_t vs2,
                                      size_t vl);
vuint8m8_t __riscv_vnmsub_vx_u8m8_tum(vbool1_t vm, vuint8m8_t vd, uint8_t rs1,
                                      vuint8m8_t vs2, size_t vl);
vuint16mf4_t __riscv_vnmsub_vv_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                          vuint16mf4_t vs1, vuint16mf4_t vs2,
                                          size_t vl);
vuint16mf4_t __riscv_vnmsub_vx_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                          uint16_t rs1, vuint16mf4_t vs2,
                                          size_t vl);
vuint16mf2_t __riscv_vnmsub_vv_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                          vuint16mf2_t vs1, vuint16mf2_t vs2,
                                          size_t vl);
vuint16mf2_t __riscv_vnmsub_vx_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                          uint16_t rs1, vuint16mf2_t vs2,
                                          size_t vl);
vuint16m1_t __riscv_vnmsub_vv_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                        vuint16m1_t vs1, vuint16m1_t vs2,
                                        size_t vl);
vuint16m1_t __riscv_vnmsub_vx_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                        uint16_t rs1, vuint16m1_t vs2,
                                        size_t vl);
vuint16m2_t __riscv_vnmsub_vv_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                        vuint16m2_t vs1, vuint16m2_t vs2,
                                        size_t vl);
vuint16m2_t __riscv_vnmsub_vx_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                        uint16_t rs1, vuint16m2_t vs2,
                                        size_t vl);
vuint16m4_t __riscv_vnmsub_vv_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                        vuint16m4_t vs1, vuint16m4_t vs2,
                                        size_t vl);
vuint16m4_t __riscv_vnmsub_vx_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                        uint16_t rs1, vuint16m4_t vs2,
                                        size_t vl);
vuint16m8_t __riscv_vnmsub_vv_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                        vuint16m8_t vs1, vuint16m8_t vs2,
                                        size_t vl);
vuint16m8_t __riscv_vnmsub_vx_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                        uint16_t rs1, vuint16m8_t vs2,
                                        size_t vl);
vuint32mf2_t __riscv_vnmsub_vv_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                          vuint32mf2_t vs1, vuint32mf2_t vs2,
                                          size_t vl);
vuint32mf2_t __riscv_vnmsub_vx_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                          uint32_t rs1, vuint32mf2_t vs2,
                                          size_t vl);
vuint32m1_t __riscv_vnmsub_vv_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                        vuint32m1_t vs1, vuint32m1_t vs2,
                                        size_t vl);
vuint32m1_t __riscv_vnmsub_vx_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                        uint32_t rs1, vuint32m1_t vs2,
                                        size_t vl);
vuint32m2_t __riscv_vnmsub_vv_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                        vuint32m2_t vs1, vuint32m2_t vs2,
                                        size_t vl);
vuint32m2_t __riscv_vnmsub_vx_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                        uint32_t rs1, vuint32m2_t vs2,
                                        size_t vl);
vuint32m4_t __riscv_vnmsub_vv_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                        vuint32m4_t vs1, vuint32m4_t vs2,
                                        size_t vl);
vuint32m4_t __riscv_vnmsub_vx_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                        uint32_t rs1, vuint32m4_t vs2,
                                        size_t vl);
vuint32m8_t __riscv_vnmsub_vv_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                        vuint32m8_t vs1, vuint32m8_t vs2,
                                        size_t vl);
vuint32m8_t __riscv_vnmsub_vx_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                        uint32_t rs1, vuint32m8_t vs2,
                                        size_t vl);
vuint64m1_t __riscv_vnmsub_vv_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                        vuint64m1_t vs1, vuint64m1_t vs2,
                                        size_t vl);
vuint64m1_t __riscv_vnmsub_vx_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                        uint64_t rs1, vuint64m1_t vs2,
                                        size_t vl);
vuint64m2_t __riscv_vnmsub_vv_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                        vuint64m2_t vs1, vuint64m2_t vs2,
                                        size_t vl);
vuint64m2_t __riscv_vnmsub_vx_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                        uint64_t rs1, vuint64m2_t vs2,
                                        size_t vl);
vuint64m4_t __riscv_vnmsub_vv_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                        vuint64m4_t vs1, vuint64m4_t vs2,
                                        size_t vl);
vuint64m4_t __riscv_vnmsub_vx_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                        uint64_t rs1, vuint64m4_t vs2,
                                        size_t vl);
vuint64m8_t __riscv_vnmsub_vv_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                        vuint64m8_t vs1, vuint64m8_t vs2,
                                        size_t vl);
vuint64m8_t __riscv_vnmsub_vx_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                        uint64_t rs1, vuint64m8_t vs2,
                                        size_t vl);
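
// Illustrative usage sketch (not part of the generated prototype listing
// above): a strip-mined loop that applies the masked, tail-undisturbed (_tum)
// integer multiply-add to selected elements only.  The function name
// scale_add_if_gt0, the choice of comparison, and the compile flag are
// assumptions made for this example.  Compile with a V-enabled target, e.g.
// -march=rv64gcv.
#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

// d[i] = d[i] * x + a[i] wherever a[i] > 0; other elements of d are left
// untouched because only the active elements are stored back.
static void scale_add_if_gt0(int32_t *d, const int32_t *a, int32_t x,
                             size_t n) {
  for (size_t vl; n > 0; n -= vl, d += vl, a += vl) {
    vl = __riscv_vsetvl_e32m1(n);
    vint32m1_t vd = __riscv_vle32_v_i32m1(d, vl);
    vint32m1_t va = __riscv_vle32_v_i32m1(a, vl);
    vbool32_t vm = __riscv_vmsgt_vx_i32m1_b32(va, 0, vl);   // a[i] > 0
    vd = __riscv_vmadd_vx_i32m1_tum(vm, vd, x, va, vl);     // vd = vd * x + va
    __riscv_vse32_v_i32m1_m(vm, d, vd, vl);                 // masked store
  }
}
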
// masked functions
vint8mf8_t __riscv_vmacc_vv_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                       vint8mf8_t vs1, vint8mf8_t vs2,
                                       size_t vl);
vint8mf8_t __riscv_vmacc_vx_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd, int8_t rs1,
                                       vint8mf8_t vs2, size_t vl);
vint8mf4_t __riscv_vmacc_vv_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                       vint8mf4_t vs1, vint8mf4_t vs2,
                                       size_t vl);
vint8mf4_t __riscv_vmacc_vx_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd, int8_t rs1,
                                       vint8mf4_t vs2, size_t vl);
vint8mf2_t __riscv_vmacc_vv_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                       vint8mf2_t vs1, vint8mf2_t vs2,
                                       size_t vl);
vint8mf2_t __riscv_vmacc_vx_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd, int8_t rs1,
                                       vint8mf2_t vs2, size_t vl);
vint8m1_t __riscv_vmacc_vv_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs1,
                                     vint8m1_t vs2, size_t vl);
vint8m1_t __riscv_vmacc_vx_i8m1_tumu(vbool8_t vm, vint8m1_t vd, int8_t rs1,
                                     vint8m1_t vs2, size_t vl);
vint8m2_t __riscv_vmacc_vv_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs1,
                                     vint8m2_t vs2, size_t vl);
vint8m2_t __riscv_vmacc_vx_i8m2_tumu(vbool4_t vm, vint8m2_t vd, int8_t rs1,
                                     vint8m2_t vs2, size_t vl);
vint8m4_t __riscv_vmacc_vv_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs1,
                                     vint8m4_t vs2, size_t vl);
vint8m4_t __riscv_vmacc_vx_i8m4_tumu(vbool2_t vm, vint8m4_t vd, int8_t rs1,
                                     vint8m4_t vs2, size_t vl);
vint8m8_t __riscv_vmacc_vv_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs1,
                                     vint8m8_t vs2, size_t vl);
vint8m8_t __riscv_vmacc_vx_i8m8_tumu(vbool1_t vm, vint8m8_t vd, int8_t rs1,
                                     vint8m8_t vs2, size_t vl);
vint16mf4_t __riscv_vmacc_vv_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                         vint16mf4_t vs1, vint16mf4_t vs2,
                                         size_t vl);
vint16mf4_t __riscv_vmacc_vx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                         int16_t rs1, vint16mf4_t vs2,
                                         size_t vl);
vint16mf2_t __riscv_vmacc_vv_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                         vint16mf2_t vs1, vint16mf2_t vs2,
                                         size_t vl);
vint16mf2_t __riscv_vmacc_vx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                         int16_t rs1, vint16mf2_t vs2,
                                         size_t vl);
vint16m1_t __riscv_vmacc_vv_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                       vint16m1_t vs1, vint16m1_t vs2,
                                       size_t vl);
vint16m1_t __riscv_vmacc_vx_i16m1_tumu(vbool16_t vm, vint16m1_t vd, int16_t rs1,
                                       vint16m1_t vs2, size_t vl);
vint16m2_t __riscv_vmacc_vv_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                       vint16m2_t vs1, vint16m2_t vs2,
                                       size_t vl);
vint16m2_t __riscv_vmacc_vx_i16m2_tumu(vbool8_t vm, vint16m2_t vd, int16_t rs1,
                                       vint16m2_t vs2, size_t vl);
vint16m4_t __riscv_vmacc_vv_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                       vint16m4_t vs1, vint16m4_t vs2,
                                       size_t vl);
vint16m4_t __riscv_vmacc_vx_i16m4_tumu(vbool4_t vm, vint16m4_t vd, int16_t rs1,
                                       vint16m4_t vs2, size_t vl);
vint16m8_t __riscv_vmacc_vv_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                       vint16m8_t vs1, vint16m8_t vs2,
                                       size_t vl);
vint16m8_t __riscv_vmacc_vx_i16m8_tumu(vbool2_t vm, vint16m8_t vd, int16_t rs1,
                                       vint16m8_t vs2, size_t vl);
vint32mf2_t __riscv_vmacc_vv_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                         vint32mf2_t vs1, vint32mf2_t vs2,
                                         size_t vl);
vint32mf2_t __riscv_vmacc_vx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                         int32_t rs1, vint32mf2_t vs2,
                                         size_t vl);
vint32m1_t __riscv_vmacc_vv_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                       vint32m1_t vs1, vint32m1_t vs2,
                                       size_t vl);
vint32m1_t __riscv_vmacc_vx_i32m1_tumu(vbool32_t vm, vint32m1_t vd, int32_t rs1,
                                       vint32m1_t vs2, size_t vl);
vint32m2_t __riscv_vmacc_vv_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                       vint32m2_t vs1, vint32m2_t vs2,
                                       size_t vl);
vint32m2_t __riscv_vmacc_vx_i32m2_tumu(vbool16_t vm, vint32m2_t vd, int32_t rs1,
                                       vint32m2_t vs2, size_t vl);
vint32m4_t __riscv_vmacc_vv_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                       vint32m4_t vs1, vint32m4_t vs2,
                                       size_t vl);
vint32m4_t __riscv_vmacc_vx_i32m4_tumu(vbool8_t vm, vint32m4_t vd, int32_t rs1,
                                       vint32m4_t vs2, size_t vl);
vint32m8_t __riscv_vmacc_vv_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                       vint32m8_t vs1, vint32m8_t vs2,
                                       size_t vl);
vint32m8_t __riscv_vmacc_vx_i32m8_tumu(vbool4_t vm, vint32m8_t vd, int32_t rs1,
                                       vint32m8_t vs2, size_t vl);
vint64m1_t __riscv_vmacc_vv_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                       vint64m1_t vs1, vint64m1_t vs2,
                                       size_t vl);
vint64m1_t __riscv_vmacc_vx_i64m1_tumu(vbool64_t vm, vint64m1_t vd, int64_t rs1,
                                       vint64m1_t vs2, size_t vl);
vint64m2_t __riscv_vmacc_vv_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                       vint64m2_t vs1, vint64m2_t vs2,
                                       size_t vl);
vint64m2_t __riscv_vmacc_vx_i64m2_tumu(vbool32_t vm, vint64m2_t vd, int64_t rs1,
                                       vint64m2_t vs2, size_t vl);
vint64m4_t __riscv_vmacc_vv_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                       vint64m4_t vs1, vint64m4_t vs2,
                                       size_t vl);
vint64m4_t __riscv_vmacc_vx_i64m4_tumu(vbool16_t vm, vint64m4_t vd, int64_t rs1,
                                       vint64m4_t vs2, size_t vl);
vint64m8_t __riscv_vmacc_vv_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                       vint64m8_t vs1, vint64m8_t vs2,
                                       size_t vl);
vint64m8_t __riscv_vmacc_vx_i64m8_tumu(vbool8_t vm, vint64m8_t vd, int64_t rs1,
                                       vint64m8_t vs2, size_t vl);
vint8mf8_t __riscv_vnmsac_vv_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                        vint8mf8_t vs1, vint8mf8_t vs2,
                                        size_t vl);
vint8mf8_t __riscv_vnmsac_vx_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd, int8_t rs1,
                                        vint8mf8_t vs2, size_t vl);
vint8mf4_t __riscv_vnmsac_vv_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                        vint8mf4_t vs1, vint8mf4_t vs2,
                                        size_t vl);
vint8mf4_t __riscv_vnmsac_vx_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd, int8_t rs1,
                                        vint8mf4_t vs2, size_t vl);
vint8mf2_t __riscv_vnmsac_vv_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                        vint8mf2_t vs1, vint8mf2_t vs2,
                                        size_t vl);
vint8mf2_t __riscv_vnmsac_vx_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd, int8_t rs1,
                                        vint8mf2_t vs2, size_t vl);
vint8m1_t __riscv_vnmsac_vv_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs1,
                                      vint8m1_t vs2, size_t vl);
vint8m1_t __riscv_vnmsac_vx_i8m1_tumu(vbool8_t vm, vint8m1_t vd, int8_t rs1,
                                      vint8m1_t vs2, size_t vl);
vint8m2_t __riscv_vnmsac_vv_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs1,
                                      vint8m2_t vs2, size_t vl);
vint8m2_t __riscv_vnmsac_vx_i8m2_tumu(vbool4_t vm, vint8m2_t vd, int8_t rs1,
                                      vint8m2_t vs2, size_t vl);
vint8m4_t __riscv_vnmsac_vv_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs1,
                                      vint8m4_t vs2, size_t vl);
vint8m4_t __riscv_vnmsac_vx_i8m4_tumu(vbool2_t vm, vint8m4_t vd, int8_t rs1,
                                      vint8m4_t vs2, size_t vl);
vint8m8_t __riscv_vnmsac_vv_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs1,
                                      vint8m8_t vs2, size_t vl);
vint8m8_t __riscv_vnmsac_vx_i8m8_tumu(vbool1_t vm, vint8m8_t vd, int8_t rs1,
                                      vint8m8_t vs2, size_t vl);
vint16mf4_t __riscv_vnmsac_vv_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                          vint16mf4_t vs1, vint16mf4_t vs2,
                                          size_t vl);
vint16mf4_t __riscv_vnmsac_vx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                          int16_t rs1, vint16mf4_t vs2,
                                          size_t vl);
vint16mf2_t __riscv_vnmsac_vv_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                          vint16mf2_t vs1, vint16mf2_t vs2,
                                          size_t vl);
vint16mf2_t __riscv_vnmsac_vx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                          int16_t rs1, vint16mf2_t vs2,
                                          size_t vl);
vint16m1_t __riscv_vnmsac_vv_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                        vint16m1_t vs1, vint16m1_t vs2,
                                        size_t vl);
vint16m1_t __riscv_vnmsac_vx_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                        int16_t rs1, vint16m1_t vs2, size_t vl);
vint16m2_t __riscv_vnmsac_vv_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                        vint16m2_t vs1, vint16m2_t vs2,
                                        size_t vl);
vint16m2_t __riscv_vnmsac_vx_i16m2_tumu(vbool8_t vm, vint16m2_t vd, int16_t rs1,
                                        vint16m2_t vs2, size_t vl);
vint16m4_t __riscv_vnmsac_vv_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                        vint16m4_t vs1, vint16m4_t vs2,
                                        size_t vl);
vint16m4_t __riscv_vnmsac_vx_i16m4_tumu(vbool4_t vm, vint16m4_t vd, int16_t rs1,
                                        vint16m4_t vs2, size_t vl);
vint16m8_t __riscv_vnmsac_vv_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                        vint16m8_t vs1, vint16m8_t vs2,
                                        size_t vl);
vint16m8_t __riscv_vnmsac_vx_i16m8_tumu(vbool2_t vm, vint16m8_t vd, int16_t rs1,
                                        vint16m8_t vs2, size_t vl);
vint32mf2_t __riscv_vnmsac_vv_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                          vint32mf2_t vs1, vint32mf2_t vs2,
                                          size_t vl);
vint32mf2_t __riscv_vnmsac_vx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                          int32_t rs1, vint32mf2_t vs2,
                                          size_t vl);
vint32m1_t __riscv_vnmsac_vv_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                        vint32m1_t vs1, vint32m1_t vs2,
                                        size_t vl);
vint32m1_t __riscv_vnmsac_vx_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                        int32_t rs1, vint32m1_t vs2, size_t vl);
vint32m2_t __riscv_vnmsac_vv_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                        vint32m2_t vs1, vint32m2_t vs2,
                                        size_t vl);
vint32m2_t __riscv_vnmsac_vx_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                        int32_t rs1, vint32m2_t vs2, size_t vl);
vint32m4_t __riscv_vnmsac_vv_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                        vint32m4_t vs1, vint32m4_t vs2,
                                        size_t vl);
vint32m4_t __riscv_vnmsac_vx_i32m4_tumu(vbool8_t vm, vint32m4_t vd, int32_t rs1,
                                        vint32m4_t vs2, size_t vl);
vint32m8_t __riscv_vnmsac_vv_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                        vint32m8_t vs1, vint32m8_t vs2,
                                        size_t vl);
vint32m8_t __riscv_vnmsac_vx_i32m8_tumu(vbool4_t vm, vint32m8_t vd, int32_t rs1,
                                        vint32m8_t vs2, size_t vl);
vint64m1_t __riscv_vnmsac_vv_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                        vint64m1_t vs1, vint64m1_t vs2,
                                        size_t vl);
vint64m1_t __riscv_vnmsac_vx_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                        int64_t rs1, vint64m1_t vs2, size_t vl);
vint64m2_t __riscv_vnmsac_vv_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                        vint64m2_t vs1, vint64m2_t vs2,
                                        size_t vl);
vint64m2_t __riscv_vnmsac_vx_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                        int64_t rs1, vint64m2_t vs2, size_t vl);
vint64m4_t __riscv_vnmsac_vv_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                        vint64m4_t vs1, vint64m4_t vs2,
                                        size_t vl);
vint64m4_t __riscv_vnmsac_vx_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                        int64_t rs1, vint64m4_t vs2, size_t vl);
vint64m8_t __riscv_vnmsac_vv_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                        vint64m8_t vs1, vint64m8_t vs2,
                                        size_t vl);
vint64m8_t __riscv_vnmsac_vx_i64m8_tumu(vbool8_t vm, vint64m8_t vd, int64_t rs1,
                                        vint64m8_t vs2, size_t vl);
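
// Illustrative usage sketch (assumptions noted in the comments): with the
// _tumu variants, masked-off elements of the destination keep their previous
// value (mask undisturbed), so the whole register can be stored back after a
// conditional accumulation.  The function name acc_dot_if_mask and the use of
// an int32 keep[] array as the predicate are assumptions for this example.
#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

// acc[i] += a[i] * b[i] wherever keep[i] != 0; other elements of acc are
// preserved by the mask-undisturbed policy of the _tumu intrinsic.
static void acc_dot_if_mask(int32_t *acc, const int32_t *a, const int32_t *b,
                            const int32_t *keep, size_t n) {
  for (size_t vl; n > 0; n -= vl, acc += vl, a += vl, b += vl, keep += vl) {
    vl = __riscv_vsetvl_e32m1(n);
    vint32m1_t vacc = __riscv_vle32_v_i32m1(acc, vl);
    vint32m1_t va = __riscv_vle32_v_i32m1(a, vl);
    vint32m1_t vb = __riscv_vle32_v_i32m1(b, vl);
    vint32m1_t vk = __riscv_vle32_v_i32m1(keep, vl);
    vbool32_t vm = __riscv_vmsne_vx_i32m1_b32(vk, 0, vl);    // keep[i] != 0
    vacc = __riscv_vmacc_vv_i32m1_tumu(vm, vacc, va, vb, vl); // vacc += va*vb
    __riscv_vse32_v_i32m1(acc, vacc, vl);  // unmasked store is safe: inactive
                                           // lanes still hold the old acc[i]
  }
}
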
vint8mf8_t __riscv_vmadd_vv_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                       vint8mf8_t vs1, vint8mf8_t vs2,
                                       size_t vl);
vint8mf8_t __riscv_vmadd_vx_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd, int8_t rs1,
                                       vint8mf8_t vs2, size_t vl);
vint8mf4_t __riscv_vmadd_vv_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                       vint8mf4_t vs1, vint8mf4_t vs2,
                                       size_t vl);
vint8mf4_t __riscv_vmadd_vx_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd, int8_t rs1,
                                       vint8mf4_t vs2, size_t vl);
vint8mf2_t __riscv_vmadd_vv_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                       vint8mf2_t vs1, vint8mf2_t vs2,
                                       size_t vl);
vint8mf2_t __riscv_vmadd_vx_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd, int8_t rs1,
                                       vint8mf2_t vs2, size_t vl);
vint8m1_t __riscv_vmadd_vv_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs1,
                                     vint8m1_t vs2, size_t vl);
vint8m1_t __riscv_vmadd_vx_i8m1_tumu(vbool8_t vm, vint8m1_t vd, int8_t rs1,
                                     vint8m1_t vs2, size_t vl);
vint8m2_t __riscv_vmadd_vv_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs1,
                                     vint8m2_t vs2, size_t vl);
vint8m2_t __riscv_vmadd_vx_i8m2_tumu(vbool4_t vm, vint8m2_t vd, int8_t rs1,
                                     vint8m2_t vs2, size_t vl);
vint8m4_t __riscv_vmadd_vv_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs1,
                                     vint8m4_t vs2, size_t vl);
vint8m4_t __riscv_vmadd_vx_i8m4_tumu(vbool2_t vm, vint8m4_t vd, int8_t rs1,
                                     vint8m4_t vs2, size_t vl);
vint8m8_t __riscv_vmadd_vv_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs1,
                                     vint8m8_t vs2, size_t vl);
vint8m8_t __riscv_vmadd_vx_i8m8_tumu(vbool1_t vm, vint8m8_t vd, int8_t rs1,
                                     vint8m8_t vs2, size_t vl);
vint16mf4_t __riscv_vmadd_vv_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                         vint16mf4_t vs1, vint16mf4_t vs2,
                                         size_t vl);
vint16mf4_t __riscv_vmadd_vx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                         int16_t rs1, vint16mf4_t vs2,
                                         size_t vl);
vint16mf2_t __riscv_vmadd_vv_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                         vint16mf2_t vs1, vint16mf2_t vs2,
                                         size_t vl);
vint16mf2_t __riscv_vmadd_vx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                         int16_t rs1, vint16mf2_t vs2,
                                         size_t vl);
vint16m1_t __riscv_vmadd_vv_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                       vint16m1_t vs1, vint16m1_t vs2,
                                       size_t vl);
vint16m1_t __riscv_vmadd_vx_i16m1_tumu(vbool16_t vm, vint16m1_t vd, int16_t rs1,
                                       vint16m1_t vs2, size_t vl);
vint16m2_t __riscv_vmadd_vv_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                       vint16m2_t vs1, vint16m2_t vs2,
                                       size_t vl);
vint16m2_t __riscv_vmadd_vx_i16m2_tumu(vbool8_t vm, vint16m2_t vd, int16_t rs1,
                                       vint16m2_t vs2, size_t vl);
vint16m4_t __riscv_vmadd_vv_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                       vint16m4_t vs1, vint16m4_t vs2,
                                       size_t vl);
vint16m4_t __riscv_vmadd_vx_i16m4_tumu(vbool4_t vm, vint16m4_t vd, int16_t rs1,
                                       vint16m4_t vs2, size_t vl);
vint16m8_t __riscv_vmadd_vv_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                       vint16m8_t vs1, vint16m8_t vs2,
                                       size_t vl);
vint16m8_t __riscv_vmadd_vx_i16m8_tumu(vbool2_t vm, vint16m8_t vd, int16_t rs1,
                                       vint16m8_t vs2, size_t vl);
vint32mf2_t __riscv_vmadd_vv_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                         vint32mf2_t vs1, vint32mf2_t vs2,
                                         size_t vl);
vint32mf2_t __riscv_vmadd_vx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                         int32_t rs1, vint32mf2_t vs2,
                                         size_t vl);
vint32m1_t __riscv_vmadd_vv_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                       vint32m1_t vs1, vint32m1_t vs2,
                                       size_t vl);
vint32m1_t __riscv_vmadd_vx_i32m1_tumu(vbool32_t vm, vint32m1_t vd, int32_t rs1,
                                       vint32m1_t vs2, size_t vl);
vint32m2_t __riscv_vmadd_vv_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                       vint32m2_t vs1, vint32m2_t vs2,
                                       size_t vl);
vint32m2_t __riscv_vmadd_vx_i32m2_tumu(vbool16_t vm, vint32m2_t vd, int32_t rs1,
                                       vint32m2_t vs2, size_t vl);
vint32m4_t __riscv_vmadd_vv_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                       vint32m4_t vs1, vint32m4_t vs2,
                                       size_t vl);
vint32m4_t __riscv_vmadd_vx_i32m4_tumu(vbool8_t vm, vint32m4_t vd, int32_t rs1,
                                       vint32m4_t vs2, size_t vl);
vint32m8_t __riscv_vmadd_vv_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                       vint32m8_t vs1, vint32m8_t vs2,
                                       size_t vl);
vint32m8_t __riscv_vmadd_vx_i32m8_tumu(vbool4_t vm, vint32m8_t vd, int32_t rs1,
                                       vint32m8_t vs2, size_t vl);
vint64m1_t __riscv_vmadd_vv_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                       vint64m1_t vs1, vint64m1_t vs2,
                                       size_t vl);
vint64m1_t __riscv_vmadd_vx_i64m1_tumu(vbool64_t vm, vint64m1_t vd, int64_t rs1,
                                       vint64m1_t vs2, size_t vl);
vint64m2_t __riscv_vmadd_vv_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                       vint64m2_t vs1, vint64m2_t vs2,
                                       size_t vl);
vint64m2_t __riscv_vmadd_vx_i64m2_tumu(vbool32_t vm, vint64m2_t vd, int64_t rs1,
                                       vint64m2_t vs2, size_t vl);
vint64m4_t __riscv_vmadd_vv_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                       vint64m4_t vs1, vint64m4_t vs2,
                                       size_t vl);
vint64m4_t __riscv_vmadd_vx_i64m4_tumu(vbool16_t vm, vint64m4_t vd, int64_t rs1,
                                       vint64m4_t vs2, size_t vl);
vint64m8_t __riscv_vmadd_vv_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                       vint64m8_t vs1, vint64m8_t vs2,
                                       size_t vl);
vint64m8_t __riscv_vmadd_vx_i64m8_tumu(vbool8_t vm, vint64m8_t vd, int64_t rs1,
                                       vint64m8_t vs2, size_t vl);
vint8mf8_t __riscv_vnmsub_vv_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                        vint8mf8_t vs1, vint8mf8_t vs2,
                                        size_t vl);
vint8mf8_t __riscv_vnmsub_vx_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd, int8_t rs1,
                                        vint8mf8_t vs2, size_t vl);
vint8mf4_t __riscv_vnmsub_vv_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                        vint8mf4_t vs1, vint8mf4_t vs2,
                                        size_t vl);
vint8mf4_t __riscv_vnmsub_vx_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd, int8_t rs1,
                                        vint8mf4_t vs2, size_t vl);
vint8mf2_t __riscv_vnmsub_vv_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                        vint8mf2_t vs1, vint8mf2_t vs2,
                                        size_t vl);
vint8mf2_t __riscv_vnmsub_vx_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd, int8_t rs1,
                                        vint8mf2_t vs2, size_t vl);
vint8m1_t __riscv_vnmsub_vv_i8m1_tumu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs1,
                                      vint8m1_t vs2, size_t vl);
vint8m1_t __riscv_vnmsub_vx_i8m1_tumu(vbool8_t vm, vint8m1_t vd, int8_t rs1,
                                      vint8m1_t vs2, size_t vl);
vint8m2_t __riscv_vnmsub_vv_i8m2_tumu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs1,
                                      vint8m2_t vs2, size_t vl);
vint8m2_t __riscv_vnmsub_vx_i8m2_tumu(vbool4_t vm, vint8m2_t vd, int8_t rs1,
                                      vint8m2_t vs2, size_t vl);
vint8m4_t __riscv_vnmsub_vv_i8m4_tumu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs1,
                                      vint8m4_t vs2, size_t vl);
vint8m4_t __riscv_vnmsub_vx_i8m4_tumu(vbool2_t vm, vint8m4_t vd, int8_t rs1,
                                      vint8m4_t vs2, size_t vl);
vint8m8_t __riscv_vnmsub_vv_i8m8_tumu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs1,
                                      vint8m8_t vs2, size_t vl);
vint8m8_t __riscv_vnmsub_vx_i8m8_tumu(vbool1_t vm, vint8m8_t vd, int8_t rs1,
                                      vint8m8_t vs2, size_t vl);
vint16mf4_t __riscv_vnmsub_vv_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                          vint16mf4_t vs1, vint16mf4_t vs2,
                                          size_t vl);
vint16mf4_t __riscv_vnmsub_vx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                          int16_t rs1, vint16mf4_t vs2,
                                          size_t vl);
vint16mf2_t __riscv_vnmsub_vv_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                          vint16mf2_t vs1, vint16mf2_t vs2,
                                          size_t vl);
vint16mf2_t __riscv_vnmsub_vx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                          int16_t rs1, vint16mf2_t vs2,
                                          size_t vl);
vint16m1_t __riscv_vnmsub_vv_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                        vint16m1_t vs1, vint16m1_t vs2,
                                        size_t vl);
vint16m1_t __riscv_vnmsub_vx_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                        int16_t rs1, vint16m1_t vs2, size_t vl);
vint16m2_t __riscv_vnmsub_vv_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                        vint16m2_t vs1, vint16m2_t vs2,
                                        size_t vl);
vint16m2_t __riscv_vnmsub_vx_i16m2_tumu(vbool8_t vm, vint16m2_t vd, int16_t rs1,
                                        vint16m2_t vs2, size_t vl);
vint16m4_t __riscv_vnmsub_vv_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                        vint16m4_t vs1, vint16m4_t vs2,
                                        size_t vl);
vint16m4_t __riscv_vnmsub_vx_i16m4_tumu(vbool4_t vm, vint16m4_t vd, int16_t rs1,
                                        vint16m4_t vs2, size_t vl);
vint16m8_t __riscv_vnmsub_vv_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                        vint16m8_t vs1, vint16m8_t vs2,
                                        size_t vl);
vint16m8_t __riscv_vnmsub_vx_i16m8_tumu(vbool2_t vm, vint16m8_t vd, int16_t rs1,
                                        vint16m8_t vs2, size_t vl);
vint32mf2_t __riscv_vnmsub_vv_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                          vint32mf2_t vs1, vint32mf2_t vs2,
                                          size_t vl);
vint32mf2_t __riscv_vnmsub_vx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                          int32_t rs1, vint32mf2_t vs2,
                                          size_t vl);
vint32m1_t __riscv_vnmsub_vv_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                        vint32m1_t vs1, vint32m1_t vs2,
                                        size_t vl);
vint32m1_t __riscv_vnmsub_vx_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                        int32_t rs1, vint32m1_t vs2, size_t vl);
vint32m2_t __riscv_vnmsub_vv_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                        vint32m2_t vs1, vint32m2_t vs2,
                                        size_t vl);
vint32m2_t __riscv_vnmsub_vx_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                        int32_t rs1, vint32m2_t vs2, size_t vl);
vint32m4_t __riscv_vnmsub_vv_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                        vint32m4_t vs1, vint32m4_t vs2,
                                        size_t vl);
vint32m4_t __riscv_vnmsub_vx_i32m4_tumu(vbool8_t vm, vint32m4_t vd, int32_t rs1,
                                        vint32m4_t vs2, size_t vl);
vint32m8_t __riscv_vnmsub_vv_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                        vint32m8_t vs1, vint32m8_t vs2,
                                        size_t vl);
vint32m8_t __riscv_vnmsub_vx_i32m8_tumu(vbool4_t vm, vint32m8_t vd, int32_t rs1,
                                        vint32m8_t vs2, size_t vl);
vint64m1_t __riscv_vnmsub_vv_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                        vint64m1_t vs1, vint64m1_t vs2,
                                        size_t vl);
vint64m1_t __riscv_vnmsub_vx_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                        int64_t rs1, vint64m1_t vs2, size_t vl);
vint64m2_t __riscv_vnmsub_vv_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                        vint64m2_t vs1, vint64m2_t vs2,
                                        size_t vl);
vint64m2_t __riscv_vnmsub_vx_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                        int64_t rs1, vint64m2_t vs2, size_t vl);
vint64m4_t __riscv_vnmsub_vv_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                        vint64m4_t vs1, vint64m4_t vs2,
                                        size_t vl);
vint64m4_t __riscv_vnmsub_vx_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                        int64_t rs1, vint64m4_t vs2, size_t vl);
vint64m8_t __riscv_vnmsub_vv_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                        vint64m8_t vs1, vint64m8_t vs2,
                                        size_t vl);
vint64m8_t __riscv_vnmsub_vx_i64m8_tumu(vbool8_t vm, vint64m8_t vd, int64_t rs1,
                                        vint64m8_t vs2, size_t vl);
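
The four integer multiply-add forms listed above differ only in which operand supplies the addend and whether the product is negated: vmacc computes vd = +(vs1 * vs2) + vd, vnmsac computes vd = -(vs1 * vs2) + vd, vmadd computes vd = +(vs1 * vd) + vs2, and vnmsub computes vd = -(vs1 * vd) + vs2. The scalar sketch below models a single element under the tail-undisturbed, mask-undisturbed (tumu) policy used by these variants; it is illustrative only, and the helper name is not part of the intrinsic API.

#include <stddef.h>
#include <stdint.h>

// One-element reference model for the tumu variants above (illustrative only).
// Active element (i < vl and mask bit set): vd is overwritten per the formula.
// Masked-off and tail elements: vd keeps its previous value.
static inline int32_t madd_element_tumu(int mask_bit, size_t i, size_t vl,
                                        int32_t vd, int32_t vs1, int32_t vs2,
                                        int op /* 0:vmacc 1:vnmsac 2:vmadd 3:vnmsub */) {
  if (i >= vl || !mask_bit)          // tail-undisturbed / mask-undisturbed
    return vd;
  switch (op) {
  case 0:  return vs1 * vs2 + vd;    // vmacc
  case 1:  return -(vs1 * vs2) + vd; // vnmsac
  case 2:  return vs1 * vd + vs2;    // vmadd
  default: return -(vs1 * vd) + vs2; // vnmsub
  }
}
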
vuint8mf8_t __riscv_vmacc_vv_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                        vuint8mf8_t vs1, vuint8mf8_t vs2,
                                        size_t vl);
vuint8mf8_t __riscv_vmacc_vx_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                        uint8_t rs1, vuint8mf8_t vs2,
                                        size_t vl);
vuint8mf4_t __riscv_vmacc_vv_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                        vuint8mf4_t vs1, vuint8mf4_t vs2,
                                        size_t vl);
vuint8mf4_t __riscv_vmacc_vx_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                        uint8_t rs1, vuint8mf4_t vs2,
                                        size_t vl);
vuint8mf2_t __riscv_vmacc_vv_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                        vuint8mf2_t vs1, vuint8mf2_t vs2,
                                        size_t vl);
vuint8mf2_t __riscv_vmacc_vx_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                        uint8_t rs1, vuint8mf2_t vs2,
                                        size_t vl);
vuint8m1_t __riscv_vmacc_vv_u8m1_tumu(vbool8_t vm, vuint8m1_t vd,
                                      vuint8m1_t vs1, vuint8m1_t vs2,
                                      size_t vl);
vuint8m1_t __riscv_vmacc_vx_u8m1_tumu(vbool8_t vm, vuint8m1_t vd, uint8_t rs1,
                                      vuint8m1_t vs2, size_t vl);
vuint8m2_t __riscv_vmacc_vv_u8m2_tumu(vbool4_t vm, vuint8m2_t vd,
                                      vuint8m2_t vs1, vuint8m2_t vs2,
                                      size_t vl);
vuint8m2_t __riscv_vmacc_vx_u8m2_tumu(vbool4_t vm, vuint8m2_t vd, uint8_t rs1,
                                      vuint8m2_t vs2, size_t vl);
vuint8m4_t __riscv_vmacc_vv_u8m4_tumu(vbool2_t vm, vuint8m4_t vd,
                                      vuint8m4_t vs1, vuint8m4_t vs2,
                                      size_t vl);
vuint8m4_t __riscv_vmacc_vx_u8m4_tumu(vbool2_t vm, vuint8m4_t vd, uint8_t rs1,
                                      vuint8m4_t vs2, size_t vl);
vuint8m8_t __riscv_vmacc_vv_u8m8_tumu(vbool1_t vm, vuint8m8_t vd,
                                      vuint8m8_t vs1, vuint8m8_t vs2,
                                      size_t vl);
vuint8m8_t __riscv_vmacc_vx_u8m8_tumu(vbool1_t vm, vuint8m8_t vd, uint8_t rs1,
                                      vuint8m8_t vs2, size_t vl);
vuint16mf4_t __riscv_vmacc_vv_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                          vuint16mf4_t vs1, vuint16mf4_t vs2,
                                          size_t vl);
vuint16mf4_t __riscv_vmacc_vx_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                          uint16_t rs1, vuint16mf4_t vs2,
                                          size_t vl);
vuint16mf2_t __riscv_vmacc_vv_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                          vuint16mf2_t vs1, vuint16mf2_t vs2,
                                          size_t vl);
vuint16mf2_t __riscv_vmacc_vx_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                          uint16_t rs1, vuint16mf2_t vs2,
                                          size_t vl);
vuint16m1_t __riscv_vmacc_vv_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                        vuint16m1_t vs1, vuint16m1_t vs2,
                                        size_t vl);
vuint16m1_t __riscv_vmacc_vx_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                        uint16_t rs1, vuint16m1_t vs2,
                                        size_t vl);
vuint16m2_t __riscv_vmacc_vv_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                        vuint16m2_t vs1, vuint16m2_t vs2,
                                        size_t vl);
vuint16m2_t __riscv_vmacc_vx_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                        uint16_t rs1, vuint16m2_t vs2,
                                        size_t vl);
vuint16m4_t __riscv_vmacc_vv_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                        vuint16m4_t vs1, vuint16m4_t vs2,
                                        size_t vl);
vuint16m4_t __riscv_vmacc_vx_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                        uint16_t rs1, vuint16m4_t vs2,
                                        size_t vl);
vuint16m8_t __riscv_vmacc_vv_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                        vuint16m8_t vs1, vuint16m8_t vs2,
                                        size_t vl);
vuint16m8_t __riscv_vmacc_vx_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                        uint16_t rs1, vuint16m8_t vs2,
                                        size_t vl);
vuint32mf2_t __riscv_vmacc_vv_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                          vuint32mf2_t vs1, vuint32mf2_t vs2,
                                          size_t vl);
vuint32mf2_t __riscv_vmacc_vx_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                          uint32_t rs1, vuint32mf2_t vs2,
                                          size_t vl);
vuint32m1_t __riscv_vmacc_vv_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                        vuint32m1_t vs1, vuint32m1_t vs2,
                                        size_t vl);
vuint32m1_t __riscv_vmacc_vx_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                        uint32_t rs1, vuint32m1_t vs2,
                                        size_t vl);
vuint32m2_t __riscv_vmacc_vv_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                        vuint32m2_t vs1, vuint32m2_t vs2,
                                        size_t vl);
vuint32m2_t __riscv_vmacc_vx_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                        uint32_t rs1, vuint32m2_t vs2,
                                        size_t vl);
vuint32m4_t __riscv_vmacc_vv_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                        vuint32m4_t vs1, vuint32m4_t vs2,
                                        size_t vl);
vuint32m4_t __riscv_vmacc_vx_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                        uint32_t rs1, vuint32m4_t vs2,
                                        size_t vl);
vuint32m8_t __riscv_vmacc_vv_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                        vuint32m8_t vs1, vuint32m8_t vs2,
                                        size_t vl);
vuint32m8_t __riscv_vmacc_vx_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                        uint32_t rs1, vuint32m8_t vs2,
                                        size_t vl);
vuint64m1_t __riscv_vmacc_vv_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                        vuint64m1_t vs1, vuint64m1_t vs2,
                                        size_t vl);
vuint64m1_t __riscv_vmacc_vx_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                        uint64_t rs1, vuint64m1_t vs2,
                                        size_t vl);
vuint64m2_t __riscv_vmacc_vv_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                        vuint64m2_t vs1, vuint64m2_t vs2,
                                        size_t vl);
vuint64m2_t __riscv_vmacc_vx_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                        uint64_t rs1, vuint64m2_t vs2,
                                        size_t vl);
vuint64m4_t __riscv_vmacc_vv_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                        vuint64m4_t vs1, vuint64m4_t vs2,
                                        size_t vl);
vuint64m4_t __riscv_vmacc_vx_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                        uint64_t rs1, vuint64m4_t vs2,
                                        size_t vl);
vuint64m8_t __riscv_vmacc_vv_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                        vuint64m8_t vs1, vuint64m8_t vs2,
                                        size_t vl);
vuint64m8_t __riscv_vmacc_vx_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                        uint64_t rs1, vuint64m8_t vs2,
                                        size_t vl);
vuint8mf8_t __riscv_vnmsac_vv_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                         vuint8mf8_t vs1, vuint8mf8_t vs2,
                                         size_t vl);
vuint8mf8_t __riscv_vnmsac_vx_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                         uint8_t rs1, vuint8mf8_t vs2,
                                         size_t vl);
vuint8mf4_t __riscv_vnmsac_vv_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                         vuint8mf4_t vs1, vuint8mf4_t vs2,
                                         size_t vl);
vuint8mf4_t __riscv_vnmsac_vx_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                         uint8_t rs1, vuint8mf4_t vs2,
                                         size_t vl);
vuint8mf2_t __riscv_vnmsac_vv_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                         vuint8mf2_t vs1, vuint8mf2_t vs2,
                                         size_t vl);
vuint8mf2_t __riscv_vnmsac_vx_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                         uint8_t rs1, vuint8mf2_t vs2,
                                         size_t vl);
vuint8m1_t __riscv_vnmsac_vv_u8m1_tumu(vbool8_t vm, vuint8m1_t vd,
                                       vuint8m1_t vs1, vuint8m1_t vs2,
                                       size_t vl);
vuint8m1_t __riscv_vnmsac_vx_u8m1_tumu(vbool8_t vm, vuint8m1_t vd, uint8_t rs1,
                                       vuint8m1_t vs2, size_t vl);
vuint8m2_t __riscv_vnmsac_vv_u8m2_tumu(vbool4_t vm, vuint8m2_t vd,
                                       vuint8m2_t vs1, vuint8m2_t vs2,
                                       size_t vl);
vuint8m2_t __riscv_vnmsac_vx_u8m2_tumu(vbool4_t vm, vuint8m2_t vd, uint8_t rs1,
                                       vuint8m2_t vs2, size_t vl);
vuint8m4_t __riscv_vnmsac_vv_u8m4_tumu(vbool2_t vm, vuint8m4_t vd,
                                       vuint8m4_t vs1, vuint8m4_t vs2,
                                       size_t vl);
vuint8m4_t __riscv_vnmsac_vx_u8m4_tumu(vbool2_t vm, vuint8m4_t vd, uint8_t rs1,
                                       vuint8m4_t vs2, size_t vl);
vuint8m8_t __riscv_vnmsac_vv_u8m8_tumu(vbool1_t vm, vuint8m8_t vd,
                                       vuint8m8_t vs1, vuint8m8_t vs2,
                                       size_t vl);
vuint8m8_t __riscv_vnmsac_vx_u8m8_tumu(vbool1_t vm, vuint8m8_t vd, uint8_t rs1,
                                       vuint8m8_t vs2, size_t vl);
vuint16mf4_t __riscv_vnmsac_vv_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                           vuint16mf4_t vs1, vuint16mf4_t vs2,
                                           size_t vl);
vuint16mf4_t __riscv_vnmsac_vx_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                           uint16_t rs1, vuint16mf4_t vs2,
                                           size_t vl);
vuint16mf2_t __riscv_vnmsac_vv_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                           vuint16mf2_t vs1, vuint16mf2_t vs2,
                                           size_t vl);
vuint16mf2_t __riscv_vnmsac_vx_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                           uint16_t rs1, vuint16mf2_t vs2,
                                           size_t vl);
vuint16m1_t __riscv_vnmsac_vv_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                         vuint16m1_t vs1, vuint16m1_t vs2,
                                         size_t vl);
vuint16m1_t __riscv_vnmsac_vx_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                         uint16_t rs1, vuint16m1_t vs2,
                                         size_t vl);
vuint16m2_t __riscv_vnmsac_vv_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                         vuint16m2_t vs1, vuint16m2_t vs2,
                                         size_t vl);
vuint16m2_t __riscv_vnmsac_vx_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                         uint16_t rs1, vuint16m2_t vs2,
                                         size_t vl);
vuint16m4_t __riscv_vnmsac_vv_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                         vuint16m4_t vs1, vuint16m4_t vs2,
                                         size_t vl);
vuint16m4_t __riscv_vnmsac_vx_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                         uint16_t rs1, vuint16m4_t vs2,
                                         size_t vl);
vuint16m8_t __riscv_vnmsac_vv_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                         vuint16m8_t vs1, vuint16m8_t vs2,
                                         size_t vl);
vuint16m8_t __riscv_vnmsac_vx_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                         uint16_t rs1, vuint16m8_t vs2,
                                         size_t vl);
vuint32mf2_t __riscv_vnmsac_vv_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                           vuint32mf2_t vs1, vuint32mf2_t vs2,
                                           size_t vl);
vuint32mf2_t __riscv_vnmsac_vx_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                           uint32_t rs1, vuint32mf2_t vs2,
                                           size_t vl);
vuint32m1_t __riscv_vnmsac_vv_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                         vuint32m1_t vs1, vuint32m1_t vs2,
                                         size_t vl);
vuint32m1_t __riscv_vnmsac_vx_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                         uint32_t rs1, vuint32m1_t vs2,
                                         size_t vl);
vuint32m2_t __riscv_vnmsac_vv_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                         vuint32m2_t vs1, vuint32m2_t vs2,
                                         size_t vl);
vuint32m2_t __riscv_vnmsac_vx_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                         uint32_t rs1, vuint32m2_t vs2,
                                         size_t vl);
vuint32m4_t __riscv_vnmsac_vv_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                         vuint32m4_t vs1, vuint32m4_t vs2,
                                         size_t vl);
vuint32m4_t __riscv_vnmsac_vx_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                         uint32_t rs1, vuint32m4_t vs2,
                                         size_t vl);
vuint32m8_t __riscv_vnmsac_vv_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                         vuint32m8_t vs1, vuint32m8_t vs2,
                                         size_t vl);
vuint32m8_t __riscv_vnmsac_vx_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                         uint32_t rs1, vuint32m8_t vs2,
                                         size_t vl);
vuint64m1_t __riscv_vnmsac_vv_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                         vuint64m1_t vs1, vuint64m1_t vs2,
                                         size_t vl);
vuint64m1_t __riscv_vnmsac_vx_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                         uint64_t rs1, vuint64m1_t vs2,
                                         size_t vl);
vuint64m2_t __riscv_vnmsac_vv_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                         vuint64m2_t vs1, vuint64m2_t vs2,
                                         size_t vl);
vuint64m2_t __riscv_vnmsac_vx_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                         uint64_t rs1, vuint64m2_t vs2,
                                         size_t vl);
vuint64m4_t __riscv_vnmsac_vv_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                         vuint64m4_t vs1, vuint64m4_t vs2,
                                         size_t vl);
vuint64m4_t __riscv_vnmsac_vx_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                         uint64_t rs1, vuint64m4_t vs2,
                                         size_t vl);
vuint64m8_t __riscv_vnmsac_vv_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                         vuint64m8_t vs1, vuint64m8_t vs2,
                                         size_t vl);
vuint64m8_t __riscv_vnmsac_vx_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                         uint64_t rs1, vuint64m8_t vs2,
                                         size_t vl);
vuint8mf8_t __riscv_vmadd_vv_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                        vuint8mf8_t vs1, vuint8mf8_t vs2,
                                        size_t vl);
vuint8mf8_t __riscv_vmadd_vx_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                        uint8_t rs1, vuint8mf8_t vs2,
                                        size_t vl);
vuint8mf4_t __riscv_vmadd_vv_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                        vuint8mf4_t vs1, vuint8mf4_t vs2,
                                        size_t vl);
vuint8mf4_t __riscv_vmadd_vx_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                        uint8_t rs1, vuint8mf4_t vs2,
                                        size_t vl);
vuint8mf2_t __riscv_vmadd_vv_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                        vuint8mf2_t vs1, vuint8mf2_t vs2,
                                        size_t vl);
vuint8mf2_t __riscv_vmadd_vx_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                        uint8_t rs1, vuint8mf2_t vs2,
                                        size_t vl);
vuint8m1_t __riscv_vmadd_vv_u8m1_tumu(vbool8_t vm, vuint8m1_t vd,
                                      vuint8m1_t vs1, vuint8m1_t vs2,
                                      size_t vl);
vuint8m1_t __riscv_vmadd_vx_u8m1_tumu(vbool8_t vm, vuint8m1_t vd, uint8_t rs1,
                                      vuint8m1_t vs2, size_t vl);
vuint8m2_t __riscv_vmadd_vv_u8m2_tumu(vbool4_t vm, vuint8m2_t vd,
                                      vuint8m2_t vs1, vuint8m2_t vs2,
                                      size_t vl);
vuint8m2_t __riscv_vmadd_vx_u8m2_tumu(vbool4_t vm, vuint8m2_t vd, uint8_t rs1,
                                      vuint8m2_t vs2, size_t vl);
vuint8m4_t __riscv_vmadd_vv_u8m4_tumu(vbool2_t vm, vuint8m4_t vd,
                                      vuint8m4_t vs1, vuint8m4_t vs2,
                                      size_t vl);
vuint8m4_t __riscv_vmadd_vx_u8m4_tumu(vbool2_t vm, vuint8m4_t vd, uint8_t rs1,
                                      vuint8m4_t vs2, size_t vl);
vuint8m8_t __riscv_vmadd_vv_u8m8_tumu(vbool1_t vm, vuint8m8_t vd,
                                      vuint8m8_t vs1, vuint8m8_t vs2,
                                      size_t vl);
vuint8m8_t __riscv_vmadd_vx_u8m8_tumu(vbool1_t vm, vuint8m8_t vd, uint8_t rs1,
                                      vuint8m8_t vs2, size_t vl);
vuint16mf4_t __riscv_vmadd_vv_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                          vuint16mf4_t vs1, vuint16mf4_t vs2,
                                          size_t vl);
vuint16mf4_t __riscv_vmadd_vx_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                          uint16_t rs1, vuint16mf4_t vs2,
                                          size_t vl);
vuint16mf2_t __riscv_vmadd_vv_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                          vuint16mf2_t vs1, vuint16mf2_t vs2,
                                          size_t vl);
vuint16mf2_t __riscv_vmadd_vx_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                          uint16_t rs1, vuint16mf2_t vs2,
                                          size_t vl);
vuint16m1_t __riscv_vmadd_vv_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                        vuint16m1_t vs1, vuint16m1_t vs2,
                                        size_t vl);
vuint16m1_t __riscv_vmadd_vx_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                        uint16_t rs1, vuint16m1_t vs2,
                                        size_t vl);
vuint16m2_t __riscv_vmadd_vv_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                        vuint16m2_t vs1, vuint16m2_t vs2,
                                        size_t vl);
vuint16m2_t __riscv_vmadd_vx_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                        uint16_t rs1, vuint16m2_t vs2,
                                        size_t vl);
vuint16m4_t __riscv_vmadd_vv_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                        vuint16m4_t vs1, vuint16m4_t vs2,
                                        size_t vl);
vuint16m4_t __riscv_vmadd_vx_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                        uint16_t rs1, vuint16m4_t vs2,
                                        size_t vl);
vuint16m8_t __riscv_vmadd_vv_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                        vuint16m8_t vs1, vuint16m8_t vs2,
                                        size_t vl);
vuint16m8_t __riscv_vmadd_vx_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                        uint16_t rs1, vuint16m8_t vs2,
                                        size_t vl);
vuint32mf2_t __riscv_vmadd_vv_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                          vuint32mf2_t vs1, vuint32mf2_t vs2,
                                          size_t vl);
vuint32mf2_t __riscv_vmadd_vx_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                          uint32_t rs1, vuint32mf2_t vs2,
                                          size_t vl);
vuint32m1_t __riscv_vmadd_vv_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                        vuint32m1_t vs1, vuint32m1_t vs2,
                                        size_t vl);
vuint32m1_t __riscv_vmadd_vx_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                        uint32_t rs1, vuint32m1_t vs2,
                                        size_t vl);
vuint32m2_t __riscv_vmadd_vv_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                        vuint32m2_t vs1, vuint32m2_t vs2,
                                        size_t vl);
vuint32m2_t __riscv_vmadd_vx_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                        uint32_t rs1, vuint32m2_t vs2,
                                        size_t vl);
vuint32m4_t __riscv_vmadd_vv_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                        vuint32m4_t vs1, vuint32m4_t vs2,
                                        size_t vl);
vuint32m4_t __riscv_vmadd_vx_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                        uint32_t rs1, vuint32m4_t vs2,
                                        size_t vl);
vuint32m8_t __riscv_vmadd_vv_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                        vuint32m8_t vs1, vuint32m8_t vs2,
                                        size_t vl);
vuint32m8_t __riscv_vmadd_vx_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                        uint32_t rs1, vuint32m8_t vs2,
                                        size_t vl);
vuint64m1_t __riscv_vmadd_vv_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                        vuint64m1_t vs1, vuint64m1_t vs2,
                                        size_t vl);
vuint64m1_t __riscv_vmadd_vx_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                        uint64_t rs1, vuint64m1_t vs2,
                                        size_t vl);
vuint64m2_t __riscv_vmadd_vv_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                        vuint64m2_t vs1, vuint64m2_t vs2,
                                        size_t vl);
vuint64m2_t __riscv_vmadd_vx_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                        uint64_t rs1, vuint64m2_t vs2,
                                        size_t vl);
vuint64m4_t __riscv_vmadd_vv_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                        vuint64m4_t vs1, vuint64m4_t vs2,
                                        size_t vl);
vuint64m4_t __riscv_vmadd_vx_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                        uint64_t rs1, vuint64m4_t vs2,
                                        size_t vl);
vuint64m8_t __riscv_vmadd_vv_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                        vuint64m8_t vs1, vuint64m8_t vs2,
                                        size_t vl);
vuint64m8_t __riscv_vmadd_vx_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                        uint64_t rs1, vuint64m8_t vs2,
                                        size_t vl);
vuint8mf8_t __riscv_vnmsub_vv_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                         vuint8mf8_t vs1, vuint8mf8_t vs2,
                                         size_t vl);
vuint8mf8_t __riscv_vnmsub_vx_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                         uint8_t rs1, vuint8mf8_t vs2,
                                         size_t vl);
vuint8mf4_t __riscv_vnmsub_vv_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                         vuint8mf4_t vs1, vuint8mf4_t vs2,
                                         size_t vl);
vuint8mf4_t __riscv_vnmsub_vx_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                         uint8_t rs1, vuint8mf4_t vs2,
                                         size_t vl);
vuint8mf2_t __riscv_vnmsub_vv_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                         vuint8mf2_t vs1, vuint8mf2_t vs2,
                                         size_t vl);
vuint8mf2_t __riscv_vnmsub_vx_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                         uint8_t rs1, vuint8mf2_t vs2,
                                         size_t vl);
vuint8m1_t __riscv_vnmsub_vv_u8m1_tumu(vbool8_t vm, vuint8m1_t vd,
                                       vuint8m1_t vs1, vuint8m1_t vs2,
                                       size_t vl);
vuint8m1_t __riscv_vnmsub_vx_u8m1_tumu(vbool8_t vm, vuint8m1_t vd, uint8_t rs1,
                                       vuint8m1_t vs2, size_t vl);
vuint8m2_t __riscv_vnmsub_vv_u8m2_tumu(vbool4_t vm, vuint8m2_t vd,
                                       vuint8m2_t vs1, vuint8m2_t vs2,
                                       size_t vl);
vuint8m2_t __riscv_vnmsub_vx_u8m2_tumu(vbool4_t vm, vuint8m2_t vd, uint8_t rs1,
                                       vuint8m2_t vs2, size_t vl);
vuint8m4_t __riscv_vnmsub_vv_u8m4_tumu(vbool2_t vm, vuint8m4_t vd,
                                       vuint8m4_t vs1, vuint8m4_t vs2,
                                       size_t vl);
vuint8m4_t __riscv_vnmsub_vx_u8m4_tumu(vbool2_t vm, vuint8m4_t vd, uint8_t rs1,
                                       vuint8m4_t vs2, size_t vl);
vuint8m8_t __riscv_vnmsub_vv_u8m8_tumu(vbool1_t vm, vuint8m8_t vd,
                                       vuint8m8_t vs1, vuint8m8_t vs2,
                                       size_t vl);
vuint8m8_t __riscv_vnmsub_vx_u8m8_tumu(vbool1_t vm, vuint8m8_t vd, uint8_t rs1,
                                       vuint8m8_t vs2, size_t vl);
vuint16mf4_t __riscv_vnmsub_vv_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                           vuint16mf4_t vs1, vuint16mf4_t vs2,
                                           size_t vl);
vuint16mf4_t __riscv_vnmsub_vx_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                           uint16_t rs1, vuint16mf4_t vs2,
                                           size_t vl);
vuint16mf2_t __riscv_vnmsub_vv_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                           vuint16mf2_t vs1, vuint16mf2_t vs2,
                                           size_t vl);
vuint16mf2_t __riscv_vnmsub_vx_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                           uint16_t rs1, vuint16mf2_t vs2,
                                           size_t vl);
vuint16m1_t __riscv_vnmsub_vv_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                         vuint16m1_t vs1, vuint16m1_t vs2,
                                         size_t vl);
vuint16m1_t __riscv_vnmsub_vx_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                         uint16_t rs1, vuint16m1_t vs2,
                                         size_t vl);
vuint16m2_t __riscv_vnmsub_vv_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                         vuint16m2_t vs1, vuint16m2_t vs2,
                                         size_t vl);
vuint16m2_t __riscv_vnmsub_vx_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                         uint16_t rs1, vuint16m2_t vs2,
                                         size_t vl);
vuint16m4_t __riscv_vnmsub_vv_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                         vuint16m4_t vs1, vuint16m4_t vs2,
                                         size_t vl);
vuint16m4_t __riscv_vnmsub_vx_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                         uint16_t rs1, vuint16m4_t vs2,
                                         size_t vl);
vuint16m8_t __riscv_vnmsub_vv_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                         vuint16m8_t vs1, vuint16m8_t vs2,
                                         size_t vl);
vuint16m8_t __riscv_vnmsub_vx_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                         uint16_t rs1, vuint16m8_t vs2,
                                         size_t vl);
vuint32mf2_t __riscv_vnmsub_vv_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                           vuint32mf2_t vs1, vuint32mf2_t vs2,
                                           size_t vl);
vuint32mf2_t __riscv_vnmsub_vx_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                           uint32_t rs1, vuint32mf2_t vs2,
                                           size_t vl);
vuint32m1_t __riscv_vnmsub_vv_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                         vuint32m1_t vs1, vuint32m1_t vs2,
                                         size_t vl);
vuint32m1_t __riscv_vnmsub_vx_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                         uint32_t rs1, vuint32m1_t vs2,
                                         size_t vl);
vuint32m2_t __riscv_vnmsub_vv_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                         vuint32m2_t vs1, vuint32m2_t vs2,
                                         size_t vl);
vuint32m2_t __riscv_vnmsub_vx_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                         uint32_t rs1, vuint32m2_t vs2,
                                         size_t vl);
vuint32m4_t __riscv_vnmsub_vv_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                         vuint32m4_t vs1, vuint32m4_t vs2,
                                         size_t vl);
vuint32m4_t __riscv_vnmsub_vx_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                         uint32_t rs1, vuint32m4_t vs2,
                                         size_t vl);
vuint32m8_t __riscv_vnmsub_vv_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                         vuint32m8_t vs1, vuint32m8_t vs2,
                                         size_t vl);
vuint32m8_t __riscv_vnmsub_vx_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                         uint32_t rs1, vuint32m8_t vs2,
                                         size_t vl);
vuint64m1_t __riscv_vnmsub_vv_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                         vuint64m1_t vs1, vuint64m1_t vs2,
                                         size_t vl);
vuint64m1_t __riscv_vnmsub_vx_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                         uint64_t rs1, vuint64m1_t vs2,
                                         size_t vl);
vuint64m2_t __riscv_vnmsub_vv_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                         vuint64m2_t vs1, vuint64m2_t vs2,
                                         size_t vl);
vuint64m2_t __riscv_vnmsub_vx_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                         uint64_t rs1, vuint64m2_t vs2,
                                         size_t vl);
vuint64m4_t __riscv_vnmsub_vv_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                         vuint64m4_t vs1, vuint64m4_t vs2,
                                         size_t vl);
vuint64m4_t __riscv_vnmsub_vx_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                         uint64_t rs1, vuint64m4_t vs2,
                                         size_t vl);
vuint64m8_t __riscv_vnmsub_vv_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                         vuint64m8_t vs1, vuint64m8_t vs2,
                                         size_t vl);
vuint64m8_t __riscv_vnmsub_vx_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                         uint64_t rs1, vuint64m8_t vs2,
                                         size_t vl);
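
As a usage illustration for the tumu variants above, the sketch below accumulates an elementwise product into an existing accumulator with __riscv_vmacc_vv_u32m1_tumu, leaving masked-off and tail elements of the accumulator undisturbed. The surrounding load, store, vsetvl, and compare intrinsics are taken from other sections of this document; the wrapper function itself is a hypothetical example, not part of the API.

#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

// acc[i] += a[i] * b[i] only where b[i] != 0; all other elements of acc,
// including the tail, are left undisturbed (tumu policy).
void masked_mul_accumulate(uint32_t *acc, const uint32_t *a,
                           const uint32_t *b, size_t n) {
  for (size_t i = 0; i < n;) {
    size_t vl = __riscv_vsetvl_e32m1(n - i);
    vuint32m1_t vacc = __riscv_vle32_v_u32m1(acc + i, vl);
    vuint32m1_t va = __riscv_vle32_v_u32m1(a + i, vl);
    vuint32m1_t vb = __riscv_vle32_v_u32m1(b + i, vl);
    vbool32_t vm = __riscv_vmsne_vx_u32m1_b32(vb, 0, vl); // active where b[i] != 0
    vacc = __riscv_vmacc_vv_u32m1_tumu(vm, vacc, va, vb, vl);
    __riscv_vse32_v_u32m1(acc + i, vacc, vl);
    i += vl;
  }
}
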
// masked functions
vint8mf8_t __riscv_vmacc_vv_i8mf8_mu(vbool64_t vm, vint8mf8_t vd,
                                     vint8mf8_t vs1, vint8mf8_t vs2, size_t vl);
vint8mf8_t __riscv_vmacc_vx_i8mf8_mu(vbool64_t vm, vint8mf8_t vd, int8_t rs1,
                                     vint8mf8_t vs2, size_t vl);
vint8mf4_t __riscv_vmacc_vv_i8mf4_mu(vbool32_t vm, vint8mf4_t vd,
                                     vint8mf4_t vs1, vint8mf4_t vs2, size_t vl);
vint8mf4_t __riscv_vmacc_vx_i8mf4_mu(vbool32_t vm, vint8mf4_t vd, int8_t rs1,
                                     vint8mf4_t vs2, size_t vl);
vint8mf2_t __riscv_vmacc_vv_i8mf2_mu(vbool16_t vm, vint8mf2_t vd,
                                     vint8mf2_t vs1, vint8mf2_t vs2, size_t vl);
vint8mf2_t __riscv_vmacc_vx_i8mf2_mu(vbool16_t vm, vint8mf2_t vd, int8_t rs1,
                                     vint8mf2_t vs2, size_t vl);
vint8m1_t __riscv_vmacc_vv_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs1,
                                   vint8m1_t vs2, size_t vl);
vint8m1_t __riscv_vmacc_vx_i8m1_mu(vbool8_t vm, vint8m1_t vd, int8_t rs1,
                                   vint8m1_t vs2, size_t vl);
vint8m2_t __riscv_vmacc_vv_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs1,
                                   vint8m2_t vs2, size_t vl);
vint8m2_t __riscv_vmacc_vx_i8m2_mu(vbool4_t vm, vint8m2_t vd, int8_t rs1,
                                   vint8m2_t vs2, size_t vl);
vint8m4_t __riscv_vmacc_vv_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs1,
                                   vint8m4_t vs2, size_t vl);
vint8m4_t __riscv_vmacc_vx_i8m4_mu(vbool2_t vm, vint8m4_t vd, int8_t rs1,
                                   vint8m4_t vs2, size_t vl);
vint8m8_t __riscv_vmacc_vv_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs1,
                                   vint8m8_t vs2, size_t vl);
vint8m8_t __riscv_vmacc_vx_i8m8_mu(vbool1_t vm, vint8m8_t vd, int8_t rs1,
                                   vint8m8_t vs2, size_t vl);
vint16mf4_t __riscv_vmacc_vv_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs1, vint16mf4_t vs2,
                                       size_t vl);
vint16mf4_t __riscv_vmacc_vx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                       int16_t rs1, vint16mf4_t vs2, size_t vl);
vint16mf2_t __riscv_vmacc_vv_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs1, vint16mf2_t vs2,
                                       size_t vl);
vint16mf2_t __riscv_vmacc_vx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                       int16_t rs1, vint16mf2_t vs2, size_t vl);
vint16m1_t __riscv_vmacc_vv_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs1, vint16m1_t vs2, size_t vl);
vint16m1_t __riscv_vmacc_vx_i16m1_mu(vbool16_t vm, vint16m1_t vd, int16_t rs1,
                                     vint16m1_t vs2, size_t vl);
vint16m2_t __riscv_vmacc_vv_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs1,
                                     vint16m2_t vs2, size_t vl);
vint16m2_t __riscv_vmacc_vx_i16m2_mu(vbool8_t vm, vint16m2_t vd, int16_t rs1,
                                     vint16m2_t vs2, size_t vl);
vint16m4_t __riscv_vmacc_vv_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs1,
                                     vint16m4_t vs2, size_t vl);
vint16m4_t __riscv_vmacc_vx_i16m4_mu(vbool4_t vm, vint16m4_t vd, int16_t rs1,
                                     vint16m4_t vs2, size_t vl);
vint16m8_t __riscv_vmacc_vv_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs1,
                                     vint16m8_t vs2, size_t vl);
vint16m8_t __riscv_vmacc_vx_i16m8_mu(vbool2_t vm, vint16m8_t vd, int16_t rs1,
                                     vint16m8_t vs2, size_t vl);
vint32mf2_t __riscv_vmacc_vv_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs1, vint32mf2_t vs2,
                                       size_t vl);
vint32mf2_t __riscv_vmacc_vx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                       int32_t rs1, vint32mf2_t vs2, size_t vl);
vint32m1_t __riscv_vmacc_vv_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs1, vint32m1_t vs2, size_t vl);
vint32m1_t __riscv_vmacc_vx_i32m1_mu(vbool32_t vm, vint32m1_t vd, int32_t rs1,
                                     vint32m1_t vs2, size_t vl);
vint32m2_t __riscv_vmacc_vv_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs1, vint32m2_t vs2, size_t vl);
vint32m2_t __riscv_vmacc_vx_i32m2_mu(vbool16_t vm, vint32m2_t vd, int32_t rs1,
                                     vint32m2_t vs2, size_t vl);
vint32m4_t __riscv_vmacc_vv_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs1,
                                     vint32m4_t vs2, size_t vl);
vint32m4_t __riscv_vmacc_vx_i32m4_mu(vbool8_t vm, vint32m4_t vd, int32_t rs1,
                                     vint32m4_t vs2, size_t vl);
vint32m8_t __riscv_vmacc_vv_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs1,
                                     vint32m8_t vs2, size_t vl);
vint32m8_t __riscv_vmacc_vx_i32m8_mu(vbool4_t vm, vint32m8_t vd, int32_t rs1,
                                     vint32m8_t vs2, size_t vl);
vint64m1_t __riscv_vmacc_vv_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs1, vint64m1_t vs2, size_t vl);
vint64m1_t __riscv_vmacc_vx_i64m1_mu(vbool64_t vm, vint64m1_t vd, int64_t rs1,
                                     vint64m1_t vs2, size_t vl);
vint64m2_t __riscv_vmacc_vv_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs1, vint64m2_t vs2, size_t vl);
vint64m2_t __riscv_vmacc_vx_i64m2_mu(vbool32_t vm, vint64m2_t vd, int64_t rs1,
                                     vint64m2_t vs2, size_t vl);
vint64m4_t __riscv_vmacc_vv_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs1, vint64m4_t vs2, size_t vl);
vint64m4_t __riscv_vmacc_vx_i64m4_mu(vbool16_t vm, vint64m4_t vd, int64_t rs1,
                                     vint64m4_t vs2, size_t vl);
vint64m8_t __riscv_vmacc_vv_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs1,
                                     vint64m8_t vs2, size_t vl);
vint64m8_t __riscv_vmacc_vx_i64m8_mu(vbool8_t vm, vint64m8_t vd, int64_t rs1,
                                     vint64m8_t vs2, size_t vl);
vint8mf8_t __riscv_vnmsac_vv_i8mf8_mu(vbool64_t vm, vint8mf8_t vd,
                                      vint8mf8_t vs1, vint8mf8_t vs2,
                                      size_t vl);
vint8mf8_t __riscv_vnmsac_vx_i8mf8_mu(vbool64_t vm, vint8mf8_t vd, int8_t rs1,
                                      vint8mf8_t vs2, size_t vl);
vint8mf4_t __riscv_vnmsac_vv_i8mf4_mu(vbool32_t vm, vint8mf4_t vd,
                                      vint8mf4_t vs1, vint8mf4_t vs2,
                                      size_t vl);
vint8mf4_t __riscv_vnmsac_vx_i8mf4_mu(vbool32_t vm, vint8mf4_t vd, int8_t rs1,
                                      vint8mf4_t vs2, size_t vl);
vint8mf2_t __riscv_vnmsac_vv_i8mf2_mu(vbool16_t vm, vint8mf2_t vd,
                                      vint8mf2_t vs1, vint8mf2_t vs2,
                                      size_t vl);
vint8mf2_t __riscv_vnmsac_vx_i8mf2_mu(vbool16_t vm, vint8mf2_t vd, int8_t rs1,
                                      vint8mf2_t vs2, size_t vl);
vint8m1_t __riscv_vnmsac_vv_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs1,
                                    vint8m1_t vs2, size_t vl);
vint8m1_t __riscv_vnmsac_vx_i8m1_mu(vbool8_t vm, vint8m1_t vd, int8_t rs1,
                                    vint8m1_t vs2, size_t vl);
vint8m2_t __riscv_vnmsac_vv_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs1,
                                    vint8m2_t vs2, size_t vl);
vint8m2_t __riscv_vnmsac_vx_i8m2_mu(vbool4_t vm, vint8m2_t vd, int8_t rs1,
                                    vint8m2_t vs2, size_t vl);
vint8m4_t __riscv_vnmsac_vv_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs1,
                                    vint8m4_t vs2, size_t vl);
vint8m4_t __riscv_vnmsac_vx_i8m4_mu(vbool2_t vm, vint8m4_t vd, int8_t rs1,
                                    vint8m4_t vs2, size_t vl);
vint8m8_t __riscv_vnmsac_vv_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs1,
                                    vint8m8_t vs2, size_t vl);
vint8m8_t __riscv_vnmsac_vx_i8m8_mu(vbool1_t vm, vint8m8_t vd, int8_t rs1,
                                    vint8m8_t vs2, size_t vl);
vint16mf4_t __riscv_vnmsac_vv_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs1, vint16mf4_t vs2,
                                        size_t vl);
vint16mf4_t __riscv_vnmsac_vx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                        int16_t rs1, vint16mf4_t vs2,
                                        size_t vl);
vint16mf2_t __riscv_vnmsac_vv_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs1, vint16mf2_t vs2,
                                        size_t vl);
vint16mf2_t __riscv_vnmsac_vx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                        int16_t rs1, vint16mf2_t vs2,
                                        size_t vl);
vint16m1_t __riscv_vnmsac_vv_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs1, vint16m1_t vs2,
                                      size_t vl);
vint16m1_t __riscv_vnmsac_vx_i16m1_mu(vbool16_t vm, vint16m1_t vd, int16_t rs1,
                                      vint16m1_t vs2, size_t vl);
vint16m2_t __riscv_vnmsac_vv_i16m2_mu(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs1, vint16m2_t vs2,
                                      size_t vl);
vint16m2_t __riscv_vnmsac_vx_i16m2_mu(vbool8_t vm, vint16m2_t vd, int16_t rs1,
                                      vint16m2_t vs2, size_t vl);
vint16m4_t __riscv_vnmsac_vv_i16m4_mu(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs1, vint16m4_t vs2,
                                      size_t vl);
vint16m4_t __riscv_vnmsac_vx_i16m4_mu(vbool4_t vm, vint16m4_t vd, int16_t rs1,
                                      vint16m4_t vs2, size_t vl);
vint16m8_t __riscv_vnmsac_vv_i16m8_mu(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs1, vint16m8_t vs2,
                                      size_t vl);
vint16m8_t __riscv_vnmsac_vx_i16m8_mu(vbool2_t vm, vint16m8_t vd, int16_t rs1,
                                      vint16m8_t vs2, size_t vl);
vint32mf2_t __riscv_vnmsac_vv_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs1, vint32mf2_t vs2,
                                        size_t vl);
vint32mf2_t __riscv_vnmsac_vx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                        int32_t rs1, vint32mf2_t vs2,
                                        size_t vl);
vint32m1_t __riscv_vnmsac_vv_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs1, vint32m1_t vs2,
                                      size_t vl);
vint32m1_t __riscv_vnmsac_vx_i32m1_mu(vbool32_t vm, vint32m1_t vd, int32_t rs1,
                                      vint32m1_t vs2, size_t vl);
vint32m2_t __riscv_vnmsac_vv_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs1, vint32m2_t vs2,
                                      size_t vl);
vint32m2_t __riscv_vnmsac_vx_i32m2_mu(vbool16_t vm, vint32m2_t vd, int32_t rs1,
                                      vint32m2_t vs2, size_t vl);
vint32m4_t __riscv_vnmsac_vv_i32m4_mu(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs1, vint32m4_t vs2,
                                      size_t vl);
vint32m4_t __riscv_vnmsac_vx_i32m4_mu(vbool8_t vm, vint32m4_t vd, int32_t rs1,
                                      vint32m4_t vs2, size_t vl);
vint32m8_t __riscv_vnmsac_vv_i32m8_mu(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs1, vint32m8_t vs2,
                                      size_t vl);
vint32m8_t __riscv_vnmsac_vx_i32m8_mu(vbool4_t vm, vint32m8_t vd, int32_t rs1,
                                      vint32m8_t vs2, size_t vl);
vint64m1_t __riscv_vnmsac_vv_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs1, vint64m1_t vs2,
                                      size_t vl);
vint64m1_t __riscv_vnmsac_vx_i64m1_mu(vbool64_t vm, vint64m1_t vd, int64_t rs1,
                                      vint64m1_t vs2, size_t vl);
vint64m2_t __riscv_vnmsac_vv_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs1, vint64m2_t vs2,
                                      size_t vl);
vint64m2_t __riscv_vnmsac_vx_i64m2_mu(vbool32_t vm, vint64m2_t vd, int64_t rs1,
                                      vint64m2_t vs2, size_t vl);
vint64m4_t __riscv_vnmsac_vv_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs1, vint64m4_t vs2,
                                      size_t vl);
vint64m4_t __riscv_vnmsac_vx_i64m4_mu(vbool16_t vm, vint64m4_t vd, int64_t rs1,
                                      vint64m4_t vs2, size_t vl);
vint64m8_t __riscv_vnmsac_vv_i64m8_mu(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs1, vint64m8_t vs2,
                                      size_t vl);
vint64m8_t __riscv_vnmsac_vx_i64m8_mu(vbool8_t vm, vint64m8_t vd, int64_t rs1,
                                      vint64m8_t vs2, size_t vl);
vint8mf8_t __riscv_vmadd_vv_i8mf8_mu(vbool64_t vm, vint8mf8_t vd,
                                     vint8mf8_t vs1, vint8mf8_t vs2, size_t vl);
vint8mf8_t __riscv_vmadd_vx_i8mf8_mu(vbool64_t vm, vint8mf8_t vd, int8_t rs1,
                                     vint8mf8_t vs2, size_t vl);
vint8mf4_t __riscv_vmadd_vv_i8mf4_mu(vbool32_t vm, vint8mf4_t vd,
                                     vint8mf4_t vs1, vint8mf4_t vs2, size_t vl);
vint8mf4_t __riscv_vmadd_vx_i8mf4_mu(vbool32_t vm, vint8mf4_t vd, int8_t rs1,
                                     vint8mf4_t vs2, size_t vl);
vint8mf2_t __riscv_vmadd_vv_i8mf2_mu(vbool16_t vm, vint8mf2_t vd,
                                     vint8mf2_t vs1, vint8mf2_t vs2, size_t vl);
vint8mf2_t __riscv_vmadd_vx_i8mf2_mu(vbool16_t vm, vint8mf2_t vd, int8_t rs1,
                                     vint8mf2_t vs2, size_t vl);
vint8m1_t __riscv_vmadd_vv_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs1,
                                   vint8m1_t vs2, size_t vl);
vint8m1_t __riscv_vmadd_vx_i8m1_mu(vbool8_t vm, vint8m1_t vd, int8_t rs1,
                                   vint8m1_t vs2, size_t vl);
vint8m2_t __riscv_vmadd_vv_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs1,
                                   vint8m2_t vs2, size_t vl);
vint8m2_t __riscv_vmadd_vx_i8m2_mu(vbool4_t vm, vint8m2_t vd, int8_t rs1,
                                   vint8m2_t vs2, size_t vl);
vint8m4_t __riscv_vmadd_vv_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs1,
                                   vint8m4_t vs2, size_t vl);
vint8m4_t __riscv_vmadd_vx_i8m4_mu(vbool2_t vm, vint8m4_t vd, int8_t rs1,
                                   vint8m4_t vs2, size_t vl);
vint8m8_t __riscv_vmadd_vv_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs1,
                                   vint8m8_t vs2, size_t vl);
vint8m8_t __riscv_vmadd_vx_i8m8_mu(vbool1_t vm, vint8m8_t vd, int8_t rs1,
                                   vint8m8_t vs2, size_t vl);
vint16mf4_t __riscv_vmadd_vv_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                       vint16mf4_t vs1, vint16mf4_t vs2,
                                       size_t vl);
vint16mf4_t __riscv_vmadd_vx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                       int16_t rs1, vint16mf4_t vs2, size_t vl);
vint16mf2_t __riscv_vmadd_vv_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                       vint16mf2_t vs1, vint16mf2_t vs2,
                                       size_t vl);
vint16mf2_t __riscv_vmadd_vx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                       int16_t rs1, vint16mf2_t vs2, size_t vl);
vint16m1_t __riscv_vmadd_vv_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                     vint16m1_t vs1, vint16m1_t vs2, size_t vl);
vint16m1_t __riscv_vmadd_vx_i16m1_mu(vbool16_t vm, vint16m1_t vd, int16_t rs1,
                                     vint16m1_t vs2, size_t vl);
vint16m2_t __riscv_vmadd_vv_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint16m2_t vs1,
                                     vint16m2_t vs2, size_t vl);
vint16m2_t __riscv_vmadd_vx_i16m2_mu(vbool8_t vm, vint16m2_t vd, int16_t rs1,
                                     vint16m2_t vs2, size_t vl);
vint16m4_t __riscv_vmadd_vv_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint16m4_t vs1,
                                     vint16m4_t vs2, size_t vl);
vint16m4_t __riscv_vmadd_vx_i16m4_mu(vbool4_t vm, vint16m4_t vd, int16_t rs1,
                                     vint16m4_t vs2, size_t vl);
vint16m8_t __riscv_vmadd_vv_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint16m8_t vs1,
                                     vint16m8_t vs2, size_t vl);
vint16m8_t __riscv_vmadd_vx_i16m8_mu(vbool2_t vm, vint16m8_t vd, int16_t rs1,
                                     vint16m8_t vs2, size_t vl);
vint32mf2_t __riscv_vmadd_vv_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                       vint32mf2_t vs1, vint32mf2_t vs2,
                                       size_t vl);
vint32mf2_t __riscv_vmadd_vx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                       int32_t rs1, vint32mf2_t vs2, size_t vl);
vint32m1_t __riscv_vmadd_vv_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                     vint32m1_t vs1, vint32m1_t vs2, size_t vl);
vint32m1_t __riscv_vmadd_vx_i32m1_mu(vbool32_t vm, vint32m1_t vd, int32_t rs1,
                                     vint32m1_t vs2, size_t vl);
vint32m2_t __riscv_vmadd_vv_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                     vint32m2_t vs1, vint32m2_t vs2, size_t vl);
vint32m2_t __riscv_vmadd_vx_i32m2_mu(vbool16_t vm, vint32m2_t vd, int32_t rs1,
                                     vint32m2_t vs2, size_t vl);
vint32m4_t __riscv_vmadd_vv_i32m4_mu(vbool8_t vm, vint32m4_t vd, vint32m4_t vs1,
                                     vint32m4_t vs2, size_t vl);
vint32m4_t __riscv_vmadd_vx_i32m4_mu(vbool8_t vm, vint32m4_t vd, int32_t rs1,
                                     vint32m4_t vs2, size_t vl);
vint32m8_t __riscv_vmadd_vv_i32m8_mu(vbool4_t vm, vint32m8_t vd, vint32m8_t vs1,
                                     vint32m8_t vs2, size_t vl);
vint32m8_t __riscv_vmadd_vx_i32m8_mu(vbool4_t vm, vint32m8_t vd, int32_t rs1,
                                     vint32m8_t vs2, size_t vl);
vint64m1_t __riscv_vmadd_vv_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                     vint64m1_t vs1, vint64m1_t vs2, size_t vl);
vint64m1_t __riscv_vmadd_vx_i64m1_mu(vbool64_t vm, vint64m1_t vd, int64_t rs1,
                                     vint64m1_t vs2, size_t vl);
vint64m2_t __riscv_vmadd_vv_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                     vint64m2_t vs1, vint64m2_t vs2, size_t vl);
vint64m2_t __riscv_vmadd_vx_i64m2_mu(vbool32_t vm, vint64m2_t vd, int64_t rs1,
                                     vint64m2_t vs2, size_t vl);
vint64m4_t __riscv_vmadd_vv_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                     vint64m4_t vs1, vint64m4_t vs2, size_t vl);
vint64m4_t __riscv_vmadd_vx_i64m4_mu(vbool16_t vm, vint64m4_t vd, int64_t rs1,
                                     vint64m4_t vs2, size_t vl);
vint64m8_t __riscv_vmadd_vv_i64m8_mu(vbool8_t vm, vint64m8_t vd, vint64m8_t vs1,
                                     vint64m8_t vs2, size_t vl);
vint64m8_t __riscv_vmadd_vx_i64m8_mu(vbool8_t vm, vint64m8_t vd, int64_t rs1,
                                     vint64m8_t vs2, size_t vl);
vint8mf8_t __riscv_vnmsub_vv_i8mf8_mu(vbool64_t vm, vint8mf8_t vd,
                                      vint8mf8_t vs1, vint8mf8_t vs2,
                                      size_t vl);
vint8mf8_t __riscv_vnmsub_vx_i8mf8_mu(vbool64_t vm, vint8mf8_t vd, int8_t rs1,
                                      vint8mf8_t vs2, size_t vl);
vint8mf4_t __riscv_vnmsub_vv_i8mf4_mu(vbool32_t vm, vint8mf4_t vd,
                                      vint8mf4_t vs1, vint8mf4_t vs2,
                                      size_t vl);
vint8mf4_t __riscv_vnmsub_vx_i8mf4_mu(vbool32_t vm, vint8mf4_t vd, int8_t rs1,
                                      vint8mf4_t vs2, size_t vl);
vint8mf2_t __riscv_vnmsub_vv_i8mf2_mu(vbool16_t vm, vint8mf2_t vd,
                                      vint8mf2_t vs1, vint8mf2_t vs2,
                                      size_t vl);
vint8mf2_t __riscv_vnmsub_vx_i8mf2_mu(vbool16_t vm, vint8mf2_t vd, int8_t rs1,
                                      vint8mf2_t vs2, size_t vl);
vint8m1_t __riscv_vnmsub_vv_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs1,
                                    vint8m1_t vs2, size_t vl);
vint8m1_t __riscv_vnmsub_vx_i8m1_mu(vbool8_t vm, vint8m1_t vd, int8_t rs1,
                                    vint8m1_t vs2, size_t vl);
vint8m2_t __riscv_vnmsub_vv_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs1,
                                    vint8m2_t vs2, size_t vl);
vint8m2_t __riscv_vnmsub_vx_i8m2_mu(vbool4_t vm, vint8m2_t vd, int8_t rs1,
                                    vint8m2_t vs2, size_t vl);
vint8m4_t __riscv_vnmsub_vv_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs1,
                                    vint8m4_t vs2, size_t vl);
vint8m4_t __riscv_vnmsub_vx_i8m4_mu(vbool2_t vm, vint8m4_t vd, int8_t rs1,
                                    vint8m4_t vs2, size_t vl);
vint8m8_t __riscv_vnmsub_vv_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs1,
                                    vint8m8_t vs2, size_t vl);
vint8m8_t __riscv_vnmsub_vx_i8m8_mu(vbool1_t vm, vint8m8_t vd, int8_t rs1,
                                    vint8m8_t vs2, size_t vl);
vint16mf4_t __riscv_vnmsub_vv_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                        vint16mf4_t vs1, vint16mf4_t vs2,
                                        size_t vl);
vint16mf4_t __riscv_vnmsub_vx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                        int16_t rs1, vint16mf4_t vs2,
                                        size_t vl);
vint16mf2_t __riscv_vnmsub_vv_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                        vint16mf2_t vs1, vint16mf2_t vs2,
                                        size_t vl);
vint16mf2_t __riscv_vnmsub_vx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                        int16_t rs1, vint16mf2_t vs2,
                                        size_t vl);
vint16m1_t __riscv_vnmsub_vv_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                      vint16m1_t vs1, vint16m1_t vs2,
                                      size_t vl);
vint16m1_t __riscv_vnmsub_vx_i16m1_mu(vbool16_t vm, vint16m1_t vd, int16_t rs1,
                                      vint16m1_t vs2, size_t vl);
vint16m2_t __riscv_vnmsub_vv_i16m2_mu(vbool8_t vm, vint16m2_t vd,
                                      vint16m2_t vs1, vint16m2_t vs2,
                                      size_t vl);
vint16m2_t __riscv_vnmsub_vx_i16m2_mu(vbool8_t vm, vint16m2_t vd, int16_t rs1,
                                      vint16m2_t vs2, size_t vl);
vint16m4_t __riscv_vnmsub_vv_i16m4_mu(vbool4_t vm, vint16m4_t vd,
                                      vint16m4_t vs1, vint16m4_t vs2,
                                      size_t vl);
vint16m4_t __riscv_vnmsub_vx_i16m4_mu(vbool4_t vm, vint16m4_t vd, int16_t rs1,
                                      vint16m4_t vs2, size_t vl);
vint16m8_t __riscv_vnmsub_vv_i16m8_mu(vbool2_t vm, vint16m8_t vd,
                                      vint16m8_t vs1, vint16m8_t vs2,
                                      size_t vl);
vint16m8_t __riscv_vnmsub_vx_i16m8_mu(vbool2_t vm, vint16m8_t vd, int16_t rs1,
                                      vint16m8_t vs2, size_t vl);
vint32mf2_t __riscv_vnmsub_vv_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                        vint32mf2_t vs1, vint32mf2_t vs2,
                                        size_t vl);
vint32mf2_t __riscv_vnmsub_vx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                        int32_t rs1, vint32mf2_t vs2,
                                        size_t vl);
vint32m1_t __riscv_vnmsub_vv_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                      vint32m1_t vs1, vint32m1_t vs2,
                                      size_t vl);
vint32m1_t __riscv_vnmsub_vx_i32m1_mu(vbool32_t vm, vint32m1_t vd, int32_t rs1,
                                      vint32m1_t vs2, size_t vl);
vint32m2_t __riscv_vnmsub_vv_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                      vint32m2_t vs1, vint32m2_t vs2,
                                      size_t vl);
vint32m2_t __riscv_vnmsub_vx_i32m2_mu(vbool16_t vm, vint32m2_t vd, int32_t rs1,
                                      vint32m2_t vs2, size_t vl);
vint32m4_t __riscv_vnmsub_vv_i32m4_mu(vbool8_t vm, vint32m4_t vd,
                                      vint32m4_t vs1, vint32m4_t vs2,
                                      size_t vl);
vint32m4_t __riscv_vnmsub_vx_i32m4_mu(vbool8_t vm, vint32m4_t vd, int32_t rs1,
                                      vint32m4_t vs2, size_t vl);
vint32m8_t __riscv_vnmsub_vv_i32m8_mu(vbool4_t vm, vint32m8_t vd,
                                      vint32m8_t vs1, vint32m8_t vs2,
                                      size_t vl);
vint32m8_t __riscv_vnmsub_vx_i32m8_mu(vbool4_t vm, vint32m8_t vd, int32_t rs1,
                                      vint32m8_t vs2, size_t vl);
vint64m1_t __riscv_vnmsub_vv_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                      vint64m1_t vs1, vint64m1_t vs2,
                                      size_t vl);
vint64m1_t __riscv_vnmsub_vx_i64m1_mu(vbool64_t vm, vint64m1_t vd, int64_t rs1,
                                      vint64m1_t vs2, size_t vl);
vint64m2_t __riscv_vnmsub_vv_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                      vint64m2_t vs1, vint64m2_t vs2,
                                      size_t vl);
vint64m2_t __riscv_vnmsub_vx_i64m2_mu(vbool32_t vm, vint64m2_t vd, int64_t rs1,
                                      vint64m2_t vs2, size_t vl);
vint64m4_t __riscv_vnmsub_vv_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                      vint64m4_t vs1, vint64m4_t vs2,
                                      size_t vl);
vint64m4_t __riscv_vnmsub_vx_i64m4_mu(vbool16_t vm, vint64m4_t vd, int64_t rs1,
                                      vint64m4_t vs2, size_t vl);
vint64m8_t __riscv_vnmsub_vv_i64m8_mu(vbool8_t vm, vint64m8_t vd,
                                      vint64m8_t vs1, vint64m8_t vs2,
                                      size_t vl);
vint64m8_t __riscv_vnmsub_vx_i64m8_mu(vbool8_t vm, vint64m8_t vd, int64_t rs1,
                                      vint64m8_t vs2, size_t vl);
vuint8mf8_t __riscv_vmacc_vv_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                      vuint8mf8_t vs1, vuint8mf8_t vs2,
                                      size_t vl);
vuint8mf8_t __riscv_vmacc_vx_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd, uint8_t rs1,
                                      vuint8mf8_t vs2, size_t vl);
vuint8mf4_t __riscv_vmacc_vv_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                      vuint8mf4_t vs1, vuint8mf4_t vs2,
                                      size_t vl);
vuint8mf4_t __riscv_vmacc_vx_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd, uint8_t rs1,
                                      vuint8mf4_t vs2, size_t vl);
vuint8mf2_t __riscv_vmacc_vv_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                      vuint8mf2_t vs1, vuint8mf2_t vs2,
                                      size_t vl);
vuint8mf2_t __riscv_vmacc_vx_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd, uint8_t rs1,
                                      vuint8mf2_t vs2, size_t vl);
vuint8m1_t __riscv_vmacc_vv_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs1,
                                    vuint8m1_t vs2, size_t vl);
vuint8m1_t __riscv_vmacc_vx_u8m1_mu(vbool8_t vm, vuint8m1_t vd, uint8_t rs1,
                                    vuint8m1_t vs2, size_t vl);
vuint8m2_t __riscv_vmacc_vv_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs1,
                                    vuint8m2_t vs2, size_t vl);
vuint8m2_t __riscv_vmacc_vx_u8m2_mu(vbool4_t vm, vuint8m2_t vd, uint8_t rs1,
                                    vuint8m2_t vs2, size_t vl);
vuint8m4_t __riscv_vmacc_vv_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs1,
                                    vuint8m4_t vs2, size_t vl);
vuint8m4_t __riscv_vmacc_vx_u8m4_mu(vbool2_t vm, vuint8m4_t vd, uint8_t rs1,
                                    vuint8m4_t vs2, size_t vl);
vuint8m8_t __riscv_vmacc_vv_u8m8_mu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs1,
                                    vuint8m8_t vs2, size_t vl);
vuint8m8_t __riscv_vmacc_vx_u8m8_mu(vbool1_t vm, vuint8m8_t vd, uint8_t rs1,
                                    vuint8m8_t vs2, size_t vl);
vuint16mf4_t __riscv_vmacc_vv_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                        vuint16mf4_t vs1, vuint16mf4_t vs2,
                                        size_t vl);
vuint16mf4_t __riscv_vmacc_vx_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                        uint16_t rs1, vuint16mf4_t vs2,
                                        size_t vl);
vuint16mf2_t __riscv_vmacc_vv_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                        vuint16mf2_t vs1, vuint16mf2_t vs2,
                                        size_t vl);
vuint16mf2_t __riscv_vmacc_vx_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                        uint16_t rs1, vuint16mf2_t vs2,
                                        size_t vl);
vuint16m1_t __riscv_vmacc_vv_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                      vuint16m1_t vs1, vuint16m1_t vs2,
                                      size_t vl);
vuint16m1_t __riscv_vmacc_vx_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                      uint16_t rs1, vuint16m1_t vs2, size_t vl);
vuint16m2_t __riscv_vmacc_vv_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                      vuint16m2_t vs1, vuint16m2_t vs2,
                                      size_t vl);
vuint16m2_t __riscv_vmacc_vx_u16m2_mu(vbool8_t vm, vuint16m2_t vd, uint16_t rs1,
                                      vuint16m2_t vs2, size_t vl);
vuint16m4_t __riscv_vmacc_vv_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                      vuint16m4_t vs1, vuint16m4_t vs2,
                                      size_t vl);
vuint16m4_t __riscv_vmacc_vx_u16m4_mu(vbool4_t vm, vuint16m4_t vd, uint16_t rs1,
                                      vuint16m4_t vs2, size_t vl);
vuint16m8_t __riscv_vmacc_vv_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                      vuint16m8_t vs1, vuint16m8_t vs2,
                                      size_t vl);
vuint16m8_t __riscv_vmacc_vx_u16m8_mu(vbool2_t vm, vuint16m8_t vd, uint16_t rs1,
                                      vuint16m8_t vs2, size_t vl);
vuint32mf2_t __riscv_vmacc_vv_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                        vuint32mf2_t vs1, vuint32mf2_t vs2,
                                        size_t vl);
vuint32mf2_t __riscv_vmacc_vx_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                        uint32_t rs1, vuint32mf2_t vs2,
                                        size_t vl);
vuint32m1_t __riscv_vmacc_vv_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                      vuint32m1_t vs1, vuint32m1_t vs2,
                                      size_t vl);
vuint32m1_t __riscv_vmacc_vx_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                      uint32_t rs1, vuint32m1_t vs2, size_t vl);
vuint32m2_t __riscv_vmacc_vv_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                      vuint32m2_t vs1, vuint32m2_t vs2,
                                      size_t vl);
vuint32m2_t __riscv_vmacc_vx_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                      uint32_t rs1, vuint32m2_t vs2, size_t vl);
vuint32m4_t __riscv_vmacc_vv_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                      vuint32m4_t vs1, vuint32m4_t vs2,
                                      size_t vl);
vuint32m4_t __riscv_vmacc_vx_u32m4_mu(vbool8_t vm, vuint32m4_t vd, uint32_t rs1,
                                      vuint32m4_t vs2, size_t vl);
vuint32m8_t __riscv_vmacc_vv_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                      vuint32m8_t vs1, vuint32m8_t vs2,
                                      size_t vl);
vuint32m8_t __riscv_vmacc_vx_u32m8_mu(vbool4_t vm, vuint32m8_t vd, uint32_t rs1,
                                      vuint32m8_t vs2, size_t vl);
vuint64m1_t __riscv_vmacc_vv_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                      vuint64m1_t vs1, vuint64m1_t vs2,
                                      size_t vl);
vuint64m1_t __riscv_vmacc_vx_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                      uint64_t rs1, vuint64m1_t vs2, size_t vl);
vuint64m2_t __riscv_vmacc_vv_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                      vuint64m2_t vs1, vuint64m2_t vs2,
                                      size_t vl);
vuint64m2_t __riscv_vmacc_vx_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                      uint64_t rs1, vuint64m2_t vs2, size_t vl);
vuint64m4_t __riscv_vmacc_vv_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                      vuint64m4_t vs1, vuint64m4_t vs2,
                                      size_t vl);
vuint64m4_t __riscv_vmacc_vx_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                      uint64_t rs1, vuint64m4_t vs2, size_t vl);
vuint64m8_t __riscv_vmacc_vv_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                      vuint64m8_t vs1, vuint64m8_t vs2,
                                      size_t vl);
vuint64m8_t __riscv_vmacc_vx_u64m8_mu(vbool8_t vm, vuint64m8_t vd, uint64_t rs1,
                                      vuint64m8_t vs2, size_t vl);
vuint8mf8_t __riscv_vnmsac_vv_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                       vuint8mf8_t vs1, vuint8mf8_t vs2,
                                       size_t vl);
vuint8mf8_t __riscv_vnmsac_vx_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                       uint8_t rs1, vuint8mf8_t vs2, size_t vl);
vuint8mf4_t __riscv_vnmsac_vv_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                       vuint8mf4_t vs1, vuint8mf4_t vs2,
                                       size_t vl);
vuint8mf4_t __riscv_vnmsac_vx_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                       uint8_t rs1, vuint8mf4_t vs2, size_t vl);
vuint8mf2_t __riscv_vnmsac_vv_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                       vuint8mf2_t vs1, vuint8mf2_t vs2,
                                       size_t vl);
vuint8mf2_t __riscv_vnmsac_vx_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                       uint8_t rs1, vuint8mf2_t vs2, size_t vl);
vuint8m1_t __riscv_vnmsac_vv_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs1,
                                     vuint8m1_t vs2, size_t vl);
vuint8m1_t __riscv_vnmsac_vx_u8m1_mu(vbool8_t vm, vuint8m1_t vd, uint8_t rs1,
                                     vuint8m1_t vs2, size_t vl);
vuint8m2_t __riscv_vnmsac_vv_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs1,
                                     vuint8m2_t vs2, size_t vl);
vuint8m2_t __riscv_vnmsac_vx_u8m2_mu(vbool4_t vm, vuint8m2_t vd, uint8_t rs1,
                                     vuint8m2_t vs2, size_t vl);
vuint8m4_t __riscv_vnmsac_vv_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs1,
                                     vuint8m4_t vs2, size_t vl);
vuint8m4_t __riscv_vnmsac_vx_u8m4_mu(vbool2_t vm, vuint8m4_t vd, uint8_t rs1,
                                     vuint8m4_t vs2, size_t vl);
vuint8m8_t __riscv_vnmsac_vv_u8m8_mu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs1,
                                     vuint8m8_t vs2, size_t vl);
vuint8m8_t __riscv_vnmsac_vx_u8m8_mu(vbool1_t vm, vuint8m8_t vd, uint8_t rs1,
                                     vuint8m8_t vs2, size_t vl);
vuint16mf4_t __riscv_vnmsac_vv_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs1, vuint16mf4_t vs2,
                                         size_t vl);
vuint16mf4_t __riscv_vnmsac_vx_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                         uint16_t rs1, vuint16mf4_t vs2,
                                         size_t vl);
vuint16mf2_t __riscv_vnmsac_vv_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs1, vuint16mf2_t vs2,
                                         size_t vl);
vuint16mf2_t __riscv_vnmsac_vx_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                         uint16_t rs1, vuint16mf2_t vs2,
                                         size_t vl);
vuint16m1_t __riscv_vnmsac_vv_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs1, vuint16m1_t vs2,
                                       size_t vl);
vuint16m1_t __riscv_vnmsac_vx_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                       uint16_t rs1, vuint16m1_t vs2,
                                       size_t vl);
vuint16m2_t __riscv_vnmsac_vv_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs1, vuint16m2_t vs2,
                                       size_t vl);
vuint16m2_t __riscv_vnmsac_vx_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                       uint16_t rs1, vuint16m2_t vs2,
                                       size_t vl);
vuint16m4_t __riscv_vnmsac_vv_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs1, vuint16m4_t vs2,
                                       size_t vl);
vuint16m4_t __riscv_vnmsac_vx_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                       uint16_t rs1, vuint16m4_t vs2,
                                       size_t vl);
vuint16m8_t __riscv_vnmsac_vv_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs1, vuint16m8_t vs2,
                                       size_t vl);
vuint16m8_t __riscv_vnmsac_vx_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                       uint16_t rs1, vuint16m8_t vs2,
                                       size_t vl);
vuint32mf2_t __riscv_vnmsac_vv_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs1, vuint32mf2_t vs2,
                                         size_t vl);
vuint32mf2_t __riscv_vnmsac_vx_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                         uint32_t rs1, vuint32mf2_t vs2,
                                         size_t vl);
vuint32m1_t __riscv_vnmsac_vv_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs1, vuint32m1_t vs2,
                                       size_t vl);
vuint32m1_t __riscv_vnmsac_vx_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                       uint32_t rs1, vuint32m1_t vs2,
                                       size_t vl);
vuint32m2_t __riscv_vnmsac_vv_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs1, vuint32m2_t vs2,
                                       size_t vl);
vuint32m2_t __riscv_vnmsac_vx_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                       uint32_t rs1, vuint32m2_t vs2,
                                       size_t vl);
vuint32m4_t __riscv_vnmsac_vv_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs1, vuint32m4_t vs2,
                                       size_t vl);
vuint32m4_t __riscv_vnmsac_vx_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                       uint32_t rs1, vuint32m4_t vs2,
                                       size_t vl);
vuint32m8_t __riscv_vnmsac_vv_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs1, vuint32m8_t vs2,
                                       size_t vl);
vuint32m8_t __riscv_vnmsac_vx_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                       uint32_t rs1, vuint32m8_t vs2,
                                       size_t vl);
vuint64m1_t __riscv_vnmsac_vv_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs1, vuint64m1_t vs2,
                                       size_t vl);
vuint64m1_t __riscv_vnmsac_vx_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                       uint64_t rs1, vuint64m1_t vs2,
                                       size_t vl);
vuint64m2_t __riscv_vnmsac_vv_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs1, vuint64m2_t vs2,
                                       size_t vl);
vuint64m2_t __riscv_vnmsac_vx_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                       uint64_t rs1, vuint64m2_t vs2,
                                       size_t vl);
vuint64m4_t __riscv_vnmsac_vv_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs1, vuint64m4_t vs2,
                                       size_t vl);
vuint64m4_t __riscv_vnmsac_vx_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                       uint64_t rs1, vuint64m4_t vs2,
                                       size_t vl);
vuint64m8_t __riscv_vnmsac_vv_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs1, vuint64m8_t vs2,
                                       size_t vl);
vuint64m8_t __riscv_vnmsac_vx_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                       uint64_t rs1, vuint64m8_t vs2,
                                       size_t vl);
vuint8mf8_t __riscv_vmadd_vv_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                      vuint8mf8_t vs1, vuint8mf8_t vs2,
                                      size_t vl);
vuint8mf8_t __riscv_vmadd_vx_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd, uint8_t rs1,
                                      vuint8mf8_t vs2, size_t vl);
vuint8mf4_t __riscv_vmadd_vv_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                      vuint8mf4_t vs1, vuint8mf4_t vs2,
                                      size_t vl);
vuint8mf4_t __riscv_vmadd_vx_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd, uint8_t rs1,
                                      vuint8mf4_t vs2, size_t vl);
vuint8mf2_t __riscv_vmadd_vv_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                      vuint8mf2_t vs1, vuint8mf2_t vs2,
                                      size_t vl);
vuint8mf2_t __riscv_vmadd_vx_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd, uint8_t rs1,
                                      vuint8mf2_t vs2, size_t vl);
vuint8m1_t __riscv_vmadd_vv_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs1,
                                    vuint8m1_t vs2, size_t vl);
vuint8m1_t __riscv_vmadd_vx_u8m1_mu(vbool8_t vm, vuint8m1_t vd, uint8_t rs1,
                                    vuint8m1_t vs2, size_t vl);
vuint8m2_t __riscv_vmadd_vv_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs1,
                                    vuint8m2_t vs2, size_t vl);
vuint8m2_t __riscv_vmadd_vx_u8m2_mu(vbool4_t vm, vuint8m2_t vd, uint8_t rs1,
                                    vuint8m2_t vs2, size_t vl);
vuint8m4_t __riscv_vmadd_vv_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs1,
                                    vuint8m4_t vs2, size_t vl);
vuint8m4_t __riscv_vmadd_vx_u8m4_mu(vbool2_t vm, vuint8m4_t vd, uint8_t rs1,
                                    vuint8m4_t vs2, size_t vl);
vuint8m8_t __riscv_vmadd_vv_u8m8_mu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs1,
                                    vuint8m8_t vs2, size_t vl);
vuint8m8_t __riscv_vmadd_vx_u8m8_mu(vbool1_t vm, vuint8m8_t vd, uint8_t rs1,
                                    vuint8m8_t vs2, size_t vl);
vuint16mf4_t __riscv_vmadd_vv_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                        vuint16mf4_t vs1, vuint16mf4_t vs2,
                                        size_t vl);
vuint16mf4_t __riscv_vmadd_vx_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                        uint16_t rs1, vuint16mf4_t vs2,
                                        size_t vl);
vuint16mf2_t __riscv_vmadd_vv_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                        vuint16mf2_t vs1, vuint16mf2_t vs2,
                                        size_t vl);
vuint16mf2_t __riscv_vmadd_vx_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                        uint16_t rs1, vuint16mf2_t vs2,
                                        size_t vl);
vuint16m1_t __riscv_vmadd_vv_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                      vuint16m1_t vs1, vuint16m1_t vs2,
                                      size_t vl);
vuint16m1_t __riscv_vmadd_vx_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                      uint16_t rs1, vuint16m1_t vs2, size_t vl);
vuint16m2_t __riscv_vmadd_vv_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                      vuint16m2_t vs1, vuint16m2_t vs2,
                                      size_t vl);
vuint16m2_t __riscv_vmadd_vx_u16m2_mu(vbool8_t vm, vuint16m2_t vd, uint16_t rs1,
                                      vuint16m2_t vs2, size_t vl);
vuint16m4_t __riscv_vmadd_vv_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                      vuint16m4_t vs1, vuint16m4_t vs2,
                                      size_t vl);
vuint16m4_t __riscv_vmadd_vx_u16m4_mu(vbool4_t vm, vuint16m4_t vd, uint16_t rs1,
                                      vuint16m4_t vs2, size_t vl);
vuint16m8_t __riscv_vmadd_vv_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                      vuint16m8_t vs1, vuint16m8_t vs2,
                                      size_t vl);
vuint16m8_t __riscv_vmadd_vx_u16m8_mu(vbool2_t vm, vuint16m8_t vd, uint16_t rs1,
                                      vuint16m8_t vs2, size_t vl);
vuint32mf2_t __riscv_vmadd_vv_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                        vuint32mf2_t vs1, vuint32mf2_t vs2,
                                        size_t vl);
vuint32mf2_t __riscv_vmadd_vx_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                        uint32_t rs1, vuint32mf2_t vs2,
                                        size_t vl);
vuint32m1_t __riscv_vmadd_vv_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                      vuint32m1_t vs1, vuint32m1_t vs2,
                                      size_t vl);
vuint32m1_t __riscv_vmadd_vx_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                      uint32_t rs1, vuint32m1_t vs2, size_t vl);
vuint32m2_t __riscv_vmadd_vv_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                      vuint32m2_t vs1, vuint32m2_t vs2,
                                      size_t vl);
vuint32m2_t __riscv_vmadd_vx_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                      uint32_t rs1, vuint32m2_t vs2, size_t vl);
vuint32m4_t __riscv_vmadd_vv_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                      vuint32m4_t vs1, vuint32m4_t vs2,
                                      size_t vl);
vuint32m4_t __riscv_vmadd_vx_u32m4_mu(vbool8_t vm, vuint32m4_t vd, uint32_t rs1,
                                      vuint32m4_t vs2, size_t vl);
vuint32m8_t __riscv_vmadd_vv_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                      vuint32m8_t vs1, vuint32m8_t vs2,
                                      size_t vl);
vuint32m8_t __riscv_vmadd_vx_u32m8_mu(vbool4_t vm, vuint32m8_t vd, uint32_t rs1,
                                      vuint32m8_t vs2, size_t vl);
vuint64m1_t __riscv_vmadd_vv_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                      vuint64m1_t vs1, vuint64m1_t vs2,
                                      size_t vl);
vuint64m1_t __riscv_vmadd_vx_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                      uint64_t rs1, vuint64m1_t vs2, size_t vl);
vuint64m2_t __riscv_vmadd_vv_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                      vuint64m2_t vs1, vuint64m2_t vs2,
                                      size_t vl);
vuint64m2_t __riscv_vmadd_vx_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                      uint64_t rs1, vuint64m2_t vs2, size_t vl);
vuint64m4_t __riscv_vmadd_vv_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                      vuint64m4_t vs1, vuint64m4_t vs2,
                                      size_t vl);
vuint64m4_t __riscv_vmadd_vx_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                      uint64_t rs1, vuint64m4_t vs2, size_t vl);
vuint64m8_t __riscv_vmadd_vv_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                      vuint64m8_t vs1, vuint64m8_t vs2,
                                      size_t vl);
vuint64m8_t __riscv_vmadd_vx_u64m8_mu(vbool8_t vm, vuint64m8_t vd, uint64_t rs1,
                                      vuint64m8_t vs2, size_t vl);
vuint8mf8_t __riscv_vnmsub_vv_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                       vuint8mf8_t vs1, vuint8mf8_t vs2,
                                       size_t vl);
vuint8mf8_t __riscv_vnmsub_vx_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                       uint8_t rs1, vuint8mf8_t vs2, size_t vl);
vuint8mf4_t __riscv_vnmsub_vv_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                       vuint8mf4_t vs1, vuint8mf4_t vs2,
                                       size_t vl);
vuint8mf4_t __riscv_vnmsub_vx_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                       uint8_t rs1, vuint8mf4_t vs2, size_t vl);
vuint8mf2_t __riscv_vnmsub_vv_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                       vuint8mf2_t vs1, vuint8mf2_t vs2,
                                       size_t vl);
vuint8mf2_t __riscv_vnmsub_vx_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                       uint8_t rs1, vuint8mf2_t vs2, size_t vl);
vuint8m1_t __riscv_vnmsub_vv_u8m1_mu(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs1,
                                     vuint8m1_t vs2, size_t vl);
vuint8m1_t __riscv_vnmsub_vx_u8m1_mu(vbool8_t vm, vuint8m1_t vd, uint8_t rs1,
                                     vuint8m1_t vs2, size_t vl);
vuint8m2_t __riscv_vnmsub_vv_u8m2_mu(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs1,
                                     vuint8m2_t vs2, size_t vl);
vuint8m2_t __riscv_vnmsub_vx_u8m2_mu(vbool4_t vm, vuint8m2_t vd, uint8_t rs1,
                                     vuint8m2_t vs2, size_t vl);
vuint8m4_t __riscv_vnmsub_vv_u8m4_mu(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs1,
                                     vuint8m4_t vs2, size_t vl);
vuint8m4_t __riscv_vnmsub_vx_u8m4_mu(vbool2_t vm, vuint8m4_t vd, uint8_t rs1,
                                     vuint8m4_t vs2, size_t vl);
vuint8m8_t __riscv_vnmsub_vv_u8m8_mu(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs1,
                                     vuint8m8_t vs2, size_t vl);
vuint8m8_t __riscv_vnmsub_vx_u8m8_mu(vbool1_t vm, vuint8m8_t vd, uint8_t rs1,
                                     vuint8m8_t vs2, size_t vl);
vuint16mf4_t __riscv_vnmsub_vv_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                         vuint16mf4_t vs1, vuint16mf4_t vs2,
                                         size_t vl);
vuint16mf4_t __riscv_vnmsub_vx_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                         uint16_t rs1, vuint16mf4_t vs2,
                                         size_t vl);
vuint16mf2_t __riscv_vnmsub_vv_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                         vuint16mf2_t vs1, vuint16mf2_t vs2,
                                         size_t vl);
vuint16mf2_t __riscv_vnmsub_vx_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                         uint16_t rs1, vuint16mf2_t vs2,
                                         size_t vl);
vuint16m1_t __riscv_vnmsub_vv_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                       vuint16m1_t vs1, vuint16m1_t vs2,
                                       size_t vl);
vuint16m1_t __riscv_vnmsub_vx_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                       uint16_t rs1, vuint16m1_t vs2,
                                       size_t vl);
vuint16m2_t __riscv_vnmsub_vv_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                       vuint16m2_t vs1, vuint16m2_t vs2,
                                       size_t vl);
vuint16m2_t __riscv_vnmsub_vx_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                       uint16_t rs1, vuint16m2_t vs2,
                                       size_t vl);
vuint16m4_t __riscv_vnmsub_vv_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                       vuint16m4_t vs1, vuint16m4_t vs2,
                                       size_t vl);
vuint16m4_t __riscv_vnmsub_vx_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                       uint16_t rs1, vuint16m4_t vs2,
                                       size_t vl);
vuint16m8_t __riscv_vnmsub_vv_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                       vuint16m8_t vs1, vuint16m8_t vs2,
                                       size_t vl);
vuint16m8_t __riscv_vnmsub_vx_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                       uint16_t rs1, vuint16m8_t vs2,
                                       size_t vl);
vuint32mf2_t __riscv_vnmsub_vv_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                         vuint32mf2_t vs1, vuint32mf2_t vs2,
                                         size_t vl);
vuint32mf2_t __riscv_vnmsub_vx_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                         uint32_t rs1, vuint32mf2_t vs2,
                                         size_t vl);
vuint32m1_t __riscv_vnmsub_vv_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                       vuint32m1_t vs1, vuint32m1_t vs2,
                                       size_t vl);
vuint32m1_t __riscv_vnmsub_vx_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                       uint32_t rs1, vuint32m1_t vs2,
                                       size_t vl);
vuint32m2_t __riscv_vnmsub_vv_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                       vuint32m2_t vs1, vuint32m2_t vs2,
                                       size_t vl);
vuint32m2_t __riscv_vnmsub_vx_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                       uint32_t rs1, vuint32m2_t vs2,
                                       size_t vl);
vuint32m4_t __riscv_vnmsub_vv_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                       vuint32m4_t vs1, vuint32m4_t vs2,
                                       size_t vl);
vuint32m4_t __riscv_vnmsub_vx_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                       uint32_t rs1, vuint32m4_t vs2,
                                       size_t vl);
vuint32m8_t __riscv_vnmsub_vv_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                       vuint32m8_t vs1, vuint32m8_t vs2,
                                       size_t vl);
vuint32m8_t __riscv_vnmsub_vx_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                       uint32_t rs1, vuint32m8_t vs2,
                                       size_t vl);
vuint64m1_t __riscv_vnmsub_vv_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                       vuint64m1_t vs1, vuint64m1_t vs2,
                                       size_t vl);
vuint64m1_t __riscv_vnmsub_vx_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                       uint64_t rs1, vuint64m1_t vs2,
                                       size_t vl);
vuint64m2_t __riscv_vnmsub_vv_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                       vuint64m2_t vs1, vuint64m2_t vs2,
                                       size_t vl);
vuint64m2_t __riscv_vnmsub_vx_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                       uint64_t rs1, vuint64m2_t vs2,
                                       size_t vl);
vuint64m4_t __riscv_vnmsub_vv_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                       vuint64m4_t vs1, vuint64m4_t vs2,
                                       size_t vl);
vuint64m4_t __riscv_vnmsub_vx_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                       uint64_t rs1, vuint64m4_t vs2,
                                       size_t vl);
vuint64m8_t __riscv_vnmsub_vv_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                       vuint64m8_t vs1, vuint64m8_t vs2,
                                       size_t vl);
vuint64m8_t __riscv_vnmsub_vx_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                       uint64_t rs1, vuint64m8_t vs2,
                                       size_t vl);
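
As a minimal usage sketch (not part of the generated listing above), the loop below applies __riscv_vnmsac_vv_i32m1_mu in a strip-mined loop so that y[i] -= a[i] * b[i] only where a[i] > 0; under the mask-undisturbed (_mu) policy, inactive elements of the result take their values from the vd operand. The helper name masked_nmsac and the a[i] > 0 predicate are illustrative assumptions, not part of the intrinsic API.

#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

// y[i] -= a[i] * b[i] for every i where a[i] > 0, leaving the other
// elements of y unchanged (mask-undisturbed policy).
void masked_nmsac(int32_t *y, const int32_t *a, const int32_t *b, size_t n) {
  for (size_t vl; n > 0; n -= vl, a += vl, b += vl, y += vl) {
    vl = __riscv_vsetvl_e32m1(n);
    vint32m1_t va = __riscv_vle32_v_i32m1(a, vl);
    vint32m1_t vb = __riscv_vle32_v_i32m1(b, vl);
    vint32m1_t vy = __riscv_vle32_v_i32m1(y, vl);
    // Active lanes: a[i] > 0.
    vbool32_t vm = __riscv_vmsgt_vx_i32m1_b32(va, 0, vl);
    // vd = -(vs1 * vs2) + vd on active lanes; inactive lanes keep vd (_mu).
    vy = __riscv_vnmsac_vv_i32m1_mu(vm, vy, va, vb, vl);
    __riscv_vse32_v_i32m1(y, vy, vl);
  }
}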

Vector Widening Integer Multiply-Add Intrinsics
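
Before the listing, a short hedged sketch of the tail-undisturbed (_tu) widening multiply-add: each destination element is 2*SEW wide and accumulates the product of two SEW-wide sources, while tail elements (indices >= vl) of the destination register keep the values passed in vd. The function name widen_macc_i16_to_i32 and the loop structure are assumptions made for illustration.

#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

// acc[i] += (int32_t)a[i] * (int32_t)b[i] for i < n, using the widening
// multiply-add; only the first vl elements are stored back each iteration.
void widen_macc_i16_to_i32(int32_t *acc, const int16_t *a, const int16_t *b,
                           size_t n) {
  for (size_t vl; n > 0; n -= vl, a += vl, b += vl, acc += vl) {
    vl = __riscv_vsetvl_e16m1(n);
    vint16m1_t va = __riscv_vle16_v_i16m1(a, vl);
    vint16m1_t vb = __riscv_vle16_v_i16m1(b, vl);
    vint32m2_t vacc = __riscv_vle32_v_i32m2(acc, vl);
    // vd[i] = vs1[i] * vs2[i] + vd[i], product widened to 32 bits;
    // tail elements of the result keep the values of vd (_tu).
    vacc = __riscv_vwmacc_vv_i32m2_tu(vacc, va, vb, vl);
    __riscv_vse32_v_i32m2(acc, vacc, vl);
  }
}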

vint16mf4_t __riscv_vwmacc_vv_i16mf4_tu(vint16mf4_t vd, vint8mf8_t vs1,
                                        vint8mf8_t vs2, size_t vl);
vint16mf4_t __riscv_vwmacc_vx_i16mf4_tu(vint16mf4_t vd, int8_t rs1,
                                        vint8mf8_t vs2, size_t vl);
vint16mf2_t __riscv_vwmacc_vv_i16mf2_tu(vint16mf2_t vd, vint8mf4_t vs1,
                                        vint8mf4_t vs2, size_t vl);
vint16mf2_t __riscv_vwmacc_vx_i16mf2_tu(vint16mf2_t vd, int8_t rs1,
                                        vint8mf4_t vs2, size_t vl);
vint16m1_t __riscv_vwmacc_vv_i16m1_tu(vint16m1_t vd, vint8mf2_t vs1,
                                      vint8mf2_t vs2, size_t vl);
vint16m1_t __riscv_vwmacc_vx_i16m1_tu(vint16m1_t vd, int8_t rs1, vint8mf2_t vs2,
                                      size_t vl);
vint16m2_t __riscv_vwmacc_vv_i16m2_tu(vint16m2_t vd, vint8m1_t vs1,
                                      vint8m1_t vs2, size_t vl);
vint16m2_t __riscv_vwmacc_vx_i16m2_tu(vint16m2_t vd, int8_t rs1, vint8m1_t vs2,
                                      size_t vl);
vint16m4_t __riscv_vwmacc_vv_i16m4_tu(vint16m4_t vd, vint8m2_t vs1,
                                      vint8m2_t vs2, size_t vl);
vint16m4_t __riscv_vwmacc_vx_i16m4_tu(vint16m4_t vd, int8_t rs1, vint8m2_t vs2,
                                      size_t vl);
vint16m8_t __riscv_vwmacc_vv_i16m8_tu(vint16m8_t vd, vint8m4_t vs1,
                                      vint8m4_t vs2, size_t vl);
vint16m8_t __riscv_vwmacc_vx_i16m8_tu(vint16m8_t vd, int8_t rs1, vint8m4_t vs2,
                                      size_t vl);
vint32mf2_t __riscv_vwmacc_vv_i32mf2_tu(vint32mf2_t vd, vint16mf4_t vs1,
                                        vint16mf4_t vs2, size_t vl);
vint32mf2_t __riscv_vwmacc_vx_i32mf2_tu(vint32mf2_t vd, int16_t rs1,
                                        vint16mf4_t vs2, size_t vl);
vint32m1_t __riscv_vwmacc_vv_i32m1_tu(vint32m1_t vd, vint16mf2_t vs1,
                                      vint16mf2_t vs2, size_t vl);
vint32m1_t __riscv_vwmacc_vx_i32m1_tu(vint32m1_t vd, int16_t rs1,
                                      vint16mf2_t vs2, size_t vl);
vint32m2_t __riscv_vwmacc_vv_i32m2_tu(vint32m2_t vd, vint16m1_t vs1,
                                      vint16m1_t vs2, size_t vl);
vint32m2_t __riscv_vwmacc_vx_i32m2_tu(vint32m2_t vd, int16_t rs1,
                                      vint16m1_t vs2, size_t vl);
vint32m4_t __riscv_vwmacc_vv_i32m4_tu(vint32m4_t vd, vint16m2_t vs1,
                                      vint16m2_t vs2, size_t vl);
vint32m4_t __riscv_vwmacc_vx_i32m4_tu(vint32m4_t vd, int16_t rs1,
                                      vint16m2_t vs2, size_t vl);
vint32m8_t __riscv_vwmacc_vv_i32m8_tu(vint32m8_t vd, vint16m4_t vs1,
                                      vint16m4_t vs2, size_t vl);
vint32m8_t __riscv_vwmacc_vx_i32m8_tu(vint32m8_t vd, int16_t rs1,
                                      vint16m4_t vs2, size_t vl);
vint64m1_t __riscv_vwmacc_vv_i64m1_tu(vint64m1_t vd, vint32mf2_t vs1,
                                      vint32mf2_t vs2, size_t vl);
vint64m1_t __riscv_vwmacc_vx_i64m1_tu(vint64m1_t vd, int32_t rs1,
                                      vint32mf2_t vs2, size_t vl);
vint64m2_t __riscv_vwmacc_vv_i64m2_tu(vint64m2_t vd, vint32m1_t vs1,
                                      vint32m1_t vs2, size_t vl);
vint64m2_t __riscv_vwmacc_vx_i64m2_tu(vint64m2_t vd, int32_t rs1,
                                      vint32m1_t vs2, size_t vl);
vint64m4_t __riscv_vwmacc_vv_i64m4_tu(vint64m4_t vd, vint32m2_t vs1,
                                      vint32m2_t vs2, size_t vl);
vint64m4_t __riscv_vwmacc_vx_i64m4_tu(vint64m4_t vd, int32_t rs1,
                                      vint32m2_t vs2, size_t vl);
vint64m8_t __riscv_vwmacc_vv_i64m8_tu(vint64m8_t vd, vint32m4_t vs1,
                                      vint32m4_t vs2, size_t vl);
vint64m8_t __riscv_vwmacc_vx_i64m8_tu(vint64m8_t vd, int32_t rs1,
                                      vint32m4_t vs2, size_t vl);
vint16mf4_t __riscv_vwmaccsu_vv_i16mf4_tu(vint16mf4_t vd, vint8mf8_t vs1,
                                          vuint8mf8_t vs2, size_t vl);
vint16mf4_t __riscv_vwmaccsu_vx_i16mf4_tu(vint16mf4_t vd, int8_t rs1,
                                          vuint8mf8_t vs2, size_t vl);
vint16mf2_t __riscv_vwmaccsu_vv_i16mf2_tu(vint16mf2_t vd, vint8mf4_t vs1,
                                          vuint8mf4_t vs2, size_t vl);
vint16mf2_t __riscv_vwmaccsu_vx_i16mf2_tu(vint16mf2_t vd, int8_t rs1,
                                          vuint8mf4_t vs2, size_t vl);
vint16m1_t __riscv_vwmaccsu_vv_i16m1_tu(vint16m1_t vd, vint8mf2_t vs1,
                                        vuint8mf2_t vs2, size_t vl);
vint16m1_t __riscv_vwmaccsu_vx_i16m1_tu(vint16m1_t vd, int8_t rs1,
                                        vuint8mf2_t vs2, size_t vl);
vint16m2_t __riscv_vwmaccsu_vv_i16m2_tu(vint16m2_t vd, vint8m1_t vs1,
                                        vuint8m1_t vs2, size_t vl);
vint16m2_t __riscv_vwmaccsu_vx_i16m2_tu(vint16m2_t vd, int8_t rs1,
                                        vuint8m1_t vs2, size_t vl);
vint16m4_t __riscv_vwmaccsu_vv_i16m4_tu(vint16m4_t vd, vint8m2_t vs1,
                                        vuint8m2_t vs2, size_t vl);
vint16m4_t __riscv_vwmaccsu_vx_i16m4_tu(vint16m4_t vd, int8_t rs1,
                                        vuint8m2_t vs2, size_t vl);
vint16m8_t __riscv_vwmaccsu_vv_i16m8_tu(vint16m8_t vd, vint8m4_t vs1,
                                        vuint8m4_t vs2, size_t vl);
vint16m8_t __riscv_vwmaccsu_vx_i16m8_tu(vint16m8_t vd, int8_t rs1,
                                        vuint8m4_t vs2, size_t vl);
vint32mf2_t __riscv_vwmaccsu_vv_i32mf2_tu(vint32mf2_t vd, vint16mf4_t vs1,
                                          vuint16mf4_t vs2, size_t vl);
vint32mf2_t __riscv_vwmaccsu_vx_i32mf2_tu(vint32mf2_t vd, int16_t rs1,
                                          vuint16mf4_t vs2, size_t vl);
vint32m1_t __riscv_vwmaccsu_vv_i32m1_tu(vint32m1_t vd, vint16mf2_t vs1,
                                        vuint16mf2_t vs2, size_t vl);
vint32m1_t __riscv_vwmaccsu_vx_i32m1_tu(vint32m1_t vd, int16_t rs1,
                                        vuint16mf2_t vs2, size_t vl);
vint32m2_t __riscv_vwmaccsu_vv_i32m2_tu(vint32m2_t vd, vint16m1_t vs1,
                                        vuint16m1_t vs2, size_t vl);
vint32m2_t __riscv_vwmaccsu_vx_i32m2_tu(vint32m2_t vd, int16_t rs1,
                                        vuint16m1_t vs2, size_t vl);
vint32m4_t __riscv_vwmaccsu_vv_i32m4_tu(vint32m4_t vd, vint16m2_t vs1,
                                        vuint16m2_t vs2, size_t vl);
vint32m4_t __riscv_vwmaccsu_vx_i32m4_tu(vint32m4_t vd, int16_t rs1,
                                        vuint16m2_t vs2, size_t vl);
vint32m8_t __riscv_vwmaccsu_vv_i32m8_tu(vint32m8_t vd, vint16m4_t vs1,
                                        vuint16m4_t vs2, size_t vl);
vint32m8_t __riscv_vwmaccsu_vx_i32m8_tu(vint32m8_t vd, int16_t rs1,
                                        vuint16m4_t vs2, size_t vl);
vint64m1_t __riscv_vwmaccsu_vv_i64m1_tu(vint64m1_t vd, vint32mf2_t vs1,
                                        vuint32mf2_t vs2, size_t vl);
vint64m1_t __riscv_vwmaccsu_vx_i64m1_tu(vint64m1_t vd, int32_t rs1,
                                        vuint32mf2_t vs2, size_t vl);
vint64m2_t __riscv_vwmaccsu_vv_i64m2_tu(vint64m2_t vd, vint32m1_t vs1,
                                        vuint32m1_t vs2, size_t vl);
vint64m2_t __riscv_vwmaccsu_vx_i64m2_tu(vint64m2_t vd, int32_t rs1,
                                        vuint32m1_t vs2, size_t vl);
vint64m4_t __riscv_vwmaccsu_vv_i64m4_tu(vint64m4_t vd, vint32m2_t vs1,
                                        vuint32m2_t vs2, size_t vl);
vint64m4_t __riscv_vwmaccsu_vx_i64m4_tu(vint64m4_t vd, int32_t rs1,
                                        vuint32m2_t vs2, size_t vl);
vint64m8_t __riscv_vwmaccsu_vv_i64m8_tu(vint64m8_t vd, vint32m4_t vs1,
                                        vuint32m4_t vs2, size_t vl);
vint64m8_t __riscv_vwmaccsu_vx_i64m8_tu(vint64m8_t vd, int32_t rs1,
                                        vuint32m4_t vs2, size_t vl);
vint16mf4_t __riscv_vwmaccus_vx_i16mf4_tu(vint16mf4_t vd, uint8_t rs1,
                                          vint8mf8_t vs2, size_t vl);
vint16mf2_t __riscv_vwmaccus_vx_i16mf2_tu(vint16mf2_t vd, uint8_t rs1,
                                          vint8mf4_t vs2, size_t vl);
vint16m1_t __riscv_vwmaccus_vx_i16m1_tu(vint16m1_t vd, uint8_t rs1,
                                        vint8mf2_t vs2, size_t vl);
vint16m2_t __riscv_vwmaccus_vx_i16m2_tu(vint16m2_t vd, uint8_t rs1,
                                        vint8m1_t vs2, size_t vl);
vint16m4_t __riscv_vwmaccus_vx_i16m4_tu(vint16m4_t vd, uint8_t rs1,
                                        vint8m2_t vs2, size_t vl);
vint16m8_t __riscv_vwmaccus_vx_i16m8_tu(vint16m8_t vd, uint8_t rs1,
                                        vint8m4_t vs2, size_t vl);
vint32mf2_t __riscv_vwmaccus_vx_i32mf2_tu(vint32mf2_t vd, uint16_t rs1,
                                          vint16mf4_t vs2, size_t vl);
vint32m1_t __riscv_vwmaccus_vx_i32m1_tu(vint32m1_t vd, uint16_t rs1,
                                        vint16mf2_t vs2, size_t vl);
vint32m2_t __riscv_vwmaccus_vx_i32m2_tu(vint32m2_t vd, uint16_t rs1,
                                        vint16m1_t vs2, size_t vl);
vint32m4_t __riscv_vwmaccus_vx_i32m4_tu(vint32m4_t vd, uint16_t rs1,
                                        vint16m2_t vs2, size_t vl);
vint32m8_t __riscv_vwmaccus_vx_i32m8_tu(vint32m8_t vd, uint16_t rs1,
                                        vint16m4_t vs2, size_t vl);
vint64m1_t __riscv_vwmaccus_vx_i64m1_tu(vint64m1_t vd, uint32_t rs1,
                                        vint32mf2_t vs2, size_t vl);
vint64m2_t __riscv_vwmaccus_vx_i64m2_tu(vint64m2_t vd, uint32_t rs1,
                                        vint32m1_t vs2, size_t vl);
vint64m4_t __riscv_vwmaccus_vx_i64m4_tu(vint64m4_t vd, uint32_t rs1,
                                        vint32m2_t vs2, size_t vl);
vint64m8_t __riscv_vwmaccus_vx_i64m8_tu(vint64m8_t vd, uint32_t rs1,
                                        vint32m4_t vs2, size_t vl);
vuint16mf4_t __riscv_vwmaccu_vv_u16mf4_tu(vuint16mf4_t vd, vuint8mf8_t vs1,
                                          vuint8mf8_t vs2, size_t vl);
vuint16mf4_t __riscv_vwmaccu_vx_u16mf4_tu(vuint16mf4_t vd, uint8_t rs1,
                                          vuint8mf8_t vs2, size_t vl);
vuint16mf2_t __riscv_vwmaccu_vv_u16mf2_tu(vuint16mf2_t vd, vuint8mf4_t vs1,
                                          vuint8mf4_t vs2, size_t vl);
vuint16mf2_t __riscv_vwmaccu_vx_u16mf2_tu(vuint16mf2_t vd, uint8_t rs1,
                                          vuint8mf4_t vs2, size_t vl);
vuint16m1_t __riscv_vwmaccu_vv_u16m1_tu(vuint16m1_t vd, vuint8mf2_t vs1,
                                        vuint8mf2_t vs2, size_t vl);
vuint16m1_t __riscv_vwmaccu_vx_u16m1_tu(vuint16m1_t vd, uint8_t rs1,
                                        vuint8mf2_t vs2, size_t vl);
vuint16m2_t __riscv_vwmaccu_vv_u16m2_tu(vuint16m2_t vd, vuint8m1_t vs1,
                                        vuint8m1_t vs2, size_t vl);
vuint16m2_t __riscv_vwmaccu_vx_u16m2_tu(vuint16m2_t vd, uint8_t rs1,
                                        vuint8m1_t vs2, size_t vl);
vuint16m4_t __riscv_vwmaccu_vv_u16m4_tu(vuint16m4_t vd, vuint8m2_t vs1,
                                        vuint8m2_t vs2, size_t vl);
vuint16m4_t __riscv_vwmaccu_vx_u16m4_tu(vuint16m4_t vd, uint8_t rs1,
                                        vuint8m2_t vs2, size_t vl);
vuint16m8_t __riscv_vwmaccu_vv_u16m8_tu(vuint16m8_t vd, vuint8m4_t vs1,
                                        vuint8m4_t vs2, size_t vl);
vuint16m8_t __riscv_vwmaccu_vx_u16m8_tu(vuint16m8_t vd, uint8_t rs1,
                                        vuint8m4_t vs2, size_t vl);
vuint32mf2_t __riscv_vwmaccu_vv_u32mf2_tu(vuint32mf2_t vd, vuint16mf4_t vs1,
                                          vuint16mf4_t vs2, size_t vl);
vuint32mf2_t __riscv_vwmaccu_vx_u32mf2_tu(vuint32mf2_t vd, uint16_t rs1,
                                          vuint16mf4_t vs2, size_t vl);
vuint32m1_t __riscv_vwmaccu_vv_u32m1_tu(vuint32m1_t vd, vuint16mf2_t vs1,
                                        vuint16mf2_t vs2, size_t vl);
vuint32m1_t __riscv_vwmaccu_vx_u32m1_tu(vuint32m1_t vd, uint16_t rs1,
                                        vuint16mf2_t vs2, size_t vl);
vuint32m2_t __riscv_vwmaccu_vv_u32m2_tu(vuint32m2_t vd, vuint16m1_t vs1,
                                        vuint16m1_t vs2, size_t vl);
vuint32m2_t __riscv_vwmaccu_vx_u32m2_tu(vuint32m2_t vd, uint16_t rs1,
                                        vuint16m1_t vs2, size_t vl);
vuint32m4_t __riscv_vwmaccu_vv_u32m4_tu(vuint32m4_t vd, vuint16m2_t vs1,
                                        vuint16m2_t vs2, size_t vl);
vuint32m4_t __riscv_vwmaccu_vx_u32m4_tu(vuint32m4_t vd, uint16_t rs1,
                                        vuint16m2_t vs2, size_t vl);
vuint32m8_t __riscv_vwmaccu_vv_u32m8_tu(vuint32m8_t vd, vuint16m4_t vs1,
                                        vuint16m4_t vs2, size_t vl);
vuint32m8_t __riscv_vwmaccu_vx_u32m8_tu(vuint32m8_t vd, uint16_t rs1,
                                        vuint16m4_t vs2, size_t vl);
vuint64m1_t __riscv_vwmaccu_vv_u64m1_tu(vuint64m1_t vd, vuint32mf2_t vs1,
                                        vuint32mf2_t vs2, size_t vl);
vuint64m1_t __riscv_vwmaccu_vx_u64m1_tu(vuint64m1_t vd, uint32_t rs1,
                                        vuint32mf2_t vs2, size_t vl);
vuint64m2_t __riscv_vwmaccu_vv_u64m2_tu(vuint64m2_t vd, vuint32m1_t vs1,
                                        vuint32m1_t vs2, size_t vl);
vuint64m2_t __riscv_vwmaccu_vx_u64m2_tu(vuint64m2_t vd, uint32_t rs1,
                                        vuint32m1_t vs2, size_t vl);
vuint64m4_t __riscv_vwmaccu_vv_u64m4_tu(vuint64m4_t vd, vuint32m2_t vs1,
                                        vuint32m2_t vs2, size_t vl);
vuint64m4_t __riscv_vwmaccu_vx_u64m4_tu(vuint64m4_t vd, uint32_t rs1,
                                        vuint32m2_t vs2, size_t vl);
vuint64m8_t __riscv_vwmaccu_vv_u64m8_tu(vuint64m8_t vd, vuint32m4_t vs1,
                                        vuint32m4_t vs2, size_t vl);
vuint64m8_t __riscv_vwmaccu_vx_u64m8_tu(vuint64m8_t vd, uint32_t rs1,
                                        vuint32m4_t vs2, size_t vl);
// masked functions (tail undisturbed: _tum)
vint16mf4_t __riscv_vwmacc_vv_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                         vint8mf8_t vs1, vint8mf8_t vs2,
                                         size_t vl);
vint16mf4_t __riscv_vwmacc_vx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                         int8_t rs1, vint8mf8_t vs2, size_t vl);
vint16mf2_t __riscv_vwmacc_vv_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                         vint8mf4_t vs1, vint8mf4_t vs2,
                                         size_t vl);
vint16mf2_t __riscv_vwmacc_vx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                         int8_t rs1, vint8mf4_t vs2, size_t vl);
vint16m1_t __riscv_vwmacc_vv_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                       vint8mf2_t vs1, vint8mf2_t vs2,
                                       size_t vl);
vint16m1_t __riscv_vwmacc_vx_i16m1_tum(vbool16_t vm, vint16m1_t vd, int8_t rs1,
                                       vint8mf2_t vs2, size_t vl);
vint16m2_t __riscv_vwmacc_vv_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                       vint8m1_t vs1, vint8m1_t vs2, size_t vl);
vint16m2_t __riscv_vwmacc_vx_i16m2_tum(vbool8_t vm, vint16m2_t vd, int8_t rs1,
                                       vint8m1_t vs2, size_t vl);
vint16m4_t __riscv_vwmacc_vv_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                       vint8m2_t vs1, vint8m2_t vs2, size_t vl);
vint16m4_t __riscv_vwmacc_vx_i16m4_tum(vbool4_t vm, vint16m4_t vd, int8_t rs1,
                                       vint8m2_t vs2, size_t vl);
vint16m8_t __riscv_vwmacc_vv_i16m8_tum(vbool2_t vm, vint16m8_t vd,
                                       vint8m4_t vs1, vint8m4_t vs2, size_t vl);
vint16m8_t __riscv_vwmacc_vx_i16m8_tum(vbool2_t vm, vint16m8_t vd, int8_t rs1,
                                       vint8m4_t vs2, size_t vl);
vint32mf2_t __riscv_vwmacc_vv_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                         vint16mf4_t vs1, vint16mf4_t vs2,
                                         size_t vl);
vint32mf2_t __riscv_vwmacc_vx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                         int16_t rs1, vint16mf4_t vs2,
                                         size_t vl);
vint32m1_t __riscv_vwmacc_vv_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                       vint16mf2_t vs1, vint16mf2_t vs2,
                                       size_t vl);
vint32m1_t __riscv_vwmacc_vx_i32m1_tum(vbool32_t vm, vint32m1_t vd, int16_t rs1,
                                       vint16mf2_t vs2, size_t vl);
vint32m2_t __riscv_vwmacc_vv_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                       vint16m1_t vs1, vint16m1_t vs2,
                                       size_t vl);
vint32m2_t __riscv_vwmacc_vx_i32m2_tum(vbool16_t vm, vint32m2_t vd, int16_t rs1,
                                       vint16m1_t vs2, size_t vl);
vint32m4_t __riscv_vwmacc_vv_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                       vint16m2_t vs1, vint16m2_t vs2,
                                       size_t vl);
vint32m4_t __riscv_vwmacc_vx_i32m4_tum(vbool8_t vm, vint32m4_t vd, int16_t rs1,
                                       vint16m2_t vs2, size_t vl);
vint32m8_t __riscv_vwmacc_vv_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                       vint16m4_t vs1, vint16m4_t vs2,
                                       size_t vl);
vint32m8_t __riscv_vwmacc_vx_i32m8_tum(vbool4_t vm, vint32m8_t vd, int16_t rs1,
                                       vint16m4_t vs2, size_t vl);
vint64m1_t __riscv_vwmacc_vv_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                       vint32mf2_t vs1, vint32mf2_t vs2,
                                       size_t vl);
vint64m1_t __riscv_vwmacc_vx_i64m1_tum(vbool64_t vm, vint64m1_t vd, int32_t rs1,
                                       vint32mf2_t vs2, size_t vl);
vint64m2_t __riscv_vwmacc_vv_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                       vint32m1_t vs1, vint32m1_t vs2,
                                       size_t vl);
vint64m2_t __riscv_vwmacc_vx_i64m2_tum(vbool32_t vm, vint64m2_t vd, int32_t rs1,
                                       vint32m1_t vs2, size_t vl);
vint64m4_t __riscv_vwmacc_vv_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                       vint32m2_t vs1, vint32m2_t vs2,
                                       size_t vl);
vint64m4_t __riscv_vwmacc_vx_i64m4_tum(vbool16_t vm, vint64m4_t vd, int32_t rs1,
                                       vint32m2_t vs2, size_t vl);
vint64m8_t __riscv_vwmacc_vv_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                       vint32m4_t vs1, vint32m4_t vs2,
                                       size_t vl);
vint64m8_t __riscv_vwmacc_vx_i64m8_tum(vbool8_t vm, vint64m8_t vd, int32_t rs1,
                                       vint32m4_t vs2, size_t vl);
vint16mf4_t __riscv_vwmaccsu_vv_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                           vint8mf8_t vs1, vuint8mf8_t vs2,
                                           size_t vl);
vint16mf4_t __riscv_vwmaccsu_vx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                           int8_t rs1, vuint8mf8_t vs2,
                                           size_t vl);
vint16mf2_t __riscv_vwmaccsu_vv_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                           vint8mf4_t vs1, vuint8mf4_t vs2,
                                           size_t vl);
vint16mf2_t __riscv_vwmaccsu_vx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                           int8_t rs1, vuint8mf4_t vs2,
                                           size_t vl);
vint16m1_t __riscv_vwmaccsu_vv_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                         vint8mf2_t vs1, vuint8mf2_t vs2,
                                         size_t vl);
vint16m1_t __riscv_vwmaccsu_vx_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                         int8_t rs1, vuint8mf2_t vs2,
                                         size_t vl);
vint16m2_t __riscv_vwmaccsu_vv_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                         vint8m1_t vs1, vuint8m1_t vs2,
                                         size_t vl);
vint16m2_t __riscv_vwmaccsu_vx_i16m2_tum(vbool8_t vm, vint16m2_t vd, int8_t rs1,
                                         vuint8m1_t vs2, size_t vl);
vint16m4_t __riscv_vwmaccsu_vv_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                         vint8m2_t vs1, vuint8m2_t vs2,
                                         size_t vl);
vint16m4_t __riscv_vwmaccsu_vx_i16m4_tum(vbool4_t vm, vint16m4_t vd, int8_t rs1,
                                         vuint8m2_t vs2, size_t vl);
vint16m8_t __riscv_vwmaccsu_vv_i16m8_tum(vbool2_t vm, vint16m8_t vd,
                                         vint8m4_t vs1, vuint8m4_t vs2,
                                         size_t vl);
vint16m8_t __riscv_vwmaccsu_vx_i16m8_tum(vbool2_t vm, vint16m8_t vd, int8_t rs1,
                                         vuint8m4_t vs2, size_t vl);
vint32mf2_t __riscv_vwmaccsu_vv_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                           vint16mf4_t vs1, vuint16mf4_t vs2,
                                           size_t vl);
vint32mf2_t __riscv_vwmaccsu_vx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                           int16_t rs1, vuint16mf4_t vs2,
                                           size_t vl);
vint32m1_t __riscv_vwmaccsu_vv_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                         vint16mf2_t vs1, vuint16mf2_t vs2,
                                         size_t vl);
vint32m1_t __riscv_vwmaccsu_vx_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                         int16_t rs1, vuint16mf2_t vs2,
                                         size_t vl);
vint32m2_t __riscv_vwmaccsu_vv_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                         vint16m1_t vs1, vuint16m1_t vs2,
                                         size_t vl);
vint32m2_t __riscv_vwmaccsu_vx_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                         int16_t rs1, vuint16m1_t vs2,
                                         size_t vl);
vint32m4_t __riscv_vwmaccsu_vv_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                         vint16m2_t vs1, vuint16m2_t vs2,
                                         size_t vl);
vint32m4_t __riscv_vwmaccsu_vx_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                         int16_t rs1, vuint16m2_t vs2,
                                         size_t vl);
vint32m8_t __riscv_vwmaccsu_vv_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                         vint16m4_t vs1, vuint16m4_t vs2,
                                         size_t vl);
vint32m8_t __riscv_vwmaccsu_vx_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                         int16_t rs1, vuint16m4_t vs2,
                                         size_t vl);
vint64m1_t __riscv_vwmaccsu_vv_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                         vint32mf2_t vs1, vuint32mf2_t vs2,
                                         size_t vl);
vint64m1_t __riscv_vwmaccsu_vx_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                         int32_t rs1, vuint32mf2_t vs2,
                                         size_t vl);
vint64m2_t __riscv_vwmaccsu_vv_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                         vint32m1_t vs1, vuint32m1_t vs2,
                                         size_t vl);
vint64m2_t __riscv_vwmaccsu_vx_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                         int32_t rs1, vuint32m1_t vs2,
                                         size_t vl);
vint64m4_t __riscv_vwmaccsu_vv_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                         vint32m2_t vs1, vuint32m2_t vs2,
                                         size_t vl);
vint64m4_t __riscv_vwmaccsu_vx_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                         int32_t rs1, vuint32m2_t vs2,
                                         size_t vl);
vint64m8_t __riscv_vwmaccsu_vv_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                         vint32m4_t vs1, vuint32m4_t vs2,
                                         size_t vl);
vint64m8_t __riscv_vwmaccsu_vx_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                         int32_t rs1, vuint32m4_t vs2,
                                         size_t vl);
vint16mf4_t __riscv_vwmaccus_vx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                           uint8_t rs1, vint8mf8_t vs2,
                                           size_t vl);
vint16mf2_t __riscv_vwmaccus_vx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                           uint8_t rs1, vint8mf4_t vs2,
                                           size_t vl);
vint16m1_t __riscv_vwmaccus_vx_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                         uint8_t rs1, vint8mf2_t vs2,
                                         size_t vl);
vint16m2_t __riscv_vwmaccus_vx_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                         uint8_t rs1, vint8m1_t vs2, size_t vl);
vint16m4_t __riscv_vwmaccus_vx_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                         uint8_t rs1, vint8m2_t vs2, size_t vl);
vint16m8_t __riscv_vwmaccus_vx_i16m8_tum(vbool2_t vm, vint16m8_t vd,
                                         uint8_t rs1, vint8m4_t vs2, size_t vl);
vint32mf2_t __riscv_vwmaccus_vx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                           uint16_t rs1, vint16mf4_t vs2,
                                           size_t vl);
vint32m1_t __riscv_vwmaccus_vx_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                         uint16_t rs1, vint16mf2_t vs2,
                                         size_t vl);
vint32m2_t __riscv_vwmaccus_vx_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                         uint16_t rs1, vint16m1_t vs2,
                                         size_t vl);
vint32m4_t __riscv_vwmaccus_vx_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                         uint16_t rs1, vint16m2_t vs2,
                                         size_t vl);
vint32m8_t __riscv_vwmaccus_vx_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                         uint16_t rs1, vint16m4_t vs2,
                                         size_t vl);
vint64m1_t __riscv_vwmaccus_vx_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                         uint32_t rs1, vint32mf2_t vs2,
                                         size_t vl);
vint64m2_t __riscv_vwmaccus_vx_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                         uint32_t rs1, vint32m1_t vs2,
                                         size_t vl);
vint64m4_t __riscv_vwmaccus_vx_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                         uint32_t rs1, vint32m2_t vs2,
                                         size_t vl);
vint64m8_t __riscv_vwmaccus_vx_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                         uint32_t rs1, vint32m4_t vs2,
                                         size_t vl);
vuint16mf4_t __riscv_vwmaccu_vv_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                           vuint8mf8_t vs1, vuint8mf8_t vs2,
                                           size_t vl);
vuint16mf4_t __riscv_vwmaccu_vx_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                           uint8_t rs1, vuint8mf8_t vs2,
                                           size_t vl);
vuint16mf2_t __riscv_vwmaccu_vv_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                           vuint8mf4_t vs1, vuint8mf4_t vs2,
                                           size_t vl);
vuint16mf2_t __riscv_vwmaccu_vx_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                           uint8_t rs1, vuint8mf4_t vs2,
                                           size_t vl);
vuint16m1_t __riscv_vwmaccu_vv_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                         vuint8mf2_t vs1, vuint8mf2_t vs2,
                                         size_t vl);
vuint16m1_t __riscv_vwmaccu_vx_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                         uint8_t rs1, vuint8mf2_t vs2,
                                         size_t vl);
vuint16m2_t __riscv_vwmaccu_vv_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                         vuint8m1_t vs1, vuint8m1_t vs2,
                                         size_t vl);
vuint16m2_t __riscv_vwmaccu_vx_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                         uint8_t rs1, vuint8m1_t vs2,
                                         size_t vl);
vuint16m4_t __riscv_vwmaccu_vv_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                         vuint8m2_t vs1, vuint8m2_t vs2,
                                         size_t vl);
vuint16m4_t __riscv_vwmaccu_vx_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                         uint8_t rs1, vuint8m2_t vs2,
                                         size_t vl);
vuint16m8_t __riscv_vwmaccu_vv_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                         vuint8m4_t vs1, vuint8m4_t vs2,
                                         size_t vl);
vuint16m8_t __riscv_vwmaccu_vx_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                         uint8_t rs1, vuint8m4_t vs2,
                                         size_t vl);
vuint32mf2_t __riscv_vwmaccu_vv_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                           vuint16mf4_t vs1, vuint16mf4_t vs2,
                                           size_t vl);
vuint32mf2_t __riscv_vwmaccu_vx_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                           uint16_t rs1, vuint16mf4_t vs2,
                                           size_t vl);
vuint32m1_t __riscv_vwmaccu_vv_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                         vuint16mf2_t vs1, vuint16mf2_t vs2,
                                         size_t vl);
vuint32m1_t __riscv_vwmaccu_vx_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                         uint16_t rs1, vuint16mf2_t vs2,
                                         size_t vl);
vuint32m2_t __riscv_vwmaccu_vv_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                         vuint16m1_t vs1, vuint16m1_t vs2,
                                         size_t vl);
vuint32m2_t __riscv_vwmaccu_vx_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                         uint16_t rs1, vuint16m1_t vs2,
                                         size_t vl);
vuint32m4_t __riscv_vwmaccu_vv_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                         vuint16m2_t vs1, vuint16m2_t vs2,
                                         size_t vl);
vuint32m4_t __riscv_vwmaccu_vx_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                         uint16_t rs1, vuint16m2_t vs2,
                                         size_t vl);
vuint32m8_t __riscv_vwmaccu_vv_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                         vuint16m4_t vs1, vuint16m4_t vs2,
                                         size_t vl);
vuint32m8_t __riscv_vwmaccu_vx_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                         uint16_t rs1, vuint16m4_t vs2,
                                         size_t vl);
vuint64m1_t __riscv_vwmaccu_vv_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                         vuint32mf2_t vs1, vuint32mf2_t vs2,
                                         size_t vl);
vuint64m1_t __riscv_vwmaccu_vx_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                         uint32_t rs1, vuint32mf2_t vs2,
                                         size_t vl);
vuint64m2_t __riscv_vwmaccu_vv_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                         vuint32m1_t vs1, vuint32m1_t vs2,
                                         size_t vl);
vuint64m2_t __riscv_vwmaccu_vx_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                         uint32_t rs1, vuint32m1_t vs2,
                                         size_t vl);
vuint64m4_t __riscv_vwmaccu_vv_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                         vuint32m2_t vs1, vuint32m2_t vs2,
                                         size_t vl);
vuint64m4_t __riscv_vwmaccu_vx_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                         uint32_t rs1, vuint32m2_t vs2,
                                         size_t vl);
vuint64m8_t __riscv_vwmaccu_vv_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                         vuint32m4_t vs1, vuint32m4_t vs2,
                                         size_t vl);
vuint64m8_t __riscv_vwmaccu_vx_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                         uint32_t rs1, vuint32m4_t vs2,
                                         size_t vl);
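The _tum forms above add a mask operand vm ahead of vd: masked-off elements and tail elements both retain their previous vd values. A minimal sketch (assuming <riscv_vector.h>; the helper name and the a[i] > 0 predicate are illustrative) using __riscv_vwmacc_vv_i32m2_tum from this listing:

// Hypothetical sketch of a masked, tail-undisturbed (_tum) accumulation:
// acc[i] += (int32_t)a[i] * b[i] only where a[i] > 0; inactive and tail
// elements of the accumulator are left unchanged.
#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

void widen_mac_i16_i32_masked(int32_t *acc, const int16_t *a, const int16_t *b,
                              size_t n) {
  for (size_t i = 0; i < n;) {
    size_t vl = __riscv_vsetvl_e16m1(n - i);
    vint16m1_t va = __riscv_vle16_v_i16m1(a + i, vl);
    vint16m1_t vb = __riscv_vle16_v_i16m1(b + i, vl);
    vint32m2_t vacc = __riscv_vle32_v_i32m2(acc + i, vl);
    vbool16_t active = __riscv_vmsgt_vx_i16m1_b16(va, 0, vl);  // a[i] > 0
    // Mask first, then vd; masked-off and tail elements keep vacc (_tum).
    vacc = __riscv_vwmacc_vv_i32m2_tum(active, vacc, va, vb, vl);
    __riscv_vse32_v_i32m2(acc + i, vacc, vl);
    i += vl;
  }
}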
// masked functions (tail undisturbed, mask undisturbed: _tumu)
vint16mf4_t __riscv_vwmacc_vv_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                          vint8mf8_t vs1, vint8mf8_t vs2,
                                          size_t vl);
vint16mf4_t __riscv_vwmacc_vx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                          int8_t rs1, vint8mf8_t vs2,
                                          size_t vl);
vint16mf2_t __riscv_vwmacc_vv_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                          vint8mf4_t vs1, vint8mf4_t vs2,
                                          size_t vl);
vint16mf2_t __riscv_vwmacc_vx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                          int8_t rs1, vint8mf4_t vs2,
                                          size_t vl);
vint16m1_t __riscv_vwmacc_vv_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                        vint8mf2_t vs1, vint8mf2_t vs2,
                                        size_t vl);
vint16m1_t __riscv_vwmacc_vx_i16m1_tumu(vbool16_t vm, vint16m1_t vd, int8_t rs1,
                                        vint8mf2_t vs2, size_t vl);
vint16m2_t __riscv_vwmacc_vv_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                        vint8m1_t vs1, vint8m1_t vs2,
                                        size_t vl);
vint16m2_t __riscv_vwmacc_vx_i16m2_tumu(vbool8_t vm, vint16m2_t vd, int8_t rs1,
                                        vint8m1_t vs2, size_t vl);
vint16m4_t __riscv_vwmacc_vv_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                        vint8m2_t vs1, vint8m2_t vs2,
                                        size_t vl);
vint16m4_t __riscv_vwmacc_vx_i16m4_tumu(vbool4_t vm, vint16m4_t vd, int8_t rs1,
                                        vint8m2_t vs2, size_t vl);
vint16m8_t __riscv_vwmacc_vv_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                        vint8m4_t vs1, vint8m4_t vs2,
                                        size_t vl);
vint16m8_t __riscv_vwmacc_vx_i16m8_tumu(vbool2_t vm, vint16m8_t vd, int8_t rs1,
                                        vint8m4_t vs2, size_t vl);
vint32mf2_t __riscv_vwmacc_vv_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                          vint16mf4_t vs1, vint16mf4_t vs2,
                                          size_t vl);
vint32mf2_t __riscv_vwmacc_vx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                          int16_t rs1, vint16mf4_t vs2,
                                          size_t vl);
vint32m1_t __riscv_vwmacc_vv_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                        vint16mf2_t vs1, vint16mf2_t vs2,
                                        size_t vl);
vint32m1_t __riscv_vwmacc_vx_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                        int16_t rs1, vint16mf2_t vs2,
                                        size_t vl);
vint32m2_t __riscv_vwmacc_vv_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                        vint16m1_t vs1, vint16m1_t vs2,
                                        size_t vl);
vint32m2_t __riscv_vwmacc_vx_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                        int16_t rs1, vint16m1_t vs2, size_t vl);
vint32m4_t __riscv_vwmacc_vv_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                        vint16m2_t vs1, vint16m2_t vs2,
                                        size_t vl);
vint32m4_t __riscv_vwmacc_vx_i32m4_tumu(vbool8_t vm, vint32m4_t vd, int16_t rs1,
                                        vint16m2_t vs2, size_t vl);
vint32m8_t __riscv_vwmacc_vv_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                        vint16m4_t vs1, vint16m4_t vs2,
                                        size_t vl);
vint32m8_t __riscv_vwmacc_vx_i32m8_tumu(vbool4_t vm, vint32m8_t vd, int16_t rs1,
                                        vint16m4_t vs2, size_t vl);
vint64m1_t __riscv_vwmacc_vv_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                        vint32mf2_t vs1, vint32mf2_t vs2,
                                        size_t vl);
vint64m1_t __riscv_vwmacc_vx_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                        int32_t rs1, vint32mf2_t vs2,
                                        size_t vl);
vint64m2_t __riscv_vwmacc_vv_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                        vint32m1_t vs1, vint32m1_t vs2,
                                        size_t vl);
vint64m2_t __riscv_vwmacc_vx_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                        int32_t rs1, vint32m1_t vs2, size_t vl);
vint64m4_t __riscv_vwmacc_vv_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                        vint32m2_t vs1, vint32m2_t vs2,
                                        size_t vl);
vint64m4_t __riscv_vwmacc_vx_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                        int32_t rs1, vint32m2_t vs2, size_t vl);
vint64m8_t __riscv_vwmacc_vv_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                        vint32m4_t vs1, vint32m4_t vs2,
                                        size_t vl);
vint64m8_t __riscv_vwmacc_vx_i64m8_tumu(vbool8_t vm, vint64m8_t vd, int32_t rs1,
                                        vint32m4_t vs2, size_t vl);
vint16mf4_t __riscv_vwmaccsu_vv_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                            vint8mf8_t vs1, vuint8mf8_t vs2,
                                            size_t vl);
vint16mf4_t __riscv_vwmaccsu_vx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                            int8_t rs1, vuint8mf8_t vs2,
                                            size_t vl);
vint16mf2_t __riscv_vwmaccsu_vv_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                            vint8mf4_t vs1, vuint8mf4_t vs2,
                                            size_t vl);
vint16mf2_t __riscv_vwmaccsu_vx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                            int8_t rs1, vuint8mf4_t vs2,
                                            size_t vl);
vint16m1_t __riscv_vwmaccsu_vv_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                          vint8mf2_t vs1, vuint8mf2_t vs2,
                                          size_t vl);
vint16m1_t __riscv_vwmaccsu_vx_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                          int8_t rs1, vuint8mf2_t vs2,
                                          size_t vl);
vint16m2_t __riscv_vwmaccsu_vv_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                          vint8m1_t vs1, vuint8m1_t vs2,
                                          size_t vl);
vint16m2_t __riscv_vwmaccsu_vx_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                          int8_t rs1, vuint8m1_t vs2,
                                          size_t vl);
vint16m4_t __riscv_vwmaccsu_vv_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                          vint8m2_t vs1, vuint8m2_t vs2,
                                          size_t vl);
vint16m4_t __riscv_vwmaccsu_vx_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                          int8_t rs1, vuint8m2_t vs2,
                                          size_t vl);
vint16m8_t __riscv_vwmaccsu_vv_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                          vint8m4_t vs1, vuint8m4_t vs2,
                                          size_t vl);
vint16m8_t __riscv_vwmaccsu_vx_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                          int8_t rs1, vuint8m4_t vs2,
                                          size_t vl);
vint32mf2_t __riscv_vwmaccsu_vv_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                            vint16mf4_t vs1, vuint16mf4_t vs2,
                                            size_t vl);
vint32mf2_t __riscv_vwmaccsu_vx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                            int16_t rs1, vuint16mf4_t vs2,
                                            size_t vl);
vint32m1_t __riscv_vwmaccsu_vv_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                          vint16mf2_t vs1, vuint16mf2_t vs2,
                                          size_t vl);
vint32m1_t __riscv_vwmaccsu_vx_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                          int16_t rs1, vuint16mf2_t vs2,
                                          size_t vl);
vint32m2_t __riscv_vwmaccsu_vv_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                          vint16m1_t vs1, vuint16m1_t vs2,
                                          size_t vl);
vint32m2_t __riscv_vwmaccsu_vx_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                          int16_t rs1, vuint16m1_t vs2,
                                          size_t vl);
vint32m4_t __riscv_vwmaccsu_vv_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                          vint16m2_t vs1, vuint16m2_t vs2,
                                          size_t vl);
vint32m4_t __riscv_vwmaccsu_vx_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                          int16_t rs1, vuint16m2_t vs2,
                                          size_t vl);
vint32m8_t __riscv_vwmaccsu_vv_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                          vint16m4_t vs1, vuint16m4_t vs2,
                                          size_t vl);
vint32m8_t __riscv_vwmaccsu_vx_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                          int16_t rs1, vuint16m4_t vs2,
                                          size_t vl);
vint64m1_t __riscv_vwmaccsu_vv_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                          vint32mf2_t vs1, vuint32mf2_t vs2,
                                          size_t vl);
vint64m1_t __riscv_vwmaccsu_vx_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                          int32_t rs1, vuint32mf2_t vs2,
                                          size_t vl);
vint64m2_t __riscv_vwmaccsu_vv_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                          vint32m1_t vs1, vuint32m1_t vs2,
                                          size_t vl);
vint64m2_t __riscv_vwmaccsu_vx_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                          int32_t rs1, vuint32m1_t vs2,
                                          size_t vl);
vint64m4_t __riscv_vwmaccsu_vv_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                          vint32m2_t vs1, vuint32m2_t vs2,
                                          size_t vl);
vint64m4_t __riscv_vwmaccsu_vx_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                          int32_t rs1, vuint32m2_t vs2,
                                          size_t vl);
vint64m8_t __riscv_vwmaccsu_vv_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                          vint32m4_t vs1, vuint32m4_t vs2,
                                          size_t vl);
vint64m8_t __riscv_vwmaccsu_vx_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                          int32_t rs1, vuint32m4_t vs2,
                                          size_t vl);
vint16mf4_t __riscv_vwmaccus_vx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                            uint8_t rs1, vint8mf8_t vs2,
                                            size_t vl);
vint16mf2_t __riscv_vwmaccus_vx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                            uint8_t rs1, vint8mf4_t vs2,
                                            size_t vl);
vint16m1_t __riscv_vwmaccus_vx_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                          uint8_t rs1, vint8mf2_t vs2,
                                          size_t vl);
vint16m2_t __riscv_vwmaccus_vx_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                          uint8_t rs1, vint8m1_t vs2,
                                          size_t vl);
vint16m4_t __riscv_vwmaccus_vx_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                          uint8_t rs1, vint8m2_t vs2,
                                          size_t vl);
vint16m8_t __riscv_vwmaccus_vx_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                          uint8_t rs1, vint8m4_t vs2,
                                          size_t vl);
vint32mf2_t __riscv_vwmaccus_vx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                            uint16_t rs1, vint16mf4_t vs2,
                                            size_t vl);
vint32m1_t __riscv_vwmaccus_vx_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                          uint16_t rs1, vint16mf2_t vs2,
                                          size_t vl);
vint32m2_t __riscv_vwmaccus_vx_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                          uint16_t rs1, vint16m1_t vs2,
                                          size_t vl);
vint32m4_t __riscv_vwmaccus_vx_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                          uint16_t rs1, vint16m2_t vs2,
                                          size_t vl);
vint32m8_t __riscv_vwmaccus_vx_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                          uint16_t rs1, vint16m4_t vs2,
                                          size_t vl);
vint64m1_t __riscv_vwmaccus_vx_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                          uint32_t rs1, vint32mf2_t vs2,
                                          size_t vl);
vint64m2_t __riscv_vwmaccus_vx_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                          uint32_t rs1, vint32m1_t vs2,
                                          size_t vl);
vint64m4_t __riscv_vwmaccus_vx_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                          uint32_t rs1, vint32m2_t vs2,
                                          size_t vl);
vint64m8_t __riscv_vwmaccus_vx_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                          uint32_t rs1, vint32m4_t vs2,
                                          size_t vl);
vuint16mf4_t __riscv_vwmaccu_vv_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                            vuint8mf8_t vs1, vuint8mf8_t vs2,
                                            size_t vl);
vuint16mf4_t __riscv_vwmaccu_vx_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                            uint8_t rs1, vuint8mf8_t vs2,
                                            size_t vl);
vuint16mf2_t __riscv_vwmaccu_vv_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                            vuint8mf4_t vs1, vuint8mf4_t vs2,
                                            size_t vl);
vuint16mf2_t __riscv_vwmaccu_vx_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                            uint8_t rs1, vuint8mf4_t vs2,
                                            size_t vl);
vuint16m1_t __riscv_vwmaccu_vv_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                          vuint8mf2_t vs1, vuint8mf2_t vs2,
                                          size_t vl);
vuint16m1_t __riscv_vwmaccu_vx_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                          uint8_t rs1, vuint8mf2_t vs2,
                                          size_t vl);
vuint16m2_t __riscv_vwmaccu_vv_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                          vuint8m1_t vs1, vuint8m1_t vs2,
                                          size_t vl);
vuint16m2_t __riscv_vwmaccu_vx_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                          uint8_t rs1, vuint8m1_t vs2,
                                          size_t vl);
vuint16m4_t __riscv_vwmaccu_vv_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                          vuint8m2_t vs1, vuint8m2_t vs2,
                                          size_t vl);
vuint16m4_t __riscv_vwmaccu_vx_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                          uint8_t rs1, vuint8m2_t vs2,
                                          size_t vl);
vuint16m8_t __riscv_vwmaccu_vv_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                          vuint8m4_t vs1, vuint8m4_t vs2,
                                          size_t vl);
vuint16m8_t __riscv_vwmaccu_vx_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                          uint8_t rs1, vuint8m4_t vs2,
                                          size_t vl);
vuint32mf2_t __riscv_vwmaccu_vv_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                            vuint16mf4_t vs1, vuint16mf4_t vs2,
                                            size_t vl);
vuint32mf2_t __riscv_vwmaccu_vx_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                            uint16_t rs1, vuint16mf4_t vs2,
                                            size_t vl);
vuint32m1_t __riscv_vwmaccu_vv_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                          vuint16mf2_t vs1, vuint16mf2_t vs2,
                                          size_t vl);
vuint32m1_t __riscv_vwmaccu_vx_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                          uint16_t rs1, vuint16mf2_t vs2,
                                          size_t vl);
vuint32m2_t __riscv_vwmaccu_vv_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                          vuint16m1_t vs1, vuint16m1_t vs2,
                                          size_t vl);
vuint32m2_t __riscv_vwmaccu_vx_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                          uint16_t rs1, vuint16m1_t vs2,
                                          size_t vl);
vuint32m4_t __riscv_vwmaccu_vv_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                          vuint16m2_t vs1, vuint16m2_t vs2,
                                          size_t vl);
vuint32m4_t __riscv_vwmaccu_vx_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                          uint16_t rs1, vuint16m2_t vs2,
                                          size_t vl);
vuint32m8_t __riscv_vwmaccu_vv_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                          vuint16m4_t vs1, vuint16m4_t vs2,
                                          size_t vl);
vuint32m8_t __riscv_vwmaccu_vx_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                          uint16_t rs1, vuint16m4_t vs2,
                                          size_t vl);
vuint64m1_t __riscv_vwmaccu_vv_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                          vuint32mf2_t vs1, vuint32mf2_t vs2,
                                          size_t vl);
vuint64m1_t __riscv_vwmaccu_vx_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                          uint32_t rs1, vuint32mf2_t vs2,
                                          size_t vl);
vuint64m2_t __riscv_vwmaccu_vv_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                          vuint32m1_t vs1, vuint32m1_t vs2,
                                          size_t vl);
vuint64m2_t __riscv_vwmaccu_vx_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                          uint32_t rs1, vuint32m1_t vs2,
                                          size_t vl);
vuint64m4_t __riscv_vwmaccu_vv_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                          vuint32m2_t vs1, vuint32m2_t vs2,
                                          size_t vl);
vuint64m4_t __riscv_vwmaccu_vx_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                          uint32_t rs1, vuint32m2_t vs2,
                                          size_t vl);
vuint64m8_t __riscv_vwmaccu_vv_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                          vuint32m4_t vs1, vuint32m4_t vs2,
                                          size_t vl);
vuint64m8_t __riscv_vwmaccu_vx_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                          uint32_t rs1, vuint32m4_t vs2,
                                          size_t vl);
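The _tumu forms above preserve both masked-off elements and tail elements of vd. A minimal sketch of the vector-scalar signed-times-unsigned variant, using __riscv_vwmaccsu_vx_i32m2_tumu from the prototypes above (assuming <riscv_vector.h>; the helper name, the gain parameter, and the u[i] != 0 predicate are illustrative):

// Hypothetical sketch: acc[i] += (int32_t)gain * u[i] only where u[i] != 0;
// both masked-off and tail elements of the accumulator stay unchanged (_tumu).
#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

void widen_mac_su_scalar(int32_t *acc, const uint16_t *u, int16_t gain,
                         size_t n) {
  for (size_t i = 0; i < n;) {
    size_t vl = __riscv_vsetvl_e16m1(n - i);
    vuint16m1_t vu = __riscv_vle16_v_u16m1(u + i, vl);
    vint32m2_t vacc = __riscv_vle32_v_i32m2(acc + i, vl);
    vbool16_t nz = __riscv_vmsne_vx_u16m1_b16(vu, 0, vl);  // u[i] != 0
    // Signed scalar rs1 times unsigned vector vs2, accumulated into vd.
    vacc = __riscv_vwmaccsu_vx_i32m2_tumu(nz, vacc, gain, vu, vl);
    __riscv_vse32_v_i32m2(acc + i, vacc, vl);
    i += vl;
  }
}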
// masked functions (mask undisturbed: _mu)
vint16mf4_t __riscv_vwmacc_vv_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                        vint8mf8_t vs1, vint8mf8_t vs2,
                                        size_t vl);
vint16mf4_t __riscv_vwmacc_vx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                        int8_t rs1, vint8mf8_t vs2, size_t vl);
vint16mf2_t __riscv_vwmacc_vv_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                        vint8mf4_t vs1, vint8mf4_t vs2,
                                        size_t vl);
vint16mf2_t __riscv_vwmacc_vx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                        int8_t rs1, vint8mf4_t vs2, size_t vl);
vint16m1_t __riscv_vwmacc_vv_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                      vint8mf2_t vs1, vint8mf2_t vs2,
                                      size_t vl);
vint16m1_t __riscv_vwmacc_vx_i16m1_mu(vbool16_t vm, vint16m1_t vd, int8_t rs1,
                                      vint8mf2_t vs2, size_t vl);
vint16m2_t __riscv_vwmacc_vv_i16m2_mu(vbool8_t vm, vint16m2_t vd, vint8m1_t vs1,
                                      vint8m1_t vs2, size_t vl);
vint16m2_t __riscv_vwmacc_vx_i16m2_mu(vbool8_t vm, vint16m2_t vd, int8_t rs1,
                                      vint8m1_t vs2, size_t vl);
vint16m4_t __riscv_vwmacc_vv_i16m4_mu(vbool4_t vm, vint16m4_t vd, vint8m2_t vs1,
                                      vint8m2_t vs2, size_t vl);
vint16m4_t __riscv_vwmacc_vx_i16m4_mu(vbool4_t vm, vint16m4_t vd, int8_t rs1,
                                      vint8m2_t vs2, size_t vl);
vint16m8_t __riscv_vwmacc_vv_i16m8_mu(vbool2_t vm, vint16m8_t vd, vint8m4_t vs1,
                                      vint8m4_t vs2, size_t vl);
vint16m8_t __riscv_vwmacc_vx_i16m8_mu(vbool2_t vm, vint16m8_t vd, int8_t rs1,
                                      vint8m4_t vs2, size_t vl);
vint32mf2_t __riscv_vwmacc_vv_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                        vint16mf4_t vs1, vint16mf4_t vs2,
                                        size_t vl);
vint32mf2_t __riscv_vwmacc_vx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                        int16_t rs1, vint16mf4_t vs2,
                                        size_t vl);
vint32m1_t __riscv_vwmacc_vv_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                      vint16mf2_t vs1, vint16mf2_t vs2,
                                      size_t vl);
vint32m1_t __riscv_vwmacc_vx_i32m1_mu(vbool32_t vm, vint32m1_t vd, int16_t rs1,
                                      vint16mf2_t vs2, size_t vl);
vint32m2_t __riscv_vwmacc_vv_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                      vint16m1_t vs1, vint16m1_t vs2,
                                      size_t vl);
vint32m2_t __riscv_vwmacc_vx_i32m2_mu(vbool16_t vm, vint32m2_t vd, int16_t rs1,
                                      vint16m1_t vs2, size_t vl);
vint32m4_t __riscv_vwmacc_vv_i32m4_mu(vbool8_t vm, vint32m4_t vd,
                                      vint16m2_t vs1, vint16m2_t vs2,
                                      size_t vl);
vint32m4_t __riscv_vwmacc_vx_i32m4_mu(vbool8_t vm, vint32m4_t vd, int16_t rs1,
                                      vint16m2_t vs2, size_t vl);
vint32m8_t __riscv_vwmacc_vv_i32m8_mu(vbool4_t vm, vint32m8_t vd,
                                      vint16m4_t vs1, vint16m4_t vs2,
                                      size_t vl);
vint32m8_t __riscv_vwmacc_vx_i32m8_mu(vbool4_t vm, vint32m8_t vd, int16_t rs1,
                                      vint16m4_t vs2, size_t vl);
vint64m1_t __riscv_vwmacc_vv_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                      vint32mf2_t vs1, vint32mf2_t vs2,
                                      size_t vl);
vint64m1_t __riscv_vwmacc_vx_i64m1_mu(vbool64_t vm, vint64m1_t vd, int32_t rs1,
                                      vint32mf2_t vs2, size_t vl);
vint64m2_t __riscv_vwmacc_vv_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                      vint32m1_t vs1, vint32m1_t vs2,
                                      size_t vl);
vint64m2_t __riscv_vwmacc_vx_i64m2_mu(vbool32_t vm, vint64m2_t vd, int32_t rs1,
                                      vint32m1_t vs2, size_t vl);
vint64m4_t __riscv_vwmacc_vv_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                      vint32m2_t vs1, vint32m2_t vs2,
                                      size_t vl);
vint64m4_t __riscv_vwmacc_vx_i64m4_mu(vbool16_t vm, vint64m4_t vd, int32_t rs1,
                                      vint32m2_t vs2, size_t vl);
vint64m8_t __riscv_vwmacc_vv_i64m8_mu(vbool8_t vm, vint64m8_t vd,
                                      vint32m4_t vs1, vint32m4_t vs2,
                                      size_t vl);
vint64m8_t __riscv_vwmacc_vx_i64m8_mu(vbool8_t vm, vint64m8_t vd, int32_t rs1,
                                      vint32m4_t vs2, size_t vl);
vint16mf4_t __riscv_vwmaccsu_vv_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                          vint8mf8_t vs1, vuint8mf8_t vs2,
                                          size_t vl);
vint16mf4_t __riscv_vwmaccsu_vx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                          int8_t rs1, vuint8mf8_t vs2,
                                          size_t vl);
vint16mf2_t __riscv_vwmaccsu_vv_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                          vint8mf4_t vs1, vuint8mf4_t vs2,
                                          size_t vl);
vint16mf2_t __riscv_vwmaccsu_vx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                          int8_t rs1, vuint8mf4_t vs2,
                                          size_t vl);
vint16m1_t __riscv_vwmaccsu_vv_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                        vint8mf2_t vs1, vuint8mf2_t vs2,
                                        size_t vl);
vint16m1_t __riscv_vwmaccsu_vx_i16m1_mu(vbool16_t vm, vint16m1_t vd, int8_t rs1,
                                        vuint8mf2_t vs2, size_t vl);
vint16m2_t __riscv_vwmaccsu_vv_i16m2_mu(vbool8_t vm, vint16m2_t vd,
                                        vint8m1_t vs1, vuint8m1_t vs2,
                                        size_t vl);
vint16m2_t __riscv_vwmaccsu_vx_i16m2_mu(vbool8_t vm, vint16m2_t vd, int8_t rs1,
                                        vuint8m1_t vs2, size_t vl);
vint16m4_t __riscv_vwmaccsu_vv_i16m4_mu(vbool4_t vm, vint16m4_t vd,
                                        vint8m2_t vs1, vuint8m2_t vs2,
                                        size_t vl);
vint16m4_t __riscv_vwmaccsu_vx_i16m4_mu(vbool4_t vm, vint16m4_t vd, int8_t rs1,
                                        vuint8m2_t vs2, size_t vl);
vint16m8_t __riscv_vwmaccsu_vv_i16m8_mu(vbool2_t vm, vint16m8_t vd,
                                        vint8m4_t vs1, vuint8m4_t vs2,
                                        size_t vl);
vint16m8_t __riscv_vwmaccsu_vx_i16m8_mu(vbool2_t vm, vint16m8_t vd, int8_t rs1,
                                        vuint8m4_t vs2, size_t vl);
vint32mf2_t __riscv_vwmaccsu_vv_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                          vint16mf4_t vs1, vuint16mf4_t vs2,
                                          size_t vl);
vint32mf2_t __riscv_vwmaccsu_vx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                          int16_t rs1, vuint16mf4_t vs2,
                                          size_t vl);
vint32m1_t __riscv_vwmaccsu_vv_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                        vint16mf2_t vs1, vuint16mf2_t vs2,
                                        size_t vl);
vint32m1_t __riscv_vwmaccsu_vx_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                        int16_t rs1, vuint16mf2_t vs2,
                                        size_t vl);
vint32m2_t __riscv_vwmaccsu_vv_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                        vint16m1_t vs1, vuint16m1_t vs2,
                                        size_t vl);
vint32m2_t __riscv_vwmaccsu_vx_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                        int16_t rs1, vuint16m1_t vs2,
                                        size_t vl);
vint32m4_t __riscv_vwmaccsu_vv_i32m4_mu(vbool8_t vm, vint32m4_t vd,
                                        vint16m2_t vs1, vuint16m2_t vs2,
                                        size_t vl);
vint32m4_t __riscv_vwmaccsu_vx_i32m4_mu(vbool8_t vm, vint32m4_t vd, int16_t rs1,
                                        vuint16m2_t vs2, size_t vl);
vint32m8_t __riscv_vwmaccsu_vv_i32m8_mu(vbool4_t vm, vint32m8_t vd,
                                        vint16m4_t vs1, vuint16m4_t vs2,
                                        size_t vl);
vint32m8_t __riscv_vwmaccsu_vx_i32m8_mu(vbool4_t vm, vint32m8_t vd, int16_t rs1,
                                        vuint16m4_t vs2, size_t vl);
vint64m1_t __riscv_vwmaccsu_vv_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                        vint32mf2_t vs1, vuint32mf2_t vs2,
                                        size_t vl);
vint64m1_t __riscv_vwmaccsu_vx_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                        int32_t rs1, vuint32mf2_t vs2,
                                        size_t vl);
vint64m2_t __riscv_vwmaccsu_vv_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                        vint32m1_t vs1, vuint32m1_t vs2,
                                        size_t vl);
vint64m2_t __riscv_vwmaccsu_vx_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                        int32_t rs1, vuint32m1_t vs2,
                                        size_t vl);
vint64m4_t __riscv_vwmaccsu_vv_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                        vint32m2_t vs1, vuint32m2_t vs2,
                                        size_t vl);
vint64m4_t __riscv_vwmaccsu_vx_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                        int32_t rs1, vuint32m2_t vs2,
                                        size_t vl);
vint64m8_t __riscv_vwmaccsu_vv_i64m8_mu(vbool8_t vm, vint64m8_t vd,
                                        vint32m4_t vs1, vuint32m4_t vs2,
                                        size_t vl);
vint64m8_t __riscv_vwmaccsu_vx_i64m8_mu(vbool8_t vm, vint64m8_t vd, int32_t rs1,
                                        vuint32m4_t vs2, size_t vl);
vint16mf4_t __riscv_vwmaccus_vx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                          uint8_t rs1, vint8mf8_t vs2,
                                          size_t vl);
vint16mf2_t __riscv_vwmaccus_vx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                          uint8_t rs1, vint8mf4_t vs2,
                                          size_t vl);
vint16m1_t __riscv_vwmaccus_vx_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                        uint8_t rs1, vint8mf2_t vs2, size_t vl);
vint16m2_t __riscv_vwmaccus_vx_i16m2_mu(vbool8_t vm, vint16m2_t vd, uint8_t rs1,
                                        vint8m1_t vs2, size_t vl);
vint16m4_t __riscv_vwmaccus_vx_i16m4_mu(vbool4_t vm, vint16m4_t vd, uint8_t rs1,
                                        vint8m2_t vs2, size_t vl);
vint16m8_t __riscv_vwmaccus_vx_i16m8_mu(vbool2_t vm, vint16m8_t vd, uint8_t rs1,
                                        vint8m4_t vs2, size_t vl);
vint32mf2_t __riscv_vwmaccus_vx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                          uint16_t rs1, vint16mf4_t vs2,
                                          size_t vl);
vint32m1_t __riscv_vwmaccus_vx_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                        uint16_t rs1, vint16mf2_t vs2,
                                        size_t vl);
vint32m2_t __riscv_vwmaccus_vx_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                        uint16_t rs1, vint16m1_t vs2,
                                        size_t vl);
vint32m4_t __riscv_vwmaccus_vx_i32m4_mu(vbool8_t vm, vint32m4_t vd,
                                        uint16_t rs1, vint16m2_t vs2,
                                        size_t vl);
vint32m8_t __riscv_vwmaccus_vx_i32m8_mu(vbool4_t vm, vint32m8_t vd,
                                        uint16_t rs1, vint16m4_t vs2,
                                        size_t vl);
vint64m1_t __riscv_vwmaccus_vx_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                        uint32_t rs1, vint32mf2_t vs2,
                                        size_t vl);
vint64m2_t __riscv_vwmaccus_vx_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                        uint32_t rs1, vint32m1_t vs2,
                                        size_t vl);
vint64m4_t __riscv_vwmaccus_vx_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                        uint32_t rs1, vint32m2_t vs2,
                                        size_t vl);
vint64m8_t __riscv_vwmaccus_vx_i64m8_mu(vbool8_t vm, vint64m8_t vd,
                                        uint32_t rs1, vint32m4_t vs2,
                                        size_t vl);
vuint16mf4_t __riscv_vwmaccu_vv_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                          vuint8mf8_t vs1, vuint8mf8_t vs2,
                                          size_t vl);
vuint16mf4_t __riscv_vwmaccu_vx_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                          uint8_t rs1, vuint8mf8_t vs2,
                                          size_t vl);
vuint16mf2_t __riscv_vwmaccu_vv_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                          vuint8mf4_t vs1, vuint8mf4_t vs2,
                                          size_t vl);
vuint16mf2_t __riscv_vwmaccu_vx_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                          uint8_t rs1, vuint8mf4_t vs2,
                                          size_t vl);
vuint16m1_t __riscv_vwmaccu_vv_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                        vuint8mf2_t vs1, vuint8mf2_t vs2,
                                        size_t vl);
vuint16m1_t __riscv_vwmaccu_vx_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                        uint8_t rs1, vuint8mf2_t vs2,
                                        size_t vl);
vuint16m2_t __riscv_vwmaccu_vv_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                        vuint8m1_t vs1, vuint8m1_t vs2,
                                        size_t vl);
vuint16m2_t __riscv_vwmaccu_vx_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                        uint8_t rs1, vuint8m1_t vs2, size_t vl);
vuint16m4_t __riscv_vwmaccu_vv_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                        vuint8m2_t vs1, vuint8m2_t vs2,
                                        size_t vl);
vuint16m4_t __riscv_vwmaccu_vx_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                        uint8_t rs1, vuint8m2_t vs2, size_t vl);
vuint16m8_t __riscv_vwmaccu_vv_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                        vuint8m4_t vs1, vuint8m4_t vs2,
                                        size_t vl);
vuint16m8_t __riscv_vwmaccu_vx_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                        uint8_t rs1, vuint8m4_t vs2, size_t vl);
vuint32mf2_t __riscv_vwmaccu_vv_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                          vuint16mf4_t vs1, vuint16mf4_t vs2,
                                          size_t vl);
vuint32mf2_t __riscv_vwmaccu_vx_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                          uint16_t rs1, vuint16mf4_t vs2,
                                          size_t vl);
vuint32m1_t __riscv_vwmaccu_vv_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                        vuint16mf2_t vs1, vuint16mf2_t vs2,
                                        size_t vl);
vuint32m1_t __riscv_vwmaccu_vx_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                        uint16_t rs1, vuint16mf2_t vs2,
                                        size_t vl);
vuint32m2_t __riscv_vwmaccu_vv_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                        vuint16m1_t vs1, vuint16m1_t vs2,
                                        size_t vl);
vuint32m2_t __riscv_vwmaccu_vx_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                        uint16_t rs1, vuint16m1_t vs2,
                                        size_t vl);
vuint32m4_t __riscv_vwmaccu_vv_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                        vuint16m2_t vs1, vuint16m2_t vs2,
                                        size_t vl);
vuint32m4_t __riscv_vwmaccu_vx_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                        uint16_t rs1, vuint16m2_t vs2,
                                        size_t vl);
vuint32m8_t __riscv_vwmaccu_vv_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                        vuint16m4_t vs1, vuint16m4_t vs2,
                                        size_t vl);
vuint32m8_t __riscv_vwmaccu_vx_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                        uint16_t rs1, vuint16m4_t vs2,
                                        size_t vl);
vuint64m1_t __riscv_vwmaccu_vv_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                        vuint32mf2_t vs1, vuint32mf2_t vs2,
                                        size_t vl);
vuint64m1_t __riscv_vwmaccu_vx_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                        uint32_t rs1, vuint32mf2_t vs2,
                                        size_t vl);
vuint64m2_t __riscv_vwmaccu_vv_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                        vuint32m1_t vs1, vuint32m1_t vs2,
                                        size_t vl);
vuint64m2_t __riscv_vwmaccu_vx_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                        uint32_t rs1, vuint32m1_t vs2,
                                        size_t vl);
vuint64m4_t __riscv_vwmaccu_vv_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                        vuint32m2_t vs1, vuint32m2_t vs2,
                                        size_t vl);
vuint64m4_t __riscv_vwmaccu_vx_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                        uint32_t rs1, vuint32m2_t vs2,
                                        size_t vl);
vuint64m8_t __riscv_vwmaccu_vv_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                        vuint32m4_t vs1, vuint32m4_t vs2,
                                        size_t vl);
vuint64m8_t __riscv_vwmaccu_vx_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                        uint32_t rs1, vuint32m4_t vs2,
                                        size_t vl);

Vector Integer Merge Intrinsics

vint8mf8_t __riscv_vmerge_vvm_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2,
                                       vint8mf8_t vs1, vbool64_t v0, size_t vl);
vint8mf8_t __riscv_vmerge_vxm_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2,
                                       int8_t rs1, vbool64_t v0, size_t vl);
vint8mf4_t __riscv_vmerge_vvm_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2,
                                       vint8mf4_t vs1, vbool32_t v0, size_t vl);
vint8mf4_t __riscv_vmerge_vxm_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2,
                                       int8_t rs1, vbool32_t v0, size_t vl);
vint8mf2_t __riscv_vmerge_vvm_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2,
                                       vint8mf2_t vs1, vbool16_t v0, size_t vl);
vint8mf2_t __riscv_vmerge_vxm_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2,
                                       int8_t rs1, vbool16_t v0, size_t vl);
vint8m1_t __riscv_vmerge_vvm_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, vint8m1_t vs1,
                                     vbool8_t v0, size_t vl);
vint8m1_t __riscv_vmerge_vxm_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, int8_t rs1,
                                     vbool8_t v0, size_t vl);
vint8m2_t __riscv_vmerge_vvm_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, vint8m2_t vs1,
                                     vbool4_t v0, size_t vl);
vint8m2_t __riscv_vmerge_vxm_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, int8_t rs1,
                                     vbool4_t v0, size_t vl);
vint8m4_t __riscv_vmerge_vvm_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, vint8m4_t vs1,
                                     vbool2_t v0, size_t vl);
vint8m4_t __riscv_vmerge_vxm_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, int8_t rs1,
                                     vbool2_t v0, size_t vl);
vint8m8_t __riscv_vmerge_vvm_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, vint8m8_t vs1,
                                     vbool1_t v0, size_t vl);
vint8m8_t __riscv_vmerge_vxm_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, int8_t rs1,
                                     vbool1_t v0, size_t vl);
vint16mf4_t __riscv_vmerge_vvm_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                         vint16mf4_t vs1, vbool64_t v0,
                                         size_t vl);
vint16mf4_t __riscv_vmerge_vxm_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                         int16_t rs1, vbool64_t v0, size_t vl);
vint16mf2_t __riscv_vmerge_vvm_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                         vint16mf2_t vs1, vbool32_t v0,
                                         size_t vl);
vint16mf2_t __riscv_vmerge_vxm_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                         int16_t rs1, vbool32_t v0, size_t vl);
vint16m1_t __riscv_vmerge_vvm_i16m1_tu(vint16m1_t vd, vint16m1_t vs2,
                                       vint16m1_t vs1, vbool16_t v0, size_t vl);
vint16m1_t __riscv_vmerge_vxm_i16m1_tu(vint16m1_t vd, vint16m1_t vs2,
                                       int16_t rs1, vbool16_t v0, size_t vl);
vint16m2_t __riscv_vmerge_vvm_i16m2_tu(vint16m2_t vd, vint16m2_t vs2,
                                       vint16m2_t vs1, vbool8_t v0, size_t vl);
vint16m2_t __riscv_vmerge_vxm_i16m2_tu(vint16m2_t vd, vint16m2_t vs2,
                                       int16_t rs1, vbool8_t v0, size_t vl);
vint16m4_t __riscv_vmerge_vvm_i16m4_tu(vint16m4_t vd, vint16m4_t vs2,
                                       vint16m4_t vs1, vbool4_t v0, size_t vl);
vint16m4_t __riscv_vmerge_vxm_i16m4_tu(vint16m4_t vd, vint16m4_t vs2,
                                       int16_t rs1, vbool4_t v0, size_t vl);
vint16m8_t __riscv_vmerge_vvm_i16m8_tu(vint16m8_t vd, vint16m8_t vs2,
                                       vint16m8_t vs1, vbool2_t v0, size_t vl);
vint16m8_t __riscv_vmerge_vxm_i16m8_tu(vint16m8_t vd, vint16m8_t vs2,
                                       int16_t rs1, vbool2_t v0, size_t vl);
vint32mf2_t __riscv_vmerge_vvm_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                         vint32mf2_t vs1, vbool64_t v0,
                                         size_t vl);
vint32mf2_t __riscv_vmerge_vxm_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                         int32_t rs1, vbool64_t v0, size_t vl);
vint32m1_t __riscv_vmerge_vvm_i32m1_tu(vint32m1_t vd, vint32m1_t vs2,
                                       vint32m1_t vs1, vbool32_t v0, size_t vl);
vint32m1_t __riscv_vmerge_vxm_i32m1_tu(vint32m1_t vd, vint32m1_t vs2,
                                       int32_t rs1, vbool32_t v0, size_t vl);
vint32m2_t __riscv_vmerge_vvm_i32m2_tu(vint32m2_t vd, vint32m2_t vs2,
                                       vint32m2_t vs1, vbool16_t v0, size_t vl);
vint32m2_t __riscv_vmerge_vxm_i32m2_tu(vint32m2_t vd, vint32m2_t vs2,
                                       int32_t rs1, vbool16_t v0, size_t vl);
vint32m4_t __riscv_vmerge_vvm_i32m4_tu(vint32m4_t vd, vint32m4_t vs2,
                                       vint32m4_t vs1, vbool8_t v0, size_t vl);
vint32m4_t __riscv_vmerge_vxm_i32m4_tu(vint32m4_t vd, vint32m4_t vs2,
                                       int32_t rs1, vbool8_t v0, size_t vl);
vint32m8_t __riscv_vmerge_vvm_i32m8_tu(vint32m8_t vd, vint32m8_t vs2,
                                       vint32m8_t vs1, vbool4_t v0, size_t vl);
vint32m8_t __riscv_vmerge_vxm_i32m8_tu(vint32m8_t vd, vint32m8_t vs2,
                                       int32_t rs1, vbool4_t v0, size_t vl);
vint64m1_t __riscv_vmerge_vvm_i64m1_tu(vint64m1_t vd, vint64m1_t vs2,
                                       vint64m1_t vs1, vbool64_t v0, size_t vl);
vint64m1_t __riscv_vmerge_vxm_i64m1_tu(vint64m1_t vd, vint64m1_t vs2,
                                       int64_t rs1, vbool64_t v0, size_t vl);
vint64m2_t __riscv_vmerge_vvm_i64m2_tu(vint64m2_t vd, vint64m2_t vs2,
                                       vint64m2_t vs1, vbool32_t v0, size_t vl);
vint64m2_t __riscv_vmerge_vxm_i64m2_tu(vint64m2_t vd, vint64m2_t vs2,
                                       int64_t rs1, vbool32_t v0, size_t vl);
vint64m4_t __riscv_vmerge_vvm_i64m4_tu(vint64m4_t vd, vint64m4_t vs2,
                                       vint64m4_t vs1, vbool16_t v0, size_t vl);
vint64m4_t __riscv_vmerge_vxm_i64m4_tu(vint64m4_t vd, vint64m4_t vs2,
                                       int64_t rs1, vbool16_t v0, size_t vl);
vint64m8_t __riscv_vmerge_vvm_i64m8_tu(vint64m8_t vd, vint64m8_t vs2,
                                       vint64m8_t vs1, vbool8_t v0, size_t vl);
vint64m8_t __riscv_vmerge_vxm_i64m8_tu(vint64m8_t vd, vint64m8_t vs2,
                                       int64_t rs1, vbool8_t v0, size_t vl);
vuint8mf8_t __riscv_vmerge_vvm_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                        vuint8mf8_t vs1, vbool64_t v0,
                                        size_t vl);
vuint8mf8_t __riscv_vmerge_vxm_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                        uint8_t rs1, vbool64_t v0, size_t vl);
vuint8mf4_t __riscv_vmerge_vvm_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                        vuint8mf4_t vs1, vbool32_t v0,
                                        size_t vl);
vuint8mf4_t __riscv_vmerge_vxm_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                        uint8_t rs1, vbool32_t v0, size_t vl);
vuint8mf2_t __riscv_vmerge_vvm_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                        vuint8mf2_t vs1, vbool16_t v0,
                                        size_t vl);
vuint8mf2_t __riscv_vmerge_vxm_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                        uint8_t rs1, vbool16_t v0, size_t vl);
vuint8m1_t __riscv_vmerge_vvm_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2,
                                      vuint8m1_t vs1, vbool8_t v0, size_t vl);
vuint8m1_t __riscv_vmerge_vxm_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2,
                                      uint8_t rs1, vbool8_t v0, size_t vl);
vuint8m2_t __riscv_vmerge_vvm_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2,
                                      vuint8m2_t vs1, vbool4_t v0, size_t vl);
vuint8m2_t __riscv_vmerge_vxm_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2,
                                      uint8_t rs1, vbool4_t v0, size_t vl);
vuint8m4_t __riscv_vmerge_vvm_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2,
                                      vuint8m4_t vs1, vbool2_t v0, size_t vl);
vuint8m4_t __riscv_vmerge_vxm_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2,
                                      uint8_t rs1, vbool2_t v0, size_t vl);
vuint8m8_t __riscv_vmerge_vvm_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2,
                                      vuint8m8_t vs1, vbool1_t v0, size_t vl);
vuint8m8_t __riscv_vmerge_vxm_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2,
                                      uint8_t rs1, vbool1_t v0, size_t vl);
vuint16mf4_t __riscv_vmerge_vvm_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                          vuint16mf4_t vs1, vbool64_t v0,
                                          size_t vl);
vuint16mf4_t __riscv_vmerge_vxm_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                          uint16_t rs1, vbool64_t v0,
                                          size_t vl);
vuint16mf2_t __riscv_vmerge_vvm_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                          vuint16mf2_t vs1, vbool32_t v0,
                                          size_t vl);
vuint16mf2_t __riscv_vmerge_vxm_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                          uint16_t rs1, vbool32_t v0,
                                          size_t vl);
vuint16m1_t __riscv_vmerge_vvm_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                        vuint16m1_t vs1, vbool16_t v0,
                                        size_t vl);
vuint16m1_t __riscv_vmerge_vxm_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                        uint16_t rs1, vbool16_t v0, size_t vl);
vuint16m2_t __riscv_vmerge_vvm_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                        vuint16m2_t vs1, vbool8_t v0,
                                        size_t vl);
vuint16m2_t __riscv_vmerge_vxm_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                        uint16_t rs1, vbool8_t v0, size_t vl);
vuint16m4_t __riscv_vmerge_vvm_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                        vuint16m4_t vs1, vbool4_t v0,
                                        size_t vl);
vuint16m4_t __riscv_vmerge_vxm_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                        uint16_t rs1, vbool4_t v0, size_t vl);
vuint16m8_t __riscv_vmerge_vvm_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                        vuint16m8_t vs1, vbool2_t v0,
                                        size_t vl);
vuint16m8_t __riscv_vmerge_vxm_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                        uint16_t rs1, vbool2_t v0, size_t vl);
vuint32mf2_t __riscv_vmerge_vvm_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                          vuint32mf2_t vs1, vbool64_t v0,
                                          size_t vl);
vuint32mf2_t __riscv_vmerge_vxm_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                          uint32_t rs1, vbool64_t v0,
                                          size_t vl);
vuint32m1_t __riscv_vmerge_vvm_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                        vuint32m1_t vs1, vbool32_t v0,
                                        size_t vl);
vuint32m1_t __riscv_vmerge_vxm_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                        uint32_t rs1, vbool32_t v0, size_t vl);
vuint32m2_t __riscv_vmerge_vvm_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                        vuint32m2_t vs1, vbool16_t v0,
                                        size_t vl);
vuint32m2_t __riscv_vmerge_vxm_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                        uint32_t rs1, vbool16_t v0, size_t vl);
vuint32m4_t __riscv_vmerge_vvm_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                        vuint32m4_t vs1, vbool8_t v0,
                                        size_t vl);
vuint32m4_t __riscv_vmerge_vxm_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                        uint32_t rs1, vbool8_t v0, size_t vl);
vuint32m8_t __riscv_vmerge_vvm_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                        vuint32m8_t vs1, vbool4_t v0,
                                        size_t vl);
vuint32m8_t __riscv_vmerge_vxm_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                        uint32_t rs1, vbool4_t v0, size_t vl);
vuint64m1_t __riscv_vmerge_vvm_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                        vuint64m1_t vs1, vbool64_t v0,
                                        size_t vl);
vuint64m1_t __riscv_vmerge_vxm_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                        uint64_t rs1, vbool64_t v0, size_t vl);
vuint64m2_t __riscv_vmerge_vvm_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                        vuint64m2_t vs1, vbool32_t v0,
                                        size_t vl);
vuint64m2_t __riscv_vmerge_vxm_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                        uint64_t rs1, vbool32_t v0, size_t vl);
vuint64m4_t __riscv_vmerge_vvm_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                        vuint64m4_t vs1, vbool16_t v0,
                                        size_t vl);
vuint64m4_t __riscv_vmerge_vxm_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                        uint64_t rs1, vbool16_t v0, size_t vl);
vuint64m8_t __riscv_vmerge_vvm_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                        vuint64m8_t vs1, vbool8_t v0,
                                        size_t vl);
vuint64m8_t __riscv_vmerge_vxm_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                        uint64_t rs1, vbool8_t v0, size_t vl);
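
A minimal usage sketch for the tail-undisturbed (_tu) merge forms listed above; it is illustrative only and not part of the listing. The clamp_negatives_tu helper is an assumption made up for this example: it builds a mask of negative elements and merges in the scalar 0 where the mask is set, while the _tu policy leaves elements at indices at or beyond vl unchanged in vd.

#include <riscv_vector.h>
#include <stdint.h>
#include <stddef.h>

vint32m1_t clamp_negatives_tu(vint32m1_t vd, vint32m1_t vs2, size_t vl) {
  /* Mask of elements of vs2 that are negative. */
  vbool32_t v0 = __riscv_vmslt_vx_i32m1_b32(vs2, 0, vl);
  /* Where the mask bit is set, take the scalar 0; elsewhere take vs2.
     Elements at indices >= vl keep their old value from vd (tail undisturbed). */
  return __riscv_vmerge_vxm_i32m1_tu(vd, vs2, 0, v0, vl);
}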

Vector Integer Move Intrinsics

vint8mf8_t __riscv_vmv_v_v_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vmv_v_x_i8mf8_tu(vint8mf8_t vd, int8_t rs1, size_t vl);
vint8mf4_t __riscv_vmv_v_v_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vmv_v_x_i8mf4_tu(vint8mf4_t vd, int8_t rs1, size_t vl);
vint8mf2_t __riscv_vmv_v_v_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vmv_v_x_i8mf2_tu(vint8mf2_t vd, int8_t rs1, size_t vl);
vint8m1_t __riscv_vmv_v_v_i8m1_tu(vint8m1_t vd, vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vmv_v_x_i8m1_tu(vint8m1_t vd, int8_t rs1, size_t vl);
vint8m2_t __riscv_vmv_v_v_i8m2_tu(vint8m2_t vd, vint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vmv_v_x_i8m2_tu(vint8m2_t vd, int8_t rs1, size_t vl);
vint8m4_t __riscv_vmv_v_v_i8m4_tu(vint8m4_t vd, vint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vmv_v_x_i8m4_tu(vint8m4_t vd, int8_t rs1, size_t vl);
vint8m8_t __riscv_vmv_v_v_i8m8_tu(vint8m8_t vd, vint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vmv_v_x_i8m8_tu(vint8m8_t vd, int8_t rs1, size_t vl);
vint16mf4_t __riscv_vmv_v_v_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs1,
                                      size_t vl);
vint16mf4_t __riscv_vmv_v_x_i16mf4_tu(vint16mf4_t vd, int16_t rs1, size_t vl);
vint16mf2_t __riscv_vmv_v_v_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs1,
                                      size_t vl);
vint16mf2_t __riscv_vmv_v_x_i16mf2_tu(vint16mf2_t vd, int16_t rs1, size_t vl);
vint16m1_t __riscv_vmv_v_v_i16m1_tu(vint16m1_t vd, vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vmv_v_x_i16m1_tu(vint16m1_t vd, int16_t rs1, size_t vl);
vint16m2_t __riscv_vmv_v_v_i16m2_tu(vint16m2_t vd, vint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vmv_v_x_i16m2_tu(vint16m2_t vd, int16_t rs1, size_t vl);
vint16m4_t __riscv_vmv_v_v_i16m4_tu(vint16m4_t vd, vint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vmv_v_x_i16m4_tu(vint16m4_t vd, int16_t rs1, size_t vl);
vint16m8_t __riscv_vmv_v_v_i16m8_tu(vint16m8_t vd, vint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vmv_v_x_i16m8_tu(vint16m8_t vd, int16_t rs1, size_t vl);
vint32mf2_t __riscv_vmv_v_v_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs1,
                                      size_t vl);
vint32mf2_t __riscv_vmv_v_x_i32mf2_tu(vint32mf2_t vd, int32_t rs1, size_t vl);
vint32m1_t __riscv_vmv_v_v_i32m1_tu(vint32m1_t vd, vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vmv_v_x_i32m1_tu(vint32m1_t vd, int32_t rs1, size_t vl);
vint32m2_t __riscv_vmv_v_v_i32m2_tu(vint32m2_t vd, vint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vmv_v_x_i32m2_tu(vint32m2_t vd, int32_t rs1, size_t vl);
vint32m4_t __riscv_vmv_v_v_i32m4_tu(vint32m4_t vd, vint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vmv_v_x_i32m4_tu(vint32m4_t vd, int32_t rs1, size_t vl);
vint32m8_t __riscv_vmv_v_v_i32m8_tu(vint32m8_t vd, vint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vmv_v_x_i32m8_tu(vint32m8_t vd, int32_t rs1, size_t vl);
vint64m1_t __riscv_vmv_v_v_i64m1_tu(vint64m1_t vd, vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vmv_v_x_i64m1_tu(vint64m1_t vd, int64_t rs1, size_t vl);
vint64m2_t __riscv_vmv_v_v_i64m2_tu(vint64m2_t vd, vint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vmv_v_x_i64m2_tu(vint64m2_t vd, int64_t rs1, size_t vl);
vint64m4_t __riscv_vmv_v_v_i64m4_tu(vint64m4_t vd, vint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vmv_v_x_i64m4_tu(vint64m4_t vd, int64_t rs1, size_t vl);
vint64m8_t __riscv_vmv_v_v_i64m8_tu(vint64m8_t vd, vint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vmv_v_x_i64m8_tu(vint64m8_t vd, int64_t rs1, size_t vl);
vuint8mf8_t __riscv_vmv_v_v_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs1,
                                     size_t vl);
vuint8mf8_t __riscv_vmv_v_x_u8mf8_tu(vuint8mf8_t vd, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vmv_v_v_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs1,
                                     size_t vl);
vuint8mf4_t __riscv_vmv_v_x_u8mf4_tu(vuint8mf4_t vd, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vmv_v_v_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs1,
                                     size_t vl);
vuint8mf2_t __riscv_vmv_v_x_u8mf2_tu(vuint8mf2_t vd, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vmv_v_v_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vmv_v_x_u8m1_tu(vuint8m1_t vd, uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vmv_v_v_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vmv_v_x_u8m2_tu(vuint8m2_t vd, uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vmv_v_v_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vmv_v_x_u8m4_tu(vuint8m4_t vd, uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vmv_v_v_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vmv_v_x_u8m8_tu(vuint8m8_t vd, uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vmv_v_v_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs1,
                                       size_t vl);
vuint16mf4_t __riscv_vmv_v_x_u16mf4_tu(vuint16mf4_t vd, uint16_t rs1,
                                       size_t vl);
vuint16mf2_t __riscv_vmv_v_v_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs1,
                                       size_t vl);
vuint16mf2_t __riscv_vmv_v_x_u16mf2_tu(vuint16mf2_t vd, uint16_t rs1,
                                       size_t vl);
vuint16m1_t __riscv_vmv_v_v_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs1,
                                     size_t vl);
vuint16m1_t __riscv_vmv_v_x_u16m1_tu(vuint16m1_t vd, uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vmv_v_v_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs1,
                                     size_t vl);
vuint16m2_t __riscv_vmv_v_x_u16m2_tu(vuint16m2_t vd, uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vmv_v_v_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs1,
                                     size_t vl);
vuint16m4_t __riscv_vmv_v_x_u16m4_tu(vuint16m4_t vd, uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vmv_v_v_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs1,
                                     size_t vl);
vuint16m8_t __riscv_vmv_v_x_u16m8_tu(vuint16m8_t vd, uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vmv_v_v_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs1,
                                       size_t vl);
vuint32mf2_t __riscv_vmv_v_x_u32mf2_tu(vuint32mf2_t vd, uint32_t rs1,
                                       size_t vl);
vuint32m1_t __riscv_vmv_v_v_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs1,
                                     size_t vl);
vuint32m1_t __riscv_vmv_v_x_u32m1_tu(vuint32m1_t vd, uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vmv_v_v_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs1,
                                     size_t vl);
vuint32m2_t __riscv_vmv_v_x_u32m2_tu(vuint32m2_t vd, uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vmv_v_v_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs1,
                                     size_t vl);
vuint32m4_t __riscv_vmv_v_x_u32m4_tu(vuint32m4_t vd, uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vmv_v_v_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs1,
                                     size_t vl);
vuint32m8_t __riscv_vmv_v_x_u32m8_tu(vuint32m8_t vd, uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vmv_v_v_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs1,
                                     size_t vl);
vuint64m1_t __riscv_vmv_v_x_u64m1_tu(vuint64m1_t vd, uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vmv_v_v_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs1,
                                     size_t vl);
vuint64m2_t __riscv_vmv_v_x_u64m2_tu(vuint64m2_t vd, uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vmv_v_v_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs1,
                                     size_t vl);
vuint64m4_t __riscv_vmv_v_x_u64m4_tu(vuint64m4_t vd, uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vmv_v_v_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs1,
                                     size_t vl);
vuint64m8_t __riscv_vmv_v_x_u64m8_tu(vuint64m8_t vd, uint64_t rs1, size_t vl);
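
A minimal usage sketch for the tail-undisturbed (_tu) move forms listed above; it is illustrative only and not part of the listing. The splat_prefix_tu helper is an assumption made up for this example: it broadcasts a scalar into the first vl elements of an existing register and, under the tu policy, leaves the tail elements of vd untouched.

#include <riscv_vector.h>
#include <stdint.h>
#include <stddef.h>

vuint32m1_t splat_prefix_tu(vuint32m1_t vd, uint32_t value, size_t vl) {
  /* vd[0..vl-1] = value; elements at indices >= vl keep their value from vd. */
  return __riscv_vmv_v_x_u32m1_tu(vd, value, vl);
}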