Vector Floating-Point Intrinsics

Vector Single-Width Floating-Point Add/Subtract Intrinsics

// vfadd, `_tu` policy variants (no mask operand).
// Declared for f16 (mf4..m8), f32 (mf2..m8) and f64 (m1..m8), each in two
// forms:
//   _vv_ : second source operand is a vector `vs1` of the same type as `vs2`
//   _vf_ : second source operand is a scalar `rs1` (_Float16 / float / double,
//          matching the element width)
// `vd` has the same vector type as the return value; `vl` is a size_t.
// NOTE(review): in the RVV intrinsics naming scheme `_tu` should stand for
// "tail undisturbed", with `vd` supplying the preserved tail elements and
// `vl` the number of elements processed - confirm against the intrinsics
// specification.
vfloat16mf4_t __riscv_vfadd_vv_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                         vfloat16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vfadd_vf_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                         _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfadd_vv_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                         vfloat16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vfadd_vf_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                         _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfadd_vv_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                       vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfadd_vf_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                       _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfadd_vv_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                       vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfadd_vf_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                       _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfadd_vv_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                       vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfadd_vf_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                       _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfadd_vv_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                       vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfadd_vf_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                       _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfadd_vv_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                         vfloat32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfadd_vf_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                         float rs1, size_t vl);
vfloat32m1_t __riscv_vfadd_vv_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                       vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfadd_vf_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                       float rs1, size_t vl);
vfloat32m2_t __riscv_vfadd_vv_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                       vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfadd_vf_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                       float rs1, size_t vl);
vfloat32m4_t __riscv_vfadd_vv_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                       vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfadd_vf_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                       float rs1, size_t vl);
vfloat32m8_t __riscv_vfadd_vv_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                       vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfadd_vf_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                       float rs1, size_t vl);
vfloat64m1_t __riscv_vfadd_vv_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                       vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfadd_vf_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                       double rs1, size_t vl);
vfloat64m2_t __riscv_vfadd_vv_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                       vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfadd_vf_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                       double rs1, size_t vl);
vfloat64m4_t __riscv_vfadd_vv_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                       vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfadd_vf_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                       double rs1, size_t vl);
vfloat64m8_t __riscv_vfadd_vv_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                       vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfadd_vf_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                       double rs1, size_t vl);
// vfsub, `_tu` policy variants (no mask operand).
// Declared for f16 (mf4..m8), f32 (mf2..m8) and f64 (m1..m8), each in two
// forms:
//   _vv_ : second source operand is a vector `vs1` of the same type as `vs2`
//   _vf_ : second source operand is a scalar `rs1` (_Float16 / float / double,
//          matching the element width)
// `vd` has the same vector type as the return value; `vl` is a size_t.
// NOTE(review): operand order is presumably vs2 - vs1 (or vs2 - rs1), and
// `_tu` presumably means "tail undisturbed" with `vd` supplying the preserved
// tail elements - confirm both against the RVV specifications.
vfloat16mf4_t __riscv_vfsub_vv_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                         vfloat16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vfsub_vf_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                         _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfsub_vv_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                         vfloat16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vfsub_vf_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                         _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfsub_vv_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                       vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfsub_vf_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                       _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfsub_vv_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                       vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfsub_vf_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                       _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfsub_vv_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                       vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfsub_vf_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                       _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfsub_vv_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                       vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfsub_vf_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                       _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfsub_vv_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                         vfloat32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfsub_vf_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                         float rs1, size_t vl);
vfloat32m1_t __riscv_vfsub_vv_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                       vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfsub_vf_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                       float rs1, size_t vl);
vfloat32m2_t __riscv_vfsub_vv_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                       vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfsub_vf_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                       float rs1, size_t vl);
vfloat32m4_t __riscv_vfsub_vv_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                       vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfsub_vf_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                       float rs1, size_t vl);
vfloat32m8_t __riscv_vfsub_vv_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                       vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfsub_vf_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                       float rs1, size_t vl);
vfloat64m1_t __riscv_vfsub_vv_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                       vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfsub_vf_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                       double rs1, size_t vl);
vfloat64m2_t __riscv_vfsub_vv_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                       vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfsub_vf_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                       double rs1, size_t vl);
vfloat64m4_t __riscv_vfsub_vv_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                       vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfsub_vf_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                       double rs1, size_t vl);
vfloat64m8_t __riscv_vfsub_vv_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                       vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfsub_vf_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                       double rs1, size_t vl);
// vfrsub, `_tu` policy variants (no mask operand).
// Only the _vf_ form is declared: a vector `vs2` plus a scalar `rs1`
// (_Float16 / float / double, matching the element width), for f16 (mf4..m8),
// f32 (mf2..m8) and f64 (m1..m8).
// `vd` has the same vector type as the return value; `vl` is a size_t.
// NOTE(review): "rsub" presumably means reverse subtract (rs1 - vs2), and
// `_tu` presumably means "tail undisturbed" with `vd` supplying the preserved
// tail elements - confirm both against the RVV specifications.
vfloat16mf4_t __riscv_vfrsub_vf_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                          _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfrsub_vf_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                          _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfrsub_vf_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                        _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfrsub_vf_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                        _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfrsub_vf_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                        _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfrsub_vf_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                        _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfrsub_vf_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                          float rs1, size_t vl);
vfloat32m1_t __riscv_vfrsub_vf_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                        float rs1, size_t vl);
vfloat32m2_t __riscv_vfrsub_vf_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                        float rs1, size_t vl);
vfloat32m4_t __riscv_vfrsub_vf_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                        float rs1, size_t vl);
vfloat32m8_t __riscv_vfrsub_vf_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                        float rs1, size_t vl);
vfloat64m1_t __riscv_vfrsub_vf_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                        double rs1, size_t vl);
vfloat64m2_t __riscv_vfrsub_vf_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                        double rs1, size_t vl);
vfloat64m4_t __riscv_vfrsub_vf_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                        double rs1, size_t vl);
vfloat64m8_t __riscv_vfrsub_vf_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                        double rs1, size_t vl);
// vfneg, `_tu` policy variants (no mask operand).
// Unary _v_ form only: a single source vector `vs` (note: `vs`, not `vs2`),
// declared for f16 (mf4..m8), f32 (mf2..m8) and f64 (m1..m8).
// `vd` has the same vector type as the return value; `vl` is a size_t.
// NOTE(review): presumably element-wise floating-point negation of `vs`, with
// `_tu` meaning "tail undisturbed" and `vd` supplying the preserved tail
// elements - confirm against the RVV specifications.
vfloat16mf4_t __riscv_vfneg_v_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs,
                                        size_t vl);
vfloat16mf2_t __riscv_vfneg_v_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs,
                                        size_t vl);
vfloat16m1_t __riscv_vfneg_v_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs,
                                      size_t vl);
vfloat16m2_t __riscv_vfneg_v_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs,
                                      size_t vl);
vfloat16m4_t __riscv_vfneg_v_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs,
                                      size_t vl);
vfloat16m8_t __riscv_vfneg_v_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs,
                                      size_t vl);
vfloat32mf2_t __riscv_vfneg_v_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs,
                                        size_t vl);
vfloat32m1_t __riscv_vfneg_v_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs,
                                      size_t vl);
vfloat32m2_t __riscv_vfneg_v_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs,
                                      size_t vl);
vfloat32m4_t __riscv_vfneg_v_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs,
                                      size_t vl);
vfloat32m8_t __riscv_vfneg_v_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs,
                                      size_t vl);
vfloat64m1_t __riscv_vfneg_v_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs,
                                      size_t vl);
vfloat64m2_t __riscv_vfneg_v_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs,
                                      size_t vl);
vfloat64m4_t __riscv_vfneg_v_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs,
                                      size_t vl);
vfloat64m8_t __riscv_vfneg_v_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs,
                                      size_t vl);
// masked functions (`_tum` policy variants)
// vfadd, `_tum` policy variants (masked).
// Every declaration takes a leading mask operand `vm` of type vboolN_t, where
// N equals the element width divided by LMUL in each declaration below
// (e.g. f16mf4 -> vbool64_t, f32m1 -> vbool32_t, f64m8 -> vbool8_t).
// Two forms per element type/LMUL (f16 mf4..m8, f32 mf2..m8, f64 m1..m8):
//   _vv_ : second source operand is a vector `vs1` of the same type as `vs2`
//   _vf_ : second source operand is a scalar `rs1` (_Float16 / float / double)
// `vd` has the same vector type as the return value; `vl` is a size_t.
// NOTE(review): `_tum` presumably means "tail undisturbed, mask agnostic" in
// the RVV intrinsics naming scheme - confirm against the intrinsics
// specification.
vfloat16mf4_t __riscv_vfadd_vv_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                          vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                          size_t vl);
vfloat16mf4_t __riscv_vfadd_vf_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                          vfloat16mf4_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16mf2_t __riscv_vfadd_vv_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                          vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                          size_t vl);
vfloat16mf2_t __riscv_vfadd_vf_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                          vfloat16mf2_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16m1_t __riscv_vfadd_vv_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                        vfloat16m1_t vs2, vfloat16m1_t vs1,
                                        size_t vl);
vfloat16m1_t __riscv_vfadd_vf_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                        vfloat16m1_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat16m2_t __riscv_vfadd_vv_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                        vfloat16m2_t vs2, vfloat16m2_t vs1,
                                        size_t vl);
vfloat16m2_t __riscv_vfadd_vf_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                        vfloat16m2_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat16m4_t __riscv_vfadd_vv_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                        vfloat16m4_t vs2, vfloat16m4_t vs1,
                                        size_t vl);
vfloat16m4_t __riscv_vfadd_vf_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                        vfloat16m4_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat16m8_t __riscv_vfadd_vv_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                        vfloat16m8_t vs2, vfloat16m8_t vs1,
                                        size_t vl);
vfloat16m8_t __riscv_vfadd_vf_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                        vfloat16m8_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat32mf2_t __riscv_vfadd_vv_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                          size_t vl);
vfloat32mf2_t __riscv_vfadd_vf_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat32mf2_t vs2, float rs1,
                                          size_t vl);
vfloat32m1_t __riscv_vfadd_vv_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat32m1_t vs2, vfloat32m1_t vs1,
                                        size_t vl);
vfloat32m1_t __riscv_vfadd_vf_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat32m1_t vs2, float rs1, size_t vl);
vfloat32m2_t __riscv_vfadd_vv_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat32m2_t vs2, vfloat32m2_t vs1,
                                        size_t vl);
vfloat32m2_t __riscv_vfadd_vf_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat32m2_t vs2, float rs1, size_t vl);
vfloat32m4_t __riscv_vfadd_vv_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat32m4_t vs2, vfloat32m4_t vs1,
                                        size_t vl);
vfloat32m4_t __riscv_vfadd_vf_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat32m4_t vs2, float rs1, size_t vl);
vfloat32m8_t __riscv_vfadd_vv_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat32m8_t vs2, vfloat32m8_t vs1,
                                        size_t vl);
vfloat32m8_t __riscv_vfadd_vf_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat32m8_t vs2, float rs1, size_t vl);
vfloat64m1_t __riscv_vfadd_vv_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat64m1_t vs2, vfloat64m1_t vs1,
                                        size_t vl);
vfloat64m1_t __riscv_vfadd_vf_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat64m1_t vs2, double rs1,
                                        size_t vl);
vfloat64m2_t __riscv_vfadd_vv_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat64m2_t vs2, vfloat64m2_t vs1,
                                        size_t vl);
vfloat64m2_t __riscv_vfadd_vf_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat64m2_t vs2, double rs1,
                                        size_t vl);
vfloat64m4_t __riscv_vfadd_vv_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat64m4_t vs2, vfloat64m4_t vs1,
                                        size_t vl);
vfloat64m4_t __riscv_vfadd_vf_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat64m4_t vs2, double rs1,
                                        size_t vl);
vfloat64m8_t __riscv_vfadd_vv_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat64m8_t vs2, vfloat64m8_t vs1,
                                        size_t vl);
vfloat64m8_t __riscv_vfadd_vf_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat64m8_t vs2, double rs1,
                                        size_t vl);
// vfsub, `_tum` policy variants (masked).
// Every declaration takes a leading mask operand `vm` of type vboolN_t, where
// N equals the element width divided by LMUL in each declaration below
// (e.g. f16mf4 -> vbool64_t, f32m1 -> vbool32_t, f64m8 -> vbool8_t).
// Two forms per element type/LMUL (f16 mf4..m8, f32 mf2..m8, f64 m1..m8):
//   _vv_ : second source operand is a vector `vs1` of the same type as `vs2`
//   _vf_ : second source operand is a scalar `rs1` (_Float16 / float / double)
// `vd` has the same vector type as the return value; `vl` is a size_t.
// NOTE(review): operand order is presumably vs2 - vs1 (or vs2 - rs1), and
// `_tum` presumably means "tail undisturbed, mask agnostic" - confirm both
// against the RVV specifications.
vfloat16mf4_t __riscv_vfsub_vv_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                          vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                          size_t vl);
vfloat16mf4_t __riscv_vfsub_vf_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                          vfloat16mf4_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16mf2_t __riscv_vfsub_vv_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                          vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                          size_t vl);
vfloat16mf2_t __riscv_vfsub_vf_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                          vfloat16mf2_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16m1_t __riscv_vfsub_vv_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                        vfloat16m1_t vs2, vfloat16m1_t vs1,
                                        size_t vl);
vfloat16m1_t __riscv_vfsub_vf_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                        vfloat16m1_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat16m2_t __riscv_vfsub_vv_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                        vfloat16m2_t vs2, vfloat16m2_t vs1,
                                        size_t vl);
vfloat16m2_t __riscv_vfsub_vf_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                        vfloat16m2_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat16m4_t __riscv_vfsub_vv_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                        vfloat16m4_t vs2, vfloat16m4_t vs1,
                                        size_t vl);
vfloat16m4_t __riscv_vfsub_vf_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                        vfloat16m4_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat16m8_t __riscv_vfsub_vv_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                        vfloat16m8_t vs2, vfloat16m8_t vs1,
                                        size_t vl);
vfloat16m8_t __riscv_vfsub_vf_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                        vfloat16m8_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat32mf2_t __riscv_vfsub_vv_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                          size_t vl);
vfloat32mf2_t __riscv_vfsub_vf_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat32mf2_t vs2, float rs1,
                                          size_t vl);
vfloat32m1_t __riscv_vfsub_vv_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat32m1_t vs2, vfloat32m1_t vs1,
                                        size_t vl);
vfloat32m1_t __riscv_vfsub_vf_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat32m1_t vs2, float rs1, size_t vl);
vfloat32m2_t __riscv_vfsub_vv_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat32m2_t vs2, vfloat32m2_t vs1,
                                        size_t vl);
vfloat32m2_t __riscv_vfsub_vf_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat32m2_t vs2, float rs1, size_t vl);
vfloat32m4_t __riscv_vfsub_vv_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat32m4_t vs2, vfloat32m4_t vs1,
                                        size_t vl);
vfloat32m4_t __riscv_vfsub_vf_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat32m4_t vs2, float rs1, size_t vl);
vfloat32m8_t __riscv_vfsub_vv_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat32m8_t vs2, vfloat32m8_t vs1,
                                        size_t vl);
vfloat32m8_t __riscv_vfsub_vf_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat32m8_t vs2, float rs1, size_t vl);
vfloat64m1_t __riscv_vfsub_vv_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat64m1_t vs2, vfloat64m1_t vs1,
                                        size_t vl);
vfloat64m1_t __riscv_vfsub_vf_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat64m1_t vs2, double rs1,
                                        size_t vl);
vfloat64m2_t __riscv_vfsub_vv_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat64m2_t vs2, vfloat64m2_t vs1,
                                        size_t vl);
vfloat64m2_t __riscv_vfsub_vf_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat64m2_t vs2, double rs1,
                                        size_t vl);
vfloat64m4_t __riscv_vfsub_vv_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat64m4_t vs2, vfloat64m4_t vs1,
                                        size_t vl);
vfloat64m4_t __riscv_vfsub_vf_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat64m4_t vs2, double rs1,
                                        size_t vl);
vfloat64m8_t __riscv_vfsub_vv_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat64m8_t vs2, vfloat64m8_t vs1,
                                        size_t vl);
vfloat64m8_t __riscv_vfsub_vf_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat64m8_t vs2, double rs1,
                                        size_t vl);
// vfrsub, `_tum` policy variants (masked).
// Every declaration takes a leading mask operand `vm` of type vboolN_t, where
// N equals the element width divided by LMUL in each declaration below
// (e.g. f16mf4 -> vbool64_t, f32m1 -> vbool32_t, f64m8 -> vbool8_t).
// Only the _vf_ form is declared: a vector `vs2` plus a scalar `rs1`
// (_Float16 / float / double), for f16 (mf4..m8), f32 (mf2..m8) and
// f64 (m1..m8).
// `vd` has the same vector type as the return value; `vl` is a size_t.
// NOTE(review): "rsub" presumably means reverse subtract (rs1 - vs2), and
// `_tum` presumably means "tail undisturbed, mask agnostic" - confirm both
// against the RVV specifications.
vfloat16mf4_t __riscv_vfrsub_vf_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                           vfloat16mf4_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat16mf2_t __riscv_vfrsub_vf_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                           vfloat16mf2_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat16m1_t __riscv_vfrsub_vf_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                         vfloat16m1_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m2_t __riscv_vfrsub_vf_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                         vfloat16m2_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m4_t __riscv_vfrsub_vf_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                         vfloat16m4_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m8_t __riscv_vfrsub_vf_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                         vfloat16m8_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat32mf2_t __riscv_vfrsub_vf_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs2, float rs1,
                                           size_t vl);
vfloat32m1_t __riscv_vfrsub_vf_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs2, float rs1,
                                         size_t vl);
vfloat32m2_t __riscv_vfrsub_vf_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs2, float rs1,
                                         size_t vl);
vfloat32m4_t __riscv_vfrsub_vf_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs2, float rs1,
                                         size_t vl);
vfloat32m8_t __riscv_vfrsub_vf_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs2, float rs1,
                                         size_t vl);
vfloat64m1_t __riscv_vfrsub_vf_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs2, double rs1,
                                         size_t vl);
vfloat64m2_t __riscv_vfrsub_vf_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs2, double rs1,
                                         size_t vl);
vfloat64m4_t __riscv_vfrsub_vf_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs2, double rs1,
                                         size_t vl);
vfloat64m8_t __riscv_vfrsub_vf_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs2, double rs1,
                                         size_t vl);
// vfneg, `_tum` policy variants (masked).
// Every declaration takes a leading mask operand `vm` of type vboolN_t, where
// N equals the element width divided by LMUL in each declaration below
// (e.g. f16mf4 -> vbool64_t, f32m1 -> vbool32_t, f64m8 -> vbool8_t).
// Unary _v_ form only: a single source vector `vs` (note: `vs`, not `vs2`),
// declared for f16 (mf4..m8), f32 (mf2..m8) and f64 (m1..m8).
// `vd` has the same vector type as the return value; `vl` is a size_t.
// NOTE(review): presumably element-wise floating-point negation of `vs`, with
// `_tum` meaning "tail undisturbed, mask agnostic" - confirm against the RVV
// specifications.
vfloat16mf4_t __riscv_vfneg_v_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                         vfloat16mf4_t vs, size_t vl);
vfloat16mf2_t __riscv_vfneg_v_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                         vfloat16mf2_t vs, size_t vl);
vfloat16m1_t __riscv_vfneg_v_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                       vfloat16m1_t vs, size_t vl);
vfloat16m2_t __riscv_vfneg_v_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                       vfloat16m2_t vs, size_t vl);
vfloat16m4_t __riscv_vfneg_v_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                       vfloat16m4_t vs, size_t vl);
vfloat16m8_t __riscv_vfneg_v_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                       vfloat16m8_t vs, size_t vl);
vfloat32mf2_t __riscv_vfneg_v_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                         vfloat32mf2_t vs, size_t vl);
vfloat32m1_t __riscv_vfneg_v_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                       vfloat32m1_t vs, size_t vl);
vfloat32m2_t __riscv_vfneg_v_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                       vfloat32m2_t vs, size_t vl);
vfloat32m4_t __riscv_vfneg_v_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                       vfloat32m4_t vs, size_t vl);
vfloat32m8_t __riscv_vfneg_v_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                       vfloat32m8_t vs, size_t vl);
vfloat64m1_t __riscv_vfneg_v_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                       vfloat64m1_t vs, size_t vl);
vfloat64m2_t __riscv_vfneg_v_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                       vfloat64m2_t vs, size_t vl);
vfloat64m4_t __riscv_vfneg_v_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                       vfloat64m4_t vs, size_t vl);
vfloat64m8_t __riscv_vfneg_v_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                       vfloat64m8_t vs, size_t vl);
// masked functions, _tumu policy (tail undisturbed, mask undisturbed)
// __riscv_vfadd_{vv,vf}_<type>_tumu: masked floating-point add.
//   vv form: (vm, vd, vs2, vs1, vl) - both addends are vectors.
//   vf form: (vm, vd, vs2, rs1, vl) - rs1 is a scalar of the element type
//            (_Float16 / float / double).
// The return type always equals the type of vd; vm is the vboolN_t whose N is
// the SEW/LMUL ratio of that type (e.g. vbool64_t for f16mf4, vbool2_t for
// f16m8). Per the RVV intrinsic naming scheme, _tumu = tail undisturbed, mask
// undisturbed, with vd supplying the preserved elements.
vfloat16mf4_t __riscv_vfadd_vv_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                           vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                           size_t vl);
vfloat16mf4_t __riscv_vfadd_vf_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                           vfloat16mf4_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat16mf2_t __riscv_vfadd_vv_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                           vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                           size_t vl);
vfloat16mf2_t __riscv_vfadd_vf_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                           vfloat16mf2_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat16m1_t __riscv_vfadd_vv_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                         vfloat16m1_t vs2, vfloat16m1_t vs1,
                                         size_t vl);
vfloat16m1_t __riscv_vfadd_vf_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                         vfloat16m1_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m2_t __riscv_vfadd_vv_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                         vfloat16m2_t vs2, vfloat16m2_t vs1,
                                         size_t vl);
vfloat16m2_t __riscv_vfadd_vf_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                         vfloat16m2_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m4_t __riscv_vfadd_vv_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                         vfloat16m4_t vs2, vfloat16m4_t vs1,
                                         size_t vl);
vfloat16m4_t __riscv_vfadd_vf_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                         vfloat16m4_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m8_t __riscv_vfadd_vv_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                         vfloat16m8_t vs2, vfloat16m8_t vs1,
                                         size_t vl);
vfloat16m8_t __riscv_vfadd_vf_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                         vfloat16m8_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat32mf2_t __riscv_vfadd_vv_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                           size_t vl);
vfloat32mf2_t __riscv_vfadd_vf_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs2, float rs1,
                                           size_t vl);
vfloat32m1_t __riscv_vfadd_vv_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs2, vfloat32m1_t vs1,
                                         size_t vl);
vfloat32m1_t __riscv_vfadd_vf_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs2, float rs1,
                                         size_t vl);
vfloat32m2_t __riscv_vfadd_vv_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs2, vfloat32m2_t vs1,
                                         size_t vl);
vfloat32m2_t __riscv_vfadd_vf_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs2, float rs1,
                                         size_t vl);
vfloat32m4_t __riscv_vfadd_vv_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs2, vfloat32m4_t vs1,
                                         size_t vl);
vfloat32m4_t __riscv_vfadd_vf_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs2, float rs1,
                                         size_t vl);
vfloat32m8_t __riscv_vfadd_vv_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs2, vfloat32m8_t vs1,
                                         size_t vl);
vfloat32m8_t __riscv_vfadd_vf_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs2, float rs1,
                                         size_t vl);
vfloat64m1_t __riscv_vfadd_vv_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs2, vfloat64m1_t vs1,
                                         size_t vl);
vfloat64m1_t __riscv_vfadd_vf_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs2, double rs1,
                                         size_t vl);
vfloat64m2_t __riscv_vfadd_vv_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs2, vfloat64m2_t vs1,
                                         size_t vl);
vfloat64m2_t __riscv_vfadd_vf_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs2, double rs1,
                                         size_t vl);
vfloat64m4_t __riscv_vfadd_vv_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs2, vfloat64m4_t vs1,
                                         size_t vl);
vfloat64m4_t __riscv_vfadd_vf_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs2, double rs1,
                                         size_t vl);
vfloat64m8_t __riscv_vfadd_vv_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs2, vfloat64m8_t vs1,
                                         size_t vl);
vfloat64m8_t __riscv_vfadd_vf_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs2, double rs1,
                                         size_t vl);
// __riscv_vfsub_{vv,vf}_<type>_tumu: masked floating-point subtract.
//   vv form: (vm, vd, vs2, vs1, vl) - vector minus vector.
//   vf form: (vm, vd, vs2, rs1, vl) - rs1 is a scalar of the element type
//            (_Float16 / float / double).
// Per the RVV specification vs2 is the minuend (vs2 - vs1, vs2 - rs1).
// The return type always equals the type of vd; vm is the vboolN_t whose N is
// the SEW/LMUL ratio of that type. Per the RVV intrinsic naming scheme,
// _tumu = tail undisturbed, mask undisturbed.
vfloat16mf4_t __riscv_vfsub_vv_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                           vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                           size_t vl);
vfloat16mf4_t __riscv_vfsub_vf_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                           vfloat16mf4_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat16mf2_t __riscv_vfsub_vv_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                           vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                           size_t vl);
vfloat16mf2_t __riscv_vfsub_vf_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                           vfloat16mf2_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat16m1_t __riscv_vfsub_vv_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                         vfloat16m1_t vs2, vfloat16m1_t vs1,
                                         size_t vl);
vfloat16m1_t __riscv_vfsub_vf_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                         vfloat16m1_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m2_t __riscv_vfsub_vv_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                         vfloat16m2_t vs2, vfloat16m2_t vs1,
                                         size_t vl);
vfloat16m2_t __riscv_vfsub_vf_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                         vfloat16m2_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m4_t __riscv_vfsub_vv_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                         vfloat16m4_t vs2, vfloat16m4_t vs1,
                                         size_t vl);
vfloat16m4_t __riscv_vfsub_vf_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                         vfloat16m4_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m8_t __riscv_vfsub_vv_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                         vfloat16m8_t vs2, vfloat16m8_t vs1,
                                         size_t vl);
vfloat16m8_t __riscv_vfsub_vf_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                         vfloat16m8_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat32mf2_t __riscv_vfsub_vv_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                           size_t vl);
vfloat32mf2_t __riscv_vfsub_vf_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs2, float rs1,
                                           size_t vl);
vfloat32m1_t __riscv_vfsub_vv_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs2, vfloat32m1_t vs1,
                                         size_t vl);
vfloat32m1_t __riscv_vfsub_vf_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs2, float rs1,
                                         size_t vl);
vfloat32m2_t __riscv_vfsub_vv_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs2, vfloat32m2_t vs1,
                                         size_t vl);
vfloat32m2_t __riscv_vfsub_vf_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs2, float rs1,
                                         size_t vl);
vfloat32m4_t __riscv_vfsub_vv_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs2, vfloat32m4_t vs1,
                                         size_t vl);
vfloat32m4_t __riscv_vfsub_vf_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs2, float rs1,
                                         size_t vl);
vfloat32m8_t __riscv_vfsub_vv_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs2, vfloat32m8_t vs1,
                                         size_t vl);
vfloat32m8_t __riscv_vfsub_vf_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs2, float rs1,
                                         size_t vl);
vfloat64m1_t __riscv_vfsub_vv_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs2, vfloat64m1_t vs1,
                                         size_t vl);
vfloat64m1_t __riscv_vfsub_vf_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs2, double rs1,
                                         size_t vl);
vfloat64m2_t __riscv_vfsub_vv_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs2, vfloat64m2_t vs1,
                                         size_t vl);
vfloat64m2_t __riscv_vfsub_vf_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs2, double rs1,
                                         size_t vl);
vfloat64m4_t __riscv_vfsub_vv_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs2, vfloat64m4_t vs1,
                                         size_t vl);
vfloat64m4_t __riscv_vfsub_vf_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs2, double rs1,
                                         size_t vl);
vfloat64m8_t __riscv_vfsub_vv_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs2, vfloat64m8_t vs1,
                                         size_t vl);
vfloat64m8_t __riscv_vfsub_vf_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs2, double rs1,
                                         size_t vl);
// __riscv_vfrsub_vf_<type>_tumu: masked floating-point reverse subtract.
// Only a vector-scalar (vf) form exists: (vm, vd, vs2, rs1, vl), where rs1 is
// a scalar of the element type (_Float16 / float / double). Per the RVV
// specification the scalar is the minuend (rs1 - vs2), the opposite operand
// order to vfsub.vf.
// The return type always equals the type of vd; vm is the vboolN_t whose N is
// the SEW/LMUL ratio of that type. Per the RVV intrinsic naming scheme,
// _tumu = tail undisturbed, mask undisturbed.
vfloat16mf4_t __riscv_vfrsub_vf_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                            vfloat16mf4_t vs2, _Float16 rs1,
                                            size_t vl);
vfloat16mf2_t __riscv_vfrsub_vf_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                            vfloat16mf2_t vs2, _Float16 rs1,
                                            size_t vl);
vfloat16m1_t __riscv_vfrsub_vf_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                          vfloat16m1_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16m2_t __riscv_vfrsub_vf_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                          vfloat16m2_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16m4_t __riscv_vfrsub_vf_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                          vfloat16m4_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16m8_t __riscv_vfrsub_vf_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                          vfloat16m8_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat32mf2_t __riscv_vfrsub_vf_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs2, float rs1,
                                            size_t vl);
vfloat32m1_t __riscv_vfrsub_vf_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs2, float rs1,
                                          size_t vl);
vfloat32m2_t __riscv_vfrsub_vf_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs2, float rs1,
                                          size_t vl);
vfloat32m4_t __riscv_vfrsub_vf_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs2, float rs1,
                                          size_t vl);
vfloat32m8_t __riscv_vfrsub_vf_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs2, float rs1,
                                          size_t vl);
vfloat64m1_t __riscv_vfrsub_vf_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs2, double rs1,
                                          size_t vl);
vfloat64m2_t __riscv_vfrsub_vf_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs2, double rs1,
                                          size_t vl);
vfloat64m4_t __riscv_vfrsub_vf_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs2, double rs1,
                                          size_t vl);
vfloat64m8_t __riscv_vfrsub_vf_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs2, double rs1,
                                          size_t vl);
// __riscv_vfneg_v_<type>_tumu: masked floating-point negate.
// Single-source form: (vm, vd, vs, vl); note the source operand is named vs,
// not vs2, in these prototypes.
// The return type always equals the type of vd; vm is the vboolN_t whose N is
// the SEW/LMUL ratio of that type. Per the RVV intrinsic naming scheme,
// _tumu = tail undisturbed, mask undisturbed.
vfloat16mf4_t __riscv_vfneg_v_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                          vfloat16mf4_t vs, size_t vl);
vfloat16mf2_t __riscv_vfneg_v_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                          vfloat16mf2_t vs, size_t vl);
vfloat16m1_t __riscv_vfneg_v_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                        vfloat16m1_t vs, size_t vl);
vfloat16m2_t __riscv_vfneg_v_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                        vfloat16m2_t vs, size_t vl);
vfloat16m4_t __riscv_vfneg_v_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                        vfloat16m4_t vs, size_t vl);
vfloat16m8_t __riscv_vfneg_v_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                        vfloat16m8_t vs, size_t vl);
vfloat32mf2_t __riscv_vfneg_v_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat32mf2_t vs, size_t vl);
vfloat32m1_t __riscv_vfneg_v_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat32m1_t vs, size_t vl);
vfloat32m2_t __riscv_vfneg_v_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat32m2_t vs, size_t vl);
vfloat32m4_t __riscv_vfneg_v_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat32m4_t vs, size_t vl);
vfloat32m8_t __riscv_vfneg_v_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat32m8_t vs, size_t vl);
vfloat64m1_t __riscv_vfneg_v_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat64m1_t vs, size_t vl);
vfloat64m2_t __riscv_vfneg_v_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat64m2_t vs, size_t vl);
vfloat64m4_t __riscv_vfneg_v_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat64m4_t vs, size_t vl);
vfloat64m8_t __riscv_vfneg_v_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat64m8_t vs, size_t vl);
// masked functions, _mu policy (tail agnostic, mask undisturbed)
// __riscv_vfadd_{vv,vf}_<type>_mu: masked floating-point add.
//   vv form: (vm, vd, vs2, vs1, vl) - both addends are vectors.
//   vf form: (vm, vd, vs2, rs1, vl) - rs1 is a scalar of the element type
//            (_Float16 / float / double).
// The return type always equals the type of vd; vm is the vboolN_t whose N is
// the SEW/LMUL ratio of that type (e.g. vbool64_t for f16mf4, vbool2_t for
// f16m8). Per the RVV intrinsic naming scheme, _mu = tail agnostic, mask
// undisturbed, with vd supplying the masked-off elements.
vfloat16mf4_t __riscv_vfadd_vv_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                         vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                         size_t vl);
vfloat16mf4_t __riscv_vfadd_vf_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                         vfloat16mf4_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16mf2_t __riscv_vfadd_vv_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                         vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                         size_t vl);
vfloat16mf2_t __riscv_vfadd_vf_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                         vfloat16mf2_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m1_t __riscv_vfadd_vv_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                       vfloat16m1_t vs2, vfloat16m1_t vs1,
                                       size_t vl);
vfloat16m1_t __riscv_vfadd_vf_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                       vfloat16m1_t vs2, _Float16 rs1,
                                       size_t vl);
vfloat16m2_t __riscv_vfadd_vv_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                       vfloat16m2_t vs2, vfloat16m2_t vs1,
                                       size_t vl);
vfloat16m2_t __riscv_vfadd_vf_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                       vfloat16m2_t vs2, _Float16 rs1,
                                       size_t vl);
vfloat16m4_t __riscv_vfadd_vv_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                       vfloat16m4_t vs2, vfloat16m4_t vs1,
                                       size_t vl);
vfloat16m4_t __riscv_vfadd_vf_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                       vfloat16m4_t vs2, _Float16 rs1,
                                       size_t vl);
vfloat16m8_t __riscv_vfadd_vv_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                       vfloat16m8_t vs2, vfloat16m8_t vs1,
                                       size_t vl);
vfloat16m8_t __riscv_vfadd_vf_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                       vfloat16m8_t vs2, _Float16 rs1,
                                       size_t vl);
vfloat32mf2_t __riscv_vfadd_vv_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                         vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                         size_t vl);
vfloat32mf2_t __riscv_vfadd_vf_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                         vfloat32mf2_t vs2, float rs1,
                                         size_t vl);
vfloat32m1_t __riscv_vfadd_vv_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                       vfloat32m1_t vs2, vfloat32m1_t vs1,
                                       size_t vl);
vfloat32m1_t __riscv_vfadd_vf_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                       vfloat32m1_t vs2, float rs1, size_t vl);
vfloat32m2_t __riscv_vfadd_vv_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                       vfloat32m2_t vs2, vfloat32m2_t vs1,
                                       size_t vl);
vfloat32m2_t __riscv_vfadd_vf_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                       vfloat32m2_t vs2, float rs1, size_t vl);
vfloat32m4_t __riscv_vfadd_vv_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                       vfloat32m4_t vs2, vfloat32m4_t vs1,
                                       size_t vl);
vfloat32m4_t __riscv_vfadd_vf_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                       vfloat32m4_t vs2, float rs1, size_t vl);
vfloat32m8_t __riscv_vfadd_vv_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                       vfloat32m8_t vs2, vfloat32m8_t vs1,
                                       size_t vl);
vfloat32m8_t __riscv_vfadd_vf_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                       vfloat32m8_t vs2, float rs1, size_t vl);
vfloat64m1_t __riscv_vfadd_vv_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                       vfloat64m1_t vs2, vfloat64m1_t vs1,
                                       size_t vl);
vfloat64m1_t __riscv_vfadd_vf_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                       vfloat64m1_t vs2, double rs1, size_t vl);
vfloat64m2_t __riscv_vfadd_vv_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                       vfloat64m2_t vs2, vfloat64m2_t vs1,
                                       size_t vl);
vfloat64m2_t __riscv_vfadd_vf_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                       vfloat64m2_t vs2, double rs1, size_t vl);
vfloat64m4_t __riscv_vfadd_vv_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                       vfloat64m4_t vs2, vfloat64m4_t vs1,
                                       size_t vl);
vfloat64m4_t __riscv_vfadd_vf_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                       vfloat64m4_t vs2, double rs1, size_t vl);
vfloat64m8_t __riscv_vfadd_vv_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                       vfloat64m8_t vs2, vfloat64m8_t vs1,
                                       size_t vl);
vfloat64m8_t __riscv_vfadd_vf_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                       vfloat64m8_t vs2, double rs1, size_t vl);
// __riscv_vfsub_{vv,vf}_<type>_mu: masked floating-point subtract.
//   vv form: (vm, vd, vs2, vs1, vl) - vector minus vector.
//   vf form: (vm, vd, vs2, rs1, vl) - rs1 is a scalar of the element type
//            (_Float16 / float / double).
// Per the RVV specification vs2 is the minuend (vs2 - vs1, vs2 - rs1).
// The return type always equals the type of vd; vm is the vboolN_t whose N is
// the SEW/LMUL ratio of that type. Per the RVV intrinsic naming scheme,
// _mu = tail agnostic, mask undisturbed.
vfloat16mf4_t __riscv_vfsub_vv_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                         vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                         size_t vl);
vfloat16mf4_t __riscv_vfsub_vf_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                         vfloat16mf4_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16mf2_t __riscv_vfsub_vv_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                         vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                         size_t vl);
vfloat16mf2_t __riscv_vfsub_vf_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                         vfloat16mf2_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m1_t __riscv_vfsub_vv_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                       vfloat16m1_t vs2, vfloat16m1_t vs1,
                                       size_t vl);
vfloat16m1_t __riscv_vfsub_vf_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                       vfloat16m1_t vs2, _Float16 rs1,
                                       size_t vl);
vfloat16m2_t __riscv_vfsub_vv_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                       vfloat16m2_t vs2, vfloat16m2_t vs1,
                                       size_t vl);
vfloat16m2_t __riscv_vfsub_vf_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                       vfloat16m2_t vs2, _Float16 rs1,
                                       size_t vl);
vfloat16m4_t __riscv_vfsub_vv_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                       vfloat16m4_t vs2, vfloat16m4_t vs1,
                                       size_t vl);
vfloat16m4_t __riscv_vfsub_vf_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                       vfloat16m4_t vs2, _Float16 rs1,
                                       size_t vl);
vfloat16m8_t __riscv_vfsub_vv_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                       vfloat16m8_t vs2, vfloat16m8_t vs1,
                                       size_t vl);
vfloat16m8_t __riscv_vfsub_vf_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                       vfloat16m8_t vs2, _Float16 rs1,
                                       size_t vl);
vfloat32mf2_t __riscv_vfsub_vv_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                         vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                         size_t vl);
vfloat32mf2_t __riscv_vfsub_vf_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                         vfloat32mf2_t vs2, float rs1,
                                         size_t vl);
vfloat32m1_t __riscv_vfsub_vv_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                       vfloat32m1_t vs2, vfloat32m1_t vs1,
                                       size_t vl);
vfloat32m1_t __riscv_vfsub_vf_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                       vfloat32m1_t vs2, float rs1, size_t vl);
vfloat32m2_t __riscv_vfsub_vv_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                       vfloat32m2_t vs2, vfloat32m2_t vs1,
                                       size_t vl);
vfloat32m2_t __riscv_vfsub_vf_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                       vfloat32m2_t vs2, float rs1, size_t vl);
vfloat32m4_t __riscv_vfsub_vv_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                       vfloat32m4_t vs2, vfloat32m4_t vs1,
                                       size_t vl);
vfloat32m4_t __riscv_vfsub_vf_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                       vfloat32m4_t vs2, float rs1, size_t vl);
vfloat32m8_t __riscv_vfsub_vv_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                       vfloat32m8_t vs2, vfloat32m8_t vs1,
                                       size_t vl);
vfloat32m8_t __riscv_vfsub_vf_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                       vfloat32m8_t vs2, float rs1, size_t vl);
vfloat64m1_t __riscv_vfsub_vv_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                       vfloat64m1_t vs2, vfloat64m1_t vs1,
                                       size_t vl);
vfloat64m1_t __riscv_vfsub_vf_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                       vfloat64m1_t vs2, double rs1, size_t vl);
vfloat64m2_t __riscv_vfsub_vv_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                       vfloat64m2_t vs2, vfloat64m2_t vs1,
                                       size_t vl);
vfloat64m2_t __riscv_vfsub_vf_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                       vfloat64m2_t vs2, double rs1, size_t vl);
vfloat64m4_t __riscv_vfsub_vv_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                       vfloat64m4_t vs2, vfloat64m4_t vs1,
                                       size_t vl);
vfloat64m4_t __riscv_vfsub_vf_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                       vfloat64m4_t vs2, double rs1, size_t vl);
vfloat64m8_t __riscv_vfsub_vv_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                       vfloat64m8_t vs2, vfloat64m8_t vs1,
                                       size_t vl);
vfloat64m8_t __riscv_vfsub_vf_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                       vfloat64m8_t vs2, double rs1, size_t vl);
// __riscv_vfrsub_vf_<type>_mu: masked floating-point reverse subtract.
// Only a vector-scalar (vf) form exists: (vm, vd, vs2, rs1, vl), where rs1 is
// a scalar of the element type (_Float16 / float / double). Per the RVV
// specification the scalar is the minuend (rs1 - vs2), the opposite operand
// order to vfsub.vf.
// The return type always equals the type of vd; vm is the vboolN_t whose N is
// the SEW/LMUL ratio of that type. Per the RVV intrinsic naming scheme,
// _mu = tail agnostic, mask undisturbed.
vfloat16mf4_t __riscv_vfrsub_vf_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                          vfloat16mf4_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16mf2_t __riscv_vfrsub_vf_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                          vfloat16mf2_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16m1_t __riscv_vfrsub_vf_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                        vfloat16m1_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat16m2_t __riscv_vfrsub_vf_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                        vfloat16m2_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat16m4_t __riscv_vfrsub_vf_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                        vfloat16m4_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat16m8_t __riscv_vfrsub_vf_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                        vfloat16m8_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat32mf2_t __riscv_vfrsub_vf_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat32mf2_t vs2, float rs1,
                                          size_t vl);
vfloat32m1_t __riscv_vfrsub_vf_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat32m1_t vs2, float rs1, size_t vl);
vfloat32m2_t __riscv_vfrsub_vf_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat32m2_t vs2, float rs1, size_t vl);
vfloat32m4_t __riscv_vfrsub_vf_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat32m4_t vs2, float rs1, size_t vl);
vfloat32m8_t __riscv_vfrsub_vf_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat32m8_t vs2, float rs1, size_t vl);
vfloat64m1_t __riscv_vfrsub_vf_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat64m1_t vs2, double rs1,
                                        size_t vl);
vfloat64m2_t __riscv_vfrsub_vf_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat64m2_t vs2, double rs1,
                                        size_t vl);
vfloat64m4_t __riscv_vfrsub_vf_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat64m4_t vs2, double rs1,
                                        size_t vl);
vfloat64m8_t __riscv_vfrsub_vf_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat64m8_t vs2, double rs1,
                                        size_t vl);
// __riscv_vfneg_v_<type>_mu: masked floating-point negate.
// Single-source form: (vm, vd, vs, vl); note the source operand is named vs,
// not vs2, in these prototypes.
// The return type always equals the type of vd; vm is the vboolN_t whose N is
// the SEW/LMUL ratio of that type. Per the RVV intrinsic naming scheme,
// _mu = tail agnostic, mask undisturbed.
vfloat16mf4_t __riscv_vfneg_v_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                        vfloat16mf4_t vs, size_t vl);
vfloat16mf2_t __riscv_vfneg_v_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                        vfloat16mf2_t vs, size_t vl);
vfloat16m1_t __riscv_vfneg_v_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                      vfloat16m1_t vs, size_t vl);
vfloat16m2_t __riscv_vfneg_v_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                      vfloat16m2_t vs, size_t vl);
vfloat16m4_t __riscv_vfneg_v_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                      vfloat16m4_t vs, size_t vl);
vfloat16m8_t __riscv_vfneg_v_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                      vfloat16m8_t vs, size_t vl);
vfloat32mf2_t __riscv_vfneg_v_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                        vfloat32mf2_t vs, size_t vl);
vfloat32m1_t __riscv_vfneg_v_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                      vfloat32m1_t vs, size_t vl);
vfloat32m2_t __riscv_vfneg_v_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                      vfloat32m2_t vs, size_t vl);
vfloat32m4_t __riscv_vfneg_v_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                      vfloat32m4_t vs, size_t vl);
vfloat32m8_t __riscv_vfneg_v_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                      vfloat32m8_t vs, size_t vl);
vfloat64m1_t __riscv_vfneg_v_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                      vfloat64m1_t vs, size_t vl);
vfloat64m2_t __riscv_vfneg_v_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                      vfloat64m2_t vs, size_t vl);
vfloat64m4_t __riscv_vfneg_v_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                      vfloat64m4_t vs, size_t vl);
vfloat64m8_t __riscv_vfneg_v_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                      vfloat64m8_t vs, size_t vl);
// __riscv_vfadd_{vv,vf}_<type>_rm_tu prototypes (no mask parameter).
// `_vv` takes a second vector `vs1`; `_vf` takes a scalar `rs1` whose C
// type matches the element width (_Float16 / float / double).
// Compared with the plain `_tu` prototypes at the top of this listing,
// the `_rm` forms add an `unsigned int frm` argument just before `vl`.
// NOTE(review): `frm` is presumably the floating-point rounding mode and
// `_tu` the tail-undisturbed policy with `vd` as the value kept in tail
// elements -- confirm against the RVV intrinsics spec.
vfloat16mf4_t __riscv_vfadd_vv_f16mf4_rm_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                            vfloat16mf4_t vs1, unsigned int frm,
                                            size_t vl);
vfloat16mf4_t __riscv_vfadd_vf_f16mf4_rm_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                            _Float16 rs1, unsigned int frm,
                                            size_t vl);
vfloat16mf2_t __riscv_vfadd_vv_f16mf2_rm_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                            vfloat16mf2_t vs1, unsigned int frm,
                                            size_t vl);
vfloat16mf2_t __riscv_vfadd_vf_f16mf2_rm_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                            _Float16 rs1, unsigned int frm,
                                            size_t vl);
vfloat16m1_t __riscv_vfadd_vv_f16m1_rm_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                          vfloat16m1_t vs1, unsigned int frm,
                                          size_t vl);
vfloat16m1_t __riscv_vfadd_vf_f16m1_rm_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                          _Float16 rs1, unsigned int frm,
                                          size_t vl);
vfloat16m2_t __riscv_vfadd_vv_f16m2_rm_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                          vfloat16m2_t vs1, unsigned int frm,
                                          size_t vl);
vfloat16m2_t __riscv_vfadd_vf_f16m2_rm_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                          _Float16 rs1, unsigned int frm,
                                          size_t vl);
vfloat16m4_t __riscv_vfadd_vv_f16m4_rm_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                          vfloat16m4_t vs1, unsigned int frm,
                                          size_t vl);
vfloat16m4_t __riscv_vfadd_vf_f16m4_rm_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                          _Float16 rs1, unsigned int frm,
                                          size_t vl);
vfloat16m8_t __riscv_vfadd_vv_f16m8_rm_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                          vfloat16m8_t vs1, unsigned int frm,
                                          size_t vl);
vfloat16m8_t __riscv_vfadd_vf_f16m8_rm_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                          _Float16 rs1, unsigned int frm,
                                          size_t vl);
vfloat32mf2_t __riscv_vfadd_vv_f32mf2_rm_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                            vfloat32mf2_t vs1, unsigned int frm,
                                            size_t vl);
vfloat32mf2_t __riscv_vfadd_vf_f32mf2_rm_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                            float rs1, unsigned int frm,
                                            size_t vl);
vfloat32m1_t __riscv_vfadd_vv_f32m1_rm_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                          vfloat32m1_t vs1, unsigned int frm,
                                          size_t vl);
vfloat32m1_t __riscv_vfadd_vf_f32m1_rm_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                          float rs1, unsigned int frm,
                                          size_t vl);
vfloat32m2_t __riscv_vfadd_vv_f32m2_rm_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                          vfloat32m2_t vs1, unsigned int frm,
                                          size_t vl);
vfloat32m2_t __riscv_vfadd_vf_f32m2_rm_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                          float rs1, unsigned int frm,
                                          size_t vl);
vfloat32m4_t __riscv_vfadd_vv_f32m4_rm_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                          vfloat32m4_t vs1, unsigned int frm,
                                          size_t vl);
vfloat32m4_t __riscv_vfadd_vf_f32m4_rm_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                          float rs1, unsigned int frm,
                                          size_t vl);
vfloat32m8_t __riscv_vfadd_vv_f32m8_rm_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                          vfloat32m8_t vs1, unsigned int frm,
                                          size_t vl);
vfloat32m8_t __riscv_vfadd_vf_f32m8_rm_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                          float rs1, unsigned int frm,
                                          size_t vl);
vfloat64m1_t __riscv_vfadd_vv_f64m1_rm_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                          vfloat64m1_t vs1, unsigned int frm,
                                          size_t vl);
vfloat64m1_t __riscv_vfadd_vf_f64m1_rm_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                          double rs1, unsigned int frm,
                                          size_t vl);
vfloat64m2_t __riscv_vfadd_vv_f64m2_rm_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                          vfloat64m2_t vs1, unsigned int frm,
                                          size_t vl);
vfloat64m2_t __riscv_vfadd_vf_f64m2_rm_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                          double rs1, unsigned int frm,
                                          size_t vl);
vfloat64m4_t __riscv_vfadd_vv_f64m4_rm_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                          vfloat64m4_t vs1, unsigned int frm,
                                          size_t vl);
vfloat64m4_t __riscv_vfadd_vf_f64m4_rm_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                          double rs1, unsigned int frm,
                                          size_t vl);
vfloat64m8_t __riscv_vfadd_vv_f64m8_rm_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                          vfloat64m8_t vs1, unsigned int frm,
                                          size_t vl);
vfloat64m8_t __riscv_vfadd_vf_f64m8_rm_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                          double rs1, unsigned int frm,
                                          size_t vl);
// __riscv_vfsub_{vv,vf}_<type>_rm_tu prototypes (no mask parameter).
// Same parameter layout for every type: `vd`, `vs2`, then either a vector
// `vs1` (`_vv`) or a scalar `rs1` (`_vf`, typed _Float16 / float / double
// to match the element width), then `unsigned int frm` and `vl`.
// NOTE(review): presumably computes vs2 - vs1 (or vs2 - rs1) under the
// rounding mode given by `frm`, with the tail-undisturbed policy --
// confirm against the RVV intrinsics spec.
vfloat16mf4_t __riscv_vfsub_vv_f16mf4_rm_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                            vfloat16mf4_t vs1, unsigned int frm,
                                            size_t vl);
vfloat16mf4_t __riscv_vfsub_vf_f16mf4_rm_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                            _Float16 rs1, unsigned int frm,
                                            size_t vl);
vfloat16mf2_t __riscv_vfsub_vv_f16mf2_rm_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                            vfloat16mf2_t vs1, unsigned int frm,
                                            size_t vl);
vfloat16mf2_t __riscv_vfsub_vf_f16mf2_rm_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                            _Float16 rs1, unsigned int frm,
                                            size_t vl);
vfloat16m1_t __riscv_vfsub_vv_f16m1_rm_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                          vfloat16m1_t vs1, unsigned int frm,
                                          size_t vl);
vfloat16m1_t __riscv_vfsub_vf_f16m1_rm_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                          _Float16 rs1, unsigned int frm,
                                          size_t vl);
vfloat16m2_t __riscv_vfsub_vv_f16m2_rm_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                          vfloat16m2_t vs1, unsigned int frm,
                                          size_t vl);
vfloat16m2_t __riscv_vfsub_vf_f16m2_rm_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                          _Float16 rs1, unsigned int frm,
                                          size_t vl);
vfloat16m4_t __riscv_vfsub_vv_f16m4_rm_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                          vfloat16m4_t vs1, unsigned int frm,
                                          size_t vl);
vfloat16m4_t __riscv_vfsub_vf_f16m4_rm_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                          _Float16 rs1, unsigned int frm,
                                          size_t vl);
vfloat16m8_t __riscv_vfsub_vv_f16m8_rm_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                          vfloat16m8_t vs1, unsigned int frm,
                                          size_t vl);
vfloat16m8_t __riscv_vfsub_vf_f16m8_rm_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                          _Float16 rs1, unsigned int frm,
                                          size_t vl);
vfloat32mf2_t __riscv_vfsub_vv_f32mf2_rm_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                            vfloat32mf2_t vs1, unsigned int frm,
                                            size_t vl);
vfloat32mf2_t __riscv_vfsub_vf_f32mf2_rm_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                            float rs1, unsigned int frm,
                                            size_t vl);
vfloat32m1_t __riscv_vfsub_vv_f32m1_rm_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                          vfloat32m1_t vs1, unsigned int frm,
                                          size_t vl);
vfloat32m1_t __riscv_vfsub_vf_f32m1_rm_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                          float rs1, unsigned int frm,
                                          size_t vl);
vfloat32m2_t __riscv_vfsub_vv_f32m2_rm_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                          vfloat32m2_t vs1, unsigned int frm,
                                          size_t vl);
vfloat32m2_t __riscv_vfsub_vf_f32m2_rm_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                          float rs1, unsigned int frm,
                                          size_t vl);
vfloat32m4_t __riscv_vfsub_vv_f32m4_rm_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                          vfloat32m4_t vs1, unsigned int frm,
                                          size_t vl);
vfloat32m4_t __riscv_vfsub_vf_f32m4_rm_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                          float rs1, unsigned int frm,
                                          size_t vl);
vfloat32m8_t __riscv_vfsub_vv_f32m8_rm_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                          vfloat32m8_t vs1, unsigned int frm,
                                          size_t vl);
vfloat32m8_t __riscv_vfsub_vf_f32m8_rm_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                          float rs1, unsigned int frm,
                                          size_t vl);
vfloat64m1_t __riscv_vfsub_vv_f64m1_rm_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                          vfloat64m1_t vs1, unsigned int frm,
                                          size_t vl);
vfloat64m1_t __riscv_vfsub_vf_f64m1_rm_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                          double rs1, unsigned int frm,
                                          size_t vl);
vfloat64m2_t __riscv_vfsub_vv_f64m2_rm_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                          vfloat64m2_t vs1, unsigned int frm,
                                          size_t vl);
vfloat64m2_t __riscv_vfsub_vf_f64m2_rm_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                          double rs1, unsigned int frm,
                                          size_t vl);
vfloat64m4_t __riscv_vfsub_vv_f64m4_rm_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                          vfloat64m4_t vs1, unsigned int frm,
                                          size_t vl);
vfloat64m4_t __riscv_vfsub_vf_f64m4_rm_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                          double rs1, unsigned int frm,
                                          size_t vl);
vfloat64m8_t __riscv_vfsub_vv_f64m8_rm_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                          vfloat64m8_t vs1, unsigned int frm,
                                          size_t vl);
vfloat64m8_t __riscv_vfsub_vf_f64m8_rm_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                          double rs1, unsigned int frm,
                                          size_t vl);
// __riscv_vfrsub_vf_<type>_rm_tu prototypes (no mask parameter).
// Only a vector-scalar (`_vf`) form is listed: `vd`, `vs2`, a scalar `rs1`
// typed _Float16 / float / double to match the element width, then
// `unsigned int frm` and `vl`.
// NOTE(review): `vfrsub` is presumably the reversed subtract
// (rs1 - vs2[i]) under the rounding mode given by `frm`, with the
// tail-undisturbed policy -- confirm against the RVV intrinsics spec.
vfloat16mf4_t __riscv_vfrsub_vf_f16mf4_rm_tu(vfloat16mf4_t vd,
                                             vfloat16mf4_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfrsub_vf_f16mf2_rm_tu(vfloat16mf2_t vd,
                                             vfloat16mf2_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfrsub_vf_f16m1_rm_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                           _Float16 rs1, unsigned int frm,
                                           size_t vl);
vfloat16m2_t __riscv_vfrsub_vf_f16m2_rm_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                           _Float16 rs1, unsigned int frm,
                                           size_t vl);
vfloat16m4_t __riscv_vfrsub_vf_f16m4_rm_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                           _Float16 rs1, unsigned int frm,
                                           size_t vl);
vfloat16m8_t __riscv_vfrsub_vf_f16m8_rm_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                           _Float16 rs1, unsigned int frm,
                                           size_t vl);
vfloat32mf2_t __riscv_vfrsub_vf_f32mf2_rm_tu(vfloat32mf2_t vd,
                                             vfloat32mf2_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfrsub_vf_f32m1_rm_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                           float rs1, unsigned int frm,
                                           size_t vl);
vfloat32m2_t __riscv_vfrsub_vf_f32m2_rm_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                           float rs1, unsigned int frm,
                                           size_t vl);
vfloat32m4_t __riscv_vfrsub_vf_f32m4_rm_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                           float rs1, unsigned int frm,
                                           size_t vl);
vfloat32m8_t __riscv_vfrsub_vf_f32m8_rm_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                           float rs1, unsigned int frm,
                                           size_t vl);
vfloat64m1_t __riscv_vfrsub_vf_f64m1_rm_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                           double rs1, unsigned int frm,
                                           size_t vl);
vfloat64m2_t __riscv_vfrsub_vf_f64m2_rm_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                           double rs1, unsigned int frm,
                                           size_t vl);
vfloat64m4_t __riscv_vfrsub_vf_f64m4_rm_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                           double rs1, unsigned int frm,
                                           size_t vl);
vfloat64m8_t __riscv_vfrsub_vf_f64m8_rm_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                           double rs1, unsigned int frm,
                                           size_t vl);
// masked functions (_rm_tum variants)
// __riscv_vfadd_{vv,vf}_<type>_rm_tum prototypes.
// Masked forms: the first parameter is a mask `vm` of type
// vbool<SEW/LMUL>_t (e.g. f16mf4 -> vbool64_t, f64m8 -> vbool8_t),
// followed by `vd`, `vs2`, either a vector `vs1` (`_vv`) or a scalar
// `rs1` (`_vf`), then `unsigned int frm` and `vl`.
// NOTE(review): `_tum` is presumably the tail-undisturbed, mask-agnostic
// policy and `frm` the floating-point rounding mode -- confirm against
// the RVV intrinsics spec.
vfloat16mf4_t __riscv_vfadd_vv_f16mf4_rm_tum(vbool64_t vm, vfloat16mf4_t vd,
                                             vfloat16mf4_t vs2,
                                             vfloat16mf4_t vs1,
                                             unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfadd_vf_f16mf4_rm_tum(vbool64_t vm, vfloat16mf4_t vd,
                                             vfloat16mf4_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfadd_vv_f16mf2_rm_tum(vbool32_t vm, vfloat16mf2_t vd,
                                             vfloat16mf2_t vs2,
                                             vfloat16mf2_t vs1,
                                             unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfadd_vf_f16mf2_rm_tum(vbool32_t vm, vfloat16mf2_t vd,
                                             vfloat16mf2_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfadd_vv_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                           vfloat16m1_t vs2, vfloat16m1_t vs1,
                                           unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfadd_vf_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                           vfloat16m1_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfadd_vv_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                           vfloat16m2_t vs2, vfloat16m2_t vs1,
                                           unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfadd_vf_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                           vfloat16m2_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfadd_vv_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                           vfloat16m4_t vs2, vfloat16m4_t vs1,
                                           unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfadd_vf_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                           vfloat16m4_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfadd_vv_f16m8_rm_tum(vbool2_t vm, vfloat16m8_t vd,
                                           vfloat16m8_t vs2, vfloat16m8_t vs1,
                                           unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfadd_vf_f16m8_rm_tum(vbool2_t vm, vfloat16m8_t vd,
                                           vfloat16m8_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfadd_vv_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat32mf2_t vs2,
                                             vfloat32mf2_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfadd_vf_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat32mf2_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfadd_vv_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat32m1_t vs2, vfloat32m1_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfadd_vf_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat32m1_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfadd_vv_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat32m2_t vs2, vfloat32m2_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfadd_vf_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat32m2_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfadd_vv_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat32m4_t vs2, vfloat32m4_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfadd_vf_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat32m4_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfadd_vv_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat32m8_t vs2, vfloat32m8_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfadd_vf_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat32m8_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfadd_vv_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat64m1_t vs2, vfloat64m1_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfadd_vf_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat64m1_t vs2, double rs1,
                                           unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfadd_vv_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat64m2_t vs2, vfloat64m2_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfadd_vf_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat64m2_t vs2, double rs1,
                                           unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfadd_vv_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat64m4_t vs2, vfloat64m4_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfadd_vf_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat64m4_t vs2, double rs1,
                                           unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfadd_vv_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat64m8_t vs2, vfloat64m8_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfadd_vf_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat64m8_t vs2, double rs1,
                                           unsigned int frm, size_t vl);
// __riscv_vfsub_{vv,vf}_<type>_rm_tum prototypes.
// Masked forms: mask `vm` (vbool<SEW/LMUL>_t) first, then `vd`, `vs2`,
// either a vector `vs1` (`_vv`) or a scalar `rs1` (`_vf`, typed
// _Float16 / float / double to match the element width), then
// `unsigned int frm` and `vl`.
// NOTE(review): presumably computes vs2 - vs1 (or vs2 - rs1) with the
// tail-undisturbed, mask-agnostic policy and rounding mode `frm` --
// confirm against the RVV intrinsics spec.
vfloat16mf4_t __riscv_vfsub_vv_f16mf4_rm_tum(vbool64_t vm, vfloat16mf4_t vd,
                                             vfloat16mf4_t vs2,
                                             vfloat16mf4_t vs1,
                                             unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfsub_vf_f16mf4_rm_tum(vbool64_t vm, vfloat16mf4_t vd,
                                             vfloat16mf4_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfsub_vv_f16mf2_rm_tum(vbool32_t vm, vfloat16mf2_t vd,
                                             vfloat16mf2_t vs2,
                                             vfloat16mf2_t vs1,
                                             unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfsub_vf_f16mf2_rm_tum(vbool32_t vm, vfloat16mf2_t vd,
                                             vfloat16mf2_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfsub_vv_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                           vfloat16m1_t vs2, vfloat16m1_t vs1,
                                           unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfsub_vf_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                           vfloat16m1_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfsub_vv_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                           vfloat16m2_t vs2, vfloat16m2_t vs1,
                                           unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfsub_vf_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                           vfloat16m2_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfsub_vv_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                           vfloat16m4_t vs2, vfloat16m4_t vs1,
                                           unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfsub_vf_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                           vfloat16m4_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfsub_vv_f16m8_rm_tum(vbool2_t vm, vfloat16m8_t vd,
                                           vfloat16m8_t vs2, vfloat16m8_t vs1,
                                           unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfsub_vf_f16m8_rm_tum(vbool2_t vm, vfloat16m8_t vd,
                                           vfloat16m8_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfsub_vv_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat32mf2_t vs2,
                                             vfloat32mf2_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfsub_vf_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat32mf2_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfsub_vv_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat32m1_t vs2, vfloat32m1_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfsub_vf_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat32m1_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfsub_vv_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat32m2_t vs2, vfloat32m2_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfsub_vf_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat32m2_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfsub_vv_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat32m4_t vs2, vfloat32m4_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfsub_vf_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat32m4_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfsub_vv_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat32m8_t vs2, vfloat32m8_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfsub_vf_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat32m8_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfsub_vv_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat64m1_t vs2, vfloat64m1_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfsub_vf_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat64m1_t vs2, double rs1,
                                           unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfsub_vv_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat64m2_t vs2, vfloat64m2_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfsub_vf_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat64m2_t vs2, double rs1,
                                           unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfsub_vv_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat64m4_t vs2, vfloat64m4_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfsub_vf_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat64m4_t vs2, double rs1,
                                           unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfsub_vv_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat64m8_t vs2, vfloat64m8_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfsub_vf_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat64m8_t vs2, double rs1,
                                           unsigned int frm, size_t vl);
// __riscv_vfrsub_vf_<type>_rm_tum prototypes.
// Masked, vector-scalar only: mask `vm` (vbool<SEW/LMUL>_t), `vd`, `vs2`,
// a scalar `rs1` typed _Float16 / float / double to match the element
// width, then `unsigned int frm` and `vl`.
// NOTE(review): `vfrsub` is presumably the reversed subtract
// (rs1 - vs2[i]) with the tail-undisturbed, mask-agnostic policy and
// rounding mode `frm` -- confirm against the RVV intrinsics spec.
vfloat16mf4_t __riscv_vfrsub_vf_f16mf4_rm_tum(vbool64_t vm, vfloat16mf4_t vd,
                                              vfloat16mf4_t vs2, _Float16 rs1,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfrsub_vf_f16mf2_rm_tum(vbool32_t vm, vfloat16mf2_t vd,
                                              vfloat16mf2_t vs2, _Float16 rs1,
                                              unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfrsub_vf_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                            vfloat16m1_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfrsub_vf_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                            vfloat16m2_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfrsub_vf_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                            vfloat16m4_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfrsub_vf_f16m8_rm_tum(vbool2_t vm, vfloat16m8_t vd,
                                            vfloat16m8_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfrsub_vf_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat32mf2_t vs2, float rs1,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfrsub_vf_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat32m1_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfrsub_vf_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat32m2_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfrsub_vf_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat32m4_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfrsub_vf_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat32m8_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfrsub_vf_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat64m1_t vs2, double rs1,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfrsub_vf_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat64m2_t vs2, double rs1,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfrsub_vf_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat64m4_t vs2, double rs1,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfrsub_vf_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat64m8_t vs2, double rs1,
                                            unsigned int frm, size_t vl);
// masked functions (_rm_tumu variants)
// vfadd, `_rm_tumu` prototypes (single-width floating-point add).
//   _vv: the second source is a vector `vs1` of the same type as `vs2`.
//   _vf: the second source is a scalar `rs1` (_Float16 / float / double,
//        matching the f16 / f32 / f64 element type).
// Every prototype takes a mask `vm`, a `vd` operand of the return type, an
// `unsigned int frm`, and `size_t vl`.
// NOTE(review): by the RVV intrinsics naming scheme `_rm` should mark the
// explicit rounding-mode (`frm`) variant and `_tumu` the tail-undisturbed,
// mask-undisturbed policy with `vd` supplying the preserved elements.
// Confirm against the intrinsics spec.
//
// f16 element types (scalar operand: _Float16)
vfloat16mf4_t __riscv_vfadd_vv_f16mf4_rm_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                              vfloat16mf4_t vs2,
                                              vfloat16mf4_t vs1,
                                              unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfadd_vf_f16mf4_rm_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                              vfloat16mf4_t vs2, _Float16 rs1,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfadd_vv_f16mf2_rm_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                              vfloat16mf2_t vs2,
                                              vfloat16mf2_t vs1,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfadd_vf_f16mf2_rm_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                              vfloat16mf2_t vs2, _Float16 rs1,
                                              unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfadd_vv_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                            vfloat16m1_t vs2, vfloat16m1_t vs1,
                                            unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfadd_vf_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                            vfloat16m1_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfadd_vv_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                            vfloat16m2_t vs2, vfloat16m2_t vs1,
                                            unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfadd_vf_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                            vfloat16m2_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfadd_vv_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                            vfloat16m4_t vs2, vfloat16m4_t vs1,
                                            unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfadd_vf_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                            vfloat16m4_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfadd_vv_f16m8_rm_tumu(vbool2_t vm, vfloat16m8_t vd,
                                            vfloat16m8_t vs2, vfloat16m8_t vs1,
                                            unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfadd_vf_f16m8_rm_tumu(vbool2_t vm, vfloat16m8_t vd,
                                            vfloat16m8_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
// f32 element types (scalar operand: float)
vfloat32mf2_t __riscv_vfadd_vv_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat32mf2_t vs2,
                                              vfloat32mf2_t vs1,
                                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfadd_vf_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat32mf2_t vs2, float rs1,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfadd_vv_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat32m1_t vs2, vfloat32m1_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfadd_vf_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat32m1_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfadd_vv_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat32m2_t vs2, vfloat32m2_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfadd_vf_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat32m2_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfadd_vv_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat32m4_t vs2, vfloat32m4_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfadd_vf_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat32m4_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfadd_vv_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat32m8_t vs2, vfloat32m8_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfadd_vf_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat32m8_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
// f64 element types (scalar operand: double)
vfloat64m1_t __riscv_vfadd_vv_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat64m1_t vs2, vfloat64m1_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfadd_vf_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat64m1_t vs2, double rs1,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfadd_vv_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat64m2_t vs2, vfloat64m2_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfadd_vf_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat64m2_t vs2, double rs1,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfadd_vv_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat64m4_t vs2, vfloat64m4_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfadd_vf_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat64m4_t vs2, double rs1,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfadd_vv_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat64m8_t vs2, vfloat64m8_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfadd_vf_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat64m8_t vs2, double rs1,
                                            unsigned int frm, size_t vl);
// vfsub, `_rm_tumu` prototypes (single-width floating-point subtract).
//   _vv: the second source is a vector `vs1` of the same type as `vs2`.
//   _vf: the second source is a scalar `rs1` (_Float16 / float / double,
//        matching the f16 / f32 / f64 element type).
// Every prototype takes a mask `vm`, a `vd` operand of the return type, an
// `unsigned int frm`, and `size_t vl`.
// NOTE(review): presumably computes vs2 - vs1 (or vs2 - rs1), with `_rm`
// marking the explicit rounding-mode variant and `_tumu` the
// tail-undisturbed, mask-undisturbed policy. Confirm against the RVV
// intrinsics spec.
//
// f16 element types (scalar operand: _Float16)
vfloat16mf4_t __riscv_vfsub_vv_f16mf4_rm_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                              vfloat16mf4_t vs2,
                                              vfloat16mf4_t vs1,
                                              unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfsub_vf_f16mf4_rm_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                              vfloat16mf4_t vs2, _Float16 rs1,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfsub_vv_f16mf2_rm_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                              vfloat16mf2_t vs2,
                                              vfloat16mf2_t vs1,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfsub_vf_f16mf2_rm_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                              vfloat16mf2_t vs2, _Float16 rs1,
                                              unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfsub_vv_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                            vfloat16m1_t vs2, vfloat16m1_t vs1,
                                            unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfsub_vf_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                            vfloat16m1_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfsub_vv_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                            vfloat16m2_t vs2, vfloat16m2_t vs1,
                                            unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfsub_vf_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                            vfloat16m2_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfsub_vv_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                            vfloat16m4_t vs2, vfloat16m4_t vs1,
                                            unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfsub_vf_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                            vfloat16m4_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfsub_vv_f16m8_rm_tumu(vbool2_t vm, vfloat16m8_t vd,
                                            vfloat16m8_t vs2, vfloat16m8_t vs1,
                                            unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfsub_vf_f16m8_rm_tumu(vbool2_t vm, vfloat16m8_t vd,
                                            vfloat16m8_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
// f32 element types (scalar operand: float)
vfloat32mf2_t __riscv_vfsub_vv_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat32mf2_t vs2,
                                              vfloat32mf2_t vs1,
                                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfsub_vf_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat32mf2_t vs2, float rs1,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfsub_vv_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat32m1_t vs2, vfloat32m1_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfsub_vf_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat32m1_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfsub_vv_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat32m2_t vs2, vfloat32m2_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfsub_vf_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat32m2_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfsub_vv_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat32m4_t vs2, vfloat32m4_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfsub_vf_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat32m4_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfsub_vv_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat32m8_t vs2, vfloat32m8_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfsub_vf_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat32m8_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
// f64 element types (scalar operand: double)
vfloat64m1_t __riscv_vfsub_vv_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat64m1_t vs2, vfloat64m1_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfsub_vf_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat64m1_t vs2, double rs1,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfsub_vv_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat64m2_t vs2, vfloat64m2_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfsub_vf_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat64m2_t vs2, double rs1,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfsub_vv_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat64m4_t vs2, vfloat64m4_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfsub_vf_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat64m4_t vs2, double rs1,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfsub_vv_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat64m8_t vs2, vfloat64m8_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfsub_vf_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat64m8_t vs2, double rs1,
                                            unsigned int frm, size_t vl);
// vfrsub, `_rm_tumu` prototypes. Only the vector-scalar `_vf` form is
// declared: each takes a mask `vm`, a `vd` operand of the return type, a
// vector `vs2`, a scalar `rs1` (_Float16 / float / double, matching the
// f16 / f32 / f64 element type), an `unsigned int frm`, and `size_t vl`.
// NOTE(review): presumably the reverse subtract rs1 - vs2, with `_rm` marking
// the explicit rounding-mode variant and `_tumu` the tail-undisturbed,
// mask-undisturbed policy. Confirm against the RVV intrinsics spec.
//
// f16 element types (scalar operand: _Float16)
vfloat16mf4_t __riscv_vfrsub_vf_f16mf4_rm_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                               vfloat16mf4_t vs2, _Float16 rs1,
                                               unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfrsub_vf_f16mf2_rm_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                               vfloat16mf2_t vs2, _Float16 rs1,
                                               unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfrsub_vf_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                             vfloat16m1_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfrsub_vf_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                             vfloat16m2_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfrsub_vf_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                             vfloat16m4_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfrsub_vf_f16m8_rm_tumu(vbool2_t vm, vfloat16m8_t vd,
                                             vfloat16m8_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
// f32 element types (scalar operand: float)
vfloat32mf2_t __riscv_vfrsub_vf_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                               vfloat32mf2_t vs2, float rs1,
                                               unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfrsub_vf_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                             vfloat32m1_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfrsub_vf_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                             vfloat32m2_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfrsub_vf_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                             vfloat32m4_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfrsub_vf_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                             vfloat32m8_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
// f64 element types (scalar operand: double)
vfloat64m1_t __riscv_vfrsub_vf_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                             vfloat64m1_t vs2, double rs1,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfrsub_vf_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                             vfloat64m2_t vs2, double rs1,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfrsub_vf_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                             vfloat64m4_t vs2, double rs1,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfrsub_vf_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                             vfloat64m8_t vs2, double rs1,
                                             unsigned int frm, size_t vl);
// masked functions (_rm_mu variants)
// vfadd, `_rm_mu` prototypes (single-width floating-point add).
//   _vv: the second source is a vector `vs1` of the same type as `vs2`.
//   _vf: the second source is a scalar `rs1` (_Float16 / float / double,
//        matching the f16 / f32 / f64 element type).
// Every prototype takes a mask `vm`, a `vd` operand of the return type, an
// `unsigned int frm`, and `size_t vl`.
// NOTE(review): by the RVV intrinsics naming scheme `_rm` should mark the
// explicit rounding-mode (`frm`) variant and `_mu` the mask-undisturbed
// policy with `vd` supplying the masked-off elements. Confirm against the
// intrinsics spec.
//
// f16 element types (scalar operand: _Float16)
vfloat16mf4_t __riscv_vfadd_vv_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                            vfloat16mf4_t vs2,
                                            vfloat16mf4_t vs1, unsigned int frm,
                                            size_t vl);
vfloat16mf4_t __riscv_vfadd_vf_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                            vfloat16mf4_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfadd_vv_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                            vfloat16mf2_t vs2,
                                            vfloat16mf2_t vs1, unsigned int frm,
                                            size_t vl);
vfloat16mf2_t __riscv_vfadd_vf_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                            vfloat16mf2_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfadd_vv_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                          vfloat16m1_t vs2, vfloat16m1_t vs1,
                                          unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfadd_vf_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                          vfloat16m1_t vs2, _Float16 rs1,
                                          unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfadd_vv_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                          vfloat16m2_t vs2, vfloat16m2_t vs1,
                                          unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfadd_vf_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                          vfloat16m2_t vs2, _Float16 rs1,
                                          unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfadd_vv_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                          vfloat16m4_t vs2, vfloat16m4_t vs1,
                                          unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfadd_vf_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                          vfloat16m4_t vs2, _Float16 rs1,
                                          unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfadd_vv_f16m8_rm_mu(vbool2_t vm, vfloat16m8_t vd,
                                          vfloat16m8_t vs2, vfloat16m8_t vs1,
                                          unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfadd_vf_f16m8_rm_mu(vbool2_t vm, vfloat16m8_t vd,
                                          vfloat16m8_t vs2, _Float16 rs1,
                                          unsigned int frm, size_t vl);
// f32 element types (scalar operand: float)
vfloat32mf2_t __riscv_vfadd_vv_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs2,
                                            vfloat32mf2_t vs1, unsigned int frm,
                                            size_t vl);
vfloat32mf2_t __riscv_vfadd_vf_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfadd_vv_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs2, vfloat32m1_t vs1,
                                          unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfadd_vf_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs2, float rs1,
                                          unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfadd_vv_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs2, vfloat32m2_t vs1,
                                          unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfadd_vf_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs2, float rs1,
                                          unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfadd_vv_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs2, vfloat32m4_t vs1,
                                          unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfadd_vf_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs2, float rs1,
                                          unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfadd_vv_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs2, vfloat32m8_t vs1,
                                          unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfadd_vf_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs2, float rs1,
                                          unsigned int frm, size_t vl);
// f64 element types (scalar operand: double)
vfloat64m1_t __riscv_vfadd_vv_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs2, vfloat64m1_t vs1,
                                          unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfadd_vf_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs2, double rs1,
                                          unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfadd_vv_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs2, vfloat64m2_t vs1,
                                          unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfadd_vf_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs2, double rs1,
                                          unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfadd_vv_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs2, vfloat64m4_t vs1,
                                          unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfadd_vf_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs2, double rs1,
                                          unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfadd_vv_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs2, vfloat64m8_t vs1,
                                          unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfadd_vf_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs2, double rs1,
                                          unsigned int frm, size_t vl);
// vfsub, `_rm_mu` prototypes (single-width floating-point subtract).
//   _vv: the second source is a vector `vs1` of the same type as `vs2`.
//   _vf: the second source is a scalar `rs1` (_Float16 / float / double,
//        matching the f16 / f32 / f64 element type).
// Every prototype takes a mask `vm`, a `vd` operand of the return type, an
// `unsigned int frm`, and `size_t vl`.
// NOTE(review): presumably computes vs2 - vs1 (or vs2 - rs1), with `_rm`
// marking the explicit rounding-mode variant and `_mu` the mask-undisturbed
// policy. Confirm against the RVV intrinsics spec.
//
// f16 element types (scalar operand: _Float16)
vfloat16mf4_t __riscv_vfsub_vv_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                            vfloat16mf4_t vs2,
                                            vfloat16mf4_t vs1, unsigned int frm,
                                            size_t vl);
vfloat16mf4_t __riscv_vfsub_vf_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                            vfloat16mf4_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfsub_vv_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                            vfloat16mf2_t vs2,
                                            vfloat16mf2_t vs1, unsigned int frm,
                                            size_t vl);
vfloat16mf2_t __riscv_vfsub_vf_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                            vfloat16mf2_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfsub_vv_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                          vfloat16m1_t vs2, vfloat16m1_t vs1,
                                          unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfsub_vf_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                          vfloat16m1_t vs2, _Float16 rs1,
                                          unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfsub_vv_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                          vfloat16m2_t vs2, vfloat16m2_t vs1,
                                          unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfsub_vf_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                          vfloat16m2_t vs2, _Float16 rs1,
                                          unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfsub_vv_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                          vfloat16m4_t vs2, vfloat16m4_t vs1,
                                          unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfsub_vf_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                          vfloat16m4_t vs2, _Float16 rs1,
                                          unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfsub_vv_f16m8_rm_mu(vbool2_t vm, vfloat16m8_t vd,
                                          vfloat16m8_t vs2, vfloat16m8_t vs1,
                                          unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfsub_vf_f16m8_rm_mu(vbool2_t vm, vfloat16m8_t vd,
                                          vfloat16m8_t vs2, _Float16 rs1,
                                          unsigned int frm, size_t vl);
// f32 element types (scalar operand: float)
vfloat32mf2_t __riscv_vfsub_vv_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs2,
                                            vfloat32mf2_t vs1, unsigned int frm,
                                            size_t vl);
vfloat32mf2_t __riscv_vfsub_vf_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfsub_vv_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs2, vfloat32m1_t vs1,
                                          unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfsub_vf_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs2, float rs1,
                                          unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfsub_vv_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs2, vfloat32m2_t vs1,
                                          unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfsub_vf_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs2, float rs1,
                                          unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfsub_vv_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs2, vfloat32m4_t vs1,
                                          unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfsub_vf_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs2, float rs1,
                                          unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfsub_vv_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs2, vfloat32m8_t vs1,
                                          unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfsub_vf_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs2, float rs1,
                                          unsigned int frm, size_t vl);
// f64 element types (scalar operand: double)
vfloat64m1_t __riscv_vfsub_vv_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs2, vfloat64m1_t vs1,
                                          unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfsub_vf_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs2, double rs1,
                                          unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfsub_vv_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs2, vfloat64m2_t vs1,
                                          unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfsub_vf_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs2, double rs1,
                                          unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfsub_vv_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs2, vfloat64m4_t vs1,
                                          unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfsub_vf_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs2, double rs1,
                                          unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfsub_vv_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs2, vfloat64m8_t vs1,
                                          unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfsub_vf_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs2, double rs1,
                                          unsigned int frm, size_t vl);
// vfrsub, `_rm_mu` prototypes. Only the vector-scalar `_vf` form is
// declared: each takes a mask `vm`, a `vd` operand of the return type, a
// vector `vs2`, a scalar `rs1` (_Float16 / float / double, matching the
// f16 / f32 / f64 element type), an `unsigned int frm`, and `size_t vl`.
// NOTE(review): presumably the reverse subtract rs1 - vs2, with `_rm` marking
// the explicit rounding-mode variant and `_mu` the mask-undisturbed policy.
// Confirm against the RVV intrinsics spec.
//
// f16 element types (scalar operand: _Float16)
vfloat16mf4_t __riscv_vfrsub_vf_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                             vfloat16mf4_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfrsub_vf_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                             vfloat16mf2_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfrsub_vf_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                           vfloat16m1_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfrsub_vf_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                           vfloat16m2_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfrsub_vf_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                           vfloat16m4_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfrsub_vf_f16m8_rm_mu(vbool2_t vm, vfloat16m8_t vd,
                                           vfloat16m8_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
// f32 element types (scalar operand: float)
vfloat32mf2_t __riscv_vfrsub_vf_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat32mf2_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfrsub_vf_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat32m1_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfrsub_vf_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat32m2_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfrsub_vf_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat32m4_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfrsub_vf_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat32m8_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
// f64 element types (scalar operand: double)
vfloat64m1_t __riscv_vfrsub_vf_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat64m1_t vs2, double rs1,
                                           unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfrsub_vf_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat64m2_t vs2, double rs1,
                                           unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfrsub_vf_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat64m4_t vs2, double rs1,
                                           unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfrsub_vf_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat64m8_t vs2, double rs1,
                                           unsigned int frm, size_t vl);

Vector Widening Floating-Point Add/Subtract Intrinsics

// vfwadd, unmasked `_tu` variants. The result type has twice the element
// width and twice the LMUL of the narrow source type (f32mf2 <- f16mf4,
// f32m8 <- f16m4, f64m1 <- f32mf2, f64m8 <- f32m4). Four operand forms exist
// per result type:
//   _vv : narrow vs2, narrow vector vs1
//   _vf : narrow vs2, narrow scalar rs1
//   _wv : vs2 already at result width, narrow vector vs1
//   _wf : vs2 already at result width, narrow scalar rs1
// The scalar is _Float16 for f32 results and float for f64 results.
// NOTE(review): `_tu` presumably selects the tail-undisturbed policy, with
// `vd` supplying the preserved tail elements -- confirm against the RVV
// intrinsics spec.
vfloat32mf2_t __riscv_vfwadd_vv_f32mf2_tu(vfloat32mf2_t vd, vfloat16mf4_t vs2,
                                          vfloat16mf4_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfwadd_vf_f32mf2_tu(vfloat32mf2_t vd, vfloat16mf4_t vs2,
                                          _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfwadd_wv_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                          vfloat16mf4_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfwadd_wf_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                          _Float16 rs1, size_t vl);
vfloat32m1_t __riscv_vfwadd_vv_f32m1_tu(vfloat32m1_t vd, vfloat16mf2_t vs2,
                                        vfloat16mf2_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwadd_vf_f32m1_tu(vfloat32m1_t vd, vfloat16mf2_t vs2,
                                        _Float16 rs1, size_t vl);
vfloat32m1_t __riscv_vfwadd_wv_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                        vfloat16mf2_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwadd_wf_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                        _Float16 rs1, size_t vl);
vfloat32m2_t __riscv_vfwadd_vv_f32m2_tu(vfloat32m2_t vd, vfloat16m1_t vs2,
                                        vfloat16m1_t vs1, size_t vl);
vfloat32m2_t __riscv_vfwadd_vf_f32m2_tu(vfloat32m2_t vd, vfloat16m1_t vs2,
                                        _Float16 rs1, size_t vl);
vfloat32m2_t __riscv_vfwadd_wv_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                        vfloat16m1_t vs1, size_t vl);
vfloat32m2_t __riscv_vfwadd_wf_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                        _Float16 rs1, size_t vl);
vfloat32m4_t __riscv_vfwadd_vv_f32m4_tu(vfloat32m4_t vd, vfloat16m2_t vs2,
                                        vfloat16m2_t vs1, size_t vl);
vfloat32m4_t __riscv_vfwadd_vf_f32m4_tu(vfloat32m4_t vd, vfloat16m2_t vs2,
                                        _Float16 rs1, size_t vl);
vfloat32m4_t __riscv_vfwadd_wv_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                        vfloat16m2_t vs1, size_t vl);
vfloat32m4_t __riscv_vfwadd_wf_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                        _Float16 rs1, size_t vl);
vfloat32m8_t __riscv_vfwadd_vv_f32m8_tu(vfloat32m8_t vd, vfloat16m4_t vs2,
                                        vfloat16m4_t vs1, size_t vl);
vfloat32m8_t __riscv_vfwadd_vf_f32m8_tu(vfloat32m8_t vd, vfloat16m4_t vs2,
                                        _Float16 rs1, size_t vl);
vfloat32m8_t __riscv_vfwadd_wv_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                        vfloat16m4_t vs1, size_t vl);
vfloat32m8_t __riscv_vfwadd_wf_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                        _Float16 rs1, size_t vl);
vfloat64m1_t __riscv_vfwadd_vv_f64m1_tu(vfloat64m1_t vd, vfloat32mf2_t vs2,
                                        vfloat32mf2_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwadd_vf_f64m1_tu(vfloat64m1_t vd, vfloat32mf2_t vs2,
                                        float rs1, size_t vl);
vfloat64m1_t __riscv_vfwadd_wv_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                        vfloat32mf2_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwadd_wf_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                        float rs1, size_t vl);
vfloat64m2_t __riscv_vfwadd_vv_f64m2_tu(vfloat64m2_t vd, vfloat32m1_t vs2,
                                        vfloat32m1_t vs1, size_t vl);
vfloat64m2_t __riscv_vfwadd_vf_f64m2_tu(vfloat64m2_t vd, vfloat32m1_t vs2,
                                        float rs1, size_t vl);
vfloat64m2_t __riscv_vfwadd_wv_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                        vfloat32m1_t vs1, size_t vl);
vfloat64m2_t __riscv_vfwadd_wf_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                        float rs1, size_t vl);
vfloat64m4_t __riscv_vfwadd_vv_f64m4_tu(vfloat64m4_t vd, vfloat32m2_t vs2,
                                        vfloat32m2_t vs1, size_t vl);
vfloat64m4_t __riscv_vfwadd_vf_f64m4_tu(vfloat64m4_t vd, vfloat32m2_t vs2,
                                        float rs1, size_t vl);
vfloat64m4_t __riscv_vfwadd_wv_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                        vfloat32m2_t vs1, size_t vl);
vfloat64m4_t __riscv_vfwadd_wf_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                        float rs1, size_t vl);
vfloat64m8_t __riscv_vfwadd_vv_f64m8_tu(vfloat64m8_t vd, vfloat32m4_t vs2,
                                        vfloat32m4_t vs1, size_t vl);
vfloat64m8_t __riscv_vfwadd_vf_f64m8_tu(vfloat64m8_t vd, vfloat32m4_t vs2,
                                        float rs1, size_t vl);
vfloat64m8_t __riscv_vfwadd_wv_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                        vfloat32m4_t vs1, size_t vl);
vfloat64m8_t __riscv_vfwadd_wf_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                        float rs1, size_t vl);
// vfwsub, unmasked `_tu` variants. Signatures mirror the vfwadd `_tu` set one
// for one: the result type has twice the element width and twice the LMUL of
// the narrow source (f32mf2 <- f16mf4 ... f64m8 <- f32m4), and each result
// type comes in four operand forms:
//   _vv : narrow vs2, narrow vector vs1
//   _vf : narrow vs2, narrow scalar rs1
//   _wv : vs2 already at result width, narrow vector vs1
//   _wf : vs2 already at result width, narrow scalar rs1
// NOTE(review): operand order of the subtraction is presumably vs2 - vs1 (or
// vs2 - rs1), and `_tu` the tail-undisturbed policy -- confirm against the
// RVV spec.
vfloat32mf2_t __riscv_vfwsub_vv_f32mf2_tu(vfloat32mf2_t vd, vfloat16mf4_t vs2,
                                          vfloat16mf4_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfwsub_vf_f32mf2_tu(vfloat32mf2_t vd, vfloat16mf4_t vs2,
                                          _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfwsub_wv_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                          vfloat16mf4_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfwsub_wf_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                          _Float16 rs1, size_t vl);
vfloat32m1_t __riscv_vfwsub_vv_f32m1_tu(vfloat32m1_t vd, vfloat16mf2_t vs2,
                                        vfloat16mf2_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwsub_vf_f32m1_tu(vfloat32m1_t vd, vfloat16mf2_t vs2,
                                        _Float16 rs1, size_t vl);
vfloat32m1_t __riscv_vfwsub_wv_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                        vfloat16mf2_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwsub_wf_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                        _Float16 rs1, size_t vl);
vfloat32m2_t __riscv_vfwsub_vv_f32m2_tu(vfloat32m2_t vd, vfloat16m1_t vs2,
                                        vfloat16m1_t vs1, size_t vl);
vfloat32m2_t __riscv_vfwsub_vf_f32m2_tu(vfloat32m2_t vd, vfloat16m1_t vs2,
                                        _Float16 rs1, size_t vl);
vfloat32m2_t __riscv_vfwsub_wv_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                        vfloat16m1_t vs1, size_t vl);
vfloat32m2_t __riscv_vfwsub_wf_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                        _Float16 rs1, size_t vl);
vfloat32m4_t __riscv_vfwsub_vv_f32m4_tu(vfloat32m4_t vd, vfloat16m2_t vs2,
                                        vfloat16m2_t vs1, size_t vl);
vfloat32m4_t __riscv_vfwsub_vf_f32m4_tu(vfloat32m4_t vd, vfloat16m2_t vs2,
                                        _Float16 rs1, size_t vl);
vfloat32m4_t __riscv_vfwsub_wv_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                        vfloat16m2_t vs1, size_t vl);
vfloat32m4_t __riscv_vfwsub_wf_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                        _Float16 rs1, size_t vl);
vfloat32m8_t __riscv_vfwsub_vv_f32m8_tu(vfloat32m8_t vd, vfloat16m4_t vs2,
                                        vfloat16m4_t vs1, size_t vl);
vfloat32m8_t __riscv_vfwsub_vf_f32m8_tu(vfloat32m8_t vd, vfloat16m4_t vs2,
                                        _Float16 rs1, size_t vl);
vfloat32m8_t __riscv_vfwsub_wv_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                        vfloat16m4_t vs1, size_t vl);
vfloat32m8_t __riscv_vfwsub_wf_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                        _Float16 rs1, size_t vl);
vfloat64m1_t __riscv_vfwsub_vv_f64m1_tu(vfloat64m1_t vd, vfloat32mf2_t vs2,
                                        vfloat32mf2_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwsub_vf_f64m1_tu(vfloat64m1_t vd, vfloat32mf2_t vs2,
                                        float rs1, size_t vl);
vfloat64m1_t __riscv_vfwsub_wv_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                        vfloat32mf2_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwsub_wf_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                        float rs1, size_t vl);
vfloat64m2_t __riscv_vfwsub_vv_f64m2_tu(vfloat64m2_t vd, vfloat32m1_t vs2,
                                        vfloat32m1_t vs1, size_t vl);
vfloat64m2_t __riscv_vfwsub_vf_f64m2_tu(vfloat64m2_t vd, vfloat32m1_t vs2,
                                        float rs1, size_t vl);
vfloat64m2_t __riscv_vfwsub_wv_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                        vfloat32m1_t vs1, size_t vl);
vfloat64m2_t __riscv_vfwsub_wf_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                        float rs1, size_t vl);
vfloat64m4_t __riscv_vfwsub_vv_f64m4_tu(vfloat64m4_t vd, vfloat32m2_t vs2,
                                        vfloat32m2_t vs1, size_t vl);
vfloat64m4_t __riscv_vfwsub_vf_f64m4_tu(vfloat64m4_t vd, vfloat32m2_t vs2,
                                        float rs1, size_t vl);
vfloat64m4_t __riscv_vfwsub_wv_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                        vfloat32m2_t vs1, size_t vl);
vfloat64m4_t __riscv_vfwsub_wf_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                        float rs1, size_t vl);
vfloat64m8_t __riscv_vfwsub_vv_f64m8_tu(vfloat64m8_t vd, vfloat32m4_t vs2,
                                        vfloat32m4_t vs1, size_t vl);
vfloat64m8_t __riscv_vfwsub_vf_f64m8_tu(vfloat64m8_t vd, vfloat32m4_t vs2,
                                        float rs1, size_t vl);
vfloat64m8_t __riscv_vfwsub_wv_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                        vfloat32m4_t vs1, size_t vl);
vfloat64m8_t __riscv_vfwsub_wf_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                        float rs1, size_t vl);
// masked functions (_tum variants: tail-undisturbed, mask-agnostic)
// vfwadd, `_tum` variants. Compared with the unmasked `_tu` prototypes these
// add a leading mask operand `vm`; the remaining operands keep the same order
// (`vd`, `vs2`, `vs1`/`rs1`, `vl`). The mask type is chosen from the *result*
// type: vbool<N>_t with N = result element width / result LMUL
// (f32mf2 -> vbool64_t, f32m8 -> vbool4_t, f64m1 -> vbool64_t,
// f64m8 -> vbool8_t). `_vv`/`_vf` take a narrow vs2, `_wv`/`_wf` take vs2 at
// result width; the scalar rs1 is always the narrow element type.
// NOTE(review): `vd` presumably supplies the values for preserved (tail)
// elements -- confirm against the RVV intrinsics policy documentation.
vfloat32mf2_t __riscv_vfwadd_vv_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                           size_t vl);
vfloat32mf2_t __riscv_vfwadd_vf_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat16mf4_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat32mf2_t __riscv_vfwadd_wv_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs2, vfloat16mf4_t vs1,
                                           size_t vl);
vfloat32mf2_t __riscv_vfwadd_wf_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat32m1_t __riscv_vfwadd_vv_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                         size_t vl);
vfloat32m1_t __riscv_vfwadd_vf_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat16mf2_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat32m1_t __riscv_vfwadd_wv_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs2, vfloat16mf2_t vs1,
                                         size_t vl);
vfloat32m1_t __riscv_vfwadd_wf_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat32m2_t __riscv_vfwadd_vv_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat16m1_t vs2, vfloat16m1_t vs1,
                                         size_t vl);
vfloat32m2_t __riscv_vfwadd_vf_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat16m1_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat32m2_t __riscv_vfwadd_wv_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs2, vfloat16m1_t vs1,
                                         size_t vl);
vfloat32m2_t __riscv_vfwadd_wf_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat32m4_t __riscv_vfwadd_vv_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat16m2_t vs2, vfloat16m2_t vs1,
                                         size_t vl);
vfloat32m4_t __riscv_vfwadd_vf_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat16m2_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat32m4_t __riscv_vfwadd_wv_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs2, vfloat16m2_t vs1,
                                         size_t vl);
vfloat32m4_t __riscv_vfwadd_wf_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat32m8_t __riscv_vfwadd_vv_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat16m4_t vs2, vfloat16m4_t vs1,
                                         size_t vl);
vfloat32m8_t __riscv_vfwadd_vf_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat16m4_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat32m8_t __riscv_vfwadd_wv_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs2, vfloat16m4_t vs1,
                                         size_t vl);
vfloat32m8_t __riscv_vfwadd_wf_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat64m1_t __riscv_vfwadd_vv_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                         size_t vl);
vfloat64m1_t __riscv_vfwadd_vf_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat32mf2_t vs2, float rs1,
                                         size_t vl);
vfloat64m1_t __riscv_vfwadd_wv_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs2, vfloat32mf2_t vs1,
                                         size_t vl);
vfloat64m1_t __riscv_vfwadd_wf_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs2, float rs1,
                                         size_t vl);
vfloat64m2_t __riscv_vfwadd_vv_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat32m1_t vs2, vfloat32m1_t vs1,
                                         size_t vl);
vfloat64m2_t __riscv_vfwadd_vf_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat32m1_t vs2, float rs1,
                                         size_t vl);
vfloat64m2_t __riscv_vfwadd_wv_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs2, vfloat32m1_t vs1,
                                         size_t vl);
vfloat64m2_t __riscv_vfwadd_wf_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs2, float rs1,
                                         size_t vl);
vfloat64m4_t __riscv_vfwadd_vv_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat32m2_t vs2, vfloat32m2_t vs1,
                                         size_t vl);
vfloat64m4_t __riscv_vfwadd_vf_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat32m2_t vs2, float rs1,
                                         size_t vl);
vfloat64m4_t __riscv_vfwadd_wv_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs2, vfloat32m2_t vs1,
                                         size_t vl);
vfloat64m4_t __riscv_vfwadd_wf_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs2, float rs1,
                                         size_t vl);
vfloat64m8_t __riscv_vfwadd_vv_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat32m4_t vs2, vfloat32m4_t vs1,
                                         size_t vl);
vfloat64m8_t __riscv_vfwadd_vf_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat32m4_t vs2, float rs1,
                                         size_t vl);
vfloat64m8_t __riscv_vfwadd_wv_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs2, vfloat32m4_t vs1,
                                         size_t vl);
vfloat64m8_t __riscv_vfwadd_wf_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs2, float rs1,
                                         size_t vl);
// vfwsub, `_tum` variants. Each prototype takes a leading mask `vm`, then
// `vd`, `vs2`, `vs1`/`rs1` and `vl`. The mask type follows the *result* type
// (vbool<N>_t with N = result element width / result LMUL, e.g.
// f32m1 -> vbool32_t, f64m4 -> vbool16_t). Narrow sources have half the
// element width and half the LMUL of the result; `_wv`/`_wf` take vs2 at
// result width while `_vv`/`_vf` take it narrow.
// NOTE(review): subtraction order is presumably vs2 - vs1 (or vs2 - rs1), with
// `vd` supplying preserved tail elements -- confirm against the RVV spec.
vfloat32mf2_t __riscv_vfwsub_vv_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                           size_t vl);
vfloat32mf2_t __riscv_vfwsub_vf_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat16mf4_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat32mf2_t __riscv_vfwsub_wv_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs2, vfloat16mf4_t vs1,
                                           size_t vl);
vfloat32mf2_t __riscv_vfwsub_wf_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat32m1_t __riscv_vfwsub_vv_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                         size_t vl);
vfloat32m1_t __riscv_vfwsub_vf_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat16mf2_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat32m1_t __riscv_vfwsub_wv_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs2, vfloat16mf2_t vs1,
                                         size_t vl);
vfloat32m1_t __riscv_vfwsub_wf_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat32m2_t __riscv_vfwsub_vv_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat16m1_t vs2, vfloat16m1_t vs1,
                                         size_t vl);
vfloat32m2_t __riscv_vfwsub_vf_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat16m1_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat32m2_t __riscv_vfwsub_wv_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs2, vfloat16m1_t vs1,
                                         size_t vl);
vfloat32m2_t __riscv_vfwsub_wf_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat32m4_t __riscv_vfwsub_vv_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat16m2_t vs2, vfloat16m2_t vs1,
                                         size_t vl);
vfloat32m4_t __riscv_vfwsub_vf_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat16m2_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat32m4_t __riscv_vfwsub_wv_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs2, vfloat16m2_t vs1,
                                         size_t vl);
vfloat32m4_t __riscv_vfwsub_wf_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat32m8_t __riscv_vfwsub_vv_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat16m4_t vs2, vfloat16m4_t vs1,
                                         size_t vl);
vfloat32m8_t __riscv_vfwsub_vf_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat16m4_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat32m8_t __riscv_vfwsub_wv_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs2, vfloat16m4_t vs1,
                                         size_t vl);
vfloat32m8_t __riscv_vfwsub_wf_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat64m1_t __riscv_vfwsub_vv_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                         size_t vl);
vfloat64m1_t __riscv_vfwsub_vf_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat32mf2_t vs2, float rs1,
                                         size_t vl);
vfloat64m1_t __riscv_vfwsub_wv_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs2, vfloat32mf2_t vs1,
                                         size_t vl);
vfloat64m1_t __riscv_vfwsub_wf_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs2, float rs1,
                                         size_t vl);
vfloat64m2_t __riscv_vfwsub_vv_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat32m1_t vs2, vfloat32m1_t vs1,
                                         size_t vl);
vfloat64m2_t __riscv_vfwsub_vf_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat32m1_t vs2, float rs1,
                                         size_t vl);
vfloat64m2_t __riscv_vfwsub_wv_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs2, vfloat32m1_t vs1,
                                         size_t vl);
vfloat64m2_t __riscv_vfwsub_wf_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs2, float rs1,
                                         size_t vl);
vfloat64m4_t __riscv_vfwsub_vv_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat32m2_t vs2, vfloat32m2_t vs1,
                                         size_t vl);
vfloat64m4_t __riscv_vfwsub_vf_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat32m2_t vs2, float rs1,
                                         size_t vl);
vfloat64m4_t __riscv_vfwsub_wv_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs2, vfloat32m2_t vs1,
                                         size_t vl);
vfloat64m4_t __riscv_vfwsub_wf_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs2, float rs1,
                                         size_t vl);
vfloat64m8_t __riscv_vfwsub_vv_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat32m4_t vs2, vfloat32m4_t vs1,
                                         size_t vl);
vfloat64m8_t __riscv_vfwsub_vf_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat32m4_t vs2, float rs1,
                                         size_t vl);
vfloat64m8_t __riscv_vfwsub_wv_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs2, vfloat32m4_t vs1,
                                         size_t vl);
vfloat64m8_t __riscv_vfwsub_wf_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs2, float rs1,
                                         size_t vl);
// masked functions: `_tumu` policy variants (per the RVV intrinsics naming
// scheme: tail-undisturbed, mask-undisturbed).
//
// vfwadd, `_tumu`: every prototype takes a mask `vm`, an operand `vd` of the
// result type, two sources and `vl`. The result is one step wider than the
// narrow source (f16 -> f32, f32 -> f64) at twice its LMUL.
//   _vv : vs2 and vs1 are both narrow vectors.
//   _vf : vs2 is a narrow vector, rs1 a narrow scalar (_Float16 / float).
//   _wv : vs2 already has the result type, vs1 is a narrow vector.
//   _wf : vs2 already has the result type, rs1 is a narrow scalar.
vfloat32mf2_t __riscv_vfwadd_vv_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat16mf4_t vs2,
                                            vfloat16mf4_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfwadd_vf_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat16mf4_t vs2, _Float16 rs1,
                                            size_t vl);
vfloat32mf2_t __riscv_vfwadd_wv_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs2,
                                            vfloat16mf4_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfwadd_wf_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs2, _Float16 rs1,
                                            size_t vl);
vfloat32m1_t __riscv_vfwadd_vv_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                          size_t vl);
vfloat32m1_t __riscv_vfwadd_vf_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat16mf2_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat32m1_t __riscv_vfwadd_wv_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs2, vfloat16mf2_t vs1,
                                          size_t vl);
vfloat32m1_t __riscv_vfwadd_wf_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat32m2_t __riscv_vfwadd_vv_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat16m1_t vs2, vfloat16m1_t vs1,
                                          size_t vl);
vfloat32m2_t __riscv_vfwadd_vf_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat16m1_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat32m2_t __riscv_vfwadd_wv_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs2, vfloat16m1_t vs1,
                                          size_t vl);
vfloat32m2_t __riscv_vfwadd_wf_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat32m4_t __riscv_vfwadd_vv_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat16m2_t vs2, vfloat16m2_t vs1,
                                          size_t vl);
vfloat32m4_t __riscv_vfwadd_vf_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat16m2_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat32m4_t __riscv_vfwadd_wv_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs2, vfloat16m2_t vs1,
                                          size_t vl);
vfloat32m4_t __riscv_vfwadd_wf_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat32m8_t __riscv_vfwadd_vv_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat16m4_t vs2, vfloat16m4_t vs1,
                                          size_t vl);
vfloat32m8_t __riscv_vfwadd_vf_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat16m4_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat32m8_t __riscv_vfwadd_wv_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs2, vfloat16m4_t vs1,
                                          size_t vl);
vfloat32m8_t __riscv_vfwadd_wf_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat64m1_t __riscv_vfwadd_vv_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                          size_t vl);
vfloat64m1_t __riscv_vfwadd_vf_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat32mf2_t vs2, float rs1,
                                          size_t vl);
vfloat64m1_t __riscv_vfwadd_wv_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs2, vfloat32mf2_t vs1,
                                          size_t vl);
vfloat64m1_t __riscv_vfwadd_wf_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs2, float rs1,
                                          size_t vl);
vfloat64m2_t __riscv_vfwadd_vv_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat32m1_t vs2, vfloat32m1_t vs1,
                                          size_t vl);
vfloat64m2_t __riscv_vfwadd_vf_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat32m1_t vs2, float rs1,
                                          size_t vl);
vfloat64m2_t __riscv_vfwadd_wv_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs2, vfloat32m1_t vs1,
                                          size_t vl);
vfloat64m2_t __riscv_vfwadd_wf_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs2, float rs1,
                                          size_t vl);
vfloat64m4_t __riscv_vfwadd_vv_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat32m2_t vs2, vfloat32m2_t vs1,
                                          size_t vl);
vfloat64m4_t __riscv_vfwadd_vf_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat32m2_t vs2, float rs1,
                                          size_t vl);
vfloat64m4_t __riscv_vfwadd_wv_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs2, vfloat32m2_t vs1,
                                          size_t vl);
vfloat64m4_t __riscv_vfwadd_wf_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs2, float rs1,
                                          size_t vl);
vfloat64m8_t __riscv_vfwadd_vv_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat32m4_t vs2, vfloat32m4_t vs1,
                                          size_t vl);
vfloat64m8_t __riscv_vfwadd_vf_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat32m4_t vs2, float rs1,
                                          size_t vl);
vfloat64m8_t __riscv_vfwadd_wv_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs2, vfloat32m4_t vs1,
                                          size_t vl);
vfloat64m8_t __riscv_vfwadd_wf_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs2, float rs1,
                                          size_t vl);
// vfwsub, `_tumu` (per the RVV intrinsics naming scheme: tail-undisturbed,
// mask-undisturbed). Every prototype takes a mask `vm`, an operand `vd` of
// the result type, two sources and `vl`. The result is one step wider than
// the narrow source (f16 -> f32, f32 -> f64) at twice its LMUL.
//   _vv / _vf : vs2 is a narrow vector; second operand is a narrow vector /
//               narrow scalar (_Float16 / float).
//   _wv / _wf : vs2 already has the result type; only vs1 / rs1 is narrow.
vfloat32mf2_t __riscv_vfwsub_vv_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat16mf4_t vs2,
                                            vfloat16mf4_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfwsub_vf_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat16mf4_t vs2, _Float16 rs1,
                                            size_t vl);
vfloat32mf2_t __riscv_vfwsub_wv_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs2,
                                            vfloat16mf4_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfwsub_wf_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs2, _Float16 rs1,
                                            size_t vl);
vfloat32m1_t __riscv_vfwsub_vv_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                          size_t vl);
vfloat32m1_t __riscv_vfwsub_vf_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat16mf2_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat32m1_t __riscv_vfwsub_wv_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs2, vfloat16mf2_t vs1,
                                          size_t vl);
vfloat32m1_t __riscv_vfwsub_wf_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat32m2_t __riscv_vfwsub_vv_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat16m1_t vs2, vfloat16m1_t vs1,
                                          size_t vl);
vfloat32m2_t __riscv_vfwsub_vf_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat16m1_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat32m2_t __riscv_vfwsub_wv_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs2, vfloat16m1_t vs1,
                                          size_t vl);
vfloat32m2_t __riscv_vfwsub_wf_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat32m4_t __riscv_vfwsub_vv_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat16m2_t vs2, vfloat16m2_t vs1,
                                          size_t vl);
vfloat32m4_t __riscv_vfwsub_vf_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat16m2_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat32m4_t __riscv_vfwsub_wv_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs2, vfloat16m2_t vs1,
                                          size_t vl);
vfloat32m4_t __riscv_vfwsub_wf_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat32m8_t __riscv_vfwsub_vv_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat16m4_t vs2, vfloat16m4_t vs1,
                                          size_t vl);
vfloat32m8_t __riscv_vfwsub_vf_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat16m4_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat32m8_t __riscv_vfwsub_wv_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs2, vfloat16m4_t vs1,
                                          size_t vl);
vfloat32m8_t __riscv_vfwsub_wf_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat64m1_t __riscv_vfwsub_vv_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                          size_t vl);
vfloat64m1_t __riscv_vfwsub_vf_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat32mf2_t vs2, float rs1,
                                          size_t vl);
vfloat64m1_t __riscv_vfwsub_wv_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs2, vfloat32mf2_t vs1,
                                          size_t vl);
vfloat64m1_t __riscv_vfwsub_wf_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs2, float rs1,
                                          size_t vl);
vfloat64m2_t __riscv_vfwsub_vv_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat32m1_t vs2, vfloat32m1_t vs1,
                                          size_t vl);
vfloat64m2_t __riscv_vfwsub_vf_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat32m1_t vs2, float rs1,
                                          size_t vl);
vfloat64m2_t __riscv_vfwsub_wv_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs2, vfloat32m1_t vs1,
                                          size_t vl);
vfloat64m2_t __riscv_vfwsub_wf_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs2, float rs1,
                                          size_t vl);
vfloat64m4_t __riscv_vfwsub_vv_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat32m2_t vs2, vfloat32m2_t vs1,
                                          size_t vl);
vfloat64m4_t __riscv_vfwsub_vf_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat32m2_t vs2, float rs1,
                                          size_t vl);
vfloat64m4_t __riscv_vfwsub_wv_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs2, vfloat32m2_t vs1,
                                          size_t vl);
vfloat64m4_t __riscv_vfwsub_wf_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs2, float rs1,
                                          size_t vl);
vfloat64m8_t __riscv_vfwsub_vv_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat32m4_t vs2, vfloat32m4_t vs1,
                                          size_t vl);
vfloat64m8_t __riscv_vfwsub_vf_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat32m4_t vs2, float rs1,
                                          size_t vl);
vfloat64m8_t __riscv_vfwsub_wv_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs2, vfloat32m4_t vs1,
                                          size_t vl);
vfloat64m8_t __riscv_vfwsub_wf_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs2, float rs1,
                                          size_t vl);
// masked functions: `_mu` policy variants (per the RVV intrinsics naming
// scheme: tail-agnostic, mask-undisturbed).
//
// vfwadd, `_mu`: every prototype takes a mask `vm`, an operand `vd` of the
// result type, two sources and `vl`. The result is one step wider than the
// narrow source (f16 -> f32, f32 -> f64) at twice its LMUL.
//   _vv / _vf : vs2 is a narrow vector; second operand is a narrow vector /
//               narrow scalar (_Float16 / float).
//   _wv / _wf : vs2 already has the result type; only vs1 / rs1 is narrow.
vfloat32mf2_t __riscv_vfwadd_vv_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                          size_t vl);
vfloat32mf2_t __riscv_vfwadd_vf_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat16mf4_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat32mf2_t __riscv_vfwadd_wv_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat32mf2_t vs2, vfloat16mf4_t vs1,
                                          size_t vl);
vfloat32mf2_t __riscv_vfwadd_wf_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat32mf2_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat32m1_t __riscv_vfwadd_vv_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                        size_t vl);
vfloat32m1_t __riscv_vfwadd_vf_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat16mf2_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat32m1_t __riscv_vfwadd_wv_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat32m1_t vs2, vfloat16mf2_t vs1,
                                        size_t vl);
vfloat32m1_t __riscv_vfwadd_wf_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat32m1_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat32m2_t __riscv_vfwadd_vv_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat16m1_t vs2, vfloat16m1_t vs1,
                                        size_t vl);
vfloat32m2_t __riscv_vfwadd_vf_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat16m1_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat32m2_t __riscv_vfwadd_wv_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat32m2_t vs2, vfloat16m1_t vs1,
                                        size_t vl);
vfloat32m2_t __riscv_vfwadd_wf_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat32m2_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat32m4_t __riscv_vfwadd_vv_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat16m2_t vs2, vfloat16m2_t vs1,
                                        size_t vl);
vfloat32m4_t __riscv_vfwadd_vf_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat16m2_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat32m4_t __riscv_vfwadd_wv_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat32m4_t vs2, vfloat16m2_t vs1,
                                        size_t vl);
vfloat32m4_t __riscv_vfwadd_wf_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat32m4_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat32m8_t __riscv_vfwadd_vv_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat16m4_t vs2, vfloat16m4_t vs1,
                                        size_t vl);
vfloat32m8_t __riscv_vfwadd_vf_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat16m4_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat32m8_t __riscv_vfwadd_wv_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat32m8_t vs2, vfloat16m4_t vs1,
                                        size_t vl);
vfloat32m8_t __riscv_vfwadd_wf_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat32m8_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat64m1_t __riscv_vfwadd_vv_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                        size_t vl);
vfloat64m1_t __riscv_vfwadd_vf_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat32mf2_t vs2, float rs1,
                                        size_t vl);
vfloat64m1_t __riscv_vfwadd_wv_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat64m1_t vs2, vfloat32mf2_t vs1,
                                        size_t vl);
vfloat64m1_t __riscv_vfwadd_wf_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat64m1_t vs2, float rs1, size_t vl);
vfloat64m2_t __riscv_vfwadd_vv_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat32m1_t vs2, vfloat32m1_t vs1,
                                        size_t vl);
vfloat64m2_t __riscv_vfwadd_vf_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat32m1_t vs2, float rs1, size_t vl);
vfloat64m2_t __riscv_vfwadd_wv_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat64m2_t vs2, vfloat32m1_t vs1,
                                        size_t vl);
vfloat64m2_t __riscv_vfwadd_wf_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat64m2_t vs2, float rs1, size_t vl);
vfloat64m4_t __riscv_vfwadd_vv_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat32m2_t vs2, vfloat32m2_t vs1,
                                        size_t vl);
vfloat64m4_t __riscv_vfwadd_vf_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat32m2_t vs2, float rs1, size_t vl);
vfloat64m4_t __riscv_vfwadd_wv_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat64m4_t vs2, vfloat32m2_t vs1,
                                        size_t vl);
vfloat64m4_t __riscv_vfwadd_wf_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat64m4_t vs2, float rs1, size_t vl);
vfloat64m8_t __riscv_vfwadd_vv_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat32m4_t vs2, vfloat32m4_t vs1,
                                        size_t vl);
vfloat64m8_t __riscv_vfwadd_vf_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat32m4_t vs2, float rs1, size_t vl);
vfloat64m8_t __riscv_vfwadd_wv_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat64m8_t vs2, vfloat32m4_t vs1,
                                        size_t vl);
vfloat64m8_t __riscv_vfwadd_wf_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat64m8_t vs2, float rs1, size_t vl);
// vfwsub, `_mu` (per the RVV intrinsics naming scheme: tail-agnostic,
// mask-undisturbed). Every prototype takes a mask `vm`, an operand `vd` of
// the result type, two sources and `vl`. The result is one step wider than
// the narrow source (f16 -> f32, f32 -> f64) at twice its LMUL.
//   _vv / _vf : vs2 is a narrow vector; second operand is a narrow vector /
//               narrow scalar (_Float16 / float).
//   _wv / _wf : vs2 already has the result type; only vs1 / rs1 is narrow.
vfloat32mf2_t __riscv_vfwsub_vv_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                          size_t vl);
vfloat32mf2_t __riscv_vfwsub_vf_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat16mf4_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat32mf2_t __riscv_vfwsub_wv_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat32mf2_t vs2, vfloat16mf4_t vs1,
                                          size_t vl);
vfloat32mf2_t __riscv_vfwsub_wf_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat32mf2_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat32m1_t __riscv_vfwsub_vv_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                        size_t vl);
vfloat32m1_t __riscv_vfwsub_vf_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat16mf2_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat32m1_t __riscv_vfwsub_wv_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat32m1_t vs2, vfloat16mf2_t vs1,
                                        size_t vl);
vfloat32m1_t __riscv_vfwsub_wf_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat32m1_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat32m2_t __riscv_vfwsub_vv_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat16m1_t vs2, vfloat16m1_t vs1,
                                        size_t vl);
vfloat32m2_t __riscv_vfwsub_vf_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat16m1_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat32m2_t __riscv_vfwsub_wv_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat32m2_t vs2, vfloat16m1_t vs1,
                                        size_t vl);
vfloat32m2_t __riscv_vfwsub_wf_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat32m2_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat32m4_t __riscv_vfwsub_vv_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat16m2_t vs2, vfloat16m2_t vs1,
                                        size_t vl);
vfloat32m4_t __riscv_vfwsub_vf_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat16m2_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat32m4_t __riscv_vfwsub_wv_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat32m4_t vs2, vfloat16m2_t vs1,
                                        size_t vl);
vfloat32m4_t __riscv_vfwsub_wf_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat32m4_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat32m8_t __riscv_vfwsub_vv_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat16m4_t vs2, vfloat16m4_t vs1,
                                        size_t vl);
vfloat32m8_t __riscv_vfwsub_vf_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat16m4_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat32m8_t __riscv_vfwsub_wv_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat32m8_t vs2, vfloat16m4_t vs1,
                                        size_t vl);
vfloat32m8_t __riscv_vfwsub_wf_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat32m8_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat64m1_t __riscv_vfwsub_vv_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                        size_t vl);
vfloat64m1_t __riscv_vfwsub_vf_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat32mf2_t vs2, float rs1,
                                        size_t vl);
vfloat64m1_t __riscv_vfwsub_wv_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat64m1_t vs2, vfloat32mf2_t vs1,
                                        size_t vl);
vfloat64m1_t __riscv_vfwsub_wf_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat64m1_t vs2, float rs1, size_t vl);
vfloat64m2_t __riscv_vfwsub_vv_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat32m1_t vs2, vfloat32m1_t vs1,
                                        size_t vl);
vfloat64m2_t __riscv_vfwsub_vf_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat32m1_t vs2, float rs1, size_t vl);
vfloat64m2_t __riscv_vfwsub_wv_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat64m2_t vs2, vfloat32m1_t vs1,
                                        size_t vl);
vfloat64m2_t __riscv_vfwsub_wf_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat64m2_t vs2, float rs1, size_t vl);
vfloat64m4_t __riscv_vfwsub_vv_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat32m2_t vs2, vfloat32m2_t vs1,
                                        size_t vl);
vfloat64m4_t __riscv_vfwsub_vf_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat32m2_t vs2, float rs1, size_t vl);
vfloat64m4_t __riscv_vfwsub_wv_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat64m4_t vs2, vfloat32m2_t vs1,
                                        size_t vl);
vfloat64m4_t __riscv_vfwsub_wf_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat64m4_t vs2, float rs1, size_t vl);
vfloat64m8_t __riscv_vfwsub_vv_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat32m4_t vs2, vfloat32m4_t vs1,
                                        size_t vl);
vfloat64m8_t __riscv_vfwsub_vf_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat32m4_t vs2, float rs1, size_t vl);
vfloat64m8_t __riscv_vfwsub_wv_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat64m8_t vs2, vfloat32m4_t vs1,
                                        size_t vl);
vfloat64m8_t __riscv_vfwsub_wf_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat64m8_t vs2, float rs1, size_t vl);
vfloat32mf2_t __riscv_vfwadd_vv_f32mf2_rm_tu(vfloat32mf2_t vd,
                                             vfloat16mf4_t vs2,
                                             vfloat16mf4_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwadd_vf_f32mf2_rm_tu(vfloat32mf2_t vd,
                                             vfloat16mf4_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwadd_wv_f32mf2_rm_tu(vfloat32mf2_t vd,
                                             vfloat32mf2_t vs2,
                                             vfloat16mf4_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwadd_wf_f32mf2_rm_tu(vfloat32mf2_t vd,
                                             vfloat32mf2_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwadd_vv_f32m1_rm_tu(vfloat32m1_t vd, vfloat16mf2_t vs2,
                                           vfloat16mf2_t vs1, unsigned int frm,
                                           size_t vl);
vfloat32m1_t __riscv_vfwadd_vf_f32m1_rm_tu(vfloat32m1_t vd, vfloat16mf2_t vs2,
                                           _Float16 rs1, unsigned int frm,
                                           size_t vl);
vfloat32m1_t __riscv_vfwadd_wv_f32m1_rm_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                           vfloat16mf2_t vs1, unsigned int frm,
                                           size_t vl);
vfloat32m1_t __riscv_vfwadd_wf_f32m1_rm_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                           _Float16 rs1, unsigned int frm,
                                           size_t vl);
// __riscv_vfwadd_{vv,vf,wv,wf}_f32m{2,4,8}_rm_tu: unmasked prototypes (no vm
// parameter) whose result and vd are vfloat32 vectors.
//   vv: vs2 and vs1 are both vfloat16 vectors
//   vf: vs2 is a vfloat16 vector, rs1 is a _Float16 scalar
//   wv: vs2 has the result's vfloat32 type, vs1 is a vfloat16 vector
//   wf: vs2 has the result's vfloat32 type, rs1 is a _Float16 scalar
// Every variant also takes `unsigned int frm` and `size_t vl`.
// NOTE(review): `_rm` presumably marks frm as an explicit rounding mode and
// `_tu` a tail-undisturbed policy with vd as pass-through — confirm against
// the RVV intrinsics specification.

// vfloat32m2_t result; narrow vector operands are vfloat16m1_t.
vfloat32m2_t __riscv_vfwadd_vv_f32m2_rm_tu(vfloat32m2_t vd, vfloat16m1_t vs2,
                                           vfloat16m1_t vs1, unsigned int frm,
                                           size_t vl);
vfloat32m2_t __riscv_vfwadd_vf_f32m2_rm_tu(vfloat32m2_t vd, vfloat16m1_t vs2,
                                           _Float16 rs1, unsigned int frm,
                                           size_t vl);
vfloat32m2_t __riscv_vfwadd_wv_f32m2_rm_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                           vfloat16m1_t vs1, unsigned int frm,
                                           size_t vl);
vfloat32m2_t __riscv_vfwadd_wf_f32m2_rm_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                           _Float16 rs1, unsigned int frm,
                                           size_t vl);
// vfloat32m4_t result; narrow vector operands are vfloat16m2_t.
vfloat32m4_t __riscv_vfwadd_vv_f32m4_rm_tu(vfloat32m4_t vd, vfloat16m2_t vs2,
                                           vfloat16m2_t vs1, unsigned int frm,
                                           size_t vl);
vfloat32m4_t __riscv_vfwadd_vf_f32m4_rm_tu(vfloat32m4_t vd, vfloat16m2_t vs2,
                                           _Float16 rs1, unsigned int frm,
                                           size_t vl);
vfloat32m4_t __riscv_vfwadd_wv_f32m4_rm_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                           vfloat16m2_t vs1, unsigned int frm,
                                           size_t vl);
vfloat32m4_t __riscv_vfwadd_wf_f32m4_rm_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                           _Float16 rs1, unsigned int frm,
                                           size_t vl);
// vfloat32m8_t result; narrow vector operands are vfloat16m4_t.
vfloat32m8_t __riscv_vfwadd_vv_f32m8_rm_tu(vfloat32m8_t vd, vfloat16m4_t vs2,
                                           vfloat16m4_t vs1, unsigned int frm,
                                           size_t vl);
vfloat32m8_t __riscv_vfwadd_vf_f32m8_rm_tu(vfloat32m8_t vd, vfloat16m4_t vs2,
                                           _Float16 rs1, unsigned int frm,
                                           size_t vl);
vfloat32m8_t __riscv_vfwadd_wv_f32m8_rm_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                           vfloat16m4_t vs1, unsigned int frm,
                                           size_t vl);
vfloat32m8_t __riscv_vfwadd_wf_f32m8_rm_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                           _Float16 rs1, unsigned int frm,
                                           size_t vl);
// __riscv_vfwadd_{vv,vf,wv,wf}_f64m{1,2,4,8}_rm_tu: unmasked prototypes (no vm
// parameter) whose result and vd are vfloat64 vectors.
//   vv: vs2 and vs1 are both vfloat32 vectors
//   vf: vs2 is a vfloat32 vector, rs1 is a float scalar
//   wv: vs2 has the result's vfloat64 type, vs1 is a vfloat32 vector
//   wf: vs2 has the result's vfloat64 type, rs1 is a float scalar
// Every variant also takes `unsigned int frm` and `size_t vl`.
// NOTE(review): `_rm` presumably marks frm as an explicit rounding mode and
// `_tu` a tail-undisturbed policy with vd as pass-through — confirm against
// the RVV intrinsics specification.

// vfloat64m1_t result; narrow vector operands are vfloat32mf2_t.
vfloat64m1_t __riscv_vfwadd_vv_f64m1_rm_tu(vfloat64m1_t vd, vfloat32mf2_t vs2,
                                           vfloat32mf2_t vs1, unsigned int frm,
                                           size_t vl);
vfloat64m1_t __riscv_vfwadd_vf_f64m1_rm_tu(vfloat64m1_t vd, vfloat32mf2_t vs2,
                                           float rs1, unsigned int frm,
                                           size_t vl);
vfloat64m1_t __riscv_vfwadd_wv_f64m1_rm_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                           vfloat32mf2_t vs1, unsigned int frm,
                                           size_t vl);
vfloat64m1_t __riscv_vfwadd_wf_f64m1_rm_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                           float rs1, unsigned int frm,
                                           size_t vl);
// vfloat64m2_t result; narrow vector operands are vfloat32m1_t.
vfloat64m2_t __riscv_vfwadd_vv_f64m2_rm_tu(vfloat64m2_t vd, vfloat32m1_t vs2,
                                           vfloat32m1_t vs1, unsigned int frm,
                                           size_t vl);
vfloat64m2_t __riscv_vfwadd_vf_f64m2_rm_tu(vfloat64m2_t vd, vfloat32m1_t vs2,
                                           float rs1, unsigned int frm,
                                           size_t vl);
vfloat64m2_t __riscv_vfwadd_wv_f64m2_rm_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                           vfloat32m1_t vs1, unsigned int frm,
                                           size_t vl);
vfloat64m2_t __riscv_vfwadd_wf_f64m2_rm_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                           float rs1, unsigned int frm,
                                           size_t vl);
// vfloat64m4_t result; narrow vector operands are vfloat32m2_t.
vfloat64m4_t __riscv_vfwadd_vv_f64m4_rm_tu(vfloat64m4_t vd, vfloat32m2_t vs2,
                                           vfloat32m2_t vs1, unsigned int frm,
                                           size_t vl);
vfloat64m4_t __riscv_vfwadd_vf_f64m4_rm_tu(vfloat64m4_t vd, vfloat32m2_t vs2,
                                           float rs1, unsigned int frm,
                                           size_t vl);
vfloat64m4_t __riscv_vfwadd_wv_f64m4_rm_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                           vfloat32m2_t vs1, unsigned int frm,
                                           size_t vl);
vfloat64m4_t __riscv_vfwadd_wf_f64m4_rm_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                           float rs1, unsigned int frm,
                                           size_t vl);
// vfloat64m8_t result; narrow vector operands are vfloat32m4_t.
vfloat64m8_t __riscv_vfwadd_vv_f64m8_rm_tu(vfloat64m8_t vd, vfloat32m4_t vs2,
                                           vfloat32m4_t vs1, unsigned int frm,
                                           size_t vl);
vfloat64m8_t __riscv_vfwadd_vf_f64m8_rm_tu(vfloat64m8_t vd, vfloat32m4_t vs2,
                                           float rs1, unsigned int frm,
                                           size_t vl);
vfloat64m8_t __riscv_vfwadd_wv_f64m8_rm_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                           vfloat32m4_t vs1, unsigned int frm,
                                           size_t vl);
vfloat64m8_t __riscv_vfwadd_wf_f64m8_rm_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                           float rs1, unsigned int frm,
                                           size_t vl);
// __riscv_vfwsub_{vv,vf,wv,wf}_f32{mf2,m1,m2,m4,m8}_rm_tu: unmasked prototypes
// (no vm parameter) whose result and vd are vfloat32 vectors.
//   vv: vs2 and vs1 are both vfloat16 vectors
//   vf: vs2 is a vfloat16 vector, rs1 is a _Float16 scalar
//   wv: vs2 has the result's vfloat32 type, vs1 is a vfloat16 vector
//   wf: vs2 has the result's vfloat32 type, rs1 is a _Float16 scalar
// Every variant also takes `unsigned int frm` and `size_t vl`.
// NOTE(review): `_rm` presumably marks frm as an explicit rounding mode and
// `_tu` a tail-undisturbed policy with vd as pass-through; operand order of
// the subtraction is not visible here — confirm against the RVV intrinsics
// specification.

// vfloat32mf2_t result; narrow vector operands are vfloat16mf4_t.
vfloat32mf2_t __riscv_vfwsub_vv_f32mf2_rm_tu(vfloat32mf2_t vd,
                                             vfloat16mf4_t vs2,
                                             vfloat16mf4_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwsub_vf_f32mf2_rm_tu(vfloat32mf2_t vd,
                                             vfloat16mf4_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwsub_wv_f32mf2_rm_tu(vfloat32mf2_t vd,
                                             vfloat32mf2_t vs2,
                                             vfloat16mf4_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwsub_wf_f32mf2_rm_tu(vfloat32mf2_t vd,
                                             vfloat32mf2_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
// vfloat32m1_t result; narrow vector operands are vfloat16mf2_t.
vfloat32m1_t __riscv_vfwsub_vv_f32m1_rm_tu(vfloat32m1_t vd, vfloat16mf2_t vs2,
                                           vfloat16mf2_t vs1, unsigned int frm,
                                           size_t vl);
vfloat32m1_t __riscv_vfwsub_vf_f32m1_rm_tu(vfloat32m1_t vd, vfloat16mf2_t vs2,
                                           _Float16 rs1, unsigned int frm,
                                           size_t vl);
vfloat32m1_t __riscv_vfwsub_wv_f32m1_rm_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                           vfloat16mf2_t vs1, unsigned int frm,
                                           size_t vl);
vfloat32m1_t __riscv_vfwsub_wf_f32m1_rm_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                           _Float16 rs1, unsigned int frm,
                                           size_t vl);
// vfloat32m2_t result; narrow vector operands are vfloat16m1_t.
vfloat32m2_t __riscv_vfwsub_vv_f32m2_rm_tu(vfloat32m2_t vd, vfloat16m1_t vs2,
                                           vfloat16m1_t vs1, unsigned int frm,
                                           size_t vl);
vfloat32m2_t __riscv_vfwsub_vf_f32m2_rm_tu(vfloat32m2_t vd, vfloat16m1_t vs2,
                                           _Float16 rs1, unsigned int frm,
                                           size_t vl);
vfloat32m2_t __riscv_vfwsub_wv_f32m2_rm_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                           vfloat16m1_t vs1, unsigned int frm,
                                           size_t vl);
vfloat32m2_t __riscv_vfwsub_wf_f32m2_rm_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                           _Float16 rs1, unsigned int frm,
                                           size_t vl);
// vfloat32m4_t result; narrow vector operands are vfloat16m2_t.
vfloat32m4_t __riscv_vfwsub_vv_f32m4_rm_tu(vfloat32m4_t vd, vfloat16m2_t vs2,
                                           vfloat16m2_t vs1, unsigned int frm,
                                           size_t vl);
vfloat32m4_t __riscv_vfwsub_vf_f32m4_rm_tu(vfloat32m4_t vd, vfloat16m2_t vs2,
                                           _Float16 rs1, unsigned int frm,
                                           size_t vl);
vfloat32m4_t __riscv_vfwsub_wv_f32m4_rm_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                           vfloat16m2_t vs1, unsigned int frm,
                                           size_t vl);
vfloat32m4_t __riscv_vfwsub_wf_f32m4_rm_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                           _Float16 rs1, unsigned int frm,
                                           size_t vl);
// vfloat32m8_t result; narrow vector operands are vfloat16m4_t.
vfloat32m8_t __riscv_vfwsub_vv_f32m8_rm_tu(vfloat32m8_t vd, vfloat16m4_t vs2,
                                           vfloat16m4_t vs1, unsigned int frm,
                                           size_t vl);
vfloat32m8_t __riscv_vfwsub_vf_f32m8_rm_tu(vfloat32m8_t vd, vfloat16m4_t vs2,
                                           _Float16 rs1, unsigned int frm,
                                           size_t vl);
vfloat32m8_t __riscv_vfwsub_wv_f32m8_rm_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                           vfloat16m4_t vs1, unsigned int frm,
                                           size_t vl);
vfloat32m8_t __riscv_vfwsub_wf_f32m8_rm_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                           _Float16 rs1, unsigned int frm,
                                           size_t vl);
// __riscv_vfwsub_{vv,vf,wv,wf}_f64m{1,2,4,8}_rm_tu: unmasked prototypes (no vm
// parameter) whose result and vd are vfloat64 vectors.
//   vv: vs2 and vs1 are both vfloat32 vectors
//   vf: vs2 is a vfloat32 vector, rs1 is a float scalar
//   wv: vs2 has the result's vfloat64 type, vs1 is a vfloat32 vector
//   wf: vs2 has the result's vfloat64 type, rs1 is a float scalar
// Every variant also takes `unsigned int frm` and `size_t vl`.
// NOTE(review): `_rm` presumably marks frm as an explicit rounding mode and
// `_tu` a tail-undisturbed policy with vd as pass-through; operand order of
// the subtraction is not visible here — confirm against the RVV intrinsics
// specification.

// vfloat64m1_t result; narrow vector operands are vfloat32mf2_t.
vfloat64m1_t __riscv_vfwsub_vv_f64m1_rm_tu(vfloat64m1_t vd, vfloat32mf2_t vs2,
                                           vfloat32mf2_t vs1, unsigned int frm,
                                           size_t vl);
vfloat64m1_t __riscv_vfwsub_vf_f64m1_rm_tu(vfloat64m1_t vd, vfloat32mf2_t vs2,
                                           float rs1, unsigned int frm,
                                           size_t vl);
vfloat64m1_t __riscv_vfwsub_wv_f64m1_rm_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                           vfloat32mf2_t vs1, unsigned int frm,
                                           size_t vl);
vfloat64m1_t __riscv_vfwsub_wf_f64m1_rm_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                           float rs1, unsigned int frm,
                                           size_t vl);
// vfloat64m2_t result; narrow vector operands are vfloat32m1_t.
vfloat64m2_t __riscv_vfwsub_vv_f64m2_rm_tu(vfloat64m2_t vd, vfloat32m1_t vs2,
                                           vfloat32m1_t vs1, unsigned int frm,
                                           size_t vl);
vfloat64m2_t __riscv_vfwsub_vf_f64m2_rm_tu(vfloat64m2_t vd, vfloat32m1_t vs2,
                                           float rs1, unsigned int frm,
                                           size_t vl);
vfloat64m2_t __riscv_vfwsub_wv_f64m2_rm_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                           vfloat32m1_t vs1, unsigned int frm,
                                           size_t vl);
vfloat64m2_t __riscv_vfwsub_wf_f64m2_rm_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                           float rs1, unsigned int frm,
                                           size_t vl);
// vfloat64m4_t result; narrow vector operands are vfloat32m2_t.
vfloat64m4_t __riscv_vfwsub_vv_f64m4_rm_tu(vfloat64m4_t vd, vfloat32m2_t vs2,
                                           vfloat32m2_t vs1, unsigned int frm,
                                           size_t vl);
vfloat64m4_t __riscv_vfwsub_vf_f64m4_rm_tu(vfloat64m4_t vd, vfloat32m2_t vs2,
                                           float rs1, unsigned int frm,
                                           size_t vl);
vfloat64m4_t __riscv_vfwsub_wv_f64m4_rm_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                           vfloat32m2_t vs1, unsigned int frm,
                                           size_t vl);
vfloat64m4_t __riscv_vfwsub_wf_f64m4_rm_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                           float rs1, unsigned int frm,
                                           size_t vl);
// vfloat64m8_t result; narrow vector operands are vfloat32m4_t.
vfloat64m8_t __riscv_vfwsub_vv_f64m8_rm_tu(vfloat64m8_t vd, vfloat32m4_t vs2,
                                           vfloat32m4_t vs1, unsigned int frm,
                                           size_t vl);
vfloat64m8_t __riscv_vfwsub_vf_f64m8_rm_tu(vfloat64m8_t vd, vfloat32m4_t vs2,
                                           float rs1, unsigned int frm,
                                           size_t vl);
vfloat64m8_t __riscv_vfwsub_wv_f64m8_rm_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                           vfloat32m4_t vs1, unsigned int frm,
                                           size_t vl);
vfloat64m8_t __riscv_vfwsub_wf_f64m8_rm_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                           float rs1, unsigned int frm,
                                           size_t vl);
// masked functions (_tum variants: each takes a leading mask operand vm)
// __riscv_vfwadd_{vv,vf,wv,wf}_f32{mf2,m1,m2,m4,m8}_rm_tum: prototypes with a
// leading vbool mask `vm`, whose result and vd are vfloat32 vectors.
//   vv: vs2 and vs1 are both vfloat16 vectors
//   vf: vs2 is a vfloat16 vector, rs1 is a _Float16 scalar
//   wv: vs2 has the result's vfloat32 type, vs1 is a vfloat16 vector
//   wf: vs2 has the result's vfloat32 type, rs1 is a _Float16 scalar
// Every variant also takes `unsigned int frm` and `size_t vl`.
// NOTE(review): `_rm` presumably marks frm as an explicit rounding mode and
// `_tum` a tail-undisturbed / mask-agnostic policy — confirm against the RVV
// intrinsics specification.

// vfloat32mf2_t result, vbool64_t mask; narrow operands are vfloat16mf4_t.
vfloat32mf2_t __riscv_vfwadd_vv_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat16mf4_t vs2,
                                              vfloat16mf4_t vs1,
                                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwadd_vf_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat16mf4_t vs2, _Float16 rs1,
                                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwadd_wv_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat32mf2_t vs2,
                                              vfloat16mf4_t vs1,
                                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwadd_wf_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat32mf2_t vs2, _Float16 rs1,
                                              unsigned int frm, size_t vl);
// vfloat32m1_t result, vbool32_t mask; narrow operands are vfloat16mf2_t.
vfloat32m1_t __riscv_vfwadd_vv_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat16mf2_t vs2,
                                            vfloat16mf2_t vs1, unsigned int frm,
                                            size_t vl);
vfloat32m1_t __riscv_vfwadd_vf_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat16mf2_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwadd_wv_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat32m1_t vs2, vfloat16mf2_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwadd_wf_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat32m1_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
// vfloat32m2_t result, vbool16_t mask; narrow operands are vfloat16m1_t.
vfloat32m2_t __riscv_vfwadd_vv_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat16m1_t vs2, vfloat16m1_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwadd_vf_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat16m1_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwadd_wv_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat32m2_t vs2, vfloat16m1_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwadd_wf_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat32m2_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
// vfloat32m4_t result, vbool8_t mask; narrow operands are vfloat16m2_t.
vfloat32m4_t __riscv_vfwadd_vv_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat16m2_t vs2, vfloat16m2_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwadd_vf_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat16m2_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwadd_wv_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat32m4_t vs2, vfloat16m2_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwadd_wf_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat32m4_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
// vfloat32m8_t result, vbool4_t mask; narrow operands are vfloat16m4_t.
vfloat32m8_t __riscv_vfwadd_vv_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat16m4_t vs2, vfloat16m4_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwadd_vf_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat16m4_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwadd_wv_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat32m8_t vs2, vfloat16m4_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwadd_wf_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat32m8_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
// __riscv_vfwadd_{vv,vf,wv,wf}_f64m{1,2,4,8}_rm_tum: prototypes with a leading
// vbool mask `vm`, whose result and vd are vfloat64 vectors.
//   vv: vs2 and vs1 are both vfloat32 vectors
//   vf: vs2 is a vfloat32 vector, rs1 is a float scalar
//   wv: vs2 has the result's vfloat64 type, vs1 is a vfloat32 vector
//   wf: vs2 has the result's vfloat64 type, rs1 is a float scalar
// Every variant also takes `unsigned int frm` and `size_t vl`.
// NOTE(review): `_rm` presumably marks frm as an explicit rounding mode and
// `_tum` a tail-undisturbed / mask-agnostic policy — confirm against the RVV
// intrinsics specification.

// vfloat64m1_t result, vbool64_t mask; narrow operands are vfloat32mf2_t.
vfloat64m1_t __riscv_vfwadd_vv_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat32mf2_t vs2,
                                            vfloat32mf2_t vs1, unsigned int frm,
                                            size_t vl);
vfloat64m1_t __riscv_vfwadd_vf_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat32mf2_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwadd_wv_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat64m1_t vs2, vfloat32mf2_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwadd_wf_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat64m1_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
// vfloat64m2_t result, vbool32_t mask; narrow operands are vfloat32m1_t.
vfloat64m2_t __riscv_vfwadd_vv_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat32m1_t vs2, vfloat32m1_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwadd_vf_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat32m1_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwadd_wv_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat64m2_t vs2, vfloat32m1_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwadd_wf_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat64m2_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
// vfloat64m4_t result, vbool16_t mask; narrow operands are vfloat32m2_t.
vfloat64m4_t __riscv_vfwadd_vv_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat32m2_t vs2, vfloat32m2_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwadd_vf_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat32m2_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwadd_wv_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat64m4_t vs2, vfloat32m2_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwadd_wf_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat64m4_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
// vfloat64m8_t result, vbool8_t mask; narrow operands are vfloat32m4_t.
vfloat64m8_t __riscv_vfwadd_vv_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat32m4_t vs2, vfloat32m4_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwadd_vf_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat32m4_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwadd_wv_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat64m8_t vs2, vfloat32m4_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwadd_wf_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat64m8_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
// __riscv_vfwsub_{vv,vf,wv,wf}_f32{mf2,m1,m2,m4,m8}_rm_tum: prototypes with a
// leading vbool mask `vm`, whose result and vd are vfloat32 vectors.
//   vv: vs2 and vs1 are both vfloat16 vectors
//   vf: vs2 is a vfloat16 vector, rs1 is a _Float16 scalar
//   wv: vs2 has the result's vfloat32 type, vs1 is a vfloat16 vector
//   wf: vs2 has the result's vfloat32 type, rs1 is a _Float16 scalar
// Every variant also takes `unsigned int frm` and `size_t vl`.
// NOTE(review): `_rm` presumably marks frm as an explicit rounding mode and
// `_tum` a tail-undisturbed / mask-agnostic policy; operand order of the
// subtraction is not visible here — confirm against the RVV intrinsics
// specification.

// vfloat32mf2_t result, vbool64_t mask; narrow operands are vfloat16mf4_t.
vfloat32mf2_t __riscv_vfwsub_vv_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat16mf4_t vs2,
                                              vfloat16mf4_t vs1,
                                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwsub_vf_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat16mf4_t vs2, _Float16 rs1,
                                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwsub_wv_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat32mf2_t vs2,
                                              vfloat16mf4_t vs1,
                                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwsub_wf_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat32mf2_t vs2, _Float16 rs1,
                                              unsigned int frm, size_t vl);
// vfloat32m1_t result, vbool32_t mask; narrow operands are vfloat16mf2_t.
vfloat32m1_t __riscv_vfwsub_vv_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat16mf2_t vs2,
                                            vfloat16mf2_t vs1, unsigned int frm,
                                            size_t vl);
vfloat32m1_t __riscv_vfwsub_vf_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat16mf2_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwsub_wv_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat32m1_t vs2, vfloat16mf2_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwsub_wf_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat32m1_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
// vfloat32m2_t result, vbool16_t mask; narrow operands are vfloat16m1_t.
vfloat32m2_t __riscv_vfwsub_vv_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat16m1_t vs2, vfloat16m1_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwsub_vf_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat16m1_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwsub_wv_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat32m2_t vs2, vfloat16m1_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwsub_wf_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat32m2_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
// vfloat32m4_t result, vbool8_t mask; narrow operands are vfloat16m2_t.
vfloat32m4_t __riscv_vfwsub_vv_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat16m2_t vs2, vfloat16m2_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwsub_vf_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat16m2_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwsub_wv_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat32m4_t vs2, vfloat16m2_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwsub_wf_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat32m4_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
// vfloat32m8_t result, vbool4_t mask; narrow operands are vfloat16m4_t.
vfloat32m8_t __riscv_vfwsub_vv_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat16m4_t vs2, vfloat16m4_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwsub_vf_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat16m4_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwsub_wv_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat32m8_t vs2, vfloat16m4_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwsub_wf_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat32m8_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
// __riscv_vfwsub_{vv,vf,wv,wf}_f64m{1,2,4,8}_rm_tum: prototypes with a leading
// vbool mask `vm`, whose result and vd are vfloat64 vectors.
//   vv: vs2 and vs1 are both vfloat32 vectors
//   vf: vs2 is a vfloat32 vector, rs1 is a float scalar
//   wv: vs2 has the result's vfloat64 type, vs1 is a vfloat32 vector
//   wf: vs2 has the result's vfloat64 type, rs1 is a float scalar
// Every variant also takes `unsigned int frm` and `size_t vl`.
// NOTE(review): `_rm` presumably marks frm as an explicit rounding mode and
// `_tum` a tail-undisturbed / mask-agnostic policy; operand order of the
// subtraction is not visible here — confirm against the RVV intrinsics
// specification.

// vfloat64m1_t result, vbool64_t mask; narrow operands are vfloat32mf2_t.
vfloat64m1_t __riscv_vfwsub_vv_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat32mf2_t vs2,
                                            vfloat32mf2_t vs1, unsigned int frm,
                                            size_t vl);
vfloat64m1_t __riscv_vfwsub_vf_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat32mf2_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwsub_wv_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat64m1_t vs2, vfloat32mf2_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwsub_wf_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat64m1_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
// vfloat64m2_t result, vbool32_t mask; narrow operands are vfloat32m1_t.
vfloat64m2_t __riscv_vfwsub_vv_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat32m1_t vs2, vfloat32m1_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwsub_vf_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat32m1_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwsub_wv_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat64m2_t vs2, vfloat32m1_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwsub_wf_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat64m2_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
// vfloat64m4_t result, vbool16_t mask; narrow operands are vfloat32m2_t.
vfloat64m4_t __riscv_vfwsub_vv_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat32m2_t vs2, vfloat32m2_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwsub_vf_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat32m2_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwsub_wv_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat64m4_t vs2, vfloat32m2_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwsub_wf_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat64m4_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
// vfloat64m8_t result, vbool8_t mask; narrow operands are vfloat32m4_t.
vfloat64m8_t __riscv_vfwsub_vv_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat32m4_t vs2, vfloat32m4_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwsub_vf_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat32m4_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwsub_wv_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat64m8_t vs2, vfloat32m4_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwsub_wf_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat64m8_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
// masked functions, _tumu policy (tail-undisturbed, mask-undisturbed)
vfloat32mf2_t __riscv_vfwadd_vv_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                               vfloat16mf4_t vs2,
                                               vfloat16mf4_t vs1,
                                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwadd_vf_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                               vfloat16mf4_t vs2, _Float16 rs1,
                                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwadd_wv_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                               vfloat32mf2_t vs2,
                                               vfloat16mf4_t vs1,
                                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwadd_wf_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                               vfloat32mf2_t vs2, _Float16 rs1,
                                               unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwadd_vv_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                             vfloat16mf2_t vs2,
                                             vfloat16mf2_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwadd_vf_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                             vfloat16mf2_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwadd_wv_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                             vfloat32m1_t vs2,
                                             vfloat16mf2_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwadd_wf_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                             vfloat32m1_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwadd_vv_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                             vfloat16m1_t vs2, vfloat16m1_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwadd_vf_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                             vfloat16m1_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwadd_wv_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                             vfloat32m2_t vs2, vfloat16m1_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwadd_wf_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                             vfloat32m2_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwadd_vv_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                             vfloat16m2_t vs2, vfloat16m2_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwadd_vf_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                             vfloat16m2_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwadd_wv_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                             vfloat32m4_t vs2, vfloat16m2_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwadd_wf_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                             vfloat32m4_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwadd_vv_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                             vfloat16m4_t vs2, vfloat16m4_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwadd_vf_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                             vfloat16m4_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwadd_wv_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                             vfloat32m8_t vs2, vfloat16m4_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwadd_wf_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                             vfloat32m8_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwadd_vv_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                             vfloat32mf2_t vs2,
                                             vfloat32mf2_t vs1,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwadd_vf_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                             vfloat32mf2_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwadd_wv_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                             vfloat64m1_t vs2,
                                             vfloat32mf2_t vs1,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwadd_wf_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                             vfloat64m1_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwadd_vv_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                             vfloat32m1_t vs2, vfloat32m1_t vs1,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwadd_vf_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                             vfloat32m1_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwadd_wv_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                             vfloat64m2_t vs2, vfloat32m1_t vs1,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwadd_wf_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                             vfloat64m2_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwadd_vv_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                             vfloat32m2_t vs2, vfloat32m2_t vs1,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwadd_vf_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                             vfloat32m2_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwadd_wv_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                             vfloat64m4_t vs2, vfloat32m2_t vs1,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwadd_wf_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                             vfloat64m4_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwadd_vv_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                             vfloat32m4_t vs2, vfloat32m4_t vs1,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwadd_vf_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                             vfloat32m4_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwadd_wv_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                             vfloat64m8_t vs2, vfloat32m4_t vs1,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwadd_wf_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                             vfloat64m8_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwsub_vv_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                               vfloat16mf4_t vs2,
                                               vfloat16mf4_t vs1,
                                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwsub_vf_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                               vfloat16mf4_t vs2, _Float16 rs1,
                                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwsub_wv_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                               vfloat32mf2_t vs2,
                                               vfloat16mf4_t vs1,
                                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwsub_wf_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                               vfloat32mf2_t vs2, _Float16 rs1,
                                               unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwsub_vv_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                             vfloat16mf2_t vs2,
                                             vfloat16mf2_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwsub_vf_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                             vfloat16mf2_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwsub_wv_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                             vfloat32m1_t vs2,
                                             vfloat16mf2_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwsub_wf_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                             vfloat32m1_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwsub_vv_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                             vfloat16m1_t vs2, vfloat16m1_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwsub_vf_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                             vfloat16m1_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwsub_wv_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                             vfloat32m2_t vs2, vfloat16m1_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwsub_wf_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                             vfloat32m2_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwsub_vv_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                             vfloat16m2_t vs2, vfloat16m2_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwsub_vf_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                             vfloat16m2_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwsub_wv_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                             vfloat32m4_t vs2, vfloat16m2_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwsub_wf_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                             vfloat32m4_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwsub_vv_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                             vfloat16m4_t vs2, vfloat16m4_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwsub_vf_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                             vfloat16m4_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwsub_wv_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                             vfloat32m8_t vs2, vfloat16m4_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwsub_wf_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                             vfloat32m8_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwsub_vv_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                             vfloat32mf2_t vs2,
                                             vfloat32mf2_t vs1,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwsub_vf_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                             vfloat32mf2_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwsub_wv_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                             vfloat64m1_t vs2,
                                             vfloat32mf2_t vs1,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwsub_wf_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                             vfloat64m1_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwsub_vv_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                             vfloat32m1_t vs2, vfloat32m1_t vs1,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwsub_vf_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                             vfloat32m1_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwsub_wv_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                             vfloat64m2_t vs2, vfloat32m1_t vs1,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwsub_wf_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                             vfloat64m2_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwsub_vv_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                             vfloat32m2_t vs2, vfloat32m2_t vs1,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwsub_vf_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                             vfloat32m2_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwsub_wv_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                             vfloat64m4_t vs2, vfloat32m2_t vs1,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwsub_wf_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                             vfloat64m4_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwsub_vv_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                             vfloat32m4_t vs2, vfloat32m4_t vs1,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwsub_vf_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                             vfloat32m4_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwsub_wv_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                             vfloat64m8_t vs2, vfloat32m4_t vs1,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwsub_wf_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                             vfloat64m8_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
// masked functions, _mu policy (tail-agnostic, mask-undisturbed)
vfloat32mf2_t __riscv_vfwadd_vv_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat16mf4_t vs2,
                                             vfloat16mf4_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwadd_vf_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat16mf4_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwadd_wv_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat32mf2_t vs2,
                                             vfloat16mf4_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwadd_wf_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat32mf2_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwadd_vv_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwadd_vf_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat16mf2_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwadd_wv_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat32m1_t vs2, vfloat16mf2_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwadd_wf_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat32m1_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwadd_vv_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat16m1_t vs2, vfloat16m1_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwadd_vf_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat16m1_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwadd_wv_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat32m2_t vs2, vfloat16m1_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwadd_wf_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat32m2_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwadd_vv_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat16m2_t vs2, vfloat16m2_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwadd_vf_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat16m2_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwadd_wv_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat32m4_t vs2, vfloat16m2_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwadd_wf_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat32m4_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwadd_vv_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat16m4_t vs2, vfloat16m4_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwadd_vf_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat16m4_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwadd_wv_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat32m8_t vs2, vfloat16m4_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwadd_wf_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat32m8_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwadd_vv_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwadd_vf_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat32mf2_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwadd_wv_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat64m1_t vs2, vfloat32mf2_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwadd_wf_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat64m1_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwadd_vv_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat32m1_t vs2, vfloat32m1_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwadd_vf_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat32m1_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwadd_wv_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat64m2_t vs2, vfloat32m1_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwadd_wf_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat64m2_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwadd_vv_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat32m2_t vs2, vfloat32m2_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwadd_vf_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat32m2_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwadd_wv_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat64m4_t vs2, vfloat32m2_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwadd_wf_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat64m4_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwadd_vv_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat32m4_t vs2, vfloat32m4_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwadd_vf_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat32m4_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwadd_wv_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat64m8_t vs2, vfloat32m4_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwadd_wf_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat64m8_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwsub_vv_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat16mf4_t vs2,
                                             vfloat16mf4_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwsub_vf_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat16mf4_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwsub_wv_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat32mf2_t vs2,
                                             vfloat16mf4_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwsub_wf_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat32mf2_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwsub_vv_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwsub_vf_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat16mf2_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwsub_wv_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat32m1_t vs2, vfloat16mf2_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwsub_wf_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat32m1_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwsub_vv_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat16m1_t vs2, vfloat16m1_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwsub_vf_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat16m1_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwsub_wv_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat32m2_t vs2, vfloat16m1_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwsub_wf_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat32m2_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwsub_vv_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat16m2_t vs2, vfloat16m2_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwsub_vf_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat16m2_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwsub_wv_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat32m4_t vs2, vfloat16m2_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwsub_wf_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat32m4_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwsub_vv_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat16m4_t vs2, vfloat16m4_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwsub_vf_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat16m4_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwsub_wv_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat32m8_t vs2, vfloat16m4_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwsub_wf_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat32m8_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwsub_vv_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                           unsigned int frm, size_t vl);
// vfwsub, `_rm_mu` variants producing f64 results from f32 inputs.
// Operand forms, as shown by the parameter types below:
//   _vv: narrow vector vs2, narrow vector vs1
//   _vf: narrow vector vs2, `float` scalar rs1
//   _wv: result-width vector vs2, narrow vector vs1
//   _wf: result-width vector vs2, `float` scalar rs1
// The narrow f32 operand always has half the LMUL of the f64 result
// (f32mf2 -> f64m1, f32m1 -> f64m2, f32m2 -> f64m4, f32m4 -> f64m8).
// Every variant takes a mask `vm`, a `vd` operand of the result type, an
// `unsigned int frm` argument and the vector length `vl`.
// NOTE(review): per the RVV intrinsics naming scheme, `vfwsub` is the widening
// floating-point subtract, `_rm` means `frm` selects the rounding mode, and
// `_mu` is the mask-undisturbed policy (vd presumably supplies the inactive
// elements) -- confirm against the spec.
vfloat64m1_t __riscv_vfwsub_vf_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat32mf2_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwsub_wv_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat64m1_t vs2, vfloat32mf2_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwsub_wf_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat64m1_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwsub_vv_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat32m1_t vs2, vfloat32m1_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwsub_vf_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat32m1_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwsub_wv_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat64m2_t vs2, vfloat32m1_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwsub_wf_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat64m2_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwsub_vv_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat32m2_t vs2, vfloat32m2_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwsub_vf_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat32m2_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwsub_wv_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat64m4_t vs2, vfloat32m2_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwsub_wf_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat64m4_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwsub_vv_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat32m4_t vs2, vfloat32m4_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwsub_vf_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat32m4_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwsub_wv_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat64m8_t vs2, vfloat32m4_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwsub_wf_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat64m8_t vs2, float rs1,
                                           unsigned int frm, size_t vl);

Vector Single-Width Floating-Point Multiply/Divide Intrinsics

// vfmul, `_tu` variants: floating-point multiply with no mask operand.
//   _vv: vector vs2 and vector vs1 of the same type
//   _vf: vector vs2 and a scalar rs1 whose C type matches the element width
//        (_Float16 for f16, float for f32, double for f64)
// `vd` is passed first and has the same type as the return value; `vl` is the
// vector length. One _vv/_vf pair is declared per element width and LMUL.
// NOTE(review): `_tu` is the tail-undisturbed policy in the RVV intrinsics
// naming scheme, with vd presumably providing the tail elements -- confirm
// against the spec.
vfloat16mf4_t __riscv_vfmul_vv_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                         vfloat16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vfmul_vf_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                         _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfmul_vv_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                         vfloat16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vfmul_vf_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                         _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfmul_vv_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                       vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfmul_vf_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                       _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfmul_vv_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                       vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfmul_vf_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                       _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfmul_vv_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                       vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfmul_vf_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                       _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfmul_vv_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                       vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfmul_vf_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                       _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfmul_vv_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                         vfloat32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfmul_vf_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                         float rs1, size_t vl);
vfloat32m1_t __riscv_vfmul_vv_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                       vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfmul_vf_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                       float rs1, size_t vl);
vfloat32m2_t __riscv_vfmul_vv_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                       vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfmul_vf_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                       float rs1, size_t vl);
vfloat32m4_t __riscv_vfmul_vv_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                       vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfmul_vf_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                       float rs1, size_t vl);
vfloat32m8_t __riscv_vfmul_vv_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                       vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfmul_vf_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                       float rs1, size_t vl);
vfloat64m1_t __riscv_vfmul_vv_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                       vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfmul_vf_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                       double rs1, size_t vl);
vfloat64m2_t __riscv_vfmul_vv_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                       vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfmul_vf_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                       double rs1, size_t vl);
vfloat64m4_t __riscv_vfmul_vv_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                       vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfmul_vf_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                       double rs1, size_t vl);
vfloat64m8_t __riscv_vfmul_vv_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                       vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfmul_vf_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                       double rs1, size_t vl);
// vfdiv, `_tu` variants: floating-point divide with no mask operand.
//   _vv: vector vs2 and vector vs1 of the same type
//   _vf: vector vs2 and a scalar rs1 whose C type matches the element width
//        (_Float16 for f16, float for f32, double for f64)
// `vd` is passed first and has the same type as the return value; `vl` is the
// vector length. One _vv/_vf pair is declared per element width and LMUL.
// NOTE(review): in the V extension spec vfdiv computes vs2[i] / vs1[i]
// (or vs2[i] / rs1), i.e. vs2 is the dividend; `_tu` is the tail-undisturbed
// policy -- confirm both against the spec.
vfloat16mf4_t __riscv_vfdiv_vv_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                         vfloat16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vfdiv_vf_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                         _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfdiv_vv_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                         vfloat16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vfdiv_vf_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                         _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfdiv_vv_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                       vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfdiv_vf_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                       _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfdiv_vv_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                       vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfdiv_vf_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                       _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfdiv_vv_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                       vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfdiv_vf_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                       _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfdiv_vv_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                       vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfdiv_vf_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                       _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfdiv_vv_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                         vfloat32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfdiv_vf_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                         float rs1, size_t vl);
vfloat32m1_t __riscv_vfdiv_vv_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                       vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfdiv_vf_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                       float rs1, size_t vl);
vfloat32m2_t __riscv_vfdiv_vv_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                       vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfdiv_vf_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                       float rs1, size_t vl);
vfloat32m4_t __riscv_vfdiv_vv_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                       vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfdiv_vf_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                       float rs1, size_t vl);
vfloat32m8_t __riscv_vfdiv_vv_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                       vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfdiv_vf_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                       float rs1, size_t vl);
vfloat64m1_t __riscv_vfdiv_vv_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                       vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfdiv_vf_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                       double rs1, size_t vl);
vfloat64m2_t __riscv_vfdiv_vv_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                       vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfdiv_vf_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                       double rs1, size_t vl);
vfloat64m4_t __riscv_vfdiv_vv_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                       vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfdiv_vf_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                       double rs1, size_t vl);
vfloat64m8_t __riscv_vfdiv_vv_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                       vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfdiv_vf_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                       double rs1, size_t vl);
// vfrdiv, `_tu` variants: only the vector-scalar (_vf) form is declared.
// Each takes `vd` (same type as the return value), a vector vs2, a scalar rs1
// whose C type matches the element width (_Float16 / float / double), and the
// vector length `vl`. There is no mask operand.
// NOTE(review): in the V extension spec vfrdiv is the reversed divide,
// rs1 / vs2[i] (scalar is the dividend); `_tu` is the tail-undisturbed
// policy -- confirm both against the spec.
vfloat16mf4_t __riscv_vfrdiv_vf_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                          _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfrdiv_vf_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                          _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfrdiv_vf_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                        _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfrdiv_vf_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                        _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfrdiv_vf_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                        _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfrdiv_vf_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                        _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfrdiv_vf_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                          float rs1, size_t vl);
vfloat32m1_t __riscv_vfrdiv_vf_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                        float rs1, size_t vl);
vfloat32m2_t __riscv_vfrdiv_vf_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                        float rs1, size_t vl);
vfloat32m4_t __riscv_vfrdiv_vf_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                        float rs1, size_t vl);
vfloat32m8_t __riscv_vfrdiv_vf_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                        float rs1, size_t vl);
vfloat64m1_t __riscv_vfrdiv_vf_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                        double rs1, size_t vl);
vfloat64m2_t __riscv_vfrdiv_vf_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                        double rs1, size_t vl);
vfloat64m4_t __riscv_vfrdiv_vf_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                        double rs1, size_t vl);
vfloat64m8_t __riscv_vfrdiv_vf_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                        double rs1, size_t vl);
// masked functions (_tum: tail-undisturbed, mask-agnostic)
// vfmul, `_tum` variants: floating-point multiply with a leading mask `vm`.
//   _vv: vector vs2 and vector vs1 of the same type
//   _vf: vector vs2 and a scalar rs1 whose C type matches the element width
//        (_Float16 for f16, float for f32, double for f64)
// `vd` follows the mask and has the same type as the return value; `vl` is the
// vector length.
// The mask type is vboolN_t with N = element width / LMUL, as the declarations
// show (e.g. f16mf4 -> vbool64_t, f32m1 -> vbool32_t, f64m8 -> vbool8_t).
// NOTE(review): `_tum` is the tail-undisturbed, mask-agnostic policy in the
// RVV intrinsics naming scheme -- confirm against the spec.
vfloat16mf4_t __riscv_vfmul_vv_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                          vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                          size_t vl);
vfloat16mf4_t __riscv_vfmul_vf_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                          vfloat16mf4_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16mf2_t __riscv_vfmul_vv_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                          vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                          size_t vl);
vfloat16mf2_t __riscv_vfmul_vf_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                          vfloat16mf2_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16m1_t __riscv_vfmul_vv_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                        vfloat16m1_t vs2, vfloat16m1_t vs1,
                                        size_t vl);
vfloat16m1_t __riscv_vfmul_vf_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                        vfloat16m1_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat16m2_t __riscv_vfmul_vv_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                        vfloat16m2_t vs2, vfloat16m2_t vs1,
                                        size_t vl);
vfloat16m2_t __riscv_vfmul_vf_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                        vfloat16m2_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat16m4_t __riscv_vfmul_vv_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                        vfloat16m4_t vs2, vfloat16m4_t vs1,
                                        size_t vl);
vfloat16m4_t __riscv_vfmul_vf_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                        vfloat16m4_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat16m8_t __riscv_vfmul_vv_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                        vfloat16m8_t vs2, vfloat16m8_t vs1,
                                        size_t vl);
vfloat16m8_t __riscv_vfmul_vf_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                        vfloat16m8_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat32mf2_t __riscv_vfmul_vv_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                          size_t vl);
vfloat32mf2_t __riscv_vfmul_vf_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat32mf2_t vs2, float rs1,
                                          size_t vl);
vfloat32m1_t __riscv_vfmul_vv_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat32m1_t vs2, vfloat32m1_t vs1,
                                        size_t vl);
vfloat32m1_t __riscv_vfmul_vf_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat32m1_t vs2, float rs1, size_t vl);
vfloat32m2_t __riscv_vfmul_vv_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat32m2_t vs2, vfloat32m2_t vs1,
                                        size_t vl);
vfloat32m2_t __riscv_vfmul_vf_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat32m2_t vs2, float rs1, size_t vl);
vfloat32m4_t __riscv_vfmul_vv_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat32m4_t vs2, vfloat32m4_t vs1,
                                        size_t vl);
vfloat32m4_t __riscv_vfmul_vf_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat32m4_t vs2, float rs1, size_t vl);
vfloat32m8_t __riscv_vfmul_vv_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat32m8_t vs2, vfloat32m8_t vs1,
                                        size_t vl);
vfloat32m8_t __riscv_vfmul_vf_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat32m8_t vs2, float rs1, size_t vl);
vfloat64m1_t __riscv_vfmul_vv_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat64m1_t vs2, vfloat64m1_t vs1,
                                        size_t vl);
vfloat64m1_t __riscv_vfmul_vf_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat64m1_t vs2, double rs1,
                                        size_t vl);
vfloat64m2_t __riscv_vfmul_vv_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat64m2_t vs2, vfloat64m2_t vs1,
                                        size_t vl);
vfloat64m2_t __riscv_vfmul_vf_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat64m2_t vs2, double rs1,
                                        size_t vl);
vfloat64m4_t __riscv_vfmul_vv_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat64m4_t vs2, vfloat64m4_t vs1,
                                        size_t vl);
vfloat64m4_t __riscv_vfmul_vf_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat64m4_t vs2, double rs1,
                                        size_t vl);
vfloat64m8_t __riscv_vfmul_vv_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat64m8_t vs2, vfloat64m8_t vs1,
                                        size_t vl);
vfloat64m8_t __riscv_vfmul_vf_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat64m8_t vs2, double rs1,
                                        size_t vl);
// vfdiv, `_tum` variants: floating-point divide with a leading mask `vm`.
//   _vv: vector vs2 and vector vs1 of the same type
//   _vf: vector vs2 and a scalar rs1 whose C type matches the element width
//        (_Float16 for f16, float for f32, double for f64)
// `vd` follows the mask and has the same type as the return value; `vl` is the
// vector length.
// The mask type is vboolN_t with N = element width / LMUL, as the declarations
// show (e.g. f16mf4 -> vbool64_t, f32m1 -> vbool32_t, f64m8 -> vbool8_t).
// NOTE(review): in the V extension spec vfdiv computes vs2[i] / vs1[i]
// (or vs2[i] / rs1); `_tum` is the tail-undisturbed, mask-agnostic policy --
// confirm both against the spec.
vfloat16mf4_t __riscv_vfdiv_vv_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                          vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                          size_t vl);
vfloat16mf4_t __riscv_vfdiv_vf_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                          vfloat16mf4_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16mf2_t __riscv_vfdiv_vv_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                          vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                          size_t vl);
vfloat16mf2_t __riscv_vfdiv_vf_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                          vfloat16mf2_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16m1_t __riscv_vfdiv_vv_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                        vfloat16m1_t vs2, vfloat16m1_t vs1,
                                        size_t vl);
vfloat16m1_t __riscv_vfdiv_vf_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                        vfloat16m1_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat16m2_t __riscv_vfdiv_vv_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                        vfloat16m2_t vs2, vfloat16m2_t vs1,
                                        size_t vl);
vfloat16m2_t __riscv_vfdiv_vf_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                        vfloat16m2_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat16m4_t __riscv_vfdiv_vv_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                        vfloat16m4_t vs2, vfloat16m4_t vs1,
                                        size_t vl);
vfloat16m4_t __riscv_vfdiv_vf_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                        vfloat16m4_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat16m8_t __riscv_vfdiv_vv_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                        vfloat16m8_t vs2, vfloat16m8_t vs1,
                                        size_t vl);
vfloat16m8_t __riscv_vfdiv_vf_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                        vfloat16m8_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat32mf2_t __riscv_vfdiv_vv_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                          size_t vl);
vfloat32mf2_t __riscv_vfdiv_vf_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat32mf2_t vs2, float rs1,
                                          size_t vl);
vfloat32m1_t __riscv_vfdiv_vv_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat32m1_t vs2, vfloat32m1_t vs1,
                                        size_t vl);
vfloat32m1_t __riscv_vfdiv_vf_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat32m1_t vs2, float rs1, size_t vl);
vfloat32m2_t __riscv_vfdiv_vv_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat32m2_t vs2, vfloat32m2_t vs1,
                                        size_t vl);
vfloat32m2_t __riscv_vfdiv_vf_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat32m2_t vs2, float rs1, size_t vl);
vfloat32m4_t __riscv_vfdiv_vv_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat32m4_t vs2, vfloat32m4_t vs1,
                                        size_t vl);
vfloat32m4_t __riscv_vfdiv_vf_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat32m4_t vs2, float rs1, size_t vl);
vfloat32m8_t __riscv_vfdiv_vv_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat32m8_t vs2, vfloat32m8_t vs1,
                                        size_t vl);
vfloat32m8_t __riscv_vfdiv_vf_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat32m8_t vs2, float rs1, size_t vl);
vfloat64m1_t __riscv_vfdiv_vv_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat64m1_t vs2, vfloat64m1_t vs1,
                                        size_t vl);
vfloat64m1_t __riscv_vfdiv_vf_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat64m1_t vs2, double rs1,
                                        size_t vl);
vfloat64m2_t __riscv_vfdiv_vv_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat64m2_t vs2, vfloat64m2_t vs1,
                                        size_t vl);
vfloat64m2_t __riscv_vfdiv_vf_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat64m2_t vs2, double rs1,
                                        size_t vl);
vfloat64m4_t __riscv_vfdiv_vv_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat64m4_t vs2, vfloat64m4_t vs1,
                                        size_t vl);
vfloat64m4_t __riscv_vfdiv_vf_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat64m4_t vs2, double rs1,
                                        size_t vl);
vfloat64m8_t __riscv_vfdiv_vv_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat64m8_t vs2, vfloat64m8_t vs1,
                                        size_t vl);
vfloat64m8_t __riscv_vfdiv_vf_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat64m8_t vs2, double rs1,
                                        size_t vl);
// vfrdiv, `_tum` variants: only the vector-scalar (_vf) form is declared.
// Each takes a mask `vm`, `vd` (same type as the return value), a vector vs2,
// a scalar rs1 whose C type matches the element width (_Float16 / float /
// double), and the vector length `vl`.
// The mask type is vboolN_t with N = element width / LMUL, as the declarations
// show (e.g. f16mf4 -> vbool64_t, f32m1 -> vbool32_t, f64m8 -> vbool8_t).
// NOTE(review): in the V extension spec vfrdiv is the reversed divide,
// rs1 / vs2[i]; `_tum` is the tail-undisturbed, mask-agnostic policy --
// confirm both against the spec.
vfloat16mf4_t __riscv_vfrdiv_vf_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                           vfloat16mf4_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat16mf2_t __riscv_vfrdiv_vf_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                           vfloat16mf2_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat16m1_t __riscv_vfrdiv_vf_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                         vfloat16m1_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m2_t __riscv_vfrdiv_vf_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                         vfloat16m2_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m4_t __riscv_vfrdiv_vf_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                         vfloat16m4_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m8_t __riscv_vfrdiv_vf_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                         vfloat16m8_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat32mf2_t __riscv_vfrdiv_vf_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs2, float rs1,
                                           size_t vl);
vfloat32m1_t __riscv_vfrdiv_vf_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs2, float rs1,
                                         size_t vl);
vfloat32m2_t __riscv_vfrdiv_vf_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs2, float rs1,
                                         size_t vl);
vfloat32m4_t __riscv_vfrdiv_vf_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs2, float rs1,
                                         size_t vl);
vfloat32m8_t __riscv_vfrdiv_vf_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs2, float rs1,
                                         size_t vl);
vfloat64m1_t __riscv_vfrdiv_vf_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs2, double rs1,
                                         size_t vl);
vfloat64m2_t __riscv_vfrdiv_vf_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs2, double rs1,
                                         size_t vl);
vfloat64m4_t __riscv_vfrdiv_vf_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs2, double rs1,
                                         size_t vl);
vfloat64m8_t __riscv_vfrdiv_vf_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs2, double rs1,
                                         size_t vl);
// Masked functions, `_tumu` policy variants.
// `_tumu` is understood to mean tail-undisturbed, mask-undisturbed -- confirm
// against the RVV intrinsics naming scheme.
//
// vfmul: floating-point multiply. `_vv` takes a second vector operand `vs1`;
// `_vf` takes a scalar `rs1` of the element type. `vm` is the mask (vboolN_t
// with N = SEW/LMUL), `vd` is the destination operand carried in for the
// policy, `vl` is the number of elements to process.
vfloat16mf4_t __riscv_vfmul_vv_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                           vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                           size_t vl);
vfloat16mf4_t __riscv_vfmul_vf_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                           vfloat16mf4_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat16mf2_t __riscv_vfmul_vv_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                           vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                           size_t vl);
vfloat16mf2_t __riscv_vfmul_vf_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                           vfloat16mf2_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat16m1_t __riscv_vfmul_vv_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                         vfloat16m1_t vs2, vfloat16m1_t vs1,
                                         size_t vl);
vfloat16m1_t __riscv_vfmul_vf_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                         vfloat16m1_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m2_t __riscv_vfmul_vv_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                         vfloat16m2_t vs2, vfloat16m2_t vs1,
                                         size_t vl);
vfloat16m2_t __riscv_vfmul_vf_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                         vfloat16m2_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m4_t __riscv_vfmul_vv_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                         vfloat16m4_t vs2, vfloat16m4_t vs1,
                                         size_t vl);
vfloat16m4_t __riscv_vfmul_vf_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                         vfloat16m4_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m8_t __riscv_vfmul_vv_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                         vfloat16m8_t vs2, vfloat16m8_t vs1,
                                         size_t vl);
vfloat16m8_t __riscv_vfmul_vf_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                         vfloat16m8_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat32mf2_t __riscv_vfmul_vv_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                           size_t vl);
vfloat32mf2_t __riscv_vfmul_vf_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs2, float rs1,
                                           size_t vl);
vfloat32m1_t __riscv_vfmul_vv_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs2, vfloat32m1_t vs1,
                                         size_t vl);
vfloat32m1_t __riscv_vfmul_vf_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs2, float rs1,
                                         size_t vl);
vfloat32m2_t __riscv_vfmul_vv_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs2, vfloat32m2_t vs1,
                                         size_t vl);
vfloat32m2_t __riscv_vfmul_vf_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs2, float rs1,
                                         size_t vl);
vfloat32m4_t __riscv_vfmul_vv_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs2, vfloat32m4_t vs1,
                                         size_t vl);
vfloat32m4_t __riscv_vfmul_vf_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs2, float rs1,
                                         size_t vl);
vfloat32m8_t __riscv_vfmul_vv_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs2, vfloat32m8_t vs1,
                                         size_t vl);
vfloat32m8_t __riscv_vfmul_vf_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs2, float rs1,
                                         size_t vl);
vfloat64m1_t __riscv_vfmul_vv_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs2, vfloat64m1_t vs1,
                                         size_t vl);
vfloat64m1_t __riscv_vfmul_vf_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs2, double rs1,
                                         size_t vl);
vfloat64m2_t __riscv_vfmul_vv_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs2, vfloat64m2_t vs1,
                                         size_t vl);
vfloat64m2_t __riscv_vfmul_vf_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs2, double rs1,
                                         size_t vl);
vfloat64m4_t __riscv_vfmul_vv_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs2, vfloat64m4_t vs1,
                                         size_t vl);
vfloat64m4_t __riscv_vfmul_vf_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs2, double rs1,
                                         size_t vl);
vfloat64m8_t __riscv_vfmul_vv_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs2, vfloat64m8_t vs1,
                                         size_t vl);
vfloat64m8_t __riscv_vfmul_vf_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs2, double rs1,
                                         size_t vl);
// vfdiv, `_tumu` policy variants. Floating-point divide: per the RVV spec,
// active elements compute vs2[i] / vs1[i] (`_vv`) or vs2[i] / rs1 (`_vf`).
// `vm` is the mask (vboolN_t with N = SEW/LMUL), `vd` is the destination
// operand carried in for the policy, `vl` is the number of elements to process.
vfloat16mf4_t __riscv_vfdiv_vv_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                           vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                           size_t vl);
vfloat16mf4_t __riscv_vfdiv_vf_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                           vfloat16mf4_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat16mf2_t __riscv_vfdiv_vv_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                           vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                           size_t vl);
vfloat16mf2_t __riscv_vfdiv_vf_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                           vfloat16mf2_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat16m1_t __riscv_vfdiv_vv_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                         vfloat16m1_t vs2, vfloat16m1_t vs1,
                                         size_t vl);
vfloat16m1_t __riscv_vfdiv_vf_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                         vfloat16m1_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m2_t __riscv_vfdiv_vv_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                         vfloat16m2_t vs2, vfloat16m2_t vs1,
                                         size_t vl);
vfloat16m2_t __riscv_vfdiv_vf_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                         vfloat16m2_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m4_t __riscv_vfdiv_vv_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                         vfloat16m4_t vs2, vfloat16m4_t vs1,
                                         size_t vl);
vfloat16m4_t __riscv_vfdiv_vf_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                         vfloat16m4_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m8_t __riscv_vfdiv_vv_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                         vfloat16m8_t vs2, vfloat16m8_t vs1,
                                         size_t vl);
vfloat16m8_t __riscv_vfdiv_vf_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                         vfloat16m8_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat32mf2_t __riscv_vfdiv_vv_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                           size_t vl);
vfloat32mf2_t __riscv_vfdiv_vf_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs2, float rs1,
                                           size_t vl);
vfloat32m1_t __riscv_vfdiv_vv_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs2, vfloat32m1_t vs1,
                                         size_t vl);
vfloat32m1_t __riscv_vfdiv_vf_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs2, float rs1,
                                         size_t vl);
vfloat32m2_t __riscv_vfdiv_vv_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs2, vfloat32m2_t vs1,
                                         size_t vl);
vfloat32m2_t __riscv_vfdiv_vf_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs2, float rs1,
                                         size_t vl);
vfloat32m4_t __riscv_vfdiv_vv_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs2, vfloat32m4_t vs1,
                                         size_t vl);
vfloat32m4_t __riscv_vfdiv_vf_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs2, float rs1,
                                         size_t vl);
vfloat32m8_t __riscv_vfdiv_vv_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs2, vfloat32m8_t vs1,
                                         size_t vl);
vfloat32m8_t __riscv_vfdiv_vf_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs2, float rs1,
                                         size_t vl);
vfloat64m1_t __riscv_vfdiv_vv_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs2, vfloat64m1_t vs1,
                                         size_t vl);
vfloat64m1_t __riscv_vfdiv_vf_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs2, double rs1,
                                         size_t vl);
vfloat64m2_t __riscv_vfdiv_vv_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs2, vfloat64m2_t vs1,
                                         size_t vl);
vfloat64m2_t __riscv_vfdiv_vf_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs2, double rs1,
                                         size_t vl);
vfloat64m4_t __riscv_vfdiv_vv_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs2, vfloat64m4_t vs1,
                                         size_t vl);
vfloat64m4_t __riscv_vfdiv_vf_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs2, double rs1,
                                         size_t vl);
vfloat64m8_t __riscv_vfdiv_vv_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs2, vfloat64m8_t vs1,
                                         size_t vl);
vfloat64m8_t __riscv_vfdiv_vf_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs2, double rs1,
                                         size_t vl);
// vfrdiv.vf, `_tumu` policy variants. Reverse divide, scalar form only: per
// the RVV spec, active elements compute rs1 / vs2[i].
// `vm` is the mask (vboolN_t with N = SEW/LMUL), `vd` is the destination
// operand carried in for the policy, `vl` is the number of elements to process.
vfloat16mf4_t __riscv_vfrdiv_vf_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                            vfloat16mf4_t vs2, _Float16 rs1,
                                            size_t vl);
vfloat16mf2_t __riscv_vfrdiv_vf_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                            vfloat16mf2_t vs2, _Float16 rs1,
                                            size_t vl);
vfloat16m1_t __riscv_vfrdiv_vf_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                          vfloat16m1_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16m2_t __riscv_vfrdiv_vf_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                          vfloat16m2_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16m4_t __riscv_vfrdiv_vf_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                          vfloat16m4_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16m8_t __riscv_vfrdiv_vf_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                          vfloat16m8_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat32mf2_t __riscv_vfrdiv_vf_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs2, float rs1,
                                            size_t vl);
vfloat32m1_t __riscv_vfrdiv_vf_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs2, float rs1,
                                          size_t vl);
vfloat32m2_t __riscv_vfrdiv_vf_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs2, float rs1,
                                          size_t vl);
vfloat32m4_t __riscv_vfrdiv_vf_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs2, float rs1,
                                          size_t vl);
vfloat32m8_t __riscv_vfrdiv_vf_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs2, float rs1,
                                          size_t vl);
vfloat64m1_t __riscv_vfrdiv_vf_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs2, double rs1,
                                          size_t vl);
vfloat64m2_t __riscv_vfrdiv_vf_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs2, double rs1,
                                          size_t vl);
vfloat64m4_t __riscv_vfrdiv_vf_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs2, double rs1,
                                          size_t vl);
vfloat64m8_t __riscv_vfrdiv_vf_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs2, double rs1,
                                          size_t vl);
// Masked functions, `_mu` policy variants.
// `_mu` is understood to mean tail-agnostic, mask-undisturbed -- confirm
// against the RVV intrinsics naming scheme.
//
// vfmul: floating-point multiply. `_vv` takes a second vector operand `vs1`;
// `_vf` takes a scalar `rs1` of the element type. `vm` is the mask (vboolN_t
// with N = SEW/LMUL), `vd` is the destination operand carried in for the
// policy, `vl` is the number of elements to process.
vfloat16mf4_t __riscv_vfmul_vv_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                         vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                         size_t vl);
vfloat16mf4_t __riscv_vfmul_vf_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                         vfloat16mf4_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16mf2_t __riscv_vfmul_vv_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                         vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                         size_t vl);
vfloat16mf2_t __riscv_vfmul_vf_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                         vfloat16mf2_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m1_t __riscv_vfmul_vv_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                       vfloat16m1_t vs2, vfloat16m1_t vs1,
                                       size_t vl);
vfloat16m1_t __riscv_vfmul_vf_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                       vfloat16m1_t vs2, _Float16 rs1,
                                       size_t vl);
vfloat16m2_t __riscv_vfmul_vv_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                       vfloat16m2_t vs2, vfloat16m2_t vs1,
                                       size_t vl);
vfloat16m2_t __riscv_vfmul_vf_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                       vfloat16m2_t vs2, _Float16 rs1,
                                       size_t vl);
vfloat16m4_t __riscv_vfmul_vv_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                       vfloat16m4_t vs2, vfloat16m4_t vs1,
                                       size_t vl);
vfloat16m4_t __riscv_vfmul_vf_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                       vfloat16m4_t vs2, _Float16 rs1,
                                       size_t vl);
vfloat16m8_t __riscv_vfmul_vv_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                       vfloat16m8_t vs2, vfloat16m8_t vs1,
                                       size_t vl);
vfloat16m8_t __riscv_vfmul_vf_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                       vfloat16m8_t vs2, _Float16 rs1,
                                       size_t vl);
vfloat32mf2_t __riscv_vfmul_vv_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                         vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                         size_t vl);
vfloat32mf2_t __riscv_vfmul_vf_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                         vfloat32mf2_t vs2, float rs1,
                                         size_t vl);
vfloat32m1_t __riscv_vfmul_vv_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                       vfloat32m1_t vs2, vfloat32m1_t vs1,
                                       size_t vl);
vfloat32m1_t __riscv_vfmul_vf_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                       vfloat32m1_t vs2, float rs1, size_t vl);
vfloat32m2_t __riscv_vfmul_vv_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                       vfloat32m2_t vs2, vfloat32m2_t vs1,
                                       size_t vl);
vfloat32m2_t __riscv_vfmul_vf_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                       vfloat32m2_t vs2, float rs1, size_t vl);
vfloat32m4_t __riscv_vfmul_vv_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                       vfloat32m4_t vs2, vfloat32m4_t vs1,
                                       size_t vl);
vfloat32m4_t __riscv_vfmul_vf_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                       vfloat32m4_t vs2, float rs1, size_t vl);
vfloat32m8_t __riscv_vfmul_vv_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                       vfloat32m8_t vs2, vfloat32m8_t vs1,
                                       size_t vl);
vfloat32m8_t __riscv_vfmul_vf_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                       vfloat32m8_t vs2, float rs1, size_t vl);
vfloat64m1_t __riscv_vfmul_vv_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                       vfloat64m1_t vs2, vfloat64m1_t vs1,
                                       size_t vl);
vfloat64m1_t __riscv_vfmul_vf_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                       vfloat64m1_t vs2, double rs1, size_t vl);
vfloat64m2_t __riscv_vfmul_vv_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                       vfloat64m2_t vs2, vfloat64m2_t vs1,
                                       size_t vl);
vfloat64m2_t __riscv_vfmul_vf_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                       vfloat64m2_t vs2, double rs1, size_t vl);
vfloat64m4_t __riscv_vfmul_vv_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                       vfloat64m4_t vs2, vfloat64m4_t vs1,
                                       size_t vl);
vfloat64m4_t __riscv_vfmul_vf_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                       vfloat64m4_t vs2, double rs1, size_t vl);
vfloat64m8_t __riscv_vfmul_vv_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                       vfloat64m8_t vs2, vfloat64m8_t vs1,
                                       size_t vl);
vfloat64m8_t __riscv_vfmul_vf_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                       vfloat64m8_t vs2, double rs1, size_t vl);
// vfdiv, `_mu` policy variants. Floating-point divide: per the RVV spec,
// active elements compute vs2[i] / vs1[i] (`_vv`) or vs2[i] / rs1 (`_vf`).
// `vm` is the mask (vboolN_t with N = SEW/LMUL), `vd` is the destination
// operand carried in for the policy, `vl` is the number of elements to process.
vfloat16mf4_t __riscv_vfdiv_vv_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                         vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                         size_t vl);
vfloat16mf4_t __riscv_vfdiv_vf_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                         vfloat16mf4_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16mf2_t __riscv_vfdiv_vv_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                         vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                         size_t vl);
vfloat16mf2_t __riscv_vfdiv_vf_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                         vfloat16mf2_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m1_t __riscv_vfdiv_vv_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                       vfloat16m1_t vs2, vfloat16m1_t vs1,
                                       size_t vl);
vfloat16m1_t __riscv_vfdiv_vf_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                       vfloat16m1_t vs2, _Float16 rs1,
                                       size_t vl);
vfloat16m2_t __riscv_vfdiv_vv_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                       vfloat16m2_t vs2, vfloat16m2_t vs1,
                                       size_t vl);
vfloat16m2_t __riscv_vfdiv_vf_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                       vfloat16m2_t vs2, _Float16 rs1,
                                       size_t vl);
vfloat16m4_t __riscv_vfdiv_vv_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                       vfloat16m4_t vs2, vfloat16m4_t vs1,
                                       size_t vl);
vfloat16m4_t __riscv_vfdiv_vf_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                       vfloat16m4_t vs2, _Float16 rs1,
                                       size_t vl);
vfloat16m8_t __riscv_vfdiv_vv_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                       vfloat16m8_t vs2, vfloat16m8_t vs1,
                                       size_t vl);
vfloat16m8_t __riscv_vfdiv_vf_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                       vfloat16m8_t vs2, _Float16 rs1,
                                       size_t vl);
vfloat32mf2_t __riscv_vfdiv_vv_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                         vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                         size_t vl);
vfloat32mf2_t __riscv_vfdiv_vf_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                         vfloat32mf2_t vs2, float rs1,
                                         size_t vl);
vfloat32m1_t __riscv_vfdiv_vv_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                       vfloat32m1_t vs2, vfloat32m1_t vs1,
                                       size_t vl);
vfloat32m1_t __riscv_vfdiv_vf_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                       vfloat32m1_t vs2, float rs1, size_t vl);
vfloat32m2_t __riscv_vfdiv_vv_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                       vfloat32m2_t vs2, vfloat32m2_t vs1,
                                       size_t vl);
vfloat32m2_t __riscv_vfdiv_vf_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                       vfloat32m2_t vs2, float rs1, size_t vl);
vfloat32m4_t __riscv_vfdiv_vv_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                       vfloat32m4_t vs2, vfloat32m4_t vs1,
                                       size_t vl);
vfloat32m4_t __riscv_vfdiv_vf_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                       vfloat32m4_t vs2, float rs1, size_t vl);
vfloat32m8_t __riscv_vfdiv_vv_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                       vfloat32m8_t vs2, vfloat32m8_t vs1,
                                       size_t vl);
vfloat32m8_t __riscv_vfdiv_vf_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                       vfloat32m8_t vs2, float rs1, size_t vl);
vfloat64m1_t __riscv_vfdiv_vv_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                       vfloat64m1_t vs2, vfloat64m1_t vs1,
                                       size_t vl);
vfloat64m1_t __riscv_vfdiv_vf_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                       vfloat64m1_t vs2, double rs1, size_t vl);
vfloat64m2_t __riscv_vfdiv_vv_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                       vfloat64m2_t vs2, vfloat64m2_t vs1,
                                       size_t vl);
vfloat64m2_t __riscv_vfdiv_vf_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                       vfloat64m2_t vs2, double rs1, size_t vl);
vfloat64m4_t __riscv_vfdiv_vv_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                       vfloat64m4_t vs2, vfloat64m4_t vs1,
                                       size_t vl);
vfloat64m4_t __riscv_vfdiv_vf_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                       vfloat64m4_t vs2, double rs1, size_t vl);
vfloat64m8_t __riscv_vfdiv_vv_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                       vfloat64m8_t vs2, vfloat64m8_t vs1,
                                       size_t vl);
vfloat64m8_t __riscv_vfdiv_vf_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                       vfloat64m8_t vs2, double rs1, size_t vl);
// vfrdiv.vf, `_mu` policy variants. Reverse divide, scalar form only: per the
// RVV spec, active elements compute rs1 / vs2[i].
// `vm` is the mask (vboolN_t with N = SEW/LMUL), `vd` is the destination
// operand carried in for the policy, `vl` is the number of elements to process.
vfloat16mf4_t __riscv_vfrdiv_vf_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                          vfloat16mf4_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16mf2_t __riscv_vfrdiv_vf_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                          vfloat16mf2_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16m1_t __riscv_vfrdiv_vf_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                        vfloat16m1_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat16m2_t __riscv_vfrdiv_vf_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                        vfloat16m2_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat16m4_t __riscv_vfrdiv_vf_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                        vfloat16m4_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat16m8_t __riscv_vfrdiv_vf_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                        vfloat16m8_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat32mf2_t __riscv_vfrdiv_vf_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat32mf2_t vs2, float rs1,
                                          size_t vl);
vfloat32m1_t __riscv_vfrdiv_vf_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat32m1_t vs2, float rs1, size_t vl);
vfloat32m2_t __riscv_vfrdiv_vf_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat32m2_t vs2, float rs1, size_t vl);
vfloat32m4_t __riscv_vfrdiv_vf_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat32m4_t vs2, float rs1, size_t vl);
vfloat32m8_t __riscv_vfrdiv_vf_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat32m8_t vs2, float rs1, size_t vl);
vfloat64m1_t __riscv_vfrdiv_vf_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat64m1_t vs2, double rs1,
                                        size_t vl);
vfloat64m2_t __riscv_vfrdiv_vf_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat64m2_t vs2, double rs1,
                                        size_t vl);
vfloat64m4_t __riscv_vfrdiv_vf_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat64m4_t vs2, double rs1,
                                        size_t vl);
vfloat64m8_t __riscv_vfrdiv_vf_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat64m8_t vs2, double rs1,
                                        size_t vl);
// vfmul, `_rm_tu` variants: unmasked (no `vm` parameter) multiply with an
// extra `unsigned int frm` argument placed just before `vl`.
// `frm` presumably selects the floating-point rounding mode and `_tu` is
// understood to mean tail-undisturbed -- confirm against the RVV intrinsics
// specification.
// `_vv` takes a second vector operand `vs1`; `_vf` takes a scalar `rs1` of the
// element type. `vd` is the destination operand carried in for the policy.
vfloat16mf4_t __riscv_vfmul_vv_f16mf4_rm_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                            vfloat16mf4_t vs1, unsigned int frm,
                                            size_t vl);
vfloat16mf4_t __riscv_vfmul_vf_f16mf4_rm_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                            _Float16 rs1, unsigned int frm,
                                            size_t vl);
vfloat16mf2_t __riscv_vfmul_vv_f16mf2_rm_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                            vfloat16mf2_t vs1, unsigned int frm,
                                            size_t vl);
vfloat16mf2_t __riscv_vfmul_vf_f16mf2_rm_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                            _Float16 rs1, unsigned int frm,
                                            size_t vl);
vfloat16m1_t __riscv_vfmul_vv_f16m1_rm_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                          vfloat16m1_t vs1, unsigned int frm,
                                          size_t vl);
vfloat16m1_t __riscv_vfmul_vf_f16m1_rm_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                          _Float16 rs1, unsigned int frm,
                                          size_t vl);
vfloat16m2_t __riscv_vfmul_vv_f16m2_rm_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                          vfloat16m2_t vs1, unsigned int frm,
                                          size_t vl);
vfloat16m2_t __riscv_vfmul_vf_f16m2_rm_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                          _Float16 rs1, unsigned int frm,
                                          size_t vl);
vfloat16m4_t __riscv_vfmul_vv_f16m4_rm_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                          vfloat16m4_t vs1, unsigned int frm,
                                          size_t vl);
vfloat16m4_t __riscv_vfmul_vf_f16m4_rm_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                          _Float16 rs1, unsigned int frm,
                                          size_t vl);
vfloat16m8_t __riscv_vfmul_vv_f16m8_rm_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                          vfloat16m8_t vs1, unsigned int frm,
                                          size_t vl);
vfloat16m8_t __riscv_vfmul_vf_f16m8_rm_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                          _Float16 rs1, unsigned int frm,
                                          size_t vl);
vfloat32mf2_t __riscv_vfmul_vv_f32mf2_rm_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                            vfloat32mf2_t vs1, unsigned int frm,
                                            size_t vl);
vfloat32mf2_t __riscv_vfmul_vf_f32mf2_rm_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                            float rs1, unsigned int frm,
                                            size_t vl);
vfloat32m1_t __riscv_vfmul_vv_f32m1_rm_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                          vfloat32m1_t vs1, unsigned int frm,
                                          size_t vl);
vfloat32m1_t __riscv_vfmul_vf_f32m1_rm_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                          float rs1, unsigned int frm,
                                          size_t vl);
vfloat32m2_t __riscv_vfmul_vv_f32m2_rm_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                          vfloat32m2_t vs1, unsigned int frm,
                                          size_t vl);
vfloat32m2_t __riscv_vfmul_vf_f32m2_rm_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                          float rs1, unsigned int frm,
                                          size_t vl);
vfloat32m4_t __riscv_vfmul_vv_f32m4_rm_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                          vfloat32m4_t vs1, unsigned int frm,
                                          size_t vl);
vfloat32m4_t __riscv_vfmul_vf_f32m4_rm_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                          float rs1, unsigned int frm,
                                          size_t vl);
vfloat32m8_t __riscv_vfmul_vv_f32m8_rm_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                          vfloat32m8_t vs1, unsigned int frm,
                                          size_t vl);
vfloat32m8_t __riscv_vfmul_vf_f32m8_rm_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                          float rs1, unsigned int frm,
                                          size_t vl);
vfloat64m1_t __riscv_vfmul_vv_f64m1_rm_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                          vfloat64m1_t vs1, unsigned int frm,
                                          size_t vl);
vfloat64m1_t __riscv_vfmul_vf_f64m1_rm_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                          double rs1, unsigned int frm,
                                          size_t vl);
vfloat64m2_t __riscv_vfmul_vv_f64m2_rm_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                          vfloat64m2_t vs1, unsigned int frm,
                                          size_t vl);
vfloat64m2_t __riscv_vfmul_vf_f64m2_rm_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                          double rs1, unsigned int frm,
                                          size_t vl);
vfloat64m4_t __riscv_vfmul_vv_f64m4_rm_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                          vfloat64m4_t vs1, unsigned int frm,
                                          size_t vl);
vfloat64m4_t __riscv_vfmul_vf_f64m4_rm_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                          double rs1, unsigned int frm,
                                          size_t vl);
vfloat64m8_t __riscv_vfmul_vv_f64m8_rm_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                          vfloat64m8_t vs1, unsigned int frm,
                                          size_t vl);
vfloat64m8_t __riscv_vfmul_vf_f64m8_rm_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                          double rs1, unsigned int frm,
                                          size_t vl);
// __riscv_vfdiv_{vv,vf}_<type>_rm_tu prototypes, f16mf4 through f64m8.
// Parameter layout: `vd` (same type as the return value), vector source `vs2`,
// then either vector `vs1` (_vv) or scalar `rs1` (_vf; _Float16 / float /
// double matching the element width), followed by `unsigned int frm` and
// `size_t vl`.
// NOTE(review): operand order of the division is presumably vs2 / vs1 (or
// vs2 / rs1), and `_tu` presumably selects the tail-undisturbed policy with
// `vd` as the pass-through value -- confirm against the RVV specifications.
vfloat16mf4_t __riscv_vfdiv_vv_f16mf4_rm_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                            vfloat16mf4_t vs1, unsigned int frm,
                                            size_t vl);
vfloat16mf4_t __riscv_vfdiv_vf_f16mf4_rm_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                            _Float16 rs1, unsigned int frm,
                                            size_t vl);
vfloat16mf2_t __riscv_vfdiv_vv_f16mf2_rm_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                            vfloat16mf2_t vs1, unsigned int frm,
                                            size_t vl);
vfloat16mf2_t __riscv_vfdiv_vf_f16mf2_rm_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                            _Float16 rs1, unsigned int frm,
                                            size_t vl);
vfloat16m1_t __riscv_vfdiv_vv_f16m1_rm_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                          vfloat16m1_t vs1, unsigned int frm,
                                          size_t vl);
vfloat16m1_t __riscv_vfdiv_vf_f16m1_rm_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                          _Float16 rs1, unsigned int frm,
                                          size_t vl);
vfloat16m2_t __riscv_vfdiv_vv_f16m2_rm_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                          vfloat16m2_t vs1, unsigned int frm,
                                          size_t vl);
vfloat16m2_t __riscv_vfdiv_vf_f16m2_rm_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                          _Float16 rs1, unsigned int frm,
                                          size_t vl);
vfloat16m4_t __riscv_vfdiv_vv_f16m4_rm_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                          vfloat16m4_t vs1, unsigned int frm,
                                          size_t vl);
vfloat16m4_t __riscv_vfdiv_vf_f16m4_rm_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                          _Float16 rs1, unsigned int frm,
                                          size_t vl);
vfloat16m8_t __riscv_vfdiv_vv_f16m8_rm_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                          vfloat16m8_t vs1, unsigned int frm,
                                          size_t vl);
vfloat16m8_t __riscv_vfdiv_vf_f16m8_rm_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                          _Float16 rs1, unsigned int frm,
                                          size_t vl);
vfloat32mf2_t __riscv_vfdiv_vv_f32mf2_rm_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                            vfloat32mf2_t vs1, unsigned int frm,
                                            size_t vl);
vfloat32mf2_t __riscv_vfdiv_vf_f32mf2_rm_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                            float rs1, unsigned int frm,
                                            size_t vl);
vfloat32m1_t __riscv_vfdiv_vv_f32m1_rm_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                          vfloat32m1_t vs1, unsigned int frm,
                                          size_t vl);
vfloat32m1_t __riscv_vfdiv_vf_f32m1_rm_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                          float rs1, unsigned int frm,
                                          size_t vl);
vfloat32m2_t __riscv_vfdiv_vv_f32m2_rm_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                          vfloat32m2_t vs1, unsigned int frm,
                                          size_t vl);
vfloat32m2_t __riscv_vfdiv_vf_f32m2_rm_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                          float rs1, unsigned int frm,
                                          size_t vl);
vfloat32m4_t __riscv_vfdiv_vv_f32m4_rm_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                          vfloat32m4_t vs1, unsigned int frm,
                                          size_t vl);
vfloat32m4_t __riscv_vfdiv_vf_f32m4_rm_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                          float rs1, unsigned int frm,
                                          size_t vl);
vfloat32m8_t __riscv_vfdiv_vv_f32m8_rm_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                          vfloat32m8_t vs1, unsigned int frm,
                                          size_t vl);
vfloat32m8_t __riscv_vfdiv_vf_f32m8_rm_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                          float rs1, unsigned int frm,
                                          size_t vl);
vfloat64m1_t __riscv_vfdiv_vv_f64m1_rm_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                          vfloat64m1_t vs1, unsigned int frm,
                                          size_t vl);
vfloat64m1_t __riscv_vfdiv_vf_f64m1_rm_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                          double rs1, unsigned int frm,
                                          size_t vl);
vfloat64m2_t __riscv_vfdiv_vv_f64m2_rm_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                          vfloat64m2_t vs1, unsigned int frm,
                                          size_t vl);
vfloat64m2_t __riscv_vfdiv_vf_f64m2_rm_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                          double rs1, unsigned int frm,
                                          size_t vl);
vfloat64m4_t __riscv_vfdiv_vv_f64m4_rm_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                          vfloat64m4_t vs1, unsigned int frm,
                                          size_t vl);
vfloat64m4_t __riscv_vfdiv_vf_f64m4_rm_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                          double rs1, unsigned int frm,
                                          size_t vl);
vfloat64m8_t __riscv_vfdiv_vv_f64m8_rm_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                          vfloat64m8_t vs1, unsigned int frm,
                                          size_t vl);
vfloat64m8_t __riscv_vfdiv_vf_f64m8_rm_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                          double rs1, unsigned int frm,
                                          size_t vl);
// __riscv_vfrdiv_vf_<type>_rm_tu prototypes, f16mf4 through f64m8.
// Only the vector-scalar (_vf) form is declared in this run: each prototype
// takes `vd`, vector source `vs2`, scalar `rs1` (_Float16 / float / double
// matching the element width), `unsigned int frm`, and `size_t vl`, and
// returns the same vector type as `vd`.
// NOTE(review): vfrdiv is presumably the reversed-operand divide
// (rs1 / vs2[i]) -- confirm against the RVV instruction specification.
vfloat16mf4_t __riscv_vfrdiv_vf_f16mf4_rm_tu(vfloat16mf4_t vd,
                                             vfloat16mf4_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfrdiv_vf_f16mf2_rm_tu(vfloat16mf2_t vd,
                                             vfloat16mf2_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfrdiv_vf_f16m1_rm_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                           _Float16 rs1, unsigned int frm,
                                           size_t vl);
vfloat16m2_t __riscv_vfrdiv_vf_f16m2_rm_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                           _Float16 rs1, unsigned int frm,
                                           size_t vl);
vfloat16m4_t __riscv_vfrdiv_vf_f16m4_rm_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                           _Float16 rs1, unsigned int frm,
                                           size_t vl);
vfloat16m8_t __riscv_vfrdiv_vf_f16m8_rm_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                           _Float16 rs1, unsigned int frm,
                                           size_t vl);
vfloat32mf2_t __riscv_vfrdiv_vf_f32mf2_rm_tu(vfloat32mf2_t vd,
                                             vfloat32mf2_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfrdiv_vf_f32m1_rm_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                           float rs1, unsigned int frm,
                                           size_t vl);
vfloat32m2_t __riscv_vfrdiv_vf_f32m2_rm_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                           float rs1, unsigned int frm,
                                           size_t vl);
vfloat32m4_t __riscv_vfrdiv_vf_f32m4_rm_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                           float rs1, unsigned int frm,
                                           size_t vl);
vfloat32m8_t __riscv_vfrdiv_vf_f32m8_rm_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                           float rs1, unsigned int frm,
                                           size_t vl);
vfloat64m1_t __riscv_vfrdiv_vf_f64m1_rm_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                           double rs1, unsigned int frm,
                                           size_t vl);
vfloat64m2_t __riscv_vfrdiv_vf_f64m2_rm_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                           double rs1, unsigned int frm,
                                           size_t vl);
vfloat64m4_t __riscv_vfrdiv_vf_f64m4_rm_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                           double rs1, unsigned int frm,
                                           size_t vl);
vfloat64m8_t __riscv_vfrdiv_vf_f64m8_rm_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                           double rs1, unsigned int frm,
                                           size_t vl);
// masked functions (_tum variants)
// __riscv_vfmul_{vv,vf}_<type>_rm_tum prototypes, f16mf4 through f64m8.
// Compared with the _rm_tu forms, each prototype gains a leading mask
// argument `vm`; its vboolN_t type varies with the vector type (e.g.
// vbool64_t for f16mf4, vbool2_t for f16m8). The remaining parameters are
// `vd`, `vs2`, `vs1` (_vv) or scalar `rs1` (_vf), `unsigned int frm`, and
// `size_t vl`; the return type equals the type of `vd`.
// NOTE(review): `_tum` presumably denotes the tail-undisturbed,
// mask-agnostic policy -- confirm against the RVV intrinsics specification.
vfloat16mf4_t __riscv_vfmul_vv_f16mf4_rm_tum(vbool64_t vm, vfloat16mf4_t vd,
                                             vfloat16mf4_t vs2,
                                             vfloat16mf4_t vs1,
                                             unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmul_vf_f16mf4_rm_tum(vbool64_t vm, vfloat16mf4_t vd,
                                             vfloat16mf4_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmul_vv_f16mf2_rm_tum(vbool32_t vm, vfloat16mf2_t vd,
                                             vfloat16mf2_t vs2,
                                             vfloat16mf2_t vs1,
                                             unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmul_vf_f16mf2_rm_tum(vbool32_t vm, vfloat16mf2_t vd,
                                             vfloat16mf2_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmul_vv_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                           vfloat16m1_t vs2, vfloat16m1_t vs1,
                                           unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmul_vf_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                           vfloat16m1_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmul_vv_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                           vfloat16m2_t vs2, vfloat16m2_t vs1,
                                           unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmul_vf_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                           vfloat16m2_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmul_vv_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                           vfloat16m4_t vs2, vfloat16m4_t vs1,
                                           unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmul_vf_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                           vfloat16m4_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmul_vv_f16m8_rm_tum(vbool2_t vm, vfloat16m8_t vd,
                                           vfloat16m8_t vs2, vfloat16m8_t vs1,
                                           unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmul_vf_f16m8_rm_tum(vbool2_t vm, vfloat16m8_t vd,
                                           vfloat16m8_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmul_vv_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat32mf2_t vs2,
                                             vfloat32mf2_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmul_vf_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat32mf2_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmul_vv_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat32m1_t vs2, vfloat32m1_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmul_vf_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat32m1_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmul_vv_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat32m2_t vs2, vfloat32m2_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmul_vf_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat32m2_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmul_vv_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat32m4_t vs2, vfloat32m4_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmul_vf_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat32m4_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmul_vv_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat32m8_t vs2, vfloat32m8_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmul_vf_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat32m8_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmul_vv_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat64m1_t vs2, vfloat64m1_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmul_vf_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat64m1_t vs2, double rs1,
                                           unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmul_vv_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat64m2_t vs2, vfloat64m2_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmul_vf_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat64m2_t vs2, double rs1,
                                           unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmul_vv_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat64m4_t vs2, vfloat64m4_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmul_vf_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat64m4_t vs2, double rs1,
                                           unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmul_vv_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat64m8_t vs2, vfloat64m8_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmul_vf_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat64m8_t vs2, double rs1,
                                           unsigned int frm, size_t vl);
// __riscv_vfdiv_{vv,vf}_<type>_rm_tum prototypes, f16mf4 through f64m8.
// Parameter layout: mask `vm` (vboolN_t, with N varying per vector type),
// `vd` (same type as the return value), vector source `vs2`, then vector
// `vs1` (_vv) or scalar `rs1` (_vf; _Float16 / float / double matching the
// element width), `unsigned int frm`, and `size_t vl`.
// NOTE(review): `_tum` presumably denotes the tail-undisturbed,
// mask-agnostic policy, and the quotient is presumably vs2 / vs1 (or
// vs2 / rs1) -- confirm against the RVV specifications.
vfloat16mf4_t __riscv_vfdiv_vv_f16mf4_rm_tum(vbool64_t vm, vfloat16mf4_t vd,
                                             vfloat16mf4_t vs2,
                                             vfloat16mf4_t vs1,
                                             unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfdiv_vf_f16mf4_rm_tum(vbool64_t vm, vfloat16mf4_t vd,
                                             vfloat16mf4_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfdiv_vv_f16mf2_rm_tum(vbool32_t vm, vfloat16mf2_t vd,
                                             vfloat16mf2_t vs2,
                                             vfloat16mf2_t vs1,
                                             unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfdiv_vf_f16mf2_rm_tum(vbool32_t vm, vfloat16mf2_t vd,
                                             vfloat16mf2_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfdiv_vv_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                           vfloat16m1_t vs2, vfloat16m1_t vs1,
                                           unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfdiv_vf_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                           vfloat16m1_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfdiv_vv_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                           vfloat16m2_t vs2, vfloat16m2_t vs1,
                                           unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfdiv_vf_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                           vfloat16m2_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfdiv_vv_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                           vfloat16m4_t vs2, vfloat16m4_t vs1,
                                           unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfdiv_vf_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                           vfloat16m4_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfdiv_vv_f16m8_rm_tum(vbool2_t vm, vfloat16m8_t vd,
                                           vfloat16m8_t vs2, vfloat16m8_t vs1,
                                           unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfdiv_vf_f16m8_rm_tum(vbool2_t vm, vfloat16m8_t vd,
                                           vfloat16m8_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfdiv_vv_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat32mf2_t vs2,
                                             vfloat32mf2_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfdiv_vf_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat32mf2_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfdiv_vv_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat32m1_t vs2, vfloat32m1_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfdiv_vf_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat32m1_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfdiv_vv_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat32m2_t vs2, vfloat32m2_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfdiv_vf_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat32m2_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfdiv_vv_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat32m4_t vs2, vfloat32m4_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfdiv_vf_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat32m4_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfdiv_vv_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat32m8_t vs2, vfloat32m8_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfdiv_vf_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat32m8_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfdiv_vv_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat64m1_t vs2, vfloat64m1_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfdiv_vf_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat64m1_t vs2, double rs1,
                                           unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfdiv_vv_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat64m2_t vs2, vfloat64m2_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfdiv_vf_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat64m2_t vs2, double rs1,
                                           unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfdiv_vv_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat64m4_t vs2, vfloat64m4_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfdiv_vf_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat64m4_t vs2, double rs1,
                                           unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfdiv_vv_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat64m8_t vs2, vfloat64m8_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfdiv_vf_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat64m8_t vs2, double rs1,
                                           unsigned int frm, size_t vl);
// __riscv_vfrdiv_vf_<type>_rm_tum prototypes, f16mf4 through f64m8.
// Only the vector-scalar (_vf) form is declared in this run. Each prototype
// takes mask `vm` (vboolN_t, with N varying per vector type), `vd`, vector
// source `vs2`, scalar `rs1` (_Float16 / float / double matching the element
// width), `unsigned int frm`, and `size_t vl`, and returns the type of `vd`.
// NOTE(review): vfrdiv is presumably the reversed-operand divide
// (rs1 / vs2[i]) and `_tum` the tail-undisturbed, mask-agnostic policy --
// confirm against the RVV specifications.
vfloat16mf4_t __riscv_vfrdiv_vf_f16mf4_rm_tum(vbool64_t vm, vfloat16mf4_t vd,
                                              vfloat16mf4_t vs2, _Float16 rs1,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfrdiv_vf_f16mf2_rm_tum(vbool32_t vm, vfloat16mf2_t vd,
                                              vfloat16mf2_t vs2, _Float16 rs1,
                                              unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfrdiv_vf_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                            vfloat16m1_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfrdiv_vf_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                            vfloat16m2_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfrdiv_vf_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                            vfloat16m4_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfrdiv_vf_f16m8_rm_tum(vbool2_t vm, vfloat16m8_t vd,
                                            vfloat16m8_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfrdiv_vf_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat32mf2_t vs2, float rs1,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfrdiv_vf_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat32m1_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfrdiv_vf_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat32m2_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfrdiv_vf_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat32m4_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfrdiv_vf_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat32m8_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfrdiv_vf_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat64m1_t vs2, double rs1,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfrdiv_vf_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat64m2_t vs2, double rs1,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfrdiv_vf_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat64m4_t vs2, double rs1,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfrdiv_vf_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat64m8_t vs2, double rs1,
                                            unsigned int frm, size_t vl);
// masked functions (_tumu policy: tail undisturbed, mask undisturbed)
// __riscv_vfmul_{vv,vf}_<type>_rm_tumu prototypes, f16mf4 through f64m8.
// Each element type/LMUL has two forms:
//   _vv: second source is a vector vs1 of the same type as vs2;
//   _vf: second source is a scalar rs1 (_Float16, float or double).
// Every prototype takes the mask vm first, then a vd operand of the result
// type, the sources, frm and vl.
// The mask type is vboolN_t with N = element bits / LMUL
// (f16mf4 -> vbool64_t, f16m8 -> vbool2_t, f64m8 -> vbool8_t).
vfloat16mf4_t __riscv_vfmul_vv_f16mf4_rm_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                              vfloat16mf4_t vs2,
                                              vfloat16mf4_t vs1,
                                              unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmul_vf_f16mf4_rm_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                              vfloat16mf4_t vs2, _Float16 rs1,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmul_vv_f16mf2_rm_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                              vfloat16mf2_t vs2,
                                              vfloat16mf2_t vs1,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmul_vf_f16mf2_rm_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                              vfloat16mf2_t vs2, _Float16 rs1,
                                              unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmul_vv_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                            vfloat16m1_t vs2, vfloat16m1_t vs1,
                                            unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmul_vf_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                            vfloat16m1_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmul_vv_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                            vfloat16m2_t vs2, vfloat16m2_t vs1,
                                            unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmul_vf_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                            vfloat16m2_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmul_vv_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                            vfloat16m4_t vs2, vfloat16m4_t vs1,
                                            unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmul_vf_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                            vfloat16m4_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmul_vv_f16m8_rm_tumu(vbool2_t vm, vfloat16m8_t vd,
                                            vfloat16m8_t vs2, vfloat16m8_t vs1,
                                            unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmul_vf_f16m8_rm_tumu(vbool2_t vm, vfloat16m8_t vd,
                                            vfloat16m8_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmul_vv_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat32mf2_t vs2,
                                              vfloat32mf2_t vs1,
                                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmul_vf_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat32mf2_t vs2, float rs1,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmul_vv_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat32m1_t vs2, vfloat32m1_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmul_vf_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat32m1_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmul_vv_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat32m2_t vs2, vfloat32m2_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmul_vf_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat32m2_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmul_vv_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat32m4_t vs2, vfloat32m4_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmul_vf_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat32m4_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmul_vv_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat32m8_t vs2, vfloat32m8_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmul_vf_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat32m8_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmul_vv_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat64m1_t vs2, vfloat64m1_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmul_vf_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat64m1_t vs2, double rs1,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmul_vv_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat64m2_t vs2, vfloat64m2_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmul_vf_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat64m2_t vs2, double rs1,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmul_vv_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat64m4_t vs2, vfloat64m4_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmul_vf_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat64m4_t vs2, double rs1,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmul_vv_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat64m8_t vs2, vfloat64m8_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmul_vf_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat64m8_t vs2, double rs1,
                                            unsigned int frm, size_t vl);
// __riscv_vfdiv_{vv,vf}_<type>_rm_tumu prototypes, f16mf4 through f64m8.
// Each element type/LMUL has two forms:
//   _vv: second source is a vector vs1 of the same type as vs2;
//   _vf: second source is a scalar rs1 (_Float16, float or double).
// Every prototype takes the mask vm first, then a vd operand of the result
// type, the sources, frm and vl.
// The mask type is vboolN_t with N = element bits / LMUL
// (f16mf4 -> vbool64_t, f16m8 -> vbool2_t, f64m8 -> vbool8_t).
vfloat16mf4_t __riscv_vfdiv_vv_f16mf4_rm_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                              vfloat16mf4_t vs2,
                                              vfloat16mf4_t vs1,
                                              unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfdiv_vf_f16mf4_rm_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                              vfloat16mf4_t vs2, _Float16 rs1,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfdiv_vv_f16mf2_rm_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                              vfloat16mf2_t vs2,
                                              vfloat16mf2_t vs1,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfdiv_vf_f16mf2_rm_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                              vfloat16mf2_t vs2, _Float16 rs1,
                                              unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfdiv_vv_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                            vfloat16m1_t vs2, vfloat16m1_t vs1,
                                            unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfdiv_vf_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                            vfloat16m1_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfdiv_vv_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                            vfloat16m2_t vs2, vfloat16m2_t vs1,
                                            unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfdiv_vf_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                            vfloat16m2_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfdiv_vv_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                            vfloat16m4_t vs2, vfloat16m4_t vs1,
                                            unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfdiv_vf_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                            vfloat16m4_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfdiv_vv_f16m8_rm_tumu(vbool2_t vm, vfloat16m8_t vd,
                                            vfloat16m8_t vs2, vfloat16m8_t vs1,
                                            unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfdiv_vf_f16m8_rm_tumu(vbool2_t vm, vfloat16m8_t vd,
                                            vfloat16m8_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfdiv_vv_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat32mf2_t vs2,
                                              vfloat32mf2_t vs1,
                                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfdiv_vf_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat32mf2_t vs2, float rs1,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfdiv_vv_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat32m1_t vs2, vfloat32m1_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfdiv_vf_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat32m1_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfdiv_vv_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat32m2_t vs2, vfloat32m2_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfdiv_vf_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat32m2_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfdiv_vv_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat32m4_t vs2, vfloat32m4_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfdiv_vf_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat32m4_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfdiv_vv_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat32m8_t vs2, vfloat32m8_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfdiv_vf_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat32m8_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfdiv_vv_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat64m1_t vs2, vfloat64m1_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfdiv_vf_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat64m1_t vs2, double rs1,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfdiv_vv_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat64m2_t vs2, vfloat64m2_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfdiv_vf_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat64m2_t vs2, double rs1,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfdiv_vv_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat64m4_t vs2, vfloat64m4_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfdiv_vf_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat64m4_t vs2, double rs1,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfdiv_vv_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat64m8_t vs2, vfloat64m8_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfdiv_vf_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat64m8_t vs2, double rs1,
                                            unsigned int frm, size_t vl);
// __riscv_vfrdiv_vf_<type>_rm_tumu prototypes, f16mf4 through f64m8.
// Only the vector-scalar (_vf) form is declared: each prototype takes the
// mask vm, a vd operand of the result type, the vector vs2, a scalar rs1
// (_Float16, float or double), then frm and vl.
// The mask type is vboolN_t with N = element bits / LMUL
// (f16mf4 -> vbool64_t, f16m8 -> vbool2_t, f64m8 -> vbool8_t).
// NOTE(review): presumably the reversed-operand divide (rs1 / vs2[i]);
// confirm against the vector extension specification.
vfloat16mf4_t __riscv_vfrdiv_vf_f16mf4_rm_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                               vfloat16mf4_t vs2, _Float16 rs1,
                                               unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfrdiv_vf_f16mf2_rm_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                               vfloat16mf2_t vs2, _Float16 rs1,
                                               unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfrdiv_vf_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                             vfloat16m1_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfrdiv_vf_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                             vfloat16m2_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfrdiv_vf_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                             vfloat16m4_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfrdiv_vf_f16m8_rm_tumu(vbool2_t vm, vfloat16m8_t vd,
                                             vfloat16m8_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfrdiv_vf_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                               vfloat32mf2_t vs2, float rs1,
                                               unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfrdiv_vf_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                             vfloat32m1_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfrdiv_vf_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                             vfloat32m2_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfrdiv_vf_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                             vfloat32m4_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfrdiv_vf_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                             vfloat32m8_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfrdiv_vf_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                             vfloat64m1_t vs2, double rs1,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfrdiv_vf_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                             vfloat64m2_t vs2, double rs1,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfrdiv_vf_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                             vfloat64m4_t vs2, double rs1,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfrdiv_vf_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                             vfloat64m8_t vs2, double rs1,
                                             unsigned int frm, size_t vl);
// masked functions (_mu policy: tail agnostic, mask undisturbed)
// __riscv_vfmul_{vv,vf}_<type>_rm_mu prototypes, f16mf4 through f64m8.
// Each element type/LMUL has two forms:
//   _vv: second source is a vector vs1 of the same type as vs2;
//   _vf: second source is a scalar rs1 (_Float16, float or double).
// Every prototype takes the mask vm first, then a vd operand of the result
// type, the sources, frm and vl.
// The mask type is vboolN_t with N = element bits / LMUL
// (f16mf4 -> vbool64_t, f16m8 -> vbool2_t, f64m8 -> vbool8_t).
vfloat16mf4_t __riscv_vfmul_vv_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                            vfloat16mf4_t vs2,
                                            vfloat16mf4_t vs1, unsigned int frm,
                                            size_t vl);
vfloat16mf4_t __riscv_vfmul_vf_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                            vfloat16mf4_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmul_vv_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                            vfloat16mf2_t vs2,
                                            vfloat16mf2_t vs1, unsigned int frm,
                                            size_t vl);
vfloat16mf2_t __riscv_vfmul_vf_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                            vfloat16mf2_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmul_vv_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                          vfloat16m1_t vs2, vfloat16m1_t vs1,
                                          unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmul_vf_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                          vfloat16m1_t vs2, _Float16 rs1,
                                          unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmul_vv_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                          vfloat16m2_t vs2, vfloat16m2_t vs1,
                                          unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmul_vf_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                          vfloat16m2_t vs2, _Float16 rs1,
                                          unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmul_vv_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                          vfloat16m4_t vs2, vfloat16m4_t vs1,
                                          unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmul_vf_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                          vfloat16m4_t vs2, _Float16 rs1,
                                          unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmul_vv_f16m8_rm_mu(vbool2_t vm, vfloat16m8_t vd,
                                          vfloat16m8_t vs2, vfloat16m8_t vs1,
                                          unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmul_vf_f16m8_rm_mu(vbool2_t vm, vfloat16m8_t vd,
                                          vfloat16m8_t vs2, _Float16 rs1,
                                          unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmul_vv_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs2,
                                            vfloat32mf2_t vs1, unsigned int frm,
                                            size_t vl);
vfloat32mf2_t __riscv_vfmul_vf_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmul_vv_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs2, vfloat32m1_t vs1,
                                          unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmul_vf_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs2, float rs1,
                                          unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmul_vv_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs2, vfloat32m2_t vs1,
                                          unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmul_vf_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs2, float rs1,
                                          unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmul_vv_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs2, vfloat32m4_t vs1,
                                          unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmul_vf_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs2, float rs1,
                                          unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmul_vv_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs2, vfloat32m8_t vs1,
                                          unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmul_vf_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs2, float rs1,
                                          unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmul_vv_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs2, vfloat64m1_t vs1,
                                          unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmul_vf_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs2, double rs1,
                                          unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmul_vv_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs2, vfloat64m2_t vs1,
                                          unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmul_vf_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs2, double rs1,
                                          unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmul_vv_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs2, vfloat64m4_t vs1,
                                          unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmul_vf_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs2, double rs1,
                                          unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmul_vv_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs2, vfloat64m8_t vs1,
                                          unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmul_vf_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs2, double rs1,
                                          unsigned int frm, size_t vl);
// __riscv_vfdiv_{vv,vf}_<type>_rm_mu prototypes, f16mf4 through f64m8.
// Each element type/LMUL has two forms:
//   _vv: second source is a vector vs1 of the same type as vs2;
//   _vf: second source is a scalar rs1 (_Float16, float or double).
// Every prototype takes the mask vm first, then a vd operand of the result
// type, the sources, frm and vl.
// The mask type is vboolN_t with N = element bits / LMUL
// (f16mf4 -> vbool64_t, f16m8 -> vbool2_t, f64m8 -> vbool8_t).
vfloat16mf4_t __riscv_vfdiv_vv_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                            vfloat16mf4_t vs2,
                                            vfloat16mf4_t vs1, unsigned int frm,
                                            size_t vl);
vfloat16mf4_t __riscv_vfdiv_vf_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                            vfloat16mf4_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfdiv_vv_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                            vfloat16mf2_t vs2,
                                            vfloat16mf2_t vs1, unsigned int frm,
                                            size_t vl);
vfloat16mf2_t __riscv_vfdiv_vf_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                            vfloat16mf2_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfdiv_vv_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                          vfloat16m1_t vs2, vfloat16m1_t vs1,
                                          unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfdiv_vf_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                          vfloat16m1_t vs2, _Float16 rs1,
                                          unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfdiv_vv_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                          vfloat16m2_t vs2, vfloat16m2_t vs1,
                                          unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfdiv_vf_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                          vfloat16m2_t vs2, _Float16 rs1,
                                          unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfdiv_vv_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                          vfloat16m4_t vs2, vfloat16m4_t vs1,
                                          unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfdiv_vf_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                          vfloat16m4_t vs2, _Float16 rs1,
                                          unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfdiv_vv_f16m8_rm_mu(vbool2_t vm, vfloat16m8_t vd,
                                          vfloat16m8_t vs2, vfloat16m8_t vs1,
                                          unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfdiv_vf_f16m8_rm_mu(vbool2_t vm, vfloat16m8_t vd,
                                          vfloat16m8_t vs2, _Float16 rs1,
                                          unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfdiv_vv_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs2,
                                            vfloat32mf2_t vs1, unsigned int frm,
                                            size_t vl);
vfloat32mf2_t __riscv_vfdiv_vf_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfdiv_vv_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs2, vfloat32m1_t vs1,
                                          unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfdiv_vf_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs2, float rs1,
                                          unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfdiv_vv_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs2, vfloat32m2_t vs1,
                                          unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfdiv_vf_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs2, float rs1,
                                          unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfdiv_vv_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs2, vfloat32m4_t vs1,
                                          unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfdiv_vf_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs2, float rs1,
                                          unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfdiv_vv_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs2, vfloat32m8_t vs1,
                                          unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfdiv_vf_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs2, float rs1,
                                          unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfdiv_vv_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs2, vfloat64m1_t vs1,
                                          unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfdiv_vf_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs2, double rs1,
                                          unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfdiv_vv_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs2, vfloat64m2_t vs1,
                                          unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfdiv_vf_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs2, double rs1,
                                          unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfdiv_vv_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs2, vfloat64m4_t vs1,
                                          unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfdiv_vf_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs2, double rs1,
                                          unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfdiv_vv_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs2, vfloat64m8_t vs1,
                                          unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfdiv_vf_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs2, double rs1,
                                          unsigned int frm, size_t vl);
// __riscv_vfrdiv_vf_<type>_rm_mu prototypes, one per element type/LMUL
// starting at f16mf4.
// Only the vector-scalar (_vf) form is declared: each prototype takes the
// mask vm, a vd operand of the result type, the vector vs2, a scalar rs1
// (_Float16, float or double), then frm and vl.
// The mask type is vboolN_t with N = element bits / LMUL
// (f16mf4 -> vbool64_t, f16m8 -> vbool2_t, f64m4 -> vbool16_t).
// NOTE(review): presumably the reversed-operand divide (rs1 / vs2[i]);
// confirm against the vector extension specification.
vfloat16mf4_t __riscv_vfrdiv_vf_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                             vfloat16mf4_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfrdiv_vf_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                             vfloat16mf2_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfrdiv_vf_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                           vfloat16m1_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfrdiv_vf_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                           vfloat16m2_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfrdiv_vf_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                           vfloat16m4_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfrdiv_vf_f16m8_rm_mu(vbool2_t vm, vfloat16m8_t vd,
                                           vfloat16m8_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfrdiv_vf_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat32mf2_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfrdiv_vf_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat32m1_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfrdiv_vf_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat32m2_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfrdiv_vf_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat32m4_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfrdiv_vf_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat32m8_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfrdiv_vf_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat64m1_t vs2, double rs1,
                                           unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfrdiv_vf_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat64m2_t vs2, double rs1,
                                           unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfrdiv_vf_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat64m4_t vs2, double rs1,
                                           unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfrdiv_vf_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat64m8_t vs2, double rs1,
                                           unsigned int frm, size_t vl);

Vector Widening Floating-Point Multiply Intrinsics

// unmasked functions, _tu policy (tail-undisturbed in the RVV intrinsics
// naming scheme): vd is passed as the first argument.
// Widening: the result element type is twice as wide as the source element
// type (f16 -> f32, f32 -> f64), and the result LMUL is twice the source LMUL
// (e.g. vfloat16mf4_t operands yield vfloat32mf2_t). The _vv form takes a
// vector vs1, the _vf form a scalar rs1 of the source element type.
vfloat32mf2_t __riscv_vfwmul_vv_f32mf2_tu(vfloat32mf2_t vd, vfloat16mf4_t vs2,
                                          vfloat16mf4_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfwmul_vf_f32mf2_tu(vfloat32mf2_t vd, vfloat16mf4_t vs2,
                                          _Float16 rs1, size_t vl);
vfloat32m1_t __riscv_vfwmul_vv_f32m1_tu(vfloat32m1_t vd, vfloat16mf2_t vs2,
                                        vfloat16mf2_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwmul_vf_f32m1_tu(vfloat32m1_t vd, vfloat16mf2_t vs2,
                                        _Float16 rs1, size_t vl);
vfloat32m2_t __riscv_vfwmul_vv_f32m2_tu(vfloat32m2_t vd, vfloat16m1_t vs2,
                                        vfloat16m1_t vs1, size_t vl);
vfloat32m2_t __riscv_vfwmul_vf_f32m2_tu(vfloat32m2_t vd, vfloat16m1_t vs2,
                                        _Float16 rs1, size_t vl);
vfloat32m4_t __riscv_vfwmul_vv_f32m4_tu(vfloat32m4_t vd, vfloat16m2_t vs2,
                                        vfloat16m2_t vs1, size_t vl);
vfloat32m4_t __riscv_vfwmul_vf_f32m4_tu(vfloat32m4_t vd, vfloat16m2_t vs2,
                                        _Float16 rs1, size_t vl);
vfloat32m8_t __riscv_vfwmul_vv_f32m8_tu(vfloat32m8_t vd, vfloat16m4_t vs2,
                                        vfloat16m4_t vs1, size_t vl);
vfloat32m8_t __riscv_vfwmul_vf_f32m8_tu(vfloat32m8_t vd, vfloat16m4_t vs2,
                                        _Float16 rs1, size_t vl);
vfloat64m1_t __riscv_vfwmul_vv_f64m1_tu(vfloat64m1_t vd, vfloat32mf2_t vs2,
                                        vfloat32mf2_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwmul_vf_f64m1_tu(vfloat64m1_t vd, vfloat32mf2_t vs2,
                                        float rs1, size_t vl);
vfloat64m2_t __riscv_vfwmul_vv_f64m2_tu(vfloat64m2_t vd, vfloat32m1_t vs2,
                                        vfloat32m1_t vs1, size_t vl);
vfloat64m2_t __riscv_vfwmul_vf_f64m2_tu(vfloat64m2_t vd, vfloat32m1_t vs2,
                                        float rs1, size_t vl);
vfloat64m4_t __riscv_vfwmul_vv_f64m4_tu(vfloat64m4_t vd, vfloat32m2_t vs2,
                                        vfloat32m2_t vs1, size_t vl);
vfloat64m4_t __riscv_vfwmul_vf_f64m4_tu(vfloat64m4_t vd, vfloat32m2_t vs2,
                                        float rs1, size_t vl);
vfloat64m8_t __riscv_vfwmul_vv_f64m8_tu(vfloat64m8_t vd, vfloat32m4_t vs2,
                                        vfloat32m4_t vs1, size_t vl);
vfloat64m8_t __riscv_vfwmul_vf_f64m8_tu(vfloat64m8_t vd, vfloat32m4_t vs2,
                                        float rs1, size_t vl);
// masked functions, _tum policy (tail-undisturbed, mask-agnostic in the RVV
// intrinsics naming scheme). vm is the mask and vd the destination operand;
// the mask type is vbool<SEW/LMUL>_t of the widened result type
// (e.g. vfloat32mf2_t -> vbool64_t).
vfloat32mf2_t __riscv_vfwmul_vv_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                           size_t vl);
vfloat32mf2_t __riscv_vfwmul_vf_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat16mf4_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat32m1_t __riscv_vfwmul_vv_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                         size_t vl);
vfloat32m1_t __riscv_vfwmul_vf_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat16mf2_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat32m2_t __riscv_vfwmul_vv_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat16m1_t vs2, vfloat16m1_t vs1,
                                         size_t vl);
vfloat32m2_t __riscv_vfwmul_vf_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat16m1_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat32m4_t __riscv_vfwmul_vv_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat16m2_t vs2, vfloat16m2_t vs1,
                                         size_t vl);
vfloat32m4_t __riscv_vfwmul_vf_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat16m2_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat32m8_t __riscv_vfwmul_vv_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat16m4_t vs2, vfloat16m4_t vs1,
                                         size_t vl);
vfloat32m8_t __riscv_vfwmul_vf_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat16m4_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat64m1_t __riscv_vfwmul_vv_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                         size_t vl);
vfloat64m1_t __riscv_vfwmul_vf_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat32mf2_t vs2, float rs1,
                                         size_t vl);
vfloat64m2_t __riscv_vfwmul_vv_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat32m1_t vs2, vfloat32m1_t vs1,
                                         size_t vl);
vfloat64m2_t __riscv_vfwmul_vf_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat32m1_t vs2, float rs1,
                                         size_t vl);
vfloat64m4_t __riscv_vfwmul_vv_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat32m2_t vs2, vfloat32m2_t vs1,
                                         size_t vl);
vfloat64m4_t __riscv_vfwmul_vf_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat32m2_t vs2, float rs1,
                                         size_t vl);
vfloat64m8_t __riscv_vfwmul_vv_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat32m4_t vs2, vfloat32m4_t vs1,
                                         size_t vl);
vfloat64m8_t __riscv_vfwmul_vf_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat32m4_t vs2, float rs1,
                                         size_t vl);
// masked functions, _tumu policy (tail-undisturbed, mask-undisturbed in the
// RVV intrinsics naming scheme). vm is the mask and vd the destination
// operand; the mask type is vbool<SEW/LMUL>_t of the widened result type.
vfloat32mf2_t __riscv_vfwmul_vv_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat16mf4_t vs2,
                                            vfloat16mf4_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfwmul_vf_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat16mf4_t vs2, _Float16 rs1,
                                            size_t vl);
vfloat32m1_t __riscv_vfwmul_vv_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                          size_t vl);
vfloat32m1_t __riscv_vfwmul_vf_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat16mf2_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat32m2_t __riscv_vfwmul_vv_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat16m1_t vs2, vfloat16m1_t vs1,
                                          size_t vl);
vfloat32m2_t __riscv_vfwmul_vf_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat16m1_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat32m4_t __riscv_vfwmul_vv_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat16m2_t vs2, vfloat16m2_t vs1,
                                          size_t vl);
vfloat32m4_t __riscv_vfwmul_vf_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat16m2_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat32m8_t __riscv_vfwmul_vv_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat16m4_t vs2, vfloat16m4_t vs1,
                                          size_t vl);
vfloat32m8_t __riscv_vfwmul_vf_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat16m4_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat64m1_t __riscv_vfwmul_vv_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                          size_t vl);
vfloat64m1_t __riscv_vfwmul_vf_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat32mf2_t vs2, float rs1,
                                          size_t vl);
vfloat64m2_t __riscv_vfwmul_vv_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat32m1_t vs2, vfloat32m1_t vs1,
                                          size_t vl);
vfloat64m2_t __riscv_vfwmul_vf_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat32m1_t vs2, float rs1,
                                          size_t vl);
vfloat64m4_t __riscv_vfwmul_vv_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat32m2_t vs2, vfloat32m2_t vs1,
                                          size_t vl);
vfloat64m4_t __riscv_vfwmul_vf_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat32m2_t vs2, float rs1,
                                          size_t vl);
vfloat64m8_t __riscv_vfwmul_vv_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat32m4_t vs2, vfloat32m4_t vs1,
                                          size_t vl);
vfloat64m8_t __riscv_vfwmul_vf_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat32m4_t vs2, float rs1,
                                          size_t vl);
// masked functions, _mu policy (tail-agnostic, mask-undisturbed in the RVV
// intrinsics naming scheme). vm is the mask and vd the destination operand;
// the mask type is vbool<SEW/LMUL>_t of the widened result type.
vfloat32mf2_t __riscv_vfwmul_vv_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                          size_t vl);
vfloat32mf2_t __riscv_vfwmul_vf_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat16mf4_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat32m1_t __riscv_vfwmul_vv_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                        size_t vl);
vfloat32m1_t __riscv_vfwmul_vf_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat16mf2_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat32m2_t __riscv_vfwmul_vv_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat16m1_t vs2, vfloat16m1_t vs1,
                                        size_t vl);
vfloat32m2_t __riscv_vfwmul_vf_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat16m1_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat32m4_t __riscv_vfwmul_vv_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat16m2_t vs2, vfloat16m2_t vs1,
                                        size_t vl);
vfloat32m4_t __riscv_vfwmul_vf_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat16m2_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat32m8_t __riscv_vfwmul_vv_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat16m4_t vs2, vfloat16m4_t vs1,
                                        size_t vl);
vfloat32m8_t __riscv_vfwmul_vf_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat16m4_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat64m1_t __riscv_vfwmul_vv_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                        size_t vl);
vfloat64m1_t __riscv_vfwmul_vf_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat32mf2_t vs2, float rs1,
                                        size_t vl);
vfloat64m2_t __riscv_vfwmul_vv_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat32m1_t vs2, vfloat32m1_t vs1,
                                        size_t vl);
vfloat64m2_t __riscv_vfwmul_vf_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat32m1_t vs2, float rs1, size_t vl);
vfloat64m4_t __riscv_vfwmul_vv_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat32m2_t vs2, vfloat32m2_t vs1,
                                        size_t vl);
vfloat64m4_t __riscv_vfwmul_vf_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat32m2_t vs2, float rs1, size_t vl);
vfloat64m8_t __riscv_vfwmul_vv_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat32m4_t vs2, vfloat32m4_t vs1,
                                        size_t vl);
vfloat64m8_t __riscv_vfwmul_vf_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat32m4_t vs2, float rs1, size_t vl);
// unmasked functions with an explicit rounding-mode argument, _rm_tu policy
// (tail-undisturbed in the RVV intrinsics naming scheme). These take no mask;
// vd is the first argument and frm is passed immediately before vl.
// NOTE(review): frm is presumably one of the __RISCV_FRM_* constants from the
// RVV intrinsics spec -- confirm against the spec.
vfloat32mf2_t __riscv_vfwmul_vv_f32mf2_rm_tu(vfloat32mf2_t vd,
                                             vfloat16mf4_t vs2,
                                             vfloat16mf4_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwmul_vf_f32mf2_rm_tu(vfloat32mf2_t vd,
                                             vfloat16mf4_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmul_vv_f32m1_rm_tu(vfloat32m1_t vd, vfloat16mf2_t vs2,
                                           vfloat16mf2_t vs1, unsigned int frm,
                                           size_t vl);
vfloat32m1_t __riscv_vfwmul_vf_f32m1_rm_tu(vfloat32m1_t vd, vfloat16mf2_t vs2,
                                           _Float16 rs1, unsigned int frm,
                                           size_t vl);
vfloat32m2_t __riscv_vfwmul_vv_f32m2_rm_tu(vfloat32m2_t vd, vfloat16m1_t vs2,
                                           vfloat16m1_t vs1, unsigned int frm,
                                           size_t vl);
vfloat32m2_t __riscv_vfwmul_vf_f32m2_rm_tu(vfloat32m2_t vd, vfloat16m1_t vs2,
                                           _Float16 rs1, unsigned int frm,
                                           size_t vl);
vfloat32m4_t __riscv_vfwmul_vv_f32m4_rm_tu(vfloat32m4_t vd, vfloat16m2_t vs2,
                                           vfloat16m2_t vs1, unsigned int frm,
                                           size_t vl);
vfloat32m4_t __riscv_vfwmul_vf_f32m4_rm_tu(vfloat32m4_t vd, vfloat16m2_t vs2,
                                           _Float16 rs1, unsigned int frm,
                                           size_t vl);
vfloat32m8_t __riscv_vfwmul_vv_f32m8_rm_tu(vfloat32m8_t vd, vfloat16m4_t vs2,
                                           vfloat16m4_t vs1, unsigned int frm,
                                           size_t vl);
vfloat32m8_t __riscv_vfwmul_vf_f32m8_rm_tu(vfloat32m8_t vd, vfloat16m4_t vs2,
                                           _Float16 rs1, unsigned int frm,
                                           size_t vl);
vfloat64m1_t __riscv_vfwmul_vv_f64m1_rm_tu(vfloat64m1_t vd, vfloat32mf2_t vs2,
                                           vfloat32mf2_t vs1, unsigned int frm,
                                           size_t vl);
vfloat64m1_t __riscv_vfwmul_vf_f64m1_rm_tu(vfloat64m1_t vd, vfloat32mf2_t vs2,
                                           float rs1, unsigned int frm,
                                           size_t vl);
vfloat64m2_t __riscv_vfwmul_vv_f64m2_rm_tu(vfloat64m2_t vd, vfloat32m1_t vs2,
                                           vfloat32m1_t vs1, unsigned int frm,
                                           size_t vl);
vfloat64m2_t __riscv_vfwmul_vf_f64m2_rm_tu(vfloat64m2_t vd, vfloat32m1_t vs2,
                                           float rs1, unsigned int frm,
                                           size_t vl);
vfloat64m4_t __riscv_vfwmul_vv_f64m4_rm_tu(vfloat64m4_t vd, vfloat32m2_t vs2,
                                           vfloat32m2_t vs1, unsigned int frm,
                                           size_t vl);
vfloat64m4_t __riscv_vfwmul_vf_f64m4_rm_tu(vfloat64m4_t vd, vfloat32m2_t vs2,
                                           float rs1, unsigned int frm,
                                           size_t vl);
vfloat64m8_t __riscv_vfwmul_vv_f64m8_rm_tu(vfloat64m8_t vd, vfloat32m4_t vs2,
                                           vfloat32m4_t vs1, unsigned int frm,
                                           size_t vl);
vfloat64m8_t __riscv_vfwmul_vf_f64m8_rm_tu(vfloat64m8_t vd, vfloat32m4_t vs2,
                                           float rs1, unsigned int frm,
                                           size_t vl);
// masked functions with an explicit rounding-mode argument, _rm_tum policy
// (tail-undisturbed, mask-agnostic in the RVV intrinsics naming scheme).
// vm is the mask, vd the destination operand, and frm is passed immediately
// before vl.
vfloat32mf2_t __riscv_vfwmul_vv_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat16mf4_t vs2,
                                              vfloat16mf4_t vs1,
                                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwmul_vf_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat16mf4_t vs2, _Float16 rs1,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmul_vv_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat16mf2_t vs2,
                                            vfloat16mf2_t vs1, unsigned int frm,
                                            size_t vl);
vfloat32m1_t __riscv_vfwmul_vf_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat16mf2_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmul_vv_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat16m1_t vs2, vfloat16m1_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmul_vf_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat16m1_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmul_vv_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat16m2_t vs2, vfloat16m2_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmul_vf_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat16m2_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmul_vv_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat16m4_t vs2, vfloat16m4_t vs1,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmul_vf_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat16m4_t vs2, _Float16 rs1,
                                            unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmul_vv_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat32mf2_t vs2,
                                            vfloat32mf2_t vs1, unsigned int frm,
                                            size_t vl);
vfloat64m1_t __riscv_vfwmul_vf_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat32mf2_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmul_vv_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat32m1_t vs2, vfloat32m1_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmul_vf_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat32m1_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmul_vv_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat32m2_t vs2, vfloat32m2_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmul_vf_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat32m2_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmul_vv_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat32m4_t vs2, vfloat32m4_t vs1,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmul_vf_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat32m4_t vs2, float rs1,
                                            unsigned int frm, size_t vl);
// masked functions with an explicit rounding-mode argument, _rm_tumu policy
// (tail-undisturbed, mask-undisturbed in the RVV intrinsics naming scheme).
// vm is the mask, vd the destination operand, and frm is passed immediately
// before vl.
vfloat32mf2_t __riscv_vfwmul_vv_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                               vfloat16mf4_t vs2,
                                               vfloat16mf4_t vs1,
                                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwmul_vf_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                               vfloat16mf4_t vs2, _Float16 rs1,
                                               unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmul_vv_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                             vfloat16mf2_t vs2,
                                             vfloat16mf2_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmul_vf_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                             vfloat16mf2_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmul_vv_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                             vfloat16m1_t vs2, vfloat16m1_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmul_vf_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                             vfloat16m1_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmul_vv_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                             vfloat16m2_t vs2, vfloat16m2_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmul_vf_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                             vfloat16m2_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmul_vv_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                             vfloat16m4_t vs2, vfloat16m4_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmul_vf_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                             vfloat16m4_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmul_vv_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                             vfloat32mf2_t vs2,
                                             vfloat32mf2_t vs1,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmul_vf_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                             vfloat32mf2_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmul_vv_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                             vfloat32m1_t vs2, vfloat32m1_t vs1,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmul_vf_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                             vfloat32m1_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmul_vv_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                             vfloat32m2_t vs2, vfloat32m2_t vs1,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmul_vf_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                             vfloat32m2_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmul_vv_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                             vfloat32m4_t vs2, vfloat32m4_t vs1,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmul_vf_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                             vfloat32m4_t vs2, float rs1,
                                             unsigned int frm, size_t vl);
// masked functions
// vfwmul `_rm_mu` variants. Each prototype takes a mask vm and a
// destination-typed operand vd first, then the source vs2, a second source
// (vector vs1 for `_vv_`, scalar rs1 for `_vf_`), an explicit
// `unsigned int frm`, and the element count vl.
// The result element width is twice the source width (f16 -> f32, f32 -> f64)
// and the result LMUL suffix is twice the source LMUL suffix; the scalar rs1
// is _Float16 for f16 sources and float for f32 sources.
// NOTE(review): `_mu` presumably means mask-undisturbed and frm presumably
// selects the rounding mode -- confirm against the RVV intrinsics
// specification.
vfloat32mf2_t __riscv_vfwmul_vv_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat16mf4_t vs2,
                                             vfloat16mf4_t vs1,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwmul_vf_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat16mf4_t vs2, _Float16 rs1,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmul_vv_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmul_vf_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat16mf2_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmul_vv_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat16m1_t vs2, vfloat16m1_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmul_vf_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat16m1_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmul_vv_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat16m2_t vs2, vfloat16m2_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmul_vf_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat16m2_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmul_vv_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat16m4_t vs2, vfloat16m4_t vs1,
                                           unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmul_vf_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat16m4_t vs2, _Float16 rs1,
                                           unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmul_vv_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmul_vf_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat32mf2_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmul_vv_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat32m1_t vs2, vfloat32m1_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmul_vf_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat32m1_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmul_vv_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat32m2_t vs2, vfloat32m2_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmul_vf_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat32m2_t vs2, float rs1,
                                           unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmul_vv_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat32m4_t vs2, vfloat32m4_t vs1,
                                           unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmul_vf_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat32m4_t vs2, float rs1,
                                           unsigned int frm, size_t vl);

Vector Single-Width Floating-Point Fused Multiply-Add Intrinsics

// vfmacc, `_tu` variants, for f16/f32/f64 elements at each listed LMUL.
// Parameter order is (vd, vs1 | rs1, vs2, vl): vd has the same type as the
// return value, the second operand is a vector (`_vv_`) or a scalar of the
// element type (`_vf_`: _Float16, float or double), and vl is a size_t.
// NOTE(review): per the RISC-V V spec vfmacc should compute
// vd[i] = +(vs1[i] * vs2[i]) + vd[i], and `_tu` presumably means
// tail-undisturbed -- confirm against the specification.
vfloat16mf4_t __riscv_vfmacc_vv_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs1,
                                          vfloat16mf4_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfmacc_vf_f16mf4_tu(vfloat16mf4_t vd, _Float16 rs1,
                                          vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfmacc_vv_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs1,
                                          vfloat16mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfmacc_vf_f16mf2_tu(vfloat16mf2_t vd, _Float16 rs1,
                                          vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmacc_vv_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                                        vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmacc_vf_f16m1_tu(vfloat16m1_t vd, _Float16 rs1,
                                        vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmacc_vv_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                                        vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmacc_vf_f16m2_tu(vfloat16m2_t vd, _Float16 rs1,
                                        vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmacc_vv_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                                        vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmacc_vf_f16m4_tu(vfloat16m4_t vd, _Float16 rs1,
                                        vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmacc_vv_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                                        vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmacc_vf_f16m8_tu(vfloat16m8_t vd, _Float16 rs1,
                                        vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfmacc_vv_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs1,
                                          vfloat32mf2_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfmacc_vf_f32mf2_tu(vfloat32mf2_t vd, float rs1,
                                          vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmacc_vv_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                                        vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmacc_vf_f32m1_tu(vfloat32m1_t vd, float rs1,
                                        vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmacc_vv_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                                        vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmacc_vf_f32m2_tu(vfloat32m2_t vd, float rs1,
                                        vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmacc_vv_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                                        vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmacc_vf_f32m4_tu(vfloat32m4_t vd, float rs1,
                                        vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmacc_vv_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                                        vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmacc_vf_f32m8_tu(vfloat32m8_t vd, float rs1,
                                        vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmacc_vv_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                                        vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmacc_vf_f64m1_tu(vfloat64m1_t vd, double rs1,
                                        vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmacc_vv_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                                        vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmacc_vf_f64m2_tu(vfloat64m2_t vd, double rs1,
                                        vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmacc_vv_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                                        vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmacc_vf_f64m4_tu(vfloat64m4_t vd, double rs1,
                                        vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmacc_vv_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                                        vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmacc_vf_f64m8_tu(vfloat64m8_t vd, double rs1,
                                        vfloat64m8_t vs2, size_t vl);
// vfnmacc, `_tu` variants, for f16/f32/f64 elements at each listed LMUL.
// Parameter order is (vd, vs1 | rs1, vs2, vl): vd has the same type as the
// return value, the second operand is a vector (`_vv_`) or a scalar of the
// element type (`_vf_`: _Float16, float or double), and vl is a size_t.
// NOTE(review): per the RISC-V V spec vfnmacc should compute
// vd[i] = -(vs1[i] * vs2[i]) - vd[i], and `_tu` presumably means
// tail-undisturbed -- confirm against the specification.
vfloat16mf4_t __riscv_vfnmacc_vv_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs1,
                                           vfloat16mf4_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfnmacc_vf_f16mf4_tu(vfloat16mf4_t vd, _Float16 rs1,
                                           vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmacc_vv_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs1,
                                           vfloat16mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmacc_vf_f16mf2_tu(vfloat16mf2_t vd, _Float16 rs1,
                                           vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmacc_vv_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                                         vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmacc_vf_f16m1_tu(vfloat16m1_t vd, _Float16 rs1,
                                         vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfnmacc_vv_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                                         vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfnmacc_vf_f16m2_tu(vfloat16m2_t vd, _Float16 rs1,
                                         vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfnmacc_vv_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                                         vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfnmacc_vf_f16m4_tu(vfloat16m4_t vd, _Float16 rs1,
                                         vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfnmacc_vv_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                                         vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfnmacc_vf_f16m8_tu(vfloat16m8_t vd, _Float16 rs1,
                                         vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfnmacc_vv_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs1,
                                           vfloat32mf2_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfnmacc_vf_f32mf2_tu(vfloat32mf2_t vd, float rs1,
                                           vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfnmacc_vv_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                                         vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfnmacc_vf_f32m1_tu(vfloat32m1_t vd, float rs1,
                                         vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfnmacc_vv_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                                         vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfnmacc_vf_f32m2_tu(vfloat32m2_t vd, float rs1,
                                         vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfnmacc_vv_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                                         vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfnmacc_vf_f32m4_tu(vfloat32m4_t vd, float rs1,
                                         vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfnmacc_vv_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                                         vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfnmacc_vf_f32m8_tu(vfloat32m8_t vd, float rs1,
                                         vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfnmacc_vv_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                                         vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfnmacc_vf_f64m1_tu(vfloat64m1_t vd, double rs1,
                                         vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfnmacc_vv_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                                         vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfnmacc_vf_f64m2_tu(vfloat64m2_t vd, double rs1,
                                         vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfnmacc_vv_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                                         vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfnmacc_vf_f64m4_tu(vfloat64m4_t vd, double rs1,
                                         vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfnmacc_vv_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                                         vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfnmacc_vf_f64m8_tu(vfloat64m8_t vd, double rs1,
                                         vfloat64m8_t vs2, size_t vl);
// vfmsac, `_tu` variants, for f16/f32/f64 elements at each listed LMUL.
// Parameter order is (vd, vs1 | rs1, vs2, vl): vd has the same type as the
// return value, the second operand is a vector (`_vv_`) or a scalar of the
// element type (`_vf_`: _Float16, float or double), and vl is a size_t.
// NOTE(review): per the RISC-V V spec vfmsac should compute
// vd[i] = +(vs1[i] * vs2[i]) - vd[i], and `_tu` presumably means
// tail-undisturbed -- confirm against the specification.
vfloat16mf4_t __riscv_vfmsac_vv_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs1,
                                          vfloat16mf4_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfmsac_vf_f16mf4_tu(vfloat16mf4_t vd, _Float16 rs1,
                                          vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfmsac_vv_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs1,
                                          vfloat16mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfmsac_vf_f16mf2_tu(vfloat16mf2_t vd, _Float16 rs1,
                                          vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmsac_vv_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                                        vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmsac_vf_f16m1_tu(vfloat16m1_t vd, _Float16 rs1,
                                        vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmsac_vv_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                                        vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmsac_vf_f16m2_tu(vfloat16m2_t vd, _Float16 rs1,
                                        vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmsac_vv_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                                        vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmsac_vf_f16m4_tu(vfloat16m4_t vd, _Float16 rs1,
                                        vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmsac_vv_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                                        vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmsac_vf_f16m8_tu(vfloat16m8_t vd, _Float16 rs1,
                                        vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfmsac_vv_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs1,
                                          vfloat32mf2_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfmsac_vf_f32mf2_tu(vfloat32mf2_t vd, float rs1,
                                          vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmsac_vv_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                                        vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmsac_vf_f32m1_tu(vfloat32m1_t vd, float rs1,
                                        vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmsac_vv_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                                        vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmsac_vf_f32m2_tu(vfloat32m2_t vd, float rs1,
                                        vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmsac_vv_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                                        vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmsac_vf_f32m4_tu(vfloat32m4_t vd, float rs1,
                                        vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmsac_vv_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                                        vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmsac_vf_f32m8_tu(vfloat32m8_t vd, float rs1,
                                        vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmsac_vv_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                                        vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmsac_vf_f64m1_tu(vfloat64m1_t vd, double rs1,
                                        vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmsac_vv_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                                        vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmsac_vf_f64m2_tu(vfloat64m2_t vd, double rs1,
                                        vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmsac_vv_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                                        vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmsac_vf_f64m4_tu(vfloat64m4_t vd, double rs1,
                                        vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmsac_vv_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                                        vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmsac_vf_f64m8_tu(vfloat64m8_t vd, double rs1,
                                        vfloat64m8_t vs2, size_t vl);
// vfnmsac, `_tu` variants, for f16/f32/f64 elements at each listed LMUL.
// Parameter order is (vd, vs1 | rs1, vs2, vl): vd has the same type as the
// return value, the second operand is a vector (`_vv_`) or a scalar of the
// element type (`_vf_`: _Float16, float or double), and vl is a size_t.
// NOTE(review): per the RISC-V V spec vfnmsac should compute
// vd[i] = -(vs1[i] * vs2[i]) + vd[i], and `_tu` presumably means
// tail-undisturbed -- confirm against the specification.
vfloat16mf4_t __riscv_vfnmsac_vv_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs1,
                                           vfloat16mf4_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfnmsac_vf_f16mf4_tu(vfloat16mf4_t vd, _Float16 rs1,
                                           vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmsac_vv_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs1,
                                           vfloat16mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmsac_vf_f16mf2_tu(vfloat16mf2_t vd, _Float16 rs1,
                                           vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmsac_vv_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                                         vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmsac_vf_f16m1_tu(vfloat16m1_t vd, _Float16 rs1,
                                         vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfnmsac_vv_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                                         vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfnmsac_vf_f16m2_tu(vfloat16m2_t vd, _Float16 rs1,
                                         vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfnmsac_vv_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                                         vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfnmsac_vf_f16m4_tu(vfloat16m4_t vd, _Float16 rs1,
                                         vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfnmsac_vv_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                                         vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfnmsac_vf_f16m8_tu(vfloat16m8_t vd, _Float16 rs1,
                                         vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfnmsac_vv_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs1,
                                           vfloat32mf2_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfnmsac_vf_f32mf2_tu(vfloat32mf2_t vd, float rs1,
                                           vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfnmsac_vv_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                                         vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfnmsac_vf_f32m1_tu(vfloat32m1_t vd, float rs1,
                                         vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfnmsac_vv_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                                         vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfnmsac_vf_f32m2_tu(vfloat32m2_t vd, float rs1,
                                         vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfnmsac_vv_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                                         vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfnmsac_vf_f32m4_tu(vfloat32m4_t vd, float rs1,
                                         vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfnmsac_vv_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                                         vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfnmsac_vf_f32m8_tu(vfloat32m8_t vd, float rs1,
                                         vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfnmsac_vv_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                                         vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfnmsac_vf_f64m1_tu(vfloat64m1_t vd, double rs1,
                                         vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfnmsac_vv_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                                         vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfnmsac_vf_f64m2_tu(vfloat64m2_t vd, double rs1,
                                         vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfnmsac_vv_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                                         vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfnmsac_vf_f64m4_tu(vfloat64m4_t vd, double rs1,
                                         vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfnmsac_vv_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                                         vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfnmsac_vf_f64m8_tu(vfloat64m8_t vd, double rs1,
                                         vfloat64m8_t vs2, size_t vl);
// vfmadd, `_tu` variants, for f16/f32/f64 elements at each listed LMUL.
// Parameter order is (vd, vs1 | rs1, vs2, vl): vd has the same type as the
// return value, the second operand is a vector (`_vv_`) or a scalar of the
// element type (`_vf_`: _Float16, float or double), and vl is a size_t.
// NOTE(review): per the RISC-V V spec vfmadd should compute
// vd[i] = +(vs1[i] * vd[i]) + vs2[i] (vd is a multiplicand here, unlike the
// *acc/*sac forms), and `_tu` presumably means tail-undisturbed -- confirm
// against the specification.
vfloat16mf4_t __riscv_vfmadd_vv_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs1,
                                          vfloat16mf4_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfmadd_vf_f16mf4_tu(vfloat16mf4_t vd, _Float16 rs1,
                                          vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfmadd_vv_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs1,
                                          vfloat16mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfmadd_vf_f16mf2_tu(vfloat16mf2_t vd, _Float16 rs1,
                                          vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmadd_vv_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                                        vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmadd_vf_f16m1_tu(vfloat16m1_t vd, _Float16 rs1,
                                        vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmadd_vv_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                                        vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmadd_vf_f16m2_tu(vfloat16m2_t vd, _Float16 rs1,
                                        vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmadd_vv_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                                        vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmadd_vf_f16m4_tu(vfloat16m4_t vd, _Float16 rs1,
                                        vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmadd_vv_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                                        vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmadd_vf_f16m8_tu(vfloat16m8_t vd, _Float16 rs1,
                                        vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfmadd_vv_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs1,
                                          vfloat32mf2_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfmadd_vf_f32mf2_tu(vfloat32mf2_t vd, float rs1,
                                          vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmadd_vv_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                                        vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmadd_vf_f32m1_tu(vfloat32m1_t vd, float rs1,
                                        vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmadd_vv_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                                        vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmadd_vf_f32m2_tu(vfloat32m2_t vd, float rs1,
                                        vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmadd_vv_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                                        vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmadd_vf_f32m4_tu(vfloat32m4_t vd, float rs1,
                                        vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmadd_vv_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                                        vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmadd_vf_f32m8_tu(vfloat32m8_t vd, float rs1,
                                        vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmadd_vv_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                                        vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmadd_vf_f64m1_tu(vfloat64m1_t vd, double rs1,
                                        vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmadd_vv_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                                        vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmadd_vf_f64m2_tu(vfloat64m2_t vd, double rs1,
                                        vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmadd_vv_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                                        vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmadd_vf_f64m4_tu(vfloat64m4_t vd, double rs1,
                                        vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmadd_vv_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                                        vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmadd_vf_f64m8_tu(vfloat64m8_t vd, double rs1,
                                        vfloat64m8_t vs2, size_t vl);
// vfnmadd, `_tu` variants, for f16/f32/f64 elements at each listed LMUL.
// Parameter order is (vd, vs1 | rs1, vs2, vl): vd has the same type as the
// return value, the second operand is a vector (`_vv_`) or a scalar of the
// element type (`_vf_`: _Float16, float or double), and vl is a size_t.
// NOTE(review): per the RISC-V V spec vfnmadd should compute
// vd[i] = -(vs1[i] * vd[i]) - vs2[i], and `_tu` presumably means
// tail-undisturbed -- confirm against the specification.
vfloat16mf4_t __riscv_vfnmadd_vv_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs1,
                                           vfloat16mf4_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfnmadd_vf_f16mf4_tu(vfloat16mf4_t vd, _Float16 rs1,
                                           vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmadd_vv_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs1,
                                           vfloat16mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmadd_vf_f16mf2_tu(vfloat16mf2_t vd, _Float16 rs1,
                                           vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmadd_vv_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                                         vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmadd_vf_f16m1_tu(vfloat16m1_t vd, _Float16 rs1,
                                         vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfnmadd_vv_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                                         vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfnmadd_vf_f16m2_tu(vfloat16m2_t vd, _Float16 rs1,
                                         vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfnmadd_vv_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                                         vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfnmadd_vf_f16m4_tu(vfloat16m4_t vd, _Float16 rs1,
                                         vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfnmadd_vv_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                                         vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfnmadd_vf_f16m8_tu(vfloat16m8_t vd, _Float16 rs1,
                                         vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfnmadd_vv_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs1,
                                           vfloat32mf2_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfnmadd_vf_f32mf2_tu(vfloat32mf2_t vd, float rs1,
                                           vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfnmadd_vv_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                                         vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfnmadd_vf_f32m1_tu(vfloat32m1_t vd, float rs1,
                                         vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfnmadd_vv_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                                         vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfnmadd_vf_f32m2_tu(vfloat32m2_t vd, float rs1,
                                         vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfnmadd_vv_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                                         vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfnmadd_vf_f32m4_tu(vfloat32m4_t vd, float rs1,
                                         vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfnmadd_vv_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                                         vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfnmadd_vf_f32m8_tu(vfloat32m8_t vd, float rs1,
                                         vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfnmadd_vv_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                                         vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfnmadd_vf_f64m1_tu(vfloat64m1_t vd, double rs1,
                                         vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfnmadd_vv_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                                         vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfnmadd_vf_f64m2_tu(vfloat64m2_t vd, double rs1,
                                         vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfnmadd_vv_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                                         vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfnmadd_vf_f64m4_tu(vfloat64m4_t vd, double rs1,
                                         vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfnmadd_vv_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                                         vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfnmadd_vf_f64m8_tu(vfloat64m8_t vd, double rs1,
                                         vfloat64m8_t vs2, size_t vl);
// vfmsub, `_tu` variants: for each element type/LMUL combination there is a
// `_vv` prototype (vector vs1) and a `_vf` prototype (scalar rs1 typed
// `_Float16`, `float` or `double` to match the element width). Each takes
// vd, vs1/rs1, vs2 and the vector length vl, and returns the same type as vd.
// NOTE(review): per the RVV spec this family presumably computes
// vd[i] = (vs1[i] * vd[i]) - vs2[i], with `_tu` selecting the
// tail-undisturbed policy -- not verifiable from this listing; confirm.
vfloat16mf4_t __riscv_vfmsub_vv_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs1,
                                          vfloat16mf4_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfmsub_vf_f16mf4_tu(vfloat16mf4_t vd, _Float16 rs1,
                                          vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfmsub_vv_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs1,
                                          vfloat16mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfmsub_vf_f16mf2_tu(vfloat16mf2_t vd, _Float16 rs1,
                                          vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmsub_vv_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                                        vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmsub_vf_f16m1_tu(vfloat16m1_t vd, _Float16 rs1,
                                        vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmsub_vv_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                                        vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmsub_vf_f16m2_tu(vfloat16m2_t vd, _Float16 rs1,
                                        vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmsub_vv_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                                        vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmsub_vf_f16m4_tu(vfloat16m4_t vd, _Float16 rs1,
                                        vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmsub_vv_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                                        vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmsub_vf_f16m8_tu(vfloat16m8_t vd, _Float16 rs1,
                                        vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfmsub_vv_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs1,
                                          vfloat32mf2_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfmsub_vf_f32mf2_tu(vfloat32mf2_t vd, float rs1,
                                          vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmsub_vv_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                                        vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmsub_vf_f32m1_tu(vfloat32m1_t vd, float rs1,
                                        vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmsub_vv_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                                        vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmsub_vf_f32m2_tu(vfloat32m2_t vd, float rs1,
                                        vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmsub_vv_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                                        vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmsub_vf_f32m4_tu(vfloat32m4_t vd, float rs1,
                                        vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmsub_vv_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                                        vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmsub_vf_f32m8_tu(vfloat32m8_t vd, float rs1,
                                        vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmsub_vv_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                                        vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmsub_vf_f64m1_tu(vfloat64m1_t vd, double rs1,
                                        vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmsub_vv_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                                        vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmsub_vf_f64m2_tu(vfloat64m2_t vd, double rs1,
                                        vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmsub_vv_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                                        vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmsub_vf_f64m4_tu(vfloat64m4_t vd, double rs1,
                                        vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmsub_vv_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                                        vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmsub_vf_f64m8_tu(vfloat64m8_t vd, double rs1,
                                        vfloat64m8_t vs2, size_t vl);
// vfnmsub, `_tu` variants: for each element type/LMUL combination there is a
// `_vv` prototype (vector vs1) and a `_vf` prototype (scalar rs1 typed
// `_Float16`, `float` or `double` to match the element width). Each takes
// vd, vs1/rs1, vs2 and the vector length vl, and returns the same type as vd.
// NOTE(review): per the RVV spec this family presumably computes
// vd[i] = -(vs1[i] * vd[i]) + vs2[i], with `_tu` selecting the
// tail-undisturbed policy -- not verifiable from this listing; confirm.
vfloat16mf4_t __riscv_vfnmsub_vv_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs1,
                                           vfloat16mf4_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfnmsub_vf_f16mf4_tu(vfloat16mf4_t vd, _Float16 rs1,
                                           vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmsub_vv_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs1,
                                           vfloat16mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmsub_vf_f16mf2_tu(vfloat16mf2_t vd, _Float16 rs1,
                                           vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmsub_vv_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                                         vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmsub_vf_f16m1_tu(vfloat16m1_t vd, _Float16 rs1,
                                         vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfnmsub_vv_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                                         vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfnmsub_vf_f16m2_tu(vfloat16m2_t vd, _Float16 rs1,
                                         vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfnmsub_vv_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                                         vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfnmsub_vf_f16m4_tu(vfloat16m4_t vd, _Float16 rs1,
                                         vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfnmsub_vv_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                                         vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfnmsub_vf_f16m8_tu(vfloat16m8_t vd, _Float16 rs1,
                                         vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfnmsub_vv_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs1,
                                           vfloat32mf2_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfnmsub_vf_f32mf2_tu(vfloat32mf2_t vd, float rs1,
                                           vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfnmsub_vv_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                                         vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfnmsub_vf_f32m1_tu(vfloat32m1_t vd, float rs1,
                                         vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfnmsub_vv_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                                         vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfnmsub_vf_f32m2_tu(vfloat32m2_t vd, float rs1,
                                         vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfnmsub_vv_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                                         vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfnmsub_vf_f32m4_tu(vfloat32m4_t vd, float rs1,
                                         vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfnmsub_vv_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                                         vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfnmsub_vf_f32m8_tu(vfloat32m8_t vd, float rs1,
                                         vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfnmsub_vv_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                                         vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfnmsub_vf_f64m1_tu(vfloat64m1_t vd, double rs1,
                                         vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfnmsub_vv_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                                         vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfnmsub_vf_f64m2_tu(vfloat64m2_t vd, double rs1,
                                         vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfnmsub_vv_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                                         vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfnmsub_vf_f64m4_tu(vfloat64m4_t vd, double rs1,
                                         vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfnmsub_vv_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                                         vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfnmsub_vf_f64m8_tu(vfloat64m8_t vd, double rs1,
                                         vfloat64m8_t vs2, size_t vl);
// masked functions
// vfmacc, `_tum` variants: for each element type/LMUL combination there is a
// `_vv` prototype (vector vs1) and a `_vf` prototype (scalar rs1 typed
// `_Float16`, `float` or `double` to match the element width). Each takes a
// leading mask vm, then vd, vs1/rs1, vs2 and the vector length vl, and
// returns the same type as vd. The mask type is vboolN_t with
// N = element width / LMUL (e.g. f16mf4 -> vbool64_t, f64m8 -> vbool8_t).
// NOTE(review): per the RVV spec this family presumably computes
// vd[i] = (vs1[i] * vs2[i]) + vd[i], and `_tum` is presumably the
// tail-undisturbed, mask-agnostic policy -- not verifiable from this
// listing; confirm against the intrinsics spec.
vfloat16mf4_t __riscv_vfmacc_vv_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                           vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                           size_t vl);
vfloat16mf4_t __riscv_vfmacc_vf_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                           _Float16 rs1, vfloat16mf4_t vs2,
                                           size_t vl);
vfloat16mf2_t __riscv_vfmacc_vv_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                           vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                           size_t vl);
vfloat16mf2_t __riscv_vfmacc_vf_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                           _Float16 rs1, vfloat16mf2_t vs2,
                                           size_t vl);
vfloat16m1_t __riscv_vfmacc_vv_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                         vfloat16m1_t vs1, vfloat16m1_t vs2,
                                         size_t vl);
vfloat16m1_t __riscv_vfmacc_vf_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                         _Float16 rs1, vfloat16m1_t vs2,
                                         size_t vl);
vfloat16m2_t __riscv_vfmacc_vv_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                         vfloat16m2_t vs1, vfloat16m2_t vs2,
                                         size_t vl);
vfloat16m2_t __riscv_vfmacc_vf_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                         _Float16 rs1, vfloat16m2_t vs2,
                                         size_t vl);
vfloat16m4_t __riscv_vfmacc_vv_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                         vfloat16m4_t vs1, vfloat16m4_t vs2,
                                         size_t vl);
vfloat16m4_t __riscv_vfmacc_vf_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                         _Float16 rs1, vfloat16m4_t vs2,
                                         size_t vl);
vfloat16m8_t __riscv_vfmacc_vv_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                         vfloat16m8_t vs1, vfloat16m8_t vs2,
                                         size_t vl);
vfloat16m8_t __riscv_vfmacc_vf_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                         _Float16 rs1, vfloat16m8_t vs2,
                                         size_t vl);
vfloat32mf2_t __riscv_vfmacc_vv_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                           size_t vl);
vfloat32mf2_t __riscv_vfmacc_vf_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                           float rs1, vfloat32mf2_t vs2,
                                           size_t vl);
vfloat32m1_t __riscv_vfmacc_vv_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs1, vfloat32m1_t vs2,
                                         size_t vl);
vfloat32m1_t __riscv_vfmacc_vf_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                         float rs1, vfloat32m1_t vs2,
                                         size_t vl);
vfloat32m2_t __riscv_vfmacc_vv_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs1, vfloat32m2_t vs2,
                                         size_t vl);
vfloat32m2_t __riscv_vfmacc_vf_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                         float rs1, vfloat32m2_t vs2,
                                         size_t vl);
vfloat32m4_t __riscv_vfmacc_vv_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs1, vfloat32m4_t vs2,
                                         size_t vl);
vfloat32m4_t __riscv_vfmacc_vf_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                         float rs1, vfloat32m4_t vs2,
                                         size_t vl);
vfloat32m8_t __riscv_vfmacc_vv_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs1, vfloat32m8_t vs2,
                                         size_t vl);
vfloat32m8_t __riscv_vfmacc_vf_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                         float rs1, vfloat32m8_t vs2,
                                         size_t vl);
vfloat64m1_t __riscv_vfmacc_vv_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs1, vfloat64m1_t vs2,
                                         size_t vl);
vfloat64m1_t __riscv_vfmacc_vf_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                         double rs1, vfloat64m1_t vs2,
                                         size_t vl);
vfloat64m2_t __riscv_vfmacc_vv_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs1, vfloat64m2_t vs2,
                                         size_t vl);
vfloat64m2_t __riscv_vfmacc_vf_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                         double rs1, vfloat64m2_t vs2,
                                         size_t vl);
vfloat64m4_t __riscv_vfmacc_vv_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs1, vfloat64m4_t vs2,
                                         size_t vl);
vfloat64m4_t __riscv_vfmacc_vf_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                         double rs1, vfloat64m4_t vs2,
                                         size_t vl);
vfloat64m8_t __riscv_vfmacc_vv_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs1, vfloat64m8_t vs2,
                                         size_t vl);
vfloat64m8_t __riscv_vfmacc_vf_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                         double rs1, vfloat64m8_t vs2,
                                         size_t vl);
// vfnmacc, `_tum` variants: for each element type/LMUL combination there is
// a `_vv` prototype (vector vs1) and a `_vf` prototype (scalar rs1 typed
// `_Float16`, `float` or `double` to match the element width). Each takes a
// leading mask vm, then vd, vs1/rs1, vs2 and the vector length vl, and
// returns the same type as vd. The mask type is vboolN_t with
// N = element width / LMUL (e.g. f16mf4 -> vbool64_t, f64m8 -> vbool8_t).
// NOTE(review): per the RVV spec this family presumably computes
// vd[i] = -(vs1[i] * vs2[i]) - vd[i], and `_tum` is presumably the
// tail-undisturbed, mask-agnostic policy -- not verifiable from this
// listing; confirm against the intrinsics spec.
vfloat16mf4_t __riscv_vfnmacc_vv_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                            vfloat16mf4_t vs1,
                                            vfloat16mf4_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfnmacc_vf_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                            _Float16 rs1, vfloat16mf4_t vs2,
                                            size_t vl);
vfloat16mf2_t __riscv_vfnmacc_vv_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                            vfloat16mf2_t vs1,
                                            vfloat16mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmacc_vf_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                            _Float16 rs1, vfloat16mf2_t vs2,
                                            size_t vl);
vfloat16m1_t __riscv_vfnmacc_vv_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                          vfloat16m1_t vs1, vfloat16m1_t vs2,
                                          size_t vl);
vfloat16m1_t __riscv_vfnmacc_vf_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                          _Float16 rs1, vfloat16m1_t vs2,
                                          size_t vl);
vfloat16m2_t __riscv_vfnmacc_vv_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                          vfloat16m2_t vs1, vfloat16m2_t vs2,
                                          size_t vl);
vfloat16m2_t __riscv_vfnmacc_vf_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                          _Float16 rs1, vfloat16m2_t vs2,
                                          size_t vl);
vfloat16m4_t __riscv_vfnmacc_vv_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                          vfloat16m4_t vs1, vfloat16m4_t vs2,
                                          size_t vl);
vfloat16m4_t __riscv_vfnmacc_vf_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                          _Float16 rs1, vfloat16m4_t vs2,
                                          size_t vl);
vfloat16m8_t __riscv_vfnmacc_vv_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                          vfloat16m8_t vs1, vfloat16m8_t vs2,
                                          size_t vl);
vfloat16m8_t __riscv_vfnmacc_vf_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                          _Float16 rs1, vfloat16m8_t vs2,
                                          size_t vl);
vfloat32mf2_t __riscv_vfnmacc_vv_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs1,
                                            vfloat32mf2_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfnmacc_vf_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                            float rs1, vfloat32mf2_t vs2,
                                            size_t vl);
vfloat32m1_t __riscv_vfnmacc_vv_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs1, vfloat32m1_t vs2,
                                          size_t vl);
vfloat32m1_t __riscv_vfnmacc_vf_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                          float rs1, vfloat32m1_t vs2,
                                          size_t vl);
vfloat32m2_t __riscv_vfnmacc_vv_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs1, vfloat32m2_t vs2,
                                          size_t vl);
vfloat32m2_t __riscv_vfnmacc_vf_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                          float rs1, vfloat32m2_t vs2,
                                          size_t vl);
vfloat32m4_t __riscv_vfnmacc_vv_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs1, vfloat32m4_t vs2,
                                          size_t vl);
vfloat32m4_t __riscv_vfnmacc_vf_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                          float rs1, vfloat32m4_t vs2,
                                          size_t vl);
vfloat32m8_t __riscv_vfnmacc_vv_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs1, vfloat32m8_t vs2,
                                          size_t vl);
vfloat32m8_t __riscv_vfnmacc_vf_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                          float rs1, vfloat32m8_t vs2,
                                          size_t vl);
vfloat64m1_t __riscv_vfnmacc_vv_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs1, vfloat64m1_t vs2,
                                          size_t vl);
vfloat64m1_t __riscv_vfnmacc_vf_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                          double rs1, vfloat64m1_t vs2,
                                          size_t vl);
vfloat64m2_t __riscv_vfnmacc_vv_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs1, vfloat64m2_t vs2,
                                          size_t vl);
vfloat64m2_t __riscv_vfnmacc_vf_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                          double rs1, vfloat64m2_t vs2,
                                          size_t vl);
vfloat64m4_t __riscv_vfnmacc_vv_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs1, vfloat64m4_t vs2,
                                          size_t vl);
vfloat64m4_t __riscv_vfnmacc_vf_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                          double rs1, vfloat64m4_t vs2,
                                          size_t vl);
vfloat64m8_t __riscv_vfnmacc_vv_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs1, vfloat64m8_t vs2,
                                          size_t vl);
vfloat64m8_t __riscv_vfnmacc_vf_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                          double rs1, vfloat64m8_t vs2,
                                          size_t vl);
// vfmsac, `_tum` variants: for each element type/LMUL combination there is a
// `_vv` prototype (vector vs1) and a `_vf` prototype (scalar rs1 typed
// `_Float16`, `float` or `double` to match the element width). Each takes a
// leading mask vm, then vd, vs1/rs1, vs2 and the vector length vl, and
// returns the same type as vd. The mask type is vboolN_t with
// N = element width / LMUL (e.g. f16mf4 -> vbool64_t, f64m8 -> vbool8_t).
// NOTE(review): per the RVV spec this family presumably computes
// vd[i] = (vs1[i] * vs2[i]) - vd[i], and `_tum` is presumably the
// tail-undisturbed, mask-agnostic policy -- not verifiable from this
// listing; confirm against the intrinsics spec.
vfloat16mf4_t __riscv_vfmsac_vv_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                           vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                           size_t vl);
vfloat16mf4_t __riscv_vfmsac_vf_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                           _Float16 rs1, vfloat16mf4_t vs2,
                                           size_t vl);
vfloat16mf2_t __riscv_vfmsac_vv_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                           vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                           size_t vl);
vfloat16mf2_t __riscv_vfmsac_vf_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                           _Float16 rs1, vfloat16mf2_t vs2,
                                           size_t vl);
vfloat16m1_t __riscv_vfmsac_vv_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                         vfloat16m1_t vs1, vfloat16m1_t vs2,
                                         size_t vl);
vfloat16m1_t __riscv_vfmsac_vf_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                         _Float16 rs1, vfloat16m1_t vs2,
                                         size_t vl);
vfloat16m2_t __riscv_vfmsac_vv_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                         vfloat16m2_t vs1, vfloat16m2_t vs2,
                                         size_t vl);
vfloat16m2_t __riscv_vfmsac_vf_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                         _Float16 rs1, vfloat16m2_t vs2,
                                         size_t vl);
vfloat16m4_t __riscv_vfmsac_vv_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                         vfloat16m4_t vs1, vfloat16m4_t vs2,
                                         size_t vl);
vfloat16m4_t __riscv_vfmsac_vf_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                         _Float16 rs1, vfloat16m4_t vs2,
                                         size_t vl);
vfloat16m8_t __riscv_vfmsac_vv_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                         vfloat16m8_t vs1, vfloat16m8_t vs2,
                                         size_t vl);
vfloat16m8_t __riscv_vfmsac_vf_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                         _Float16 rs1, vfloat16m8_t vs2,
                                         size_t vl);
vfloat32mf2_t __riscv_vfmsac_vv_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                           size_t vl);
vfloat32mf2_t __riscv_vfmsac_vf_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                           float rs1, vfloat32mf2_t vs2,
                                           size_t vl);
vfloat32m1_t __riscv_vfmsac_vv_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs1, vfloat32m1_t vs2,
                                         size_t vl);
vfloat32m1_t __riscv_vfmsac_vf_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                         float rs1, vfloat32m1_t vs2,
                                         size_t vl);
vfloat32m2_t __riscv_vfmsac_vv_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs1, vfloat32m2_t vs2,
                                         size_t vl);
vfloat32m2_t __riscv_vfmsac_vf_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                         float rs1, vfloat32m2_t vs2,
                                         size_t vl);
vfloat32m4_t __riscv_vfmsac_vv_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs1, vfloat32m4_t vs2,
                                         size_t vl);
vfloat32m4_t __riscv_vfmsac_vf_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                         float rs1, vfloat32m4_t vs2,
                                         size_t vl);
vfloat32m8_t __riscv_vfmsac_vv_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs1, vfloat32m8_t vs2,
                                         size_t vl);
vfloat32m8_t __riscv_vfmsac_vf_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                         float rs1, vfloat32m8_t vs2,
                                         size_t vl);
vfloat64m1_t __riscv_vfmsac_vv_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs1, vfloat64m1_t vs2,
                                         size_t vl);
vfloat64m1_t __riscv_vfmsac_vf_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                         double rs1, vfloat64m1_t vs2,
                                         size_t vl);
vfloat64m2_t __riscv_vfmsac_vv_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs1, vfloat64m2_t vs2,
                                         size_t vl);
vfloat64m2_t __riscv_vfmsac_vf_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                         double rs1, vfloat64m2_t vs2,
                                         size_t vl);
vfloat64m4_t __riscv_vfmsac_vv_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs1, vfloat64m4_t vs2,
                                         size_t vl);
vfloat64m4_t __riscv_vfmsac_vf_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                         double rs1, vfloat64m4_t vs2,
                                         size_t vl);
vfloat64m8_t __riscv_vfmsac_vv_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs1, vfloat64m8_t vs2,
                                         size_t vl);
vfloat64m8_t __riscv_vfmsac_vf_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                         double rs1, vfloat64m8_t vs2,
                                         size_t vl);
// vfnmsac, `_tum` variants: for each element type/LMUL combination there is
// a `_vv` prototype (vector vs1) and a `_vf` prototype (scalar rs1 typed
// `_Float16`, `float` or `double` to match the element width). Each takes a
// leading mask vm, then vd, vs1/rs1, vs2 and the vector length vl, and
// returns the same type as vd. The mask type is vboolN_t with
// N = element width / LMUL (e.g. f16mf4 -> vbool64_t, f64m8 -> vbool8_t).
// NOTE(review): per the RVV spec this family presumably computes
// vd[i] = -(vs1[i] * vs2[i]) + vd[i], and `_tum` is presumably the
// tail-undisturbed, mask-agnostic policy -- not verifiable from this
// listing; confirm against the intrinsics spec.
vfloat16mf4_t __riscv_vfnmsac_vv_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                            vfloat16mf4_t vs1,
                                            vfloat16mf4_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfnmsac_vf_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                            _Float16 rs1, vfloat16mf4_t vs2,
                                            size_t vl);
vfloat16mf2_t __riscv_vfnmsac_vv_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                            vfloat16mf2_t vs1,
                                            vfloat16mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmsac_vf_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                            _Float16 rs1, vfloat16mf2_t vs2,
                                            size_t vl);
vfloat16m1_t __riscv_vfnmsac_vv_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                          vfloat16m1_t vs1, vfloat16m1_t vs2,
                                          size_t vl);
vfloat16m1_t __riscv_vfnmsac_vf_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                          _Float16 rs1, vfloat16m1_t vs2,
                                          size_t vl);
vfloat16m2_t __riscv_vfnmsac_vv_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                          vfloat16m2_t vs1, vfloat16m2_t vs2,
                                          size_t vl);
vfloat16m2_t __riscv_vfnmsac_vf_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                          _Float16 rs1, vfloat16m2_t vs2,
                                          size_t vl);
vfloat16m4_t __riscv_vfnmsac_vv_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                          vfloat16m4_t vs1, vfloat16m4_t vs2,
                                          size_t vl);
vfloat16m4_t __riscv_vfnmsac_vf_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                          _Float16 rs1, vfloat16m4_t vs2,
                                          size_t vl);
vfloat16m8_t __riscv_vfnmsac_vv_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                          vfloat16m8_t vs1, vfloat16m8_t vs2,
                                          size_t vl);
vfloat16m8_t __riscv_vfnmsac_vf_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                          _Float16 rs1, vfloat16m8_t vs2,
                                          size_t vl);
vfloat32mf2_t __riscv_vfnmsac_vv_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs1,
                                            vfloat32mf2_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfnmsac_vf_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                            float rs1, vfloat32mf2_t vs2,
                                            size_t vl);
vfloat32m1_t __riscv_vfnmsac_vv_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs1, vfloat32m1_t vs2,
                                          size_t vl);
vfloat32m1_t __riscv_vfnmsac_vf_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                          float rs1, vfloat32m1_t vs2,
                                          size_t vl);
vfloat32m2_t __riscv_vfnmsac_vv_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs1, vfloat32m2_t vs2,
                                          size_t vl);
vfloat32m2_t __riscv_vfnmsac_vf_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                          float rs1, vfloat32m2_t vs2,
                                          size_t vl);
vfloat32m4_t __riscv_vfnmsac_vv_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs1, vfloat32m4_t vs2,
                                          size_t vl);
vfloat32m4_t __riscv_vfnmsac_vf_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                          float rs1, vfloat32m4_t vs2,
                                          size_t vl);
vfloat32m8_t __riscv_vfnmsac_vv_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs1, vfloat32m8_t vs2,
                                          size_t vl);
vfloat32m8_t __riscv_vfnmsac_vf_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                          float rs1, vfloat32m8_t vs2,
                                          size_t vl);
vfloat64m1_t __riscv_vfnmsac_vv_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs1, vfloat64m1_t vs2,
                                          size_t vl);
vfloat64m1_t __riscv_vfnmsac_vf_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                          double rs1, vfloat64m1_t vs2,
                                          size_t vl);
vfloat64m2_t __riscv_vfnmsac_vv_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs1, vfloat64m2_t vs2,
                                          size_t vl);
vfloat64m2_t __riscv_vfnmsac_vf_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                          double rs1, vfloat64m2_t vs2,
                                          size_t vl);
vfloat64m4_t __riscv_vfnmsac_vv_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs1, vfloat64m4_t vs2,
                                          size_t vl);
vfloat64m4_t __riscv_vfnmsac_vf_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                          double rs1, vfloat64m4_t vs2,
                                          size_t vl);
vfloat64m8_t __riscv_vfnmsac_vv_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs1, vfloat64m8_t vs2,
                                          size_t vl);
vfloat64m8_t __riscv_vfnmsac_vf_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                          double rs1, vfloat64m8_t vs2,
                                          size_t vl);
// vfmadd, `_tum` variants: each element type/LMUL combination has a `_vv`
// prototype (vector vs1) and a `_vf` prototype (scalar rs1 typed to match
// the element width, e.g. `_Float16` for f16 and `float` for f32). Each
// takes a leading mask vm, then vd, vs1/rs1, vs2 and the vector length vl,
// and returns the same type as vd. The mask type is vboolN_t with
// N = element width / LMUL (e.g. f16mf4 -> vbool64_t, f16m8 -> vbool2_t).
// NOTE(review): per the RVV spec this family presumably computes
// vd[i] = (vs1[i] * vd[i]) + vs2[i], and `_tum` is presumably the
// tail-undisturbed, mask-agnostic policy -- not verifiable from this
// listing; confirm against the intrinsics spec.
vfloat16mf4_t __riscv_vfmadd_vv_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                           vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                           size_t vl);
vfloat16mf4_t __riscv_vfmadd_vf_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                           _Float16 rs1, vfloat16mf4_t vs2,
                                           size_t vl);
vfloat16mf2_t __riscv_vfmadd_vv_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                           vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                           size_t vl);
vfloat16mf2_t __riscv_vfmadd_vf_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                           _Float16 rs1, vfloat16mf2_t vs2,
                                           size_t vl);
vfloat16m1_t __riscv_vfmadd_vv_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                         vfloat16m1_t vs1, vfloat16m1_t vs2,
                                         size_t vl);
vfloat16m1_t __riscv_vfmadd_vf_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                         _Float16 rs1, vfloat16m1_t vs2,
                                         size_t vl);
vfloat16m2_t __riscv_vfmadd_vv_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                         vfloat16m2_t vs1, vfloat16m2_t vs2,
                                         size_t vl);
vfloat16m2_t __riscv_vfmadd_vf_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                         _Float16 rs1, vfloat16m2_t vs2,
                                         size_t vl);
vfloat16m4_t __riscv_vfmadd_vv_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                         vfloat16m4_t vs1, vfloat16m4_t vs2,
                                         size_t vl);
vfloat16m4_t __riscv_vfmadd_vf_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                         _Float16 rs1, vfloat16m4_t vs2,
                                         size_t vl);
vfloat16m8_t __riscv_vfmadd_vv_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                         vfloat16m8_t vs1, vfloat16m8_t vs2,
                                         size_t vl);
vfloat16m8_t __riscv_vfmadd_vf_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                         _Float16 rs1, vfloat16m8_t vs2,
                                         size_t vl);
vfloat32mf2_t __riscv_vfmadd_vv_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                           size_t vl);
vfloat32mf2_t __riscv_vfmadd_vf_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                           float rs1, vfloat32mf2_t vs2,
                                           size_t vl);
vfloat32m1_t __riscv_vfmadd_vv_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs1, vfloat32m1_t vs2,
                                         size_t vl);
vfloat32m1_t __riscv_vfmadd_vf_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                         float rs1, vfloat32m1_t vs2,
                                         size_t vl);
vfloat32m2_t __riscv_vfmadd_vv_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs1, vfloat32m2_t vs2,
                                         size_t vl);
vfloat32m2_t __riscv_vfmadd_vf_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                         float rs1, vfloat32m2_t vs2,
                                         size_t vl);
vfloat32m4_t __riscv_vfmadd_vv_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs1, vfloat32m4_t vs2,
                                         size_t vl);
vfloat32m4_t __riscv_vfmadd_vf_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                         float rs1, vfloat32m4_t vs2,
                                         size_t vl);
vfloat32m8_t __riscv_vfmadd_vv_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs1, vfloat32m8_t vs2,
                                         size_t vl);
vfloat32m8_t __riscv_vfmadd_vf_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                         float rs1, vfloat32m8_t vs2,
                                         size_t vl);
vfloat64m1_t __riscv_vfmadd_vv_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs1, vfloat64m1_t vs2,
                                         size_t vl);
vfloat64m1_t __riscv_vfmadd_vf_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                         double rs1, vfloat64m1_t vs2,
                                         size_t vl);
vfloat64m2_t __riscv_vfmadd_vv_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs1, vfloat64m2_t vs2,
                                         size_t vl);
vfloat64m2_t __riscv_vfmadd_vf_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                         double rs1, vfloat64m2_t vs2,
                                         size_t vl);
vfloat64m4_t __riscv_vfmadd_vv_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs1, vfloat64m4_t vs2,
                                         size_t vl);
vfloat64m4_t __riscv_vfmadd_vf_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                         double rs1, vfloat64m4_t vs2,
                                         size_t vl);
vfloat64m8_t __riscv_vfmadd_vv_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs1, vfloat64m8_t vs2,
                                         size_t vl);
vfloat64m8_t __riscv_vfmadd_vf_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                         double rs1, vfloat64m8_t vs2,
                                         size_t vl);
// vfnmadd, `_tum` masked variants for the f16, f32 and f64 element types.
// `_vv` forms take a vector `vs1`; `_vf` forms take a scalar `rs1` of the
// matching element type. Every form takes the mask `vm` first, then `vd`,
// and returns the same vector type as `vd`.
// NOTE(review): per the RVV spec this should compute vd = -(vs1 * vd) - vs2
// under a tail-undisturbed, mask-agnostic policy -- not derivable from the
// prototypes alone; confirm against the spec.
vfloat16mf4_t __riscv_vfnmadd_vv_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                            vfloat16mf4_t vs1,
                                            vfloat16mf4_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfnmadd_vf_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                            _Float16 rs1, vfloat16mf4_t vs2,
                                            size_t vl);
vfloat16mf2_t __riscv_vfnmadd_vv_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                            vfloat16mf2_t vs1,
                                            vfloat16mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmadd_vf_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                            _Float16 rs1, vfloat16mf2_t vs2,
                                            size_t vl);
vfloat16m1_t __riscv_vfnmadd_vv_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                          vfloat16m1_t vs1, vfloat16m1_t vs2,
                                          size_t vl);
vfloat16m1_t __riscv_vfnmadd_vf_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                          _Float16 rs1, vfloat16m1_t vs2,
                                          size_t vl);
vfloat16m2_t __riscv_vfnmadd_vv_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                          vfloat16m2_t vs1, vfloat16m2_t vs2,
                                          size_t vl);
vfloat16m2_t __riscv_vfnmadd_vf_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                          _Float16 rs1, vfloat16m2_t vs2,
                                          size_t vl);
vfloat16m4_t __riscv_vfnmadd_vv_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                          vfloat16m4_t vs1, vfloat16m4_t vs2,
                                          size_t vl);
vfloat16m4_t __riscv_vfnmadd_vf_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                          _Float16 rs1, vfloat16m4_t vs2,
                                          size_t vl);
vfloat16m8_t __riscv_vfnmadd_vv_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                          vfloat16m8_t vs1, vfloat16m8_t vs2,
                                          size_t vl);
vfloat16m8_t __riscv_vfnmadd_vf_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                          _Float16 rs1, vfloat16m8_t vs2,
                                          size_t vl);
vfloat32mf2_t __riscv_vfnmadd_vv_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs1,
                                            vfloat32mf2_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfnmadd_vf_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                            float rs1, vfloat32mf2_t vs2,
                                            size_t vl);
vfloat32m1_t __riscv_vfnmadd_vv_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs1, vfloat32m1_t vs2,
                                          size_t vl);
vfloat32m1_t __riscv_vfnmadd_vf_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                          float rs1, vfloat32m1_t vs2,
                                          size_t vl);
vfloat32m2_t __riscv_vfnmadd_vv_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs1, vfloat32m2_t vs2,
                                          size_t vl);
vfloat32m2_t __riscv_vfnmadd_vf_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                          float rs1, vfloat32m2_t vs2,
                                          size_t vl);
vfloat32m4_t __riscv_vfnmadd_vv_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs1, vfloat32m4_t vs2,
                                          size_t vl);
vfloat32m4_t __riscv_vfnmadd_vf_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                          float rs1, vfloat32m4_t vs2,
                                          size_t vl);
vfloat32m8_t __riscv_vfnmadd_vv_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs1, vfloat32m8_t vs2,
                                          size_t vl);
vfloat32m8_t __riscv_vfnmadd_vf_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                          float rs1, vfloat32m8_t vs2,
                                          size_t vl);
vfloat64m1_t __riscv_vfnmadd_vv_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs1, vfloat64m1_t vs2,
                                          size_t vl);
vfloat64m1_t __riscv_vfnmadd_vf_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                          double rs1, vfloat64m1_t vs2,
                                          size_t vl);
vfloat64m2_t __riscv_vfnmadd_vv_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs1, vfloat64m2_t vs2,
                                          size_t vl);
vfloat64m2_t __riscv_vfnmadd_vf_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                          double rs1, vfloat64m2_t vs2,
                                          size_t vl);
vfloat64m4_t __riscv_vfnmadd_vv_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs1, vfloat64m4_t vs2,
                                          size_t vl);
vfloat64m4_t __riscv_vfnmadd_vf_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                          double rs1, vfloat64m4_t vs2,
                                          size_t vl);
vfloat64m8_t __riscv_vfnmadd_vv_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs1, vfloat64m8_t vs2,
                                          size_t vl);
vfloat64m8_t __riscv_vfnmadd_vf_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                          double rs1, vfloat64m8_t vs2,
                                          size_t vl);
// vfmsub, `_tum` masked variants for the f16, f32 and f64 element types.
// `_vv` forms take a vector `vs1`; `_vf` forms take a scalar `rs1` of the
// matching element type. Every form takes the mask `vm` first, then `vd`,
// and returns the same vector type as `vd`.
// NOTE(review): per the RVV spec this should compute vd = (vs1 * vd) - vs2
// under a tail-undisturbed, mask-agnostic policy -- not derivable from the
// prototypes alone; confirm against the spec.
vfloat16mf4_t __riscv_vfmsub_vv_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                           vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                           size_t vl);
vfloat16mf4_t __riscv_vfmsub_vf_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                           _Float16 rs1, vfloat16mf4_t vs2,
                                           size_t vl);
vfloat16mf2_t __riscv_vfmsub_vv_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                           vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                           size_t vl);
vfloat16mf2_t __riscv_vfmsub_vf_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                           _Float16 rs1, vfloat16mf2_t vs2,
                                           size_t vl);
vfloat16m1_t __riscv_vfmsub_vv_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                         vfloat16m1_t vs1, vfloat16m1_t vs2,
                                         size_t vl);
vfloat16m1_t __riscv_vfmsub_vf_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                         _Float16 rs1, vfloat16m1_t vs2,
                                         size_t vl);
vfloat16m2_t __riscv_vfmsub_vv_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                         vfloat16m2_t vs1, vfloat16m2_t vs2,
                                         size_t vl);
vfloat16m2_t __riscv_vfmsub_vf_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                         _Float16 rs1, vfloat16m2_t vs2,
                                         size_t vl);
vfloat16m4_t __riscv_vfmsub_vv_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                         vfloat16m4_t vs1, vfloat16m4_t vs2,
                                         size_t vl);
vfloat16m4_t __riscv_vfmsub_vf_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                         _Float16 rs1, vfloat16m4_t vs2,
                                         size_t vl);
vfloat16m8_t __riscv_vfmsub_vv_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                         vfloat16m8_t vs1, vfloat16m8_t vs2,
                                         size_t vl);
vfloat16m8_t __riscv_vfmsub_vf_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                         _Float16 rs1, vfloat16m8_t vs2,
                                         size_t vl);
vfloat32mf2_t __riscv_vfmsub_vv_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                           size_t vl);
vfloat32mf2_t __riscv_vfmsub_vf_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                           float rs1, vfloat32mf2_t vs2,
                                           size_t vl);
vfloat32m1_t __riscv_vfmsub_vv_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs1, vfloat32m1_t vs2,
                                         size_t vl);
vfloat32m1_t __riscv_vfmsub_vf_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                         float rs1, vfloat32m1_t vs2,
                                         size_t vl);
vfloat32m2_t __riscv_vfmsub_vv_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs1, vfloat32m2_t vs2,
                                         size_t vl);
vfloat32m2_t __riscv_vfmsub_vf_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                         float rs1, vfloat32m2_t vs2,
                                         size_t vl);
vfloat32m4_t __riscv_vfmsub_vv_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs1, vfloat32m4_t vs2,
                                         size_t vl);
vfloat32m4_t __riscv_vfmsub_vf_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                         float rs1, vfloat32m4_t vs2,
                                         size_t vl);
vfloat32m8_t __riscv_vfmsub_vv_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs1, vfloat32m8_t vs2,
                                         size_t vl);
vfloat32m8_t __riscv_vfmsub_vf_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                         float rs1, vfloat32m8_t vs2,
                                         size_t vl);
vfloat64m1_t __riscv_vfmsub_vv_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs1, vfloat64m1_t vs2,
                                         size_t vl);
vfloat64m1_t __riscv_vfmsub_vf_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                         double rs1, vfloat64m1_t vs2,
                                         size_t vl);
vfloat64m2_t __riscv_vfmsub_vv_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs1, vfloat64m2_t vs2,
                                         size_t vl);
vfloat64m2_t __riscv_vfmsub_vf_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                         double rs1, vfloat64m2_t vs2,
                                         size_t vl);
vfloat64m4_t __riscv_vfmsub_vv_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs1, vfloat64m4_t vs2,
                                         size_t vl);
vfloat64m4_t __riscv_vfmsub_vf_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                         double rs1, vfloat64m4_t vs2,
                                         size_t vl);
vfloat64m8_t __riscv_vfmsub_vv_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs1, vfloat64m8_t vs2,
                                         size_t vl);
vfloat64m8_t __riscv_vfmsub_vf_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                         double rs1, vfloat64m8_t vs2,
                                         size_t vl);
// vfnmsub, `_tum` masked variants for the f16, f32 and f64 element types.
// `_vv` forms take a vector `vs1`; `_vf` forms take a scalar `rs1` of the
// matching element type. Every form takes the mask `vm` first, then `vd`,
// and returns the same vector type as `vd`.
// NOTE(review): per the RVV spec this should compute vd = -(vs1 * vd) + vs2
// under a tail-undisturbed, mask-agnostic policy -- not derivable from the
// prototypes alone; confirm against the spec.
vfloat16mf4_t __riscv_vfnmsub_vv_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                            vfloat16mf4_t vs1,
                                            vfloat16mf4_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfnmsub_vf_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                            _Float16 rs1, vfloat16mf4_t vs2,
                                            size_t vl);
vfloat16mf2_t __riscv_vfnmsub_vv_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                            vfloat16mf2_t vs1,
                                            vfloat16mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmsub_vf_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                            _Float16 rs1, vfloat16mf2_t vs2,
                                            size_t vl);
vfloat16m1_t __riscv_vfnmsub_vv_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                          vfloat16m1_t vs1, vfloat16m1_t vs2,
                                          size_t vl);
vfloat16m1_t __riscv_vfnmsub_vf_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                          _Float16 rs1, vfloat16m1_t vs2,
                                          size_t vl);
vfloat16m2_t __riscv_vfnmsub_vv_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                          vfloat16m2_t vs1, vfloat16m2_t vs2,
                                          size_t vl);
vfloat16m2_t __riscv_vfnmsub_vf_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                          _Float16 rs1, vfloat16m2_t vs2,
                                          size_t vl);
vfloat16m4_t __riscv_vfnmsub_vv_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                          vfloat16m4_t vs1, vfloat16m4_t vs2,
                                          size_t vl);
vfloat16m4_t __riscv_vfnmsub_vf_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                          _Float16 rs1, vfloat16m4_t vs2,
                                          size_t vl);
vfloat16m8_t __riscv_vfnmsub_vv_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                          vfloat16m8_t vs1, vfloat16m8_t vs2,
                                          size_t vl);
vfloat16m8_t __riscv_vfnmsub_vf_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                          _Float16 rs1, vfloat16m8_t vs2,
                                          size_t vl);
vfloat32mf2_t __riscv_vfnmsub_vv_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs1,
                                            vfloat32mf2_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfnmsub_vf_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                            float rs1, vfloat32mf2_t vs2,
                                            size_t vl);
vfloat32m1_t __riscv_vfnmsub_vv_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs1, vfloat32m1_t vs2,
                                          size_t vl);
vfloat32m1_t __riscv_vfnmsub_vf_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                          float rs1, vfloat32m1_t vs2,
                                          size_t vl);
vfloat32m2_t __riscv_vfnmsub_vv_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs1, vfloat32m2_t vs2,
                                          size_t vl);
vfloat32m2_t __riscv_vfnmsub_vf_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                          float rs1, vfloat32m2_t vs2,
                                          size_t vl);
vfloat32m4_t __riscv_vfnmsub_vv_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs1, vfloat32m4_t vs2,
                                          size_t vl);
vfloat32m4_t __riscv_vfnmsub_vf_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                          float rs1, vfloat32m4_t vs2,
                                          size_t vl);
vfloat32m8_t __riscv_vfnmsub_vv_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs1, vfloat32m8_t vs2,
                                          size_t vl);
vfloat32m8_t __riscv_vfnmsub_vf_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                          float rs1, vfloat32m8_t vs2,
                                          size_t vl);
vfloat64m1_t __riscv_vfnmsub_vv_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs1, vfloat64m1_t vs2,
                                          size_t vl);
vfloat64m1_t __riscv_vfnmsub_vf_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                          double rs1, vfloat64m1_t vs2,
                                          size_t vl);
vfloat64m2_t __riscv_vfnmsub_vv_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs1, vfloat64m2_t vs2,
                                          size_t vl);
vfloat64m2_t __riscv_vfnmsub_vf_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                          double rs1, vfloat64m2_t vs2,
                                          size_t vl);
vfloat64m4_t __riscv_vfnmsub_vv_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs1, vfloat64m4_t vs2,
                                          size_t vl);
vfloat64m4_t __riscv_vfnmsub_vf_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                          double rs1, vfloat64m4_t vs2,
                                          size_t vl);
vfloat64m8_t __riscv_vfnmsub_vv_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs1, vfloat64m8_t vs2,
                                          size_t vl);
vfloat64m8_t __riscv_vfnmsub_vf_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                          double rs1, vfloat64m8_t vs2,
                                          size_t vl);
// masked functions, `_tumu` policy (tail-undisturbed, mask-undisturbed)
// vfmacc, `_tumu` masked variants for the f16, f32 and f64 element types.
// `_vv` forms take a vector `vs1`; `_vf` forms take a scalar `rs1` of the
// matching element type. Every form takes the mask `vm` first, then `vd`,
// and returns the same vector type as `vd`.
// NOTE(review): per the RVV spec this should compute vd = (vs1 * vs2) + vd
// under a tail-undisturbed, mask-undisturbed policy -- not derivable from the
// prototypes alone; confirm against the spec.
vfloat16mf4_t __riscv_vfmacc_vv_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                            vfloat16mf4_t vs1,
                                            vfloat16mf4_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfmacc_vf_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                            _Float16 rs1, vfloat16mf4_t vs2,
                                            size_t vl);
vfloat16mf2_t __riscv_vfmacc_vv_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                            vfloat16mf2_t vs1,
                                            vfloat16mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfmacc_vf_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                            _Float16 rs1, vfloat16mf2_t vs2,
                                            size_t vl);
vfloat16m1_t __riscv_vfmacc_vv_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                          vfloat16m1_t vs1, vfloat16m1_t vs2,
                                          size_t vl);
vfloat16m1_t __riscv_vfmacc_vf_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                          _Float16 rs1, vfloat16m1_t vs2,
                                          size_t vl);
vfloat16m2_t __riscv_vfmacc_vv_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                          vfloat16m2_t vs1, vfloat16m2_t vs2,
                                          size_t vl);
vfloat16m2_t __riscv_vfmacc_vf_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                          _Float16 rs1, vfloat16m2_t vs2,
                                          size_t vl);
vfloat16m4_t __riscv_vfmacc_vv_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                          vfloat16m4_t vs1, vfloat16m4_t vs2,
                                          size_t vl);
vfloat16m4_t __riscv_vfmacc_vf_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                          _Float16 rs1, vfloat16m4_t vs2,
                                          size_t vl);
vfloat16m8_t __riscv_vfmacc_vv_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                          vfloat16m8_t vs1, vfloat16m8_t vs2,
                                          size_t vl);
vfloat16m8_t __riscv_vfmacc_vf_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                          _Float16 rs1, vfloat16m8_t vs2,
                                          size_t vl);
vfloat32mf2_t __riscv_vfmacc_vv_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs1,
                                            vfloat32mf2_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfmacc_vf_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                            float rs1, vfloat32mf2_t vs2,
                                            size_t vl);
vfloat32m1_t __riscv_vfmacc_vv_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs1, vfloat32m1_t vs2,
                                          size_t vl);
vfloat32m1_t __riscv_vfmacc_vf_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                          float rs1, vfloat32m1_t vs2,
                                          size_t vl);
vfloat32m2_t __riscv_vfmacc_vv_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs1, vfloat32m2_t vs2,
                                          size_t vl);
vfloat32m2_t __riscv_vfmacc_vf_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                          float rs1, vfloat32m2_t vs2,
                                          size_t vl);
vfloat32m4_t __riscv_vfmacc_vv_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs1, vfloat32m4_t vs2,
                                          size_t vl);
vfloat32m4_t __riscv_vfmacc_vf_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                          float rs1, vfloat32m4_t vs2,
                                          size_t vl);
vfloat32m8_t __riscv_vfmacc_vv_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs1, vfloat32m8_t vs2,
                                          size_t vl);
vfloat32m8_t __riscv_vfmacc_vf_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                          float rs1, vfloat32m8_t vs2,
                                          size_t vl);
vfloat64m1_t __riscv_vfmacc_vv_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs1, vfloat64m1_t vs2,
                                          size_t vl);
vfloat64m1_t __riscv_vfmacc_vf_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                          double rs1, vfloat64m1_t vs2,
                                          size_t vl);
vfloat64m2_t __riscv_vfmacc_vv_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs1, vfloat64m2_t vs2,
                                          size_t vl);
vfloat64m2_t __riscv_vfmacc_vf_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                          double rs1, vfloat64m2_t vs2,
                                          size_t vl);
vfloat64m4_t __riscv_vfmacc_vv_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs1, vfloat64m4_t vs2,
                                          size_t vl);
vfloat64m4_t __riscv_vfmacc_vf_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                          double rs1, vfloat64m4_t vs2,
                                          size_t vl);
vfloat64m8_t __riscv_vfmacc_vv_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs1, vfloat64m8_t vs2,
                                          size_t vl);
vfloat64m8_t __riscv_vfmacc_vf_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                          double rs1, vfloat64m8_t vs2,
                                          size_t vl);
// vfnmacc, `_tumu` masked variants.
// `_vv` forms take a vector `vs1`; `_vf` forms take a scalar `rs1` of the
// matching element type. Every form takes the mask `vm` first, then `vd`,
// and returns the same vector type as `vd`.
// NOTE(review): per the RVV spec this should compute vd = -(vs1 * vs2) - vd
// under a tail-undisturbed, mask-undisturbed policy -- not derivable from the
// prototypes alone; confirm against the spec.
vfloat16mf4_t __riscv_vfnmacc_vv_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                             vfloat16mf4_t vs1,
                                             vfloat16mf4_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfnmacc_vf_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                             _Float16 rs1, vfloat16mf4_t vs2,
                                             size_t vl);
vfloat16mf2_t __riscv_vfnmacc_vv_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                             vfloat16mf2_t vs1,
                                             vfloat16mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmacc_vf_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                             _Float16 rs1, vfloat16mf2_t vs2,
                                             size_t vl);
vfloat16m1_t __riscv_vfnmacc_vv_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                           vfloat16m1_t vs1, vfloat16m1_t vs2,
                                           size_t vl);
vfloat16m1_t __riscv_vfnmacc_vf_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                           _Float16 rs1, vfloat16m1_t vs2,
                                           size_t vl);
vfloat16m2_t __riscv_vfnmacc_vv_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                           vfloat16m2_t vs1, vfloat16m2_t vs2,
                                           size_t vl);
vfloat16m2_t __riscv_vfnmacc_vf_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                           _Float16 rs1, vfloat16m2_t vs2,
                                           size_t vl);
vfloat16m4_t __riscv_vfnmacc_vv_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                           vfloat16m4_t vs1, vfloat16m4_t vs2,
                                           size_t vl);
vfloat16m4_t __riscv_vfnmacc_vf_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                           _Float16 rs1, vfloat16m4_t vs2,
                                           size_t vl);
vfloat16m8_t __riscv_vfnmacc_vv_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                           vfloat16m8_t vs1, vfloat16m8_t vs2,
                                           size_t vl);
vfloat16m8_t __riscv_vfnmacc_vf_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                           _Float16 rs1, vfloat16m8_t vs2,
                                           size_t vl);
vfloat32mf2_t __riscv_vfnmacc_vv_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat32mf2_t vs1,
                                             vfloat32mf2_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfnmacc_vf_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                             float rs1, vfloat32mf2_t vs2,
                                             size_t vl);
vfloat32m1_t __riscv_vfnmacc_vv_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat32m1_t vs1, vfloat32m1_t vs2,
                                           size_t vl);
vfloat32m1_t __riscv_vfnmacc_vf_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                           float rs1, vfloat32m1_t vs2,
                                           size_t vl);
vfloat32m2_t __riscv_vfnmacc_vv_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat32m2_t vs1, vfloat32m2_t vs2,
                                           size_t vl);
vfloat32m2_t __riscv_vfnmacc_vf_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                           float rs1, vfloat32m2_t vs2,
                                           size_t vl);
vfloat32m4_t __riscv_vfnmacc_vv_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat32m4_t vs1, vfloat32m4_t vs2,
                                           size_t vl);
vfloat32m4_t __riscv_vfnmacc_vf_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                           float rs1, vfloat32m4_t vs2,
                                           size_t vl);
vfloat32m8_t __riscv_vfnmacc_vv_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat32m8_t vs1, vfloat32m8_t vs2,
                                           size_t vl);
vfloat32m8_t __riscv_vfnmacc_vf_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                           float rs1, vfloat32m8_t vs2,
                                           size_t vl);
vfloat64m1_t __riscv_vfnmacc_vv_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat64m1_t vs1, vfloat64m1_t vs2,
                                           size_t vl);
vfloat64m1_t __riscv_vfnmacc_vf_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                           double rs1, vfloat64m1_t vs2,
                                           size_t vl);
vfloat64m2_t __riscv_vfnmacc_vv_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat64m2_t vs1, vfloat64m2_t vs2,
                                           size_t vl);
vfloat64m2_t __riscv_vfnmacc_vf_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                           double rs1, vfloat64m2_t vs2,
                                           size_t vl);
vfloat64m4_t __riscv_vfnmacc_vv_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat64m4_t vs1, vfloat64m4_t vs2,
                                           size_t vl);
vfloat64m4_t __riscv_vfnmacc_vf_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                           double rs1, vfloat64m4_t vs2,
                                           size_t vl);
vfloat64m8_t __riscv_vfnmacc_vv_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat64m8_t vs1, vfloat64m8_t vs2,
                                           size_t vl);
vfloat64m8_t __riscv_vfnmacc_vf_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                           double rs1, vfloat64m8_t vs2,
                                           size_t vl);
/*
 * __riscv_vfmsac_{vv,vf}_<type>_tumu
 *
 * Declarations of the `_tumu`-suffixed vfmsac intrinsics: one `vv` form
 * (vector vs1) and one `vf` form (scalar rs1) for each vector type from
 * f16mf4 through f64m8. Every prototype takes (vm, vd, vs1|rs1, vs2, vl)
 * and returns the same vector type as vd and vs2. The mask type of vm
 * varies with the vector type (e.g. f16mf4 uses vbool64_t, f16m8 uses
 * vbool2_t).
 *
 * NOTE(review): the arithmetic is not visible in these prototypes. Per the
 * RISC-V "V" specification vfmsac should compute
 * vd[i] = (vs1[i] * vs2[i]) - vd[i] (rs1 replacing vs1[i] in `vf` forms),
 * and `_tumu` presumably means tail-undisturbed / mask-undisturbed --
 * confirm against the specification.
 */
/* 16-bit float vector types (f16mf4..f16m8); `vf` scalar is _Float16. */
vfloat16mf4_t __riscv_vfmsac_vv_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                            vfloat16mf4_t vs1,
                                            vfloat16mf4_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfmsac_vf_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                            _Float16 rs1, vfloat16mf4_t vs2,
                                            size_t vl);
vfloat16mf2_t __riscv_vfmsac_vv_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                            vfloat16mf2_t vs1,
                                            vfloat16mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfmsac_vf_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                            _Float16 rs1, vfloat16mf2_t vs2,
                                            size_t vl);
vfloat16m1_t __riscv_vfmsac_vv_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                          vfloat16m1_t vs1, vfloat16m1_t vs2,
                                          size_t vl);
vfloat16m1_t __riscv_vfmsac_vf_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                          _Float16 rs1, vfloat16m1_t vs2,
                                          size_t vl);
vfloat16m2_t __riscv_vfmsac_vv_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                          vfloat16m2_t vs1, vfloat16m2_t vs2,
                                          size_t vl);
vfloat16m2_t __riscv_vfmsac_vf_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                          _Float16 rs1, vfloat16m2_t vs2,
                                          size_t vl);
vfloat16m4_t __riscv_vfmsac_vv_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                          vfloat16m4_t vs1, vfloat16m4_t vs2,
                                          size_t vl);
vfloat16m4_t __riscv_vfmsac_vf_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                          _Float16 rs1, vfloat16m4_t vs2,
                                          size_t vl);
vfloat16m8_t __riscv_vfmsac_vv_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                          vfloat16m8_t vs1, vfloat16m8_t vs2,
                                          size_t vl);
vfloat16m8_t __riscv_vfmsac_vf_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                          _Float16 rs1, vfloat16m8_t vs2,
                                          size_t vl);
/* 32-bit float vector types (f32mf2..f32m8); `vf` scalar is float. */
vfloat32mf2_t __riscv_vfmsac_vv_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs1,
                                            vfloat32mf2_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfmsac_vf_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                            float rs1, vfloat32mf2_t vs2,
                                            size_t vl);
vfloat32m1_t __riscv_vfmsac_vv_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs1, vfloat32m1_t vs2,
                                          size_t vl);
vfloat32m1_t __riscv_vfmsac_vf_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                          float rs1, vfloat32m1_t vs2,
                                          size_t vl);
vfloat32m2_t __riscv_vfmsac_vv_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs1, vfloat32m2_t vs2,
                                          size_t vl);
vfloat32m2_t __riscv_vfmsac_vf_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                          float rs1, vfloat32m2_t vs2,
                                          size_t vl);
vfloat32m4_t __riscv_vfmsac_vv_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs1, vfloat32m4_t vs2,
                                          size_t vl);
vfloat32m4_t __riscv_vfmsac_vf_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                          float rs1, vfloat32m4_t vs2,
                                          size_t vl);
vfloat32m8_t __riscv_vfmsac_vv_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs1, vfloat32m8_t vs2,
                                          size_t vl);
vfloat32m8_t __riscv_vfmsac_vf_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                          float rs1, vfloat32m8_t vs2,
                                          size_t vl);
/* 64-bit float vector types (f64m1..f64m8); `vf` scalar is double. */
vfloat64m1_t __riscv_vfmsac_vv_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs1, vfloat64m1_t vs2,
                                          size_t vl);
vfloat64m1_t __riscv_vfmsac_vf_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                          double rs1, vfloat64m1_t vs2,
                                          size_t vl);
vfloat64m2_t __riscv_vfmsac_vv_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs1, vfloat64m2_t vs2,
                                          size_t vl);
vfloat64m2_t __riscv_vfmsac_vf_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                          double rs1, vfloat64m2_t vs2,
                                          size_t vl);
vfloat64m4_t __riscv_vfmsac_vv_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs1, vfloat64m4_t vs2,
                                          size_t vl);
vfloat64m4_t __riscv_vfmsac_vf_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                          double rs1, vfloat64m4_t vs2,
                                          size_t vl);
vfloat64m8_t __riscv_vfmsac_vv_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs1, vfloat64m8_t vs2,
                                          size_t vl);
vfloat64m8_t __riscv_vfmsac_vf_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                          double rs1, vfloat64m8_t vs2,
                                          size_t vl);
/*
 * __riscv_vfnmsac_{vv,vf}_<type>_tumu
 *
 * Declarations of the `_tumu`-suffixed vfnmsac intrinsics: one `vv` form
 * (vector vs1) and one `vf` form (scalar rs1) for each vector type from
 * f16mf4 through f64m8. Every prototype takes (vm, vd, vs1|rs1, vs2, vl)
 * and returns the same vector type as vd and vs2. The mask type of vm
 * varies with the vector type (e.g. f16mf4 uses vbool64_t, f16m8 uses
 * vbool2_t).
 *
 * NOTE(review): the arithmetic is not visible in these prototypes. Per the
 * RISC-V "V" specification vfnmsac should compute
 * vd[i] = -(vs1[i] * vs2[i]) + vd[i] (rs1 replacing vs1[i] in `vf` forms),
 * and `_tumu` presumably means tail-undisturbed / mask-undisturbed --
 * confirm against the specification.
 */
/* 16-bit float vector types (f16mf4..f16m8); `vf` scalar is _Float16. */
vfloat16mf4_t __riscv_vfnmsac_vv_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                             vfloat16mf4_t vs1,
                                             vfloat16mf4_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfnmsac_vf_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                             _Float16 rs1, vfloat16mf4_t vs2,
                                             size_t vl);
vfloat16mf2_t __riscv_vfnmsac_vv_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                             vfloat16mf2_t vs1,
                                             vfloat16mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmsac_vf_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                             _Float16 rs1, vfloat16mf2_t vs2,
                                             size_t vl);
vfloat16m1_t __riscv_vfnmsac_vv_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                           vfloat16m1_t vs1, vfloat16m1_t vs2,
                                           size_t vl);
vfloat16m1_t __riscv_vfnmsac_vf_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                           _Float16 rs1, vfloat16m1_t vs2,
                                           size_t vl);
vfloat16m2_t __riscv_vfnmsac_vv_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                           vfloat16m2_t vs1, vfloat16m2_t vs2,
                                           size_t vl);
vfloat16m2_t __riscv_vfnmsac_vf_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                           _Float16 rs1, vfloat16m2_t vs2,
                                           size_t vl);
vfloat16m4_t __riscv_vfnmsac_vv_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                           vfloat16m4_t vs1, vfloat16m4_t vs2,
                                           size_t vl);
vfloat16m4_t __riscv_vfnmsac_vf_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                           _Float16 rs1, vfloat16m4_t vs2,
                                           size_t vl);
vfloat16m8_t __riscv_vfnmsac_vv_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                           vfloat16m8_t vs1, vfloat16m8_t vs2,
                                           size_t vl);
vfloat16m8_t __riscv_vfnmsac_vf_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                           _Float16 rs1, vfloat16m8_t vs2,
                                           size_t vl);
/* 32-bit float vector types (f32mf2..f32m8); `vf` scalar is float. */
vfloat32mf2_t __riscv_vfnmsac_vv_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat32mf2_t vs1,
                                             vfloat32mf2_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfnmsac_vf_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                             float rs1, vfloat32mf2_t vs2,
                                             size_t vl);
vfloat32m1_t __riscv_vfnmsac_vv_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat32m1_t vs1, vfloat32m1_t vs2,
                                           size_t vl);
vfloat32m1_t __riscv_vfnmsac_vf_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                           float rs1, vfloat32m1_t vs2,
                                           size_t vl);
vfloat32m2_t __riscv_vfnmsac_vv_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat32m2_t vs1, vfloat32m2_t vs2,
                                           size_t vl);
vfloat32m2_t __riscv_vfnmsac_vf_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                           float rs1, vfloat32m2_t vs2,
                                           size_t vl);
vfloat32m4_t __riscv_vfnmsac_vv_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat32m4_t vs1, vfloat32m4_t vs2,
                                           size_t vl);
vfloat32m4_t __riscv_vfnmsac_vf_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                           float rs1, vfloat32m4_t vs2,
                                           size_t vl);
vfloat32m8_t __riscv_vfnmsac_vv_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat32m8_t vs1, vfloat32m8_t vs2,
                                           size_t vl);
vfloat32m8_t __riscv_vfnmsac_vf_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                           float rs1, vfloat32m8_t vs2,
                                           size_t vl);
/* 64-bit float vector types (f64m1..f64m8); `vf` scalar is double. */
vfloat64m1_t __riscv_vfnmsac_vv_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat64m1_t vs1, vfloat64m1_t vs2,
                                           size_t vl);
vfloat64m1_t __riscv_vfnmsac_vf_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                           double rs1, vfloat64m1_t vs2,
                                           size_t vl);
vfloat64m2_t __riscv_vfnmsac_vv_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat64m2_t vs1, vfloat64m2_t vs2,
                                           size_t vl);
vfloat64m2_t __riscv_vfnmsac_vf_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                           double rs1, vfloat64m2_t vs2,
                                           size_t vl);
vfloat64m4_t __riscv_vfnmsac_vv_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat64m4_t vs1, vfloat64m4_t vs2,
                                           size_t vl);
vfloat64m4_t __riscv_vfnmsac_vf_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                           double rs1, vfloat64m4_t vs2,
                                           size_t vl);
vfloat64m8_t __riscv_vfnmsac_vv_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat64m8_t vs1, vfloat64m8_t vs2,
                                           size_t vl);
vfloat64m8_t __riscv_vfnmsac_vf_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                           double rs1, vfloat64m8_t vs2,
                                           size_t vl);
/*
 * __riscv_vfmadd_{vv,vf}_<type>_tumu
 *
 * Declarations of the `_tumu`-suffixed vfmadd intrinsics: one `vv` form
 * (vector vs1) and one `vf` form (scalar rs1) for each vector type from
 * f16mf4 through f64m8. Every prototype takes (vm, vd, vs1|rs1, vs2, vl)
 * and returns the same vector type as vd and vs2. The mask type of vm
 * varies with the vector type (e.g. f16mf4 uses vbool64_t, f16m8 uses
 * vbool2_t).
 *
 * NOTE(review): the arithmetic is not visible in these prototypes. Per the
 * RISC-V "V" specification vfmadd should compute
 * vd[i] = (vs1[i] * vd[i]) + vs2[i] (rs1 replacing vs1[i] in `vf` forms),
 * and `_tumu` presumably means tail-undisturbed / mask-undisturbed --
 * confirm against the specification.
 */
/* 16-bit float vector types (f16mf4..f16m8); `vf` scalar is _Float16. */
vfloat16mf4_t __riscv_vfmadd_vv_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                            vfloat16mf4_t vs1,
                                            vfloat16mf4_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfmadd_vf_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                            _Float16 rs1, vfloat16mf4_t vs2,
                                            size_t vl);
vfloat16mf2_t __riscv_vfmadd_vv_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                            vfloat16mf2_t vs1,
                                            vfloat16mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfmadd_vf_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                            _Float16 rs1, vfloat16mf2_t vs2,
                                            size_t vl);
vfloat16m1_t __riscv_vfmadd_vv_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                          vfloat16m1_t vs1, vfloat16m1_t vs2,
                                          size_t vl);
vfloat16m1_t __riscv_vfmadd_vf_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                          _Float16 rs1, vfloat16m1_t vs2,
                                          size_t vl);
vfloat16m2_t __riscv_vfmadd_vv_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                          vfloat16m2_t vs1, vfloat16m2_t vs2,
                                          size_t vl);
vfloat16m2_t __riscv_vfmadd_vf_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                          _Float16 rs1, vfloat16m2_t vs2,
                                          size_t vl);
vfloat16m4_t __riscv_vfmadd_vv_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                          vfloat16m4_t vs1, vfloat16m4_t vs2,
                                          size_t vl);
vfloat16m4_t __riscv_vfmadd_vf_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                          _Float16 rs1, vfloat16m4_t vs2,
                                          size_t vl);
vfloat16m8_t __riscv_vfmadd_vv_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                          vfloat16m8_t vs1, vfloat16m8_t vs2,
                                          size_t vl);
vfloat16m8_t __riscv_vfmadd_vf_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                          _Float16 rs1, vfloat16m8_t vs2,
                                          size_t vl);
/* 32-bit float vector types (f32mf2..f32m8); `vf` scalar is float. */
vfloat32mf2_t __riscv_vfmadd_vv_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs1,
                                            vfloat32mf2_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfmadd_vf_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                            float rs1, vfloat32mf2_t vs2,
                                            size_t vl);
vfloat32m1_t __riscv_vfmadd_vv_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs1, vfloat32m1_t vs2,
                                          size_t vl);
vfloat32m1_t __riscv_vfmadd_vf_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                          float rs1, vfloat32m1_t vs2,
                                          size_t vl);
vfloat32m2_t __riscv_vfmadd_vv_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs1, vfloat32m2_t vs2,
                                          size_t vl);
vfloat32m2_t __riscv_vfmadd_vf_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                          float rs1, vfloat32m2_t vs2,
                                          size_t vl);
vfloat32m4_t __riscv_vfmadd_vv_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs1, vfloat32m4_t vs2,
                                          size_t vl);
vfloat32m4_t __riscv_vfmadd_vf_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                          float rs1, vfloat32m4_t vs2,
                                          size_t vl);
vfloat32m8_t __riscv_vfmadd_vv_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs1, vfloat32m8_t vs2,
                                          size_t vl);
vfloat32m8_t __riscv_vfmadd_vf_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                          float rs1, vfloat32m8_t vs2,
                                          size_t vl);
/* 64-bit float vector types (f64m1..f64m8); `vf` scalar is double. */
vfloat64m1_t __riscv_vfmadd_vv_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs1, vfloat64m1_t vs2,
                                          size_t vl);
vfloat64m1_t __riscv_vfmadd_vf_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                          double rs1, vfloat64m1_t vs2,
                                          size_t vl);
vfloat64m2_t __riscv_vfmadd_vv_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs1, vfloat64m2_t vs2,
                                          size_t vl);
vfloat64m2_t __riscv_vfmadd_vf_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                          double rs1, vfloat64m2_t vs2,
                                          size_t vl);
vfloat64m4_t __riscv_vfmadd_vv_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs1, vfloat64m4_t vs2,
                                          size_t vl);
vfloat64m4_t __riscv_vfmadd_vf_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                          double rs1, vfloat64m4_t vs2,
                                          size_t vl);
vfloat64m8_t __riscv_vfmadd_vv_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs1, vfloat64m8_t vs2,
                                          size_t vl);
vfloat64m8_t __riscv_vfmadd_vf_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                          double rs1, vfloat64m8_t vs2,
                                          size_t vl);
/*
 * __riscv_vfnmadd_{vv,vf}_<type>_tumu
 *
 * Declarations of the `_tumu`-suffixed vfnmadd intrinsics: one `vv` form
 * (vector vs1) and one `vf` form (scalar rs1) for each vector type from
 * f16mf4 through f64m8. Every prototype takes (vm, vd, vs1|rs1, vs2, vl)
 * and returns the same vector type as vd and vs2. The mask type of vm
 * varies with the vector type (e.g. f16mf4 uses vbool64_t, f16m8 uses
 * vbool2_t).
 *
 * NOTE(review): the arithmetic is not visible in these prototypes. Per the
 * RISC-V "V" specification vfnmadd should compute
 * vd[i] = -(vs1[i] * vd[i]) - vs2[i] (rs1 replacing vs1[i] in `vf` forms),
 * and `_tumu` presumably means tail-undisturbed / mask-undisturbed --
 * confirm against the specification.
 */
/* 16-bit float vector types (f16mf4..f16m8); `vf` scalar is _Float16. */
vfloat16mf4_t __riscv_vfnmadd_vv_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                             vfloat16mf4_t vs1,
                                             vfloat16mf4_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfnmadd_vf_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                             _Float16 rs1, vfloat16mf4_t vs2,
                                             size_t vl);
vfloat16mf2_t __riscv_vfnmadd_vv_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                             vfloat16mf2_t vs1,
                                             vfloat16mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmadd_vf_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                             _Float16 rs1, vfloat16mf2_t vs2,
                                             size_t vl);
vfloat16m1_t __riscv_vfnmadd_vv_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                           vfloat16m1_t vs1, vfloat16m1_t vs2,
                                           size_t vl);
vfloat16m1_t __riscv_vfnmadd_vf_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                           _Float16 rs1, vfloat16m1_t vs2,
                                           size_t vl);
vfloat16m2_t __riscv_vfnmadd_vv_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                           vfloat16m2_t vs1, vfloat16m2_t vs2,
                                           size_t vl);
vfloat16m2_t __riscv_vfnmadd_vf_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                           _Float16 rs1, vfloat16m2_t vs2,
                                           size_t vl);
vfloat16m4_t __riscv_vfnmadd_vv_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                           vfloat16m4_t vs1, vfloat16m4_t vs2,
                                           size_t vl);
vfloat16m4_t __riscv_vfnmadd_vf_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                           _Float16 rs1, vfloat16m4_t vs2,
                                           size_t vl);
vfloat16m8_t __riscv_vfnmadd_vv_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                           vfloat16m8_t vs1, vfloat16m8_t vs2,
                                           size_t vl);
vfloat16m8_t __riscv_vfnmadd_vf_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                           _Float16 rs1, vfloat16m8_t vs2,
                                           size_t vl);
/* 32-bit float vector types (f32mf2..f32m8); `vf` scalar is float. */
vfloat32mf2_t __riscv_vfnmadd_vv_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat32mf2_t vs1,
                                             vfloat32mf2_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfnmadd_vf_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                             float rs1, vfloat32mf2_t vs2,
                                             size_t vl);
vfloat32m1_t __riscv_vfnmadd_vv_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat32m1_t vs1, vfloat32m1_t vs2,
                                           size_t vl);
vfloat32m1_t __riscv_vfnmadd_vf_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                           float rs1, vfloat32m1_t vs2,
                                           size_t vl);
vfloat32m2_t __riscv_vfnmadd_vv_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat32m2_t vs1, vfloat32m2_t vs2,
                                           size_t vl);
vfloat32m2_t __riscv_vfnmadd_vf_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                           float rs1, vfloat32m2_t vs2,
                                           size_t vl);
vfloat32m4_t __riscv_vfnmadd_vv_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat32m4_t vs1, vfloat32m4_t vs2,
                                           size_t vl);
vfloat32m4_t __riscv_vfnmadd_vf_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                           float rs1, vfloat32m4_t vs2,
                                           size_t vl);
vfloat32m8_t __riscv_vfnmadd_vv_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat32m8_t vs1, vfloat32m8_t vs2,
                                           size_t vl);
vfloat32m8_t __riscv_vfnmadd_vf_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                           float rs1, vfloat32m8_t vs2,
                                           size_t vl);
/* 64-bit float vector types (f64m1..f64m8); `vf` scalar is double. */
vfloat64m1_t __riscv_vfnmadd_vv_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat64m1_t vs1, vfloat64m1_t vs2,
                                           size_t vl);
vfloat64m1_t __riscv_vfnmadd_vf_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                           double rs1, vfloat64m1_t vs2,
                                           size_t vl);
vfloat64m2_t __riscv_vfnmadd_vv_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat64m2_t vs1, vfloat64m2_t vs2,
                                           size_t vl);
vfloat64m2_t __riscv_vfnmadd_vf_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                           double rs1, vfloat64m2_t vs2,
                                           size_t vl);
vfloat64m4_t __riscv_vfnmadd_vv_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat64m4_t vs1, vfloat64m4_t vs2,
                                           size_t vl);
vfloat64m4_t __riscv_vfnmadd_vf_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                           double rs1, vfloat64m4_t vs2,
                                           size_t vl);
vfloat64m8_t __riscv_vfnmadd_vv_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat64m8_t vs1, vfloat64m8_t vs2,
                                           size_t vl);
vfloat64m8_t __riscv_vfnmadd_vf_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                           double rs1, vfloat64m8_t vs2,
                                           size_t vl);
/*
 * __riscv_vfmsub_{vv,vf}_<type>_tumu
 *
 * Declarations of the `_tumu`-suffixed vfmsub intrinsics in `vv` (vector
 * vs1) and `vf` (scalar rs1) forms, beginning with vector type f16mf4.
 * Every prototype takes (vm, vd, vs1|rs1, vs2, vl) and returns the same
 * vector type as vd and vs2. The mask type of vm varies with the vector
 * type (e.g. f16mf4 uses vbool64_t, f16m8 uses vbool2_t).
 *
 * NOTE(review): the arithmetic is not visible in these prototypes. Per the
 * RISC-V "V" specification vfmsub should compute
 * vd[i] = (vs1[i] * vd[i]) - vs2[i] (rs1 replacing vs1[i] in `vf` forms),
 * and `_tumu` presumably means tail-undisturbed / mask-undisturbed --
 * confirm against the specification.
 */
/* 16-bit float vector types (f16mf4..f16m8); `vf` scalar is _Float16. */
vfloat16mf4_t __riscv_vfmsub_vv_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                            vfloat16mf4_t vs1,
                                            vfloat16mf4_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfmsub_vf_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                            _Float16 rs1, vfloat16mf4_t vs2,
                                            size_t vl);
vfloat16mf2_t __riscv_vfmsub_vv_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                            vfloat16mf2_t vs1,
                                            vfloat16mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfmsub_vf_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                            _Float16 rs1, vfloat16mf2_t vs2,
                                            size_t vl);
vfloat16m1_t __riscv_vfmsub_vv_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                          vfloat16m1_t vs1, vfloat16m1_t vs2,
                                          size_t vl);
vfloat16m1_t __riscv_vfmsub_vf_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                          _Float16 rs1, vfloat16m1_t vs2,
                                          size_t vl);
vfloat16m2_t __riscv_vfmsub_vv_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                          vfloat16m2_t vs1, vfloat16m2_t vs2,
                                          size_t vl);
vfloat16m2_t __riscv_vfmsub_vf_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                          _Float16 rs1, vfloat16m2_t vs2,
                                          size_t vl);
vfloat16m4_t __riscv_vfmsub_vv_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                          vfloat16m4_t vs1, vfloat16m4_t vs2,
                                          size_t vl);
vfloat16m4_t __riscv_vfmsub_vf_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                          _Float16 rs1, vfloat16m4_t vs2,
                                          size_t vl);
vfloat16m8_t __riscv_vfmsub_vv_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                          vfloat16m8_t vs1, vfloat16m8_t vs2,
                                          size_t vl);
vfloat16m8_t __riscv_vfmsub_vf_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                          _Float16 rs1, vfloat16m8_t vs2,
                                          size_t vl);
/* 32-bit float vector types (f32mf2..f32m8); `vf` scalar is float. */
vfloat32mf2_t __riscv_vfmsub_vv_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs1,
                                            vfloat32mf2_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfmsub_vf_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                            float rs1, vfloat32mf2_t vs2,
                                            size_t vl);
vfloat32m1_t __riscv_vfmsub_vv_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs1, vfloat32m1_t vs2,
                                          size_t vl);
vfloat32m1_t __riscv_vfmsub_vf_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                          float rs1, vfloat32m1_t vs2,
                                          size_t vl);
vfloat32m2_t __riscv_vfmsub_vv_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs1, vfloat32m2_t vs2,
                                          size_t vl);
vfloat32m2_t __riscv_vfmsub_vf_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                          float rs1, vfloat32m2_t vs2,
                                          size_t vl);
vfloat32m4_t __riscv_vfmsub_vv_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs1, vfloat32m4_t vs2,
                                          size_t vl);
vfloat32m4_t __riscv_vfmsub_vf_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                          float rs1, vfloat32m4_t vs2,
                                          size_t vl);
vfloat32m8_t __riscv_vfmsub_vv_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs1, vfloat32m8_t vs2,
                                          size_t vl);
vfloat32m8_t __riscv_vfmsub_vf_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                          float rs1, vfloat32m8_t vs2,
                                          size_t vl);
/* 64-bit float vector types (f64m1 onward); `vf` scalar is double. */
vfloat64m1_t __riscv_vfmsub_vv_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs1, vfloat64m1_t vs2,
                                          size_t vl);
vfloat64m1_t __riscv_vfmsub_vf_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                          double rs1, vfloat64m1_t vs2,
                                          size_t vl);
vfloat64m2_t __riscv_vfmsub_vv_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs1, vfloat64m2_t vs2,
                                          size_t vl);
vfloat64m2_t __riscv_vfmsub_vf_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                          double rs1, vfloat64m2_t vs2,
                                          size_t vl);
vfloat64m4_t __riscv_vfmsub_vv_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs1, vfloat64m4_t vs2,
                                          size_t vl);
vfloat64m4_t __riscv_vfmsub_vf_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                          double rs1, vfloat64m4_t vs2,
                                          size_t vl);
vfloat64m8_t __riscv_vfmsub_vv_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs1, vfloat64m8_t vs2,
                                          size_t vl);
vfloat64m8_t __riscv_vfmsub_vf_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                          double rs1, vfloat64m8_t vs2,
                                          size_t vl);
// __riscv_vfnmsub_{vv,vf}_<type>_tumu prototypes for f16mf4 through f64m8.
// Every prototype takes a mask vm, a vector operand vd whose type is also
// the return type, a first source (vector vs1 for _vv, scalar rs1 for _vf),
// a second vector source vs2 and a size_t vl.
// The scalar type follows the element width: _Float16, float or double.
// NOTE(review): the arithmetic is not visible in this listing; the RISC-V V
// spec describes vfnmsub as vd[i] = -(vs1[i] * vd[i]) + vs2[i], and _tumu is
// presumably the tail-undisturbed/mask-undisturbed policy -- confirm.
vfloat16mf4_t __riscv_vfnmsub_vv_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                             vfloat16mf4_t vs1,
                                             vfloat16mf4_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfnmsub_vf_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                             _Float16 rs1, vfloat16mf4_t vs2,
                                             size_t vl);
vfloat16mf2_t __riscv_vfnmsub_vv_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                             vfloat16mf2_t vs1,
                                             vfloat16mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmsub_vf_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                             _Float16 rs1, vfloat16mf2_t vs2,
                                             size_t vl);
vfloat16m1_t __riscv_vfnmsub_vv_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                           vfloat16m1_t vs1, vfloat16m1_t vs2,
                                           size_t vl);
vfloat16m1_t __riscv_vfnmsub_vf_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                           _Float16 rs1, vfloat16m1_t vs2,
                                           size_t vl);
vfloat16m2_t __riscv_vfnmsub_vv_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                           vfloat16m2_t vs1, vfloat16m2_t vs2,
                                           size_t vl);
vfloat16m2_t __riscv_vfnmsub_vf_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                           _Float16 rs1, vfloat16m2_t vs2,
                                           size_t vl);
vfloat16m4_t __riscv_vfnmsub_vv_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                           vfloat16m4_t vs1, vfloat16m4_t vs2,
                                           size_t vl);
vfloat16m4_t __riscv_vfnmsub_vf_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                           _Float16 rs1, vfloat16m4_t vs2,
                                           size_t vl);
vfloat16m8_t __riscv_vfnmsub_vv_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                           vfloat16m8_t vs1, vfloat16m8_t vs2,
                                           size_t vl);
vfloat16m8_t __riscv_vfnmsub_vf_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                           _Float16 rs1, vfloat16m8_t vs2,
                                           size_t vl);
vfloat32mf2_t __riscv_vfnmsub_vv_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat32mf2_t vs1,
                                             vfloat32mf2_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfnmsub_vf_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                             float rs1, vfloat32mf2_t vs2,
                                             size_t vl);
vfloat32m1_t __riscv_vfnmsub_vv_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat32m1_t vs1, vfloat32m1_t vs2,
                                           size_t vl);
vfloat32m1_t __riscv_vfnmsub_vf_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                           float rs1, vfloat32m1_t vs2,
                                           size_t vl);
vfloat32m2_t __riscv_vfnmsub_vv_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat32m2_t vs1, vfloat32m2_t vs2,
                                           size_t vl);
vfloat32m2_t __riscv_vfnmsub_vf_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                           float rs1, vfloat32m2_t vs2,
                                           size_t vl);
vfloat32m4_t __riscv_vfnmsub_vv_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat32m4_t vs1, vfloat32m4_t vs2,
                                           size_t vl);
vfloat32m4_t __riscv_vfnmsub_vf_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                           float rs1, vfloat32m4_t vs2,
                                           size_t vl);
vfloat32m8_t __riscv_vfnmsub_vv_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat32m8_t vs1, vfloat32m8_t vs2,
                                           size_t vl);
vfloat32m8_t __riscv_vfnmsub_vf_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                           float rs1, vfloat32m8_t vs2,
                                           size_t vl);
vfloat64m1_t __riscv_vfnmsub_vv_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat64m1_t vs1, vfloat64m1_t vs2,
                                           size_t vl);
vfloat64m1_t __riscv_vfnmsub_vf_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                           double rs1, vfloat64m1_t vs2,
                                           size_t vl);
vfloat64m2_t __riscv_vfnmsub_vv_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat64m2_t vs1, vfloat64m2_t vs2,
                                           size_t vl);
vfloat64m2_t __riscv_vfnmsub_vf_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                           double rs1, vfloat64m2_t vs2,
                                           size_t vl);
vfloat64m4_t __riscv_vfnmsub_vv_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat64m4_t vs1, vfloat64m4_t vs2,
                                           size_t vl);
vfloat64m4_t __riscv_vfnmsub_vf_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                           double rs1, vfloat64m4_t vs2,
                                           size_t vl);
vfloat64m8_t __riscv_vfnmsub_vv_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat64m8_t vs1, vfloat64m8_t vs2,
                                           size_t vl);
vfloat64m8_t __riscv_vfnmsub_vf_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                           double rs1, vfloat64m8_t vs2,
                                           size_t vl);
// masked functions: `_mu`-suffixed variants, each taking a mask `vm` as its first argument
// __riscv_vfmacc_{vv,vf}_<type>_mu prototypes for f16mf4 through f64m8.
// Every prototype takes a mask vm, a vector operand vd whose type is also
// the return type, a first source (vector vs1 for _vv, scalar rs1 for _vf),
// a second vector source vs2 and a size_t vl.
// The scalar type follows the element width: _Float16, float or double.
// NOTE(review): the arithmetic is not visible in this listing; the RISC-V V
// spec describes vfmacc as vd[i] = (vs1[i] * vs2[i]) + vd[i], and _mu is
// presumably the mask-undisturbed policy -- confirm.
vfloat16mf4_t __riscv_vfmacc_vv_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                          vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                          size_t vl);
vfloat16mf4_t __riscv_vfmacc_vf_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                          _Float16 rs1, vfloat16mf4_t vs2,
                                          size_t vl);
vfloat16mf2_t __riscv_vfmacc_vv_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                          vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                          size_t vl);
vfloat16mf2_t __riscv_vfmacc_vf_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                          _Float16 rs1, vfloat16mf2_t vs2,
                                          size_t vl);
vfloat16m1_t __riscv_vfmacc_vv_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                        vfloat16m1_t vs1, vfloat16m1_t vs2,
                                        size_t vl);
vfloat16m1_t __riscv_vfmacc_vf_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                        _Float16 rs1, vfloat16m1_t vs2,
                                        size_t vl);
vfloat16m2_t __riscv_vfmacc_vv_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                        vfloat16m2_t vs1, vfloat16m2_t vs2,
                                        size_t vl);
vfloat16m2_t __riscv_vfmacc_vf_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                        _Float16 rs1, vfloat16m2_t vs2,
                                        size_t vl);
vfloat16m4_t __riscv_vfmacc_vv_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                        vfloat16m4_t vs1, vfloat16m4_t vs2,
                                        size_t vl);
vfloat16m4_t __riscv_vfmacc_vf_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                        _Float16 rs1, vfloat16m4_t vs2,
                                        size_t vl);
vfloat16m8_t __riscv_vfmacc_vv_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                        vfloat16m8_t vs1, vfloat16m8_t vs2,
                                        size_t vl);
vfloat16m8_t __riscv_vfmacc_vf_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                        _Float16 rs1, vfloat16m8_t vs2,
                                        size_t vl);
vfloat32mf2_t __riscv_vfmacc_vv_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                          size_t vl);
vfloat32mf2_t __riscv_vfmacc_vf_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                          float rs1, vfloat32mf2_t vs2,
                                          size_t vl);
vfloat32m1_t __riscv_vfmacc_vv_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat32m1_t vs1, vfloat32m1_t vs2,
                                        size_t vl);
vfloat32m1_t __riscv_vfmacc_vf_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                        float rs1, vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmacc_vv_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat32m2_t vs1, vfloat32m2_t vs2,
                                        size_t vl);
vfloat32m2_t __riscv_vfmacc_vf_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                        float rs1, vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmacc_vv_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat32m4_t vs1, vfloat32m4_t vs2,
                                        size_t vl);
vfloat32m4_t __riscv_vfmacc_vf_f32m4_mu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                        vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmacc_vv_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat32m8_t vs1, vfloat32m8_t vs2,
                                        size_t vl);
vfloat32m8_t __riscv_vfmacc_vf_f32m8_mu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                        vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmacc_vv_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat64m1_t vs1, vfloat64m1_t vs2,
                                        size_t vl);
vfloat64m1_t __riscv_vfmacc_vf_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                        double rs1, vfloat64m1_t vs2,
                                        size_t vl);
vfloat64m2_t __riscv_vfmacc_vv_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat64m2_t vs1, vfloat64m2_t vs2,
                                        size_t vl);
vfloat64m2_t __riscv_vfmacc_vf_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                        double rs1, vfloat64m2_t vs2,
                                        size_t vl);
vfloat64m4_t __riscv_vfmacc_vv_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat64m4_t vs1, vfloat64m4_t vs2,
                                        size_t vl);
vfloat64m4_t __riscv_vfmacc_vf_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                        double rs1, vfloat64m4_t vs2,
                                        size_t vl);
vfloat64m8_t __riscv_vfmacc_vv_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat64m8_t vs1, vfloat64m8_t vs2,
                                        size_t vl);
vfloat64m8_t __riscv_vfmacc_vf_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                        double rs1, vfloat64m8_t vs2,
                                        size_t vl);
// __riscv_vfnmacc_{vv,vf}_<type>_mu prototypes for f16mf4 through f64m8.
// Every prototype takes a mask vm, a vector operand vd whose type is also
// the return type, a first source (vector vs1 for _vv, scalar rs1 for _vf),
// a second vector source vs2 and a size_t vl.
// The scalar type follows the element width: _Float16, float or double.
// NOTE(review): the arithmetic is not visible in this listing; the RISC-V V
// spec describes vfnmacc as vd[i] = -(vs1[i] * vs2[i]) - vd[i], and _mu is
// presumably the mask-undisturbed policy -- confirm.
vfloat16mf4_t __riscv_vfnmacc_vv_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                           vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                           size_t vl);
vfloat16mf4_t __riscv_vfnmacc_vf_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                           _Float16 rs1, vfloat16mf4_t vs2,
                                           size_t vl);
vfloat16mf2_t __riscv_vfnmacc_vv_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                           vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                           size_t vl);
vfloat16mf2_t __riscv_vfnmacc_vf_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                           _Float16 rs1, vfloat16mf2_t vs2,
                                           size_t vl);
vfloat16m1_t __riscv_vfnmacc_vv_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                         vfloat16m1_t vs1, vfloat16m1_t vs2,
                                         size_t vl);
vfloat16m1_t __riscv_vfnmacc_vf_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                         _Float16 rs1, vfloat16m1_t vs2,
                                         size_t vl);
vfloat16m2_t __riscv_vfnmacc_vv_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                         vfloat16m2_t vs1, vfloat16m2_t vs2,
                                         size_t vl);
vfloat16m2_t __riscv_vfnmacc_vf_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                         _Float16 rs1, vfloat16m2_t vs2,
                                         size_t vl);
vfloat16m4_t __riscv_vfnmacc_vv_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                         vfloat16m4_t vs1, vfloat16m4_t vs2,
                                         size_t vl);
vfloat16m4_t __riscv_vfnmacc_vf_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                         _Float16 rs1, vfloat16m4_t vs2,
                                         size_t vl);
vfloat16m8_t __riscv_vfnmacc_vv_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                         vfloat16m8_t vs1, vfloat16m8_t vs2,
                                         size_t vl);
vfloat16m8_t __riscv_vfnmacc_vf_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                         _Float16 rs1, vfloat16m8_t vs2,
                                         size_t vl);
vfloat32mf2_t __riscv_vfnmacc_vv_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                           size_t vl);
vfloat32mf2_t __riscv_vfnmacc_vf_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                           float rs1, vfloat32mf2_t vs2,
                                           size_t vl);
vfloat32m1_t __riscv_vfnmacc_vv_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs1, vfloat32m1_t vs2,
                                         size_t vl);
vfloat32m1_t __riscv_vfnmacc_vf_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                         float rs1, vfloat32m1_t vs2,
                                         size_t vl);
vfloat32m2_t __riscv_vfnmacc_vv_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs1, vfloat32m2_t vs2,
                                         size_t vl);
vfloat32m2_t __riscv_vfnmacc_vf_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                         float rs1, vfloat32m2_t vs2,
                                         size_t vl);
vfloat32m4_t __riscv_vfnmacc_vv_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs1, vfloat32m4_t vs2,
                                         size_t vl);
vfloat32m4_t __riscv_vfnmacc_vf_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                         float rs1, vfloat32m4_t vs2,
                                         size_t vl);
vfloat32m8_t __riscv_vfnmacc_vv_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs1, vfloat32m8_t vs2,
                                         size_t vl);
vfloat32m8_t __riscv_vfnmacc_vf_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                         float rs1, vfloat32m8_t vs2,
                                         size_t vl);
vfloat64m1_t __riscv_vfnmacc_vv_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs1, vfloat64m1_t vs2,
                                         size_t vl);
vfloat64m1_t __riscv_vfnmacc_vf_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                         double rs1, vfloat64m1_t vs2,
                                         size_t vl);
vfloat64m2_t __riscv_vfnmacc_vv_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs1, vfloat64m2_t vs2,
                                         size_t vl);
vfloat64m2_t __riscv_vfnmacc_vf_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                         double rs1, vfloat64m2_t vs2,
                                         size_t vl);
vfloat64m4_t __riscv_vfnmacc_vv_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs1, vfloat64m4_t vs2,
                                         size_t vl);
vfloat64m4_t __riscv_vfnmacc_vf_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                         double rs1, vfloat64m4_t vs2,
                                         size_t vl);
vfloat64m8_t __riscv_vfnmacc_vv_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs1, vfloat64m8_t vs2,
                                         size_t vl);
vfloat64m8_t __riscv_vfnmacc_vf_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                         double rs1, vfloat64m8_t vs2,
                                         size_t vl);
// __riscv_vfmsac_{vv,vf}_<type>_mu prototypes for f16mf4 through f64m8.
// Every prototype takes a mask vm, a vector operand vd whose type is also
// the return type, a first source (vector vs1 for _vv, scalar rs1 for _vf),
// a second vector source vs2 and a size_t vl.
// The scalar type follows the element width: _Float16, float or double.
// NOTE(review): the arithmetic is not visible in this listing; the RISC-V V
// spec describes vfmsac as vd[i] = (vs1[i] * vs2[i]) - vd[i], and _mu is
// presumably the mask-undisturbed policy -- confirm.
vfloat16mf4_t __riscv_vfmsac_vv_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                          vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                          size_t vl);
vfloat16mf4_t __riscv_vfmsac_vf_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                          _Float16 rs1, vfloat16mf4_t vs2,
                                          size_t vl);
vfloat16mf2_t __riscv_vfmsac_vv_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                          vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                          size_t vl);
vfloat16mf2_t __riscv_vfmsac_vf_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                          _Float16 rs1, vfloat16mf2_t vs2,
                                          size_t vl);
vfloat16m1_t __riscv_vfmsac_vv_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                        vfloat16m1_t vs1, vfloat16m1_t vs2,
                                        size_t vl);
vfloat16m1_t __riscv_vfmsac_vf_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                        _Float16 rs1, vfloat16m1_t vs2,
                                        size_t vl);
vfloat16m2_t __riscv_vfmsac_vv_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                        vfloat16m2_t vs1, vfloat16m2_t vs2,
                                        size_t vl);
vfloat16m2_t __riscv_vfmsac_vf_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                        _Float16 rs1, vfloat16m2_t vs2,
                                        size_t vl);
vfloat16m4_t __riscv_vfmsac_vv_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                        vfloat16m4_t vs1, vfloat16m4_t vs2,
                                        size_t vl);
vfloat16m4_t __riscv_vfmsac_vf_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                        _Float16 rs1, vfloat16m4_t vs2,
                                        size_t vl);
vfloat16m8_t __riscv_vfmsac_vv_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                        vfloat16m8_t vs1, vfloat16m8_t vs2,
                                        size_t vl);
vfloat16m8_t __riscv_vfmsac_vf_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                        _Float16 rs1, vfloat16m8_t vs2,
                                        size_t vl);
vfloat32mf2_t __riscv_vfmsac_vv_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                          size_t vl);
vfloat32mf2_t __riscv_vfmsac_vf_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                          float rs1, vfloat32mf2_t vs2,
                                          size_t vl);
vfloat32m1_t __riscv_vfmsac_vv_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat32m1_t vs1, vfloat32m1_t vs2,
                                        size_t vl);
vfloat32m1_t __riscv_vfmsac_vf_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                        float rs1, vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmsac_vv_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat32m2_t vs1, vfloat32m2_t vs2,
                                        size_t vl);
vfloat32m2_t __riscv_vfmsac_vf_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                        float rs1, vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmsac_vv_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat32m4_t vs1, vfloat32m4_t vs2,
                                        size_t vl);
vfloat32m4_t __riscv_vfmsac_vf_f32m4_mu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                        vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmsac_vv_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat32m8_t vs1, vfloat32m8_t vs2,
                                        size_t vl);
vfloat32m8_t __riscv_vfmsac_vf_f32m8_mu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                        vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmsac_vv_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat64m1_t vs1, vfloat64m1_t vs2,
                                        size_t vl);
vfloat64m1_t __riscv_vfmsac_vf_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                        double rs1, vfloat64m1_t vs2,
                                        size_t vl);
vfloat64m2_t __riscv_vfmsac_vv_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat64m2_t vs1, vfloat64m2_t vs2,
                                        size_t vl);
vfloat64m2_t __riscv_vfmsac_vf_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                        double rs1, vfloat64m2_t vs2,
                                        size_t vl);
vfloat64m4_t __riscv_vfmsac_vv_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat64m4_t vs1, vfloat64m4_t vs2,
                                        size_t vl);
vfloat64m4_t __riscv_vfmsac_vf_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                        double rs1, vfloat64m4_t vs2,
                                        size_t vl);
vfloat64m8_t __riscv_vfmsac_vv_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat64m8_t vs1, vfloat64m8_t vs2,
                                        size_t vl);
vfloat64m8_t __riscv_vfmsac_vf_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                        double rs1, vfloat64m8_t vs2,
                                        size_t vl);
// __riscv_vfnmsac_{vv,vf}_<type>_mu prototypes for f16mf4 through f64m8.
// Every prototype takes a mask vm, a vector operand vd whose type is also
// the return type, a first source (vector vs1 for _vv, scalar rs1 for _vf),
// a second vector source vs2 and a size_t vl.
// The scalar type follows the element width: _Float16, float or double.
// NOTE(review): the arithmetic is not visible in this listing; the RISC-V V
// spec describes vfnmsac as vd[i] = -(vs1[i] * vs2[i]) + vd[i], and _mu is
// presumably the mask-undisturbed policy -- confirm.
vfloat16mf4_t __riscv_vfnmsac_vv_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                           vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                           size_t vl);
vfloat16mf4_t __riscv_vfnmsac_vf_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                           _Float16 rs1, vfloat16mf4_t vs2,
                                           size_t vl);
vfloat16mf2_t __riscv_vfnmsac_vv_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                           vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                           size_t vl);
vfloat16mf2_t __riscv_vfnmsac_vf_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                           _Float16 rs1, vfloat16mf2_t vs2,
                                           size_t vl);
vfloat16m1_t __riscv_vfnmsac_vv_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                         vfloat16m1_t vs1, vfloat16m1_t vs2,
                                         size_t vl);
vfloat16m1_t __riscv_vfnmsac_vf_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                         _Float16 rs1, vfloat16m1_t vs2,
                                         size_t vl);
vfloat16m2_t __riscv_vfnmsac_vv_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                         vfloat16m2_t vs1, vfloat16m2_t vs2,
                                         size_t vl);
vfloat16m2_t __riscv_vfnmsac_vf_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                         _Float16 rs1, vfloat16m2_t vs2,
                                         size_t vl);
vfloat16m4_t __riscv_vfnmsac_vv_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                         vfloat16m4_t vs1, vfloat16m4_t vs2,
                                         size_t vl);
vfloat16m4_t __riscv_vfnmsac_vf_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                         _Float16 rs1, vfloat16m4_t vs2,
                                         size_t vl);
vfloat16m8_t __riscv_vfnmsac_vv_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                         vfloat16m8_t vs1, vfloat16m8_t vs2,
                                         size_t vl);
vfloat16m8_t __riscv_vfnmsac_vf_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                         _Float16 rs1, vfloat16m8_t vs2,
                                         size_t vl);
vfloat32mf2_t __riscv_vfnmsac_vv_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                           size_t vl);
vfloat32mf2_t __riscv_vfnmsac_vf_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                           float rs1, vfloat32mf2_t vs2,
                                           size_t vl);
vfloat32m1_t __riscv_vfnmsac_vv_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs1, vfloat32m1_t vs2,
                                         size_t vl);
vfloat32m1_t __riscv_vfnmsac_vf_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                         float rs1, vfloat32m1_t vs2,
                                         size_t vl);
vfloat32m2_t __riscv_vfnmsac_vv_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs1, vfloat32m2_t vs2,
                                         size_t vl);
vfloat32m2_t __riscv_vfnmsac_vf_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                         float rs1, vfloat32m2_t vs2,
                                         size_t vl);
vfloat32m4_t __riscv_vfnmsac_vv_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs1, vfloat32m4_t vs2,
                                         size_t vl);
vfloat32m4_t __riscv_vfnmsac_vf_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                         float rs1, vfloat32m4_t vs2,
                                         size_t vl);
vfloat32m8_t __riscv_vfnmsac_vv_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs1, vfloat32m8_t vs2,
                                         size_t vl);
vfloat32m8_t __riscv_vfnmsac_vf_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                         float rs1, vfloat32m8_t vs2,
                                         size_t vl);
vfloat64m1_t __riscv_vfnmsac_vv_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs1, vfloat64m1_t vs2,
                                         size_t vl);
vfloat64m1_t __riscv_vfnmsac_vf_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                         double rs1, vfloat64m1_t vs2,
                                         size_t vl);
vfloat64m2_t __riscv_vfnmsac_vv_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs1, vfloat64m2_t vs2,
                                         size_t vl);
vfloat64m2_t __riscv_vfnmsac_vf_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                         double rs1, vfloat64m2_t vs2,
                                         size_t vl);
vfloat64m4_t __riscv_vfnmsac_vv_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs1, vfloat64m4_t vs2,
                                         size_t vl);
vfloat64m4_t __riscv_vfnmsac_vf_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                         double rs1, vfloat64m4_t vs2,
                                         size_t vl);
vfloat64m8_t __riscv_vfnmsac_vv_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs1, vfloat64m8_t vs2,
                                         size_t vl);
vfloat64m8_t __riscv_vfnmsac_vf_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                         double rs1, vfloat64m8_t vs2,
                                         size_t vl);
// vfmadd, `_mu` variants, f16 element type (f16mf4 .. f16m8).
// Each LMUL has a vector-vector (`_vv`, operand `vs1`) and a vector-scalar
// (`_vf`, operand `_Float16 rs1`) form. All take a mask `vm` first, return
// the same type as `vd`, and end with the length `vl`. The mask type narrows
// from vbool64_t (mf4) to vbool2_t (m8) as LMUL grows.
// NOTE(review): arithmetic/masking semantics come from the RVV spec, not
// from this listing -- confirm there.
vfloat16mf4_t __riscv_vfmadd_vv_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                          vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                          size_t vl);
vfloat16mf4_t __riscv_vfmadd_vf_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                          _Float16 rs1, vfloat16mf4_t vs2,
                                          size_t vl);
vfloat16mf2_t __riscv_vfmadd_vv_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                          vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                          size_t vl);
vfloat16mf2_t __riscv_vfmadd_vf_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                          _Float16 rs1, vfloat16mf2_t vs2,
                                          size_t vl);
vfloat16m1_t __riscv_vfmadd_vv_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                        vfloat16m1_t vs1, vfloat16m1_t vs2,
                                        size_t vl);
vfloat16m1_t __riscv_vfmadd_vf_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                        _Float16 rs1, vfloat16m1_t vs2,
                                        size_t vl);
vfloat16m2_t __riscv_vfmadd_vv_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                        vfloat16m2_t vs1, vfloat16m2_t vs2,
                                        size_t vl);
vfloat16m2_t __riscv_vfmadd_vf_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                        _Float16 rs1, vfloat16m2_t vs2,
                                        size_t vl);
vfloat16m4_t __riscv_vfmadd_vv_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                        vfloat16m4_t vs1, vfloat16m4_t vs2,
                                        size_t vl);
vfloat16m4_t __riscv_vfmadd_vf_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                        _Float16 rs1, vfloat16m4_t vs2,
                                        size_t vl);
vfloat16m8_t __riscv_vfmadd_vv_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                        vfloat16m8_t vs1, vfloat16m8_t vs2,
                                        size_t vl);
vfloat16m8_t __riscv_vfmadd_vf_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                        _Float16 rs1, vfloat16m8_t vs2,
                                        size_t vl);
// vfmadd, `_mu` variants, f32 element type (f32mf2 .. f32m8).
// Each LMUL has a vector-vector (`_vv`, operand `vs1`) and a vector-scalar
// (`_vf`, operand `float rs1`) form. All take a mask `vm` first, return the
// same type as `vd`, and end with the length `vl`. The mask type narrows
// from vbool64_t (mf2) to vbool4_t (m8) as LMUL grows.
// NOTE(review): arithmetic/masking semantics come from the RVV spec, not
// from this listing -- confirm there.
vfloat32mf2_t __riscv_vfmadd_vv_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                          size_t vl);
vfloat32mf2_t __riscv_vfmadd_vf_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                          float rs1, vfloat32mf2_t vs2,
                                          size_t vl);
vfloat32m1_t __riscv_vfmadd_vv_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat32m1_t vs1, vfloat32m1_t vs2,
                                        size_t vl);
vfloat32m1_t __riscv_vfmadd_vf_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                        float rs1, vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmadd_vv_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat32m2_t vs1, vfloat32m2_t vs2,
                                        size_t vl);
vfloat32m2_t __riscv_vfmadd_vf_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                        float rs1, vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmadd_vv_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat32m4_t vs1, vfloat32m4_t vs2,
                                        size_t vl);
vfloat32m4_t __riscv_vfmadd_vf_f32m4_mu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                        vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmadd_vv_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat32m8_t vs1, vfloat32m8_t vs2,
                                        size_t vl);
vfloat32m8_t __riscv_vfmadd_vf_f32m8_mu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                        vfloat32m8_t vs2, size_t vl);
// vfmadd, `_mu` variants, f64 element type (f64m1 .. f64m8).
// Each LMUL has a vector-vector (`_vv`, operand `vs1`) and a vector-scalar
// (`_vf`, operand `double rs1`) form. All take a mask `vm` first, return the
// same type as `vd`, and end with the length `vl`. The mask type narrows
// from vbool64_t (m1) to vbool8_t (m8) as LMUL grows.
// NOTE(review): arithmetic/masking semantics come from the RVV spec, not
// from this listing -- confirm there.
vfloat64m1_t __riscv_vfmadd_vv_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat64m1_t vs1, vfloat64m1_t vs2,
                                        size_t vl);
vfloat64m1_t __riscv_vfmadd_vf_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                        double rs1, vfloat64m1_t vs2,
                                        size_t vl);
vfloat64m2_t __riscv_vfmadd_vv_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat64m2_t vs1, vfloat64m2_t vs2,
                                        size_t vl);
vfloat64m2_t __riscv_vfmadd_vf_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                        double rs1, vfloat64m2_t vs2,
                                        size_t vl);
vfloat64m4_t __riscv_vfmadd_vv_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat64m4_t vs1, vfloat64m4_t vs2,
                                        size_t vl);
vfloat64m4_t __riscv_vfmadd_vf_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                        double rs1, vfloat64m4_t vs2,
                                        size_t vl);
vfloat64m8_t __riscv_vfmadd_vv_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat64m8_t vs1, vfloat64m8_t vs2,
                                        size_t vl);
vfloat64m8_t __riscv_vfmadd_vf_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                        double rs1, vfloat64m8_t vs2,
                                        size_t vl);
// vfnmadd, `_mu` variants, f16 element type (f16mf4 .. f16m8).
// Each LMUL has a vector-vector (`_vv`, operand `vs1`) and a vector-scalar
// (`_vf`, operand `_Float16 rs1`) form. All take a mask `vm` first, return
// the same type as `vd`, and end with the length `vl`. The mask type narrows
// from vbool64_t (mf4) to vbool2_t (m8) as LMUL grows.
// NOTE(review): arithmetic/masking semantics come from the RVV spec, not
// from this listing -- confirm there.
vfloat16mf4_t __riscv_vfnmadd_vv_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                           vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                           size_t vl);
vfloat16mf4_t __riscv_vfnmadd_vf_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                           _Float16 rs1, vfloat16mf4_t vs2,
                                           size_t vl);
vfloat16mf2_t __riscv_vfnmadd_vv_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                           vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                           size_t vl);
vfloat16mf2_t __riscv_vfnmadd_vf_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                           _Float16 rs1, vfloat16mf2_t vs2,
                                           size_t vl);
vfloat16m1_t __riscv_vfnmadd_vv_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                         vfloat16m1_t vs1, vfloat16m1_t vs2,
                                         size_t vl);
vfloat16m1_t __riscv_vfnmadd_vf_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                         _Float16 rs1, vfloat16m1_t vs2,
                                         size_t vl);
vfloat16m2_t __riscv_vfnmadd_vv_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                         vfloat16m2_t vs1, vfloat16m2_t vs2,
                                         size_t vl);
vfloat16m2_t __riscv_vfnmadd_vf_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                         _Float16 rs1, vfloat16m2_t vs2,
                                         size_t vl);
vfloat16m4_t __riscv_vfnmadd_vv_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                         vfloat16m4_t vs1, vfloat16m4_t vs2,
                                         size_t vl);
vfloat16m4_t __riscv_vfnmadd_vf_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                         _Float16 rs1, vfloat16m4_t vs2,
                                         size_t vl);
vfloat16m8_t __riscv_vfnmadd_vv_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                         vfloat16m8_t vs1, vfloat16m8_t vs2,
                                         size_t vl);
vfloat16m8_t __riscv_vfnmadd_vf_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                         _Float16 rs1, vfloat16m8_t vs2,
                                         size_t vl);
// vfnmadd, `_mu` variants, f32 element type (f32mf2 .. f32m8).
// Each LMUL has a vector-vector (`_vv`, operand `vs1`) and a vector-scalar
// (`_vf`, operand `float rs1`) form. All take a mask `vm` first, return the
// same type as `vd`, and end with the length `vl`. The mask type narrows
// from vbool64_t (mf2) to vbool4_t (m8) as LMUL grows.
// NOTE(review): arithmetic/masking semantics come from the RVV spec, not
// from this listing -- confirm there.
vfloat32mf2_t __riscv_vfnmadd_vv_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                           size_t vl);
vfloat32mf2_t __riscv_vfnmadd_vf_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                           float rs1, vfloat32mf2_t vs2,
                                           size_t vl);
vfloat32m1_t __riscv_vfnmadd_vv_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs1, vfloat32m1_t vs2,
                                         size_t vl);
vfloat32m1_t __riscv_vfnmadd_vf_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                         float rs1, vfloat32m1_t vs2,
                                         size_t vl);
vfloat32m2_t __riscv_vfnmadd_vv_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs1, vfloat32m2_t vs2,
                                         size_t vl);
vfloat32m2_t __riscv_vfnmadd_vf_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                         float rs1, vfloat32m2_t vs2,
                                         size_t vl);
vfloat32m4_t __riscv_vfnmadd_vv_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs1, vfloat32m4_t vs2,
                                         size_t vl);
vfloat32m4_t __riscv_vfnmadd_vf_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                         float rs1, vfloat32m4_t vs2,
                                         size_t vl);
vfloat32m8_t __riscv_vfnmadd_vv_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs1, vfloat32m8_t vs2,
                                         size_t vl);
vfloat32m8_t __riscv_vfnmadd_vf_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                         float rs1, vfloat32m8_t vs2,
                                         size_t vl);
// vfnmadd, `_mu` variants, f64 element type (f64m1 .. f64m8).
// Each LMUL has a vector-vector (`_vv`, operand `vs1`) and a vector-scalar
// (`_vf`, operand `double rs1`) form. All take a mask `vm` first, return the
// same type as `vd`, and end with the length `vl`. The mask type narrows
// from vbool64_t (m1) to vbool8_t (m8) as LMUL grows.
// NOTE(review): arithmetic/masking semantics come from the RVV spec, not
// from this listing -- confirm there.
vfloat64m1_t __riscv_vfnmadd_vv_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs1, vfloat64m1_t vs2,
                                         size_t vl);
vfloat64m1_t __riscv_vfnmadd_vf_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                         double rs1, vfloat64m1_t vs2,
                                         size_t vl);
vfloat64m2_t __riscv_vfnmadd_vv_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs1, vfloat64m2_t vs2,
                                         size_t vl);
vfloat64m2_t __riscv_vfnmadd_vf_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                         double rs1, vfloat64m2_t vs2,
                                         size_t vl);
vfloat64m4_t __riscv_vfnmadd_vv_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs1, vfloat64m4_t vs2,
                                         size_t vl);
vfloat64m4_t __riscv_vfnmadd_vf_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                         double rs1, vfloat64m4_t vs2,
                                         size_t vl);
vfloat64m8_t __riscv_vfnmadd_vv_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs1, vfloat64m8_t vs2,
                                         size_t vl);
vfloat64m8_t __riscv_vfnmadd_vf_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                         double rs1, vfloat64m8_t vs2,
                                         size_t vl);
// vfmsub, `_mu` variants, f16 element type (f16mf4 .. f16m8).
// Each LMUL has a vector-vector (`_vv`, operand `vs1`) and a vector-scalar
// (`_vf`, operand `_Float16 rs1`) form. All take a mask `vm` first, return
// the same type as `vd`, and end with the length `vl`. The mask type narrows
// from vbool64_t (mf4) to vbool2_t (m8) as LMUL grows.
// NOTE(review): arithmetic/masking semantics come from the RVV spec, not
// from this listing -- confirm there.
vfloat16mf4_t __riscv_vfmsub_vv_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                          vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                          size_t vl);
vfloat16mf4_t __riscv_vfmsub_vf_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                          _Float16 rs1, vfloat16mf4_t vs2,
                                          size_t vl);
vfloat16mf2_t __riscv_vfmsub_vv_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                          vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                          size_t vl);
vfloat16mf2_t __riscv_vfmsub_vf_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                          _Float16 rs1, vfloat16mf2_t vs2,
                                          size_t vl);
vfloat16m1_t __riscv_vfmsub_vv_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                        vfloat16m1_t vs1, vfloat16m1_t vs2,
                                        size_t vl);
vfloat16m1_t __riscv_vfmsub_vf_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                        _Float16 rs1, vfloat16m1_t vs2,
                                        size_t vl);
vfloat16m2_t __riscv_vfmsub_vv_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                        vfloat16m2_t vs1, vfloat16m2_t vs2,
                                        size_t vl);
vfloat16m2_t __riscv_vfmsub_vf_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                        _Float16 rs1, vfloat16m2_t vs2,
                                        size_t vl);
vfloat16m4_t __riscv_vfmsub_vv_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                        vfloat16m4_t vs1, vfloat16m4_t vs2,
                                        size_t vl);
vfloat16m4_t __riscv_vfmsub_vf_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                        _Float16 rs1, vfloat16m4_t vs2,
                                        size_t vl);
vfloat16m8_t __riscv_vfmsub_vv_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                        vfloat16m8_t vs1, vfloat16m8_t vs2,
                                        size_t vl);
vfloat16m8_t __riscv_vfmsub_vf_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                        _Float16 rs1, vfloat16m8_t vs2,
                                        size_t vl);
// vfmsub, `_mu` variants, f32 element type (f32mf2 .. f32m8).
// Each LMUL has a vector-vector (`_vv`, operand `vs1`) and a vector-scalar
// (`_vf`, operand `float rs1`) form. All take a mask `vm` first, return the
// same type as `vd`, and end with the length `vl`. The mask type narrows
// from vbool64_t (mf2) to vbool4_t (m8) as LMUL grows.
// NOTE(review): arithmetic/masking semantics come from the RVV spec, not
// from this listing -- confirm there.
vfloat32mf2_t __riscv_vfmsub_vv_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                          size_t vl);
vfloat32mf2_t __riscv_vfmsub_vf_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                          float rs1, vfloat32mf2_t vs2,
                                          size_t vl);
vfloat32m1_t __riscv_vfmsub_vv_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat32m1_t vs1, vfloat32m1_t vs2,
                                        size_t vl);
vfloat32m1_t __riscv_vfmsub_vf_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                        float rs1, vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmsub_vv_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat32m2_t vs1, vfloat32m2_t vs2,
                                        size_t vl);
vfloat32m2_t __riscv_vfmsub_vf_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                        float rs1, vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmsub_vv_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat32m4_t vs1, vfloat32m4_t vs2,
                                        size_t vl);
vfloat32m4_t __riscv_vfmsub_vf_f32m4_mu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                        vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmsub_vv_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat32m8_t vs1, vfloat32m8_t vs2,
                                        size_t vl);
vfloat32m8_t __riscv_vfmsub_vf_f32m8_mu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                        vfloat32m8_t vs2, size_t vl);
// vfmsub, `_mu` variants, f64 element type (f64m1 .. f64m8).
// Each LMUL has a vector-vector (`_vv`, operand `vs1`) and a vector-scalar
// (`_vf`, operand `double rs1`) form. All take a mask `vm` first, return the
// same type as `vd`, and end with the length `vl`. The mask type narrows
// from vbool64_t (m1) to vbool8_t (m8) as LMUL grows.
// NOTE(review): arithmetic/masking semantics come from the RVV spec, not
// from this listing -- confirm there.
vfloat64m1_t __riscv_vfmsub_vv_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat64m1_t vs1, vfloat64m1_t vs2,
                                        size_t vl);
vfloat64m1_t __riscv_vfmsub_vf_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                        double rs1, vfloat64m1_t vs2,
                                        size_t vl);
vfloat64m2_t __riscv_vfmsub_vv_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat64m2_t vs1, vfloat64m2_t vs2,
                                        size_t vl);
vfloat64m2_t __riscv_vfmsub_vf_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                        double rs1, vfloat64m2_t vs2,
                                        size_t vl);
vfloat64m4_t __riscv_vfmsub_vv_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat64m4_t vs1, vfloat64m4_t vs2,
                                        size_t vl);
vfloat64m4_t __riscv_vfmsub_vf_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                        double rs1, vfloat64m4_t vs2,
                                        size_t vl);
vfloat64m8_t __riscv_vfmsub_vv_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat64m8_t vs1, vfloat64m8_t vs2,
                                        size_t vl);
vfloat64m8_t __riscv_vfmsub_vf_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                        double rs1, vfloat64m8_t vs2,
                                        size_t vl);
// vfnmsub, `_mu` variants, f16 element type (f16mf4 .. f16m8).
// Each LMUL has a vector-vector (`_vv`, operand `vs1`) and a vector-scalar
// (`_vf`, operand `_Float16 rs1`) form. All take a mask `vm` first, return
// the same type as `vd`, and end with the length `vl`. The mask type narrows
// from vbool64_t (mf4) to vbool2_t (m8) as LMUL grows.
// NOTE(review): arithmetic/masking semantics come from the RVV spec, not
// from this listing -- confirm there.
vfloat16mf4_t __riscv_vfnmsub_vv_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                           vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                           size_t vl);
vfloat16mf4_t __riscv_vfnmsub_vf_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                           _Float16 rs1, vfloat16mf4_t vs2,
                                           size_t vl);
vfloat16mf2_t __riscv_vfnmsub_vv_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                           vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                           size_t vl);
vfloat16mf2_t __riscv_vfnmsub_vf_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                           _Float16 rs1, vfloat16mf2_t vs2,
                                           size_t vl);
vfloat16m1_t __riscv_vfnmsub_vv_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                         vfloat16m1_t vs1, vfloat16m1_t vs2,
                                         size_t vl);
vfloat16m1_t __riscv_vfnmsub_vf_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                         _Float16 rs1, vfloat16m1_t vs2,
                                         size_t vl);
vfloat16m2_t __riscv_vfnmsub_vv_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                         vfloat16m2_t vs1, vfloat16m2_t vs2,
                                         size_t vl);
vfloat16m2_t __riscv_vfnmsub_vf_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                         _Float16 rs1, vfloat16m2_t vs2,
                                         size_t vl);
vfloat16m4_t __riscv_vfnmsub_vv_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                         vfloat16m4_t vs1, vfloat16m4_t vs2,
                                         size_t vl);
vfloat16m4_t __riscv_vfnmsub_vf_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                         _Float16 rs1, vfloat16m4_t vs2,
                                         size_t vl);
vfloat16m8_t __riscv_vfnmsub_vv_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                         vfloat16m8_t vs1, vfloat16m8_t vs2,
                                         size_t vl);
vfloat16m8_t __riscv_vfnmsub_vf_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                         _Float16 rs1, vfloat16m8_t vs2,
                                         size_t vl);
// vfnmsub, `_mu` variants, f32 element type (f32mf2 .. f32m8).
// Each LMUL has a vector-vector (`_vv`, operand `vs1`) and a vector-scalar
// (`_vf`, operand `float rs1`) form. All take a mask `vm` first, return the
// same type as `vd`, and end with the length `vl`. The mask type narrows
// from vbool64_t (mf2) to vbool4_t (m8) as LMUL grows.
// NOTE(review): arithmetic/masking semantics come from the RVV spec, not
// from this listing -- confirm there.
vfloat32mf2_t __riscv_vfnmsub_vv_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                           size_t vl);
vfloat32mf2_t __riscv_vfnmsub_vf_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                           float rs1, vfloat32mf2_t vs2,
                                           size_t vl);
vfloat32m1_t __riscv_vfnmsub_vv_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs1, vfloat32m1_t vs2,
                                         size_t vl);
vfloat32m1_t __riscv_vfnmsub_vf_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                         float rs1, vfloat32m1_t vs2,
                                         size_t vl);
vfloat32m2_t __riscv_vfnmsub_vv_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs1, vfloat32m2_t vs2,
                                         size_t vl);
vfloat32m2_t __riscv_vfnmsub_vf_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                         float rs1, vfloat32m2_t vs2,
                                         size_t vl);
vfloat32m4_t __riscv_vfnmsub_vv_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs1, vfloat32m4_t vs2,
                                         size_t vl);
vfloat32m4_t __riscv_vfnmsub_vf_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                         float rs1, vfloat32m4_t vs2,
                                         size_t vl);
vfloat32m8_t __riscv_vfnmsub_vv_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs1, vfloat32m8_t vs2,
                                         size_t vl);
vfloat32m8_t __riscv_vfnmsub_vf_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                         float rs1, vfloat32m8_t vs2,
                                         size_t vl);
// vfnmsub, `_mu` variants, f64 element type (f64m1 .. f64m8).
// Each LMUL has a vector-vector (`_vv`, operand `vs1`) and a vector-scalar
// (`_vf`, operand `double rs1`) form. All take a mask `vm` first, return the
// same type as `vd`, and end with the length `vl`. The mask type narrows
// from vbool64_t (m1) to vbool8_t (m8) as LMUL grows.
// NOTE(review): arithmetic/masking semantics come from the RVV spec, not
// from this listing -- confirm there.
vfloat64m1_t __riscv_vfnmsub_vv_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs1, vfloat64m1_t vs2,
                                         size_t vl);
vfloat64m1_t __riscv_vfnmsub_vf_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                         double rs1, vfloat64m1_t vs2,
                                         size_t vl);
vfloat64m2_t __riscv_vfnmsub_vv_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs1, vfloat64m2_t vs2,
                                         size_t vl);
vfloat64m2_t __riscv_vfnmsub_vf_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                         double rs1, vfloat64m2_t vs2,
                                         size_t vl);
vfloat64m4_t __riscv_vfnmsub_vv_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs1, vfloat64m4_t vs2,
                                         size_t vl);
vfloat64m4_t __riscv_vfnmsub_vf_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                         double rs1, vfloat64m4_t vs2,
                                         size_t vl);
vfloat64m8_t __riscv_vfnmsub_vv_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs1, vfloat64m8_t vs2,
                                         size_t vl);
vfloat64m8_t __riscv_vfnmsub_vf_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                         double rs1, vfloat64m8_t vs2,
                                         size_t vl);
// vfmacc, `_rm_tu` variants, f16 element type (f16mf4 .. f16m8).
// Unlike the `_mu` declarations, these take no mask argument and add an
// `unsigned int frm` parameter before `vl`. Each LMUL has a vector-vector
// (`_vv`, operand `vs1`) and a vector-scalar (`_vf`, operand `_Float16 rs1`)
// form; the return type matches `vd`.
// NOTE(review): `frm` is presumably the floating-point rounding-mode
// selector; its accepted values are not shown here -- confirm against the
// intrinsics spec.
vfloat16mf4_t __riscv_vfmacc_vv_f16mf4_rm_tu(vfloat16mf4_t vd,
                                             vfloat16mf4_t vs1,
                                             vfloat16mf4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmacc_vf_f16mf4_rm_tu(vfloat16mf4_t vd, _Float16 rs1,
                                             vfloat16mf4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmacc_vv_f16mf2_rm_tu(vfloat16mf2_t vd,
                                             vfloat16mf2_t vs1,
                                             vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmacc_vf_f16mf2_rm_tu(vfloat16mf2_t vd, _Float16 rs1,
                                             vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmacc_vv_f16m1_rm_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                                           vfloat16m1_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m1_t __riscv_vfmacc_vf_f16m1_rm_tu(vfloat16m1_t vd, _Float16 rs1,
                                           vfloat16m1_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m2_t __riscv_vfmacc_vv_f16m2_rm_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                                           vfloat16m2_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m2_t __riscv_vfmacc_vf_f16m2_rm_tu(vfloat16m2_t vd, _Float16 rs1,
                                           vfloat16m2_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m4_t __riscv_vfmacc_vv_f16m4_rm_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                                           vfloat16m4_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m4_t __riscv_vfmacc_vf_f16m4_rm_tu(vfloat16m4_t vd, _Float16 rs1,
                                           vfloat16m4_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m8_t __riscv_vfmacc_vv_f16m8_rm_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                                           vfloat16m8_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m8_t __riscv_vfmacc_vf_f16m8_rm_tu(vfloat16m8_t vd, _Float16 rs1,
                                           vfloat16m8_t vs2, unsigned int frm,
                                           size_t vl);
// vfmacc, `_rm_tu` variants, f32 element type (f32mf2 .. f32m8).
// These take no mask argument and carry an `unsigned int frm` parameter
// before `vl`. Each LMUL has a vector-vector (`_vv`, operand `vs1`) and a
// vector-scalar (`_vf`, operand `float rs1`) form; the return type matches
// `vd`.
// NOTE(review): `frm` is presumably the floating-point rounding-mode
// selector; its accepted values are not shown here -- confirm against the
// intrinsics spec.
vfloat32mf2_t __riscv_vfmacc_vv_f32mf2_rm_tu(vfloat32mf2_t vd,
                                             vfloat32mf2_t vs1,
                                             vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmacc_vf_f32mf2_rm_tu(vfloat32mf2_t vd, float rs1,
                                             vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmacc_vv_f32m1_rm_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                                           vfloat32m1_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m1_t __riscv_vfmacc_vf_f32m1_rm_tu(vfloat32m1_t vd, float rs1,
                                           vfloat32m1_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m2_t __riscv_vfmacc_vv_f32m2_rm_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                                           vfloat32m2_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m2_t __riscv_vfmacc_vf_f32m2_rm_tu(vfloat32m2_t vd, float rs1,
                                           vfloat32m2_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m4_t __riscv_vfmacc_vv_f32m4_rm_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                                           vfloat32m4_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m4_t __riscv_vfmacc_vf_f32m4_rm_tu(vfloat32m4_t vd, float rs1,
                                           vfloat32m4_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m8_t __riscv_vfmacc_vv_f32m8_rm_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                                           vfloat32m8_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m8_t __riscv_vfmacc_vf_f32m8_rm_tu(vfloat32m8_t vd, float rs1,
                                           vfloat32m8_t vs2, unsigned int frm,
                                           size_t vl);
// vfmacc, `_rm_tu` variants, f64 element type (f64m1 .. f64m8).
// These take no mask argument and carry an `unsigned int frm` parameter
// before `vl`. Each LMUL has a vector-vector (`_vv`, operand `vs1`) and a
// vector-scalar (`_vf`, operand `double rs1`) form; the return type matches
// `vd`.
// NOTE(review): `frm` is presumably the floating-point rounding-mode
// selector; its accepted values are not shown here -- confirm against the
// intrinsics spec.
vfloat64m1_t __riscv_vfmacc_vv_f64m1_rm_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                                           vfloat64m1_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m1_t __riscv_vfmacc_vf_f64m1_rm_tu(vfloat64m1_t vd, double rs1,
                                           vfloat64m1_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m2_t __riscv_vfmacc_vv_f64m2_rm_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                                           vfloat64m2_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m2_t __riscv_vfmacc_vf_f64m2_rm_tu(vfloat64m2_t vd, double rs1,
                                           vfloat64m2_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m4_t __riscv_vfmacc_vv_f64m4_rm_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                                           vfloat64m4_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m4_t __riscv_vfmacc_vf_f64m4_rm_tu(vfloat64m4_t vd, double rs1,
                                           vfloat64m4_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m8_t __riscv_vfmacc_vv_f64m8_rm_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                                           vfloat64m8_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m8_t __riscv_vfmacc_vf_f64m8_rm_tu(vfloat64m8_t vd, double rs1,
                                           vfloat64m8_t vs2, unsigned int frm,
                                           size_t vl);
// vfnmacc, `_rm_tu` variants, f16 element type (f16mf4 .. f16m8).
// These take no mask argument and carry an `unsigned int frm` parameter
// before `vl`. Each LMUL has a vector-vector (`_vv`, operand `vs1`) and a
// vector-scalar (`_vf`, operand `_Float16 rs1`) form; the return type
// matches `vd`.
// NOTE(review): `frm` is presumably the floating-point rounding-mode
// selector; its accepted values are not shown here -- confirm against the
// intrinsics spec.
vfloat16mf4_t __riscv_vfnmacc_vv_f16mf4_rm_tu(vfloat16mf4_t vd,
                                              vfloat16mf4_t vs1,
                                              vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfnmacc_vf_f16mf4_rm_tu(vfloat16mf4_t vd, _Float16 rs1,
                                              vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmacc_vv_f16mf2_rm_tu(vfloat16mf2_t vd,
                                              vfloat16mf2_t vs1,
                                              vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmacc_vf_f16mf2_rm_tu(vfloat16mf2_t vd, _Float16 rs1,
                                              vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmacc_vv_f16m1_rm_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                                            vfloat16m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m1_t __riscv_vfnmacc_vf_f16m1_rm_tu(vfloat16m1_t vd, _Float16 rs1,
                                            vfloat16m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m2_t __riscv_vfnmacc_vv_f16m2_rm_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                                            vfloat16m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m2_t __riscv_vfnmacc_vf_f16m2_rm_tu(vfloat16m2_t vd, _Float16 rs1,
                                            vfloat16m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m4_t __riscv_vfnmacc_vv_f16m4_rm_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                                            vfloat16m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m4_t __riscv_vfnmacc_vf_f16m4_rm_tu(vfloat16m4_t vd, _Float16 rs1,
                                            vfloat16m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m8_t __riscv_vfnmacc_vv_f16m8_rm_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                                            vfloat16m8_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m8_t __riscv_vfnmacc_vf_f16m8_rm_tu(vfloat16m8_t vd, _Float16 rs1,
                                            vfloat16m8_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32mf2_t __riscv_vfnmacc_vv_f32mf2_rm_tu(vfloat32mf2_t vd,
                                              vfloat32mf2_t vs1,
                                              vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmacc_vf_f32mf2_rm_tu(vfloat32mf2_t vd, float rs1,
                                              vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmacc_vv_f32m1_rm_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                                            vfloat32m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m1_t __riscv_vfnmacc_vf_f32m1_rm_tu(vfloat32m1_t vd, float rs1,
                                            vfloat32m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m2_t __riscv_vfnmacc_vv_f32m2_rm_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                                            vfloat32m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m2_t __riscv_vfnmacc_vf_f32m2_rm_tu(vfloat32m2_t vd, float rs1,
                                            vfloat32m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m4_t __riscv_vfnmacc_vv_f32m4_rm_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                                            vfloat32m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m4_t __riscv_vfnmacc_vf_f32m4_rm_tu(vfloat32m4_t vd, float rs1,
                                            vfloat32m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m8_t __riscv_vfnmacc_vv_f32m8_rm_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                                            vfloat32m8_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m8_t __riscv_vfnmacc_vf_f32m8_rm_tu(vfloat32m8_t vd, float rs1,
                                            vfloat32m8_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m1_t __riscv_vfnmacc_vv_f64m1_rm_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                                            vfloat64m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m1_t __riscv_vfnmacc_vf_f64m1_rm_tu(vfloat64m1_t vd, double rs1,
                                            vfloat64m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m2_t __riscv_vfnmacc_vv_f64m2_rm_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                                            vfloat64m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m2_t __riscv_vfnmacc_vf_f64m2_rm_tu(vfloat64m2_t vd, double rs1,
                                            vfloat64m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m4_t __riscv_vfnmacc_vv_f64m4_rm_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                                            vfloat64m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m4_t __riscv_vfnmacc_vf_f64m4_rm_tu(vfloat64m4_t vd, double rs1,
                                            vfloat64m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m8_t __riscv_vfnmacc_vv_f64m8_rm_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                                            vfloat64m8_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m8_t __riscv_vfnmacc_vf_f64m8_rm_tu(vfloat64m8_t vd, double rs1,
                                            vfloat64m8_t vs2, unsigned int frm,
                                            size_t vl);
/*
 * __riscv_vfmsac_{vv,vf}_<type>_rm_tu prototypes.
 *
 * For every element-type/LMUL suffix listed here (f16: mf4..m8,
 * f32: mf2..m8, f64: m1..m8) there is a `_vv` form whose second operand is
 * a vector (`vs1`) and a `_vf` form whose second operand is a scalar (`rs1`)
 * of the matching C type (_Float16, float or double).  Every form also takes
 * `vd` and `vs2` vectors, an `unsigned int frm` and a `size_t vl`, and
 * returns a vector of the same type as `vd`.
 *
 * NOTE(review): going by the RVV naming convention, `_rm` presumably marks
 * the explicit rounding-mode (`frm`) argument, `_tu` the tail-undisturbed
 * policy, and the operation is presumably vd = (vs1 * vs2) - vd.  None of
 * this is established by the prototypes themselves -- confirm against the
 * RVV and intrinsics specifications.
 */
vfloat16mf4_t __riscv_vfmsac_vv_f16mf4_rm_tu(vfloat16mf4_t vd,
                                             vfloat16mf4_t vs1,
                                             vfloat16mf4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmsac_vf_f16mf4_rm_tu(vfloat16mf4_t vd, _Float16 rs1,
                                             vfloat16mf4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmsac_vv_f16mf2_rm_tu(vfloat16mf2_t vd,
                                             vfloat16mf2_t vs1,
                                             vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmsac_vf_f16mf2_rm_tu(vfloat16mf2_t vd, _Float16 rs1,
                                             vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmsac_vv_f16m1_rm_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                                           vfloat16m1_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m1_t __riscv_vfmsac_vf_f16m1_rm_tu(vfloat16m1_t vd, _Float16 rs1,
                                           vfloat16m1_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m2_t __riscv_vfmsac_vv_f16m2_rm_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                                           vfloat16m2_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m2_t __riscv_vfmsac_vf_f16m2_rm_tu(vfloat16m2_t vd, _Float16 rs1,
                                           vfloat16m2_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m4_t __riscv_vfmsac_vv_f16m4_rm_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                                           vfloat16m4_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m4_t __riscv_vfmsac_vf_f16m4_rm_tu(vfloat16m4_t vd, _Float16 rs1,
                                           vfloat16m4_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m8_t __riscv_vfmsac_vv_f16m8_rm_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                                           vfloat16m8_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m8_t __riscv_vfmsac_vf_f16m8_rm_tu(vfloat16m8_t vd, _Float16 rs1,
                                           vfloat16m8_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32mf2_t __riscv_vfmsac_vv_f32mf2_rm_tu(vfloat32mf2_t vd,
                                             vfloat32mf2_t vs1,
                                             vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmsac_vf_f32mf2_rm_tu(vfloat32mf2_t vd, float rs1,
                                             vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmsac_vv_f32m1_rm_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                                           vfloat32m1_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m1_t __riscv_vfmsac_vf_f32m1_rm_tu(vfloat32m1_t vd, float rs1,
                                           vfloat32m1_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m2_t __riscv_vfmsac_vv_f32m2_rm_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                                           vfloat32m2_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m2_t __riscv_vfmsac_vf_f32m2_rm_tu(vfloat32m2_t vd, float rs1,
                                           vfloat32m2_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m4_t __riscv_vfmsac_vv_f32m4_rm_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                                           vfloat32m4_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m4_t __riscv_vfmsac_vf_f32m4_rm_tu(vfloat32m4_t vd, float rs1,
                                           vfloat32m4_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m8_t __riscv_vfmsac_vv_f32m8_rm_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                                           vfloat32m8_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m8_t __riscv_vfmsac_vf_f32m8_rm_tu(vfloat32m8_t vd, float rs1,
                                           vfloat32m8_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m1_t __riscv_vfmsac_vv_f64m1_rm_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                                           vfloat64m1_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m1_t __riscv_vfmsac_vf_f64m1_rm_tu(vfloat64m1_t vd, double rs1,
                                           vfloat64m1_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m2_t __riscv_vfmsac_vv_f64m2_rm_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                                           vfloat64m2_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m2_t __riscv_vfmsac_vf_f64m2_rm_tu(vfloat64m2_t vd, double rs1,
                                           vfloat64m2_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m4_t __riscv_vfmsac_vv_f64m4_rm_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                                           vfloat64m4_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m4_t __riscv_vfmsac_vf_f64m4_rm_tu(vfloat64m4_t vd, double rs1,
                                           vfloat64m4_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m8_t __riscv_vfmsac_vv_f64m8_rm_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                                           vfloat64m8_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m8_t __riscv_vfmsac_vf_f64m8_rm_tu(vfloat64m8_t vd, double rs1,
                                           vfloat64m8_t vs2, unsigned int frm,
                                           size_t vl);
/*
 * __riscv_vfnmsac_{vv,vf}_<type>_rm_tu prototypes.
 *
 * For every element-type/LMUL suffix listed here (f16: mf4..m8,
 * f32: mf2..m8, f64: m1..m8) there is a `_vv` form whose second operand is
 * a vector (`vs1`) and a `_vf` form whose second operand is a scalar (`rs1`)
 * of the matching C type (_Float16, float or double).  Every form also takes
 * `vd` and `vs2` vectors, an `unsigned int frm` and a `size_t vl`, and
 * returns a vector of the same type as `vd`.
 *
 * NOTE(review): going by the RVV naming convention, `_rm` presumably marks
 * the explicit rounding-mode (`frm`) argument, `_tu` the tail-undisturbed
 * policy, and the operation is presumably vd = -(vs1 * vs2) + vd.  None of
 * this is established by the prototypes themselves -- confirm against the
 * RVV and intrinsics specifications.
 */
vfloat16mf4_t __riscv_vfnmsac_vv_f16mf4_rm_tu(vfloat16mf4_t vd,
                                              vfloat16mf4_t vs1,
                                              vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfnmsac_vf_f16mf4_rm_tu(vfloat16mf4_t vd, _Float16 rs1,
                                              vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmsac_vv_f16mf2_rm_tu(vfloat16mf2_t vd,
                                              vfloat16mf2_t vs1,
                                              vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmsac_vf_f16mf2_rm_tu(vfloat16mf2_t vd, _Float16 rs1,
                                              vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmsac_vv_f16m1_rm_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                                            vfloat16m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m1_t __riscv_vfnmsac_vf_f16m1_rm_tu(vfloat16m1_t vd, _Float16 rs1,
                                            vfloat16m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m2_t __riscv_vfnmsac_vv_f16m2_rm_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                                            vfloat16m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m2_t __riscv_vfnmsac_vf_f16m2_rm_tu(vfloat16m2_t vd, _Float16 rs1,
                                            vfloat16m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m4_t __riscv_vfnmsac_vv_f16m4_rm_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                                            vfloat16m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m4_t __riscv_vfnmsac_vf_f16m4_rm_tu(vfloat16m4_t vd, _Float16 rs1,
                                            vfloat16m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m8_t __riscv_vfnmsac_vv_f16m8_rm_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                                            vfloat16m8_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m8_t __riscv_vfnmsac_vf_f16m8_rm_tu(vfloat16m8_t vd, _Float16 rs1,
                                            vfloat16m8_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32mf2_t __riscv_vfnmsac_vv_f32mf2_rm_tu(vfloat32mf2_t vd,
                                              vfloat32mf2_t vs1,
                                              vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmsac_vf_f32mf2_rm_tu(vfloat32mf2_t vd, float rs1,
                                              vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmsac_vv_f32m1_rm_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                                            vfloat32m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m1_t __riscv_vfnmsac_vf_f32m1_rm_tu(vfloat32m1_t vd, float rs1,
                                            vfloat32m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m2_t __riscv_vfnmsac_vv_f32m2_rm_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                                            vfloat32m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m2_t __riscv_vfnmsac_vf_f32m2_rm_tu(vfloat32m2_t vd, float rs1,
                                            vfloat32m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m4_t __riscv_vfnmsac_vv_f32m4_rm_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                                            vfloat32m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m4_t __riscv_vfnmsac_vf_f32m4_rm_tu(vfloat32m4_t vd, float rs1,
                                            vfloat32m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m8_t __riscv_vfnmsac_vv_f32m8_rm_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                                            vfloat32m8_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m8_t __riscv_vfnmsac_vf_f32m8_rm_tu(vfloat32m8_t vd, float rs1,
                                            vfloat32m8_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m1_t __riscv_vfnmsac_vv_f64m1_rm_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                                            vfloat64m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m1_t __riscv_vfnmsac_vf_f64m1_rm_tu(vfloat64m1_t vd, double rs1,
                                            vfloat64m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m2_t __riscv_vfnmsac_vv_f64m2_rm_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                                            vfloat64m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m2_t __riscv_vfnmsac_vf_f64m2_rm_tu(vfloat64m2_t vd, double rs1,
                                            vfloat64m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m4_t __riscv_vfnmsac_vv_f64m4_rm_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                                            vfloat64m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m4_t __riscv_vfnmsac_vf_f64m4_rm_tu(vfloat64m4_t vd, double rs1,
                                            vfloat64m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m8_t __riscv_vfnmsac_vv_f64m8_rm_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                                            vfloat64m8_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m8_t __riscv_vfnmsac_vf_f64m8_rm_tu(vfloat64m8_t vd, double rs1,
                                            vfloat64m8_t vs2, unsigned int frm,
                                            size_t vl);
/*
 * __riscv_vfmadd_{vv,vf}_<type>_rm_tu prototypes.
 *
 * For every element-type/LMUL suffix listed here (f16: mf4..m8,
 * f32: mf2..m8, f64: m1..m8) there is a `_vv` form whose second operand is
 * a vector (`vs1`) and a `_vf` form whose second operand is a scalar (`rs1`)
 * of the matching C type (_Float16, float or double).  Every form also takes
 * `vd` and `vs2` vectors, an `unsigned int frm` and a `size_t vl`, and
 * returns a vector of the same type as `vd`.
 *
 * NOTE(review): going by the RVV naming convention, `_rm` presumably marks
 * the explicit rounding-mode (`frm`) argument, `_tu` the tail-undisturbed
 * policy, and the operation is presumably vd = (vs1 * vd) + vs2.  None of
 * this is established by the prototypes themselves -- confirm against the
 * RVV and intrinsics specifications.
 */
vfloat16mf4_t __riscv_vfmadd_vv_f16mf4_rm_tu(vfloat16mf4_t vd,
                                             vfloat16mf4_t vs1,
                                             vfloat16mf4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmadd_vf_f16mf4_rm_tu(vfloat16mf4_t vd, _Float16 rs1,
                                             vfloat16mf4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmadd_vv_f16mf2_rm_tu(vfloat16mf2_t vd,
                                             vfloat16mf2_t vs1,
                                             vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmadd_vf_f16mf2_rm_tu(vfloat16mf2_t vd, _Float16 rs1,
                                             vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmadd_vv_f16m1_rm_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                                           vfloat16m1_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m1_t __riscv_vfmadd_vf_f16m1_rm_tu(vfloat16m1_t vd, _Float16 rs1,
                                           vfloat16m1_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m2_t __riscv_vfmadd_vv_f16m2_rm_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                                           vfloat16m2_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m2_t __riscv_vfmadd_vf_f16m2_rm_tu(vfloat16m2_t vd, _Float16 rs1,
                                           vfloat16m2_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m4_t __riscv_vfmadd_vv_f16m4_rm_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                                           vfloat16m4_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m4_t __riscv_vfmadd_vf_f16m4_rm_tu(vfloat16m4_t vd, _Float16 rs1,
                                           vfloat16m4_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m8_t __riscv_vfmadd_vv_f16m8_rm_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                                           vfloat16m8_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m8_t __riscv_vfmadd_vf_f16m8_rm_tu(vfloat16m8_t vd, _Float16 rs1,
                                           vfloat16m8_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32mf2_t __riscv_vfmadd_vv_f32mf2_rm_tu(vfloat32mf2_t vd,
                                             vfloat32mf2_t vs1,
                                             vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmadd_vf_f32mf2_rm_tu(vfloat32mf2_t vd, float rs1,
                                             vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmadd_vv_f32m1_rm_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                                           vfloat32m1_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m1_t __riscv_vfmadd_vf_f32m1_rm_tu(vfloat32m1_t vd, float rs1,
                                           vfloat32m1_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m2_t __riscv_vfmadd_vv_f32m2_rm_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                                           vfloat32m2_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m2_t __riscv_vfmadd_vf_f32m2_rm_tu(vfloat32m2_t vd, float rs1,
                                           vfloat32m2_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m4_t __riscv_vfmadd_vv_f32m4_rm_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                                           vfloat32m4_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m4_t __riscv_vfmadd_vf_f32m4_rm_tu(vfloat32m4_t vd, float rs1,
                                           vfloat32m4_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m8_t __riscv_vfmadd_vv_f32m8_rm_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                                           vfloat32m8_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m8_t __riscv_vfmadd_vf_f32m8_rm_tu(vfloat32m8_t vd, float rs1,
                                           vfloat32m8_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m1_t __riscv_vfmadd_vv_f64m1_rm_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                                           vfloat64m1_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m1_t __riscv_vfmadd_vf_f64m1_rm_tu(vfloat64m1_t vd, double rs1,
                                           vfloat64m1_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m2_t __riscv_vfmadd_vv_f64m2_rm_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                                           vfloat64m2_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m2_t __riscv_vfmadd_vf_f64m2_rm_tu(vfloat64m2_t vd, double rs1,
                                           vfloat64m2_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m4_t __riscv_vfmadd_vv_f64m4_rm_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                                           vfloat64m4_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m4_t __riscv_vfmadd_vf_f64m4_rm_tu(vfloat64m4_t vd, double rs1,
                                           vfloat64m4_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m8_t __riscv_vfmadd_vv_f64m8_rm_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                                           vfloat64m8_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m8_t __riscv_vfmadd_vf_f64m8_rm_tu(vfloat64m8_t vd, double rs1,
                                           vfloat64m8_t vs2, unsigned int frm,
                                           size_t vl);
/*
 * __riscv_vfnmadd_{vv,vf}_<type>_rm_tu prototypes.
 *
 * For every element-type/LMUL suffix listed here (f16: mf4..m8,
 * f32: mf2..m8, f64: m1..m8) there is a `_vv` form whose second operand is
 * a vector (`vs1`) and a `_vf` form whose second operand is a scalar (`rs1`)
 * of the matching C type (_Float16, float or double).  Every form also takes
 * `vd` and `vs2` vectors, an `unsigned int frm` and a `size_t vl`, and
 * returns a vector of the same type as `vd`.
 *
 * NOTE(review): going by the RVV naming convention, `_rm` presumably marks
 * the explicit rounding-mode (`frm`) argument, `_tu` the tail-undisturbed
 * policy, and the operation is presumably vd = -(vs1 * vd) - vs2.  None of
 * this is established by the prototypes themselves -- confirm against the
 * RVV and intrinsics specifications.
 */
vfloat16mf4_t __riscv_vfnmadd_vv_f16mf4_rm_tu(vfloat16mf4_t vd,
                                              vfloat16mf4_t vs1,
                                              vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfnmadd_vf_f16mf4_rm_tu(vfloat16mf4_t vd, _Float16 rs1,
                                              vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmadd_vv_f16mf2_rm_tu(vfloat16mf2_t vd,
                                              vfloat16mf2_t vs1,
                                              vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmadd_vf_f16mf2_rm_tu(vfloat16mf2_t vd, _Float16 rs1,
                                              vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmadd_vv_f16m1_rm_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                                            vfloat16m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m1_t __riscv_vfnmadd_vf_f16m1_rm_tu(vfloat16m1_t vd, _Float16 rs1,
                                            vfloat16m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m2_t __riscv_vfnmadd_vv_f16m2_rm_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                                            vfloat16m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m2_t __riscv_vfnmadd_vf_f16m2_rm_tu(vfloat16m2_t vd, _Float16 rs1,
                                            vfloat16m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m4_t __riscv_vfnmadd_vv_f16m4_rm_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                                            vfloat16m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m4_t __riscv_vfnmadd_vf_f16m4_rm_tu(vfloat16m4_t vd, _Float16 rs1,
                                            vfloat16m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m8_t __riscv_vfnmadd_vv_f16m8_rm_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                                            vfloat16m8_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m8_t __riscv_vfnmadd_vf_f16m8_rm_tu(vfloat16m8_t vd, _Float16 rs1,
                                            vfloat16m8_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32mf2_t __riscv_vfnmadd_vv_f32mf2_rm_tu(vfloat32mf2_t vd,
                                              vfloat32mf2_t vs1,
                                              vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmadd_vf_f32mf2_rm_tu(vfloat32mf2_t vd, float rs1,
                                              vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmadd_vv_f32m1_rm_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                                            vfloat32m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m1_t __riscv_vfnmadd_vf_f32m1_rm_tu(vfloat32m1_t vd, float rs1,
                                            vfloat32m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m2_t __riscv_vfnmadd_vv_f32m2_rm_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                                            vfloat32m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m2_t __riscv_vfnmadd_vf_f32m2_rm_tu(vfloat32m2_t vd, float rs1,
                                            vfloat32m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m4_t __riscv_vfnmadd_vv_f32m4_rm_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                                            vfloat32m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m4_t __riscv_vfnmadd_vf_f32m4_rm_tu(vfloat32m4_t vd, float rs1,
                                            vfloat32m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m8_t __riscv_vfnmadd_vv_f32m8_rm_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                                            vfloat32m8_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m8_t __riscv_vfnmadd_vf_f32m8_rm_tu(vfloat32m8_t vd, float rs1,
                                            vfloat32m8_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m1_t __riscv_vfnmadd_vv_f64m1_rm_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                                            vfloat64m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m1_t __riscv_vfnmadd_vf_f64m1_rm_tu(vfloat64m1_t vd, double rs1,
                                            vfloat64m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m2_t __riscv_vfnmadd_vv_f64m2_rm_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                                            vfloat64m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m2_t __riscv_vfnmadd_vf_f64m2_rm_tu(vfloat64m2_t vd, double rs1,
                                            vfloat64m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m4_t __riscv_vfnmadd_vv_f64m4_rm_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                                            vfloat64m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m4_t __riscv_vfnmadd_vf_f64m4_rm_tu(vfloat64m4_t vd, double rs1,
                                            vfloat64m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m8_t __riscv_vfnmadd_vv_f64m8_rm_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                                            vfloat64m8_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m8_t __riscv_vfnmadd_vf_f64m8_rm_tu(vfloat64m8_t vd, double rs1,
                                            vfloat64m8_t vs2, unsigned int frm,
                                            size_t vl);
/*
 * __riscv_vfmsub_{vv,vf}_<type>_rm_tu prototypes.
 *
 * For each element-type/LMUL suffix there is a `_vv` form whose second
 * operand is a vector (`vs1`) and a `_vf` form whose second operand is a
 * scalar (`rs1`) of the matching C type (_Float16 for f16, float for f32).
 * Every form also takes `vd` and `vs2` vectors, an `unsigned int frm` and a
 * `size_t vl`, and returns a vector of the same type as `vd`.
 *
 * NOTE(review): going by the RVV naming convention, `_rm` presumably marks
 * the explicit rounding-mode (`frm`) argument, `_tu` the tail-undisturbed
 * policy, and the operation is presumably vd = (vs1 * vd) - vs2.  None of
 * this is established by the prototypes themselves -- confirm against the
 * RVV and intrinsics specifications.
 */
vfloat16mf4_t __riscv_vfmsub_vv_f16mf4_rm_tu(vfloat16mf4_t vd,
                                             vfloat16mf4_t vs1,
                                             vfloat16mf4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmsub_vf_f16mf4_rm_tu(vfloat16mf4_t vd, _Float16 rs1,
                                             vfloat16mf4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmsub_vv_f16mf2_rm_tu(vfloat16mf2_t vd,
                                             vfloat16mf2_t vs1,
                                             vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmsub_vf_f16mf2_rm_tu(vfloat16mf2_t vd, _Float16 rs1,
                                             vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmsub_vv_f16m1_rm_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                                           vfloat16m1_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m1_t __riscv_vfmsub_vf_f16m1_rm_tu(vfloat16m1_t vd, _Float16 rs1,
                                           vfloat16m1_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m2_t __riscv_vfmsub_vv_f16m2_rm_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                                           vfloat16m2_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m2_t __riscv_vfmsub_vf_f16m2_rm_tu(vfloat16m2_t vd, _Float16 rs1,
                                           vfloat16m2_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m4_t __riscv_vfmsub_vv_f16m4_rm_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                                           vfloat16m4_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m4_t __riscv_vfmsub_vf_f16m4_rm_tu(vfloat16m4_t vd, _Float16 rs1,
                                           vfloat16m4_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m8_t __riscv_vfmsub_vv_f16m8_rm_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                                           vfloat16m8_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m8_t __riscv_vfmsub_vf_f16m8_rm_tu(vfloat16m8_t vd, _Float16 rs1,
                                           vfloat16m8_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32mf2_t __riscv_vfmsub_vv_f32mf2_rm_tu(vfloat32mf2_t vd,
                                             vfloat32mf2_t vs1,
                                             vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmsub_vf_f32mf2_rm_tu(vfloat32mf2_t vd, float rs1,
                                             vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmsub_vv_f32m1_rm_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                                           vfloat32m1_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m1_t __riscv_vfmsub_vf_f32m1_rm_tu(vfloat32m1_t vd, float rs1,
                                           vfloat32m1_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m2_t __riscv_vfmsub_vv_f32m2_rm_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                                           vfloat32m2_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m2_t __riscv_vfmsub_vf_f32m2_rm_tu(vfloat32m2_t vd, float rs1,
                                           vfloat32m2_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m4_t __riscv_vfmsub_vv_f32m4_rm_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                                           vfloat32m4_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m4_t __riscv_vfmsub_vf_f32m4_rm_tu(vfloat32m4_t vd, float rs1,
                                           vfloat32m4_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m8_t __riscv_vfmsub_vv_f32m8_rm_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                                           vfloat32m8_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m8_t __riscv_vfmsub_vf_f32m8_rm_tu(vfloat32m8_t vd, float rs1,
                                           vfloat32m8_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m1_t __riscv_vfmsub_vv_f64m1_rm_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                                           vfloat64m1_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m1_t __riscv_vfmsub_vf_f64m1_rm_tu(vfloat64m1_t vd, double rs1,
                                           vfloat64m1_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m2_t __riscv_vfmsub_vv_f64m2_rm_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                                           vfloat64m2_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m2_t __riscv_vfmsub_vf_f64m2_rm_tu(vfloat64m2_t vd, double rs1,
                                           vfloat64m2_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m4_t __riscv_vfmsub_vv_f64m4_rm_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                                           vfloat64m4_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m4_t __riscv_vfmsub_vf_f64m4_rm_tu(vfloat64m4_t vd, double rs1,
                                           vfloat64m4_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m8_t __riscv_vfmsub_vv_f64m8_rm_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                                           vfloat64m8_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m8_t __riscv_vfmsub_vf_f64m8_rm_tu(vfloat64m8_t vd, double rs1,
                                           vfloat64m8_t vs2, unsigned int frm,
                                           size_t vl);
// __riscv_vfnmsub_{vv,vf}_<type>_rm_tu: vfnmsub prototypes with an explicit
// `frm` argument and no mask operand. Each vector type listed below gets a
// vector-vector (_vv) form and a vector-scalar (_vf) form.
//   vd  - vector operand; its type is also the return type
//   vs1 - vector operand of the same type as vd (_vv forms only)
//   rs1 - scalar operand (_vf forms only): _Float16, float or double,
//         matching the element width in the intrinsic name
//   vs2 - vector operand of the same type as vd
//   frm - unsigned int; presumably the rounding mode implied by `_rm`
//         -- TODO confirm against the intrinsics specification
//   vl  - size_t; presumably the number of elements to process -- TODO confirm
// NOTE(review): `_tu` presumably denotes the tail-undisturbed policy variant;
// confirm against the intrinsics naming scheme.
// NOTE(review): the V extension defines vfnmsub as
// vd[i] = -(vs1[i] * vd[i]) + vs2[i]; confirm the operand roles here match.

// f16 forms: scalar operand is _Float16.
vfloat16mf4_t __riscv_vfnmsub_vv_f16mf4_rm_tu(vfloat16mf4_t vd,
                                              vfloat16mf4_t vs1,
                                              vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfnmsub_vf_f16mf4_rm_tu(vfloat16mf4_t vd, _Float16 rs1,
                                              vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmsub_vv_f16mf2_rm_tu(vfloat16mf2_t vd,
                                              vfloat16mf2_t vs1,
                                              vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmsub_vf_f16mf2_rm_tu(vfloat16mf2_t vd, _Float16 rs1,
                                              vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmsub_vv_f16m1_rm_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                                            vfloat16m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m1_t __riscv_vfnmsub_vf_f16m1_rm_tu(vfloat16m1_t vd, _Float16 rs1,
                                            vfloat16m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m2_t __riscv_vfnmsub_vv_f16m2_rm_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                                            vfloat16m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m2_t __riscv_vfnmsub_vf_f16m2_rm_tu(vfloat16m2_t vd, _Float16 rs1,
                                            vfloat16m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m4_t __riscv_vfnmsub_vv_f16m4_rm_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                                            vfloat16m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m4_t __riscv_vfnmsub_vf_f16m4_rm_tu(vfloat16m4_t vd, _Float16 rs1,
                                            vfloat16m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m8_t __riscv_vfnmsub_vv_f16m8_rm_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                                            vfloat16m8_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m8_t __riscv_vfnmsub_vf_f16m8_rm_tu(vfloat16m8_t vd, _Float16 rs1,
                                            vfloat16m8_t vs2, unsigned int frm,
                                            size_t vl);
// f32 forms: scalar operand is float.
vfloat32mf2_t __riscv_vfnmsub_vv_f32mf2_rm_tu(vfloat32mf2_t vd,
                                              vfloat32mf2_t vs1,
                                              vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmsub_vf_f32mf2_rm_tu(vfloat32mf2_t vd, float rs1,
                                              vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmsub_vv_f32m1_rm_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                                            vfloat32m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m1_t __riscv_vfnmsub_vf_f32m1_rm_tu(vfloat32m1_t vd, float rs1,
                                            vfloat32m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m2_t __riscv_vfnmsub_vv_f32m2_rm_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                                            vfloat32m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m2_t __riscv_vfnmsub_vf_f32m2_rm_tu(vfloat32m2_t vd, float rs1,
                                            vfloat32m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m4_t __riscv_vfnmsub_vv_f32m4_rm_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                                            vfloat32m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m4_t __riscv_vfnmsub_vf_f32m4_rm_tu(vfloat32m4_t vd, float rs1,
                                            vfloat32m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m8_t __riscv_vfnmsub_vv_f32m8_rm_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                                            vfloat32m8_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m8_t __riscv_vfnmsub_vf_f32m8_rm_tu(vfloat32m8_t vd, float rs1,
                                            vfloat32m8_t vs2, unsigned int frm,
                                            size_t vl);
// f64 forms: scalar operand is double.
vfloat64m1_t __riscv_vfnmsub_vv_f64m1_rm_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                                            vfloat64m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m1_t __riscv_vfnmsub_vf_f64m1_rm_tu(vfloat64m1_t vd, double rs1,
                                            vfloat64m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m2_t __riscv_vfnmsub_vv_f64m2_rm_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                                            vfloat64m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m2_t __riscv_vfnmsub_vf_f64m2_rm_tu(vfloat64m2_t vd, double rs1,
                                            vfloat64m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m4_t __riscv_vfnmsub_vv_f64m4_rm_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                                            vfloat64m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m4_t __riscv_vfnmsub_vf_f64m4_rm_tu(vfloat64m4_t vd, double rs1,
                                            vfloat64m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m8_t __riscv_vfnmsub_vv_f64m8_rm_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                                            vfloat64m8_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m8_t __riscv_vfnmsub_vf_f64m8_rm_tu(vfloat64m8_t vd, double rs1,
                                            vfloat64m8_t vs2, unsigned int frm,
                                            size_t vl);
// masked functions
// __riscv_vfmacc_{vv,vf}_<type>_rm_tum: vfmacc prototypes that take a leading
// mask operand and an explicit `frm` argument. Each vector type listed below
// gets a vector-vector (_vv) form and a vector-scalar (_vf) form.
//   vm  - mask operand; its vboolN_t type varies with the vector type
//         (e.g. vbool64_t with vfloat16mf4_t, vbool2_t with vfloat16m8_t)
//   vd  - vector operand; its type is also the return type
//   vs1 - vector operand of the same type as vd (_vv forms only)
//   rs1 - scalar operand (_vf forms only): _Float16, float or double,
//         matching the element width in the intrinsic name
//   vs2 - vector operand of the same type as vd
//   frm - unsigned int; presumably the rounding mode implied by `_rm`
//         -- TODO confirm against the intrinsics specification
//   vl  - size_t; presumably the number of elements to process -- TODO confirm
// NOTE(review): `_tum` presumably denotes the tail-undisturbed, mask-agnostic
// policy variant; confirm against the intrinsics naming scheme.
// NOTE(review): the V extension defines vfmacc as
// vd[i] = (vs1[i] * vs2[i]) + vd[i]; confirm the operand roles here match.

// f16 forms: scalar operand is _Float16.
vfloat16mf4_t __riscv_vfmacc_vv_f16mf4_rm_tum(vbool64_t vm, vfloat16mf4_t vd,
                                              vfloat16mf4_t vs1,
                                              vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmacc_vf_f16mf4_rm_tum(vbool64_t vm, vfloat16mf4_t vd,
                                              _Float16 rs1, vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmacc_vv_f16mf2_rm_tum(vbool32_t vm, vfloat16mf2_t vd,
                                              vfloat16mf2_t vs1,
                                              vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmacc_vf_f16mf2_rm_tum(vbool32_t vm, vfloat16mf2_t vd,
                                              _Float16 rs1, vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmacc_vv_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                            vfloat16m1_t vs1, vfloat16m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmacc_vf_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                            _Float16 rs1, vfloat16m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmacc_vv_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                            vfloat16m2_t vs1, vfloat16m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmacc_vf_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                            _Float16 rs1, vfloat16m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmacc_vv_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                            vfloat16m4_t vs1, vfloat16m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmacc_vf_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                            _Float16 rs1, vfloat16m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmacc_vv_f16m8_rm_tum(vbool2_t vm, vfloat16m8_t vd,
                                            vfloat16m8_t vs1, vfloat16m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmacc_vf_f16m8_rm_tum(vbool2_t vm, vfloat16m8_t vd,
                                            _Float16 rs1, vfloat16m8_t vs2,
                                            unsigned int frm, size_t vl);
// f32 forms: scalar operand is float.
vfloat32mf2_t __riscv_vfmacc_vv_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat32mf2_t vs1,
                                              vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmacc_vf_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                              float rs1, vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmacc_vv_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat32m1_t vs1, vfloat32m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmacc_vf_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                            float rs1, vfloat32m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmacc_vv_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat32m2_t vs1, vfloat32m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmacc_vf_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                            float rs1, vfloat32m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmacc_vv_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat32m4_t vs1, vfloat32m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmacc_vf_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                            float rs1, vfloat32m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmacc_vv_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat32m8_t vs1, vfloat32m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmacc_vf_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                            float rs1, vfloat32m8_t vs2,
                                            unsigned int frm, size_t vl);
// f64 forms: scalar operand is double.
vfloat64m1_t __riscv_vfmacc_vv_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat64m1_t vs1, vfloat64m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmacc_vf_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                            double rs1, vfloat64m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmacc_vv_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat64m2_t vs1, vfloat64m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmacc_vf_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                            double rs1, vfloat64m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmacc_vv_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat64m4_t vs1, vfloat64m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmacc_vf_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                            double rs1, vfloat64m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmacc_vv_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat64m8_t vs1, vfloat64m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmacc_vf_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                            double rs1, vfloat64m8_t vs2,
                                            unsigned int frm, size_t vl);
// __riscv_vfnmacc_{vv,vf}_<type>_rm_tum: vfnmacc prototypes that take a
// leading mask operand and an explicit `frm` argument. Each vector type listed
// below gets a vector-vector (_vv) form and a vector-scalar (_vf) form.
//   vm  - mask operand; its vboolN_t type varies with the vector type
//         (e.g. vbool64_t with vfloat16mf4_t, vbool2_t with vfloat16m8_t)
//   vd  - vector operand; its type is also the return type
//   vs1 - vector operand of the same type as vd (_vv forms only)
//   rs1 - scalar operand (_vf forms only): _Float16, float or double,
//         matching the element width in the intrinsic name
//   vs2 - vector operand of the same type as vd
//   frm - unsigned int; presumably the rounding mode implied by `_rm`
//         -- TODO confirm against the intrinsics specification
//   vl  - size_t; presumably the number of elements to process -- TODO confirm
// NOTE(review): `_tum` presumably denotes the tail-undisturbed, mask-agnostic
// policy variant; confirm against the intrinsics naming scheme.
// NOTE(review): the V extension defines vfnmacc as
// vd[i] = -(vs1[i] * vs2[i]) - vd[i]; confirm the operand roles here match.

// f16 forms: scalar operand is _Float16.
vfloat16mf4_t __riscv_vfnmacc_vv_f16mf4_rm_tum(vbool64_t vm, vfloat16mf4_t vd,
                                               vfloat16mf4_t vs1,
                                               vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfnmacc_vf_f16mf4_rm_tum(vbool64_t vm, vfloat16mf4_t vd,
                                               _Float16 rs1, vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmacc_vv_f16mf2_rm_tum(vbool32_t vm, vfloat16mf2_t vd,
                                               vfloat16mf2_t vs1,
                                               vfloat16mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmacc_vf_f16mf2_rm_tum(vbool32_t vm, vfloat16mf2_t vd,
                                               _Float16 rs1, vfloat16mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmacc_vv_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                             vfloat16m1_t vs1, vfloat16m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmacc_vf_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                             _Float16 rs1, vfloat16m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmacc_vv_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                             vfloat16m2_t vs1, vfloat16m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmacc_vf_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                             _Float16 rs1, vfloat16m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmacc_vv_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                             vfloat16m4_t vs1, vfloat16m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmacc_vf_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                             _Float16 rs1, vfloat16m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmacc_vv_f16m8_rm_tum(vbool2_t vm, vfloat16m8_t vd,
                                             vfloat16m8_t vs1, vfloat16m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmacc_vf_f16m8_rm_tum(vbool2_t vm, vfloat16m8_t vd,
                                             _Float16 rs1, vfloat16m8_t vs2,
                                             unsigned int frm, size_t vl);
// f32 forms: scalar operand is float.
vfloat32mf2_t __riscv_vfnmacc_vv_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                               vfloat32mf2_t vs1,
                                               vfloat32mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmacc_vf_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                               float rs1, vfloat32mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmacc_vv_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                             vfloat32m1_t vs1, vfloat32m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmacc_vf_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                             float rs1, vfloat32m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmacc_vv_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                             vfloat32m2_t vs1, vfloat32m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmacc_vf_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                             float rs1, vfloat32m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmacc_vv_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                             vfloat32m4_t vs1, vfloat32m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmacc_vf_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                             float rs1, vfloat32m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmacc_vv_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                             vfloat32m8_t vs1, vfloat32m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmacc_vf_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                             float rs1, vfloat32m8_t vs2,
                                             unsigned int frm, size_t vl);
// f64 forms: scalar operand is double.
vfloat64m1_t __riscv_vfnmacc_vv_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                             vfloat64m1_t vs1, vfloat64m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmacc_vf_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                             double rs1, vfloat64m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmacc_vv_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                             vfloat64m2_t vs1, vfloat64m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmacc_vf_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                             double rs1, vfloat64m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmacc_vv_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                             vfloat64m4_t vs1, vfloat64m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmacc_vf_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                             double rs1, vfloat64m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmacc_vv_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                             vfloat64m8_t vs1, vfloat64m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmacc_vf_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                             double rs1, vfloat64m8_t vs2,
                                             unsigned int frm, size_t vl);
// __riscv_vfmsac_{vv,vf}_<type>_rm_tum: vfmsac prototypes that take a leading
// mask operand and an explicit `frm` argument. Each vector type listed below
// gets a vector-vector (_vv) form and a vector-scalar (_vf) form.
//   vm  - mask operand; its vboolN_t type varies with the vector type
//         (e.g. vbool64_t with vfloat16mf4_t, vbool2_t with vfloat16m8_t)
//   vd  - vector operand; its type is also the return type
//   vs1 - vector operand of the same type as vd (_vv forms only)
//   rs1 - scalar operand (_vf forms only): _Float16, float or double,
//         matching the element width in the intrinsic name
//   vs2 - vector operand of the same type as vd
//   frm - unsigned int; presumably the rounding mode implied by `_rm`
//         -- TODO confirm against the intrinsics specification
//   vl  - size_t; presumably the number of elements to process -- TODO confirm
// NOTE(review): `_tum` presumably denotes the tail-undisturbed, mask-agnostic
// policy variant; confirm against the intrinsics naming scheme.
// NOTE(review): the V extension defines vfmsac as
// vd[i] = (vs1[i] * vs2[i]) - vd[i]; confirm the operand roles here match.

// f16 forms: scalar operand is _Float16.
vfloat16mf4_t __riscv_vfmsac_vv_f16mf4_rm_tum(vbool64_t vm, vfloat16mf4_t vd,
                                              vfloat16mf4_t vs1,
                                              vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmsac_vf_f16mf4_rm_tum(vbool64_t vm, vfloat16mf4_t vd,
                                              _Float16 rs1, vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmsac_vv_f16mf2_rm_tum(vbool32_t vm, vfloat16mf2_t vd,
                                              vfloat16mf2_t vs1,
                                              vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmsac_vf_f16mf2_rm_tum(vbool32_t vm, vfloat16mf2_t vd,
                                              _Float16 rs1, vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmsac_vv_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                            vfloat16m1_t vs1, vfloat16m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmsac_vf_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                            _Float16 rs1, vfloat16m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmsac_vv_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                            vfloat16m2_t vs1, vfloat16m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmsac_vf_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                            _Float16 rs1, vfloat16m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmsac_vv_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                            vfloat16m4_t vs1, vfloat16m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmsac_vf_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                            _Float16 rs1, vfloat16m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmsac_vv_f16m8_rm_tum(vbool2_t vm, vfloat16m8_t vd,
                                            vfloat16m8_t vs1, vfloat16m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmsac_vf_f16m8_rm_tum(vbool2_t vm, vfloat16m8_t vd,
                                            _Float16 rs1, vfloat16m8_t vs2,
                                            unsigned int frm, size_t vl);
// f32 forms: scalar operand is float.
vfloat32mf2_t __riscv_vfmsac_vv_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat32mf2_t vs1,
                                              vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmsac_vf_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                              float rs1, vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmsac_vv_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat32m1_t vs1, vfloat32m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmsac_vf_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                            float rs1, vfloat32m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmsac_vv_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat32m2_t vs1, vfloat32m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmsac_vf_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                            float rs1, vfloat32m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmsac_vv_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat32m4_t vs1, vfloat32m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmsac_vf_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                            float rs1, vfloat32m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmsac_vv_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat32m8_t vs1, vfloat32m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmsac_vf_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                            float rs1, vfloat32m8_t vs2,
                                            unsigned int frm, size_t vl);
// f64 forms: scalar operand is double.
vfloat64m1_t __riscv_vfmsac_vv_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat64m1_t vs1, vfloat64m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmsac_vf_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                            double rs1, vfloat64m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmsac_vv_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat64m2_t vs1, vfloat64m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmsac_vf_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                            double rs1, vfloat64m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmsac_vv_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat64m4_t vs1, vfloat64m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmsac_vf_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                            double rs1, vfloat64m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmsac_vv_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat64m8_t vs1, vfloat64m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmsac_vf_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                            double rs1, vfloat64m8_t vs2,
                                            unsigned int frm, size_t vl);
// __riscv_vfnmsac_{vv,vf}_<type>_rm_tum prototypes: one vector-vector (vv,
// `vs1`) and one vector-scalar (vf, `rs1`) declaration for every f16, f32 and
// f64 vector type listed. Each takes a mask `vm`, an operand `vd` whose type
// equals the return type, `vs2`, `unsigned int frm` and `size_t vl`. The scalar
// `rs1` is `_Float16`, `float` or `double` to match the element width.
// NOTE(review): `frm` is presumably the rounding mode implied by the `_rm`
// suffix and `_tum` a tail/mask policy -- confirm against the RVV spec.
vfloat16mf4_t __riscv_vfnmsac_vv_f16mf4_rm_tum(vbool64_t vm, vfloat16mf4_t vd,
                                               vfloat16mf4_t vs1,
                                               vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfnmsac_vf_f16mf4_rm_tum(vbool64_t vm, vfloat16mf4_t vd,
                                               _Float16 rs1, vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmsac_vv_f16mf2_rm_tum(vbool32_t vm, vfloat16mf2_t vd,
                                               vfloat16mf2_t vs1,
                                               vfloat16mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmsac_vf_f16mf2_rm_tum(vbool32_t vm, vfloat16mf2_t vd,
                                               _Float16 rs1, vfloat16mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmsac_vv_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                             vfloat16m1_t vs1, vfloat16m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmsac_vf_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                             _Float16 rs1, vfloat16m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmsac_vv_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                             vfloat16m2_t vs1, vfloat16m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmsac_vf_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                             _Float16 rs1, vfloat16m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmsac_vv_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                             vfloat16m4_t vs1, vfloat16m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmsac_vf_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                             _Float16 rs1, vfloat16m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmsac_vv_f16m8_rm_tum(vbool2_t vm, vfloat16m8_t vd,
                                             vfloat16m8_t vs1, vfloat16m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmsac_vf_f16m8_rm_tum(vbool2_t vm, vfloat16m8_t vd,
                                             _Float16 rs1, vfloat16m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmsac_vv_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                               vfloat32mf2_t vs1,
                                               vfloat32mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmsac_vf_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                               float rs1, vfloat32mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmsac_vv_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                             vfloat32m1_t vs1, vfloat32m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmsac_vf_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                             float rs1, vfloat32m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmsac_vv_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                             vfloat32m2_t vs1, vfloat32m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmsac_vf_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                             float rs1, vfloat32m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmsac_vv_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                             vfloat32m4_t vs1, vfloat32m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmsac_vf_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                             float rs1, vfloat32m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmsac_vv_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                             vfloat32m8_t vs1, vfloat32m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmsac_vf_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                             float rs1, vfloat32m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmsac_vv_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                             vfloat64m1_t vs1, vfloat64m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmsac_vf_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                             double rs1, vfloat64m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmsac_vv_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                             vfloat64m2_t vs1, vfloat64m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmsac_vf_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                             double rs1, vfloat64m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmsac_vv_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                             vfloat64m4_t vs1, vfloat64m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmsac_vf_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                             double rs1, vfloat64m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmsac_vv_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                             vfloat64m8_t vs1, vfloat64m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmsac_vf_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                             double rs1, vfloat64m8_t vs2,
                                             unsigned int frm, size_t vl);
// __riscv_vfmadd_{vv,vf}_<type>_rm_tum prototypes: one vector-vector (vv,
// `vs1`) and one vector-scalar (vf, `rs1`) declaration for every f16, f32 and
// f64 vector type listed. Each takes a mask `vm`, an operand `vd` whose type
// equals the return type, `vs2`, `unsigned int frm` and `size_t vl`. The scalar
// `rs1` is `_Float16`, `float` or `double` to match the element width.
// NOTE(review): `frm` is presumably the rounding mode implied by the `_rm`
// suffix and `_tum` a tail/mask policy -- confirm against the RVV spec.
vfloat16mf4_t __riscv_vfmadd_vv_f16mf4_rm_tum(vbool64_t vm, vfloat16mf4_t vd,
                                              vfloat16mf4_t vs1,
                                              vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmadd_vf_f16mf4_rm_tum(vbool64_t vm, vfloat16mf4_t vd,
                                              _Float16 rs1, vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmadd_vv_f16mf2_rm_tum(vbool32_t vm, vfloat16mf2_t vd,
                                              vfloat16mf2_t vs1,
                                              vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmadd_vf_f16mf2_rm_tum(vbool32_t vm, vfloat16mf2_t vd,
                                              _Float16 rs1, vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmadd_vv_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                            vfloat16m1_t vs1, vfloat16m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmadd_vf_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                            _Float16 rs1, vfloat16m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmadd_vv_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                            vfloat16m2_t vs1, vfloat16m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmadd_vf_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                            _Float16 rs1, vfloat16m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmadd_vv_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                            vfloat16m4_t vs1, vfloat16m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmadd_vf_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                            _Float16 rs1, vfloat16m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmadd_vv_f16m8_rm_tum(vbool2_t vm, vfloat16m8_t vd,
                                            vfloat16m8_t vs1, vfloat16m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmadd_vf_f16m8_rm_tum(vbool2_t vm, vfloat16m8_t vd,
                                            _Float16 rs1, vfloat16m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmadd_vv_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat32mf2_t vs1,
                                              vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmadd_vf_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                              float rs1, vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmadd_vv_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat32m1_t vs1, vfloat32m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmadd_vf_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                            float rs1, vfloat32m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmadd_vv_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat32m2_t vs1, vfloat32m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmadd_vf_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                            float rs1, vfloat32m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmadd_vv_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat32m4_t vs1, vfloat32m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmadd_vf_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                            float rs1, vfloat32m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmadd_vv_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat32m8_t vs1, vfloat32m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmadd_vf_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                            float rs1, vfloat32m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmadd_vv_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat64m1_t vs1, vfloat64m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmadd_vf_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                            double rs1, vfloat64m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmadd_vv_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat64m2_t vs1, vfloat64m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmadd_vf_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                            double rs1, vfloat64m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmadd_vv_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat64m4_t vs1, vfloat64m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmadd_vf_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                            double rs1, vfloat64m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmadd_vv_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat64m8_t vs1, vfloat64m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmadd_vf_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                            double rs1, vfloat64m8_t vs2,
                                            unsigned int frm, size_t vl);
// __riscv_vfnmadd_{vv,vf}_<type>_rm_tum prototypes: one vector-vector (vv,
// `vs1`) and one vector-scalar (vf, `rs1`) declaration for every f16, f32 and
// f64 vector type listed. Each takes a mask `vm`, an operand `vd` whose type
// equals the return type, `vs2`, `unsigned int frm` and `size_t vl`. The scalar
// `rs1` is `_Float16`, `float` or `double` to match the element width.
// NOTE(review): `frm` is presumably the rounding mode implied by the `_rm`
// suffix and `_tum` a tail/mask policy -- confirm against the RVV spec.
vfloat16mf4_t __riscv_vfnmadd_vv_f16mf4_rm_tum(vbool64_t vm, vfloat16mf4_t vd,
                                               vfloat16mf4_t vs1,
                                               vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfnmadd_vf_f16mf4_rm_tum(vbool64_t vm, vfloat16mf4_t vd,
                                               _Float16 rs1, vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmadd_vv_f16mf2_rm_tum(vbool32_t vm, vfloat16mf2_t vd,
                                               vfloat16mf2_t vs1,
                                               vfloat16mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmadd_vf_f16mf2_rm_tum(vbool32_t vm, vfloat16mf2_t vd,
                                               _Float16 rs1, vfloat16mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmadd_vv_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                             vfloat16m1_t vs1, vfloat16m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmadd_vf_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                             _Float16 rs1, vfloat16m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmadd_vv_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                             vfloat16m2_t vs1, vfloat16m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmadd_vf_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                             _Float16 rs1, vfloat16m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmadd_vv_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                             vfloat16m4_t vs1, vfloat16m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmadd_vf_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                             _Float16 rs1, vfloat16m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmadd_vv_f16m8_rm_tum(vbool2_t vm, vfloat16m8_t vd,
                                             vfloat16m8_t vs1, vfloat16m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmadd_vf_f16m8_rm_tum(vbool2_t vm, vfloat16m8_t vd,
                                             _Float16 rs1, vfloat16m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmadd_vv_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                               vfloat32mf2_t vs1,
                                               vfloat32mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmadd_vf_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                               float rs1, vfloat32mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmadd_vv_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                             vfloat32m1_t vs1, vfloat32m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmadd_vf_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                             float rs1, vfloat32m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmadd_vv_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                             vfloat32m2_t vs1, vfloat32m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmadd_vf_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                             float rs1, vfloat32m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmadd_vv_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                             vfloat32m4_t vs1, vfloat32m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmadd_vf_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                             float rs1, vfloat32m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmadd_vv_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                             vfloat32m8_t vs1, vfloat32m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmadd_vf_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                             float rs1, vfloat32m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmadd_vv_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                             vfloat64m1_t vs1, vfloat64m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmadd_vf_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                             double rs1, vfloat64m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmadd_vv_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                             vfloat64m2_t vs1, vfloat64m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmadd_vf_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                             double rs1, vfloat64m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmadd_vv_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                             vfloat64m4_t vs1, vfloat64m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmadd_vf_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                             double rs1, vfloat64m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmadd_vv_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                             vfloat64m8_t vs1, vfloat64m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmadd_vf_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                             double rs1, vfloat64m8_t vs2,
                                             unsigned int frm, size_t vl);
// __riscv_vfmsub_{vv,vf}_<type>_rm_tum prototypes: one vector-vector (vv,
// `vs1`) and one vector-scalar (vf, `rs1`) declaration for every f16, f32 and
// f64 vector type listed. Each takes a mask `vm`, an operand `vd` whose type
// equals the return type, `vs2`, `unsigned int frm` and `size_t vl`. The scalar
// `rs1` is `_Float16`, `float` or `double` to match the element width.
// NOTE(review): `frm` is presumably the rounding mode implied by the `_rm`
// suffix and `_tum` a tail/mask policy -- confirm against the RVV spec.
vfloat16mf4_t __riscv_vfmsub_vv_f16mf4_rm_tum(vbool64_t vm, vfloat16mf4_t vd,
                                              vfloat16mf4_t vs1,
                                              vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmsub_vf_f16mf4_rm_tum(vbool64_t vm, vfloat16mf4_t vd,
                                              _Float16 rs1, vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmsub_vv_f16mf2_rm_tum(vbool32_t vm, vfloat16mf2_t vd,
                                              vfloat16mf2_t vs1,
                                              vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmsub_vf_f16mf2_rm_tum(vbool32_t vm, vfloat16mf2_t vd,
                                              _Float16 rs1, vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmsub_vv_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                            vfloat16m1_t vs1, vfloat16m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmsub_vf_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                            _Float16 rs1, vfloat16m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmsub_vv_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                            vfloat16m2_t vs1, vfloat16m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmsub_vf_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                            _Float16 rs1, vfloat16m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmsub_vv_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                            vfloat16m4_t vs1, vfloat16m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmsub_vf_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                            _Float16 rs1, vfloat16m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmsub_vv_f16m8_rm_tum(vbool2_t vm, vfloat16m8_t vd,
                                            vfloat16m8_t vs1, vfloat16m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmsub_vf_f16m8_rm_tum(vbool2_t vm, vfloat16m8_t vd,
                                            _Float16 rs1, vfloat16m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmsub_vv_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat32mf2_t vs1,
                                              vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmsub_vf_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                              float rs1, vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmsub_vv_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat32m1_t vs1, vfloat32m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmsub_vf_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                            float rs1, vfloat32m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmsub_vv_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat32m2_t vs1, vfloat32m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmsub_vf_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                            float rs1, vfloat32m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmsub_vv_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat32m4_t vs1, vfloat32m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmsub_vf_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                            float rs1, vfloat32m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmsub_vv_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat32m8_t vs1, vfloat32m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmsub_vf_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                            float rs1, vfloat32m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmsub_vv_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat64m1_t vs1, vfloat64m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmsub_vf_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                            double rs1, vfloat64m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmsub_vv_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat64m2_t vs1, vfloat64m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmsub_vf_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                            double rs1, vfloat64m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmsub_vv_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat64m4_t vs1, vfloat64m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmsub_vf_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                            double rs1, vfloat64m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmsub_vv_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat64m8_t vs1, vfloat64m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmsub_vf_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                            double rs1, vfloat64m8_t vs2,
                                            unsigned int frm, size_t vl);
// __riscv_vfnmsub_{vv,vf}_<type>_rm_tum prototypes: one vector-vector (vv,
// `vs1`) and one vector-scalar (vf, `rs1`) declaration for every f16, f32 and
// f64 vector type listed. Each takes a mask `vm`, an operand `vd` whose type
// equals the return type, `vs2`, `unsigned int frm` and `size_t vl`. The scalar
// `rs1` is `_Float16`, `float` or `double` to match the element width.
// NOTE(review): `frm` is presumably the rounding mode implied by the `_rm`
// suffix and `_tum` a tail/mask policy -- confirm against the RVV spec.
vfloat16mf4_t __riscv_vfnmsub_vv_f16mf4_rm_tum(vbool64_t vm, vfloat16mf4_t vd,
                                               vfloat16mf4_t vs1,
                                               vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfnmsub_vf_f16mf4_rm_tum(vbool64_t vm, vfloat16mf4_t vd,
                                               _Float16 rs1, vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmsub_vv_f16mf2_rm_tum(vbool32_t vm, vfloat16mf2_t vd,
                                               vfloat16mf2_t vs1,
                                               vfloat16mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmsub_vf_f16mf2_rm_tum(vbool32_t vm, vfloat16mf2_t vd,
                                               _Float16 rs1, vfloat16mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmsub_vv_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                             vfloat16m1_t vs1, vfloat16m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmsub_vf_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                             _Float16 rs1, vfloat16m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmsub_vv_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                             vfloat16m2_t vs1, vfloat16m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmsub_vf_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                             _Float16 rs1, vfloat16m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmsub_vv_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                             vfloat16m4_t vs1, vfloat16m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmsub_vf_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                             _Float16 rs1, vfloat16m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmsub_vv_f16m8_rm_tum(vbool2_t vm, vfloat16m8_t vd,
                                             vfloat16m8_t vs1, vfloat16m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmsub_vf_f16m8_rm_tum(vbool2_t vm, vfloat16m8_t vd,
                                             _Float16 rs1, vfloat16m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmsub_vv_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                               vfloat32mf2_t vs1,
                                               vfloat32mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmsub_vf_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                               float rs1, vfloat32mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmsub_vv_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                             vfloat32m1_t vs1, vfloat32m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmsub_vf_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                             float rs1, vfloat32m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmsub_vv_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                             vfloat32m2_t vs1, vfloat32m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmsub_vf_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                             float rs1, vfloat32m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmsub_vv_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                             vfloat32m4_t vs1, vfloat32m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmsub_vf_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                             float rs1, vfloat32m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmsub_vv_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                             vfloat32m8_t vs1, vfloat32m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmsub_vf_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                             float rs1, vfloat32m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmsub_vv_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                             vfloat64m1_t vs1, vfloat64m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmsub_vf_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                             double rs1, vfloat64m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmsub_vv_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                             vfloat64m2_t vs1, vfloat64m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmsub_vf_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                             double rs1, vfloat64m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmsub_vv_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                             vfloat64m4_t vs1, vfloat64m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmsub_vf_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                             double rs1, vfloat64m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmsub_vv_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                             vfloat64m8_t vs1, vfloat64m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmsub_vf_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                             double rs1, vfloat64m8_t vs2,
                                             unsigned int frm, size_t vl);
// masked functions
// vfmacc, `_rm_tumu` overloads. Each type/LMUL suffix below is declared twice:
// `_vv` takes a vector `vs1`, `_vf` takes a scalar `rs1` of the matching
// element type (_Float16 / float / double). Every overload returns the type of
// `vd`; the mask `vm` comes first, `frm` and `vl` come last.
// NOTE(review): per the RVV spec (not visible in this listing) vfmacc computes
// vd[i] = +(vs1[i] * vs2[i]) + vd[i], `frm` is the rounding-mode operand, and
// `_tumu` selects the tail-undisturbed, mask-undisturbed policy -- confirm
// against the spec before relying on this summary.
vfloat16mf4_t __riscv_vfmacc_vv_f16mf4_rm_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                               vfloat16mf4_t vs1,
                                               vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmacc_vf_f16mf4_rm_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                               _Float16 rs1, vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmacc_vv_f16mf2_rm_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                               vfloat16mf2_t vs1,
                                               vfloat16mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmacc_vf_f16mf2_rm_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                               _Float16 rs1, vfloat16mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmacc_vv_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                             vfloat16m1_t vs1, vfloat16m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmacc_vf_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                             _Float16 rs1, vfloat16m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmacc_vv_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                             vfloat16m2_t vs1, vfloat16m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmacc_vf_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                             _Float16 rs1, vfloat16m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmacc_vv_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                             vfloat16m4_t vs1, vfloat16m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmacc_vf_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                             _Float16 rs1, vfloat16m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmacc_vv_f16m8_rm_tumu(vbool2_t vm, vfloat16m8_t vd,
                                             vfloat16m8_t vs1, vfloat16m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmacc_vf_f16m8_rm_tumu(vbool2_t vm, vfloat16m8_t vd,
                                             _Float16 rs1, vfloat16m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmacc_vv_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                               vfloat32mf2_t vs1,
                                               vfloat32mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmacc_vf_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                               float rs1, vfloat32mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmacc_vv_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                             vfloat32m1_t vs1, vfloat32m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmacc_vf_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                             float rs1, vfloat32m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmacc_vv_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                             vfloat32m2_t vs1, vfloat32m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmacc_vf_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                             float rs1, vfloat32m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmacc_vv_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                             vfloat32m4_t vs1, vfloat32m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmacc_vf_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                             float rs1, vfloat32m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmacc_vv_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                             vfloat32m8_t vs1, vfloat32m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmacc_vf_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                             float rs1, vfloat32m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmacc_vv_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                             vfloat64m1_t vs1, vfloat64m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmacc_vf_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                             double rs1, vfloat64m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmacc_vv_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                             vfloat64m2_t vs1, vfloat64m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmacc_vf_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                             double rs1, vfloat64m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmacc_vv_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                             vfloat64m4_t vs1, vfloat64m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmacc_vf_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                             double rs1, vfloat64m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmacc_vv_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                             vfloat64m8_t vs1, vfloat64m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmacc_vf_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                             double rs1, vfloat64m8_t vs2,
                                             unsigned int frm, size_t vl);
// vfnmacc, `_rm_tumu` overloads. Each type/LMUL suffix below is declared
// twice: `_vv` takes a vector `vs1`, `_vf` takes a scalar `rs1` of the
// matching element type (_Float16 / float / double). Every overload returns
// the type of `vd`; the mask `vm` comes first, `frm` and `vl` come last.
// NOTE(review): per the RVV spec (not visible in this listing) vfnmacc
// computes vd[i] = -(vs1[i] * vs2[i]) - vd[i], and `_tumu` selects the
// tail-undisturbed, mask-undisturbed policy -- confirm against the spec.
vfloat16mf4_t __riscv_vfnmacc_vv_f16mf4_rm_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                                vfloat16mf4_t vs1,
                                                vfloat16mf4_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfnmacc_vf_f16mf4_rm_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                                _Float16 rs1, vfloat16mf4_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmacc_vv_f16mf2_rm_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                                vfloat16mf2_t vs1,
                                                vfloat16mf2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmacc_vf_f16mf2_rm_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                                _Float16 rs1, vfloat16mf2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmacc_vv_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                              vfloat16m1_t vs1,
                                              vfloat16m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmacc_vf_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                              _Float16 rs1, vfloat16m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmacc_vv_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                              vfloat16m2_t vs1,
                                              vfloat16m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmacc_vf_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                              _Float16 rs1, vfloat16m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmacc_vv_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                              vfloat16m4_t vs1,
                                              vfloat16m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmacc_vf_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                              _Float16 rs1, vfloat16m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmacc_vv_f16m8_rm_tumu(vbool2_t vm, vfloat16m8_t vd,
                                              vfloat16m8_t vs1,
                                              vfloat16m8_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmacc_vf_f16m8_rm_tumu(vbool2_t vm, vfloat16m8_t vd,
                                              _Float16 rs1, vfloat16m8_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmacc_vv_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                                vfloat32mf2_t vs1,
                                                vfloat32mf2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmacc_vf_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                                float rs1, vfloat32mf2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmacc_vv_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                              vfloat32m1_t vs1,
                                              vfloat32m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmacc_vf_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                              float rs1, vfloat32m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmacc_vv_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                              vfloat32m2_t vs1,
                                              vfloat32m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmacc_vf_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                              float rs1, vfloat32m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmacc_vv_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                              vfloat32m4_t vs1,
                                              vfloat32m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmacc_vf_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                              float rs1, vfloat32m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmacc_vv_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                              vfloat32m8_t vs1,
                                              vfloat32m8_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmacc_vf_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                              float rs1, vfloat32m8_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmacc_vv_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                              vfloat64m1_t vs1,
                                              vfloat64m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmacc_vf_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                              double rs1, vfloat64m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmacc_vv_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                              vfloat64m2_t vs1,
                                              vfloat64m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmacc_vf_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                              double rs1, vfloat64m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmacc_vv_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                              vfloat64m4_t vs1,
                                              vfloat64m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmacc_vf_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                              double rs1, vfloat64m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmacc_vv_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                              vfloat64m8_t vs1,
                                              vfloat64m8_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmacc_vf_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                              double rs1, vfloat64m8_t vs2,
                                              unsigned int frm, size_t vl);
// vfmsac, `_rm_tumu` overloads. Each type/LMUL suffix below is declared twice:
// `_vv` takes a vector `vs1`, `_vf` takes a scalar `rs1` of the matching
// element type (_Float16 / float / double). Every overload returns the type of
// `vd`; the mask `vm` comes first, `frm` and `vl` come last.
// NOTE(review): per the RVV spec (not visible in this listing) vfmsac computes
// vd[i] = +(vs1[i] * vs2[i]) - vd[i], and `_tumu` selects the
// tail-undisturbed, mask-undisturbed policy -- confirm against the spec.
vfloat16mf4_t __riscv_vfmsac_vv_f16mf4_rm_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                               vfloat16mf4_t vs1,
                                               vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmsac_vf_f16mf4_rm_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                               _Float16 rs1, vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmsac_vv_f16mf2_rm_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                               vfloat16mf2_t vs1,
                                               vfloat16mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmsac_vf_f16mf2_rm_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                               _Float16 rs1, vfloat16mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmsac_vv_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                             vfloat16m1_t vs1, vfloat16m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmsac_vf_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                             _Float16 rs1, vfloat16m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmsac_vv_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                             vfloat16m2_t vs1, vfloat16m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmsac_vf_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                             _Float16 rs1, vfloat16m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmsac_vv_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                             vfloat16m4_t vs1, vfloat16m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmsac_vf_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                             _Float16 rs1, vfloat16m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmsac_vv_f16m8_rm_tumu(vbool2_t vm, vfloat16m8_t vd,
                                             vfloat16m8_t vs1, vfloat16m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmsac_vf_f16m8_rm_tumu(vbool2_t vm, vfloat16m8_t vd,
                                             _Float16 rs1, vfloat16m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmsac_vv_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                               vfloat32mf2_t vs1,
                                               vfloat32mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmsac_vf_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                               float rs1, vfloat32mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmsac_vv_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                             vfloat32m1_t vs1, vfloat32m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmsac_vf_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                             float rs1, vfloat32m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmsac_vv_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                             vfloat32m2_t vs1, vfloat32m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmsac_vf_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                             float rs1, vfloat32m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmsac_vv_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                             vfloat32m4_t vs1, vfloat32m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmsac_vf_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                             float rs1, vfloat32m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmsac_vv_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                             vfloat32m8_t vs1, vfloat32m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmsac_vf_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                             float rs1, vfloat32m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmsac_vv_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                             vfloat64m1_t vs1, vfloat64m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmsac_vf_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                             double rs1, vfloat64m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmsac_vv_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                             vfloat64m2_t vs1, vfloat64m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmsac_vf_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                             double rs1, vfloat64m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmsac_vv_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                             vfloat64m4_t vs1, vfloat64m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmsac_vf_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                             double rs1, vfloat64m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmsac_vv_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                             vfloat64m8_t vs1, vfloat64m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmsac_vf_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                             double rs1, vfloat64m8_t vs2,
                                             unsigned int frm, size_t vl);
// vfnmsac, `_rm_tumu` overloads. Each type/LMUL suffix below is declared
// twice: `_vv` takes a vector `vs1`, `_vf` takes a scalar `rs1` of the
// matching element type (_Float16 / float / double). Every overload returns
// the type of `vd`; the mask `vm` comes first, `frm` and `vl` come last.
// NOTE(review): per the RVV spec (not visible in this listing) vfnmsac
// computes vd[i] = -(vs1[i] * vs2[i]) + vd[i], and `_tumu` selects the
// tail-undisturbed, mask-undisturbed policy -- confirm against the spec.
vfloat16mf4_t __riscv_vfnmsac_vv_f16mf4_rm_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                                vfloat16mf4_t vs1,
                                                vfloat16mf4_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfnmsac_vf_f16mf4_rm_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                                _Float16 rs1, vfloat16mf4_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmsac_vv_f16mf2_rm_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                                vfloat16mf2_t vs1,
                                                vfloat16mf2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmsac_vf_f16mf2_rm_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                                _Float16 rs1, vfloat16mf2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmsac_vv_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                              vfloat16m1_t vs1,
                                              vfloat16m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmsac_vf_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                              _Float16 rs1, vfloat16m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmsac_vv_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                              vfloat16m2_t vs1,
                                              vfloat16m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmsac_vf_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                              _Float16 rs1, vfloat16m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmsac_vv_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                              vfloat16m4_t vs1,
                                              vfloat16m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmsac_vf_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                              _Float16 rs1, vfloat16m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmsac_vv_f16m8_rm_tumu(vbool2_t vm, vfloat16m8_t vd,
                                              vfloat16m8_t vs1,
                                              vfloat16m8_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmsac_vf_f16m8_rm_tumu(vbool2_t vm, vfloat16m8_t vd,
                                              _Float16 rs1, vfloat16m8_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmsac_vv_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                                vfloat32mf2_t vs1,
                                                vfloat32mf2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmsac_vf_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                                float rs1, vfloat32mf2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmsac_vv_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                              vfloat32m1_t vs1,
                                              vfloat32m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmsac_vf_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                              float rs1, vfloat32m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmsac_vv_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                              vfloat32m2_t vs1,
                                              vfloat32m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmsac_vf_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                              float rs1, vfloat32m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmsac_vv_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                              vfloat32m4_t vs1,
                                              vfloat32m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmsac_vf_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                              float rs1, vfloat32m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmsac_vv_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                              vfloat32m8_t vs1,
                                              vfloat32m8_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmsac_vf_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                              float rs1, vfloat32m8_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmsac_vv_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                              vfloat64m1_t vs1,
                                              vfloat64m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmsac_vf_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                              double rs1, vfloat64m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmsac_vv_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                              vfloat64m2_t vs1,
                                              vfloat64m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmsac_vf_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                              double rs1, vfloat64m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmsac_vv_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                              vfloat64m4_t vs1,
                                              vfloat64m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmsac_vf_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                              double rs1, vfloat64m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmsac_vv_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                              vfloat64m8_t vs1,
                                              vfloat64m8_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmsac_vf_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                              double rs1, vfloat64m8_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmadd_vv_f16mf4_rm_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                               vfloat16mf4_t vs1,
                                               vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmadd_vf_f16mf4_rm_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                               _Float16 rs1, vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
// __riscv_vfmadd_{vv,vf}_<type>_rm_tumu: masked prototypes with an explicit
// `frm` argument. The `_vv` form takes a vector `vs1`; the `_vf` form takes a
// scalar `rs1` (_Float16, float or double, matching the f16/f32/f64 element
// type). The return type is always the type of `vd`, and the `vm` mask type
// pairs with the vector type as listed (e.g. f16m1 -> vbool16_t,
// f64m8 -> vbool8_t).
// NOTE(review): presumably vd[i] = (vd[i] * vs1[i]) + vs2[i] with tail- and
// mask-undisturbed policy, and `frm` a rounding-mode selector; none of that
// is visible in this listing - confirm against the RVV intrinsic spec.
vfloat16mf2_t __riscv_vfmadd_vv_f16mf2_rm_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                               vfloat16mf2_t vs1,
                                               vfloat16mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmadd_vf_f16mf2_rm_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                               _Float16 rs1, vfloat16mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmadd_vv_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                             vfloat16m1_t vs1, vfloat16m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmadd_vf_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                             _Float16 rs1, vfloat16m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmadd_vv_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                             vfloat16m2_t vs1, vfloat16m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmadd_vf_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                             _Float16 rs1, vfloat16m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmadd_vv_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                             vfloat16m4_t vs1, vfloat16m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmadd_vf_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                             _Float16 rs1, vfloat16m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmadd_vv_f16m8_rm_tumu(vbool2_t vm, vfloat16m8_t vd,
                                             vfloat16m8_t vs1, vfloat16m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmadd_vf_f16m8_rm_tumu(vbool2_t vm, vfloat16m8_t vd,
                                             _Float16 rs1, vfloat16m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmadd_vv_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                               vfloat32mf2_t vs1,
                                               vfloat32mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmadd_vf_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                               float rs1, vfloat32mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmadd_vv_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                             vfloat32m1_t vs1, vfloat32m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmadd_vf_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                             float rs1, vfloat32m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmadd_vv_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                             vfloat32m2_t vs1, vfloat32m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmadd_vf_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                             float rs1, vfloat32m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmadd_vv_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                             vfloat32m4_t vs1, vfloat32m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmadd_vf_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                             float rs1, vfloat32m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmadd_vv_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                             vfloat32m8_t vs1, vfloat32m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmadd_vf_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                             float rs1, vfloat32m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmadd_vv_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                             vfloat64m1_t vs1, vfloat64m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmadd_vf_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                             double rs1, vfloat64m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmadd_vv_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                             vfloat64m2_t vs1, vfloat64m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmadd_vf_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                             double rs1, vfloat64m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmadd_vv_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                             vfloat64m4_t vs1, vfloat64m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmadd_vf_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                             double rs1, vfloat64m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmadd_vv_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                             vfloat64m8_t vs1, vfloat64m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmadd_vf_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                             double rs1, vfloat64m8_t vs2,
                                             unsigned int frm, size_t vl);
// __riscv_vfnmadd_{vv,vf}_<type>_rm_tumu: masked prototypes with an explicit
// `frm` argument, one `_vv`/`_vf` pair per vector type from f16mf4 to f64m8.
// The `_vv` form takes a vector `vs1`; the `_vf` form takes a scalar `rs1`
// (_Float16, float or double, matching the f16/f32/f64 element type). The
// return type is always the type of `vd`, and the `vm` mask type pairs with
// the vector type as listed (e.g. f16mf4 -> vbool64_t, f64m8 -> vbool8_t).
// NOTE(review): presumably vd[i] = -(vd[i] * vs1[i]) - vs2[i] with tail- and
// mask-undisturbed policy, and `frm` a rounding-mode selector; none of that
// is visible in this listing - confirm against the RVV intrinsic spec.
vfloat16mf4_t __riscv_vfnmadd_vv_f16mf4_rm_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                                vfloat16mf4_t vs1,
                                                vfloat16mf4_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfnmadd_vf_f16mf4_rm_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                                _Float16 rs1, vfloat16mf4_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmadd_vv_f16mf2_rm_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                                vfloat16mf2_t vs1,
                                                vfloat16mf2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmadd_vf_f16mf2_rm_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                                _Float16 rs1, vfloat16mf2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmadd_vv_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                              vfloat16m1_t vs1,
                                              vfloat16m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmadd_vf_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                              _Float16 rs1, vfloat16m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmadd_vv_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                              vfloat16m2_t vs1,
                                              vfloat16m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmadd_vf_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                              _Float16 rs1, vfloat16m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmadd_vv_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                              vfloat16m4_t vs1,
                                              vfloat16m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmadd_vf_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                              _Float16 rs1, vfloat16m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmadd_vv_f16m8_rm_tumu(vbool2_t vm, vfloat16m8_t vd,
                                              vfloat16m8_t vs1,
                                              vfloat16m8_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmadd_vf_f16m8_rm_tumu(vbool2_t vm, vfloat16m8_t vd,
                                              _Float16 rs1, vfloat16m8_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmadd_vv_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                                vfloat32mf2_t vs1,
                                                vfloat32mf2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmadd_vf_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                                float rs1, vfloat32mf2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmadd_vv_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                              vfloat32m1_t vs1,
                                              vfloat32m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmadd_vf_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                              float rs1, vfloat32m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmadd_vv_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                              vfloat32m2_t vs1,
                                              vfloat32m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmadd_vf_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                              float rs1, vfloat32m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmadd_vv_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                              vfloat32m4_t vs1,
                                              vfloat32m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmadd_vf_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                              float rs1, vfloat32m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmadd_vv_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                              vfloat32m8_t vs1,
                                              vfloat32m8_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmadd_vf_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                              float rs1, vfloat32m8_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmadd_vv_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                              vfloat64m1_t vs1,
                                              vfloat64m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmadd_vf_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                              double rs1, vfloat64m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmadd_vv_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                              vfloat64m2_t vs1,
                                              vfloat64m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmadd_vf_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                              double rs1, vfloat64m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmadd_vv_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                              vfloat64m4_t vs1,
                                              vfloat64m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmadd_vf_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                              double rs1, vfloat64m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmadd_vv_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                              vfloat64m8_t vs1,
                                              vfloat64m8_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmadd_vf_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                              double rs1, vfloat64m8_t vs2,
                                              unsigned int frm, size_t vl);
// __riscv_vfmsub_{vv,vf}_<type>_rm_tumu: masked prototypes with an explicit
// `frm` argument, one `_vv`/`_vf` pair per vector type from f16mf4 to f64m8.
// The `_vv` form takes a vector `vs1`; the `_vf` form takes a scalar `rs1`
// (_Float16, float or double, matching the f16/f32/f64 element type). The
// return type is always the type of `vd`, and the `vm` mask type pairs with
// the vector type as listed (e.g. f16mf4 -> vbool64_t, f64m8 -> vbool8_t).
// NOTE(review): presumably vd[i] = (vd[i] * vs1[i]) - vs2[i] with tail- and
// mask-undisturbed policy, and `frm` a rounding-mode selector; none of that
// is visible in this listing - confirm against the RVV intrinsic spec.
vfloat16mf4_t __riscv_vfmsub_vv_f16mf4_rm_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                               vfloat16mf4_t vs1,
                                               vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmsub_vf_f16mf4_rm_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                               _Float16 rs1, vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmsub_vv_f16mf2_rm_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                               vfloat16mf2_t vs1,
                                               vfloat16mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmsub_vf_f16mf2_rm_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                               _Float16 rs1, vfloat16mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmsub_vv_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                             vfloat16m1_t vs1, vfloat16m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmsub_vf_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                             _Float16 rs1, vfloat16m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmsub_vv_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                             vfloat16m2_t vs1, vfloat16m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmsub_vf_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                             _Float16 rs1, vfloat16m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmsub_vv_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                             vfloat16m4_t vs1, vfloat16m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmsub_vf_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                             _Float16 rs1, vfloat16m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmsub_vv_f16m8_rm_tumu(vbool2_t vm, vfloat16m8_t vd,
                                             vfloat16m8_t vs1, vfloat16m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmsub_vf_f16m8_rm_tumu(vbool2_t vm, vfloat16m8_t vd,
                                             _Float16 rs1, vfloat16m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmsub_vv_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                               vfloat32mf2_t vs1,
                                               vfloat32mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmsub_vf_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                               float rs1, vfloat32mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmsub_vv_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                             vfloat32m1_t vs1, vfloat32m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmsub_vf_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                             float rs1, vfloat32m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmsub_vv_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                             vfloat32m2_t vs1, vfloat32m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmsub_vf_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                             float rs1, vfloat32m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmsub_vv_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                             vfloat32m4_t vs1, vfloat32m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmsub_vf_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                             float rs1, vfloat32m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmsub_vv_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                             vfloat32m8_t vs1, vfloat32m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmsub_vf_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                             float rs1, vfloat32m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmsub_vv_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                             vfloat64m1_t vs1, vfloat64m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmsub_vf_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                             double rs1, vfloat64m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmsub_vv_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                             vfloat64m2_t vs1, vfloat64m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmsub_vf_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                             double rs1, vfloat64m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmsub_vv_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                             vfloat64m4_t vs1, vfloat64m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmsub_vf_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                             double rs1, vfloat64m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmsub_vv_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                             vfloat64m8_t vs1, vfloat64m8_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmsub_vf_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                             double rs1, vfloat64m8_t vs2,
                                             unsigned int frm, size_t vl);
// __riscv_vfnmsub_{vv,vf}_<type>_rm_tumu: masked prototypes with an explicit
// `frm` argument, one `_vv`/`_vf` pair per vector type from f16mf4 to f64m8.
// The `_vv` form takes a vector `vs1`; the `_vf` form takes a scalar `rs1`
// (_Float16, float or double, matching the f16/f32/f64 element type). The
// return type is always the type of `vd`, and the `vm` mask type pairs with
// the vector type as listed (e.g. f16mf4 -> vbool64_t, f64m8 -> vbool8_t).
// NOTE(review): presumably vd[i] = -(vd[i] * vs1[i]) + vs2[i] with tail- and
// mask-undisturbed policy, and `frm` a rounding-mode selector; none of that
// is visible in this listing - confirm against the RVV intrinsic spec.
vfloat16mf4_t __riscv_vfnmsub_vv_f16mf4_rm_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                                vfloat16mf4_t vs1,
                                                vfloat16mf4_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfnmsub_vf_f16mf4_rm_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                                _Float16 rs1, vfloat16mf4_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmsub_vv_f16mf2_rm_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                                vfloat16mf2_t vs1,
                                                vfloat16mf2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmsub_vf_f16mf2_rm_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                                _Float16 rs1, vfloat16mf2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmsub_vv_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                              vfloat16m1_t vs1,
                                              vfloat16m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmsub_vf_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                              _Float16 rs1, vfloat16m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmsub_vv_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                              vfloat16m2_t vs1,
                                              vfloat16m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmsub_vf_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                              _Float16 rs1, vfloat16m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmsub_vv_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                              vfloat16m4_t vs1,
                                              vfloat16m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmsub_vf_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                              _Float16 rs1, vfloat16m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmsub_vv_f16m8_rm_tumu(vbool2_t vm, vfloat16m8_t vd,
                                              vfloat16m8_t vs1,
                                              vfloat16m8_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmsub_vf_f16m8_rm_tumu(vbool2_t vm, vfloat16m8_t vd,
                                              _Float16 rs1, vfloat16m8_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmsub_vv_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                                vfloat32mf2_t vs1,
                                                vfloat32mf2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmsub_vf_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                                float rs1, vfloat32mf2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmsub_vv_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                              vfloat32m1_t vs1,
                                              vfloat32m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmsub_vf_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                              float rs1, vfloat32m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmsub_vv_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                              vfloat32m2_t vs1,
                                              vfloat32m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmsub_vf_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                              float rs1, vfloat32m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmsub_vv_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                              vfloat32m4_t vs1,
                                              vfloat32m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmsub_vf_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                              float rs1, vfloat32m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmsub_vv_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                              vfloat32m8_t vs1,
                                              vfloat32m8_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmsub_vf_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                              float rs1, vfloat32m8_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmsub_vv_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                              vfloat64m1_t vs1,
                                              vfloat64m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmsub_vf_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                              double rs1, vfloat64m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmsub_vv_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                              vfloat64m2_t vs1,
                                              vfloat64m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmsub_vf_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                              double rs1, vfloat64m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmsub_vv_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                              vfloat64m4_t vs1,
                                              vfloat64m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmsub_vf_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                              double rs1, vfloat64m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmsub_vv_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                              vfloat64m8_t vs1,
                                              vfloat64m8_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmsub_vf_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                              double rs1, vfloat64m8_t vs2,
                                              unsigned int frm, size_t vl);
// masked functions
// __riscv_vfmacc_{vv,vf}_<type>_rm_mu: one _vv/_vf pair per float vector type,
// f16mf4 through f64m8.
//   vm        - mask; its vboolN_t type is tied to the data type (e.g.
//               vbool64_t for f16mf4, vbool2_t for f16m8, vbool8_t for f64m8).
//   vd        - same type as the return value.
//   vs1 / rs1 - _vv takes a vector of the data type; _vf takes a scalar of the
//               element type (_Float16, float or double).
//   vs2       - vector of the data type.
//   frm       - NOTE(review): presumably the rounding-mode selector implied by
//               the _rm suffix; confirm against the RVV intrinsics spec.
//   vl        - NOTE(review): presumably the element count to process; confirm.
vfloat16mf4_t __riscv_vfmacc_vv_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                             vfloat16mf4_t vs1,
                                             vfloat16mf4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmacc_vf_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                             _Float16 rs1, vfloat16mf4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmacc_vv_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                             vfloat16mf2_t vs1,
                                             vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmacc_vf_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                             _Float16 rs1, vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmacc_vv_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                           vfloat16m1_t vs1, vfloat16m1_t vs2,
                                           unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmacc_vf_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                           _Float16 rs1, vfloat16m1_t vs2,
                                           unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmacc_vv_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                           vfloat16m2_t vs1, vfloat16m2_t vs2,
                                           unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmacc_vf_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                           _Float16 rs1, vfloat16m2_t vs2,
                                           unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmacc_vv_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                           vfloat16m4_t vs1, vfloat16m4_t vs2,
                                           unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmacc_vf_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                           _Float16 rs1, vfloat16m4_t vs2,
                                           unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmacc_vv_f16m8_rm_mu(vbool2_t vm, vfloat16m8_t vd,
                                           vfloat16m8_t vs1, vfloat16m8_t vs2,
                                           unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmacc_vf_f16m8_rm_mu(vbool2_t vm, vfloat16m8_t vd,
                                           _Float16 rs1, vfloat16m8_t vs2,
                                           unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmacc_vv_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat32mf2_t vs1,
                                             vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmacc_vf_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                             float rs1, vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmacc_vv_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat32m1_t vs1, vfloat32m1_t vs2,
                                           unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmacc_vf_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                           float rs1, vfloat32m1_t vs2,
                                           unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmacc_vv_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat32m2_t vs1, vfloat32m2_t vs2,
                                           unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmacc_vf_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                           float rs1, vfloat32m2_t vs2,
                                           unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmacc_vv_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat32m4_t vs1, vfloat32m4_t vs2,
                                           unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmacc_vf_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                           float rs1, vfloat32m4_t vs2,
                                           unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmacc_vv_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat32m8_t vs1, vfloat32m8_t vs2,
                                           unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmacc_vf_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                           float rs1, vfloat32m8_t vs2,
                                           unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmacc_vv_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat64m1_t vs1, vfloat64m1_t vs2,
                                           unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmacc_vf_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                           double rs1, vfloat64m1_t vs2,
                                           unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmacc_vv_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat64m2_t vs1, vfloat64m2_t vs2,
                                           unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmacc_vf_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                           double rs1, vfloat64m2_t vs2,
                                           unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmacc_vv_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat64m4_t vs1, vfloat64m4_t vs2,
                                           unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmacc_vf_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                           double rs1, vfloat64m4_t vs2,
                                           unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmacc_vv_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat64m8_t vs1, vfloat64m8_t vs2,
                                           unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmacc_vf_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                           double rs1, vfloat64m8_t vs2,
                                           unsigned int frm, size_t vl);
// __riscv_vfnmacc_{vv,vf}_<type>_rm_mu: one _vv/_vf pair per float vector
// type, f16mf4 through f64m8.
//   vm        - mask; its vboolN_t type is tied to the data type (e.g.
//               vbool64_t for f16mf4, vbool2_t for f16m8, vbool8_t for f64m8).
//   vd        - same type as the return value.
//   vs1 / rs1 - _vv takes a vector of the data type; _vf takes a scalar of the
//               element type (_Float16, float or double).
//   vs2       - vector of the data type.
//   frm       - NOTE(review): presumably the rounding-mode selector implied by
//               the _rm suffix; confirm against the RVV intrinsics spec.
//   vl        - NOTE(review): presumably the element count to process; confirm.
vfloat16mf4_t __riscv_vfnmacc_vv_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                              vfloat16mf4_t vs1,
                                              vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfnmacc_vf_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                              _Float16 rs1, vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmacc_vv_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                              vfloat16mf2_t vs1,
                                              vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmacc_vf_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                              _Float16 rs1, vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmacc_vv_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                            vfloat16m1_t vs1, vfloat16m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmacc_vf_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                            _Float16 rs1, vfloat16m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmacc_vv_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                            vfloat16m2_t vs1, vfloat16m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmacc_vf_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                            _Float16 rs1, vfloat16m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmacc_vv_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                            vfloat16m4_t vs1, vfloat16m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmacc_vf_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                            _Float16 rs1, vfloat16m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmacc_vv_f16m8_rm_mu(vbool2_t vm, vfloat16m8_t vd,
                                            vfloat16m8_t vs1, vfloat16m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmacc_vf_f16m8_rm_mu(vbool2_t vm, vfloat16m8_t vd,
                                            _Float16 rs1, vfloat16m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmacc_vv_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat32mf2_t vs1,
                                              vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmacc_vf_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                              float rs1, vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmacc_vv_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat32m1_t vs1, vfloat32m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmacc_vf_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                            float rs1, vfloat32m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmacc_vv_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat32m2_t vs1, vfloat32m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmacc_vf_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                            float rs1, vfloat32m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmacc_vv_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat32m4_t vs1, vfloat32m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmacc_vf_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                            float rs1, vfloat32m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmacc_vv_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat32m8_t vs1, vfloat32m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmacc_vf_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                            float rs1, vfloat32m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmacc_vv_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat64m1_t vs1, vfloat64m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmacc_vf_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                            double rs1, vfloat64m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmacc_vv_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat64m2_t vs1, vfloat64m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmacc_vf_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                            double rs1, vfloat64m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmacc_vv_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat64m4_t vs1, vfloat64m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmacc_vf_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                            double rs1, vfloat64m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmacc_vv_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat64m8_t vs1, vfloat64m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmacc_vf_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                            double rs1, vfloat64m8_t vs2,
                                            unsigned int frm, size_t vl);
// __riscv_vfmsac_{vv,vf}_<type>_rm_mu: one _vv/_vf pair per float vector type,
// f16mf4 through f64m8.
//   vm        - mask; its vboolN_t type is tied to the data type (e.g.
//               vbool64_t for f16mf4, vbool2_t for f16m8, vbool8_t for f64m8).
//   vd        - same type as the return value.
//   vs1 / rs1 - _vv takes a vector of the data type; _vf takes a scalar of the
//               element type (_Float16, float or double).
//   vs2       - vector of the data type.
//   frm       - NOTE(review): presumably the rounding-mode selector implied by
//               the _rm suffix; confirm against the RVV intrinsics spec.
//   vl        - NOTE(review): presumably the element count to process; confirm.
vfloat16mf4_t __riscv_vfmsac_vv_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                             vfloat16mf4_t vs1,
                                             vfloat16mf4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmsac_vf_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                             _Float16 rs1, vfloat16mf4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmsac_vv_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                             vfloat16mf2_t vs1,
                                             vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmsac_vf_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                             _Float16 rs1, vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmsac_vv_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                           vfloat16m1_t vs1, vfloat16m1_t vs2,
                                           unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmsac_vf_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                           _Float16 rs1, vfloat16m1_t vs2,
                                           unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmsac_vv_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                           vfloat16m2_t vs1, vfloat16m2_t vs2,
                                           unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmsac_vf_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                           _Float16 rs1, vfloat16m2_t vs2,
                                           unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmsac_vv_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                           vfloat16m4_t vs1, vfloat16m4_t vs2,
                                           unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmsac_vf_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                           _Float16 rs1, vfloat16m4_t vs2,
                                           unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmsac_vv_f16m8_rm_mu(vbool2_t vm, vfloat16m8_t vd,
                                           vfloat16m8_t vs1, vfloat16m8_t vs2,
                                           unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmsac_vf_f16m8_rm_mu(vbool2_t vm, vfloat16m8_t vd,
                                           _Float16 rs1, vfloat16m8_t vs2,
                                           unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmsac_vv_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat32mf2_t vs1,
                                             vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmsac_vf_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                             float rs1, vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmsac_vv_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat32m1_t vs1, vfloat32m1_t vs2,
                                           unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmsac_vf_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                           float rs1, vfloat32m1_t vs2,
                                           unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmsac_vv_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat32m2_t vs1, vfloat32m2_t vs2,
                                           unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmsac_vf_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                           float rs1, vfloat32m2_t vs2,
                                           unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmsac_vv_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat32m4_t vs1, vfloat32m4_t vs2,
                                           unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmsac_vf_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                           float rs1, vfloat32m4_t vs2,
                                           unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmsac_vv_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat32m8_t vs1, vfloat32m8_t vs2,
                                           unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmsac_vf_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                           float rs1, vfloat32m8_t vs2,
                                           unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmsac_vv_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat64m1_t vs1, vfloat64m1_t vs2,
                                           unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmsac_vf_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                           double rs1, vfloat64m1_t vs2,
                                           unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmsac_vv_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat64m2_t vs1, vfloat64m2_t vs2,
                                           unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmsac_vf_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                           double rs1, vfloat64m2_t vs2,
                                           unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmsac_vv_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat64m4_t vs1, vfloat64m4_t vs2,
                                           unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmsac_vf_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                           double rs1, vfloat64m4_t vs2,
                                           unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmsac_vv_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat64m8_t vs1, vfloat64m8_t vs2,
                                           unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmsac_vf_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                           double rs1, vfloat64m8_t vs2,
                                           unsigned int frm, size_t vl);
// __riscv_vfnmsac_{vv,vf}_<type>_rm_mu: one _vv/_vf pair per float vector
// type, f16mf4 through f64m8.
//   vm        - mask; its vboolN_t type is tied to the data type (e.g.
//               vbool64_t for f16mf4, vbool2_t for f16m8, vbool8_t for f64m8).
//   vd        - same type as the return value.
//   vs1 / rs1 - _vv takes a vector of the data type; _vf takes a scalar of the
//               element type (_Float16, float or double).
//   vs2       - vector of the data type.
//   frm       - NOTE(review): presumably the rounding-mode selector implied by
//               the _rm suffix; confirm against the RVV intrinsics spec.
//   vl        - NOTE(review): presumably the element count to process; confirm.
vfloat16mf4_t __riscv_vfnmsac_vv_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                              vfloat16mf4_t vs1,
                                              vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfnmsac_vf_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                              _Float16 rs1, vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmsac_vv_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                              vfloat16mf2_t vs1,
                                              vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmsac_vf_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                              _Float16 rs1, vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmsac_vv_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                            vfloat16m1_t vs1, vfloat16m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmsac_vf_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                            _Float16 rs1, vfloat16m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmsac_vv_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                            vfloat16m2_t vs1, vfloat16m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmsac_vf_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                            _Float16 rs1, vfloat16m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmsac_vv_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                            vfloat16m4_t vs1, vfloat16m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmsac_vf_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                            _Float16 rs1, vfloat16m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmsac_vv_f16m8_rm_mu(vbool2_t vm, vfloat16m8_t vd,
                                            vfloat16m8_t vs1, vfloat16m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmsac_vf_f16m8_rm_mu(vbool2_t vm, vfloat16m8_t vd,
                                            _Float16 rs1, vfloat16m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmsac_vv_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat32mf2_t vs1,
                                              vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmsac_vf_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                              float rs1, vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmsac_vv_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat32m1_t vs1, vfloat32m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmsac_vf_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                            float rs1, vfloat32m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmsac_vv_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat32m2_t vs1, vfloat32m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmsac_vf_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                            float rs1, vfloat32m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmsac_vv_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat32m4_t vs1, vfloat32m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmsac_vf_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                            float rs1, vfloat32m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmsac_vv_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat32m8_t vs1, vfloat32m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmsac_vf_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                            float rs1, vfloat32m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmsac_vv_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat64m1_t vs1, vfloat64m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmsac_vf_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                            double rs1, vfloat64m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmsac_vv_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat64m2_t vs1, vfloat64m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmsac_vf_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                            double rs1, vfloat64m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmsac_vv_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat64m4_t vs1, vfloat64m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmsac_vf_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                            double rs1, vfloat64m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmsac_vv_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat64m8_t vs1, vfloat64m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmsac_vf_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                            double rs1, vfloat64m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmadd_vv_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                             vfloat16mf4_t vs1,
                                             vfloat16mf4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmadd_vf_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                             _Float16 rs1, vfloat16mf4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmadd_vv_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                             vfloat16mf2_t vs1,
                                             vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmadd_vf_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                             _Float16 rs1, vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmadd_vv_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                           vfloat16m1_t vs1, vfloat16m1_t vs2,
                                           unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmadd_vf_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                           _Float16 rs1, vfloat16m1_t vs2,
                                           unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmadd_vv_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                           vfloat16m2_t vs1, vfloat16m2_t vs2,
                                           unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmadd_vf_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                           _Float16 rs1, vfloat16m2_t vs2,
                                           unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmadd_vv_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                           vfloat16m4_t vs1, vfloat16m4_t vs2,
                                           unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmadd_vf_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                           _Float16 rs1, vfloat16m4_t vs2,
                                           unsigned int frm, size_t vl);
// __riscv_vfmadd_{vv,vf}_*_rm_mu, f16m8 through f64m8: masked fused
// multiply-add taking an explicit rounding-mode operand `frm`.
// Per the RVV spec, vfmadd computes vd[i] = (vs1[i] * vd[i]) + vs2[i]; the
// _vf forms take the scalar `rs1` in place of vs1[i].
// `vm` is the mask (vboolN_t, with N matching the SEW/LMUL ratio of the data
// type), `vl` is the element count, and the result has the same type as `vd`.
// Per the intrinsic naming scheme, `_mu` selects the mask-undisturbed policy
// (masked-off elements keep their value from `vd`).
vfloat16m8_t __riscv_vfmadd_vv_f16m8_rm_mu(vbool2_t vm, vfloat16m8_t vd,
                                           vfloat16m8_t vs1, vfloat16m8_t vs2,
                                           unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmadd_vf_f16m8_rm_mu(vbool2_t vm, vfloat16m8_t vd,
                                           _Float16 rs1, vfloat16m8_t vs2,
                                           unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmadd_vv_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat32mf2_t vs1,
                                             vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmadd_vf_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                             float rs1, vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmadd_vv_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat32m1_t vs1, vfloat32m1_t vs2,
                                           unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmadd_vf_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                           float rs1, vfloat32m1_t vs2,
                                           unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmadd_vv_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat32m2_t vs1, vfloat32m2_t vs2,
                                           unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmadd_vf_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                           float rs1, vfloat32m2_t vs2,
                                           unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmadd_vv_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat32m4_t vs1, vfloat32m4_t vs2,
                                           unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmadd_vf_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                           float rs1, vfloat32m4_t vs2,
                                           unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmadd_vv_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat32m8_t vs1, vfloat32m8_t vs2,
                                           unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmadd_vf_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                           float rs1, vfloat32m8_t vs2,
                                           unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmadd_vv_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat64m1_t vs1, vfloat64m1_t vs2,
                                           unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmadd_vf_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                           double rs1, vfloat64m1_t vs2,
                                           unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmadd_vv_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat64m2_t vs1, vfloat64m2_t vs2,
                                           unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmadd_vf_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                           double rs1, vfloat64m2_t vs2,
                                           unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmadd_vv_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat64m4_t vs1, vfloat64m4_t vs2,
                                           unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmadd_vf_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                           double rs1, vfloat64m4_t vs2,
                                           unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmadd_vv_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat64m8_t vs1, vfloat64m8_t vs2,
                                           unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmadd_vf_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                           double rs1, vfloat64m8_t vs2,
                                           unsigned int frm, size_t vl);
// __riscv_vfnmadd_{vv,vf}_*_rm_mu: masked negated fused multiply-add taking an
// explicit rounding-mode operand `frm`, for every f16/f32/f64 LMUL.
// Per the RVV spec, vfnmadd computes vd[i] = -(vs1[i] * vd[i]) - vs2[i]; the
// _vf forms take the scalar `rs1` in place of vs1[i].
// `vm` is the mask (vboolN_t, with N matching the SEW/LMUL ratio of the data
// type), `vl` is the element count, and the result has the same type as `vd`.
// Per the intrinsic naming scheme, `_mu` selects the mask-undisturbed policy
// (masked-off elements keep their value from `vd`).
vfloat16mf4_t __riscv_vfnmadd_vv_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                              vfloat16mf4_t vs1,
                                              vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfnmadd_vf_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                              _Float16 rs1, vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmadd_vv_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                              vfloat16mf2_t vs1,
                                              vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmadd_vf_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                              _Float16 rs1, vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmadd_vv_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                            vfloat16m1_t vs1, vfloat16m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmadd_vf_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                            _Float16 rs1, vfloat16m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmadd_vv_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                            vfloat16m2_t vs1, vfloat16m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmadd_vf_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                            _Float16 rs1, vfloat16m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmadd_vv_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                            vfloat16m4_t vs1, vfloat16m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmadd_vf_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                            _Float16 rs1, vfloat16m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmadd_vv_f16m8_rm_mu(vbool2_t vm, vfloat16m8_t vd,
                                            vfloat16m8_t vs1, vfloat16m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmadd_vf_f16m8_rm_mu(vbool2_t vm, vfloat16m8_t vd,
                                            _Float16 rs1, vfloat16m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmadd_vv_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat32mf2_t vs1,
                                              vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmadd_vf_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                              float rs1, vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmadd_vv_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat32m1_t vs1, vfloat32m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmadd_vf_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                            float rs1, vfloat32m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmadd_vv_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat32m2_t vs1, vfloat32m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmadd_vf_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                            float rs1, vfloat32m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmadd_vv_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat32m4_t vs1, vfloat32m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmadd_vf_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                            float rs1, vfloat32m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmadd_vv_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat32m8_t vs1, vfloat32m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmadd_vf_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                            float rs1, vfloat32m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmadd_vv_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat64m1_t vs1, vfloat64m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmadd_vf_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                            double rs1, vfloat64m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmadd_vv_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat64m2_t vs1, vfloat64m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmadd_vf_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                            double rs1, vfloat64m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmadd_vv_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat64m4_t vs1, vfloat64m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmadd_vf_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                            double rs1, vfloat64m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmadd_vv_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat64m8_t vs1, vfloat64m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmadd_vf_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                            double rs1, vfloat64m8_t vs2,
                                            unsigned int frm, size_t vl);
// __riscv_vfmsub_{vv,vf}_*_rm_mu: masked fused multiply-subtract taking an
// explicit rounding-mode operand `frm`, for every f16/f32/f64 LMUL.
// Per the RVV spec, vfmsub computes vd[i] = (vs1[i] * vd[i]) - vs2[i]; the
// _vf forms take the scalar `rs1` in place of vs1[i].
// `vm` is the mask (vboolN_t, with N matching the SEW/LMUL ratio of the data
// type), `vl` is the element count, and the result has the same type as `vd`.
// Per the intrinsic naming scheme, `_mu` selects the mask-undisturbed policy
// (masked-off elements keep their value from `vd`).
vfloat16mf4_t __riscv_vfmsub_vv_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                             vfloat16mf4_t vs1,
                                             vfloat16mf4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmsub_vf_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                             _Float16 rs1, vfloat16mf4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmsub_vv_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                             vfloat16mf2_t vs1,
                                             vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmsub_vf_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                             _Float16 rs1, vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmsub_vv_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                           vfloat16m1_t vs1, vfloat16m1_t vs2,
                                           unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmsub_vf_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                           _Float16 rs1, vfloat16m1_t vs2,
                                           unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmsub_vv_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                           vfloat16m2_t vs1, vfloat16m2_t vs2,
                                           unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmsub_vf_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                           _Float16 rs1, vfloat16m2_t vs2,
                                           unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmsub_vv_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                           vfloat16m4_t vs1, vfloat16m4_t vs2,
                                           unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmsub_vf_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                           _Float16 rs1, vfloat16m4_t vs2,
                                           unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmsub_vv_f16m8_rm_mu(vbool2_t vm, vfloat16m8_t vd,
                                           vfloat16m8_t vs1, vfloat16m8_t vs2,
                                           unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmsub_vf_f16m8_rm_mu(vbool2_t vm, vfloat16m8_t vd,
                                           _Float16 rs1, vfloat16m8_t vs2,
                                           unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmsub_vv_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat32mf2_t vs1,
                                             vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmsub_vf_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                             float rs1, vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmsub_vv_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat32m1_t vs1, vfloat32m1_t vs2,
                                           unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmsub_vf_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                           float rs1, vfloat32m1_t vs2,
                                           unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmsub_vv_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat32m2_t vs1, vfloat32m2_t vs2,
                                           unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmsub_vf_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                           float rs1, vfloat32m2_t vs2,
                                           unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmsub_vv_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat32m4_t vs1, vfloat32m4_t vs2,
                                           unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmsub_vf_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                           float rs1, vfloat32m4_t vs2,
                                           unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmsub_vv_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat32m8_t vs1, vfloat32m8_t vs2,
                                           unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmsub_vf_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                           float rs1, vfloat32m8_t vs2,
                                           unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmsub_vv_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat64m1_t vs1, vfloat64m1_t vs2,
                                           unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmsub_vf_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                           double rs1, vfloat64m1_t vs2,
                                           unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmsub_vv_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat64m2_t vs1, vfloat64m2_t vs2,
                                           unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmsub_vf_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                           double rs1, vfloat64m2_t vs2,
                                           unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmsub_vv_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat64m4_t vs1, vfloat64m4_t vs2,
                                           unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmsub_vf_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                           double rs1, vfloat64m4_t vs2,
                                           unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmsub_vv_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat64m8_t vs1, vfloat64m8_t vs2,
                                           unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmsub_vf_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                           double rs1, vfloat64m8_t vs2,
                                           unsigned int frm, size_t vl);
// __riscv_vfnmsub_{vv,vf}_*_rm_mu: masked negated fused multiply-subtract
// taking an explicit rounding-mode operand `frm`, for every f16/f32/f64 LMUL.
// Per the RVV spec, vfnmsub computes vd[i] = -(vs1[i] * vd[i]) + vs2[i]; the
// _vf forms take the scalar `rs1` in place of vs1[i].
// `vm` is the mask (vboolN_t, with N matching the SEW/LMUL ratio of the data
// type), `vl` is the element count, and the result has the same type as `vd`.
// Per the intrinsic naming scheme, `_mu` selects the mask-undisturbed policy
// (masked-off elements keep their value from `vd`).
vfloat16mf4_t __riscv_vfnmsub_vv_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                              vfloat16mf4_t vs1,
                                              vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfnmsub_vf_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                              _Float16 rs1, vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmsub_vv_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                              vfloat16mf2_t vs1,
                                              vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmsub_vf_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                              _Float16 rs1, vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmsub_vv_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                            vfloat16m1_t vs1, vfloat16m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmsub_vf_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                            _Float16 rs1, vfloat16m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmsub_vv_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                            vfloat16m2_t vs1, vfloat16m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmsub_vf_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                            _Float16 rs1, vfloat16m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmsub_vv_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                            vfloat16m4_t vs1, vfloat16m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmsub_vf_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                            _Float16 rs1, vfloat16m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmsub_vv_f16m8_rm_mu(vbool2_t vm, vfloat16m8_t vd,
                                            vfloat16m8_t vs1, vfloat16m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmsub_vf_f16m8_rm_mu(vbool2_t vm, vfloat16m8_t vd,
                                            _Float16 rs1, vfloat16m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmsub_vv_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat32mf2_t vs1,
                                              vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmsub_vf_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                              float rs1, vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmsub_vv_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat32m1_t vs1, vfloat32m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmsub_vf_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                            float rs1, vfloat32m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmsub_vv_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat32m2_t vs1, vfloat32m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmsub_vf_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                            float rs1, vfloat32m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmsub_vv_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat32m4_t vs1, vfloat32m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmsub_vf_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                            float rs1, vfloat32m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmsub_vv_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat32m8_t vs1, vfloat32m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmsub_vf_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                            float rs1, vfloat32m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmsub_vv_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat64m1_t vs1, vfloat64m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmsub_vf_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                            double rs1, vfloat64m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmsub_vv_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat64m2_t vs1, vfloat64m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmsub_vf_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                            double rs1, vfloat64m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmsub_vv_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat64m4_t vs1, vfloat64m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmsub_vf_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                            double rs1, vfloat64m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmsub_vv_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat64m8_t vs1, vfloat64m8_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmsub_vf_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                            double rs1, vfloat64m8_t vs2,
                                            unsigned int frm, size_t vl);

Vector Widening Floating-Point Fused Multiply-Add Intrinsics

// __riscv_vfwmacc_{vv,vf}_*_tu: unmasked widening fused multiply-accumulate.
// The multiplicands `vs1`/`vs2` are f16 (or f32) and the accumulator/result
// `vd` is f32 (or f64) at twice the source LMUL.
// Per the RVV spec, vfwmacc computes vd[i] = (vs1[i] * vs2[i]) + vd[i]; the
// _vf forms take a scalar first multiplicand instead of a vector.
// `vl` is the element count. Per the intrinsic naming scheme, `_tu` selects
// the tail-undisturbed policy (elements past `vl` keep their value from `vd`).
// NOTE(review): the _vf scalar operand is named `vs1` here, while the
// single-width _vf prototypes in this file name it `rs1`. Parameter names do
// not affect callers; confirm with the generator whether this is intended.
vfloat32mf2_t __riscv_vfwmacc_vv_f32mf2_tu(vfloat32mf2_t vd, vfloat16mf4_t vs1,
                                           vfloat16mf4_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfwmacc_vf_f32mf2_tu(vfloat32mf2_t vd, _Float16 vs1,
                                           vfloat16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwmacc_vv_f32m1_tu(vfloat32m1_t vd, vfloat16mf2_t vs1,
                                         vfloat16mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwmacc_vf_f32m1_tu(vfloat32m1_t vd, _Float16 vs1,
                                         vfloat16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwmacc_vv_f32m2_tu(vfloat32m2_t vd, vfloat16m1_t vs1,
                                         vfloat16m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwmacc_vf_f32m2_tu(vfloat32m2_t vd, _Float16 vs1,
                                         vfloat16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwmacc_vv_f32m4_tu(vfloat32m4_t vd, vfloat16m2_t vs1,
                                         vfloat16m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwmacc_vf_f32m4_tu(vfloat32m4_t vd, _Float16 vs1,
                                         vfloat16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwmacc_vv_f32m8_tu(vfloat32m8_t vd, vfloat16m4_t vs1,
                                         vfloat16m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwmacc_vf_f32m8_tu(vfloat32m8_t vd, _Float16 vs1,
                                         vfloat16m4_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwmacc_vv_f64m1_tu(vfloat64m1_t vd, vfloat32mf2_t vs1,
                                         vfloat32mf2_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwmacc_vf_f64m1_tu(vfloat64m1_t vd, float vs1,
                                         vfloat32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwmacc_vv_f64m2_tu(vfloat64m2_t vd, vfloat32m1_t vs1,
                                         vfloat32m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwmacc_vf_f64m2_tu(vfloat64m2_t vd, float vs1,
                                         vfloat32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwmacc_vv_f64m4_tu(vfloat64m4_t vd, vfloat32m2_t vs1,
                                         vfloat32m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwmacc_vf_f64m4_tu(vfloat64m4_t vd, float vs1,
                                         vfloat32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwmacc_vv_f64m8_tu(vfloat64m8_t vd, vfloat32m4_t vs1,
                                         vfloat32m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwmacc_vf_f64m8_tu(vfloat64m8_t vd, float vs1,
                                         vfloat32m4_t vs2, size_t vl);
// __riscv_vfwnmacc_{vv,vf}_*_tu: unmasked widening negated fused
// multiply-accumulate. The multiplicands `vs1`/`vs2` are f16 (or f32) and the
// accumulator/result `vd` is f32 (or f64) at twice the source LMUL.
// Per the RVV spec, vfwnmacc computes vd[i] = -(vs1[i] * vs2[i]) - vd[i]; the
// _vf forms take a scalar first multiplicand instead of a vector.
// `vl` is the element count. Per the intrinsic naming scheme, `_tu` selects
// the tail-undisturbed policy (elements past `vl` keep their value from `vd`).
// NOTE(review): the _vf scalar operand is named `vs1` here, while the
// single-width _vf prototypes in this file name it `rs1`. Parameter names do
// not affect callers; confirm with the generator whether this is intended.
vfloat32mf2_t __riscv_vfwnmacc_vv_f32mf2_tu(vfloat32mf2_t vd, vfloat16mf4_t vs1,
                                            vfloat16mf4_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfwnmacc_vf_f32mf2_tu(vfloat32mf2_t vd, _Float16 vs1,
                                            vfloat16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwnmacc_vv_f32m1_tu(vfloat32m1_t vd, vfloat16mf2_t vs1,
                                          vfloat16mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwnmacc_vf_f32m1_tu(vfloat32m1_t vd, _Float16 vs1,
                                          vfloat16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwnmacc_vv_f32m2_tu(vfloat32m2_t vd, vfloat16m1_t vs1,
                                          vfloat16m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwnmacc_vf_f32m2_tu(vfloat32m2_t vd, _Float16 vs1,
                                          vfloat16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwnmacc_vv_f32m4_tu(vfloat32m4_t vd, vfloat16m2_t vs1,
                                          vfloat16m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwnmacc_vf_f32m4_tu(vfloat32m4_t vd, _Float16 vs1,
                                          vfloat16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwnmacc_vv_f32m8_tu(vfloat32m8_t vd, vfloat16m4_t vs1,
                                          vfloat16m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwnmacc_vf_f32m8_tu(vfloat32m8_t vd, _Float16 vs1,
                                          vfloat16m4_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwnmacc_vv_f64m1_tu(vfloat64m1_t vd, vfloat32mf2_t vs1,
                                          vfloat32mf2_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwnmacc_vf_f64m1_tu(vfloat64m1_t vd, float vs1,
                                          vfloat32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwnmacc_vv_f64m2_tu(vfloat64m2_t vd, vfloat32m1_t vs1,
                                          vfloat32m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwnmacc_vf_f64m2_tu(vfloat64m2_t vd, float vs1,
                                          vfloat32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwnmacc_vv_f64m4_tu(vfloat64m4_t vd, vfloat32m2_t vs1,
                                          vfloat32m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwnmacc_vf_f64m4_tu(vfloat64m4_t vd, float vs1,
                                          vfloat32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwnmacc_vv_f64m8_tu(vfloat64m8_t vd, vfloat32m4_t vs1,
                                          vfloat32m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwnmacc_vf_f64m8_tu(vfloat64m8_t vd, float vs1,
                                          vfloat32m4_t vs2, size_t vl);
// __riscv_vfwmsac_{vv,vf}_*_tu: unmasked widening fused multiply-subtract-
// accumulator. The multiplicands `vs1`/`vs2` are f16 (or f32) and the
// accumulator/result `vd` is f32 (or f64) at twice the source LMUL.
// Per the RVV spec, vfwmsac computes vd[i] = (vs1[i] * vs2[i]) - vd[i]; the
// _vf forms take a scalar first multiplicand instead of a vector.
// `vl` is the element count. Per the intrinsic naming scheme, `_tu` selects
// the tail-undisturbed policy (elements past `vl` keep their value from `vd`).
// NOTE(review): the _vf scalar operand is named `vs1` here, while the
// single-width _vf prototypes in this file name it `rs1`. Parameter names do
// not affect callers; confirm with the generator whether this is intended.
vfloat32mf2_t __riscv_vfwmsac_vv_f32mf2_tu(vfloat32mf2_t vd, vfloat16mf4_t vs1,
                                           vfloat16mf4_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfwmsac_vf_f32mf2_tu(vfloat32mf2_t vd, _Float16 vs1,
                                           vfloat16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwmsac_vv_f32m1_tu(vfloat32m1_t vd, vfloat16mf2_t vs1,
                                         vfloat16mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwmsac_vf_f32m1_tu(vfloat32m1_t vd, _Float16 vs1,
                                         vfloat16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwmsac_vv_f32m2_tu(vfloat32m2_t vd, vfloat16m1_t vs1,
                                         vfloat16m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwmsac_vf_f32m2_tu(vfloat32m2_t vd, _Float16 vs1,
                                         vfloat16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwmsac_vv_f32m4_tu(vfloat32m4_t vd, vfloat16m2_t vs1,
                                         vfloat16m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwmsac_vf_f32m4_tu(vfloat32m4_t vd, _Float16 vs1,
                                         vfloat16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwmsac_vv_f32m8_tu(vfloat32m8_t vd, vfloat16m4_t vs1,
                                         vfloat16m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwmsac_vf_f32m8_tu(vfloat32m8_t vd, _Float16 vs1,
                                         vfloat16m4_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwmsac_vv_f64m1_tu(vfloat64m1_t vd, vfloat32mf2_t vs1,
                                         vfloat32mf2_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwmsac_vf_f64m1_tu(vfloat64m1_t vd, float vs1,
                                         vfloat32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwmsac_vv_f64m2_tu(vfloat64m2_t vd, vfloat32m1_t vs1,
                                         vfloat32m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwmsac_vf_f64m2_tu(vfloat64m2_t vd, float vs1,
                                         vfloat32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwmsac_vv_f64m4_tu(vfloat64m4_t vd, vfloat32m2_t vs1,
                                         vfloat32m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwmsac_vf_f64m4_tu(vfloat64m4_t vd, float vs1,
                                         vfloat32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwmsac_vv_f64m8_tu(vfloat64m8_t vd, vfloat32m4_t vs1,
                                         vfloat32m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwmsac_vf_f64m8_tu(vfloat64m8_t vd, float vs1,
                                         vfloat32m4_t vs2, size_t vl);
// __riscv_vfwnmsac_{vv,vf}_*_tu: unmasked widening negated fused
// multiply-subtract-accumulator. The multiplicands `vs1`/`vs2` are f16 (or
// f32) and the accumulator/result `vd` is f32 (or f64) at twice the source
// LMUL.
// Per the RVV spec, vfwnmsac computes vd[i] = -(vs1[i] * vs2[i]) + vd[i]; the
// _vf forms take a scalar first multiplicand instead of a vector.
// `vl` is the element count. Per the intrinsic naming scheme, `_tu` selects
// the tail-undisturbed policy (elements past `vl` keep their value from `vd`).
// NOTE(review): the _vf scalar operand is named `vs1` here, while the
// single-width _vf prototypes in this file name it `rs1`. Parameter names do
// not affect callers; confirm with the generator whether this is intended.
vfloat32mf2_t __riscv_vfwnmsac_vv_f32mf2_tu(vfloat32mf2_t vd, vfloat16mf4_t vs1,
                                            vfloat16mf4_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfwnmsac_vf_f32mf2_tu(vfloat32mf2_t vd, _Float16 vs1,
                                            vfloat16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwnmsac_vv_f32m1_tu(vfloat32m1_t vd, vfloat16mf2_t vs1,
                                          vfloat16mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwnmsac_vf_f32m1_tu(vfloat32m1_t vd, _Float16 vs1,
                                          vfloat16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwnmsac_vv_f32m2_tu(vfloat32m2_t vd, vfloat16m1_t vs1,
                                          vfloat16m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwnmsac_vf_f32m2_tu(vfloat32m2_t vd, _Float16 vs1,
                                          vfloat16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwnmsac_vv_f32m4_tu(vfloat32m4_t vd, vfloat16m2_t vs1,
                                          vfloat16m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwnmsac_vf_f32m4_tu(vfloat32m4_t vd, _Float16 vs1,
                                          vfloat16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwnmsac_vv_f32m8_tu(vfloat32m8_t vd, vfloat16m4_t vs1,
                                          vfloat16m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwnmsac_vf_f32m8_tu(vfloat32m8_t vd, _Float16 vs1,
                                          vfloat16m4_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwnmsac_vv_f64m1_tu(vfloat64m1_t vd, vfloat32mf2_t vs1,
                                          vfloat32mf2_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwnmsac_vf_f64m1_tu(vfloat64m1_t vd, float vs1,
                                          vfloat32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwnmsac_vv_f64m2_tu(vfloat64m2_t vd, vfloat32m1_t vs1,
                                          vfloat32m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwnmsac_vf_f64m2_tu(vfloat64m2_t vd, float vs1,
                                          vfloat32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwnmsac_vv_f64m4_tu(vfloat64m4_t vd, vfloat32m2_t vs1,
                                          vfloat32m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwnmsac_vf_f64m4_tu(vfloat64m4_t vd, float vs1,
                                          vfloat32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwnmsac_vv_f64m8_tu(vfloat64m8_t vd, vfloat32m4_t vs1,
                                          vfloat32m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwnmsac_vf_f64m8_tu(vfloat64m8_t vd, float vs1,
                                          vfloat32m4_t vs2, size_t vl);
// masked functions: _tum policy variants
// __riscv_vfwmacc, masked `_tum` variants for every f32 and f64 result type.
// vm is a vboolN_t mask where N is vd's element width divided by its LMUL
// (f32mf2 -> vbool64_t ... f32m8 -> vbool4_t). vd is passed in and has the
// same type as the return value; its elements are twice as wide as those of
// the sources (f16 -> f32, f32 -> f64). `_vv` takes two source vectors; `_vf`
// takes a scalar (_Float16 or float) as vs1.
// NOTE(review): per the RVV spec vfwmacc should compute
// vd[i] = +(vs1[i] * vs2[i]) + vd[i], and `_tum` should mean tail-undisturbed,
// mask-agnostic; confirm against the specification.
// NOTE(review): the `_vf` scalar operand is named vs1 here, whereas other `_vf`
// prototypes in this file (e.g. __riscv_vfadd_vf_*) name it rs1.
vfloat32mf2_t __riscv_vfwmacc_vv_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat16mf4_t vs1,
                                            vfloat16mf4_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfwmacc_vf_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                            _Float16 vs1, vfloat16mf4_t vs2,
                                            size_t vl);
vfloat32m1_t __riscv_vfwmacc_vv_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                          size_t vl);
vfloat32m1_t __riscv_vfwmacc_vf_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                          _Float16 vs1, vfloat16mf2_t vs2,
                                          size_t vl);
vfloat32m2_t __riscv_vfwmacc_vv_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat16m1_t vs1, vfloat16m1_t vs2,
                                          size_t vl);
vfloat32m2_t __riscv_vfwmacc_vf_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                          _Float16 vs1, vfloat16m1_t vs2,
                                          size_t vl);
vfloat32m4_t __riscv_vfwmacc_vv_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat16m2_t vs1, vfloat16m2_t vs2,
                                          size_t vl);
vfloat32m4_t __riscv_vfwmacc_vf_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                          _Float16 vs1, vfloat16m2_t vs2,
                                          size_t vl);
vfloat32m8_t __riscv_vfwmacc_vv_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat16m4_t vs1, vfloat16m4_t vs2,
                                          size_t vl);
vfloat32m8_t __riscv_vfwmacc_vf_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                          _Float16 vs1, vfloat16m4_t vs2,
                                          size_t vl);
vfloat64m1_t __riscv_vfwmacc_vv_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                          size_t vl);
vfloat64m1_t __riscv_vfwmacc_vf_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                          float vs1, vfloat32mf2_t vs2,
                                          size_t vl);
vfloat64m2_t __riscv_vfwmacc_vv_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat32m1_t vs1, vfloat32m1_t vs2,
                                          size_t vl);
vfloat64m2_t __riscv_vfwmacc_vf_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                          float vs1, vfloat32m1_t vs2,
                                          size_t vl);
vfloat64m4_t __riscv_vfwmacc_vv_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat32m2_t vs1, vfloat32m2_t vs2,
                                          size_t vl);
vfloat64m4_t __riscv_vfwmacc_vf_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                          float vs1, vfloat32m2_t vs2,
                                          size_t vl);
vfloat64m8_t __riscv_vfwmacc_vv_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat32m4_t vs1, vfloat32m4_t vs2,
                                          size_t vl);
vfloat64m8_t __riscv_vfwmacc_vf_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                          float vs1, vfloat32m4_t vs2,
                                          size_t vl);
// __riscv_vfwnmacc, masked `_tum` variants for every f32 and f64 result type.
// vm is a vboolN_t mask where N is vd's element width divided by its LMUL
// (f32mf2 -> vbool64_t ... f32m8 -> vbool4_t). vd is passed in and has the
// same type as the return value; its elements are twice as wide as those of
// the sources (f16 -> f32, f32 -> f64). `_vv` takes two source vectors; `_vf`
// takes a scalar (_Float16 or float) as vs1.
// NOTE(review): per the RVV spec vfwnmacc should compute
// vd[i] = -(vs1[i] * vs2[i]) - vd[i], and `_tum` should mean tail-undisturbed,
// mask-agnostic; confirm against the specification.
// NOTE(review): the `_vf` scalar operand is named vs1 here, whereas other `_vf`
// prototypes in this file (e.g. __riscv_vfadd_vf_*) name it rs1.
vfloat32mf2_t __riscv_vfwnmacc_vv_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat16mf4_t vs1,
                                             vfloat16mf4_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfwnmacc_vf_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                             _Float16 vs1, vfloat16mf4_t vs2,
                                             size_t vl);
vfloat32m1_t __riscv_vfwnmacc_vv_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                           size_t vl);
vfloat32m1_t __riscv_vfwnmacc_vf_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                           _Float16 vs1, vfloat16mf2_t vs2,
                                           size_t vl);
vfloat32m2_t __riscv_vfwnmacc_vv_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat16m1_t vs1, vfloat16m1_t vs2,
                                           size_t vl);
vfloat32m2_t __riscv_vfwnmacc_vf_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                           _Float16 vs1, vfloat16m1_t vs2,
                                           size_t vl);
vfloat32m4_t __riscv_vfwnmacc_vv_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat16m2_t vs1, vfloat16m2_t vs2,
                                           size_t vl);
vfloat32m4_t __riscv_vfwnmacc_vf_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                           _Float16 vs1, vfloat16m2_t vs2,
                                           size_t vl);
vfloat32m8_t __riscv_vfwnmacc_vv_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat16m4_t vs1, vfloat16m4_t vs2,
                                           size_t vl);
vfloat32m8_t __riscv_vfwnmacc_vf_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                           _Float16 vs1, vfloat16m4_t vs2,
                                           size_t vl);
vfloat64m1_t __riscv_vfwnmacc_vv_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                           size_t vl);
vfloat64m1_t __riscv_vfwnmacc_vf_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                           float vs1, vfloat32mf2_t vs2,
                                           size_t vl);
vfloat64m2_t __riscv_vfwnmacc_vv_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat32m1_t vs1, vfloat32m1_t vs2,
                                           size_t vl);
vfloat64m2_t __riscv_vfwnmacc_vf_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                           float vs1, vfloat32m1_t vs2,
                                           size_t vl);
vfloat64m4_t __riscv_vfwnmacc_vv_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat32m2_t vs1, vfloat32m2_t vs2,
                                           size_t vl);
vfloat64m4_t __riscv_vfwnmacc_vf_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                           float vs1, vfloat32m2_t vs2,
                                           size_t vl);
vfloat64m8_t __riscv_vfwnmacc_vv_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat32m4_t vs1, vfloat32m4_t vs2,
                                           size_t vl);
vfloat64m8_t __riscv_vfwnmacc_vf_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                           float vs1, vfloat32m4_t vs2,
                                           size_t vl);
// __riscv_vfwmsac, masked `_tum` variants for every f32 and f64 result type.
// vm is a vboolN_t mask where N is vd's element width divided by its LMUL
// (f32mf2 -> vbool64_t ... f32m8 -> vbool4_t). vd is passed in and has the
// same type as the return value; its elements are twice as wide as those of
// the sources (f16 -> f32, f32 -> f64). `_vv` takes two source vectors; `_vf`
// takes a scalar (_Float16 or float) as vs1.
// NOTE(review): per the RVV spec vfwmsac should compute
// vd[i] = +(vs1[i] * vs2[i]) - vd[i], and `_tum` should mean tail-undisturbed,
// mask-agnostic; confirm against the specification.
// NOTE(review): the `_vf` scalar operand is named vs1 here, whereas other `_vf`
// prototypes in this file (e.g. __riscv_vfadd_vf_*) name it rs1.
vfloat32mf2_t __riscv_vfwmsac_vv_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat16mf4_t vs1,
                                            vfloat16mf4_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfwmsac_vf_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                            _Float16 vs1, vfloat16mf4_t vs2,
                                            size_t vl);
vfloat32m1_t __riscv_vfwmsac_vv_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                          size_t vl);
vfloat32m1_t __riscv_vfwmsac_vf_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                          _Float16 vs1, vfloat16mf2_t vs2,
                                          size_t vl);
vfloat32m2_t __riscv_vfwmsac_vv_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat16m1_t vs1, vfloat16m1_t vs2,
                                          size_t vl);
vfloat32m2_t __riscv_vfwmsac_vf_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                          _Float16 vs1, vfloat16m1_t vs2,
                                          size_t vl);
vfloat32m4_t __riscv_vfwmsac_vv_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat16m2_t vs1, vfloat16m2_t vs2,
                                          size_t vl);
vfloat32m4_t __riscv_vfwmsac_vf_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                          _Float16 vs1, vfloat16m2_t vs2,
                                          size_t vl);
vfloat32m8_t __riscv_vfwmsac_vv_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat16m4_t vs1, vfloat16m4_t vs2,
                                          size_t vl);
vfloat32m8_t __riscv_vfwmsac_vf_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                          _Float16 vs1, vfloat16m4_t vs2,
                                          size_t vl);
vfloat64m1_t __riscv_vfwmsac_vv_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                          size_t vl);
vfloat64m1_t __riscv_vfwmsac_vf_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                          float vs1, vfloat32mf2_t vs2,
                                          size_t vl);
vfloat64m2_t __riscv_vfwmsac_vv_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat32m1_t vs1, vfloat32m1_t vs2,
                                          size_t vl);
vfloat64m2_t __riscv_vfwmsac_vf_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                          float vs1, vfloat32m1_t vs2,
                                          size_t vl);
vfloat64m4_t __riscv_vfwmsac_vv_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat32m2_t vs1, vfloat32m2_t vs2,
                                          size_t vl);
vfloat64m4_t __riscv_vfwmsac_vf_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                          float vs1, vfloat32m2_t vs2,
                                          size_t vl);
vfloat64m8_t __riscv_vfwmsac_vv_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat32m4_t vs1, vfloat32m4_t vs2,
                                          size_t vl);
vfloat64m8_t __riscv_vfwmsac_vf_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                          float vs1, vfloat32m4_t vs2,
                                          size_t vl);
// __riscv_vfwnmsac, masked `_tum` variants for every f32 and f64 result type.
// vm is a vboolN_t mask where N is vd's element width divided by its LMUL
// (f32mf2 -> vbool64_t ... f32m8 -> vbool4_t). vd is passed in and has the
// same type as the return value; its elements are twice as wide as those of
// the sources (f16 -> f32, f32 -> f64). `_vv` takes two source vectors; `_vf`
// takes a scalar (_Float16 or float) as vs1.
// NOTE(review): per the RVV spec vfwnmsac should compute
// vd[i] = -(vs1[i] * vs2[i]) + vd[i], and `_tum` should mean tail-undisturbed,
// mask-agnostic; confirm against the specification.
// NOTE(review): the `_vf` scalar operand is named vs1 here, whereas other `_vf`
// prototypes in this file (e.g. __riscv_vfadd_vf_*) name it rs1.
vfloat32mf2_t __riscv_vfwnmsac_vv_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat16mf4_t vs1,
                                             vfloat16mf4_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfwnmsac_vf_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                             _Float16 vs1, vfloat16mf4_t vs2,
                                             size_t vl);
vfloat32m1_t __riscv_vfwnmsac_vv_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                           size_t vl);
vfloat32m1_t __riscv_vfwnmsac_vf_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                           _Float16 vs1, vfloat16mf2_t vs2,
                                           size_t vl);
vfloat32m2_t __riscv_vfwnmsac_vv_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat16m1_t vs1, vfloat16m1_t vs2,
                                           size_t vl);
vfloat32m2_t __riscv_vfwnmsac_vf_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                           _Float16 vs1, vfloat16m1_t vs2,
                                           size_t vl);
vfloat32m4_t __riscv_vfwnmsac_vv_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat16m2_t vs1, vfloat16m2_t vs2,
                                           size_t vl);
vfloat32m4_t __riscv_vfwnmsac_vf_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                           _Float16 vs1, vfloat16m2_t vs2,
                                           size_t vl);
vfloat32m8_t __riscv_vfwnmsac_vv_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat16m4_t vs1, vfloat16m4_t vs2,
                                           size_t vl);
vfloat32m8_t __riscv_vfwnmsac_vf_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                           _Float16 vs1, vfloat16m4_t vs2,
                                           size_t vl);
vfloat64m1_t __riscv_vfwnmsac_vv_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                           size_t vl);
vfloat64m1_t __riscv_vfwnmsac_vf_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                           float vs1, vfloat32mf2_t vs2,
                                           size_t vl);
vfloat64m2_t __riscv_vfwnmsac_vv_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat32m1_t vs1, vfloat32m1_t vs2,
                                           size_t vl);
vfloat64m2_t __riscv_vfwnmsac_vf_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                           float vs1, vfloat32m1_t vs2,
                                           size_t vl);
vfloat64m4_t __riscv_vfwnmsac_vv_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat32m2_t vs1, vfloat32m2_t vs2,
                                           size_t vl);
vfloat64m4_t __riscv_vfwnmsac_vf_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                           float vs1, vfloat32m2_t vs2,
                                           size_t vl);
vfloat64m8_t __riscv_vfwnmsac_vv_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat32m4_t vs1, vfloat32m4_t vs2,
                                           size_t vl);
vfloat64m8_t __riscv_vfwnmsac_vf_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                           float vs1, vfloat32m4_t vs2,
                                           size_t vl);
// masked functions: _tumu policy variants
// __riscv_vfwmacc, masked `_tumu` variants for every f32 and f64 result type.
// vm is a vboolN_t mask where N is vd's element width divided by its LMUL
// (f32mf2 -> vbool64_t ... f32m8 -> vbool4_t). vd is passed in and has the
// same type as the return value; its elements are twice as wide as those of
// the sources (f16 -> f32, f32 -> f64). `_vv` takes two source vectors; `_vf`
// takes a scalar (_Float16 or float) as vs1.
// NOTE(review): per the RVV spec vfwmacc should compute
// vd[i] = +(vs1[i] * vs2[i]) + vd[i], and `_tumu` should mean
// tail-undisturbed, mask-undisturbed; confirm against the specification.
// NOTE(review): the `_vf` scalar operand is named vs1 here, whereas other `_vf`
// prototypes in this file (e.g. __riscv_vfadd_vf_*) name it rs1.
vfloat32mf2_t __riscv_vfwmacc_vv_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat16mf4_t vs1,
                                             vfloat16mf4_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfwmacc_vf_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                             _Float16 vs1, vfloat16mf4_t vs2,
                                             size_t vl);
vfloat32m1_t __riscv_vfwmacc_vv_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                           size_t vl);
vfloat32m1_t __riscv_vfwmacc_vf_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                           _Float16 vs1, vfloat16mf2_t vs2,
                                           size_t vl);
vfloat32m2_t __riscv_vfwmacc_vv_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat16m1_t vs1, vfloat16m1_t vs2,
                                           size_t vl);
vfloat32m2_t __riscv_vfwmacc_vf_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                           _Float16 vs1, vfloat16m1_t vs2,
                                           size_t vl);
vfloat32m4_t __riscv_vfwmacc_vv_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat16m2_t vs1, vfloat16m2_t vs2,
                                           size_t vl);
vfloat32m4_t __riscv_vfwmacc_vf_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                           _Float16 vs1, vfloat16m2_t vs2,
                                           size_t vl);
vfloat32m8_t __riscv_vfwmacc_vv_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat16m4_t vs1, vfloat16m4_t vs2,
                                           size_t vl);
vfloat32m8_t __riscv_vfwmacc_vf_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                           _Float16 vs1, vfloat16m4_t vs2,
                                           size_t vl);
vfloat64m1_t __riscv_vfwmacc_vv_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                           size_t vl);
vfloat64m1_t __riscv_vfwmacc_vf_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                           float vs1, vfloat32mf2_t vs2,
                                           size_t vl);
vfloat64m2_t __riscv_vfwmacc_vv_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat32m1_t vs1, vfloat32m1_t vs2,
                                           size_t vl);
vfloat64m2_t __riscv_vfwmacc_vf_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                           float vs1, vfloat32m1_t vs2,
                                           size_t vl);
vfloat64m4_t __riscv_vfwmacc_vv_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat32m2_t vs1, vfloat32m2_t vs2,
                                           size_t vl);
vfloat64m4_t __riscv_vfwmacc_vf_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                           float vs1, vfloat32m2_t vs2,
                                           size_t vl);
vfloat64m8_t __riscv_vfwmacc_vv_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat32m4_t vs1, vfloat32m4_t vs2,
                                           size_t vl);
vfloat64m8_t __riscv_vfwmacc_vf_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                           float vs1, vfloat32m4_t vs2,
                                           size_t vl);
// __riscv_vfwnmacc, masked `_tumu` variants for every f32 and f64 result type.
// vm is a vboolN_t mask where N is vd's element width divided by its LMUL
// (f32mf2 -> vbool64_t ... f32m8 -> vbool4_t). vd is passed in and has the
// same type as the return value; its elements are twice as wide as those of
// the sources (f16 -> f32, f32 -> f64). `_vv` takes two source vectors; `_vf`
// takes a scalar (_Float16 or float) as vs1.
// NOTE(review): per the RVV spec vfwnmacc should compute
// vd[i] = -(vs1[i] * vs2[i]) - vd[i], and `_tumu` should mean
// tail-undisturbed, mask-undisturbed; confirm against the specification.
// NOTE(review): the `_vf` scalar operand is named vs1 here, whereas other `_vf`
// prototypes in this file (e.g. __riscv_vfadd_vf_*) name it rs1.
vfloat32mf2_t __riscv_vfwnmacc_vv_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat16mf4_t vs1,
                                              vfloat16mf4_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfwnmacc_vf_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                              _Float16 vs1, vfloat16mf4_t vs2,
                                              size_t vl);
vfloat32m1_t __riscv_vfwnmacc_vv_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat16mf2_t vs1,
                                            vfloat16mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwnmacc_vf_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                            _Float16 vs1, vfloat16mf2_t vs2,
                                            size_t vl);
vfloat32m2_t __riscv_vfwnmacc_vv_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat16m1_t vs1, vfloat16m1_t vs2,
                                            size_t vl);
vfloat32m2_t __riscv_vfwnmacc_vf_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                            _Float16 vs1, vfloat16m1_t vs2,
                                            size_t vl);
vfloat32m4_t __riscv_vfwnmacc_vv_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat16m2_t vs1, vfloat16m2_t vs2,
                                            size_t vl);
vfloat32m4_t __riscv_vfwnmacc_vf_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                            _Float16 vs1, vfloat16m2_t vs2,
                                            size_t vl);
vfloat32m8_t __riscv_vfwnmacc_vv_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat16m4_t vs1, vfloat16m4_t vs2,
                                            size_t vl);
vfloat32m8_t __riscv_vfwnmacc_vf_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                            _Float16 vs1, vfloat16m4_t vs2,
                                            size_t vl);
vfloat64m1_t __riscv_vfwnmacc_vv_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat32mf2_t vs1,
                                            vfloat32mf2_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwnmacc_vf_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                            float vs1, vfloat32mf2_t vs2,
                                            size_t vl);
vfloat64m2_t __riscv_vfwnmacc_vv_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat32m1_t vs1, vfloat32m1_t vs2,
                                            size_t vl);
vfloat64m2_t __riscv_vfwnmacc_vf_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                            float vs1, vfloat32m1_t vs2,
                                            size_t vl);
vfloat64m4_t __riscv_vfwnmacc_vv_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat32m2_t vs1, vfloat32m2_t vs2,
                                            size_t vl);
vfloat64m4_t __riscv_vfwnmacc_vf_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                            float vs1, vfloat32m2_t vs2,
                                            size_t vl);
vfloat64m8_t __riscv_vfwnmacc_vv_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat32m4_t vs1, vfloat32m4_t vs2,
                                            size_t vl);
vfloat64m8_t __riscv_vfwnmacc_vf_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                            float vs1, vfloat32m4_t vs2,
                                            size_t vl);
// __riscv_vfwmsac, masked `_tumu` variants for every f32 and f64 result type.
// vm is a vboolN_t mask where N is vd's element width divided by its LMUL
// (f32mf2 -> vbool64_t ... f32m8 -> vbool4_t). vd is passed in and has the
// same type as the return value; its elements are twice as wide as those of
// the sources (f16 -> f32, f32 -> f64). `_vv` takes two source vectors; `_vf`
// takes a scalar (_Float16 or float) as vs1.
// NOTE(review): per the RVV spec vfwmsac should compute
// vd[i] = +(vs1[i] * vs2[i]) - vd[i], and `_tumu` should mean
// tail-undisturbed, mask-undisturbed; confirm against the specification.
// NOTE(review): the `_vf` scalar operand is named vs1 here, whereas other `_vf`
// prototypes in this file (e.g. __riscv_vfadd_vf_*) name it rs1.
vfloat32mf2_t __riscv_vfwmsac_vv_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat16mf4_t vs1,
                                             vfloat16mf4_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfwmsac_vf_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                             _Float16 vs1, vfloat16mf4_t vs2,
                                             size_t vl);
vfloat32m1_t __riscv_vfwmsac_vv_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                           size_t vl);
vfloat32m1_t __riscv_vfwmsac_vf_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                           _Float16 vs1, vfloat16mf2_t vs2,
                                           size_t vl);
vfloat32m2_t __riscv_vfwmsac_vv_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat16m1_t vs1, vfloat16m1_t vs2,
                                           size_t vl);
vfloat32m2_t __riscv_vfwmsac_vf_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                           _Float16 vs1, vfloat16m1_t vs2,
                                           size_t vl);
vfloat32m4_t __riscv_vfwmsac_vv_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat16m2_t vs1, vfloat16m2_t vs2,
                                           size_t vl);
vfloat32m4_t __riscv_vfwmsac_vf_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                           _Float16 vs1, vfloat16m2_t vs2,
                                           size_t vl);
vfloat32m8_t __riscv_vfwmsac_vv_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat16m4_t vs1, vfloat16m4_t vs2,
                                           size_t vl);
vfloat32m8_t __riscv_vfwmsac_vf_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                           _Float16 vs1, vfloat16m4_t vs2,
                                           size_t vl);
vfloat64m1_t __riscv_vfwmsac_vv_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                           size_t vl);
vfloat64m1_t __riscv_vfwmsac_vf_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                           float vs1, vfloat32mf2_t vs2,
                                           size_t vl);
vfloat64m2_t __riscv_vfwmsac_vv_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat32m1_t vs1, vfloat32m1_t vs2,
                                           size_t vl);
vfloat64m2_t __riscv_vfwmsac_vf_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                           float vs1, vfloat32m1_t vs2,
                                           size_t vl);
vfloat64m4_t __riscv_vfwmsac_vv_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat32m2_t vs1, vfloat32m2_t vs2,
                                           size_t vl);
vfloat64m4_t __riscv_vfwmsac_vf_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                           float vs1, vfloat32m2_t vs2,
                                           size_t vl);
vfloat64m8_t __riscv_vfwmsac_vv_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat32m4_t vs1, vfloat32m4_t vs2,
                                           size_t vl);
vfloat64m8_t __riscv_vfwmsac_vf_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                           float vs1, vfloat32m4_t vs2,
                                           size_t vl);
// __riscv_vfwnmsac, masked `_tumu` variants for every f32 and f64 result type.
// vm is a vboolN_t mask where N is vd's element width divided by its LMUL
// (f32mf2 -> vbool64_t ... f32m8 -> vbool4_t). vd is passed in and has the
// same type as the return value; its elements are twice as wide as those of
// the sources (f16 -> f32, f32 -> f64). `_vv` takes two source vectors; `_vf`
// takes a scalar (_Float16 or float) as vs1.
// NOTE(review): per the RVV spec vfwnmsac should compute
// vd[i] = -(vs1[i] * vs2[i]) + vd[i], and `_tumu` should mean
// tail-undisturbed, mask-undisturbed; confirm against the specification.
// NOTE(review): the `_vf` scalar operand is named vs1 here, whereas other `_vf`
// prototypes in this file (e.g. __riscv_vfadd_vf_*) name it rs1.
vfloat32mf2_t __riscv_vfwnmsac_vv_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat16mf4_t vs1,
                                              vfloat16mf4_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfwnmsac_vf_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                              _Float16 vs1, vfloat16mf4_t vs2,
                                              size_t vl);
vfloat32m1_t __riscv_vfwnmsac_vv_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat16mf2_t vs1,
                                            vfloat16mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwnmsac_vf_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                            _Float16 vs1, vfloat16mf2_t vs2,
                                            size_t vl);
vfloat32m2_t __riscv_vfwnmsac_vv_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat16m1_t vs1, vfloat16m1_t vs2,
                                            size_t vl);
vfloat32m2_t __riscv_vfwnmsac_vf_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                            _Float16 vs1, vfloat16m1_t vs2,
                                            size_t vl);
vfloat32m4_t __riscv_vfwnmsac_vv_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat16m2_t vs1, vfloat16m2_t vs2,
                                            size_t vl);
vfloat32m4_t __riscv_vfwnmsac_vf_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                            _Float16 vs1, vfloat16m2_t vs2,
                                            size_t vl);
vfloat32m8_t __riscv_vfwnmsac_vv_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat16m4_t vs1, vfloat16m4_t vs2,
                                            size_t vl);
vfloat32m8_t __riscv_vfwnmsac_vf_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                            _Float16 vs1, vfloat16m4_t vs2,
                                            size_t vl);
vfloat64m1_t __riscv_vfwnmsac_vv_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat32mf2_t vs1,
                                            vfloat32mf2_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwnmsac_vf_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                            float vs1, vfloat32mf2_t vs2,
                                            size_t vl);
vfloat64m2_t __riscv_vfwnmsac_vv_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat32m1_t vs1, vfloat32m1_t vs2,
                                            size_t vl);
vfloat64m2_t __riscv_vfwnmsac_vf_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                            float vs1, vfloat32m1_t vs2,
                                            size_t vl);
vfloat64m4_t __riscv_vfwnmsac_vv_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat32m2_t vs1, vfloat32m2_t vs2,
                                            size_t vl);
vfloat64m4_t __riscv_vfwnmsac_vf_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                            float vs1, vfloat32m2_t vs2,
                                            size_t vl);
vfloat64m8_t __riscv_vfwnmsac_vv_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat32m4_t vs1, vfloat32m4_t vs2,
                                            size_t vl);
vfloat64m8_t __riscv_vfwnmsac_vf_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                            float vs1, vfloat32m4_t vs2,
                                            size_t vl);
// masked functions
// __riscv_vfwmacc_{vv,vf}_*_mu: each prototype takes a vboolN_t mask `vm`
// first, then `vd` (same type as the return value), the sources `vs1`/`vs2`,
// and `vl`. Sources are one float width narrower than the result:
// _Float16 / vfloat16* for f32 results, float / vfloat32* for f64 results.
// The _vf forms pass `vs1` as a scalar instead of a vector.
// NOTE(review): presumably vd = (vs1 * vs2) + vd evaluated in the wider
// format, with `_mu` selecting the mask-undisturbed policy -- confirm against
// the RISC-V vector specification.
vfloat32mf2_t __riscv_vfwmacc_vv_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                           size_t vl);
vfloat32mf2_t __riscv_vfwmacc_vf_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                           _Float16 vs1, vfloat16mf4_t vs2,
                                           size_t vl);
vfloat32m1_t __riscv_vfwmacc_vv_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                         size_t vl);
vfloat32m1_t __riscv_vfwmacc_vf_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                         _Float16 vs1, vfloat16mf2_t vs2,
                                         size_t vl);
vfloat32m2_t __riscv_vfwmacc_vv_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat16m1_t vs1, vfloat16m1_t vs2,
                                         size_t vl);
vfloat32m2_t __riscv_vfwmacc_vf_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                         _Float16 vs1, vfloat16m1_t vs2,
                                         size_t vl);
vfloat32m4_t __riscv_vfwmacc_vv_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat16m2_t vs1, vfloat16m2_t vs2,
                                         size_t vl);
vfloat32m4_t __riscv_vfwmacc_vf_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                         _Float16 vs1, vfloat16m2_t vs2,
                                         size_t vl);
vfloat32m8_t __riscv_vfwmacc_vv_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat16m4_t vs1, vfloat16m4_t vs2,
                                         size_t vl);
vfloat32m8_t __riscv_vfwmacc_vf_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                         _Float16 vs1, vfloat16m4_t vs2,
                                         size_t vl);
vfloat64m1_t __riscv_vfwmacc_vv_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                         size_t vl);
vfloat64m1_t __riscv_vfwmacc_vf_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                         float vs1, vfloat32mf2_t vs2,
                                         size_t vl);
vfloat64m2_t __riscv_vfwmacc_vv_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat32m1_t vs1, vfloat32m1_t vs2,
                                         size_t vl);
vfloat64m2_t __riscv_vfwmacc_vf_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                         float vs1, vfloat32m1_t vs2,
                                         size_t vl);
vfloat64m4_t __riscv_vfwmacc_vv_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat32m2_t vs1, vfloat32m2_t vs2,
                                         size_t vl);
vfloat64m4_t __riscv_vfwmacc_vf_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                         float vs1, vfloat32m2_t vs2,
                                         size_t vl);
vfloat64m8_t __riscv_vfwmacc_vv_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat32m4_t vs1, vfloat32m4_t vs2,
                                         size_t vl);
vfloat64m8_t __riscv_vfwmacc_vf_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                         float vs1, vfloat32m4_t vs2,
                                         size_t vl);
// __riscv_vfwnmacc_{vv,vf}_*_mu: each prototype takes a vboolN_t mask `vm`
// first, then `vd` (same type as the return value), the sources `vs1`/`vs2`,
// and `vl`. Sources are one float width narrower than the result:
// _Float16 / vfloat16* for f32 results, float / vfloat32* for f64 results.
// The _vf forms pass `vs1` as a scalar instead of a vector.
// NOTE(review): presumably vd = -(vs1 * vs2) - vd evaluated in the wider
// format, with `_mu` selecting the mask-undisturbed policy -- confirm against
// the RISC-V vector specification.
vfloat32mf2_t __riscv_vfwnmacc_vv_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat16mf4_t vs1,
                                            vfloat16mf4_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfwnmacc_vf_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                            _Float16 vs1, vfloat16mf4_t vs2,
                                            size_t vl);
vfloat32m1_t __riscv_vfwnmacc_vv_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                          size_t vl);
vfloat32m1_t __riscv_vfwnmacc_vf_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                          _Float16 vs1, vfloat16mf2_t vs2,
                                          size_t vl);
vfloat32m2_t __riscv_vfwnmacc_vv_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat16m1_t vs1, vfloat16m1_t vs2,
                                          size_t vl);
vfloat32m2_t __riscv_vfwnmacc_vf_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                          _Float16 vs1, vfloat16m1_t vs2,
                                          size_t vl);
vfloat32m4_t __riscv_vfwnmacc_vv_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat16m2_t vs1, vfloat16m2_t vs2,
                                          size_t vl);
vfloat32m4_t __riscv_vfwnmacc_vf_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                          _Float16 vs1, vfloat16m2_t vs2,
                                          size_t vl);
vfloat32m8_t __riscv_vfwnmacc_vv_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat16m4_t vs1, vfloat16m4_t vs2,
                                          size_t vl);
vfloat32m8_t __riscv_vfwnmacc_vf_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                          _Float16 vs1, vfloat16m4_t vs2,
                                          size_t vl);
vfloat64m1_t __riscv_vfwnmacc_vv_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                          size_t vl);
vfloat64m1_t __riscv_vfwnmacc_vf_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                          float vs1, vfloat32mf2_t vs2,
                                          size_t vl);
vfloat64m2_t __riscv_vfwnmacc_vv_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat32m1_t vs1, vfloat32m1_t vs2,
                                          size_t vl);
vfloat64m2_t __riscv_vfwnmacc_vf_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                          float vs1, vfloat32m1_t vs2,
                                          size_t vl);
vfloat64m4_t __riscv_vfwnmacc_vv_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat32m2_t vs1, vfloat32m2_t vs2,
                                          size_t vl);
vfloat64m4_t __riscv_vfwnmacc_vf_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                          float vs1, vfloat32m2_t vs2,
                                          size_t vl);
vfloat64m8_t __riscv_vfwnmacc_vv_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat32m4_t vs1, vfloat32m4_t vs2,
                                          size_t vl);
vfloat64m8_t __riscv_vfwnmacc_vf_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                          float vs1, vfloat32m4_t vs2,
                                          size_t vl);
// __riscv_vfwmsac_{vv,vf}_*_mu: each prototype takes a vboolN_t mask `vm`
// first, then `vd` (same type as the return value), the sources `vs1`/`vs2`,
// and `vl`. Sources are one float width narrower than the result:
// _Float16 / vfloat16* for f32 results, float / vfloat32* for f64 results.
// The _vf forms pass `vs1` as a scalar instead of a vector.
// NOTE(review): presumably vd = (vs1 * vs2) - vd evaluated in the wider
// format, with `_mu` selecting the mask-undisturbed policy -- confirm against
// the RISC-V vector specification.
vfloat32mf2_t __riscv_vfwmsac_vv_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                           size_t vl);
vfloat32mf2_t __riscv_vfwmsac_vf_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                           _Float16 vs1, vfloat16mf4_t vs2,
                                           size_t vl);
vfloat32m1_t __riscv_vfwmsac_vv_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                         size_t vl);
vfloat32m1_t __riscv_vfwmsac_vf_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                         _Float16 vs1, vfloat16mf2_t vs2,
                                         size_t vl);
vfloat32m2_t __riscv_vfwmsac_vv_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat16m1_t vs1, vfloat16m1_t vs2,
                                         size_t vl);
vfloat32m2_t __riscv_vfwmsac_vf_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                         _Float16 vs1, vfloat16m1_t vs2,
                                         size_t vl);
vfloat32m4_t __riscv_vfwmsac_vv_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat16m2_t vs1, vfloat16m2_t vs2,
                                         size_t vl);
vfloat32m4_t __riscv_vfwmsac_vf_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                         _Float16 vs1, vfloat16m2_t vs2,
                                         size_t vl);
vfloat32m8_t __riscv_vfwmsac_vv_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat16m4_t vs1, vfloat16m4_t vs2,
                                         size_t vl);
vfloat32m8_t __riscv_vfwmsac_vf_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                         _Float16 vs1, vfloat16m4_t vs2,
                                         size_t vl);
vfloat64m1_t __riscv_vfwmsac_vv_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                         size_t vl);
vfloat64m1_t __riscv_vfwmsac_vf_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                         float vs1, vfloat32mf2_t vs2,
                                         size_t vl);
vfloat64m2_t __riscv_vfwmsac_vv_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat32m1_t vs1, vfloat32m1_t vs2,
                                         size_t vl);
vfloat64m2_t __riscv_vfwmsac_vf_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                         float vs1, vfloat32m1_t vs2,
                                         size_t vl);
vfloat64m4_t __riscv_vfwmsac_vv_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat32m2_t vs1, vfloat32m2_t vs2,
                                         size_t vl);
vfloat64m4_t __riscv_vfwmsac_vf_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                         float vs1, vfloat32m2_t vs2,
                                         size_t vl);
vfloat64m8_t __riscv_vfwmsac_vv_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat32m4_t vs1, vfloat32m4_t vs2,
                                         size_t vl);
vfloat64m8_t __riscv_vfwmsac_vf_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                         float vs1, vfloat32m4_t vs2,
                                         size_t vl);
// __riscv_vfwnmsac_{vv,vf}_*_mu: each prototype takes a vboolN_t mask `vm`
// first, then `vd` (same type as the return value), the sources `vs1`/`vs2`,
// and `vl`. Sources are one float width narrower than the result:
// _Float16 / vfloat16* for f32 results, float / vfloat32* for f64 results.
// The _vf forms pass `vs1` as a scalar instead of a vector.
// NOTE(review): presumably vd = -(vs1 * vs2) + vd evaluated in the wider
// format, with `_mu` selecting the mask-undisturbed policy -- confirm against
// the RISC-V vector specification.
vfloat32mf2_t __riscv_vfwnmsac_vv_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat16mf4_t vs1,
                                            vfloat16mf4_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfwnmsac_vf_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                            _Float16 vs1, vfloat16mf4_t vs2,
                                            size_t vl);
vfloat32m1_t __riscv_vfwnmsac_vv_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                          size_t vl);
vfloat32m1_t __riscv_vfwnmsac_vf_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                          _Float16 vs1, vfloat16mf2_t vs2,
                                          size_t vl);
vfloat32m2_t __riscv_vfwnmsac_vv_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat16m1_t vs1, vfloat16m1_t vs2,
                                          size_t vl);
vfloat32m2_t __riscv_vfwnmsac_vf_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                          _Float16 vs1, vfloat16m1_t vs2,
                                          size_t vl);
vfloat32m4_t __riscv_vfwnmsac_vv_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat16m2_t vs1, vfloat16m2_t vs2,
                                          size_t vl);
vfloat32m4_t __riscv_vfwnmsac_vf_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                          _Float16 vs1, vfloat16m2_t vs2,
                                          size_t vl);
vfloat32m8_t __riscv_vfwnmsac_vv_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat16m4_t vs1, vfloat16m4_t vs2,
                                          size_t vl);
vfloat32m8_t __riscv_vfwnmsac_vf_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                          _Float16 vs1, vfloat16m4_t vs2,
                                          size_t vl);
vfloat64m1_t __riscv_vfwnmsac_vv_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                          size_t vl);
vfloat64m1_t __riscv_vfwnmsac_vf_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                          float vs1, vfloat32mf2_t vs2,
                                          size_t vl);
vfloat64m2_t __riscv_vfwnmsac_vv_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat32m1_t vs1, vfloat32m1_t vs2,
                                          size_t vl);
vfloat64m2_t __riscv_vfwnmsac_vf_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                          float vs1, vfloat32m1_t vs2,
                                          size_t vl);
vfloat64m4_t __riscv_vfwnmsac_vv_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat32m2_t vs1, vfloat32m2_t vs2,
                                          size_t vl);
vfloat64m4_t __riscv_vfwnmsac_vf_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                          float vs1, vfloat32m2_t vs2,
                                          size_t vl);
vfloat64m8_t __riscv_vfwnmsac_vv_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat32m4_t vs1, vfloat32m4_t vs2,
                                          size_t vl);
vfloat64m8_t __riscv_vfwnmsac_vf_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                          float vs1, vfloat32m4_t vs2,
                                          size_t vl);
// __riscv_vfwmacc_{vv,vf}_*_rm_tu: these prototypes take no mask argument.
// Arguments are `vd` (same type as the return value), the sources
// `vs1`/`vs2`, an `unsigned int frm`, and `vl`. Sources are one float width
// narrower than the result: _Float16 / vfloat16* for f32 results,
// float / vfloat32* for f64 results. The _vf forms pass `vs1` as a scalar.
// NOTE(review): presumably vd = (vs1 * vs2) + vd evaluated in the wider
// format; `frm` presumably selects the floating-point rounding mode and `_tu`
// the tail-undisturbed policy -- confirm against the RISC-V vector
// specification.
vfloat32mf2_t __riscv_vfwmacc_vv_f32mf2_rm_tu(vfloat32mf2_t vd,
                                              vfloat16mf4_t vs1,
                                              vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwmacc_vf_f32mf2_rm_tu(vfloat32mf2_t vd, _Float16 vs1,
                                              vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmacc_vv_f32m1_rm_tu(vfloat32m1_t vd, vfloat16mf2_t vs1,
                                            vfloat16mf2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m1_t __riscv_vfwmacc_vf_f32m1_rm_tu(vfloat32m1_t vd, _Float16 vs1,
                                            vfloat16mf2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m2_t __riscv_vfwmacc_vv_f32m2_rm_tu(vfloat32m2_t vd, vfloat16m1_t vs1,
                                            vfloat16m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m2_t __riscv_vfwmacc_vf_f32m2_rm_tu(vfloat32m2_t vd, _Float16 vs1,
                                            vfloat16m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m4_t __riscv_vfwmacc_vv_f32m4_rm_tu(vfloat32m4_t vd, vfloat16m2_t vs1,
                                            vfloat16m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m4_t __riscv_vfwmacc_vf_f32m4_rm_tu(vfloat32m4_t vd, _Float16 vs1,
                                            vfloat16m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m8_t __riscv_vfwmacc_vv_f32m8_rm_tu(vfloat32m8_t vd, vfloat16m4_t vs1,
                                            vfloat16m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m8_t __riscv_vfwmacc_vf_f32m8_rm_tu(vfloat32m8_t vd, _Float16 vs1,
                                            vfloat16m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m1_t __riscv_vfwmacc_vv_f64m1_rm_tu(vfloat64m1_t vd, vfloat32mf2_t vs1,
                                            vfloat32mf2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m1_t __riscv_vfwmacc_vf_f64m1_rm_tu(vfloat64m1_t vd, float vs1,
                                            vfloat32mf2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m2_t __riscv_vfwmacc_vv_f64m2_rm_tu(vfloat64m2_t vd, vfloat32m1_t vs1,
                                            vfloat32m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m2_t __riscv_vfwmacc_vf_f64m2_rm_tu(vfloat64m2_t vd, float vs1,
                                            vfloat32m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m4_t __riscv_vfwmacc_vv_f64m4_rm_tu(vfloat64m4_t vd, vfloat32m2_t vs1,
                                            vfloat32m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m4_t __riscv_vfwmacc_vf_f64m4_rm_tu(vfloat64m4_t vd, float vs1,
                                            vfloat32m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m8_t __riscv_vfwmacc_vv_f64m8_rm_tu(vfloat64m8_t vd, vfloat32m4_t vs1,
                                            vfloat32m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m8_t __riscv_vfwmacc_vf_f64m8_rm_tu(vfloat64m8_t vd, float vs1,
                                            vfloat32m4_t vs2, unsigned int frm,
                                            size_t vl);
// __riscv_vfwnmacc_{vv,vf}_*_rm_tu: these prototypes take no mask argument.
// Arguments are `vd` (same type as the return value), the sources
// `vs1`/`vs2`, an `unsigned int frm`, and `vl`. Sources are one float width
// narrower than the result: _Float16 / vfloat16* for f32 results,
// float / vfloat32* for f64 results. The _vf forms pass `vs1` as a scalar.
// NOTE(review): presumably vd = -(vs1 * vs2) - vd evaluated in the wider
// format; `frm` presumably selects the floating-point rounding mode and `_tu`
// the tail-undisturbed policy -- confirm against the RISC-V vector
// specification.
vfloat32mf2_t __riscv_vfwnmacc_vv_f32mf2_rm_tu(vfloat32mf2_t vd,
                                               vfloat16mf4_t vs1,
                                               vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwnmacc_vf_f32mf2_rm_tu(vfloat32mf2_t vd, _Float16 vs1,
                                               vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwnmacc_vv_f32m1_rm_tu(vfloat32m1_t vd, vfloat16mf2_t vs1,
                                             vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwnmacc_vf_f32m1_rm_tu(vfloat32m1_t vd, _Float16 vs1,
                                             vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwnmacc_vv_f32m2_rm_tu(vfloat32m2_t vd, vfloat16m1_t vs1,
                                             vfloat16m1_t vs2, unsigned int frm,
                                             size_t vl);
vfloat32m2_t __riscv_vfwnmacc_vf_f32m2_rm_tu(vfloat32m2_t vd, _Float16 vs1,
                                             vfloat16m1_t vs2, unsigned int frm,
                                             size_t vl);
vfloat32m4_t __riscv_vfwnmacc_vv_f32m4_rm_tu(vfloat32m4_t vd, vfloat16m2_t vs1,
                                             vfloat16m2_t vs2, unsigned int frm,
                                             size_t vl);
vfloat32m4_t __riscv_vfwnmacc_vf_f32m4_rm_tu(vfloat32m4_t vd, _Float16 vs1,
                                             vfloat16m2_t vs2, unsigned int frm,
                                             size_t vl);
vfloat32m8_t __riscv_vfwnmacc_vv_f32m8_rm_tu(vfloat32m8_t vd, vfloat16m4_t vs1,
                                             vfloat16m4_t vs2, unsigned int frm,
                                             size_t vl);
vfloat32m8_t __riscv_vfwnmacc_vf_f32m8_rm_tu(vfloat32m8_t vd, _Float16 vs1,
                                             vfloat16m4_t vs2, unsigned int frm,
                                             size_t vl);
vfloat64m1_t __riscv_vfwnmacc_vv_f64m1_rm_tu(vfloat64m1_t vd, vfloat32mf2_t vs1,
                                             vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwnmacc_vf_f64m1_rm_tu(vfloat64m1_t vd, float vs1,
                                             vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwnmacc_vv_f64m2_rm_tu(vfloat64m2_t vd, vfloat32m1_t vs1,
                                             vfloat32m1_t vs2, unsigned int frm,
                                             size_t vl);
vfloat64m2_t __riscv_vfwnmacc_vf_f64m2_rm_tu(vfloat64m2_t vd, float vs1,
                                             vfloat32m1_t vs2, unsigned int frm,
                                             size_t vl);
vfloat64m4_t __riscv_vfwnmacc_vv_f64m4_rm_tu(vfloat64m4_t vd, vfloat32m2_t vs1,
                                             vfloat32m2_t vs2, unsigned int frm,
                                             size_t vl);
vfloat64m4_t __riscv_vfwnmacc_vf_f64m4_rm_tu(vfloat64m4_t vd, float vs1,
                                             vfloat32m2_t vs2, unsigned int frm,
                                             size_t vl);
vfloat64m8_t __riscv_vfwnmacc_vv_f64m8_rm_tu(vfloat64m8_t vd, vfloat32m4_t vs1,
                                             vfloat32m4_t vs2, unsigned int frm,
                                             size_t vl);
vfloat64m8_t __riscv_vfwnmacc_vf_f64m8_rm_tu(vfloat64m8_t vd, float vs1,
                                             vfloat32m4_t vs2, unsigned int frm,
                                             size_t vl);
// __riscv_vfwmsac_{vv,vf}_*_rm_tu: these prototypes take no mask argument.
// Arguments are `vd` (same type as the return value), the sources
// `vs1`/`vs2`, an `unsigned int frm`, and `vl`. Sources are one float width
// narrower than the result: _Float16 / vfloat16* for f32 results,
// float / vfloat32* for f64 results. The _vf forms pass `vs1` as a scalar.
// NOTE(review): presumably vd = (vs1 * vs2) - vd evaluated in the wider
// format; `frm` presumably selects the floating-point rounding mode and `_tu`
// the tail-undisturbed policy -- confirm against the RISC-V vector
// specification.
vfloat32mf2_t __riscv_vfwmsac_vv_f32mf2_rm_tu(vfloat32mf2_t vd,
                                              vfloat16mf4_t vs1,
                                              vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwmsac_vf_f32mf2_rm_tu(vfloat32mf2_t vd, _Float16 vs1,
                                              vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmsac_vv_f32m1_rm_tu(vfloat32m1_t vd, vfloat16mf2_t vs1,
                                            vfloat16mf2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m1_t __riscv_vfwmsac_vf_f32m1_rm_tu(vfloat32m1_t vd, _Float16 vs1,
                                            vfloat16mf2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m2_t __riscv_vfwmsac_vv_f32m2_rm_tu(vfloat32m2_t vd, vfloat16m1_t vs1,
                                            vfloat16m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m2_t __riscv_vfwmsac_vf_f32m2_rm_tu(vfloat32m2_t vd, _Float16 vs1,
                                            vfloat16m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m4_t __riscv_vfwmsac_vv_f32m4_rm_tu(vfloat32m4_t vd, vfloat16m2_t vs1,
                                            vfloat16m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m4_t __riscv_vfwmsac_vf_f32m4_rm_tu(vfloat32m4_t vd, _Float16 vs1,
                                            vfloat16m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m8_t __riscv_vfwmsac_vv_f32m8_rm_tu(vfloat32m8_t vd, vfloat16m4_t vs1,
                                            vfloat16m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m8_t __riscv_vfwmsac_vf_f32m8_rm_tu(vfloat32m8_t vd, _Float16 vs1,
                                            vfloat16m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m1_t __riscv_vfwmsac_vv_f64m1_rm_tu(vfloat64m1_t vd, vfloat32mf2_t vs1,
                                            vfloat32mf2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m1_t __riscv_vfwmsac_vf_f64m1_rm_tu(vfloat64m1_t vd, float vs1,
                                            vfloat32mf2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m2_t __riscv_vfwmsac_vv_f64m2_rm_tu(vfloat64m2_t vd, vfloat32m1_t vs1,
                                            vfloat32m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m2_t __riscv_vfwmsac_vf_f64m2_rm_tu(vfloat64m2_t vd, float vs1,
                                            vfloat32m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m4_t __riscv_vfwmsac_vv_f64m4_rm_tu(vfloat64m4_t vd, vfloat32m2_t vs1,
                                            vfloat32m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m4_t __riscv_vfwmsac_vf_f64m4_rm_tu(vfloat64m4_t vd, float vs1,
                                            vfloat32m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m8_t __riscv_vfwmsac_vv_f64m8_rm_tu(vfloat64m8_t vd, vfloat32m4_t vs1,
                                            vfloat32m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m8_t __riscv_vfwmsac_vf_f64m8_rm_tu(vfloat64m8_t vd, float vs1,
                                            vfloat32m4_t vs2, unsigned int frm,
                                            size_t vl);
// __riscv_vfwnmsac_{vv,vf}_*_rm_tu: these prototypes take no mask argument.
// Arguments are `vd` (same type as the return value), the sources
// `vs1`/`vs2`, an `unsigned int frm`, and `vl`. Sources are one float width
// narrower than the result: _Float16 / vfloat16* for f32 results,
// float / vfloat32* for f64 results. The _vf forms pass `vs1` as a scalar.
// NOTE(review): presumably vd = -(vs1 * vs2) + vd evaluated in the wider
// format; `frm` presumably selects the floating-point rounding mode and `_tu`
// the tail-undisturbed policy -- confirm against the RISC-V vector
// specification.
vfloat32mf2_t __riscv_vfwnmsac_vv_f32mf2_rm_tu(vfloat32mf2_t vd,
                                               vfloat16mf4_t vs1,
                                               vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwnmsac_vf_f32mf2_rm_tu(vfloat32mf2_t vd, _Float16 vs1,
                                               vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwnmsac_vv_f32m1_rm_tu(vfloat32m1_t vd, vfloat16mf2_t vs1,
                                             vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwnmsac_vf_f32m1_rm_tu(vfloat32m1_t vd, _Float16 vs1,
                                             vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwnmsac_vv_f32m2_rm_tu(vfloat32m2_t vd, vfloat16m1_t vs1,
                                             vfloat16m1_t vs2, unsigned int frm,
                                             size_t vl);
vfloat32m2_t __riscv_vfwnmsac_vf_f32m2_rm_tu(vfloat32m2_t vd, _Float16 vs1,
                                             vfloat16m1_t vs2, unsigned int frm,
                                             size_t vl);
vfloat32m4_t __riscv_vfwnmsac_vv_f32m4_rm_tu(vfloat32m4_t vd, vfloat16m2_t vs1,
                                             vfloat16m2_t vs2, unsigned int frm,
                                             size_t vl);
vfloat32m4_t __riscv_vfwnmsac_vf_f32m4_rm_tu(vfloat32m4_t vd, _Float16 vs1,
                                             vfloat16m2_t vs2, unsigned int frm,
                                             size_t vl);
vfloat32m8_t __riscv_vfwnmsac_vv_f32m8_rm_tu(vfloat32m8_t vd, vfloat16m4_t vs1,
                                             vfloat16m4_t vs2, unsigned int frm,
                                             size_t vl);
vfloat32m8_t __riscv_vfwnmsac_vf_f32m8_rm_tu(vfloat32m8_t vd, _Float16 vs1,
                                             vfloat16m4_t vs2, unsigned int frm,
                                             size_t vl);
vfloat64m1_t __riscv_vfwnmsac_vv_f64m1_rm_tu(vfloat64m1_t vd, vfloat32mf2_t vs1,
                                             vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwnmsac_vf_f64m1_rm_tu(vfloat64m1_t vd, float vs1,
                                             vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwnmsac_vv_f64m2_rm_tu(vfloat64m2_t vd, vfloat32m1_t vs1,
                                             vfloat32m1_t vs2, unsigned int frm,
                                             size_t vl);
vfloat64m2_t __riscv_vfwnmsac_vf_f64m2_rm_tu(vfloat64m2_t vd, float vs1,
                                             vfloat32m1_t vs2, unsigned int frm,
                                             size_t vl);
vfloat64m4_t __riscv_vfwnmsac_vv_f64m4_rm_tu(vfloat64m4_t vd, vfloat32m2_t vs1,
                                             vfloat32m2_t vs2, unsigned int frm,
                                             size_t vl);
vfloat64m4_t __riscv_vfwnmsac_vf_f64m4_rm_tu(vfloat64m4_t vd, float vs1,
                                             vfloat32m2_t vs2, unsigned int frm,
                                             size_t vl);
vfloat64m8_t __riscv_vfwnmsac_vv_f64m8_rm_tu(vfloat64m8_t vd, vfloat32m4_t vs1,
                                             vfloat32m4_t vs2, unsigned int frm,
                                             size_t vl);
vfloat64m8_t __riscv_vfwnmsac_vf_f64m8_rm_tu(vfloat64m8_t vd, float vs1,
                                             vfloat32m4_t vs2, unsigned int frm,
                                             size_t vl);
// masked functions (`_tum` policy suffix; each takes a leading `vm` mask)
// vfwmacc, masked `_rm_tum` variants.
// Visible in the prototypes: every function takes a leading mask `vm` whose
// type is vboolN_t with N = (element width of vd) / (LMUL of vd), e.g.
// f32mf2 -> vbool64_t, f64m8 -> vbool8_t. The result has the same type as
// `vd`; `vs2` (and `vs1` in `_vv`) are the next narrower float type at half
// the LMUL. `_vf` forms take a scalar `vs1` (`_Float16` or `float`).
// NOTE(review): presumably computes vd = +(vs1 * vs2) + vd on active
// elements, `frm` selects the rounding mode, and `_tum` means
// tail-undisturbed / mask-agnostic -- confirm against the RVV intrinsics spec.
vfloat32mf2_t __riscv_vfwmacc_vv_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                               vfloat16mf4_t vs1,
                                               vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwmacc_vf_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                               _Float16 vs1, vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmacc_vv_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                             vfloat16mf2_t vs1,
                                             vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmacc_vf_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                             _Float16 vs1, vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmacc_vv_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                             vfloat16m1_t vs1, vfloat16m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmacc_vf_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                             _Float16 vs1, vfloat16m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmacc_vv_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                             vfloat16m2_t vs1, vfloat16m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmacc_vf_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                             _Float16 vs1, vfloat16m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmacc_vv_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                             vfloat16m4_t vs1, vfloat16m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmacc_vf_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                             _Float16 vs1, vfloat16m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmacc_vv_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                             vfloat32mf2_t vs1,
                                             vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmacc_vf_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                             float vs1, vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmacc_vv_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                             vfloat32m1_t vs1, vfloat32m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmacc_vf_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                             float vs1, vfloat32m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmacc_vv_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                             vfloat32m2_t vs1, vfloat32m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmacc_vf_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                             float vs1, vfloat32m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmacc_vv_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                             vfloat32m4_t vs1, vfloat32m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmacc_vf_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                             float vs1, vfloat32m4_t vs2,
                                             unsigned int frm, size_t vl);
// vfwnmacc, masked `_rm_tum` variants.
// Visible in the prototypes: leading mask `vm` (vboolN_t, N = element width
// of vd / LMUL of vd); result type equals the type of `vd`; `vs2` (and `vs1`
// in `_vv`) are the next narrower float type at half the LMUL; `_vf` forms
// take a scalar `vs1` (`_Float16` or `float`).
// NOTE(review): presumably computes vd = -(vs1 * vs2) - vd on active
// elements, with `frm` as the rounding mode and `_tum` meaning
// tail-undisturbed / mask-agnostic -- confirm against the RVV intrinsics spec.
vfloat32mf2_t __riscv_vfwnmacc_vv_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                                vfloat16mf4_t vs1,
                                                vfloat16mf4_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwnmacc_vf_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                                _Float16 vs1, vfloat16mf4_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwnmacc_vv_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                              vfloat16mf2_t vs1,
                                              vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwnmacc_vf_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                              _Float16 vs1, vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwnmacc_vv_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                              vfloat16m1_t vs1,
                                              vfloat16m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwnmacc_vf_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                              _Float16 vs1, vfloat16m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwnmacc_vv_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                              vfloat16m2_t vs1,
                                              vfloat16m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwnmacc_vf_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                              _Float16 vs1, vfloat16m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwnmacc_vv_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                              vfloat16m4_t vs1,
                                              vfloat16m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwnmacc_vf_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                              _Float16 vs1, vfloat16m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwnmacc_vv_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                              vfloat32mf2_t vs1,
                                              vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwnmacc_vf_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                              float vs1, vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwnmacc_vv_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                              vfloat32m1_t vs1,
                                              vfloat32m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwnmacc_vf_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                              float vs1, vfloat32m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwnmacc_vv_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                              vfloat32m2_t vs1,
                                              vfloat32m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwnmacc_vf_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                              float vs1, vfloat32m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwnmacc_vv_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                              vfloat32m4_t vs1,
                                              vfloat32m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwnmacc_vf_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                              float vs1, vfloat32m4_t vs2,
                                              unsigned int frm, size_t vl);
// vfwmsac, masked `_rm_tum` variants.
// Visible in the prototypes: leading mask `vm` (vboolN_t, N = element width
// of vd / LMUL of vd); result type equals the type of `vd`; `vs2` (and `vs1`
// in `_vv`) are the next narrower float type at half the LMUL; `_vf` forms
// take a scalar `vs1` (`_Float16` or `float`).
// NOTE(review): presumably computes vd = +(vs1 * vs2) - vd on active
// elements, with `frm` as the rounding mode and `_tum` meaning
// tail-undisturbed / mask-agnostic -- confirm against the RVV intrinsics spec.
vfloat32mf2_t __riscv_vfwmsac_vv_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                               vfloat16mf4_t vs1,
                                               vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwmsac_vf_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                               _Float16 vs1, vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmsac_vv_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                             vfloat16mf2_t vs1,
                                             vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmsac_vf_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                             _Float16 vs1, vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmsac_vv_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                             vfloat16m1_t vs1, vfloat16m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmsac_vf_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                             _Float16 vs1, vfloat16m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmsac_vv_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                             vfloat16m2_t vs1, vfloat16m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmsac_vf_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                             _Float16 vs1, vfloat16m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmsac_vv_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                             vfloat16m4_t vs1, vfloat16m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmsac_vf_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                             _Float16 vs1, vfloat16m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmsac_vv_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                             vfloat32mf2_t vs1,
                                             vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmsac_vf_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                             float vs1, vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmsac_vv_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                             vfloat32m1_t vs1, vfloat32m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmsac_vf_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                             float vs1, vfloat32m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmsac_vv_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                             vfloat32m2_t vs1, vfloat32m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmsac_vf_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                             float vs1, vfloat32m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmsac_vv_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                             vfloat32m4_t vs1, vfloat32m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmsac_vf_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                             float vs1, vfloat32m4_t vs2,
                                             unsigned int frm, size_t vl);
// vfwnmsac, masked `_rm_tum` variants.
// Visible in the prototypes: leading mask `vm` (vboolN_t, N = element width
// of vd / LMUL of vd); result type equals the type of `vd`; `vs2` (and `vs1`
// in `_vv`) are the next narrower float type at half the LMUL; `_vf` forms
// take a scalar `vs1` (`_Float16` or `float`).
// NOTE(review): presumably computes vd = -(vs1 * vs2) + vd on active
// elements, with `frm` as the rounding mode and `_tum` meaning
// tail-undisturbed / mask-agnostic -- confirm against the RVV intrinsics spec.
vfloat32mf2_t __riscv_vfwnmsac_vv_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                                vfloat16mf4_t vs1,
                                                vfloat16mf4_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwnmsac_vf_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                                _Float16 vs1, vfloat16mf4_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwnmsac_vv_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                              vfloat16mf2_t vs1,
                                              vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwnmsac_vf_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                              _Float16 vs1, vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwnmsac_vv_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                              vfloat16m1_t vs1,
                                              vfloat16m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwnmsac_vf_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                              _Float16 vs1, vfloat16m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwnmsac_vv_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                              vfloat16m2_t vs1,
                                              vfloat16m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwnmsac_vf_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                              _Float16 vs1, vfloat16m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwnmsac_vv_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                              vfloat16m4_t vs1,
                                              vfloat16m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwnmsac_vf_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                              _Float16 vs1, vfloat16m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwnmsac_vv_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                              vfloat32mf2_t vs1,
                                              vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwnmsac_vf_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                              float vs1, vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwnmsac_vv_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                              vfloat32m1_t vs1,
                                              vfloat32m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwnmsac_vf_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                              float vs1, vfloat32m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwnmsac_vv_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                              vfloat32m2_t vs1,
                                              vfloat32m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwnmsac_vf_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                              float vs1, vfloat32m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwnmsac_vv_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                              vfloat32m4_t vs1,
                                              vfloat32m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwnmsac_vf_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                              float vs1, vfloat32m4_t vs2,
                                              unsigned int frm, size_t vl);
// masked functions (`_tumu` policy suffix; each takes a leading `vm` mask)
// vfwmacc, masked `_rm_tumu` variants.
// Visible in the prototypes: leading mask `vm` (vboolN_t, N = element width
// of vd / LMUL of vd); result type equals the type of `vd`; `vs2` (and `vs1`
// in `_vv`) are the next narrower float type at half the LMUL; `_vf` forms
// take a scalar `vs1` (`_Float16` or `float`).
// NOTE(review): presumably computes vd = +(vs1 * vs2) + vd on active
// elements, with `frm` as the rounding mode and `_tumu` meaning
// tail-undisturbed / mask-undisturbed -- confirm against the RVV intrinsics
// spec.
vfloat32mf2_t __riscv_vfwmacc_vv_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                                vfloat16mf4_t vs1,
                                                vfloat16mf4_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwmacc_vf_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                                _Float16 vs1, vfloat16mf4_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmacc_vv_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                              vfloat16mf2_t vs1,
                                              vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmacc_vf_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                              _Float16 vs1, vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmacc_vv_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                              vfloat16m1_t vs1,
                                              vfloat16m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmacc_vf_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                              _Float16 vs1, vfloat16m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmacc_vv_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                              vfloat16m2_t vs1,
                                              vfloat16m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmacc_vf_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                              _Float16 vs1, vfloat16m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmacc_vv_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                              vfloat16m4_t vs1,
                                              vfloat16m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmacc_vf_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                              _Float16 vs1, vfloat16m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmacc_vv_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                              vfloat32mf2_t vs1,
                                              vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmacc_vf_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                              float vs1, vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmacc_vv_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                              vfloat32m1_t vs1,
                                              vfloat32m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmacc_vf_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                              float vs1, vfloat32m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmacc_vv_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                              vfloat32m2_t vs1,
                                              vfloat32m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmacc_vf_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                              float vs1, vfloat32m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmacc_vv_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                              vfloat32m4_t vs1,
                                              vfloat32m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmacc_vf_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                              float vs1, vfloat32m4_t vs2,
                                              unsigned int frm, size_t vl);
// vfwnmacc, masked `_rm_tumu` variants.
// Visible in the prototypes: leading mask `vm` (vboolN_t, N = element width
// of vd / LMUL of vd); result type equals the type of `vd`; `vs2` (and `vs1`
// in `_vv`) are the next narrower float type at half the LMUL; `_vf` forms
// take a scalar `vs1` (`_Float16` or `float`).
// NOTE(review): presumably computes vd = -(vs1 * vs2) - vd on active
// elements, with `frm` as the rounding mode and `_tumu` meaning
// tail-undisturbed / mask-undisturbed -- confirm against the RVV intrinsics
// spec.
vfloat32mf2_t __riscv_vfwnmacc_vv_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                                 vfloat16mf4_t vs1,
                                                 vfloat16mf4_t vs2,
                                                 unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwnmacc_vf_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                                 _Float16 vs1,
                                                 vfloat16mf4_t vs2,
                                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwnmacc_vv_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                               vfloat16mf2_t vs1,
                                               vfloat16mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwnmacc_vf_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                               _Float16 vs1, vfloat16mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwnmacc_vv_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                               vfloat16m1_t vs1,
                                               vfloat16m1_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwnmacc_vf_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                               _Float16 vs1, vfloat16m1_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwnmacc_vv_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                               vfloat16m2_t vs1,
                                               vfloat16m2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwnmacc_vf_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                               _Float16 vs1, vfloat16m2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwnmacc_vv_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                               vfloat16m4_t vs1,
                                               vfloat16m4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwnmacc_vf_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                               _Float16 vs1, vfloat16m4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwnmacc_vv_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                               vfloat32mf2_t vs1,
                                               vfloat32mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwnmacc_vf_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                               float vs1, vfloat32mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwnmacc_vv_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                               vfloat32m1_t vs1,
                                               vfloat32m1_t vs2,
                                               unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwnmacc_vf_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                               float vs1, vfloat32m1_t vs2,
                                               unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwnmacc_vv_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                               vfloat32m2_t vs1,
                                               vfloat32m2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwnmacc_vf_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                               float vs1, vfloat32m2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwnmacc_vv_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                               vfloat32m4_t vs1,
                                               vfloat32m4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwnmacc_vf_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                               float vs1, vfloat32m4_t vs2,
                                               unsigned int frm, size_t vl);
// vfwmsac, masked `_rm_tumu` variants.
// Visible in the prototypes: leading mask `vm` (vboolN_t, N = element width
// of vd / LMUL of vd); result type equals the type of `vd`; `vs2` (and `vs1`
// in `_vv`) are the next narrower float type at half the LMUL; `_vf` forms
// take a scalar `vs1` (`_Float16` or `float`).
// NOTE(review): presumably computes vd = +(vs1 * vs2) - vd on active
// elements, with `frm` as the rounding mode and `_tumu` meaning
// tail-undisturbed / mask-undisturbed -- confirm against the RVV intrinsics
// spec.
vfloat32mf2_t __riscv_vfwmsac_vv_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                                vfloat16mf4_t vs1,
                                                vfloat16mf4_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwmsac_vf_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                                _Float16 vs1, vfloat16mf4_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmsac_vv_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                              vfloat16mf2_t vs1,
                                              vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmsac_vf_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                              _Float16 vs1, vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmsac_vv_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                              vfloat16m1_t vs1,
                                              vfloat16m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmsac_vf_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                              _Float16 vs1, vfloat16m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmsac_vv_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                              vfloat16m2_t vs1,
                                              vfloat16m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmsac_vf_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                              _Float16 vs1, vfloat16m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmsac_vv_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                              vfloat16m4_t vs1,
                                              vfloat16m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmsac_vf_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                              _Float16 vs1, vfloat16m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmsac_vv_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                              vfloat32mf2_t vs1,
                                              vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmsac_vf_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                              float vs1, vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmsac_vv_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                              vfloat32m1_t vs1,
                                              vfloat32m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmsac_vf_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                              float vs1, vfloat32m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmsac_vv_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                              vfloat32m2_t vs1,
                                              vfloat32m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmsac_vf_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                              float vs1, vfloat32m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmsac_vv_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                              vfloat32m4_t vs1,
                                              vfloat32m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmsac_vf_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                              float vs1, vfloat32m4_t vs2,
                                              unsigned int frm, size_t vl);
// vfwnmsac, masked `_rm_tumu` variants (start of the run).
// Visible in the prototypes: leading mask `vm` (vboolN_t, N = element width
// of vd / LMUL of vd); result type equals the type of `vd`; `vs2` (and `vs1`
// in `_vv`) are the next narrower float type at half the LMUL; `_vf` forms
// take a scalar `_Float16` `vs1`.
// NOTE(review): presumably computes vd = -(vs1 * vs2) + vd on active
// elements, with `frm` as the rounding mode and `_tumu` meaning
// tail-undisturbed / mask-undisturbed -- confirm against the RVV intrinsics
// spec.
vfloat32mf2_t __riscv_vfwnmsac_vv_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                                 vfloat16mf4_t vs1,
                                                 vfloat16mf4_t vs2,
                                                 unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwnmsac_vf_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                                 _Float16 vs1,
                                                 vfloat16mf4_t vs2,
                                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwnmsac_vv_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                               vfloat16mf2_t vs1,
                                               vfloat16mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwnmsac_vf_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                               _Float16 vs1, vfloat16mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwnmsac_vv_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                               vfloat16m1_t vs1,
                                               vfloat16m1_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwnmsac_vf_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                               _Float16 vs1, vfloat16m1_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwnmsac_vv_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                               vfloat16m2_t vs1,
                                               vfloat16m2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwnmsac_vf_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                               _Float16 vs1, vfloat16m2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwnmsac_vv_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                               vfloat16m4_t vs1,
                                               vfloat16m4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwnmsac_vf_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                               _Float16 vs1, vfloat16m4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwnmsac_vv_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                               vfloat32mf2_t vs1,
                                               vfloat32mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwnmsac_vf_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                               float vs1, vfloat32mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwnmsac_vv_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                               vfloat32m1_t vs1,
                                               vfloat32m1_t vs2,
                                               unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwnmsac_vf_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                               float vs1, vfloat32m1_t vs2,
                                               unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwnmsac_vv_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                               vfloat32m2_t vs1,
                                               vfloat32m2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwnmsac_vf_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                               float vs1, vfloat32m2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwnmsac_vv_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                               vfloat32m4_t vs1,
                                               vfloat32m4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwnmsac_vf_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                               float vs1, vfloat32m4_t vs2,
                                               unsigned int frm, size_t vl);
// masked functions: __riscv_vfwmacc_{vv,vf}_*_rm_mu.
// Every overload takes a mask `vm`, a `vd` operand whose type equals the
// return type, two sources `vs1`/`vs2` whose element type is one step
// narrower than `vd` (f16 for f32 results, f32 for f64 results), an
// `unsigned int frm` and a `size_t vl`. `_vv` overloads pass `vs1` as a
// vector, `_vf` overloads pass it as a scalar (`_Float16` or `float`).
// NOTE(review): `frm` presumably carries the rounding mode (`_rm` suffix) and
// `_mu` presumably names the mask policy -- confirm against the RISC-V Vector
// Extension specification.
vfloat32mf2_t __riscv_vfwmacc_vv_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat16mf4_t vs1,
                                              vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwmacc_vf_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                              _Float16 vs1, vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmacc_vv_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat16mf2_t vs1,
                                            vfloat16mf2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m1_t __riscv_vfwmacc_vf_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                            _Float16 vs1, vfloat16mf2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmacc_vv_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat16m1_t vs1, vfloat16m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmacc_vf_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                            _Float16 vs1, vfloat16m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmacc_vv_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat16m2_t vs1, vfloat16m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmacc_vf_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                            _Float16 vs1, vfloat16m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmacc_vv_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat16m4_t vs1, vfloat16m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmacc_vf_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                            _Float16 vs1, vfloat16m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmacc_vv_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat32mf2_t vs1,
                                            vfloat32mf2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m1_t __riscv_vfwmacc_vf_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                            float vs1, vfloat32mf2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmacc_vv_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat32m1_t vs1, vfloat32m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmacc_vf_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                            float vs1, vfloat32m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmacc_vv_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat32m2_t vs1, vfloat32m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmacc_vf_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                            float vs1, vfloat32m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmacc_vv_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat32m4_t vs1, vfloat32m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmacc_vf_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                            float vs1, vfloat32m4_t vs2,
                                            unsigned int frm, size_t vl);
// __riscv_vfwnmacc_{vv,vf}_*_rm_mu prototypes. Every overload takes a mask
// `vm`, a `vd` operand whose type equals the return type, two sources
// `vs1`/`vs2` whose element type is one step narrower than `vd` (f16 for f32
// results, f32 for f64 results), an `unsigned int frm` and a `size_t vl`.
// `_vv` overloads pass `vs1` as a vector, `_vf` overloads pass it as a scalar
// (`_Float16` or `float`).
// NOTE(review): `frm` presumably carries the rounding mode (`_rm` suffix) --
// confirm against the RISC-V Vector Extension specification.
vfloat32mf2_t __riscv_vfwnmacc_vv_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                               vfloat16mf4_t vs1,
                                               vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwnmacc_vf_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                               _Float16 vs1, vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwnmacc_vv_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                             vfloat16mf2_t vs1,
                                             vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwnmacc_vf_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                             _Float16 vs1, vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwnmacc_vv_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                             vfloat16m1_t vs1, vfloat16m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwnmacc_vf_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                             _Float16 vs1, vfloat16m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwnmacc_vv_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                             vfloat16m2_t vs1, vfloat16m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwnmacc_vf_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                             _Float16 vs1, vfloat16m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwnmacc_vv_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                             vfloat16m4_t vs1, vfloat16m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwnmacc_vf_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                             _Float16 vs1, vfloat16m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwnmacc_vv_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                             vfloat32mf2_t vs1,
                                             vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwnmacc_vf_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                             float vs1, vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwnmacc_vv_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                             vfloat32m1_t vs1, vfloat32m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwnmacc_vf_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                             float vs1, vfloat32m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwnmacc_vv_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                             vfloat32m2_t vs1, vfloat32m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwnmacc_vf_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                             float vs1, vfloat32m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwnmacc_vv_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                             vfloat32m4_t vs1, vfloat32m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwnmacc_vf_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                             float vs1, vfloat32m4_t vs2,
                                             unsigned int frm, size_t vl);
// __riscv_vfwmsac_{vv,vf}_*_rm_mu prototypes. Every overload takes a mask
// `vm`, a `vd` operand whose type equals the return type, two sources
// `vs1`/`vs2` whose element type is one step narrower than `vd` (f16 for f32
// results, f32 for f64 results), an `unsigned int frm` and a `size_t vl`.
// `_vv` overloads pass `vs1` as a vector, `_vf` overloads pass it as a scalar
// (`_Float16` or `float`).
// NOTE(review): `frm` presumably carries the rounding mode (`_rm` suffix) --
// confirm against the RISC-V Vector Extension specification.
vfloat32mf2_t __riscv_vfwmsac_vv_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat16mf4_t vs1,
                                              vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwmsac_vf_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                              _Float16 vs1, vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmsac_vv_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat16mf2_t vs1,
                                            vfloat16mf2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m1_t __riscv_vfwmsac_vf_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                            _Float16 vs1, vfloat16mf2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmsac_vv_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat16m1_t vs1, vfloat16m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmsac_vf_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                            _Float16 vs1, vfloat16m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmsac_vv_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat16m2_t vs1, vfloat16m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmsac_vf_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                            _Float16 vs1, vfloat16m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmsac_vv_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat16m4_t vs1, vfloat16m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmsac_vf_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                            _Float16 vs1, vfloat16m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmsac_vv_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat32mf2_t vs1,
                                            vfloat32mf2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m1_t __riscv_vfwmsac_vf_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                            float vs1, vfloat32mf2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmsac_vv_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat32m1_t vs1, vfloat32m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmsac_vf_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                            float vs1, vfloat32m1_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmsac_vv_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat32m2_t vs1, vfloat32m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmsac_vf_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                            float vs1, vfloat32m2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmsac_vv_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat32m4_t vs1, vfloat32m4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmsac_vf_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                            float vs1, vfloat32m4_t vs2,
                                            unsigned int frm, size_t vl);
// __riscv_vfwnmsac_{vv,vf}_*_rm_mu prototypes. Every overload takes a mask
// `vm`, a `vd` operand whose type equals the return type, two sources
// `vs1`/`vs2` whose element type is one step narrower than `vd` (f16 for f32
// results, f32 for f64 results), an `unsigned int frm` and a `size_t vl`.
// `_vv` overloads pass `vs1` as a vector, `_vf` overloads pass it as a scalar
// (`_Float16` or `float`).
// NOTE(review): `frm` presumably carries the rounding mode (`_rm` suffix) --
// confirm against the RISC-V Vector Extension specification.
vfloat32mf2_t __riscv_vfwnmsac_vv_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                               vfloat16mf4_t vs1,
                                               vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwnmsac_vf_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                               _Float16 vs1, vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwnmsac_vv_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                             vfloat16mf2_t vs1,
                                             vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwnmsac_vf_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                             _Float16 vs1, vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwnmsac_vv_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                             vfloat16m1_t vs1, vfloat16m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwnmsac_vf_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                             _Float16 vs1, vfloat16m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwnmsac_vv_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                             vfloat16m2_t vs1, vfloat16m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwnmsac_vf_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                             _Float16 vs1, vfloat16m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwnmsac_vv_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                             vfloat16m4_t vs1, vfloat16m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwnmsac_vf_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                             _Float16 vs1, vfloat16m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwnmsac_vv_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                             vfloat32mf2_t vs1,
                                             vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwnmsac_vf_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                             float vs1, vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwnmsac_vv_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                             vfloat32m1_t vs1, vfloat32m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwnmsac_vf_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                             float vs1, vfloat32m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwnmsac_vv_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                             vfloat32m2_t vs1, vfloat32m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwnmsac_vf_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                             float vs1, vfloat32m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwnmsac_vv_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                             vfloat32m4_t vs1, vfloat32m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwnmsac_vf_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                             float vs1, vfloat32m4_t vs2,
                                             unsigned int frm, size_t vl);

Vector Floating-Point Square-Root Intrinsics

// unmasked functions: __riscv_vfsqrt_v_*_tu.
// Every overload takes `vd` and a single source `vs2`, both of the same
// vector type as the return value, followed by a `size_t vl`. There is no
// mask operand and no `frm` argument in this group.
// NOTE(review): `_tu` presumably names the tail policy applied to `vd` --
// confirm against the RISC-V Vector Extension specification.
vfloat16mf4_t __riscv_vfsqrt_v_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                         size_t vl);
vfloat16mf2_t __riscv_vfsqrt_v_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                         size_t vl);
vfloat16m1_t __riscv_vfsqrt_v_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                       size_t vl);
vfloat16m2_t __riscv_vfsqrt_v_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                       size_t vl);
vfloat16m4_t __riscv_vfsqrt_v_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                       size_t vl);
vfloat16m8_t __riscv_vfsqrt_v_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                       size_t vl);
vfloat32mf2_t __riscv_vfsqrt_v_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                         size_t vl);
vfloat32m1_t __riscv_vfsqrt_v_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                       size_t vl);
vfloat32m2_t __riscv_vfsqrt_v_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                       size_t vl);
vfloat32m4_t __riscv_vfsqrt_v_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                       size_t vl);
vfloat32m8_t __riscv_vfsqrt_v_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                       size_t vl);
vfloat64m1_t __riscv_vfsqrt_v_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                       size_t vl);
vfloat64m2_t __riscv_vfsqrt_v_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                       size_t vl);
vfloat64m4_t __riscv_vfsqrt_v_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                       size_t vl);
vfloat64m8_t __riscv_vfsqrt_v_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                       size_t vl);
// masked functions: __riscv_vfsqrt_v_*_tum.
// Every overload takes a mask `vm` (vbool2_t .. vbool64_t, chosen per result
// type), then `vd` and a single source `vs2` of the same vector type as the
// return value, and finally a `size_t vl`.
// NOTE(review): `_tum` presumably names the tail/mask policy -- confirm
// against the RISC-V Vector Extension specification.
vfloat16mf4_t __riscv_vfsqrt_v_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                          vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfsqrt_v_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                          vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfsqrt_v_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                        vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfsqrt_v_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                        vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfsqrt_v_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                        vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfsqrt_v_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                        vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfsqrt_v_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfsqrt_v_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfsqrt_v_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfsqrt_v_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfsqrt_v_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfsqrt_v_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfsqrt_v_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfsqrt_v_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfsqrt_v_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat64m8_t vs2, size_t vl);
// masked functions: __riscv_vfsqrt_v_*_tumu.
// Every overload takes a mask `vm` (vbool2_t .. vbool64_t, chosen per result
// type), then `vd` and a single source `vs2` of the same vector type as the
// return value, and finally a `size_t vl`.
// NOTE(review): `_tumu` presumably names the tail/mask policy -- confirm
// against the RISC-V Vector Extension specification.
vfloat16mf4_t __riscv_vfsqrt_v_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                           vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfsqrt_v_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                           vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfsqrt_v_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                         vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfsqrt_v_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                         vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfsqrt_v_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                         vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfsqrt_v_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                         vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfsqrt_v_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfsqrt_v_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfsqrt_v_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfsqrt_v_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfsqrt_v_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfsqrt_v_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfsqrt_v_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfsqrt_v_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfsqrt_v_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs2, size_t vl);
// masked functions: __riscv_vfsqrt_v_*_mu.
// Every overload takes a mask `vm` (vbool2_t .. vbool64_t, chosen per result
// type), then `vd` and a single source `vs2` of the same vector type as the
// return value, and finally a `size_t vl`.
// NOTE(review): `_mu` presumably names the mask policy -- confirm against the
// RISC-V Vector Extension specification.
vfloat16mf4_t __riscv_vfsqrt_v_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                         vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfsqrt_v_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                         vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfsqrt_v_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                       vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfsqrt_v_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                       vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfsqrt_v_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                       vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfsqrt_v_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                       vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfsqrt_v_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                         vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfsqrt_v_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                       vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfsqrt_v_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                       vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfsqrt_v_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                       vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfsqrt_v_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                       vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfsqrt_v_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                       vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfsqrt_v_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                       vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfsqrt_v_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                       vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfsqrt_v_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                       vfloat64m8_t vs2, size_t vl);
// unmasked functions with an explicit `frm` argument: __riscv_vfsqrt_v_*_rm_tu.
// Every overload takes `vd` and a single source `vs2`, both of the same
// vector type as the return value, then an `unsigned int frm` and a
// `size_t vl`. There is no mask operand in this group.
// NOTE(review): `frm` is presumably the rounding mode implied by the `_rm`
// suffix -- confirm against the RISC-V Vector Extension specification.
vfloat16mf4_t __riscv_vfsqrt_v_f16mf4_rm_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfsqrt_v_f16mf2_rm_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfsqrt_v_f16m1_rm_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                          unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfsqrt_v_f16m2_rm_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                          unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfsqrt_v_f16m4_rm_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                          unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfsqrt_v_f16m8_rm_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                          unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfsqrt_v_f32mf2_rm_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfsqrt_v_f32m1_rm_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                          unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfsqrt_v_f32m2_rm_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                          unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfsqrt_v_f32m4_rm_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                          unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfsqrt_v_f32m8_rm_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                          unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfsqrt_v_f64m1_rm_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                          unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfsqrt_v_f64m2_rm_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                          unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfsqrt_v_f64m4_rm_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                          unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfsqrt_v_f64m8_rm_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                          unsigned int frm, size_t vl);
// masked functions
vfloat16mf4_t __riscv_vfsqrt_v_f16mf4_rm_tum(vbool64_t vm, vfloat16mf4_t vd,
                                             vfloat16mf4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfsqrt_v_f16mf2_rm_tum(vbool32_t vm, vfloat16mf2_t vd,
                                             vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfsqrt_v_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                           vfloat16m1_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m2_t __riscv_vfsqrt_v_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                           vfloat16m2_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m4_t __riscv_vfsqrt_v_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                           vfloat16m4_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m8_t __riscv_vfsqrt_v_f16m8_rm_tum(vbool2_t vm, vfloat16m8_t vd,
                                           vfloat16m8_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32mf2_t __riscv_vfsqrt_v_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfsqrt_v_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat32m1_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m2_t __riscv_vfsqrt_v_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat32m2_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m4_t __riscv_vfsqrt_v_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat32m4_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m8_t __riscv_vfsqrt_v_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat32m8_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m1_t __riscv_vfsqrt_v_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat64m1_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m2_t __riscv_vfsqrt_v_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat64m2_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m4_t __riscv_vfsqrt_v_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat64m4_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m8_t __riscv_vfsqrt_v_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat64m8_t vs2, unsigned int frm,
                                           size_t vl);
// masked functions
vfloat16mf4_t __riscv_vfsqrt_v_f16mf4_rm_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                              vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfsqrt_v_f16mf2_rm_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                              vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfsqrt_v_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                            vfloat16m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m2_t __riscv_vfsqrt_v_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                            vfloat16m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m4_t __riscv_vfsqrt_v_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                            vfloat16m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m8_t __riscv_vfsqrt_v_f16m8_rm_tumu(vbool2_t vm, vfloat16m8_t vd,
                                            vfloat16m8_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32mf2_t __riscv_vfsqrt_v_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfsqrt_v_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat32m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m2_t __riscv_vfsqrt_v_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat32m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m4_t __riscv_vfsqrt_v_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat32m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m8_t __riscv_vfsqrt_v_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat32m8_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m1_t __riscv_vfsqrt_v_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat64m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m2_t __riscv_vfsqrt_v_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat64m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m4_t __riscv_vfsqrt_v_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat64m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m8_t __riscv_vfsqrt_v_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat64m8_t vs2, unsigned int frm,
                                            size_t vl);
// masked functions
vfloat16mf4_t __riscv_vfsqrt_v_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                            vfloat16mf4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16mf2_t __riscv_vfsqrt_v_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                            vfloat16mf2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m1_t __riscv_vfsqrt_v_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                          vfloat16m1_t vs2, unsigned int frm,
                                          size_t vl);
vfloat16m2_t __riscv_vfsqrt_v_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                          vfloat16m2_t vs2, unsigned int frm,
                                          size_t vl);
vfloat16m4_t __riscv_vfsqrt_v_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                          vfloat16m4_t vs2, unsigned int frm,
                                          size_t vl);
vfloat16m8_t __riscv_vfsqrt_v_f16m8_rm_mu(vbool2_t vm, vfloat16m8_t vd,
                                          vfloat16m8_t vs2, unsigned int frm,
                                          size_t vl);
vfloat32mf2_t __riscv_vfsqrt_v_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m1_t __riscv_vfsqrt_v_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs2, unsigned int frm,
                                          size_t vl);
vfloat32m2_t __riscv_vfsqrt_v_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs2, unsigned int frm,
                                          size_t vl);
vfloat32m4_t __riscv_vfsqrt_v_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs2, unsigned int frm,
                                          size_t vl);
vfloat32m8_t __riscv_vfsqrt_v_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs2, unsigned int frm,
                                          size_t vl);
vfloat64m1_t __riscv_vfsqrt_v_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs2, unsigned int frm,
                                          size_t vl);
vfloat64m2_t __riscv_vfsqrt_v_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs2, unsigned int frm,
                                          size_t vl);
vfloat64m4_t __riscv_vfsqrt_v_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs2, unsigned int frm,
                                          size_t vl);
vfloat64m8_t __riscv_vfsqrt_v_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs2, unsigned int frm,
                                          size_t vl);

Vector Floating-Point Reciprocal Square-Root Estimate Intrinsics

vfloat16mf4_t __riscv_vfrsqrt7_v_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                           size_t vl);
vfloat16mf2_t __riscv_vfrsqrt7_v_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                           size_t vl);
vfloat16m1_t __riscv_vfrsqrt7_v_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                         size_t vl);
vfloat16m2_t __riscv_vfrsqrt7_v_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                         size_t vl);
vfloat16m4_t __riscv_vfrsqrt7_v_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                         size_t vl);
vfloat16m8_t __riscv_vfrsqrt7_v_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                         size_t vl);
vfloat32mf2_t __riscv_vfrsqrt7_v_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                           size_t vl);
vfloat32m1_t __riscv_vfrsqrt7_v_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                         size_t vl);
vfloat32m2_t __riscv_vfrsqrt7_v_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                         size_t vl);
vfloat32m4_t __riscv_vfrsqrt7_v_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                         size_t vl);
vfloat32m8_t __riscv_vfrsqrt7_v_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                         size_t vl);
vfloat64m1_t __riscv_vfrsqrt7_v_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                         size_t vl);
vfloat64m2_t __riscv_vfrsqrt7_v_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                         size_t vl);
vfloat64m4_t __riscv_vfrsqrt7_v_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                         size_t vl);
vfloat64m8_t __riscv_vfrsqrt7_v_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                         size_t vl);
// masked functions
vfloat16mf4_t __riscv_vfrsqrt7_v_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                            vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfrsqrt7_v_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                            vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfrsqrt7_v_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                          vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfrsqrt7_v_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                          vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfrsqrt7_v_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                          vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfrsqrt7_v_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                          vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfrsqrt7_v_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfrsqrt7_v_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfrsqrt7_v_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfrsqrt7_v_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfrsqrt7_v_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfrsqrt7_v_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfrsqrt7_v_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfrsqrt7_v_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfrsqrt7_v_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs2, size_t vl);
// masked functions
vfloat16mf4_t __riscv_vfrsqrt7_v_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                             vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfrsqrt7_v_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                             vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfrsqrt7_v_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                           vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfrsqrt7_v_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                           vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfrsqrt7_v_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                           vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfrsqrt7_v_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                           vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfrsqrt7_v_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfrsqrt7_v_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfrsqrt7_v_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfrsqrt7_v_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfrsqrt7_v_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfrsqrt7_v_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfrsqrt7_v_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfrsqrt7_v_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfrsqrt7_v_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat64m8_t vs2, size_t vl);
// masked functions
vfloat16mf4_t __riscv_vfrsqrt7_v_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                           vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfrsqrt7_v_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                           vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfrsqrt7_v_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                         vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfrsqrt7_v_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                         vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfrsqrt7_v_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                         vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfrsqrt7_v_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                         vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfrsqrt7_v_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfrsqrt7_v_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfrsqrt7_v_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfrsqrt7_v_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfrsqrt7_v_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfrsqrt7_v_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfrsqrt7_v_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfrsqrt7_v_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfrsqrt7_v_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs2, size_t vl);

Vector Floating-Point Reciprocal Estimate Intrinsics

vfloat16mf4_t __riscv_vfrec7_v_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                         size_t vl);
vfloat16mf2_t __riscv_vfrec7_v_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                         size_t vl);
vfloat16m1_t __riscv_vfrec7_v_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                       size_t vl);
vfloat16m2_t __riscv_vfrec7_v_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                       size_t vl);
vfloat16m4_t __riscv_vfrec7_v_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                       size_t vl);
vfloat16m8_t __riscv_vfrec7_v_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                       size_t vl);
vfloat32mf2_t __riscv_vfrec7_v_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                         size_t vl);
vfloat32m1_t __riscv_vfrec7_v_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                       size_t vl);
vfloat32m2_t __riscv_vfrec7_v_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                       size_t vl);
vfloat32m4_t __riscv_vfrec7_v_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                       size_t vl);
vfloat32m8_t __riscv_vfrec7_v_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                       size_t vl);
vfloat64m1_t __riscv_vfrec7_v_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                       size_t vl);
vfloat64m2_t __riscv_vfrec7_v_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                       size_t vl);
vfloat64m4_t __riscv_vfrec7_v_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                       size_t vl);
vfloat64m8_t __riscv_vfrec7_v_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                       size_t vl);
// masked functions
vfloat16mf4_t __riscv_vfrec7_v_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                          vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfrec7_v_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                          vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfrec7_v_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                        vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfrec7_v_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                        vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfrec7_v_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                        vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfrec7_v_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                        vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfrec7_v_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfrec7_v_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfrec7_v_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfrec7_v_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfrec7_v_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfrec7_v_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfrec7_v_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfrec7_v_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfrec7_v_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat64m8_t vs2, size_t vl);
// masked functions
vfloat16mf4_t __riscv_vfrec7_v_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                           vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfrec7_v_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                           vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfrec7_v_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                         vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfrec7_v_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                         vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfrec7_v_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                         vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfrec7_v_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                         vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfrec7_v_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfrec7_v_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfrec7_v_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfrec7_v_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfrec7_v_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfrec7_v_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfrec7_v_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfrec7_v_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfrec7_v_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs2, size_t vl);
// masked functions
vfloat16mf4_t __riscv_vfrec7_v_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                         vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfrec7_v_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                         vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfrec7_v_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                       vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfrec7_v_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                       vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfrec7_v_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                       vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfrec7_v_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                       vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfrec7_v_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                         vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfrec7_v_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                       vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfrec7_v_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                       vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfrec7_v_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                       vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfrec7_v_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                       vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfrec7_v_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                       vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfrec7_v_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                       vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfrec7_v_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                       vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfrec7_v_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                       vfloat64m8_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfrec7_v_f16mf4_rm_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfrec7_v_f16mf2_rm_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfrec7_v_f16m1_rm_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                          unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfrec7_v_f16m2_rm_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                          unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfrec7_v_f16m4_rm_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                          unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfrec7_v_f16m8_rm_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                          unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfrec7_v_f32mf2_rm_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                            unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfrec7_v_f32m1_rm_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                          unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfrec7_v_f32m2_rm_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                          unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfrec7_v_f32m4_rm_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                          unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfrec7_v_f32m8_rm_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                          unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfrec7_v_f64m1_rm_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                          unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfrec7_v_f64m2_rm_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                          unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfrec7_v_f64m4_rm_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                          unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfrec7_v_f64m8_rm_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                          unsigned int frm, size_t vl);
// masked functions
vfloat16mf4_t __riscv_vfrec7_v_f16mf4_rm_tum(vbool64_t vm, vfloat16mf4_t vd,
                                             vfloat16mf4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfrec7_v_f16mf2_rm_tum(vbool32_t vm, vfloat16mf2_t vd,
                                             vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfrec7_v_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                           vfloat16m1_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m2_t __riscv_vfrec7_v_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                           vfloat16m2_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m4_t __riscv_vfrec7_v_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                           vfloat16m4_t vs2, unsigned int frm,
                                           size_t vl);
vfloat16m8_t __riscv_vfrec7_v_f16m8_rm_tum(vbool2_t vm, vfloat16m8_t vd,
                                           vfloat16m8_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32mf2_t __riscv_vfrec7_v_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfrec7_v_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat32m1_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m2_t __riscv_vfrec7_v_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat32m2_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m4_t __riscv_vfrec7_v_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat32m4_t vs2, unsigned int frm,
                                           size_t vl);
vfloat32m8_t __riscv_vfrec7_v_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat32m8_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m1_t __riscv_vfrec7_v_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat64m1_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m2_t __riscv_vfrec7_v_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat64m2_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m4_t __riscv_vfrec7_v_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat64m4_t vs2, unsigned int frm,
                                           size_t vl);
vfloat64m8_t __riscv_vfrec7_v_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat64m8_t vs2, unsigned int frm,
                                           size_t vl);
// masked functions: vfrec7 with an explicit rounding-mode operand (`_rm`),
// `_tumu` policy (tail undisturbed, mask undisturbed).
// Operands: mask `vm`, destination operand `vd`, source vector `vs2`,
// rounding mode `frm`, vector length `vl`.
// The mask type vboolN_t follows the element-width/LMUL ratio of the data type
// (e.g. f16mf4 -> vbool64_t, f64m8 -> vbool8_t).
vfloat16mf4_t __riscv_vfrec7_v_f16mf4_rm_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                              vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfrec7_v_f16mf2_rm_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                              vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfrec7_v_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                            vfloat16m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m2_t __riscv_vfrec7_v_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                            vfloat16m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m4_t __riscv_vfrec7_v_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                            vfloat16m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m8_t __riscv_vfrec7_v_f16m8_rm_tumu(vbool2_t vm, vfloat16m8_t vd,
                                            vfloat16m8_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32mf2_t __riscv_vfrec7_v_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfrec7_v_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat32m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m2_t __riscv_vfrec7_v_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat32m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m4_t __riscv_vfrec7_v_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat32m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m8_t __riscv_vfrec7_v_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat32m8_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m1_t __riscv_vfrec7_v_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat64m1_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m2_t __riscv_vfrec7_v_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat64m2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m4_t __riscv_vfrec7_v_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat64m4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat64m8_t __riscv_vfrec7_v_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat64m8_t vs2, unsigned int frm,
                                            size_t vl);
// masked functions: vfrec7 with an explicit rounding-mode operand (`_rm`),
// `_mu` policy (tail agnostic, mask undisturbed).
// Operands: mask `vm`, destination operand `vd`, source vector `vs2`,
// rounding mode `frm`, vector length `vl`.
// The mask type vboolN_t follows the element-width/LMUL ratio of the data type
// (e.g. f16mf4 -> vbool64_t, f64m8 -> vbool8_t).
vfloat16mf4_t __riscv_vfrec7_v_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                            vfloat16mf4_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16mf2_t __riscv_vfrec7_v_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                            vfloat16mf2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat16m1_t __riscv_vfrec7_v_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                          vfloat16m1_t vs2, unsigned int frm,
                                          size_t vl);
vfloat16m2_t __riscv_vfrec7_v_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                          vfloat16m2_t vs2, unsigned int frm,
                                          size_t vl);
vfloat16m4_t __riscv_vfrec7_v_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                          vfloat16m4_t vs2, unsigned int frm,
                                          size_t vl);
vfloat16m8_t __riscv_vfrec7_v_f16m8_rm_mu(vbool2_t vm, vfloat16m8_t vd,
                                          vfloat16m8_t vs2, unsigned int frm,
                                          size_t vl);
vfloat32mf2_t __riscv_vfrec7_v_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs2, unsigned int frm,
                                            size_t vl);
vfloat32m1_t __riscv_vfrec7_v_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs2, unsigned int frm,
                                          size_t vl);
vfloat32m2_t __riscv_vfrec7_v_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs2, unsigned int frm,
                                          size_t vl);
vfloat32m4_t __riscv_vfrec7_v_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs2, unsigned int frm,
                                          size_t vl);
vfloat32m8_t __riscv_vfrec7_v_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs2, unsigned int frm,
                                          size_t vl);
vfloat64m1_t __riscv_vfrec7_v_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs2, unsigned int frm,
                                          size_t vl);
vfloat64m2_t __riscv_vfrec7_v_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs2, unsigned int frm,
                                          size_t vl);
vfloat64m4_t __riscv_vfrec7_v_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs2, unsigned int frm,
                                          size_t vl);
vfloat64m8_t __riscv_vfrec7_v_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs2, unsigned int frm,
                                          size_t vl);

Vector Floating-Point MIN/MAX Intrinsics

// unmasked functions: vfmin, `_tu` policy (tail undisturbed).
// `_vv` forms take a second vector operand `vs1`; `_vf` forms take a scalar
// `rs1` of the matching element type (_Float16 / float / double).
// Operands: destination operand `vd`, source vector `vs2`, `vs1`/`rs1`,
// vector length `vl`.
vfloat16mf4_t __riscv_vfmin_vv_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                         vfloat16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vfmin_vf_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                         _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfmin_vv_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                         vfloat16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vfmin_vf_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                         _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfmin_vv_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                       vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfmin_vf_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                       _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfmin_vv_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                       vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfmin_vf_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                       _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfmin_vv_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                       vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfmin_vf_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                       _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfmin_vv_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                       vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfmin_vf_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                       _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfmin_vv_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                         vfloat32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfmin_vf_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                         float rs1, size_t vl);
vfloat32m1_t __riscv_vfmin_vv_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                       vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfmin_vf_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                       float rs1, size_t vl);
vfloat32m2_t __riscv_vfmin_vv_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                       vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfmin_vf_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                       float rs1, size_t vl);
vfloat32m4_t __riscv_vfmin_vv_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                       vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfmin_vf_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                       float rs1, size_t vl);
vfloat32m8_t __riscv_vfmin_vv_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                       vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfmin_vf_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                       float rs1, size_t vl);
vfloat64m1_t __riscv_vfmin_vv_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                       vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfmin_vf_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                       double rs1, size_t vl);
vfloat64m2_t __riscv_vfmin_vv_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                       vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfmin_vf_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                       double rs1, size_t vl);
vfloat64m4_t __riscv_vfmin_vv_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                       vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfmin_vf_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                       double rs1, size_t vl);
vfloat64m8_t __riscv_vfmin_vv_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                       vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfmin_vf_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                       double rs1, size_t vl);
// unmasked functions: vfmax, `_tu` policy (tail undisturbed).
// `_vv` forms take a second vector operand `vs1`; `_vf` forms take a scalar
// `rs1` of the matching element type (_Float16 / float / double).
// Operands: destination operand `vd`, source vector `vs2`, `vs1`/`rs1`,
// vector length `vl`.
vfloat16mf4_t __riscv_vfmax_vv_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                         vfloat16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vfmax_vf_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                         _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfmax_vv_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                         vfloat16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vfmax_vf_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                         _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfmax_vv_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                       vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfmax_vf_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                       _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfmax_vv_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                       vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfmax_vf_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                       _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfmax_vv_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                       vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfmax_vf_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                       _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfmax_vv_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                       vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfmax_vf_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                       _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfmax_vv_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                         vfloat32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfmax_vf_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                         float rs1, size_t vl);
vfloat32m1_t __riscv_vfmax_vv_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                       vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfmax_vf_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                       float rs1, size_t vl);
vfloat32m2_t __riscv_vfmax_vv_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                       vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfmax_vf_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                       float rs1, size_t vl);
vfloat32m4_t __riscv_vfmax_vv_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                       vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfmax_vf_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                       float rs1, size_t vl);
vfloat32m8_t __riscv_vfmax_vv_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                       vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfmax_vf_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                       float rs1, size_t vl);
vfloat64m1_t __riscv_vfmax_vv_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                       vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfmax_vf_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                       double rs1, size_t vl);
vfloat64m2_t __riscv_vfmax_vv_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                       vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfmax_vf_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                       double rs1, size_t vl);
vfloat64m4_t __riscv_vfmax_vv_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                       vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfmax_vf_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                       double rs1, size_t vl);
vfloat64m8_t __riscv_vfmax_vv_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                       vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfmax_vf_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                       double rs1, size_t vl);
// masked functions: vfmin, `_tum` policy (tail undisturbed, mask agnostic).
// `_vv` forms take a second vector operand `vs1`; `_vf` forms take a scalar
// `rs1` of the matching element type (_Float16 / float / double).
// Operands: mask `vm`, destination operand `vd`, source vector `vs2`,
// `vs1`/`rs1`, vector length `vl`.
// The mask type vboolN_t follows the element-width/LMUL ratio of the data type
// (e.g. f16mf4 -> vbool64_t, f64m8 -> vbool8_t).
vfloat16mf4_t __riscv_vfmin_vv_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                          vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                          size_t vl);
vfloat16mf4_t __riscv_vfmin_vf_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                          vfloat16mf4_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16mf2_t __riscv_vfmin_vv_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                          vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                          size_t vl);
vfloat16mf2_t __riscv_vfmin_vf_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                          vfloat16mf2_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16m1_t __riscv_vfmin_vv_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                        vfloat16m1_t vs2, vfloat16m1_t vs1,
                                        size_t vl);
vfloat16m1_t __riscv_vfmin_vf_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                        vfloat16m1_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat16m2_t __riscv_vfmin_vv_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                        vfloat16m2_t vs2, vfloat16m2_t vs1,
                                        size_t vl);
vfloat16m2_t __riscv_vfmin_vf_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                        vfloat16m2_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat16m4_t __riscv_vfmin_vv_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                        vfloat16m4_t vs2, vfloat16m4_t vs1,
                                        size_t vl);
vfloat16m4_t __riscv_vfmin_vf_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                        vfloat16m4_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat16m8_t __riscv_vfmin_vv_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                        vfloat16m8_t vs2, vfloat16m8_t vs1,
                                        size_t vl);
vfloat16m8_t __riscv_vfmin_vf_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                        vfloat16m8_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat32mf2_t __riscv_vfmin_vv_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                          size_t vl);
vfloat32mf2_t __riscv_vfmin_vf_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat32mf2_t vs2, float rs1,
                                          size_t vl);
vfloat32m1_t __riscv_vfmin_vv_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat32m1_t vs2, vfloat32m1_t vs1,
                                        size_t vl);
vfloat32m1_t __riscv_vfmin_vf_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat32m1_t vs2, float rs1, size_t vl);
vfloat32m2_t __riscv_vfmin_vv_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat32m2_t vs2, vfloat32m2_t vs1,
                                        size_t vl);
vfloat32m2_t __riscv_vfmin_vf_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat32m2_t vs2, float rs1, size_t vl);
vfloat32m4_t __riscv_vfmin_vv_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat32m4_t vs2, vfloat32m4_t vs1,
                                        size_t vl);
vfloat32m4_t __riscv_vfmin_vf_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat32m4_t vs2, float rs1, size_t vl);
vfloat32m8_t __riscv_vfmin_vv_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat32m8_t vs2, vfloat32m8_t vs1,
                                        size_t vl);
vfloat32m8_t __riscv_vfmin_vf_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat32m8_t vs2, float rs1, size_t vl);
vfloat64m1_t __riscv_vfmin_vv_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat64m1_t vs2, vfloat64m1_t vs1,
                                        size_t vl);
vfloat64m1_t __riscv_vfmin_vf_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat64m1_t vs2, double rs1,
                                        size_t vl);
vfloat64m2_t __riscv_vfmin_vv_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat64m2_t vs2, vfloat64m2_t vs1,
                                        size_t vl);
vfloat64m2_t __riscv_vfmin_vf_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat64m2_t vs2, double rs1,
                                        size_t vl);
vfloat64m4_t __riscv_vfmin_vv_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat64m4_t vs2, vfloat64m4_t vs1,
                                        size_t vl);
vfloat64m4_t __riscv_vfmin_vf_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat64m4_t vs2, double rs1,
                                        size_t vl);
vfloat64m8_t __riscv_vfmin_vv_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat64m8_t vs2, vfloat64m8_t vs1,
                                        size_t vl);
vfloat64m8_t __riscv_vfmin_vf_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat64m8_t vs2, double rs1,
                                        size_t vl);
// masked functions: vfmax, `_tum` policy (tail undisturbed, mask agnostic).
// `_vv` forms take a second vector operand `vs1`; `_vf` forms take a scalar
// `rs1` of the matching element type (_Float16 / float / double).
// Operands: mask `vm`, destination operand `vd`, source vector `vs2`,
// `vs1`/`rs1`, vector length `vl`.
// The mask type vboolN_t follows the element-width/LMUL ratio of the data type
// (e.g. f16mf4 -> vbool64_t, f64m8 -> vbool8_t).
vfloat16mf4_t __riscv_vfmax_vv_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                          vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                          size_t vl);
vfloat16mf4_t __riscv_vfmax_vf_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                          vfloat16mf4_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16mf2_t __riscv_vfmax_vv_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                          vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                          size_t vl);
vfloat16mf2_t __riscv_vfmax_vf_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                          vfloat16mf2_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16m1_t __riscv_vfmax_vv_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                        vfloat16m1_t vs2, vfloat16m1_t vs1,
                                        size_t vl);
vfloat16m1_t __riscv_vfmax_vf_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                        vfloat16m1_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat16m2_t __riscv_vfmax_vv_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                        vfloat16m2_t vs2, vfloat16m2_t vs1,
                                        size_t vl);
vfloat16m2_t __riscv_vfmax_vf_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                        vfloat16m2_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat16m4_t __riscv_vfmax_vv_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                        vfloat16m4_t vs2, vfloat16m4_t vs1,
                                        size_t vl);
vfloat16m4_t __riscv_vfmax_vf_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                        vfloat16m4_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat16m8_t __riscv_vfmax_vv_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                        vfloat16m8_t vs2, vfloat16m8_t vs1,
                                        size_t vl);
vfloat16m8_t __riscv_vfmax_vf_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                        vfloat16m8_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat32mf2_t __riscv_vfmax_vv_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                          size_t vl);
vfloat32mf2_t __riscv_vfmax_vf_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat32mf2_t vs2, float rs1,
                                          size_t vl);
vfloat32m1_t __riscv_vfmax_vv_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat32m1_t vs2, vfloat32m1_t vs1,
                                        size_t vl);
vfloat32m1_t __riscv_vfmax_vf_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat32m1_t vs2, float rs1, size_t vl);
vfloat32m2_t __riscv_vfmax_vv_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat32m2_t vs2, vfloat32m2_t vs1,
                                        size_t vl);
vfloat32m2_t __riscv_vfmax_vf_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat32m2_t vs2, float rs1, size_t vl);
vfloat32m4_t __riscv_vfmax_vv_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat32m4_t vs2, vfloat32m4_t vs1,
                                        size_t vl);
vfloat32m4_t __riscv_vfmax_vf_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat32m4_t vs2, float rs1, size_t vl);
vfloat32m8_t __riscv_vfmax_vv_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat32m8_t vs2, vfloat32m8_t vs1,
                                        size_t vl);
vfloat32m8_t __riscv_vfmax_vf_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat32m8_t vs2, float rs1, size_t vl);
vfloat64m1_t __riscv_vfmax_vv_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat64m1_t vs2, vfloat64m1_t vs1,
                                        size_t vl);
vfloat64m1_t __riscv_vfmax_vf_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat64m1_t vs2, double rs1,
                                        size_t vl);
vfloat64m2_t __riscv_vfmax_vv_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat64m2_t vs2, vfloat64m2_t vs1,
                                        size_t vl);
vfloat64m2_t __riscv_vfmax_vf_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat64m2_t vs2, double rs1,
                                        size_t vl);
vfloat64m4_t __riscv_vfmax_vv_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat64m4_t vs2, vfloat64m4_t vs1,
                                        size_t vl);
vfloat64m4_t __riscv_vfmax_vf_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat64m4_t vs2, double rs1,
                                        size_t vl);
vfloat64m8_t __riscv_vfmax_vv_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat64m8_t vs2, vfloat64m8_t vs1,
                                        size_t vl);
vfloat64m8_t __riscv_vfmax_vf_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat64m8_t vs2, double rs1,
                                        size_t vl);
// masked functions: __riscv_vfmin, `_tumu` variants
// One `_vv` (vector vs1) and one `_vf` (scalar rs1) declaration per element
// type and LMUL: f16 mf4..m8, f32 mf2..m8, f64 m1..m8. The scalar type is
// _Float16, float or double to match the element width.
// The mask type is vbool<N>_t with N = element width / LMUL
// (e.g. f16mf4 -> vbool64_t, f16m8 -> vbool2_t, f64m1 -> vbool64_t).
// NOTE(review): under the RVV policy naming scheme `_tumu` is expected to mean
// tail-undisturbed / mask-undisturbed, with `vd` supplying the preserved
// elements -- confirm against the intrinsics specification.
vfloat16mf4_t __riscv_vfmin_vv_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                           vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                           size_t vl);
vfloat16mf4_t __riscv_vfmin_vf_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                           vfloat16mf4_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat16mf2_t __riscv_vfmin_vv_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                           vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                           size_t vl);
vfloat16mf2_t __riscv_vfmin_vf_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                           vfloat16mf2_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat16m1_t __riscv_vfmin_vv_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                         vfloat16m1_t vs2, vfloat16m1_t vs1,
                                         size_t vl);
vfloat16m1_t __riscv_vfmin_vf_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                         vfloat16m1_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m2_t __riscv_vfmin_vv_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                         vfloat16m2_t vs2, vfloat16m2_t vs1,
                                         size_t vl);
vfloat16m2_t __riscv_vfmin_vf_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                         vfloat16m2_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m4_t __riscv_vfmin_vv_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                         vfloat16m4_t vs2, vfloat16m4_t vs1,
                                         size_t vl);
vfloat16m4_t __riscv_vfmin_vf_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                         vfloat16m4_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m8_t __riscv_vfmin_vv_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                         vfloat16m8_t vs2, vfloat16m8_t vs1,
                                         size_t vl);
vfloat16m8_t __riscv_vfmin_vf_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                         vfloat16m8_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat32mf2_t __riscv_vfmin_vv_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                           size_t vl);
vfloat32mf2_t __riscv_vfmin_vf_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs2, float rs1,
                                           size_t vl);
vfloat32m1_t __riscv_vfmin_vv_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs2, vfloat32m1_t vs1,
                                         size_t vl);
vfloat32m1_t __riscv_vfmin_vf_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs2, float rs1,
                                         size_t vl);
vfloat32m2_t __riscv_vfmin_vv_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs2, vfloat32m2_t vs1,
                                         size_t vl);
vfloat32m2_t __riscv_vfmin_vf_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs2, float rs1,
                                         size_t vl);
vfloat32m4_t __riscv_vfmin_vv_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs2, vfloat32m4_t vs1,
                                         size_t vl);
vfloat32m4_t __riscv_vfmin_vf_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs2, float rs1,
                                         size_t vl);
vfloat32m8_t __riscv_vfmin_vv_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs2, vfloat32m8_t vs1,
                                         size_t vl);
vfloat32m8_t __riscv_vfmin_vf_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs2, float rs1,
                                         size_t vl);
vfloat64m1_t __riscv_vfmin_vv_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs2, vfloat64m1_t vs1,
                                         size_t vl);
vfloat64m1_t __riscv_vfmin_vf_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs2, double rs1,
                                         size_t vl);
vfloat64m2_t __riscv_vfmin_vv_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs2, vfloat64m2_t vs1,
                                         size_t vl);
vfloat64m2_t __riscv_vfmin_vf_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs2, double rs1,
                                         size_t vl);
vfloat64m4_t __riscv_vfmin_vv_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs2, vfloat64m4_t vs1,
                                         size_t vl);
vfloat64m4_t __riscv_vfmin_vf_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs2, double rs1,
                                         size_t vl);
vfloat64m8_t __riscv_vfmin_vv_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs2, vfloat64m8_t vs1,
                                         size_t vl);
vfloat64m8_t __riscv_vfmin_vf_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs2, double rs1,
                                         size_t vl);
// __riscv_vfmax, `_tumu` variants
// One `_vv` (vector vs1) and one `_vf` (scalar rs1) declaration per element
// type and LMUL: f16 mf4..m8, f32 mf2..m8, f64 m1..m8. Every declaration takes
// a mask `vm`, then `vd`, `vs2`, the second operand, and the length `vl`.
// NOTE(review): under the RVV policy naming scheme `_tumu` is expected to mean
// tail-undisturbed / mask-undisturbed -- confirm against the intrinsics
// specification.
vfloat16mf4_t __riscv_vfmax_vv_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                           vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                           size_t vl);
vfloat16mf4_t __riscv_vfmax_vf_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                           vfloat16mf4_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat16mf2_t __riscv_vfmax_vv_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                           vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                           size_t vl);
vfloat16mf2_t __riscv_vfmax_vf_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                           vfloat16mf2_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat16m1_t __riscv_vfmax_vv_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                         vfloat16m1_t vs2, vfloat16m1_t vs1,
                                         size_t vl);
vfloat16m1_t __riscv_vfmax_vf_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                         vfloat16m1_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m2_t __riscv_vfmax_vv_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                         vfloat16m2_t vs2, vfloat16m2_t vs1,
                                         size_t vl);
vfloat16m2_t __riscv_vfmax_vf_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                         vfloat16m2_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m4_t __riscv_vfmax_vv_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                         vfloat16m4_t vs2, vfloat16m4_t vs1,
                                         size_t vl);
vfloat16m4_t __riscv_vfmax_vf_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                         vfloat16m4_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m8_t __riscv_vfmax_vv_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                         vfloat16m8_t vs2, vfloat16m8_t vs1,
                                         size_t vl);
vfloat16m8_t __riscv_vfmax_vf_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                         vfloat16m8_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat32mf2_t __riscv_vfmax_vv_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                           size_t vl);
vfloat32mf2_t __riscv_vfmax_vf_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs2, float rs1,
                                           size_t vl);
vfloat32m1_t __riscv_vfmax_vv_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs2, vfloat32m1_t vs1,
                                         size_t vl);
vfloat32m1_t __riscv_vfmax_vf_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs2, float rs1,
                                         size_t vl);
vfloat32m2_t __riscv_vfmax_vv_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs2, vfloat32m2_t vs1,
                                         size_t vl);
vfloat32m2_t __riscv_vfmax_vf_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs2, float rs1,
                                         size_t vl);
vfloat32m4_t __riscv_vfmax_vv_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs2, vfloat32m4_t vs1,
                                         size_t vl);
vfloat32m4_t __riscv_vfmax_vf_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs2, float rs1,
                                         size_t vl);
vfloat32m8_t __riscv_vfmax_vv_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs2, vfloat32m8_t vs1,
                                         size_t vl);
vfloat32m8_t __riscv_vfmax_vf_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs2, float rs1,
                                         size_t vl);
vfloat64m1_t __riscv_vfmax_vv_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs2, vfloat64m1_t vs1,
                                         size_t vl);
vfloat64m1_t __riscv_vfmax_vf_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs2, double rs1,
                                         size_t vl);
vfloat64m2_t __riscv_vfmax_vv_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs2, vfloat64m2_t vs1,
                                         size_t vl);
vfloat64m2_t __riscv_vfmax_vf_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs2, double rs1,
                                         size_t vl);
vfloat64m4_t __riscv_vfmax_vv_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs2, vfloat64m4_t vs1,
                                         size_t vl);
vfloat64m4_t __riscv_vfmax_vf_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs2, double rs1,
                                         size_t vl);
vfloat64m8_t __riscv_vfmax_vv_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs2, vfloat64m8_t vs1,
                                         size_t vl);
vfloat64m8_t __riscv_vfmax_vf_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs2, double rs1,
                                         size_t vl);
// masked functions: __riscv_vfmin, `_mu` variants
// One `_vv` (vector vs1) and one `_vf` (scalar rs1) declaration per element
// type and LMUL: f16 mf4..m8, f32 mf2..m8, f64 m1..m8. The scalar type is
// _Float16, float or double to match the element width.
// The mask type is vbool<N>_t with N = element width / LMUL
// (e.g. f16mf4 -> vbool64_t, f32m1 -> vbool32_t, f64m8 -> vbool8_t).
// NOTE(review): under the RVV policy naming scheme `_mu` is expected to mean
// tail-agnostic / mask-undisturbed, with `vd` supplying the preserved
// masked-off elements -- confirm against the intrinsics specification.
vfloat16mf4_t __riscv_vfmin_vv_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                         vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                         size_t vl);
vfloat16mf4_t __riscv_vfmin_vf_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                         vfloat16mf4_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16mf2_t __riscv_vfmin_vv_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                         vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                         size_t vl);
vfloat16mf2_t __riscv_vfmin_vf_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                         vfloat16mf2_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m1_t __riscv_vfmin_vv_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                       vfloat16m1_t vs2, vfloat16m1_t vs1,
                                       size_t vl);
vfloat16m1_t __riscv_vfmin_vf_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                       vfloat16m1_t vs2, _Float16 rs1,
                                       size_t vl);
vfloat16m2_t __riscv_vfmin_vv_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                       vfloat16m2_t vs2, vfloat16m2_t vs1,
                                       size_t vl);
vfloat16m2_t __riscv_vfmin_vf_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                       vfloat16m2_t vs2, _Float16 rs1,
                                       size_t vl);
vfloat16m4_t __riscv_vfmin_vv_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                       vfloat16m4_t vs2, vfloat16m4_t vs1,
                                       size_t vl);
vfloat16m4_t __riscv_vfmin_vf_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                       vfloat16m4_t vs2, _Float16 rs1,
                                       size_t vl);
vfloat16m8_t __riscv_vfmin_vv_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                       vfloat16m8_t vs2, vfloat16m8_t vs1,
                                       size_t vl);
vfloat16m8_t __riscv_vfmin_vf_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                       vfloat16m8_t vs2, _Float16 rs1,
                                       size_t vl);
vfloat32mf2_t __riscv_vfmin_vv_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                         vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                         size_t vl);
vfloat32mf2_t __riscv_vfmin_vf_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                         vfloat32mf2_t vs2, float rs1,
                                         size_t vl);
vfloat32m1_t __riscv_vfmin_vv_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                       vfloat32m1_t vs2, vfloat32m1_t vs1,
                                       size_t vl);
vfloat32m1_t __riscv_vfmin_vf_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                       vfloat32m1_t vs2, float rs1, size_t vl);
vfloat32m2_t __riscv_vfmin_vv_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                       vfloat32m2_t vs2, vfloat32m2_t vs1,
                                       size_t vl);
vfloat32m2_t __riscv_vfmin_vf_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                       vfloat32m2_t vs2, float rs1, size_t vl);
vfloat32m4_t __riscv_vfmin_vv_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                       vfloat32m4_t vs2, vfloat32m4_t vs1,
                                       size_t vl);
vfloat32m4_t __riscv_vfmin_vf_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                       vfloat32m4_t vs2, float rs1, size_t vl);
vfloat32m8_t __riscv_vfmin_vv_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                       vfloat32m8_t vs2, vfloat32m8_t vs1,
                                       size_t vl);
vfloat32m8_t __riscv_vfmin_vf_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                       vfloat32m8_t vs2, float rs1, size_t vl);
vfloat64m1_t __riscv_vfmin_vv_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                       vfloat64m1_t vs2, vfloat64m1_t vs1,
                                       size_t vl);
vfloat64m1_t __riscv_vfmin_vf_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                       vfloat64m1_t vs2, double rs1, size_t vl);
vfloat64m2_t __riscv_vfmin_vv_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                       vfloat64m2_t vs2, vfloat64m2_t vs1,
                                       size_t vl);
vfloat64m2_t __riscv_vfmin_vf_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                       vfloat64m2_t vs2, double rs1, size_t vl);
vfloat64m4_t __riscv_vfmin_vv_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                       vfloat64m4_t vs2, vfloat64m4_t vs1,
                                       size_t vl);
vfloat64m4_t __riscv_vfmin_vf_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                       vfloat64m4_t vs2, double rs1, size_t vl);
vfloat64m8_t __riscv_vfmin_vv_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                       vfloat64m8_t vs2, vfloat64m8_t vs1,
                                       size_t vl);
vfloat64m8_t __riscv_vfmin_vf_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                       vfloat64m8_t vs2, double rs1, size_t vl);
// __riscv_vfmax, `_mu` variants
// One `_vv` (vector vs1) and one `_vf` (scalar rs1) declaration per element
// type and LMUL: f16 mf4..m8, f32 mf2..m8, f64 m1..m8. Every declaration takes
// a mask `vm`, then `vd`, `vs2`, the second operand, and the length `vl`.
// NOTE(review): under the RVV policy naming scheme `_mu` is expected to mean
// tail-agnostic / mask-undisturbed -- confirm against the intrinsics
// specification.
vfloat16mf4_t __riscv_vfmax_vv_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                         vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                         size_t vl);
vfloat16mf4_t __riscv_vfmax_vf_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                         vfloat16mf4_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16mf2_t __riscv_vfmax_vv_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                         vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                         size_t vl);
vfloat16mf2_t __riscv_vfmax_vf_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                         vfloat16mf2_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m1_t __riscv_vfmax_vv_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                       vfloat16m1_t vs2, vfloat16m1_t vs1,
                                       size_t vl);
vfloat16m1_t __riscv_vfmax_vf_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                       vfloat16m1_t vs2, _Float16 rs1,
                                       size_t vl);
vfloat16m2_t __riscv_vfmax_vv_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                       vfloat16m2_t vs2, vfloat16m2_t vs1,
                                       size_t vl);
vfloat16m2_t __riscv_vfmax_vf_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                       vfloat16m2_t vs2, _Float16 rs1,
                                       size_t vl);
vfloat16m4_t __riscv_vfmax_vv_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                       vfloat16m4_t vs2, vfloat16m4_t vs1,
                                       size_t vl);
vfloat16m4_t __riscv_vfmax_vf_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                       vfloat16m4_t vs2, _Float16 rs1,
                                       size_t vl);
vfloat16m8_t __riscv_vfmax_vv_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                       vfloat16m8_t vs2, vfloat16m8_t vs1,
                                       size_t vl);
vfloat16m8_t __riscv_vfmax_vf_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                       vfloat16m8_t vs2, _Float16 rs1,
                                       size_t vl);
vfloat32mf2_t __riscv_vfmax_vv_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                         vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                         size_t vl);
vfloat32mf2_t __riscv_vfmax_vf_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                         vfloat32mf2_t vs2, float rs1,
                                         size_t vl);
vfloat32m1_t __riscv_vfmax_vv_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                       vfloat32m1_t vs2, vfloat32m1_t vs1,
                                       size_t vl);
vfloat32m1_t __riscv_vfmax_vf_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                       vfloat32m1_t vs2, float rs1, size_t vl);
vfloat32m2_t __riscv_vfmax_vv_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                       vfloat32m2_t vs2, vfloat32m2_t vs1,
                                       size_t vl);
vfloat32m2_t __riscv_vfmax_vf_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                       vfloat32m2_t vs2, float rs1, size_t vl);
vfloat32m4_t __riscv_vfmax_vv_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                       vfloat32m4_t vs2, vfloat32m4_t vs1,
                                       size_t vl);
vfloat32m4_t __riscv_vfmax_vf_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                       vfloat32m4_t vs2, float rs1, size_t vl);
vfloat32m8_t __riscv_vfmax_vv_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                       vfloat32m8_t vs2, vfloat32m8_t vs1,
                                       size_t vl);
vfloat32m8_t __riscv_vfmax_vf_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                       vfloat32m8_t vs2, float rs1, size_t vl);
vfloat64m1_t __riscv_vfmax_vv_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                       vfloat64m1_t vs2, vfloat64m1_t vs1,
                                       size_t vl);
vfloat64m1_t __riscv_vfmax_vf_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                       vfloat64m1_t vs2, double rs1, size_t vl);
vfloat64m2_t __riscv_vfmax_vv_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                       vfloat64m2_t vs2, vfloat64m2_t vs1,
                                       size_t vl);
vfloat64m2_t __riscv_vfmax_vf_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                       vfloat64m2_t vs2, double rs1, size_t vl);
vfloat64m4_t __riscv_vfmax_vv_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                       vfloat64m4_t vs2, vfloat64m4_t vs1,
                                       size_t vl);
vfloat64m4_t __riscv_vfmax_vf_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                       vfloat64m4_t vs2, double rs1, size_t vl);
vfloat64m8_t __riscv_vfmax_vv_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                       vfloat64m8_t vs2, vfloat64m8_t vs1,
                                       size_t vl);
vfloat64m8_t __riscv_vfmax_vf_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                       vfloat64m8_t vs2, double rs1, size_t vl);

Vector Floating-Point Sign-Injection Intrinsics

// __riscv_vfsgnj, `_tu` variants (no mask argument)
// One `_vv` (vector vs1) and one `_vf` (scalar rs1) declaration per element
// type and LMUL: f16 mf4..m8, f32 mf2..m8, f64 m1..m8. Arguments are `vd`,
// `vs2`, the second operand, and the length `vl`.
// NOTE(review): presumably the result takes its magnitude from vs2 and its
// sign from vs1/rs1, and `_tu` means tail-undisturbed with `vd` supplying the
// tail elements -- confirm against the RVV specification.
vfloat16mf4_t __riscv_vfsgnj_vv_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                          vfloat16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vfsgnj_vf_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                          _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfsgnj_vv_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                          vfloat16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vfsgnj_vf_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                          _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfsgnj_vv_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                        vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfsgnj_vf_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                        _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfsgnj_vv_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                        vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfsgnj_vf_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                        _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfsgnj_vv_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                        vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfsgnj_vf_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                        _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfsgnj_vv_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                        vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfsgnj_vf_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                        _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfsgnj_vv_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                          vfloat32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfsgnj_vf_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                          float rs1, size_t vl);
vfloat32m1_t __riscv_vfsgnj_vv_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                        vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfsgnj_vf_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                        float rs1, size_t vl);
vfloat32m2_t __riscv_vfsgnj_vv_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                        vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfsgnj_vf_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                        float rs1, size_t vl);
vfloat32m4_t __riscv_vfsgnj_vv_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                        vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfsgnj_vf_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                        float rs1, size_t vl);
vfloat32m8_t __riscv_vfsgnj_vv_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                        vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfsgnj_vf_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                        float rs1, size_t vl);
vfloat64m1_t __riscv_vfsgnj_vv_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                        vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfsgnj_vf_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                        double rs1, size_t vl);
vfloat64m2_t __riscv_vfsgnj_vv_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                        vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfsgnj_vf_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                        double rs1, size_t vl);
vfloat64m4_t __riscv_vfsgnj_vv_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                        vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfsgnj_vf_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                        double rs1, size_t vl);
vfloat64m8_t __riscv_vfsgnj_vv_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                        vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfsgnj_vf_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                        double rs1, size_t vl);
// __riscv_vfsgnjn, `_tu` variants (no mask argument)
// One `_vv` (vector vs1) and one `_vf` (scalar rs1) declaration per element
// type and LMUL: f16 mf4..m8, f32 mf2..m8, f64 m1..m8. Arguments are `vd`,
// `vs2`, the second operand, and the length `vl`.
// NOTE(review): presumably the result takes its magnitude from vs2 and the
// negated sign of vs1/rs1 -- confirm against the RVV specification.
vfloat16mf4_t __riscv_vfsgnjn_vv_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                           vfloat16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vfsgnjn_vf_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                           _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfsgnjn_vv_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                           vfloat16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vfsgnjn_vf_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                           _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfsgnjn_vv_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                         vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfsgnjn_vf_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                         _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfsgnjn_vv_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                         vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfsgnjn_vf_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                         _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfsgnjn_vv_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                         vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfsgnjn_vf_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                         _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfsgnjn_vv_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                         vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfsgnjn_vf_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                         _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfsgnjn_vv_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                           vfloat32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfsgnjn_vf_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                           float rs1, size_t vl);
vfloat32m1_t __riscv_vfsgnjn_vv_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                         vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfsgnjn_vf_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                         float rs1, size_t vl);
vfloat32m2_t __riscv_vfsgnjn_vv_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                         vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfsgnjn_vf_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                         float rs1, size_t vl);
vfloat32m4_t __riscv_vfsgnjn_vv_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                         vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfsgnjn_vf_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                         float rs1, size_t vl);
vfloat32m8_t __riscv_vfsgnjn_vv_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                         vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfsgnjn_vf_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                         float rs1, size_t vl);
vfloat64m1_t __riscv_vfsgnjn_vv_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                         vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfsgnjn_vf_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                         double rs1, size_t vl);
vfloat64m2_t __riscv_vfsgnjn_vv_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                         vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfsgnjn_vf_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                         double rs1, size_t vl);
vfloat64m4_t __riscv_vfsgnjn_vv_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                         vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfsgnjn_vf_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                         double rs1, size_t vl);
vfloat64m8_t __riscv_vfsgnjn_vv_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                         vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfsgnjn_vf_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                         double rs1, size_t vl);
// __riscv_vfsgnjx, `_tu` variants (no mask argument)
// `_vv` forms take a vector second operand (vs1); `_vf` forms take a scalar
// rs1 whose C type matches the element width (_Float16 for f16, float for
// f32). Arguments are `vd`, `vs2`, the second operand, and the length `vl`.
// NOTE(review): presumably the result takes its magnitude from vs2 and a sign
// that is the XOR of the vs2 and vs1/rs1 signs -- confirm against the RVV
// specification.
vfloat16mf4_t __riscv_vfsgnjx_vv_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                           vfloat16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vfsgnjx_vf_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                           _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfsgnjx_vv_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                           vfloat16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vfsgnjx_vf_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                           _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfsgnjx_vv_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                         vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfsgnjx_vf_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                         _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfsgnjx_vv_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                         vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfsgnjx_vf_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                         _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfsgnjx_vv_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                         vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfsgnjx_vf_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                         _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfsgnjx_vv_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                         vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfsgnjx_vf_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                         _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfsgnjx_vv_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                           vfloat32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfsgnjx_vf_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                           float rs1, size_t vl);
vfloat32m1_t __riscv_vfsgnjx_vv_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                         vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfsgnjx_vf_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                         float rs1, size_t vl);
vfloat32m2_t __riscv_vfsgnjx_vv_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                         vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfsgnjx_vf_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                         float rs1, size_t vl);
vfloat32m4_t __riscv_vfsgnjx_vv_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                         vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfsgnjx_vf_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                         float rs1, size_t vl);
vfloat32m8_t __riscv_vfsgnjx_vv_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                         vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfsgnjx_vf_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                         float rs1, size_t vl);
vfloat64m1_t __riscv_vfsgnjx_vv_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                         vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfsgnjx_vf_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                         double rs1, size_t vl);
vfloat64m2_t __riscv_vfsgnjx_vv_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                         vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfsgnjx_vf_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                         double rs1, size_t vl);
vfloat64m4_t __riscv_vfsgnjx_vv_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                         vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfsgnjx_vf_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                         double rs1, size_t vl);
vfloat64m8_t __riscv_vfsgnjx_vv_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                         vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfsgnjx_vf_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                         double rs1, size_t vl);
// masked functions (_tum: tail-undisturbed, mask-agnostic)
// __riscv_vfsgnj, masked `_tum` variants for every listed element type/LMUL
// (f16mf4 .. f16m8, f32mf2 .. f32m8, f64m1 .. f64m8).
// Parameter order is (vm, vd, vs2, vs1 | rs1, vl):
//   vm  - leading mask operand; its vboolN_t type differs per element
//         type/LMUL (e.g. vbool64_t for f16mf4, vbool2_t for f16m8)
//   vd, vs2 - vectors of the result type
//   _vv forms take a vector vs1; _vf forms take a scalar rs1
//         (_Float16 for f16, float for f32, double for f64)
//   vl  - element count
// NOTE(review): per the RISC-V "V" spec, vfsgnj presumably produces vs2 with
// its sign bit replaced by the sign of vs1/rs1; how vd is used for tail and
// masked-off elements is defined by the `_tum` policy - confirm against the
// intrinsics spec.
vfloat16mf4_t __riscv_vfsgnj_vv_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                           vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                           size_t vl);
vfloat16mf4_t __riscv_vfsgnj_vf_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                           vfloat16mf4_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat16mf2_t __riscv_vfsgnj_vv_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                           vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                           size_t vl);
vfloat16mf2_t __riscv_vfsgnj_vf_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                           vfloat16mf2_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat16m1_t __riscv_vfsgnj_vv_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                         vfloat16m1_t vs2, vfloat16m1_t vs1,
                                         size_t vl);
vfloat16m1_t __riscv_vfsgnj_vf_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                         vfloat16m1_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m2_t __riscv_vfsgnj_vv_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                         vfloat16m2_t vs2, vfloat16m2_t vs1,
                                         size_t vl);
vfloat16m2_t __riscv_vfsgnj_vf_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                         vfloat16m2_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m4_t __riscv_vfsgnj_vv_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                         vfloat16m4_t vs2, vfloat16m4_t vs1,
                                         size_t vl);
vfloat16m4_t __riscv_vfsgnj_vf_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                         vfloat16m4_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m8_t __riscv_vfsgnj_vv_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                         vfloat16m8_t vs2, vfloat16m8_t vs1,
                                         size_t vl);
vfloat16m8_t __riscv_vfsgnj_vf_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                         vfloat16m8_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat32mf2_t __riscv_vfsgnj_vv_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                           size_t vl);
vfloat32mf2_t __riscv_vfsgnj_vf_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs2, float rs1,
                                           size_t vl);
vfloat32m1_t __riscv_vfsgnj_vv_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs2, vfloat32m1_t vs1,
                                         size_t vl);
vfloat32m1_t __riscv_vfsgnj_vf_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs2, float rs1,
                                         size_t vl);
vfloat32m2_t __riscv_vfsgnj_vv_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs2, vfloat32m2_t vs1,
                                         size_t vl);
vfloat32m2_t __riscv_vfsgnj_vf_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs2, float rs1,
                                         size_t vl);
vfloat32m4_t __riscv_vfsgnj_vv_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs2, vfloat32m4_t vs1,
                                         size_t vl);
vfloat32m4_t __riscv_vfsgnj_vf_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs2, float rs1,
                                         size_t vl);
vfloat32m8_t __riscv_vfsgnj_vv_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs2, vfloat32m8_t vs1,
                                         size_t vl);
vfloat32m8_t __riscv_vfsgnj_vf_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs2, float rs1,
                                         size_t vl);
vfloat64m1_t __riscv_vfsgnj_vv_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs2, vfloat64m1_t vs1,
                                         size_t vl);
vfloat64m1_t __riscv_vfsgnj_vf_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs2, double rs1,
                                         size_t vl);
vfloat64m2_t __riscv_vfsgnj_vv_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs2, vfloat64m2_t vs1,
                                         size_t vl);
vfloat64m2_t __riscv_vfsgnj_vf_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs2, double rs1,
                                         size_t vl);
vfloat64m4_t __riscv_vfsgnj_vv_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs2, vfloat64m4_t vs1,
                                         size_t vl);
vfloat64m4_t __riscv_vfsgnj_vf_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs2, double rs1,
                                         size_t vl);
vfloat64m8_t __riscv_vfsgnj_vv_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs2, vfloat64m8_t vs1,
                                         size_t vl);
vfloat64m8_t __riscv_vfsgnj_vf_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs2, double rs1,
                                         size_t vl);
// __riscv_vfsgnjn, masked `_tum` variants for every listed element type/LMUL
// (f16mf4 .. f16m8, f32mf2 .. f32m8, f64m1 .. f64m8).
// Parameter order is (vm, vd, vs2, vs1 | rs1, vl):
//   vm  - leading mask operand; its vboolN_t type differs per element
//         type/LMUL (e.g. vbool64_t for f16mf4, vbool2_t for f16m8)
//   vd, vs2 - vectors of the result type
//   _vv forms take a vector vs1; _vf forms take a scalar rs1
//         (_Float16 for f16, float for f32, double for f64)
//   vl  - element count
// NOTE(review): per the RISC-V "V" spec, vfsgnjn presumably produces vs2 with
// its sign bit replaced by the negated sign of vs1/rs1; how vd is used for
// tail and masked-off elements is defined by the `_tum` policy - confirm
// against the intrinsics spec.
vfloat16mf4_t __riscv_vfsgnjn_vv_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                            vfloat16mf4_t vs2,
                                            vfloat16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vfsgnjn_vf_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                            vfloat16mf4_t vs2, _Float16 rs1,
                                            size_t vl);
vfloat16mf2_t __riscv_vfsgnjn_vv_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                            vfloat16mf2_t vs2,
                                            vfloat16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vfsgnjn_vf_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                            vfloat16mf2_t vs2, _Float16 rs1,
                                            size_t vl);
vfloat16m1_t __riscv_vfsgnjn_vv_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                          vfloat16m1_t vs2, vfloat16m1_t vs1,
                                          size_t vl);
vfloat16m1_t __riscv_vfsgnjn_vf_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                          vfloat16m1_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16m2_t __riscv_vfsgnjn_vv_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                          vfloat16m2_t vs2, vfloat16m2_t vs1,
                                          size_t vl);
vfloat16m2_t __riscv_vfsgnjn_vf_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                          vfloat16m2_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16m4_t __riscv_vfsgnjn_vv_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                          vfloat16m4_t vs2, vfloat16m4_t vs1,
                                          size_t vl);
vfloat16m4_t __riscv_vfsgnjn_vf_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                          vfloat16m4_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16m8_t __riscv_vfsgnjn_vv_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                          vfloat16m8_t vs2, vfloat16m8_t vs1,
                                          size_t vl);
vfloat16m8_t __riscv_vfsgnjn_vf_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                          vfloat16m8_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat32mf2_t __riscv_vfsgnjn_vv_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs2,
                                            vfloat32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfsgnjn_vf_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs2, float rs1,
                                            size_t vl);
vfloat32m1_t __riscv_vfsgnjn_vv_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs2, vfloat32m1_t vs1,
                                          size_t vl);
vfloat32m1_t __riscv_vfsgnjn_vf_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs2, float rs1,
                                          size_t vl);
vfloat32m2_t __riscv_vfsgnjn_vv_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs2, vfloat32m2_t vs1,
                                          size_t vl);
vfloat32m2_t __riscv_vfsgnjn_vf_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs2, float rs1,
                                          size_t vl);
vfloat32m4_t __riscv_vfsgnjn_vv_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs2, vfloat32m4_t vs1,
                                          size_t vl);
vfloat32m4_t __riscv_vfsgnjn_vf_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs2, float rs1,
                                          size_t vl);
vfloat32m8_t __riscv_vfsgnjn_vv_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs2, vfloat32m8_t vs1,
                                          size_t vl);
vfloat32m8_t __riscv_vfsgnjn_vf_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs2, float rs1,
                                          size_t vl);
vfloat64m1_t __riscv_vfsgnjn_vv_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs2, vfloat64m1_t vs1,
                                          size_t vl);
vfloat64m1_t __riscv_vfsgnjn_vf_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs2, double rs1,
                                          size_t vl);
vfloat64m2_t __riscv_vfsgnjn_vv_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs2, vfloat64m2_t vs1,
                                          size_t vl);
vfloat64m2_t __riscv_vfsgnjn_vf_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs2, double rs1,
                                          size_t vl);
vfloat64m4_t __riscv_vfsgnjn_vv_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs2, vfloat64m4_t vs1,
                                          size_t vl);
vfloat64m4_t __riscv_vfsgnjn_vf_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs2, double rs1,
                                          size_t vl);
vfloat64m8_t __riscv_vfsgnjn_vv_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs2, vfloat64m8_t vs1,
                                          size_t vl);
vfloat64m8_t __riscv_vfsgnjn_vf_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs2, double rs1,
                                          size_t vl);
// __riscv_vfsgnjx, masked `_tum` variants for every listed element type/LMUL
// (f16mf4 .. f16m8, f32mf2 .. f32m8, f64m1 .. f64m8).
// Parameter order is (vm, vd, vs2, vs1 | rs1, vl):
//   vm  - leading mask operand; its vboolN_t type differs per element
//         type/LMUL (e.g. vbool64_t for f16mf4, vbool2_t for f16m8)
//   vd, vs2 - vectors of the result type
//   _vv forms take a vector vs1; _vf forms take a scalar rs1
//         (_Float16 for f16, float for f32, double for f64)
//   vl  - element count
// NOTE(review): per the RISC-V "V" spec, vfsgnjx presumably produces vs2 with
// its sign bit XORed with the sign of vs1/rs1; how vd is used for tail and
// masked-off elements is defined by the `_tum` policy - confirm against the
// intrinsics spec.
vfloat16mf4_t __riscv_vfsgnjx_vv_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                            vfloat16mf4_t vs2,
                                            vfloat16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vfsgnjx_vf_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                            vfloat16mf4_t vs2, _Float16 rs1,
                                            size_t vl);
vfloat16mf2_t __riscv_vfsgnjx_vv_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                            vfloat16mf2_t vs2,
                                            vfloat16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vfsgnjx_vf_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                            vfloat16mf2_t vs2, _Float16 rs1,
                                            size_t vl);
vfloat16m1_t __riscv_vfsgnjx_vv_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                          vfloat16m1_t vs2, vfloat16m1_t vs1,
                                          size_t vl);
vfloat16m1_t __riscv_vfsgnjx_vf_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                          vfloat16m1_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16m2_t __riscv_vfsgnjx_vv_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                          vfloat16m2_t vs2, vfloat16m2_t vs1,
                                          size_t vl);
vfloat16m2_t __riscv_vfsgnjx_vf_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                          vfloat16m2_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16m4_t __riscv_vfsgnjx_vv_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                          vfloat16m4_t vs2, vfloat16m4_t vs1,
                                          size_t vl);
vfloat16m4_t __riscv_vfsgnjx_vf_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                          vfloat16m4_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16m8_t __riscv_vfsgnjx_vv_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                          vfloat16m8_t vs2, vfloat16m8_t vs1,
                                          size_t vl);
vfloat16m8_t __riscv_vfsgnjx_vf_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                          vfloat16m8_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat32mf2_t __riscv_vfsgnjx_vv_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs2,
                                            vfloat32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfsgnjx_vf_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs2, float rs1,
                                            size_t vl);
vfloat32m1_t __riscv_vfsgnjx_vv_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs2, vfloat32m1_t vs1,
                                          size_t vl);
vfloat32m1_t __riscv_vfsgnjx_vf_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs2, float rs1,
                                          size_t vl);
vfloat32m2_t __riscv_vfsgnjx_vv_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs2, vfloat32m2_t vs1,
                                          size_t vl);
vfloat32m2_t __riscv_vfsgnjx_vf_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs2, float rs1,
                                          size_t vl);
vfloat32m4_t __riscv_vfsgnjx_vv_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs2, vfloat32m4_t vs1,
                                          size_t vl);
vfloat32m4_t __riscv_vfsgnjx_vf_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs2, float rs1,
                                          size_t vl);
vfloat32m8_t __riscv_vfsgnjx_vv_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs2, vfloat32m8_t vs1,
                                          size_t vl);
vfloat32m8_t __riscv_vfsgnjx_vf_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs2, float rs1,
                                          size_t vl);
vfloat64m1_t __riscv_vfsgnjx_vv_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs2, vfloat64m1_t vs1,
                                          size_t vl);
vfloat64m1_t __riscv_vfsgnjx_vf_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs2, double rs1,
                                          size_t vl);
vfloat64m2_t __riscv_vfsgnjx_vv_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs2, vfloat64m2_t vs1,
                                          size_t vl);
vfloat64m2_t __riscv_vfsgnjx_vf_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs2, double rs1,
                                          size_t vl);
vfloat64m4_t __riscv_vfsgnjx_vv_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs2, vfloat64m4_t vs1,
                                          size_t vl);
vfloat64m4_t __riscv_vfsgnjx_vf_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs2, double rs1,
                                          size_t vl);
vfloat64m8_t __riscv_vfsgnjx_vv_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs2, vfloat64m8_t vs1,
                                          size_t vl);
vfloat64m8_t __riscv_vfsgnjx_vf_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs2, double rs1,
                                          size_t vl);
// masked functions (_tumu: tail-undisturbed, mask-undisturbed)
// __riscv_vfsgnj, masked `_tumu` variants for every listed element type/LMUL
// (f16mf4 .. f16m8, f32mf2 .. f32m8, f64m1 .. f64m8).
// Parameter order is (vm, vd, vs2, vs1 | rs1, vl):
//   vm  - leading mask operand; its vboolN_t type differs per element
//         type/LMUL (e.g. vbool64_t for f16mf4, vbool2_t for f16m8)
//   vd, vs2 - vectors of the result type
//   _vv forms take a vector vs1; _vf forms take a scalar rs1
//         (_Float16 for f16, float for f32, double for f64)
//   vl  - element count
// NOTE(review): per the RISC-V "V" spec, vfsgnj presumably produces vs2 with
// its sign bit replaced by the sign of vs1/rs1; how vd is used for tail and
// masked-off elements is defined by the `_tumu` policy - confirm against the
// intrinsics spec.
vfloat16mf4_t __riscv_vfsgnj_vv_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                            vfloat16mf4_t vs2,
                                            vfloat16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vfsgnj_vf_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                            vfloat16mf4_t vs2, _Float16 rs1,
                                            size_t vl);
vfloat16mf2_t __riscv_vfsgnj_vv_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                            vfloat16mf2_t vs2,
                                            vfloat16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vfsgnj_vf_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                            vfloat16mf2_t vs2, _Float16 rs1,
                                            size_t vl);
vfloat16m1_t __riscv_vfsgnj_vv_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                          vfloat16m1_t vs2, vfloat16m1_t vs1,
                                          size_t vl);
vfloat16m1_t __riscv_vfsgnj_vf_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                          vfloat16m1_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16m2_t __riscv_vfsgnj_vv_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                          vfloat16m2_t vs2, vfloat16m2_t vs1,
                                          size_t vl);
vfloat16m2_t __riscv_vfsgnj_vf_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                          vfloat16m2_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16m4_t __riscv_vfsgnj_vv_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                          vfloat16m4_t vs2, vfloat16m4_t vs1,
                                          size_t vl);
vfloat16m4_t __riscv_vfsgnj_vf_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                          vfloat16m4_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16m8_t __riscv_vfsgnj_vv_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                          vfloat16m8_t vs2, vfloat16m8_t vs1,
                                          size_t vl);
vfloat16m8_t __riscv_vfsgnj_vf_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                          vfloat16m8_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat32mf2_t __riscv_vfsgnj_vv_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs2,
                                            vfloat32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfsgnj_vf_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs2, float rs1,
                                            size_t vl);
vfloat32m1_t __riscv_vfsgnj_vv_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs2, vfloat32m1_t vs1,
                                          size_t vl);
vfloat32m1_t __riscv_vfsgnj_vf_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs2, float rs1,
                                          size_t vl);
vfloat32m2_t __riscv_vfsgnj_vv_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs2, vfloat32m2_t vs1,
                                          size_t vl);
vfloat32m2_t __riscv_vfsgnj_vf_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs2, float rs1,
                                          size_t vl);
vfloat32m4_t __riscv_vfsgnj_vv_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs2, vfloat32m4_t vs1,
                                          size_t vl);
vfloat32m4_t __riscv_vfsgnj_vf_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs2, float rs1,
                                          size_t vl);
vfloat32m8_t __riscv_vfsgnj_vv_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs2, vfloat32m8_t vs1,
                                          size_t vl);
vfloat32m8_t __riscv_vfsgnj_vf_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs2, float rs1,
                                          size_t vl);
vfloat64m1_t __riscv_vfsgnj_vv_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs2, vfloat64m1_t vs1,
                                          size_t vl);
vfloat64m1_t __riscv_vfsgnj_vf_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs2, double rs1,
                                          size_t vl);
vfloat64m2_t __riscv_vfsgnj_vv_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs2, vfloat64m2_t vs1,
                                          size_t vl);
vfloat64m2_t __riscv_vfsgnj_vf_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs2, double rs1,
                                          size_t vl);
vfloat64m4_t __riscv_vfsgnj_vv_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs2, vfloat64m4_t vs1,
                                          size_t vl);
vfloat64m4_t __riscv_vfsgnj_vf_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs2, double rs1,
                                          size_t vl);
vfloat64m8_t __riscv_vfsgnj_vv_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs2, vfloat64m8_t vs1,
                                          size_t vl);
vfloat64m8_t __riscv_vfsgnj_vf_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs2, double rs1,
                                          size_t vl);
// __riscv_vfsgnjn, masked `_tumu` variants; this run covers f16mf4 through
// the _vv form for f64m4.
// Parameter order is (vm, vd, vs2, vs1 | rs1, vl):
//   vm  - leading mask operand; its vboolN_t type differs per element
//         type/LMUL (e.g. vbool64_t for f16mf4, vbool2_t for f16m8)
//   vd, vs2 - vectors of the result type
//   _vv forms take a vector vs1; _vf forms take a scalar rs1
//         (_Float16 for f16, float for f32, double for f64)
//   vl  - element count
// NOTE(review): per the RISC-V "V" spec, vfsgnjn presumably produces vs2 with
// its sign bit replaced by the negated sign of vs1/rs1; how vd is used for
// tail and masked-off elements is defined by the `_tumu` policy - confirm
// against the intrinsics spec.
vfloat16mf4_t __riscv_vfsgnjn_vv_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                             vfloat16mf4_t vs2,
                                             vfloat16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vfsgnjn_vf_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                             vfloat16mf4_t vs2, _Float16 rs1,
                                             size_t vl);
vfloat16mf2_t __riscv_vfsgnjn_vv_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                             vfloat16mf2_t vs2,
                                             vfloat16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vfsgnjn_vf_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                             vfloat16mf2_t vs2, _Float16 rs1,
                                             size_t vl);
vfloat16m1_t __riscv_vfsgnjn_vv_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                           vfloat16m1_t vs2, vfloat16m1_t vs1,
                                           size_t vl);
vfloat16m1_t __riscv_vfsgnjn_vf_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                           vfloat16m1_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat16m2_t __riscv_vfsgnjn_vv_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                           vfloat16m2_t vs2, vfloat16m2_t vs1,
                                           size_t vl);
vfloat16m2_t __riscv_vfsgnjn_vf_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                           vfloat16m2_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat16m4_t __riscv_vfsgnjn_vv_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                           vfloat16m4_t vs2, vfloat16m4_t vs1,
                                           size_t vl);
vfloat16m4_t __riscv_vfsgnjn_vf_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                           vfloat16m4_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat16m8_t __riscv_vfsgnjn_vv_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                           vfloat16m8_t vs2, vfloat16m8_t vs1,
                                           size_t vl);
vfloat16m8_t __riscv_vfsgnjn_vf_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                           vfloat16m8_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat32mf2_t __riscv_vfsgnjn_vv_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat32mf2_t vs2,
                                             vfloat32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfsgnjn_vf_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat32mf2_t vs2, float rs1,
                                             size_t vl);
vfloat32m1_t __riscv_vfsgnjn_vv_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat32m1_t vs2, vfloat32m1_t vs1,
                                           size_t vl);
vfloat32m1_t __riscv_vfsgnjn_vf_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat32m1_t vs2, float rs1,
                                           size_t vl);
vfloat32m2_t __riscv_vfsgnjn_vv_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat32m2_t vs2, vfloat32m2_t vs1,
                                           size_t vl);
vfloat32m2_t __riscv_vfsgnjn_vf_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat32m2_t vs2, float rs1,
                                           size_t vl);
vfloat32m4_t __riscv_vfsgnjn_vv_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat32m4_t vs2, vfloat32m4_t vs1,
                                           size_t vl);
vfloat32m4_t __riscv_vfsgnjn_vf_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat32m4_t vs2, float rs1,
                                           size_t vl);
vfloat32m8_t __riscv_vfsgnjn_vv_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat32m8_t vs2, vfloat32m8_t vs1,
                                           size_t vl);
vfloat32m8_t __riscv_vfsgnjn_vf_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat32m8_t vs2, float rs1,
                                           size_t vl);
vfloat64m1_t __riscv_vfsgnjn_vv_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat64m1_t vs2, vfloat64m1_t vs1,
                                           size_t vl);
vfloat64m1_t __riscv_vfsgnjn_vf_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat64m1_t vs2, double rs1,
                                           size_t vl);
vfloat64m2_t __riscv_vfsgnjn_vv_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat64m2_t vs2, vfloat64m2_t vs1,
                                           size_t vl);
vfloat64m2_t __riscv_vfsgnjn_vf_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat64m2_t vs2, double rs1,
                                           size_t vl);
vfloat64m4_t __riscv_vfsgnjn_vv_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat64m4_t vs2, vfloat64m4_t vs1,
                                           size_t vl);
vfloat64m4_t __riscv_vfsgnjn_vf_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat64m4_t vs2, double rs1,
                                           size_t vl);
vfloat64m8_t __riscv_vfsgnjn_vv_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat64m8_t vs2, vfloat64m8_t vs1,
                                           size_t vl);
vfloat64m8_t __riscv_vfsgnjn_vf_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat64m8_t vs2, double rs1,
                                           size_t vl);
// vfsgnjx, `_tumu` variants for f16mf4 through f64m8.
// Every overload takes the mask `vm` first, then `vd`, the vector source
// `vs2`, the second operand as a vector `vs1` (`_vv`) or a scalar `rs1`
// (`_vf`), and finally `vl`. The scalar type follows the element width:
// _Float16, float, or double. The mask type is vboolN_t with N = element
// bits / LMUL as spelled in the type suffix (e.g. f16mf4 -> vbool64_t,
// f64m8 -> vbool8_t).
// NOTE(review): `_tumu` presumably denotes the tail-undisturbed,
// mask-undisturbed policy — confirm against the intrinsics naming scheme.
vfloat16mf4_t __riscv_vfsgnjx_vv_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                             vfloat16mf4_t vs2,
                                             vfloat16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vfsgnjx_vf_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                             vfloat16mf4_t vs2, _Float16 rs1,
                                             size_t vl);
vfloat16mf2_t __riscv_vfsgnjx_vv_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                             vfloat16mf2_t vs2,
                                             vfloat16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vfsgnjx_vf_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                             vfloat16mf2_t vs2, _Float16 rs1,
                                             size_t vl);
vfloat16m1_t __riscv_vfsgnjx_vv_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                           vfloat16m1_t vs2, vfloat16m1_t vs1,
                                           size_t vl);
vfloat16m1_t __riscv_vfsgnjx_vf_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                           vfloat16m1_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat16m2_t __riscv_vfsgnjx_vv_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                           vfloat16m2_t vs2, vfloat16m2_t vs1,
                                           size_t vl);
vfloat16m2_t __riscv_vfsgnjx_vf_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                           vfloat16m2_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat16m4_t __riscv_vfsgnjx_vv_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                           vfloat16m4_t vs2, vfloat16m4_t vs1,
                                           size_t vl);
vfloat16m4_t __riscv_vfsgnjx_vf_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                           vfloat16m4_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat16m8_t __riscv_vfsgnjx_vv_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                           vfloat16m8_t vs2, vfloat16m8_t vs1,
                                           size_t vl);
vfloat16m8_t __riscv_vfsgnjx_vf_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                           vfloat16m8_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat32mf2_t __riscv_vfsgnjx_vv_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat32mf2_t vs2,
                                             vfloat32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfsgnjx_vf_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat32mf2_t vs2, float rs1,
                                             size_t vl);
vfloat32m1_t __riscv_vfsgnjx_vv_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat32m1_t vs2, vfloat32m1_t vs1,
                                           size_t vl);
vfloat32m1_t __riscv_vfsgnjx_vf_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat32m1_t vs2, float rs1,
                                           size_t vl);
vfloat32m2_t __riscv_vfsgnjx_vv_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat32m2_t vs2, vfloat32m2_t vs1,
                                           size_t vl);
vfloat32m2_t __riscv_vfsgnjx_vf_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat32m2_t vs2, float rs1,
                                           size_t vl);
vfloat32m4_t __riscv_vfsgnjx_vv_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat32m4_t vs2, vfloat32m4_t vs1,
                                           size_t vl);
vfloat32m4_t __riscv_vfsgnjx_vf_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat32m4_t vs2, float rs1,
                                           size_t vl);
vfloat32m8_t __riscv_vfsgnjx_vv_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat32m8_t vs2, vfloat32m8_t vs1,
                                           size_t vl);
vfloat32m8_t __riscv_vfsgnjx_vf_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat32m8_t vs2, float rs1,
                                           size_t vl);
vfloat64m1_t __riscv_vfsgnjx_vv_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat64m1_t vs2, vfloat64m1_t vs1,
                                           size_t vl);
vfloat64m1_t __riscv_vfsgnjx_vf_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat64m1_t vs2, double rs1,
                                           size_t vl);
vfloat64m2_t __riscv_vfsgnjx_vv_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat64m2_t vs2, vfloat64m2_t vs1,
                                           size_t vl);
vfloat64m2_t __riscv_vfsgnjx_vf_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat64m2_t vs2, double rs1,
                                           size_t vl);
vfloat64m4_t __riscv_vfsgnjx_vv_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat64m4_t vs2, vfloat64m4_t vs1,
                                           size_t vl);
vfloat64m4_t __riscv_vfsgnjx_vf_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat64m4_t vs2, double rs1,
                                           size_t vl);
vfloat64m8_t __riscv_vfsgnjx_vv_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat64m8_t vs2, vfloat64m8_t vs1,
                                           size_t vl);
vfloat64m8_t __riscv_vfsgnjx_vf_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat64m8_t vs2, double rs1,
                                           size_t vl);
// masked functions, `_mu` policy suffix: vfsgnj for f16mf4 through f64m8.
// Every overload takes the mask `vm` first, then `vd`, the vector source
// `vs2`, the second operand as a vector `vs1` (`_vv`) or a scalar `rs1`
// (`_vf`), and finally `vl`. The mask type is vboolN_t with N = element bits /
// LMUL as spelled in the type suffix (e.g. f16mf4 -> vbool64_t,
// f64m8 -> vbool8_t).
// NOTE(review): `_mu` presumably denotes the tail-agnostic, mask-undisturbed
// policy — confirm against the intrinsics naming scheme.
vfloat16mf4_t __riscv_vfsgnj_vv_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                          vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                          size_t vl);
vfloat16mf4_t __riscv_vfsgnj_vf_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                          vfloat16mf4_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16mf2_t __riscv_vfsgnj_vv_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                          vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                          size_t vl);
vfloat16mf2_t __riscv_vfsgnj_vf_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                          vfloat16mf2_t vs2, _Float16 rs1,
                                          size_t vl);
vfloat16m1_t __riscv_vfsgnj_vv_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                        vfloat16m1_t vs2, vfloat16m1_t vs1,
                                        size_t vl);
vfloat16m1_t __riscv_vfsgnj_vf_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                        vfloat16m1_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat16m2_t __riscv_vfsgnj_vv_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                        vfloat16m2_t vs2, vfloat16m2_t vs1,
                                        size_t vl);
vfloat16m2_t __riscv_vfsgnj_vf_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                        vfloat16m2_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat16m4_t __riscv_vfsgnj_vv_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                        vfloat16m4_t vs2, vfloat16m4_t vs1,
                                        size_t vl);
vfloat16m4_t __riscv_vfsgnj_vf_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                        vfloat16m4_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat16m8_t __riscv_vfsgnj_vv_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                        vfloat16m8_t vs2, vfloat16m8_t vs1,
                                        size_t vl);
vfloat16m8_t __riscv_vfsgnj_vf_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                        vfloat16m8_t vs2, _Float16 rs1,
                                        size_t vl);
vfloat32mf2_t __riscv_vfsgnj_vv_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                          size_t vl);
vfloat32mf2_t __riscv_vfsgnj_vf_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat32mf2_t vs2, float rs1,
                                          size_t vl);
vfloat32m1_t __riscv_vfsgnj_vv_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat32m1_t vs2, vfloat32m1_t vs1,
                                        size_t vl);
vfloat32m1_t __riscv_vfsgnj_vf_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat32m1_t vs2, float rs1, size_t vl);
vfloat32m2_t __riscv_vfsgnj_vv_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat32m2_t vs2, vfloat32m2_t vs1,
                                        size_t vl);
vfloat32m2_t __riscv_vfsgnj_vf_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat32m2_t vs2, float rs1, size_t vl);
vfloat32m4_t __riscv_vfsgnj_vv_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat32m4_t vs2, vfloat32m4_t vs1,
                                        size_t vl);
vfloat32m4_t __riscv_vfsgnj_vf_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat32m4_t vs2, float rs1, size_t vl);
vfloat32m8_t __riscv_vfsgnj_vv_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat32m8_t vs2, vfloat32m8_t vs1,
                                        size_t vl);
vfloat32m8_t __riscv_vfsgnj_vf_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat32m8_t vs2, float rs1, size_t vl);
vfloat64m1_t __riscv_vfsgnj_vv_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat64m1_t vs2, vfloat64m1_t vs1,
                                        size_t vl);
vfloat64m1_t __riscv_vfsgnj_vf_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat64m1_t vs2, double rs1,
                                        size_t vl);
vfloat64m2_t __riscv_vfsgnj_vv_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat64m2_t vs2, vfloat64m2_t vs1,
                                        size_t vl);
vfloat64m2_t __riscv_vfsgnj_vf_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat64m2_t vs2, double rs1,
                                        size_t vl);
vfloat64m4_t __riscv_vfsgnj_vv_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat64m4_t vs2, vfloat64m4_t vs1,
                                        size_t vl);
vfloat64m4_t __riscv_vfsgnj_vf_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat64m4_t vs2, double rs1,
                                        size_t vl);
vfloat64m8_t __riscv_vfsgnj_vv_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat64m8_t vs2, vfloat64m8_t vs1,
                                        size_t vl);
vfloat64m8_t __riscv_vfsgnj_vf_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat64m8_t vs2, double rs1,
                                        size_t vl);
// vfsgnjn, masked `_mu` variants for f16mf4 through f64m8.
// Every overload takes the mask `vm` first, then `vd`, the vector source
// `vs2`, the second operand as a vector `vs1` (`_vv`) or a scalar `rs1`
// (`_vf`), and finally `vl`. The mask type is vboolN_t with N = element bits /
// LMUL as spelled in the type suffix (e.g. f16mf4 -> vbool64_t,
// f64m8 -> vbool8_t).
// NOTE(review): `_mu` presumably denotes the tail-agnostic, mask-undisturbed
// policy — confirm against the intrinsics naming scheme.
vfloat16mf4_t __riscv_vfsgnjn_vv_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                           vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                           size_t vl);
vfloat16mf4_t __riscv_vfsgnjn_vf_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                           vfloat16mf4_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat16mf2_t __riscv_vfsgnjn_vv_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                           vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                           size_t vl);
vfloat16mf2_t __riscv_vfsgnjn_vf_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                           vfloat16mf2_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat16m1_t __riscv_vfsgnjn_vv_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                         vfloat16m1_t vs2, vfloat16m1_t vs1,
                                         size_t vl);
vfloat16m1_t __riscv_vfsgnjn_vf_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                         vfloat16m1_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m2_t __riscv_vfsgnjn_vv_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                         vfloat16m2_t vs2, vfloat16m2_t vs1,
                                         size_t vl);
vfloat16m2_t __riscv_vfsgnjn_vf_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                         vfloat16m2_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m4_t __riscv_vfsgnjn_vv_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                         vfloat16m4_t vs2, vfloat16m4_t vs1,
                                         size_t vl);
vfloat16m4_t __riscv_vfsgnjn_vf_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                         vfloat16m4_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m8_t __riscv_vfsgnjn_vv_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                         vfloat16m8_t vs2, vfloat16m8_t vs1,
                                         size_t vl);
vfloat16m8_t __riscv_vfsgnjn_vf_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                         vfloat16m8_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat32mf2_t __riscv_vfsgnjn_vv_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                           size_t vl);
vfloat32mf2_t __riscv_vfsgnjn_vf_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs2, float rs1,
                                           size_t vl);
vfloat32m1_t __riscv_vfsgnjn_vv_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs2, vfloat32m1_t vs1,
                                         size_t vl);
vfloat32m1_t __riscv_vfsgnjn_vf_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs2, float rs1,
                                         size_t vl);
vfloat32m2_t __riscv_vfsgnjn_vv_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs2, vfloat32m2_t vs1,
                                         size_t vl);
vfloat32m2_t __riscv_vfsgnjn_vf_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs2, float rs1,
                                         size_t vl);
vfloat32m4_t __riscv_vfsgnjn_vv_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs2, vfloat32m4_t vs1,
                                         size_t vl);
vfloat32m4_t __riscv_vfsgnjn_vf_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs2, float rs1,
                                         size_t vl);
vfloat32m8_t __riscv_vfsgnjn_vv_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs2, vfloat32m8_t vs1,
                                         size_t vl);
vfloat32m8_t __riscv_vfsgnjn_vf_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs2, float rs1,
                                         size_t vl);
vfloat64m1_t __riscv_vfsgnjn_vv_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs2, vfloat64m1_t vs1,
                                         size_t vl);
vfloat64m1_t __riscv_vfsgnjn_vf_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs2, double rs1,
                                         size_t vl);
vfloat64m2_t __riscv_vfsgnjn_vv_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs2, vfloat64m2_t vs1,
                                         size_t vl);
vfloat64m2_t __riscv_vfsgnjn_vf_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs2, double rs1,
                                         size_t vl);
vfloat64m4_t __riscv_vfsgnjn_vv_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs2, vfloat64m4_t vs1,
                                         size_t vl);
vfloat64m4_t __riscv_vfsgnjn_vf_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs2, double rs1,
                                         size_t vl);
vfloat64m8_t __riscv_vfsgnjn_vv_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs2, vfloat64m8_t vs1,
                                         size_t vl);
vfloat64m8_t __riscv_vfsgnjn_vf_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs2, double rs1,
                                         size_t vl);
// vfsgnjx, masked `_mu` variants for f16mf4 through f64m8.
// Every overload takes the mask `vm` first, then `vd`, the vector source
// `vs2`, the second operand as a vector `vs1` (`_vv`) or a scalar `rs1`
// (`_vf`), and finally `vl`. The mask type is vboolN_t with N = element bits /
// LMUL as spelled in the type suffix (e.g. f16mf4 -> vbool64_t,
// f64m8 -> vbool8_t).
// NOTE(review): `_mu` presumably denotes the tail-agnostic, mask-undisturbed
// policy — confirm against the intrinsics naming scheme.
vfloat16mf4_t __riscv_vfsgnjx_vv_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                           vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                           size_t vl);
vfloat16mf4_t __riscv_vfsgnjx_vf_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                           vfloat16mf4_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat16mf2_t __riscv_vfsgnjx_vv_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                           vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                           size_t vl);
vfloat16mf2_t __riscv_vfsgnjx_vf_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                           vfloat16mf2_t vs2, _Float16 rs1,
                                           size_t vl);
vfloat16m1_t __riscv_vfsgnjx_vv_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                         vfloat16m1_t vs2, vfloat16m1_t vs1,
                                         size_t vl);
vfloat16m1_t __riscv_vfsgnjx_vf_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                         vfloat16m1_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m2_t __riscv_vfsgnjx_vv_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                         vfloat16m2_t vs2, vfloat16m2_t vs1,
                                         size_t vl);
vfloat16m2_t __riscv_vfsgnjx_vf_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                         vfloat16m2_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m4_t __riscv_vfsgnjx_vv_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                         vfloat16m4_t vs2, vfloat16m4_t vs1,
                                         size_t vl);
vfloat16m4_t __riscv_vfsgnjx_vf_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                         vfloat16m4_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat16m8_t __riscv_vfsgnjx_vv_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                         vfloat16m8_t vs2, vfloat16m8_t vs1,
                                         size_t vl);
vfloat16m8_t __riscv_vfsgnjx_vf_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                         vfloat16m8_t vs2, _Float16 rs1,
                                         size_t vl);
vfloat32mf2_t __riscv_vfsgnjx_vv_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                           size_t vl);
vfloat32mf2_t __riscv_vfsgnjx_vf_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                           vfloat32mf2_t vs2, float rs1,
                                           size_t vl);
vfloat32m1_t __riscv_vfsgnjx_vv_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs2, vfloat32m1_t vs1,
                                         size_t vl);
vfloat32m1_t __riscv_vfsgnjx_vf_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                         vfloat32m1_t vs2, float rs1,
                                         size_t vl);
vfloat32m2_t __riscv_vfsgnjx_vv_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs2, vfloat32m2_t vs1,
                                         size_t vl);
vfloat32m2_t __riscv_vfsgnjx_vf_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                         vfloat32m2_t vs2, float rs1,
                                         size_t vl);
vfloat32m4_t __riscv_vfsgnjx_vv_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs2, vfloat32m4_t vs1,
                                         size_t vl);
vfloat32m4_t __riscv_vfsgnjx_vf_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                         vfloat32m4_t vs2, float rs1,
                                         size_t vl);
vfloat32m8_t __riscv_vfsgnjx_vv_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs2, vfloat32m8_t vs1,
                                         size_t vl);
vfloat32m8_t __riscv_vfsgnjx_vf_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                         vfloat32m8_t vs2, float rs1,
                                         size_t vl);
vfloat64m1_t __riscv_vfsgnjx_vv_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs2, vfloat64m1_t vs1,
                                         size_t vl);
vfloat64m1_t __riscv_vfsgnjx_vf_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                         vfloat64m1_t vs2, double rs1,
                                         size_t vl);
vfloat64m2_t __riscv_vfsgnjx_vv_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs2, vfloat64m2_t vs1,
                                         size_t vl);
vfloat64m2_t __riscv_vfsgnjx_vf_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                         vfloat64m2_t vs2, double rs1,
                                         size_t vl);
vfloat64m4_t __riscv_vfsgnjx_vv_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs2, vfloat64m4_t vs1,
                                         size_t vl);
vfloat64m4_t __riscv_vfsgnjx_vf_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                         vfloat64m4_t vs2, double rs1,
                                         size_t vl);
vfloat64m8_t __riscv_vfsgnjx_vv_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs2, vfloat64m8_t vs1,
                                         size_t vl);
vfloat64m8_t __riscv_vfsgnjx_vf_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                         vfloat64m8_t vs2, double rs1,
                                         size_t vl);

Vector Floating-Point Absolute Value Intrinsics

// vfabs (absolute value), `_tu` variants for f16mf4 through f64m8.
// These overloads have no mask argument: each takes `vd`, the vector source
// `vs2`, and `vl`, and returns the same vector type as its operands.
// NOTE(review): `_tu` presumably denotes the unmasked tail-undisturbed policy
// — confirm against the intrinsics naming scheme.
vfloat16mf4_t __riscv_vfabs_v_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                        size_t vl);
vfloat16mf2_t __riscv_vfabs_v_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                        size_t vl);
vfloat16m1_t __riscv_vfabs_v_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                      size_t vl);
vfloat16m2_t __riscv_vfabs_v_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                      size_t vl);
vfloat16m4_t __riscv_vfabs_v_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                      size_t vl);
vfloat16m8_t __riscv_vfabs_v_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                      size_t vl);
vfloat32mf2_t __riscv_vfabs_v_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                        size_t vl);
vfloat32m1_t __riscv_vfabs_v_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                      size_t vl);
vfloat32m2_t __riscv_vfabs_v_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                      size_t vl);
vfloat32m4_t __riscv_vfabs_v_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                      size_t vl);
vfloat32m8_t __riscv_vfabs_v_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                      size_t vl);
vfloat64m1_t __riscv_vfabs_v_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                      size_t vl);
vfloat64m2_t __riscv_vfabs_v_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                      size_t vl);
vfloat64m4_t __riscv_vfabs_v_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                      size_t vl);
vfloat64m8_t __riscv_vfabs_v_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                      size_t vl);
// masked functions, `_tum` policy suffix: vfabs for f16mf4 through f64m8.
// Each overload takes the mask `vm` first, then `vd`, the vector source `vs2`,
// and `vl`. The mask type is vboolN_t with N = element bits / LMUL as spelled
// in the type suffix (e.g. f16mf4 -> vbool64_t, f64m8 -> vbool8_t).
// NOTE(review): `_tum` presumably denotes the tail-undisturbed, mask-agnostic
// policy — confirm against the intrinsics naming scheme.
vfloat16mf4_t __riscv_vfabs_v_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                         vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfabs_v_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                         vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfabs_v_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                       vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfabs_v_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                       vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfabs_v_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                       vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfabs_v_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                       vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfabs_v_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                         vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfabs_v_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                       vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfabs_v_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                       vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfabs_v_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                       vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfabs_v_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                       vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfabs_v_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                       vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfabs_v_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                       vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfabs_v_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                       vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfabs_v_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                       vfloat64m8_t vs2, size_t vl);
// masked functions, `_tumu` policy suffix: vfabs for f16mf4 through f64m8.
// Each overload takes the mask `vm` first, then `vd`, the vector source `vs2`,
// and `vl`. The mask type is vboolN_t with N = element bits / LMUL as spelled
// in the type suffix (e.g. f16mf4 -> vbool64_t, f64m8 -> vbool8_t).
// NOTE(review): `_tumu` presumably denotes the tail-undisturbed,
// mask-undisturbed policy — confirm against the intrinsics naming scheme.
vfloat16mf4_t __riscv_vfabs_v_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                          vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfabs_v_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                          vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfabs_v_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                        vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfabs_v_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                        vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfabs_v_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                        vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfabs_v_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                        vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfabs_v_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                          vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfabs_v_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                        vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfabs_v_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfabs_v_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                        vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfabs_v_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                        vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfabs_v_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                        vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfabs_v_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                        vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfabs_v_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                        vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfabs_v_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                        vfloat64m8_t vs2, size_t vl);
// masked functions
// __riscv_vfabs_v_*_mu: one prototype per floating-point vector type. Each
// takes (vm, vd, vs2, vl); vd, vs2 and the return value share one vector type,
// and vm is a vboolN_t mask.
// NOTE(review): `_mu` presumably selects the mask-undisturbed policy with vd
// as the pass-through operand -- confirm against the intrinsic naming rules.
// f16 variants, LMUL mf4..m8.
vfloat16mf4_t __riscv_vfabs_v_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                        vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfabs_v_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                        vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfabs_v_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                      vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfabs_v_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                      vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfabs_v_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                      vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfabs_v_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                      vfloat16m8_t vs2, size_t vl);
// f32 variants, LMUL mf2..m8.
vfloat32mf2_t __riscv_vfabs_v_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                        vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfabs_v_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                      vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfabs_v_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                      vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfabs_v_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                      vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfabs_v_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                      vfloat32m8_t vs2, size_t vl);
// f64 variants, LMUL m1..m8.
vfloat64m1_t __riscv_vfabs_v_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                      vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfabs_v_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                      vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfabs_v_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                      vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfabs_v_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                      vfloat64m8_t vs2, size_t vl);

Vector Floating-Point Compare Intrinsics

// masked functions
// __riscv_vmfeq_{vv,vf}_*_mu: for each source vector type there is a `_vv_`
// prototype (second operand is the vector vs1) followed by a `_vf_` prototype
// (second operand is the scalar rs1). The return value, vm and vd all share
// the vboolN_t type named by the `_bN` suffix.
// NOTE(review): "vmfeq" presumably denotes the floating-point equal compare
// and `_mu` the mask-undisturbed policy -- confirm against the RVV spec.
// f16 sources: the scalar operand is _Float16.
vbool64_t __riscv_vmfeq_vv_f16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmfeq_vf_f16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vfloat16mf4_t vs2, _Float16 rs1,
                                         size_t vl);
vbool32_t __riscv_vmfeq_vv_f16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                         size_t vl);
vbool32_t __riscv_vmfeq_vf_f16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vfloat16mf2_t vs2, _Float16 rs1,
                                         size_t vl);
vbool16_t __riscv_vmfeq_vv_f16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat16m1_t vs2, vfloat16m1_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmfeq_vf_f16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat16m1_t vs2, _Float16 rs1,
                                        size_t vl);
vbool8_t __riscv_vmfeq_vv_f16m2_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat16m2_t vs2, vfloat16m2_t vs1,
                                      size_t vl);
vbool8_t __riscv_vmfeq_vf_f16m2_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat16m2_t vs2, _Float16 rs1,
                                      size_t vl);
vbool4_t __riscv_vmfeq_vv_f16m4_b4_mu(vbool4_t vm, vbool4_t vd,
                                      vfloat16m4_t vs2, vfloat16m4_t vs1,
                                      size_t vl);
vbool4_t __riscv_vmfeq_vf_f16m4_b4_mu(vbool4_t vm, vbool4_t vd,
                                      vfloat16m4_t vs2, _Float16 rs1,
                                      size_t vl);
vbool2_t __riscv_vmfeq_vv_f16m8_b2_mu(vbool2_t vm, vbool2_t vd,
                                      vfloat16m8_t vs2, vfloat16m8_t vs1,
                                      size_t vl);
vbool2_t __riscv_vmfeq_vf_f16m8_b2_mu(vbool2_t vm, vbool2_t vd,
                                      vfloat16m8_t vs2, _Float16 rs1,
                                      size_t vl);
// f32 sources: the scalar operand is float.
vbool64_t __riscv_vmfeq_vv_f32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmfeq_vf_f32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vfloat32mf2_t vs2, float rs1,
                                         size_t vl);
vbool32_t __riscv_vmfeq_vv_f32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vfloat32m1_t vs2, vfloat32m1_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmfeq_vf_f32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vfloat32m1_t vs2, float rs1, size_t vl);
vbool16_t __riscv_vmfeq_vv_f32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat32m2_t vs2, vfloat32m2_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmfeq_vf_f32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat32m2_t vs2, float rs1, size_t vl);
vbool8_t __riscv_vmfeq_vv_f32m4_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat32m4_t vs2, vfloat32m4_t vs1,
                                      size_t vl);
vbool8_t __riscv_vmfeq_vf_f32m4_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat32m4_t vs2, float rs1, size_t vl);
vbool4_t __riscv_vmfeq_vv_f32m8_b4_mu(vbool4_t vm, vbool4_t vd,
                                      vfloat32m8_t vs2, vfloat32m8_t vs1,
                                      size_t vl);
vbool4_t __riscv_vmfeq_vf_f32m8_b4_mu(vbool4_t vm, vbool4_t vd,
                                      vfloat32m8_t vs2, float rs1, size_t vl);
// f64 sources: the scalar operand is double.
vbool64_t __riscv_vmfeq_vv_f64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vfloat64m1_t vs2, vfloat64m1_t vs1,
                                        size_t vl);
vbool64_t __riscv_vmfeq_vf_f64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vfloat64m1_t vs2, double rs1,
                                        size_t vl);
vbool32_t __riscv_vmfeq_vv_f64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vfloat64m2_t vs2, vfloat64m2_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmfeq_vf_f64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vfloat64m2_t vs2, double rs1,
                                        size_t vl);
vbool16_t __riscv_vmfeq_vv_f64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat64m4_t vs2, vfloat64m4_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmfeq_vf_f64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat64m4_t vs2, double rs1,
                                        size_t vl);
vbool8_t __riscv_vmfeq_vv_f64m8_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat64m8_t vs2, vfloat64m8_t vs1,
                                      size_t vl);
vbool8_t __riscv_vmfeq_vf_f64m8_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat64m8_t vs2, double rs1, size_t vl);
// __riscv_vmfne_{vv,vf}_*_mu: for each source vector type there is a `_vv_`
// prototype (second operand is the vector vs1) followed by a `_vf_` prototype
// (second operand is the scalar rs1). The return value, vm and vd all share
// the vboolN_t type named by the `_bN` suffix.
// NOTE(review): "vmfne" presumably denotes the floating-point not-equal
// compare -- confirm against the RVV spec.
// f16 sources: the scalar operand is _Float16.
vbool64_t __riscv_vmfne_vv_f16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmfne_vf_f16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vfloat16mf4_t vs2, _Float16 rs1,
                                         size_t vl);
vbool32_t __riscv_vmfne_vv_f16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                         size_t vl);
vbool32_t __riscv_vmfne_vf_f16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vfloat16mf2_t vs2, _Float16 rs1,
                                         size_t vl);
vbool16_t __riscv_vmfne_vv_f16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat16m1_t vs2, vfloat16m1_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmfne_vf_f16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat16m1_t vs2, _Float16 rs1,
                                        size_t vl);
vbool8_t __riscv_vmfne_vv_f16m2_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat16m2_t vs2, vfloat16m2_t vs1,
                                      size_t vl);
vbool8_t __riscv_vmfne_vf_f16m2_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat16m2_t vs2, _Float16 rs1,
                                      size_t vl);
vbool4_t __riscv_vmfne_vv_f16m4_b4_mu(vbool4_t vm, vbool4_t vd,
                                      vfloat16m4_t vs2, vfloat16m4_t vs1,
                                      size_t vl);
vbool4_t __riscv_vmfne_vf_f16m4_b4_mu(vbool4_t vm, vbool4_t vd,
                                      vfloat16m4_t vs2, _Float16 rs1,
                                      size_t vl);
vbool2_t __riscv_vmfne_vv_f16m8_b2_mu(vbool2_t vm, vbool2_t vd,
                                      vfloat16m8_t vs2, vfloat16m8_t vs1,
                                      size_t vl);
vbool2_t __riscv_vmfne_vf_f16m8_b2_mu(vbool2_t vm, vbool2_t vd,
                                      vfloat16m8_t vs2, _Float16 rs1,
                                      size_t vl);
// f32 sources: the scalar operand is float.
vbool64_t __riscv_vmfne_vv_f32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmfne_vf_f32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vfloat32mf2_t vs2, float rs1,
                                         size_t vl);
vbool32_t __riscv_vmfne_vv_f32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vfloat32m1_t vs2, vfloat32m1_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmfne_vf_f32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vfloat32m1_t vs2, float rs1, size_t vl);
vbool16_t __riscv_vmfne_vv_f32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat32m2_t vs2, vfloat32m2_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmfne_vf_f32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat32m2_t vs2, float rs1, size_t vl);
vbool8_t __riscv_vmfne_vv_f32m4_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat32m4_t vs2, vfloat32m4_t vs1,
                                      size_t vl);
vbool8_t __riscv_vmfne_vf_f32m4_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat32m4_t vs2, float rs1, size_t vl);
vbool4_t __riscv_vmfne_vv_f32m8_b4_mu(vbool4_t vm, vbool4_t vd,
                                      vfloat32m8_t vs2, vfloat32m8_t vs1,
                                      size_t vl);
vbool4_t __riscv_vmfne_vf_f32m8_b4_mu(vbool4_t vm, vbool4_t vd,
                                      vfloat32m8_t vs2, float rs1, size_t vl);
// f64 sources: the scalar operand is double.
vbool64_t __riscv_vmfne_vv_f64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vfloat64m1_t vs2, vfloat64m1_t vs1,
                                        size_t vl);
vbool64_t __riscv_vmfne_vf_f64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vfloat64m1_t vs2, double rs1,
                                        size_t vl);
vbool32_t __riscv_vmfne_vv_f64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vfloat64m2_t vs2, vfloat64m2_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmfne_vf_f64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vfloat64m2_t vs2, double rs1,
                                        size_t vl);
vbool16_t __riscv_vmfne_vv_f64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat64m4_t vs2, vfloat64m4_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmfne_vf_f64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat64m4_t vs2, double rs1,
                                        size_t vl);
vbool8_t __riscv_vmfne_vv_f64m8_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat64m8_t vs2, vfloat64m8_t vs1,
                                      size_t vl);
vbool8_t __riscv_vmfne_vf_f64m8_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat64m8_t vs2, double rs1, size_t vl);
// __riscv_vmflt_{vv,vf}_*_mu: for each source vector type there is a `_vv_`
// prototype (second operand is the vector vs1) followed by a `_vf_` prototype
// (second operand is the scalar rs1). The return value, vm and vd all share
// the vboolN_t type named by the `_bN` suffix.
// NOTE(review): "vmflt" presumably denotes the floating-point less-than
// compare -- confirm against the RVV spec.
// f16 sources: the scalar operand is _Float16.
vbool64_t __riscv_vmflt_vv_f16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmflt_vf_f16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vfloat16mf4_t vs2, _Float16 rs1,
                                         size_t vl);
vbool32_t __riscv_vmflt_vv_f16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                         size_t vl);
vbool32_t __riscv_vmflt_vf_f16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vfloat16mf2_t vs2, _Float16 rs1,
                                         size_t vl);
vbool16_t __riscv_vmflt_vv_f16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat16m1_t vs2, vfloat16m1_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmflt_vf_f16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat16m1_t vs2, _Float16 rs1,
                                        size_t vl);
vbool8_t __riscv_vmflt_vv_f16m2_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat16m2_t vs2, vfloat16m2_t vs1,
                                      size_t vl);
vbool8_t __riscv_vmflt_vf_f16m2_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat16m2_t vs2, _Float16 rs1,
                                      size_t vl);
vbool4_t __riscv_vmflt_vv_f16m4_b4_mu(vbool4_t vm, vbool4_t vd,
                                      vfloat16m4_t vs2, vfloat16m4_t vs1,
                                      size_t vl);
vbool4_t __riscv_vmflt_vf_f16m4_b4_mu(vbool4_t vm, vbool4_t vd,
                                      vfloat16m4_t vs2, _Float16 rs1,
                                      size_t vl);
vbool2_t __riscv_vmflt_vv_f16m8_b2_mu(vbool2_t vm, vbool2_t vd,
                                      vfloat16m8_t vs2, vfloat16m8_t vs1,
                                      size_t vl);
vbool2_t __riscv_vmflt_vf_f16m8_b2_mu(vbool2_t vm, vbool2_t vd,
                                      vfloat16m8_t vs2, _Float16 rs1,
                                      size_t vl);
// f32 sources: the scalar operand is float.
vbool64_t __riscv_vmflt_vv_f32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmflt_vf_f32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vfloat32mf2_t vs2, float rs1,
                                         size_t vl);
vbool32_t __riscv_vmflt_vv_f32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vfloat32m1_t vs2, vfloat32m1_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmflt_vf_f32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vfloat32m1_t vs2, float rs1, size_t vl);
vbool16_t __riscv_vmflt_vv_f32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat32m2_t vs2, vfloat32m2_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmflt_vf_f32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat32m2_t vs2, float rs1, size_t vl);
vbool8_t __riscv_vmflt_vv_f32m4_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat32m4_t vs2, vfloat32m4_t vs1,
                                      size_t vl);
vbool8_t __riscv_vmflt_vf_f32m4_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat32m4_t vs2, float rs1, size_t vl);
vbool4_t __riscv_vmflt_vv_f32m8_b4_mu(vbool4_t vm, vbool4_t vd,
                                      vfloat32m8_t vs2, vfloat32m8_t vs1,
                                      size_t vl);
vbool4_t __riscv_vmflt_vf_f32m8_b4_mu(vbool4_t vm, vbool4_t vd,
                                      vfloat32m8_t vs2, float rs1, size_t vl);
// f64 sources: the scalar operand is double.
vbool64_t __riscv_vmflt_vv_f64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vfloat64m1_t vs2, vfloat64m1_t vs1,
                                        size_t vl);
vbool64_t __riscv_vmflt_vf_f64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vfloat64m1_t vs2, double rs1,
                                        size_t vl);
vbool32_t __riscv_vmflt_vv_f64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vfloat64m2_t vs2, vfloat64m2_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmflt_vf_f64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vfloat64m2_t vs2, double rs1,
                                        size_t vl);
vbool16_t __riscv_vmflt_vv_f64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat64m4_t vs2, vfloat64m4_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmflt_vf_f64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat64m4_t vs2, double rs1,
                                        size_t vl);
vbool8_t __riscv_vmflt_vv_f64m8_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat64m8_t vs2, vfloat64m8_t vs1,
                                      size_t vl);
vbool8_t __riscv_vmflt_vf_f64m8_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat64m8_t vs2, double rs1, size_t vl);
// __riscv_vmfle_{vv,vf}_*_mu: for each source vector type there is a `_vv_`
// prototype (second operand is the vector vs1) followed by a `_vf_` prototype
// (second operand is the scalar rs1). The return value, vm and vd all share
// the vboolN_t type named by the `_bN` suffix.
// NOTE(review): "vmfle" presumably denotes the floating-point
// less-than-or-equal compare -- confirm against the RVV spec.
// f16 sources: the scalar operand is _Float16.
vbool64_t __riscv_vmfle_vv_f16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmfle_vf_f16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vfloat16mf4_t vs2, _Float16 rs1,
                                         size_t vl);
vbool32_t __riscv_vmfle_vv_f16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                         size_t vl);
vbool32_t __riscv_vmfle_vf_f16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vfloat16mf2_t vs2, _Float16 rs1,
                                         size_t vl);
vbool16_t __riscv_vmfle_vv_f16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat16m1_t vs2, vfloat16m1_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmfle_vf_f16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat16m1_t vs2, _Float16 rs1,
                                        size_t vl);
vbool8_t __riscv_vmfle_vv_f16m2_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat16m2_t vs2, vfloat16m2_t vs1,
                                      size_t vl);
vbool8_t __riscv_vmfle_vf_f16m2_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat16m2_t vs2, _Float16 rs1,
                                      size_t vl);
vbool4_t __riscv_vmfle_vv_f16m4_b4_mu(vbool4_t vm, vbool4_t vd,
                                      vfloat16m4_t vs2, vfloat16m4_t vs1,
                                      size_t vl);
vbool4_t __riscv_vmfle_vf_f16m4_b4_mu(vbool4_t vm, vbool4_t vd,
                                      vfloat16m4_t vs2, _Float16 rs1,
                                      size_t vl);
vbool2_t __riscv_vmfle_vv_f16m8_b2_mu(vbool2_t vm, vbool2_t vd,
                                      vfloat16m8_t vs2, vfloat16m8_t vs1,
                                      size_t vl);
vbool2_t __riscv_vmfle_vf_f16m8_b2_mu(vbool2_t vm, vbool2_t vd,
                                      vfloat16m8_t vs2, _Float16 rs1,
                                      size_t vl);
// f32 sources: the scalar operand is float.
vbool64_t __riscv_vmfle_vv_f32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmfle_vf_f32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vfloat32mf2_t vs2, float rs1,
                                         size_t vl);
vbool32_t __riscv_vmfle_vv_f32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vfloat32m1_t vs2, vfloat32m1_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmfle_vf_f32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vfloat32m1_t vs2, float rs1, size_t vl);
vbool16_t __riscv_vmfle_vv_f32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat32m2_t vs2, vfloat32m2_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmfle_vf_f32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat32m2_t vs2, float rs1, size_t vl);
vbool8_t __riscv_vmfle_vv_f32m4_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat32m4_t vs2, vfloat32m4_t vs1,
                                      size_t vl);
vbool8_t __riscv_vmfle_vf_f32m4_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat32m4_t vs2, float rs1, size_t vl);
vbool4_t __riscv_vmfle_vv_f32m8_b4_mu(vbool4_t vm, vbool4_t vd,
                                      vfloat32m8_t vs2, vfloat32m8_t vs1,
                                      size_t vl);
vbool4_t __riscv_vmfle_vf_f32m8_b4_mu(vbool4_t vm, vbool4_t vd,
                                      vfloat32m8_t vs2, float rs1, size_t vl);
// f64 sources: the scalar operand is double.
vbool64_t __riscv_vmfle_vv_f64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vfloat64m1_t vs2, vfloat64m1_t vs1,
                                        size_t vl);
vbool64_t __riscv_vmfle_vf_f64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vfloat64m1_t vs2, double rs1,
                                        size_t vl);
vbool32_t __riscv_vmfle_vv_f64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vfloat64m2_t vs2, vfloat64m2_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmfle_vf_f64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vfloat64m2_t vs2, double rs1,
                                        size_t vl);
vbool16_t __riscv_vmfle_vv_f64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat64m4_t vs2, vfloat64m4_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmfle_vf_f64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat64m4_t vs2, double rs1,
                                        size_t vl);
vbool8_t __riscv_vmfle_vv_f64m8_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat64m8_t vs2, vfloat64m8_t vs1,
                                      size_t vl);
vbool8_t __riscv_vmfle_vf_f64m8_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat64m8_t vs2, double rs1, size_t vl);
// __riscv_vmfgt_{vv,vf}_*_mu: for each source vector type there is a `_vv_`
// prototype (second operand is the vector vs1) followed by a `_vf_` prototype
// (second operand is the scalar rs1). The return value, vm and vd all share
// the vboolN_t type named by the `_bN` suffix.
// NOTE(review): "vmfgt" presumably denotes the floating-point greater-than
// compare -- confirm against the RVV spec.
// f16 sources: the scalar operand is _Float16.
vbool64_t __riscv_vmfgt_vv_f16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmfgt_vf_f16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vfloat16mf4_t vs2, _Float16 rs1,
                                         size_t vl);
vbool32_t __riscv_vmfgt_vv_f16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                         size_t vl);
vbool32_t __riscv_vmfgt_vf_f16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vfloat16mf2_t vs2, _Float16 rs1,
                                         size_t vl);
vbool16_t __riscv_vmfgt_vv_f16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat16m1_t vs2, vfloat16m1_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmfgt_vf_f16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat16m1_t vs2, _Float16 rs1,
                                        size_t vl);
vbool8_t __riscv_vmfgt_vv_f16m2_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat16m2_t vs2, vfloat16m2_t vs1,
                                      size_t vl);
vbool8_t __riscv_vmfgt_vf_f16m2_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat16m2_t vs2, _Float16 rs1,
                                      size_t vl);
vbool4_t __riscv_vmfgt_vv_f16m4_b4_mu(vbool4_t vm, vbool4_t vd,
                                      vfloat16m4_t vs2, vfloat16m4_t vs1,
                                      size_t vl);
vbool4_t __riscv_vmfgt_vf_f16m4_b4_mu(vbool4_t vm, vbool4_t vd,
                                      vfloat16m4_t vs2, _Float16 rs1,
                                      size_t vl);
vbool2_t __riscv_vmfgt_vv_f16m8_b2_mu(vbool2_t vm, vbool2_t vd,
                                      vfloat16m8_t vs2, vfloat16m8_t vs1,
                                      size_t vl);
vbool2_t __riscv_vmfgt_vf_f16m8_b2_mu(vbool2_t vm, vbool2_t vd,
                                      vfloat16m8_t vs2, _Float16 rs1,
                                      size_t vl);
// f32 sources: the scalar operand is float.
vbool64_t __riscv_vmfgt_vv_f32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmfgt_vf_f32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vfloat32mf2_t vs2, float rs1,
                                         size_t vl);
vbool32_t __riscv_vmfgt_vv_f32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vfloat32m1_t vs2, vfloat32m1_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmfgt_vf_f32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vfloat32m1_t vs2, float rs1, size_t vl);
vbool16_t __riscv_vmfgt_vv_f32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat32m2_t vs2, vfloat32m2_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmfgt_vf_f32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat32m2_t vs2, float rs1, size_t vl);
vbool8_t __riscv_vmfgt_vv_f32m4_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat32m4_t vs2, vfloat32m4_t vs1,
                                      size_t vl);
vbool8_t __riscv_vmfgt_vf_f32m4_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat32m4_t vs2, float rs1, size_t vl);
vbool4_t __riscv_vmfgt_vv_f32m8_b4_mu(vbool4_t vm, vbool4_t vd,
                                      vfloat32m8_t vs2, vfloat32m8_t vs1,
                                      size_t vl);
vbool4_t __riscv_vmfgt_vf_f32m8_b4_mu(vbool4_t vm, vbool4_t vd,
                                      vfloat32m8_t vs2, float rs1, size_t vl);
// f64 sources: the scalar operand is double.
vbool64_t __riscv_vmfgt_vv_f64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vfloat64m1_t vs2, vfloat64m1_t vs1,
                                        size_t vl);
vbool64_t __riscv_vmfgt_vf_f64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vfloat64m1_t vs2, double rs1,
                                        size_t vl);
vbool32_t __riscv_vmfgt_vv_f64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vfloat64m2_t vs2, vfloat64m2_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmfgt_vf_f64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vfloat64m2_t vs2, double rs1,
                                        size_t vl);
vbool16_t __riscv_vmfgt_vv_f64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat64m4_t vs2, vfloat64m4_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmfgt_vf_f64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat64m4_t vs2, double rs1,
                                        size_t vl);
vbool8_t __riscv_vmfgt_vv_f64m8_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat64m8_t vs2, vfloat64m8_t vs1,
                                      size_t vl);
vbool8_t __riscv_vmfgt_vf_f64m8_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat64m8_t vs2, double rs1, size_t vl);
// __riscv_vmfge_{vv,vf}_*_mu: for each source vector type there is a `_vv_`
// prototype (second operand is the vector vs1) followed by a `_vf_` prototype
// (second operand is the scalar rs1). The return value, vm and vd all share
// the vboolN_t type named by the `_bN` suffix.
// NOTE(review): "vmfge" presumably denotes the floating-point
// greater-than-or-equal compare -- confirm against the RVV spec.
// f16 sources: the scalar operand is _Float16.
vbool64_t __riscv_vmfge_vv_f16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmfge_vf_f16mf4_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vfloat16mf4_t vs2, _Float16 rs1,
                                         size_t vl);
vbool32_t __riscv_vmfge_vv_f16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                         size_t vl);
vbool32_t __riscv_vmfge_vf_f16mf2_b32_mu(vbool32_t vm, vbool32_t vd,
                                         vfloat16mf2_t vs2, _Float16 rs1,
                                         size_t vl);
vbool16_t __riscv_vmfge_vv_f16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat16m1_t vs2, vfloat16m1_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmfge_vf_f16m1_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat16m1_t vs2, _Float16 rs1,
                                        size_t vl);
vbool8_t __riscv_vmfge_vv_f16m2_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat16m2_t vs2, vfloat16m2_t vs1,
                                      size_t vl);
vbool8_t __riscv_vmfge_vf_f16m2_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat16m2_t vs2, _Float16 rs1,
                                      size_t vl);
vbool4_t __riscv_vmfge_vv_f16m4_b4_mu(vbool4_t vm, vbool4_t vd,
                                      vfloat16m4_t vs2, vfloat16m4_t vs1,
                                      size_t vl);
vbool4_t __riscv_vmfge_vf_f16m4_b4_mu(vbool4_t vm, vbool4_t vd,
                                      vfloat16m4_t vs2, _Float16 rs1,
                                      size_t vl);
vbool2_t __riscv_vmfge_vv_f16m8_b2_mu(vbool2_t vm, vbool2_t vd,
                                      vfloat16m8_t vs2, vfloat16m8_t vs1,
                                      size_t vl);
vbool2_t __riscv_vmfge_vf_f16m8_b2_mu(vbool2_t vm, vbool2_t vd,
                                      vfloat16m8_t vs2, _Float16 rs1,
                                      size_t vl);
// f32 sources: the scalar operand is float.
vbool64_t __riscv_vmfge_vv_f32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                         size_t vl);
vbool64_t __riscv_vmfge_vf_f32mf2_b64_mu(vbool64_t vm, vbool64_t vd,
                                         vfloat32mf2_t vs2, float rs1,
                                         size_t vl);
vbool32_t __riscv_vmfge_vv_f32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vfloat32m1_t vs2, vfloat32m1_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmfge_vf_f32m1_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vfloat32m1_t vs2, float rs1, size_t vl);
vbool16_t __riscv_vmfge_vv_f32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat32m2_t vs2, vfloat32m2_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmfge_vf_f32m2_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat32m2_t vs2, float rs1, size_t vl);
vbool8_t __riscv_vmfge_vv_f32m4_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat32m4_t vs2, vfloat32m4_t vs1,
                                      size_t vl);
vbool8_t __riscv_vmfge_vf_f32m4_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat32m4_t vs2, float rs1, size_t vl);
vbool4_t __riscv_vmfge_vv_f32m8_b4_mu(vbool4_t vm, vbool4_t vd,
                                      vfloat32m8_t vs2, vfloat32m8_t vs1,
                                      size_t vl);
vbool4_t __riscv_vmfge_vf_f32m8_b4_mu(vbool4_t vm, vbool4_t vd,
                                      vfloat32m8_t vs2, float rs1, size_t vl);
// f64 sources begin here.
vbool64_t __riscv_vmfge_vv_f64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vfloat64m1_t vs2, vfloat64m1_t vs1,
                                        size_t vl);
vbool64_t __riscv_vmfge_vf_f64m1_b64_mu(vbool64_t vm, vbool64_t vd,
                                        vfloat64m1_t vs2, double rs1,
                                        size_t vl);
vbool32_t __riscv_vmfge_vv_f64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vfloat64m2_t vs2, vfloat64m2_t vs1,
                                        size_t vl);
vbool32_t __riscv_vmfge_vf_f64m2_b32_mu(vbool32_t vm, vbool32_t vd,
                                        vfloat64m2_t vs2, double rs1,
                                        size_t vl);
vbool16_t __riscv_vmfge_vv_f64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat64m4_t vs2, vfloat64m4_t vs1,
                                        size_t vl);
vbool16_t __riscv_vmfge_vf_f64m4_b16_mu(vbool16_t vm, vbool16_t vd,
                                        vfloat64m4_t vs2, double rs1,
                                        size_t vl);
vbool8_t __riscv_vmfge_vv_f64m8_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat64m8_t vs2, vfloat64m8_t vs1,
                                      size_t vl);
vbool8_t __riscv_vmfge_vf_f64m8_b8_mu(vbool8_t vm, vbool8_t vd,
                                      vfloat64m8_t vs2, double rs1, size_t vl);

Vector Floating-Point Classify Intrinsics

// Unmasked `_tu` forms: (vd, vs2, vl). The result and vd are unsigned-integer
// vectors whose element width and LMUL suffix match the floating-point source
// vs2 (e.g. vfloat16mf4_t -> vuint16mf4_t).
// NOTE(review): `_tu` presumably means tail-undisturbed — confirm against the
// RVV intrinsics policy naming.
vuint16mf4_t __riscv_vfclass_v_u16mf4_tu(vuint16mf4_t vd, vfloat16mf4_t vs2,
                                         size_t vl);
vuint16mf2_t __riscv_vfclass_v_u16mf2_tu(vuint16mf2_t vd, vfloat16mf2_t vs2,
                                         size_t vl);
vuint16m1_t __riscv_vfclass_v_u16m1_tu(vuint16m1_t vd, vfloat16m1_t vs2,
                                       size_t vl);
vuint16m2_t __riscv_vfclass_v_u16m2_tu(vuint16m2_t vd, vfloat16m2_t vs2,
                                       size_t vl);
vuint16m4_t __riscv_vfclass_v_u16m4_tu(vuint16m4_t vd, vfloat16m4_t vs2,
                                       size_t vl);
vuint16m8_t __riscv_vfclass_v_u16m8_tu(vuint16m8_t vd, vfloat16m8_t vs2,
                                       size_t vl);
vuint32mf2_t __riscv_vfclass_v_u32mf2_tu(vuint32mf2_t vd, vfloat32mf2_t vs2,
                                         size_t vl);
vuint32m1_t __riscv_vfclass_v_u32m1_tu(vuint32m1_t vd, vfloat32m1_t vs2,
                                       size_t vl);
vuint32m2_t __riscv_vfclass_v_u32m2_tu(vuint32m2_t vd, vfloat32m2_t vs2,
                                       size_t vl);
vuint32m4_t __riscv_vfclass_v_u32m4_tu(vuint32m4_t vd, vfloat32m4_t vs2,
                                       size_t vl);
vuint32m8_t __riscv_vfclass_v_u32m8_tu(vuint32m8_t vd, vfloat32m8_t vs2,
                                       size_t vl);
vuint64m1_t __riscv_vfclass_v_u64m1_tu(vuint64m1_t vd, vfloat64m1_t vs2,
                                       size_t vl);
vuint64m2_t __riscv_vfclass_v_u64m2_tu(vuint64m2_t vd, vfloat64m2_t vs2,
                                       size_t vl);
vuint64m4_t __riscv_vfclass_v_u64m4_tu(vuint64m4_t vd, vfloat64m4_t vs2,
                                       size_t vl);
vuint64m8_t __riscv_vfclass_v_u64m8_tu(vuint64m8_t vd, vfloat64m8_t vs2,
                                       size_t vl);
// masked functions (`_tum` suffix): each takes a leading vboolN_t mask vm
// ahead of (vd, vs2, vl).
// NOTE(review): `_tum` presumably means tail-undisturbed, mask-agnostic —
// confirm against the RVV intrinsics policy naming.
vuint16mf4_t __riscv_vfclass_v_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                          vfloat16mf4_t vs2, size_t vl);
vuint16mf2_t __riscv_vfclass_v_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                          vfloat16mf2_t vs2, size_t vl);
vuint16m1_t __riscv_vfclass_v_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                        vfloat16m1_t vs2, size_t vl);
vuint16m2_t __riscv_vfclass_v_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                        vfloat16m2_t vs2, size_t vl);
vuint16m4_t __riscv_vfclass_v_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                        vfloat16m4_t vs2, size_t vl);
vuint16m8_t __riscv_vfclass_v_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                        vfloat16m8_t vs2, size_t vl);
vuint32mf2_t __riscv_vfclass_v_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                          vfloat32mf2_t vs2, size_t vl);
vuint32m1_t __riscv_vfclass_v_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                        vfloat32m1_t vs2, size_t vl);
vuint32m2_t __riscv_vfclass_v_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                        vfloat32m2_t vs2, size_t vl);
vuint32m4_t __riscv_vfclass_v_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                        vfloat32m4_t vs2, size_t vl);
vuint32m8_t __riscv_vfclass_v_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                        vfloat32m8_t vs2, size_t vl);
vuint64m1_t __riscv_vfclass_v_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                        vfloat64m1_t vs2, size_t vl);
vuint64m2_t __riscv_vfclass_v_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                        vfloat64m2_t vs2, size_t vl);
vuint64m4_t __riscv_vfclass_v_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                        vfloat64m4_t vs2, size_t vl);
vuint64m8_t __riscv_vfclass_v_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                        vfloat64m8_t vs2, size_t vl);
// masked functions (`_tumu` suffix): each takes a leading vboolN_t mask vm
// ahead of (vd, vs2, vl).
// NOTE(review): `_tumu` presumably means tail-undisturbed, mask-undisturbed —
// confirm against the RVV intrinsics policy naming.
vuint16mf4_t __riscv_vfclass_v_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                           vfloat16mf4_t vs2, size_t vl);
vuint16mf2_t __riscv_vfclass_v_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                           vfloat16mf2_t vs2, size_t vl);
vuint16m1_t __riscv_vfclass_v_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                         vfloat16m1_t vs2, size_t vl);
vuint16m2_t __riscv_vfclass_v_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                         vfloat16m2_t vs2, size_t vl);
vuint16m4_t __riscv_vfclass_v_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                         vfloat16m4_t vs2, size_t vl);
vuint16m8_t __riscv_vfclass_v_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                         vfloat16m8_t vs2, size_t vl);
vuint32mf2_t __riscv_vfclass_v_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                           vfloat32mf2_t vs2, size_t vl);
vuint32m1_t __riscv_vfclass_v_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                         vfloat32m1_t vs2, size_t vl);
vuint32m2_t __riscv_vfclass_v_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                         vfloat32m2_t vs2, size_t vl);
vuint32m4_t __riscv_vfclass_v_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                         vfloat32m4_t vs2, size_t vl);
vuint32m8_t __riscv_vfclass_v_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                         vfloat32m8_t vs2, size_t vl);
vuint64m1_t __riscv_vfclass_v_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                         vfloat64m1_t vs2, size_t vl);
vuint64m2_t __riscv_vfclass_v_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                         vfloat64m2_t vs2, size_t vl);
vuint64m4_t __riscv_vfclass_v_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                         vfloat64m4_t vs2, size_t vl);
vuint64m8_t __riscv_vfclass_v_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                         vfloat64m8_t vs2, size_t vl);
// masked functions (`_mu` suffix): each takes a leading vboolN_t mask vm
// ahead of (vd, vs2, vl).
// NOTE(review): `_mu` presumably means tail-agnostic, mask-undisturbed —
// confirm against the RVV intrinsics policy naming.
vuint16mf4_t __riscv_vfclass_v_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                         vfloat16mf4_t vs2, size_t vl);
vuint16mf2_t __riscv_vfclass_v_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                         vfloat16mf2_t vs2, size_t vl);
vuint16m1_t __riscv_vfclass_v_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                       vfloat16m1_t vs2, size_t vl);
vuint16m2_t __riscv_vfclass_v_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                       vfloat16m2_t vs2, size_t vl);
vuint16m4_t __riscv_vfclass_v_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                       vfloat16m4_t vs2, size_t vl);
vuint16m8_t __riscv_vfclass_v_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                       vfloat16m8_t vs2, size_t vl);
vuint32mf2_t __riscv_vfclass_v_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                         vfloat32mf2_t vs2, size_t vl);
vuint32m1_t __riscv_vfclass_v_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                       vfloat32m1_t vs2, size_t vl);
vuint32m2_t __riscv_vfclass_v_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                       vfloat32m2_t vs2, size_t vl);
vuint32m4_t __riscv_vfclass_v_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                       vfloat32m4_t vs2, size_t vl);
vuint32m8_t __riscv_vfclass_v_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                       vfloat32m8_t vs2, size_t vl);
vuint64m1_t __riscv_vfclass_v_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                       vfloat64m1_t vs2, size_t vl);
vuint64m2_t __riscv_vfclass_v_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                       vfloat64m2_t vs2, size_t vl);
vuint64m4_t __riscv_vfclass_v_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                       vfloat64m4_t vs2, size_t vl);
vuint64m8_t __riscv_vfclass_v_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                       vfloat64m8_t vs2, size_t vl);

Vector Floating-Point Merge Intrinsics

// `_tu` merge forms, listed in pairs per float type and LMUL:
//   - vector-vector: spelled __riscv_vmerge_vvm_* (no `f` prefix), taking
//     (vd, vs2, vs1, v0, vl) with vs1 of the same vector type as vs2;
//   - vector-scalar: spelled __riscv_vfmerge_vfm_*, taking
//     (vd, vs2, rs1, v0, vl) with rs1 a _Float16, float or double scalar.
// v0 is the vboolN_t mask operand and is passed after the data operands.
// NOTE(review): `_tu` presumably means tail-undisturbed — confirm against the
// RVV intrinsics policy naming.
vfloat16mf4_t __riscv_vmerge_vvm_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                           vfloat16mf4_t vs1, vbool64_t v0,
                                           size_t vl);
vfloat16mf4_t __riscv_vfmerge_vfm_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                            _Float16 rs1, vbool64_t v0,
                                            size_t vl);
vfloat16mf2_t __riscv_vmerge_vvm_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                           vfloat16mf2_t vs1, vbool32_t v0,
                                           size_t vl);
vfloat16mf2_t __riscv_vfmerge_vfm_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                            _Float16 rs1, vbool32_t v0,
                                            size_t vl);
vfloat16m1_t __riscv_vmerge_vvm_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                         vfloat16m1_t vs1, vbool16_t v0,
                                         size_t vl);
vfloat16m1_t __riscv_vfmerge_vfm_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                          _Float16 rs1, vbool16_t v0,
                                          size_t vl);
vfloat16m2_t __riscv_vmerge_vvm_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                         vfloat16m2_t vs1, vbool8_t v0,
                                         size_t vl);
vfloat16m2_t __riscv_vfmerge_vfm_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                          _Float16 rs1, vbool8_t v0, size_t vl);
vfloat16m4_t __riscv_vmerge_vvm_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                         vfloat16m4_t vs1, vbool4_t v0,
                                         size_t vl);
vfloat16m4_t __riscv_vfmerge_vfm_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                          _Float16 rs1, vbool4_t v0, size_t vl);
vfloat16m8_t __riscv_vmerge_vvm_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                         vfloat16m8_t vs1, vbool2_t v0,
                                         size_t vl);
vfloat16m8_t __riscv_vfmerge_vfm_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                          _Float16 rs1, vbool2_t v0, size_t vl);
vfloat32mf2_t __riscv_vmerge_vvm_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                           vfloat32mf2_t vs1, vbool64_t v0,
                                           size_t vl);
vfloat32mf2_t __riscv_vfmerge_vfm_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                            float rs1, vbool64_t v0, size_t vl);
vfloat32m1_t __riscv_vmerge_vvm_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                         vfloat32m1_t vs1, vbool32_t v0,
                                         size_t vl);
vfloat32m1_t __riscv_vfmerge_vfm_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                          float rs1, vbool32_t v0, size_t vl);
vfloat32m2_t __riscv_vmerge_vvm_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                         vfloat32m2_t vs1, vbool16_t v0,
                                         size_t vl);
vfloat32m2_t __riscv_vfmerge_vfm_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                          float rs1, vbool16_t v0, size_t vl);
vfloat32m4_t __riscv_vmerge_vvm_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                         vfloat32m4_t vs1, vbool8_t v0,
                                         size_t vl);
vfloat32m4_t __riscv_vfmerge_vfm_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                          float rs1, vbool8_t v0, size_t vl);
vfloat32m8_t __riscv_vmerge_vvm_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                         vfloat32m8_t vs1, vbool4_t v0,
                                         size_t vl);
vfloat32m8_t __riscv_vfmerge_vfm_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                          float rs1, vbool4_t v0, size_t vl);
vfloat64m1_t __riscv_vmerge_vvm_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                         vfloat64m1_t vs1, vbool64_t v0,
                                         size_t vl);
vfloat64m1_t __riscv_vfmerge_vfm_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                          double rs1, vbool64_t v0, size_t vl);
vfloat64m2_t __riscv_vmerge_vvm_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                         vfloat64m2_t vs1, vbool32_t v0,
                                         size_t vl);
vfloat64m2_t __riscv_vfmerge_vfm_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                          double rs1, vbool32_t v0, size_t vl);
vfloat64m4_t __riscv_vmerge_vvm_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                         vfloat64m4_t vs1, vbool16_t v0,
                                         size_t vl);
vfloat64m4_t __riscv_vfmerge_vfm_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                          double rs1, vbool16_t v0, size_t vl);
vfloat64m8_t __riscv_vmerge_vvm_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                         vfloat64m8_t vs1, vbool8_t v0,
                                         size_t vl);
vfloat64m8_t __riscv_vfmerge_vfm_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                          double rs1, vbool8_t v0, size_t vl);

Vector Floating-Point Move Intrinsics

// `_tu` move forms, listed in pairs per float type and LMUL:
//   - vector source: spelled __riscv_vmv_v_v_* (no `f` prefix), taking
//     (vd, vs1, vl) with vs1 of the same vector type as the result;
//   - scalar source: spelled __riscv_vfmv_v_f_*, taking (vd, rs1, vl) with
//     rs1 a _Float16, float or double scalar.
// NOTE(review): `_tu` presumably means tail-undisturbed — confirm against the
// RVV intrinsics policy naming.
vfloat16mf4_t __riscv_vmv_v_v_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs1,
                                        size_t vl);
vfloat16mf4_t __riscv_vfmv_v_f_f16mf4_tu(vfloat16mf4_t vd, _Float16 rs1,
                                         size_t vl);
vfloat16mf2_t __riscv_vmv_v_v_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs1,
                                        size_t vl);
vfloat16mf2_t __riscv_vfmv_v_f_f16mf2_tu(vfloat16mf2_t vd, _Float16 rs1,
                                         size_t vl);
vfloat16m1_t __riscv_vmv_v_v_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                                      size_t vl);
vfloat16m1_t __riscv_vfmv_v_f_f16m1_tu(vfloat16m1_t vd, _Float16 rs1,
                                       size_t vl);
vfloat16m2_t __riscv_vmv_v_v_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                                      size_t vl);
vfloat16m2_t __riscv_vfmv_v_f_f16m2_tu(vfloat16m2_t vd, _Float16 rs1,
                                       size_t vl);
vfloat16m4_t __riscv_vmv_v_v_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                                      size_t vl);
vfloat16m4_t __riscv_vfmv_v_f_f16m4_tu(vfloat16m4_t vd, _Float16 rs1,
                                       size_t vl);
vfloat16m8_t __riscv_vmv_v_v_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                                      size_t vl);
vfloat16m8_t __riscv_vfmv_v_f_f16m8_tu(vfloat16m8_t vd, _Float16 rs1,
                                       size_t vl);
vfloat32mf2_t __riscv_vmv_v_v_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs1,
                                        size_t vl);
vfloat32mf2_t __riscv_vfmv_v_f_f32mf2_tu(vfloat32mf2_t vd, float rs1,
                                         size_t vl);
vfloat32m1_t __riscv_vmv_v_v_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                                      size_t vl);
vfloat32m1_t __riscv_vfmv_v_f_f32m1_tu(vfloat32m1_t vd, float rs1, size_t vl);
vfloat32m2_t __riscv_vmv_v_v_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                                      size_t vl);
vfloat32m2_t __riscv_vfmv_v_f_f32m2_tu(vfloat32m2_t vd, float rs1, size_t vl);
vfloat32m4_t __riscv_vmv_v_v_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                                      size_t vl);
vfloat32m4_t __riscv_vfmv_v_f_f32m4_tu(vfloat32m4_t vd, float rs1, size_t vl);
vfloat32m8_t __riscv_vmv_v_v_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                                      size_t vl);
vfloat32m8_t __riscv_vfmv_v_f_f32m8_tu(vfloat32m8_t vd, float rs1, size_t vl);
vfloat64m1_t __riscv_vmv_v_v_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                                      size_t vl);
vfloat64m1_t __riscv_vfmv_v_f_f64m1_tu(vfloat64m1_t vd, double rs1, size_t vl);
vfloat64m2_t __riscv_vmv_v_v_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                                      size_t vl);
vfloat64m2_t __riscv_vfmv_v_f_f64m2_tu(vfloat64m2_t vd, double rs1, size_t vl);
vfloat64m4_t __riscv_vmv_v_v_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                                      size_t vl);
vfloat64m4_t __riscv_vfmv_v_f_f64m4_tu(vfloat64m4_t vd, double rs1, size_t vl);
vfloat64m8_t __riscv_vmv_v_v_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                                      size_t vl);
vfloat64m8_t __riscv_vfmv_v_f_f64m8_tu(vfloat64m8_t vd, double rs1, size_t vl);

Single-Width Floating-Point/Integer Type-Convert Intrinsics

// `_tu` single-width conversions for 16-bit elements; every form takes
// (vd, vs2, vl), with vd of the result type. Order of the groups below:
//   1. vfcvt_x_f / vfcvt_rtz_x_f   : vfloat16 source -> vint16 result
//   2. vfcvt_xu_f / vfcvt_rtz_xu_f : vfloat16 source -> vuint16 result
//   3. vfcvt_f_x                   : vint16 source   -> vfloat16 result
//   4. vfcvt_f_xu                  : vuint16 source  -> vfloat16 result
// Source and result always share the same LMUL suffix. Only the
// float-to-integer directions have an `rtz` variant.
// NOTE(review): `rtz` presumably selects round-towards-zero and `_tu` the
// tail-undisturbed policy — confirm against the RVV specification.
vint16mf4_t __riscv_vfcvt_x_f_v_i16mf4_tu(vint16mf4_t vd, vfloat16mf4_t vs2,
                                          size_t vl);
vint16mf4_t __riscv_vfcvt_rtz_x_f_v_i16mf4_tu(vint16mf4_t vd, vfloat16mf4_t vs2,
                                              size_t vl);
vint16mf2_t __riscv_vfcvt_x_f_v_i16mf2_tu(vint16mf2_t vd, vfloat16mf2_t vs2,
                                          size_t vl);
vint16mf2_t __riscv_vfcvt_rtz_x_f_v_i16mf2_tu(vint16mf2_t vd, vfloat16mf2_t vs2,
                                              size_t vl);
vint16m1_t __riscv_vfcvt_x_f_v_i16m1_tu(vint16m1_t vd, vfloat16m1_t vs2,
                                        size_t vl);
vint16m1_t __riscv_vfcvt_rtz_x_f_v_i16m1_tu(vint16m1_t vd, vfloat16m1_t vs2,
                                            size_t vl);
vint16m2_t __riscv_vfcvt_x_f_v_i16m2_tu(vint16m2_t vd, vfloat16m2_t vs2,
                                        size_t vl);
vint16m2_t __riscv_vfcvt_rtz_x_f_v_i16m2_tu(vint16m2_t vd, vfloat16m2_t vs2,
                                            size_t vl);
vint16m4_t __riscv_vfcvt_x_f_v_i16m4_tu(vint16m4_t vd, vfloat16m4_t vs2,
                                        size_t vl);
vint16m4_t __riscv_vfcvt_rtz_x_f_v_i16m4_tu(vint16m4_t vd, vfloat16m4_t vs2,
                                            size_t vl);
vint16m8_t __riscv_vfcvt_x_f_v_i16m8_tu(vint16m8_t vd, vfloat16m8_t vs2,
                                        size_t vl);
vint16m8_t __riscv_vfcvt_rtz_x_f_v_i16m8_tu(vint16m8_t vd, vfloat16m8_t vs2,
                                            size_t vl);
vuint16mf4_t __riscv_vfcvt_xu_f_v_u16mf4_tu(vuint16mf4_t vd, vfloat16mf4_t vs2,
                                            size_t vl);
vuint16mf4_t __riscv_vfcvt_rtz_xu_f_v_u16mf4_tu(vuint16mf4_t vd,
                                                vfloat16mf4_t vs2, size_t vl);
vuint16mf2_t __riscv_vfcvt_xu_f_v_u16mf2_tu(vuint16mf2_t vd, vfloat16mf2_t vs2,
                                            size_t vl);
vuint16mf2_t __riscv_vfcvt_rtz_xu_f_v_u16mf2_tu(vuint16mf2_t vd,
                                                vfloat16mf2_t vs2, size_t vl);
vuint16m1_t __riscv_vfcvt_xu_f_v_u16m1_tu(vuint16m1_t vd, vfloat16m1_t vs2,
                                          size_t vl);
vuint16m1_t __riscv_vfcvt_rtz_xu_f_v_u16m1_tu(vuint16m1_t vd, vfloat16m1_t vs2,
                                              size_t vl);
vuint16m2_t __riscv_vfcvt_xu_f_v_u16m2_tu(vuint16m2_t vd, vfloat16m2_t vs2,
                                          size_t vl);
vuint16m2_t __riscv_vfcvt_rtz_xu_f_v_u16m2_tu(vuint16m2_t vd, vfloat16m2_t vs2,
                                              size_t vl);
vuint16m4_t __riscv_vfcvt_xu_f_v_u16m4_tu(vuint16m4_t vd, vfloat16m4_t vs2,
                                          size_t vl);
vuint16m4_t __riscv_vfcvt_rtz_xu_f_v_u16m4_tu(vuint16m4_t vd, vfloat16m4_t vs2,
                                              size_t vl);
vuint16m8_t __riscv_vfcvt_xu_f_v_u16m8_tu(vuint16m8_t vd, vfloat16m8_t vs2,
                                          size_t vl);
vuint16m8_t __riscv_vfcvt_rtz_xu_f_v_u16m8_tu(vuint16m8_t vd, vfloat16m8_t vs2,
                                              size_t vl);
vfloat16mf4_t __riscv_vfcvt_f_x_v_f16mf4_tu(vfloat16mf4_t vd, vint16mf4_t vs2,
                                            size_t vl);
vfloat16mf2_t __riscv_vfcvt_f_x_v_f16mf2_tu(vfloat16mf2_t vd, vint16mf2_t vs2,
                                            size_t vl);
vfloat16m1_t __riscv_vfcvt_f_x_v_f16m1_tu(vfloat16m1_t vd, vint16m1_t vs2,
                                          size_t vl);
vfloat16m2_t __riscv_vfcvt_f_x_v_f16m2_tu(vfloat16m2_t vd, vint16m2_t vs2,
                                          size_t vl);
vfloat16m4_t __riscv_vfcvt_f_x_v_f16m4_tu(vfloat16m4_t vd, vint16m4_t vs2,
                                          size_t vl);
vfloat16m8_t __riscv_vfcvt_f_x_v_f16m8_tu(vfloat16m8_t vd, vint16m8_t vs2,
                                          size_t vl);
vfloat16mf4_t __riscv_vfcvt_f_xu_v_f16mf4_tu(vfloat16mf4_t vd, vuint16mf4_t vs2,
                                             size_t vl);
vfloat16mf2_t __riscv_vfcvt_f_xu_v_f16mf2_tu(vfloat16mf2_t vd, vuint16mf2_t vs2,
                                             size_t vl);
vfloat16m1_t __riscv_vfcvt_f_xu_v_f16m1_tu(vfloat16m1_t vd, vuint16m1_t vs2,
                                           size_t vl);
vfloat16m2_t __riscv_vfcvt_f_xu_v_f16m2_tu(vfloat16m2_t vd, vuint16m2_t vs2,
                                           size_t vl);
vfloat16m4_t __riscv_vfcvt_f_xu_v_f16m4_tu(vfloat16m4_t vd, vuint16m4_t vs2,
                                           size_t vl);
vfloat16m8_t __riscv_vfcvt_f_xu_v_f16m8_tu(vfloat16m8_t vd, vuint16m8_t vs2,
                                           size_t vl);
// `_tu` single-width conversions for 32-bit elements; every form takes
// (vd, vs2, vl), with vd of the result type. Order of the groups below:
//   1. vfcvt_x_f / vfcvt_rtz_x_f   : vfloat32 source -> vint32 result
//   2. vfcvt_xu_f / vfcvt_rtz_xu_f : vfloat32 source -> vuint32 result
//   3. vfcvt_f_x                   : vint32 source   -> vfloat32 result
//   4. vfcvt_f_xu                  : vuint32 source  -> vfloat32 result
// Source and result always share the same LMUL suffix. Only the
// float-to-integer directions have an `rtz` variant.
// NOTE(review): `rtz` presumably selects round-towards-zero and `_tu` the
// tail-undisturbed policy — confirm against the RVV specification.
vint32mf2_t __riscv_vfcvt_x_f_v_i32mf2_tu(vint32mf2_t vd, vfloat32mf2_t vs2,
                                          size_t vl);
vint32mf2_t __riscv_vfcvt_rtz_x_f_v_i32mf2_tu(vint32mf2_t vd, vfloat32mf2_t vs2,
                                              size_t vl);
vint32m1_t __riscv_vfcvt_x_f_v_i32m1_tu(vint32m1_t vd, vfloat32m1_t vs2,
                                        size_t vl);
vint32m1_t __riscv_vfcvt_rtz_x_f_v_i32m1_tu(vint32m1_t vd, vfloat32m1_t vs2,
                                            size_t vl);
vint32m2_t __riscv_vfcvt_x_f_v_i32m2_tu(vint32m2_t vd, vfloat32m2_t vs2,
                                        size_t vl);
vint32m2_t __riscv_vfcvt_rtz_x_f_v_i32m2_tu(vint32m2_t vd, vfloat32m2_t vs2,
                                            size_t vl);
vint32m4_t __riscv_vfcvt_x_f_v_i32m4_tu(vint32m4_t vd, vfloat32m4_t vs2,
                                        size_t vl);
vint32m4_t __riscv_vfcvt_rtz_x_f_v_i32m4_tu(vint32m4_t vd, vfloat32m4_t vs2,
                                            size_t vl);
vint32m8_t __riscv_vfcvt_x_f_v_i32m8_tu(vint32m8_t vd, vfloat32m8_t vs2,
                                        size_t vl);
vint32m8_t __riscv_vfcvt_rtz_x_f_v_i32m8_tu(vint32m8_t vd, vfloat32m8_t vs2,
                                            size_t vl);
vuint32mf2_t __riscv_vfcvt_xu_f_v_u32mf2_tu(vuint32mf2_t vd, vfloat32mf2_t vs2,
                                            size_t vl);
vuint32mf2_t __riscv_vfcvt_rtz_xu_f_v_u32mf2_tu(vuint32mf2_t vd,
                                                vfloat32mf2_t vs2, size_t vl);
vuint32m1_t __riscv_vfcvt_xu_f_v_u32m1_tu(vuint32m1_t vd, vfloat32m1_t vs2,
                                          size_t vl);
vuint32m1_t __riscv_vfcvt_rtz_xu_f_v_u32m1_tu(vuint32m1_t vd, vfloat32m1_t vs2,
                                              size_t vl);
vuint32m2_t __riscv_vfcvt_xu_f_v_u32m2_tu(vuint32m2_t vd, vfloat32m2_t vs2,
                                          size_t vl);
vuint32m2_t __riscv_vfcvt_rtz_xu_f_v_u32m2_tu(vuint32m2_t vd, vfloat32m2_t vs2,
                                              size_t vl);
vuint32m4_t __riscv_vfcvt_xu_f_v_u32m4_tu(vuint32m4_t vd, vfloat32m4_t vs2,
                                          size_t vl);
vuint32m4_t __riscv_vfcvt_rtz_xu_f_v_u32m4_tu(vuint32m4_t vd, vfloat32m4_t vs2,
                                              size_t vl);
vuint32m8_t __riscv_vfcvt_xu_f_v_u32m8_tu(vuint32m8_t vd, vfloat32m8_t vs2,
                                          size_t vl);
vuint32m8_t __riscv_vfcvt_rtz_xu_f_v_u32m8_tu(vuint32m8_t vd, vfloat32m8_t vs2,
                                              size_t vl);
vfloat32mf2_t __riscv_vfcvt_f_x_v_f32mf2_tu(vfloat32mf2_t vd, vint32mf2_t vs2,
                                            size_t vl);
vfloat32m1_t __riscv_vfcvt_f_x_v_f32m1_tu(vfloat32m1_t vd, vint32m1_t vs2,
                                          size_t vl);
vfloat32m2_t __riscv_vfcvt_f_x_v_f32m2_tu(vfloat32m2_t vd, vint32m2_t vs2,
                                          size_t vl);
vfloat32m4_t __riscv_vfcvt_f_x_v_f32m4_tu(vfloat32m4_t vd, vint32m4_t vs2,
                                          size_t vl);
vfloat32m8_t __riscv_vfcvt_f_x_v_f32m8_tu(vfloat32m8_t vd, vint32m8_t vs2,
                                          size_t vl);
vfloat32mf2_t __riscv_vfcvt_f_xu_v_f32mf2_tu(vfloat32mf2_t vd, vuint32mf2_t vs2,
                                             size_t vl);
vfloat32m1_t __riscv_vfcvt_f_xu_v_f32m1_tu(vfloat32m1_t vd, vuint32m1_t vs2,
                                           size_t vl);
vfloat32m2_t __riscv_vfcvt_f_xu_v_f32m2_tu(vfloat32m2_t vd, vuint32m2_t vs2,
                                           size_t vl);
vfloat32m4_t __riscv_vfcvt_f_xu_v_f32m4_tu(vfloat32m4_t vd, vuint32m4_t vs2,
                                           size_t vl);
vfloat32m8_t __riscv_vfcvt_f_xu_v_f32m8_tu(vfloat32m8_t vd, vuint32m8_t vs2,
                                           size_t vl);
// `_tu` single-width conversions for 64-bit elements; every form takes
// (vd, vs2, vl), with vd of the result type. Order of the groups below:
//   1. vfcvt_x_f / vfcvt_rtz_x_f   : vfloat64 source -> vint64 result
//   2. vfcvt_xu_f / vfcvt_rtz_xu_f : vfloat64 source -> vuint64 result
//   3. vfcvt_f_x                   : vint64 source   -> vfloat64 result
//   4. vfcvt_f_xu                  : vuint64 source  -> vfloat64 result
// Source and result always share the same LMUL suffix (m1..m8; no fractional
// LMUL is listed for 64-bit elements). Only the float-to-integer directions
// have an `rtz` variant.
// NOTE(review): `rtz` presumably selects round-towards-zero and `_tu` the
// tail-undisturbed policy — confirm against the RVV specification.
vint64m1_t __riscv_vfcvt_x_f_v_i64m1_tu(vint64m1_t vd, vfloat64m1_t vs2,
                                        size_t vl);
vint64m1_t __riscv_vfcvt_rtz_x_f_v_i64m1_tu(vint64m1_t vd, vfloat64m1_t vs2,
                                            size_t vl);
vint64m2_t __riscv_vfcvt_x_f_v_i64m2_tu(vint64m2_t vd, vfloat64m2_t vs2,
                                        size_t vl);
vint64m2_t __riscv_vfcvt_rtz_x_f_v_i64m2_tu(vint64m2_t vd, vfloat64m2_t vs2,
                                            size_t vl);
vint64m4_t __riscv_vfcvt_x_f_v_i64m4_tu(vint64m4_t vd, vfloat64m4_t vs2,
                                        size_t vl);
vint64m4_t __riscv_vfcvt_rtz_x_f_v_i64m4_tu(vint64m4_t vd, vfloat64m4_t vs2,
                                            size_t vl);
vint64m8_t __riscv_vfcvt_x_f_v_i64m8_tu(vint64m8_t vd, vfloat64m8_t vs2,
                                        size_t vl);
vint64m8_t __riscv_vfcvt_rtz_x_f_v_i64m8_tu(vint64m8_t vd, vfloat64m8_t vs2,
                                            size_t vl);
vuint64m1_t __riscv_vfcvt_xu_f_v_u64m1_tu(vuint64m1_t vd, vfloat64m1_t vs2,
                                          size_t vl);
vuint64m1_t __riscv_vfcvt_rtz_xu_f_v_u64m1_tu(vuint64m1_t vd, vfloat64m1_t vs2,
                                              size_t vl);
vuint64m2_t __riscv_vfcvt_xu_f_v_u64m2_tu(vuint64m2_t vd, vfloat64m2_t vs2,
                                          size_t vl);
vuint64m2_t __riscv_vfcvt_rtz_xu_f_v_u64m2_tu(vuint64m2_t vd, vfloat64m2_t vs2,
                                              size_t vl);
vuint64m4_t __riscv_vfcvt_xu_f_v_u64m4_tu(vuint64m4_t vd, vfloat64m4_t vs2,
                                          size_t vl);
vuint64m4_t __riscv_vfcvt_rtz_xu_f_v_u64m4_tu(vuint64m4_t vd, vfloat64m4_t vs2,
                                              size_t vl);
vuint64m8_t __riscv_vfcvt_xu_f_v_u64m8_tu(vuint64m8_t vd, vfloat64m8_t vs2,
                                          size_t vl);
vuint64m8_t __riscv_vfcvt_rtz_xu_f_v_u64m8_tu(vuint64m8_t vd, vfloat64m8_t vs2,
                                              size_t vl);
vfloat64m1_t __riscv_vfcvt_f_x_v_f64m1_tu(vfloat64m1_t vd, vint64m1_t vs2,
                                          size_t vl);
vfloat64m2_t __riscv_vfcvt_f_x_v_f64m2_tu(vfloat64m2_t vd, vint64m2_t vs2,
                                          size_t vl);
vfloat64m4_t __riscv_vfcvt_f_x_v_f64m4_tu(vfloat64m4_t vd, vint64m4_t vs2,
                                          size_t vl);
vfloat64m8_t __riscv_vfcvt_f_x_v_f64m8_tu(vfloat64m8_t vd, vint64m8_t vs2,
                                          size_t vl);
vfloat64m1_t __riscv_vfcvt_f_xu_v_f64m1_tu(vfloat64m1_t vd, vuint64m1_t vs2,
                                           size_t vl);
vfloat64m2_t __riscv_vfcvt_f_xu_v_f64m2_tu(vfloat64m2_t vd, vuint64m2_t vs2,
                                           size_t vl);
vfloat64m4_t __riscv_vfcvt_f_xu_v_f64m4_tu(vfloat64m4_t vd, vuint64m4_t vs2,
                                           size_t vl);
vfloat64m8_t __riscv_vfcvt_f_xu_v_f64m8_tu(vfloat64m8_t vd, vuint64m8_t vs2,
                                           size_t vl);
// masked functions, _tum variants (per the RVV intrinsics naming scheme:
// tail undisturbed, mask agnostic). Each takes the mask `vm` first, then `vd`.
// vfloat16 -> vint16 conversions; _rtz_ forms round towards zero.
vint16mf4_t __riscv_vfcvt_x_f_v_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                           vfloat16mf4_t vs2, size_t vl);
vint16mf4_t __riscv_vfcvt_rtz_x_f_v_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                               vfloat16mf4_t vs2, size_t vl);
vint16mf2_t __riscv_vfcvt_x_f_v_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                           vfloat16mf2_t vs2, size_t vl);
vint16mf2_t __riscv_vfcvt_rtz_x_f_v_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                               vfloat16mf2_t vs2, size_t vl);
vint16m1_t __riscv_vfcvt_x_f_v_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                         vfloat16m1_t vs2, size_t vl);
vint16m1_t __riscv_vfcvt_rtz_x_f_v_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                             vfloat16m1_t vs2, size_t vl);
vint16m2_t __riscv_vfcvt_x_f_v_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                         vfloat16m2_t vs2, size_t vl);
vint16m2_t __riscv_vfcvt_rtz_x_f_v_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                             vfloat16m2_t vs2, size_t vl);
vint16m4_t __riscv_vfcvt_x_f_v_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                         vfloat16m4_t vs2, size_t vl);
vint16m4_t __riscv_vfcvt_rtz_x_f_v_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                             vfloat16m4_t vs2, size_t vl);
vint16m8_t __riscv_vfcvt_x_f_v_i16m8_tum(vbool2_t vm, vint16m8_t vd,
                                         vfloat16m8_t vs2, size_t vl);
vint16m8_t __riscv_vfcvt_rtz_x_f_v_i16m8_tum(vbool2_t vm, vint16m8_t vd,
                                             vfloat16m8_t vs2, size_t vl);
// vfloat16 -> vuint16 conversions (_tum); _rtz_ forms round towards zero.
vuint16mf4_t __riscv_vfcvt_xu_f_v_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                             vfloat16mf4_t vs2, size_t vl);
vuint16mf4_t __riscv_vfcvt_rtz_xu_f_v_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                                 vfloat16mf4_t vs2, size_t vl);
vuint16mf2_t __riscv_vfcvt_xu_f_v_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                             vfloat16mf2_t vs2, size_t vl);
vuint16mf2_t __riscv_vfcvt_rtz_xu_f_v_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                                 vfloat16mf2_t vs2, size_t vl);
vuint16m1_t __riscv_vfcvt_xu_f_v_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                           vfloat16m1_t vs2, size_t vl);
vuint16m1_t __riscv_vfcvt_rtz_xu_f_v_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                               vfloat16m1_t vs2, size_t vl);
vuint16m2_t __riscv_vfcvt_xu_f_v_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                           vfloat16m2_t vs2, size_t vl);
vuint16m2_t __riscv_vfcvt_rtz_xu_f_v_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                               vfloat16m2_t vs2, size_t vl);
vuint16m4_t __riscv_vfcvt_xu_f_v_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                           vfloat16m4_t vs2, size_t vl);
vuint16m4_t __riscv_vfcvt_rtz_xu_f_v_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                               vfloat16m4_t vs2, size_t vl);
vuint16m8_t __riscv_vfcvt_xu_f_v_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                           vfloat16m8_t vs2, size_t vl);
vuint16m8_t __riscv_vfcvt_rtz_xu_f_v_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                               vfloat16m8_t vs2, size_t vl);
// vint16 -> vfloat16 conversions (_tum).
vfloat16mf4_t __riscv_vfcvt_f_x_v_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                             vint16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfcvt_f_x_v_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                             vint16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfcvt_f_x_v_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                           vint16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfcvt_f_x_v_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                           vint16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfcvt_f_x_v_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                           vint16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfcvt_f_x_v_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                           vint16m8_t vs2, size_t vl);
// vuint16 -> vfloat16 conversions (_tum).
vfloat16mf4_t __riscv_vfcvt_f_xu_v_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                              vuint16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfcvt_f_xu_v_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                              vuint16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfcvt_f_xu_v_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                            vuint16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfcvt_f_xu_v_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                            vuint16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfcvt_f_xu_v_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                            vuint16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfcvt_f_xu_v_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                            vuint16m8_t vs2, size_t vl);
// vfloat32 -> vint32 conversions, masked _tum variants; _rtz_ forms round
// towards zero.
vint32mf2_t __riscv_vfcvt_x_f_v_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                           vfloat32mf2_t vs2, size_t vl);
vint32mf2_t __riscv_vfcvt_rtz_x_f_v_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                               vfloat32mf2_t vs2, size_t vl);
vint32m1_t __riscv_vfcvt_x_f_v_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                         vfloat32m1_t vs2, size_t vl);
vint32m1_t __riscv_vfcvt_rtz_x_f_v_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                             vfloat32m1_t vs2, size_t vl);
vint32m2_t __riscv_vfcvt_x_f_v_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                         vfloat32m2_t vs2, size_t vl);
vint32m2_t __riscv_vfcvt_rtz_x_f_v_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                             vfloat32m2_t vs2, size_t vl);
vint32m4_t __riscv_vfcvt_x_f_v_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                         vfloat32m4_t vs2, size_t vl);
vint32m4_t __riscv_vfcvt_rtz_x_f_v_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                             vfloat32m4_t vs2, size_t vl);
vint32m8_t __riscv_vfcvt_x_f_v_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                         vfloat32m8_t vs2, size_t vl);
vint32m8_t __riscv_vfcvt_rtz_x_f_v_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                             vfloat32m8_t vs2, size_t vl);
// vfloat32 -> vuint32 conversions (_tum); _rtz_ forms round towards zero.
vuint32mf2_t __riscv_vfcvt_xu_f_v_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                             vfloat32mf2_t vs2, size_t vl);
vuint32mf2_t __riscv_vfcvt_rtz_xu_f_v_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                                 vfloat32mf2_t vs2, size_t vl);
vuint32m1_t __riscv_vfcvt_xu_f_v_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                           vfloat32m1_t vs2, size_t vl);
vuint32m1_t __riscv_vfcvt_rtz_xu_f_v_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                               vfloat32m1_t vs2, size_t vl);
vuint32m2_t __riscv_vfcvt_xu_f_v_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                           vfloat32m2_t vs2, size_t vl);
vuint32m2_t __riscv_vfcvt_rtz_xu_f_v_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                               vfloat32m2_t vs2, size_t vl);
vuint32m4_t __riscv_vfcvt_xu_f_v_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                           vfloat32m4_t vs2, size_t vl);
vuint32m4_t __riscv_vfcvt_rtz_xu_f_v_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                               vfloat32m4_t vs2, size_t vl);
vuint32m8_t __riscv_vfcvt_xu_f_v_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                           vfloat32m8_t vs2, size_t vl);
vuint32m8_t __riscv_vfcvt_rtz_xu_f_v_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                               vfloat32m8_t vs2, size_t vl);
// vint32 -> vfloat32 conversions (_tum).
vfloat32mf2_t __riscv_vfcvt_f_x_v_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                             vint32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfcvt_f_x_v_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                           vint32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfcvt_f_x_v_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                           vint32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfcvt_f_x_v_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                           vint32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfcvt_f_x_v_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                           vint32m8_t vs2, size_t vl);
// vuint32 -> vfloat32 conversions (_tum).
vfloat32mf2_t __riscv_vfcvt_f_xu_v_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                              vuint32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfcvt_f_xu_v_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                            vuint32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfcvt_f_xu_v_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                            vuint32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfcvt_f_xu_v_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                            vuint32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfcvt_f_xu_v_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                            vuint32m8_t vs2, size_t vl);
// vfloat64 -> vint64 conversions, masked _tum variants; _rtz_ forms round
// towards zero.
vint64m1_t __riscv_vfcvt_x_f_v_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                         vfloat64m1_t vs2, size_t vl);
vint64m1_t __riscv_vfcvt_rtz_x_f_v_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                             vfloat64m1_t vs2, size_t vl);
vint64m2_t __riscv_vfcvt_x_f_v_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                         vfloat64m2_t vs2, size_t vl);
vint64m2_t __riscv_vfcvt_rtz_x_f_v_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                             vfloat64m2_t vs2, size_t vl);
vint64m4_t __riscv_vfcvt_x_f_v_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                         vfloat64m4_t vs2, size_t vl);
vint64m4_t __riscv_vfcvt_rtz_x_f_v_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                             vfloat64m4_t vs2, size_t vl);
vint64m8_t __riscv_vfcvt_x_f_v_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                         vfloat64m8_t vs2, size_t vl);
vint64m8_t __riscv_vfcvt_rtz_x_f_v_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                             vfloat64m8_t vs2, size_t vl);
// vfloat64 -> vuint64 conversions (_tum); _rtz_ forms round towards zero.
vuint64m1_t __riscv_vfcvt_xu_f_v_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                           vfloat64m1_t vs2, size_t vl);
vuint64m1_t __riscv_vfcvt_rtz_xu_f_v_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                               vfloat64m1_t vs2, size_t vl);
vuint64m2_t __riscv_vfcvt_xu_f_v_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                           vfloat64m2_t vs2, size_t vl);
vuint64m2_t __riscv_vfcvt_rtz_xu_f_v_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                               vfloat64m2_t vs2, size_t vl);
vuint64m4_t __riscv_vfcvt_xu_f_v_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                           vfloat64m4_t vs2, size_t vl);
vuint64m4_t __riscv_vfcvt_rtz_xu_f_v_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                               vfloat64m4_t vs2, size_t vl);
vuint64m8_t __riscv_vfcvt_xu_f_v_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                           vfloat64m8_t vs2, size_t vl);
vuint64m8_t __riscv_vfcvt_rtz_xu_f_v_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                               vfloat64m8_t vs2, size_t vl);
// vint64 -> vfloat64 conversions (_tum).
vfloat64m1_t __riscv_vfcvt_f_x_v_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                           vint64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfcvt_f_x_v_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                           vint64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfcvt_f_x_v_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                           vint64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfcvt_f_x_v_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                           vint64m8_t vs2, size_t vl);
// vuint64 -> vfloat64 conversions (_tum).
vfloat64m1_t __riscv_vfcvt_f_xu_v_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                            vuint64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfcvt_f_xu_v_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                            vuint64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfcvt_f_xu_v_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                            vuint64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfcvt_f_xu_v_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                            vuint64m8_t vs2, size_t vl);
// masked functions, _tumu variants (per the RVV intrinsics naming scheme:
// tail undisturbed, mask undisturbed). Each takes the mask `vm` first, then
// `vd`.
// vfloat16 -> vint16 conversions; _rtz_ forms round towards zero.
vint16mf4_t __riscv_vfcvt_x_f_v_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                            vfloat16mf4_t vs2, size_t vl);
vint16mf4_t __riscv_vfcvt_rtz_x_f_v_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                                vfloat16mf4_t vs2, size_t vl);
vint16mf2_t __riscv_vfcvt_x_f_v_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                            vfloat16mf2_t vs2, size_t vl);
vint16mf2_t __riscv_vfcvt_rtz_x_f_v_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                                vfloat16mf2_t vs2, size_t vl);
vint16m1_t __riscv_vfcvt_x_f_v_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                          vfloat16m1_t vs2, size_t vl);
vint16m1_t __riscv_vfcvt_rtz_x_f_v_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                              vfloat16m1_t vs2, size_t vl);
vint16m2_t __riscv_vfcvt_x_f_v_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                          vfloat16m2_t vs2, size_t vl);
vint16m2_t __riscv_vfcvt_rtz_x_f_v_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                              vfloat16m2_t vs2, size_t vl);
vint16m4_t __riscv_vfcvt_x_f_v_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                          vfloat16m4_t vs2, size_t vl);
vint16m4_t __riscv_vfcvt_rtz_x_f_v_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                              vfloat16m4_t vs2, size_t vl);
vint16m8_t __riscv_vfcvt_x_f_v_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                          vfloat16m8_t vs2, size_t vl);
vint16m8_t __riscv_vfcvt_rtz_x_f_v_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                              vfloat16m8_t vs2, size_t vl);
// vfloat16 -> vuint16 conversions (_tumu); _rtz_ forms round towards zero.
vuint16mf4_t __riscv_vfcvt_xu_f_v_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                              vfloat16mf4_t vs2, size_t vl);
vuint16mf4_t __riscv_vfcvt_rtz_xu_f_v_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                                  vfloat16mf4_t vs2, size_t vl);
vuint16mf2_t __riscv_vfcvt_xu_f_v_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                              vfloat16mf2_t vs2, size_t vl);
vuint16mf2_t __riscv_vfcvt_rtz_xu_f_v_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                                  vfloat16mf2_t vs2, size_t vl);
vuint16m1_t __riscv_vfcvt_xu_f_v_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                            vfloat16m1_t vs2, size_t vl);
vuint16m1_t __riscv_vfcvt_rtz_xu_f_v_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                                vfloat16m1_t vs2, size_t vl);
vuint16m2_t __riscv_vfcvt_xu_f_v_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                            vfloat16m2_t vs2, size_t vl);
vuint16m2_t __riscv_vfcvt_rtz_xu_f_v_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                                vfloat16m2_t vs2, size_t vl);
vuint16m4_t __riscv_vfcvt_xu_f_v_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                            vfloat16m4_t vs2, size_t vl);
vuint16m4_t __riscv_vfcvt_rtz_xu_f_v_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                                vfloat16m4_t vs2, size_t vl);
vuint16m8_t __riscv_vfcvt_xu_f_v_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                            vfloat16m8_t vs2, size_t vl);
vuint16m8_t __riscv_vfcvt_rtz_xu_f_v_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                                vfloat16m8_t vs2, size_t vl);
// vint16 -> vfloat16 conversions (_tumu).
vfloat16mf4_t __riscv_vfcvt_f_x_v_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                              vint16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfcvt_f_x_v_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                              vint16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfcvt_f_x_v_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                            vint16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfcvt_f_x_v_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                            vint16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfcvt_f_x_v_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                            vint16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfcvt_f_x_v_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                            vint16m8_t vs2, size_t vl);
// vuint16 -> vfloat16 conversions (_tumu).
vfloat16mf4_t __riscv_vfcvt_f_xu_v_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                               vuint16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfcvt_f_xu_v_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                               vuint16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfcvt_f_xu_v_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                             vuint16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfcvt_f_xu_v_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                             vuint16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfcvt_f_xu_v_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                             vuint16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfcvt_f_xu_v_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                             vuint16m8_t vs2, size_t vl);
// vfloat32 -> vint32 conversions, masked _tumu variants; _rtz_ forms round
// towards zero.
vint32mf2_t __riscv_vfcvt_x_f_v_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                            vfloat32mf2_t vs2, size_t vl);
vint32mf2_t __riscv_vfcvt_rtz_x_f_v_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                                vfloat32mf2_t vs2, size_t vl);
vint32m1_t __riscv_vfcvt_x_f_v_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                          vfloat32m1_t vs2, size_t vl);
vint32m1_t __riscv_vfcvt_rtz_x_f_v_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                              vfloat32m1_t vs2, size_t vl);
vint32m2_t __riscv_vfcvt_x_f_v_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                          vfloat32m2_t vs2, size_t vl);
vint32m2_t __riscv_vfcvt_rtz_x_f_v_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                              vfloat32m2_t vs2, size_t vl);
vint32m4_t __riscv_vfcvt_x_f_v_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                          vfloat32m4_t vs2, size_t vl);
vint32m4_t __riscv_vfcvt_rtz_x_f_v_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                              vfloat32m4_t vs2, size_t vl);
vint32m8_t __riscv_vfcvt_x_f_v_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                          vfloat32m8_t vs2, size_t vl);
vint32m8_t __riscv_vfcvt_rtz_x_f_v_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                              vfloat32m8_t vs2, size_t vl);
// vfloat32 -> vuint32 conversions (_tumu); _rtz_ forms round towards zero.
vuint32mf2_t __riscv_vfcvt_xu_f_v_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                              vfloat32mf2_t vs2, size_t vl);
vuint32mf2_t __riscv_vfcvt_rtz_xu_f_v_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                                  vfloat32mf2_t vs2, size_t vl);
vuint32m1_t __riscv_vfcvt_xu_f_v_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                            vfloat32m1_t vs2, size_t vl);
vuint32m1_t __riscv_vfcvt_rtz_xu_f_v_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                                vfloat32m1_t vs2, size_t vl);
vuint32m2_t __riscv_vfcvt_xu_f_v_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                            vfloat32m2_t vs2, size_t vl);
vuint32m2_t __riscv_vfcvt_rtz_xu_f_v_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                                vfloat32m2_t vs2, size_t vl);
vuint32m4_t __riscv_vfcvt_xu_f_v_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                            vfloat32m4_t vs2, size_t vl);
vuint32m4_t __riscv_vfcvt_rtz_xu_f_v_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                                vfloat32m4_t vs2, size_t vl);
vuint32m8_t __riscv_vfcvt_xu_f_v_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                            vfloat32m8_t vs2, size_t vl);
vuint32m8_t __riscv_vfcvt_rtz_xu_f_v_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                                vfloat32m8_t vs2, size_t vl);
// vint32 -> vfloat32 conversions (_tumu).
vfloat32mf2_t __riscv_vfcvt_f_x_v_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                              vint32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfcvt_f_x_v_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                            vint32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfcvt_f_x_v_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                            vint32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfcvt_f_x_v_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                            vint32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfcvt_f_x_v_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                            vint32m8_t vs2, size_t vl);
// vuint32 -> vfloat32 conversions (_tumu).
vfloat32mf2_t __riscv_vfcvt_f_xu_v_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                               vuint32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfcvt_f_xu_v_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                             vuint32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfcvt_f_xu_v_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                             vuint32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfcvt_f_xu_v_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                             vuint32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfcvt_f_xu_v_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                             vuint32m8_t vs2, size_t vl);
// vfloat64 -> vint64 conversions, masked _tumu variants; _rtz_ forms round
// towards zero.
vint64m1_t __riscv_vfcvt_x_f_v_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                          vfloat64m1_t vs2, size_t vl);
vint64m1_t __riscv_vfcvt_rtz_x_f_v_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                              vfloat64m1_t vs2, size_t vl);
vint64m2_t __riscv_vfcvt_x_f_v_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                          vfloat64m2_t vs2, size_t vl);
vint64m2_t __riscv_vfcvt_rtz_x_f_v_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                              vfloat64m2_t vs2, size_t vl);
vint64m4_t __riscv_vfcvt_x_f_v_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                          vfloat64m4_t vs2, size_t vl);
vint64m4_t __riscv_vfcvt_rtz_x_f_v_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                              vfloat64m4_t vs2, size_t vl);
vint64m8_t __riscv_vfcvt_x_f_v_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                          vfloat64m8_t vs2, size_t vl);
vint64m8_t __riscv_vfcvt_rtz_x_f_v_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                              vfloat64m8_t vs2, size_t vl);
// vfloat64 -> vuint64 conversions (_tumu); _rtz_ forms round towards zero.
vuint64m1_t __riscv_vfcvt_xu_f_v_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                            vfloat64m1_t vs2, size_t vl);
vuint64m1_t __riscv_vfcvt_rtz_xu_f_v_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                                vfloat64m1_t vs2, size_t vl);
vuint64m2_t __riscv_vfcvt_xu_f_v_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                            vfloat64m2_t vs2, size_t vl);
vuint64m2_t __riscv_vfcvt_rtz_xu_f_v_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                                vfloat64m2_t vs2, size_t vl);
vuint64m4_t __riscv_vfcvt_xu_f_v_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                            vfloat64m4_t vs2, size_t vl);
vuint64m4_t __riscv_vfcvt_rtz_xu_f_v_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                                vfloat64m4_t vs2, size_t vl);
vuint64m8_t __riscv_vfcvt_xu_f_v_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                            vfloat64m8_t vs2, size_t vl);
vuint64m8_t __riscv_vfcvt_rtz_xu_f_v_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                                vfloat64m8_t vs2, size_t vl);
// vint64 -> vfloat64 conversions (_tumu).
vfloat64m1_t __riscv_vfcvt_f_x_v_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                            vint64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfcvt_f_x_v_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                            vint64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfcvt_f_x_v_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                            vint64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfcvt_f_x_v_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                            vint64m8_t vs2, size_t vl);
// vuint64 -> vfloat64 conversions (_tumu).
vfloat64m1_t __riscv_vfcvt_f_xu_v_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                             vuint64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfcvt_f_xu_v_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                             vuint64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfcvt_f_xu_v_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                             vuint64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfcvt_f_xu_v_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                             vuint64m8_t vs2, size_t vl);
// masked functions: `_mu` policy variants, 16-bit elements.
// Signature shape: (vm, vd, vs2, vl); the mask type is vbool<N>_t with
// N = SEW / LMUL (i16mf4 -> vbool64_t, i16m8 -> vbool2_t).
// NOTE(review): `_mu` presumably means mask-undisturbed (tail-agnostic), with
// `vd` supplying the values kept in masked-off elements -- confirm against the
// intrinsics policy naming rules.
//
// 16-bit float -> signed integer (vfloat16* -> vint16*). Each LMUL has a plain
// form and an `rtz` form.
// NOTE(review): `rtz` presumably selects the vfcvt.rtz.* (round-toward-zero)
// instruction instead of the dynamic rounding mode -- confirm against the
// RISC-V V specification.
vint16mf4_t __riscv_vfcvt_x_f_v_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                          vfloat16mf4_t vs2, size_t vl);
vint16mf4_t __riscv_vfcvt_rtz_x_f_v_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                              vfloat16mf4_t vs2, size_t vl);
vint16mf2_t __riscv_vfcvt_x_f_v_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                          vfloat16mf2_t vs2, size_t vl);
vint16mf2_t __riscv_vfcvt_rtz_x_f_v_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                              vfloat16mf2_t vs2, size_t vl);
vint16m1_t __riscv_vfcvt_x_f_v_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                        vfloat16m1_t vs2, size_t vl);
vint16m1_t __riscv_vfcvt_rtz_x_f_v_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                            vfloat16m1_t vs2, size_t vl);
vint16m2_t __riscv_vfcvt_x_f_v_i16m2_mu(vbool8_t vm, vint16m2_t vd,
                                        vfloat16m2_t vs2, size_t vl);
vint16m2_t __riscv_vfcvt_rtz_x_f_v_i16m2_mu(vbool8_t vm, vint16m2_t vd,
                                            vfloat16m2_t vs2, size_t vl);
vint16m4_t __riscv_vfcvt_x_f_v_i16m4_mu(vbool4_t vm, vint16m4_t vd,
                                        vfloat16m4_t vs2, size_t vl);
vint16m4_t __riscv_vfcvt_rtz_x_f_v_i16m4_mu(vbool4_t vm, vint16m4_t vd,
                                            vfloat16m4_t vs2, size_t vl);
vint16m8_t __riscv_vfcvt_x_f_v_i16m8_mu(vbool2_t vm, vint16m8_t vd,
                                        vfloat16m8_t vs2, size_t vl);
vint16m8_t __riscv_vfcvt_rtz_x_f_v_i16m8_mu(vbool2_t vm, vint16m8_t vd,
                                            vfloat16m8_t vs2, size_t vl);
// 16-bit float -> unsigned integer (vfloat16* -> vuint16*), plain and `rtz`
// forms.
vuint16mf4_t __riscv_vfcvt_xu_f_v_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                            vfloat16mf4_t vs2, size_t vl);
vuint16mf4_t __riscv_vfcvt_rtz_xu_f_v_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                                vfloat16mf4_t vs2, size_t vl);
vuint16mf2_t __riscv_vfcvt_xu_f_v_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                            vfloat16mf2_t vs2, size_t vl);
vuint16mf2_t __riscv_vfcvt_rtz_xu_f_v_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                                vfloat16mf2_t vs2, size_t vl);
vuint16m1_t __riscv_vfcvt_xu_f_v_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                          vfloat16m1_t vs2, size_t vl);
vuint16m1_t __riscv_vfcvt_rtz_xu_f_v_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                              vfloat16m1_t vs2, size_t vl);
vuint16m2_t __riscv_vfcvt_xu_f_v_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                          vfloat16m2_t vs2, size_t vl);
vuint16m2_t __riscv_vfcvt_rtz_xu_f_v_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                              vfloat16m2_t vs2, size_t vl);
vuint16m4_t __riscv_vfcvt_xu_f_v_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                          vfloat16m4_t vs2, size_t vl);
vuint16m4_t __riscv_vfcvt_rtz_xu_f_v_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                              vfloat16m4_t vs2, size_t vl);
vuint16m8_t __riscv_vfcvt_xu_f_v_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                          vfloat16m8_t vs2, size_t vl);
vuint16m8_t __riscv_vfcvt_rtz_xu_f_v_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                              vfloat16m8_t vs2, size_t vl);
// 16-bit signed integer -> float (vint16* -> vfloat16*).
vfloat16mf4_t __riscv_vfcvt_f_x_v_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                            vint16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfcvt_f_x_v_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                            vint16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfcvt_f_x_v_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                          vint16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfcvt_f_x_v_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                          vint16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfcvt_f_x_v_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                          vint16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfcvt_f_x_v_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                          vint16m8_t vs2, size_t vl);
// 16-bit unsigned integer -> float (vuint16* -> vfloat16*).
vfloat16mf4_t __riscv_vfcvt_f_xu_v_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                             vuint16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfcvt_f_xu_v_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                             vuint16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfcvt_f_xu_v_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                           vuint16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfcvt_f_xu_v_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                           vuint16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfcvt_f_xu_v_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                           vuint16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfcvt_f_xu_v_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                           vuint16m8_t vs2, size_t vl);
// Masked `_mu` variants, 32-bit elements.
// Signature shape: (vm, vd, vs2, vl); the mask type is vbool<N>_t with
// N = SEW / LMUL (i32mf2 -> vbool64_t, i32m8 -> vbool4_t).
//
// 32-bit float -> signed integer (vfloat32* -> vint32*), plain and `rtz`
// forms for each LMUL.
vint32mf2_t __riscv_vfcvt_x_f_v_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                          vfloat32mf2_t vs2, size_t vl);
vint32mf2_t __riscv_vfcvt_rtz_x_f_v_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                              vfloat32mf2_t vs2, size_t vl);
vint32m1_t __riscv_vfcvt_x_f_v_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                        vfloat32m1_t vs2, size_t vl);
vint32m1_t __riscv_vfcvt_rtz_x_f_v_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                            vfloat32m1_t vs2, size_t vl);
vint32m2_t __riscv_vfcvt_x_f_v_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                        vfloat32m2_t vs2, size_t vl);
vint32m2_t __riscv_vfcvt_rtz_x_f_v_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                            vfloat32m2_t vs2, size_t vl);
vint32m4_t __riscv_vfcvt_x_f_v_i32m4_mu(vbool8_t vm, vint32m4_t vd,
                                        vfloat32m4_t vs2, size_t vl);
vint32m4_t __riscv_vfcvt_rtz_x_f_v_i32m4_mu(vbool8_t vm, vint32m4_t vd,
                                            vfloat32m4_t vs2, size_t vl);
vint32m8_t __riscv_vfcvt_x_f_v_i32m8_mu(vbool4_t vm, vint32m8_t vd,
                                        vfloat32m8_t vs2, size_t vl);
vint32m8_t __riscv_vfcvt_rtz_x_f_v_i32m8_mu(vbool4_t vm, vint32m8_t vd,
                                            vfloat32m8_t vs2, size_t vl);
// 32-bit float -> unsigned integer (vfloat32* -> vuint32*), plain and `rtz`
// forms.
vuint32mf2_t __riscv_vfcvt_xu_f_v_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                            vfloat32mf2_t vs2, size_t vl);
vuint32mf2_t __riscv_vfcvt_rtz_xu_f_v_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                                vfloat32mf2_t vs2, size_t vl);
vuint32m1_t __riscv_vfcvt_xu_f_v_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                          vfloat32m1_t vs2, size_t vl);
vuint32m1_t __riscv_vfcvt_rtz_xu_f_v_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                              vfloat32m1_t vs2, size_t vl);
vuint32m2_t __riscv_vfcvt_xu_f_v_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                          vfloat32m2_t vs2, size_t vl);
vuint32m2_t __riscv_vfcvt_rtz_xu_f_v_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                              vfloat32m2_t vs2, size_t vl);
vuint32m4_t __riscv_vfcvt_xu_f_v_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                          vfloat32m4_t vs2, size_t vl);
vuint32m4_t __riscv_vfcvt_rtz_xu_f_v_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                              vfloat32m4_t vs2, size_t vl);
vuint32m8_t __riscv_vfcvt_xu_f_v_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                          vfloat32m8_t vs2, size_t vl);
vuint32m8_t __riscv_vfcvt_rtz_xu_f_v_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                              vfloat32m8_t vs2, size_t vl);
// 32-bit signed integer -> float (vint32* -> vfloat32*).
vfloat32mf2_t __riscv_vfcvt_f_x_v_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                            vint32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfcvt_f_x_v_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                          vint32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfcvt_f_x_v_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                          vint32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfcvt_f_x_v_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                          vint32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfcvt_f_x_v_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                          vint32m8_t vs2, size_t vl);
// 32-bit unsigned integer -> float (vuint32* -> vfloat32*).
vfloat32mf2_t __riscv_vfcvt_f_xu_v_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                             vuint32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfcvt_f_xu_v_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                           vuint32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfcvt_f_xu_v_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                           vuint32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfcvt_f_xu_v_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                           vuint32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfcvt_f_xu_v_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                           vuint32m8_t vs2, size_t vl);
// Masked `_mu` variants, 64-bit elements.
// Signature shape: (vm, vd, vs2, vl); the mask type is vbool<N>_t with
// N = SEW / LMUL (i64m1 -> vbool64_t, i64m8 -> vbool8_t).
//
// 64-bit float -> signed integer (vfloat64* -> vint64*), plain and `rtz`
// forms for each LMUL.
vint64m1_t __riscv_vfcvt_x_f_v_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                        vfloat64m1_t vs2, size_t vl);
vint64m1_t __riscv_vfcvt_rtz_x_f_v_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                            vfloat64m1_t vs2, size_t vl);
vint64m2_t __riscv_vfcvt_x_f_v_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                        vfloat64m2_t vs2, size_t vl);
vint64m2_t __riscv_vfcvt_rtz_x_f_v_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                            vfloat64m2_t vs2, size_t vl);
vint64m4_t __riscv_vfcvt_x_f_v_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                        vfloat64m4_t vs2, size_t vl);
vint64m4_t __riscv_vfcvt_rtz_x_f_v_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                            vfloat64m4_t vs2, size_t vl);
vint64m8_t __riscv_vfcvt_x_f_v_i64m8_mu(vbool8_t vm, vint64m8_t vd,
                                        vfloat64m8_t vs2, size_t vl);
vint64m8_t __riscv_vfcvt_rtz_x_f_v_i64m8_mu(vbool8_t vm, vint64m8_t vd,
                                            vfloat64m8_t vs2, size_t vl);
// 64-bit float -> unsigned integer (vfloat64* -> vuint64*), plain and `rtz`
// forms.
vuint64m1_t __riscv_vfcvt_xu_f_v_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                          vfloat64m1_t vs2, size_t vl);
vuint64m1_t __riscv_vfcvt_rtz_xu_f_v_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                              vfloat64m1_t vs2, size_t vl);
vuint64m2_t __riscv_vfcvt_xu_f_v_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                          vfloat64m2_t vs2, size_t vl);
vuint64m2_t __riscv_vfcvt_rtz_xu_f_v_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                              vfloat64m2_t vs2, size_t vl);
vuint64m4_t __riscv_vfcvt_xu_f_v_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                          vfloat64m4_t vs2, size_t vl);
vuint64m4_t __riscv_vfcvt_rtz_xu_f_v_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                              vfloat64m4_t vs2, size_t vl);
vuint64m8_t __riscv_vfcvt_xu_f_v_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                          vfloat64m8_t vs2, size_t vl);
vuint64m8_t __riscv_vfcvt_rtz_xu_f_v_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                              vfloat64m8_t vs2, size_t vl);
// 64-bit signed integer -> float (vint64* -> vfloat64*).
vfloat64m1_t __riscv_vfcvt_f_x_v_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                          vint64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfcvt_f_x_v_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                          vint64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfcvt_f_x_v_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                          vint64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfcvt_f_x_v_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                          vint64m8_t vs2, size_t vl);
// 64-bit unsigned integer -> float (vuint64* -> vfloat64*).
vfloat64m1_t __riscv_vfcvt_f_xu_v_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                           vuint64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfcvt_f_xu_v_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                           vuint64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfcvt_f_xu_v_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                           vuint64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfcvt_f_xu_v_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                           vuint64m8_t vs2, size_t vl);
// unmasked functions with an explicit rounding-mode argument: `_rm_tu`
// variants, 16-bit elements.
// Signature shape: (vd, vs2, frm, vl) -- there is no `vm` mask parameter, and
// this group has no `rtz` forms.
// NOTE(review): `frm` presumably carries a floating-point rounding-mode
// encoding and `_tu` presumably means tail-undisturbed (tail elements taken
// from `vd`) -- confirm against the intrinsics naming rules.
//
// 16-bit float -> signed integer (vfloat16* -> vint16*).
vint16mf4_t __riscv_vfcvt_x_f_v_i16mf4_rm_tu(vint16mf4_t vd, vfloat16mf4_t vs2,
                                             unsigned int frm, size_t vl);
vint16mf2_t __riscv_vfcvt_x_f_v_i16mf2_rm_tu(vint16mf2_t vd, vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vint16m1_t __riscv_vfcvt_x_f_v_i16m1_rm_tu(vint16m1_t vd, vfloat16m1_t vs2,
                                           unsigned int frm, size_t vl);
vint16m2_t __riscv_vfcvt_x_f_v_i16m2_rm_tu(vint16m2_t vd, vfloat16m2_t vs2,
                                           unsigned int frm, size_t vl);
vint16m4_t __riscv_vfcvt_x_f_v_i16m4_rm_tu(vint16m4_t vd, vfloat16m4_t vs2,
                                           unsigned int frm, size_t vl);
vint16m8_t __riscv_vfcvt_x_f_v_i16m8_rm_tu(vint16m8_t vd, vfloat16m8_t vs2,
                                           unsigned int frm, size_t vl);
// 16-bit float -> unsigned integer (vfloat16* -> vuint16*).
vuint16mf4_t __riscv_vfcvt_xu_f_v_u16mf4_rm_tu(vuint16mf4_t vd,
                                               vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vuint16mf2_t __riscv_vfcvt_xu_f_v_u16mf2_rm_tu(vuint16mf2_t vd,
                                               vfloat16mf2_t vs2,
                                               unsigned int frm, size_t vl);
vuint16m1_t __riscv_vfcvt_xu_f_v_u16m1_rm_tu(vuint16m1_t vd, vfloat16m1_t vs2,
                                             unsigned int frm, size_t vl);
vuint16m2_t __riscv_vfcvt_xu_f_v_u16m2_rm_tu(vuint16m2_t vd, vfloat16m2_t vs2,
                                             unsigned int frm, size_t vl);
vuint16m4_t __riscv_vfcvt_xu_f_v_u16m4_rm_tu(vuint16m4_t vd, vfloat16m4_t vs2,
                                             unsigned int frm, size_t vl);
vuint16m8_t __riscv_vfcvt_xu_f_v_u16m8_rm_tu(vuint16m8_t vd, vfloat16m8_t vs2,
                                             unsigned int frm, size_t vl);
// 16-bit signed integer -> float (vint16* -> vfloat16*).
vfloat16mf4_t __riscv_vfcvt_f_x_v_f16mf4_rm_tu(vfloat16mf4_t vd,
                                               vint16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfcvt_f_x_v_f16mf2_rm_tu(vfloat16mf2_t vd,
                                               vint16mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfcvt_f_x_v_f16m1_rm_tu(vfloat16m1_t vd, vint16m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfcvt_f_x_v_f16m2_rm_tu(vfloat16m2_t vd, vint16m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfcvt_f_x_v_f16m4_rm_tu(vfloat16m4_t vd, vint16m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfcvt_f_x_v_f16m8_rm_tu(vfloat16m8_t vd, vint16m8_t vs2,
                                             unsigned int frm, size_t vl);
// 16-bit unsigned integer -> float (vuint16* -> vfloat16*).
vfloat16mf4_t __riscv_vfcvt_f_xu_v_f16mf4_rm_tu(vfloat16mf4_t vd,
                                                vuint16mf4_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfcvt_f_xu_v_f16mf2_rm_tu(vfloat16mf2_t vd,
                                                vuint16mf2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfcvt_f_xu_v_f16m1_rm_tu(vfloat16m1_t vd, vuint16m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfcvt_f_xu_v_f16m2_rm_tu(vfloat16m2_t vd, vuint16m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfcvt_f_xu_v_f16m4_rm_tu(vfloat16m4_t vd, vuint16m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfcvt_f_xu_v_f16m8_rm_tu(vfloat16m8_t vd, vuint16m8_t vs2,
                                              unsigned int frm, size_t vl);
// Unmasked `_rm_tu` variants, 32-bit elements.
// Signature shape: (vd, vs2, frm, vl) -- no `vm` mask parameter; `frm` is an
// explicit `unsigned int` argument placed before `vl`.
//
// 32-bit float -> signed integer (vfloat32* -> vint32*).
vint32mf2_t __riscv_vfcvt_x_f_v_i32mf2_rm_tu(vint32mf2_t vd, vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vint32m1_t __riscv_vfcvt_x_f_v_i32m1_rm_tu(vint32m1_t vd, vfloat32m1_t vs2,
                                           unsigned int frm, size_t vl);
vint32m2_t __riscv_vfcvt_x_f_v_i32m2_rm_tu(vint32m2_t vd, vfloat32m2_t vs2,
                                           unsigned int frm, size_t vl);
vint32m4_t __riscv_vfcvt_x_f_v_i32m4_rm_tu(vint32m4_t vd, vfloat32m4_t vs2,
                                           unsigned int frm, size_t vl);
vint32m8_t __riscv_vfcvt_x_f_v_i32m8_rm_tu(vint32m8_t vd, vfloat32m8_t vs2,
                                           unsigned int frm, size_t vl);
// 32-bit float -> unsigned integer (vfloat32* -> vuint32*).
vuint32mf2_t __riscv_vfcvt_xu_f_v_u32mf2_rm_tu(vuint32mf2_t vd,
                                               vfloat32mf2_t vs2,
                                               unsigned int frm, size_t vl);
vuint32m1_t __riscv_vfcvt_xu_f_v_u32m1_rm_tu(vuint32m1_t vd, vfloat32m1_t vs2,
                                             unsigned int frm, size_t vl);
vuint32m2_t __riscv_vfcvt_xu_f_v_u32m2_rm_tu(vuint32m2_t vd, vfloat32m2_t vs2,
                                             unsigned int frm, size_t vl);
vuint32m4_t __riscv_vfcvt_xu_f_v_u32m4_rm_tu(vuint32m4_t vd, vfloat32m4_t vs2,
                                             unsigned int frm, size_t vl);
vuint32m8_t __riscv_vfcvt_xu_f_v_u32m8_rm_tu(vuint32m8_t vd, vfloat32m8_t vs2,
                                             unsigned int frm, size_t vl);
// 32-bit signed integer -> float (vint32* -> vfloat32*).
vfloat32mf2_t __riscv_vfcvt_f_x_v_f32mf2_rm_tu(vfloat32mf2_t vd,
                                               vint32mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfcvt_f_x_v_f32m1_rm_tu(vfloat32m1_t vd, vint32m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfcvt_f_x_v_f32m2_rm_tu(vfloat32m2_t vd, vint32m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfcvt_f_x_v_f32m4_rm_tu(vfloat32m4_t vd, vint32m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfcvt_f_x_v_f32m8_rm_tu(vfloat32m8_t vd, vint32m8_t vs2,
                                             unsigned int frm, size_t vl);
// 32-bit unsigned integer -> float (vuint32* -> vfloat32*).
vfloat32mf2_t __riscv_vfcvt_f_xu_v_f32mf2_rm_tu(vfloat32mf2_t vd,
                                                vuint32mf2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfcvt_f_xu_v_f32m1_rm_tu(vfloat32m1_t vd, vuint32m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfcvt_f_xu_v_f32m2_rm_tu(vfloat32m2_t vd, vuint32m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfcvt_f_xu_v_f32m4_rm_tu(vfloat32m4_t vd, vuint32m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfcvt_f_xu_v_f32m8_rm_tu(vfloat32m8_t vd, vuint32m8_t vs2,
                                              unsigned int frm, size_t vl);
// Unmasked `_rm_tu` variants, 64-bit elements.
// Signature shape: (vd, vs2, frm, vl) -- no `vm` mask parameter; `frm` is an
// explicit `unsigned int` argument placed before `vl`.
//
// 64-bit float -> signed integer (vfloat64* -> vint64*).
vint64m1_t __riscv_vfcvt_x_f_v_i64m1_rm_tu(vint64m1_t vd, vfloat64m1_t vs2,
                                           unsigned int frm, size_t vl);
vint64m2_t __riscv_vfcvt_x_f_v_i64m2_rm_tu(vint64m2_t vd, vfloat64m2_t vs2,
                                           unsigned int frm, size_t vl);
vint64m4_t __riscv_vfcvt_x_f_v_i64m4_rm_tu(vint64m4_t vd, vfloat64m4_t vs2,
                                           unsigned int frm, size_t vl);
vint64m8_t __riscv_vfcvt_x_f_v_i64m8_rm_tu(vint64m8_t vd, vfloat64m8_t vs2,
                                           unsigned int frm, size_t vl);
// 64-bit float -> unsigned integer (vfloat64* -> vuint64*).
vuint64m1_t __riscv_vfcvt_xu_f_v_u64m1_rm_tu(vuint64m1_t vd, vfloat64m1_t vs2,
                                             unsigned int frm, size_t vl);
vuint64m2_t __riscv_vfcvt_xu_f_v_u64m2_rm_tu(vuint64m2_t vd, vfloat64m2_t vs2,
                                             unsigned int frm, size_t vl);
vuint64m4_t __riscv_vfcvt_xu_f_v_u64m4_rm_tu(vuint64m4_t vd, vfloat64m4_t vs2,
                                             unsigned int frm, size_t vl);
vuint64m8_t __riscv_vfcvt_xu_f_v_u64m8_rm_tu(vuint64m8_t vd, vfloat64m8_t vs2,
                                             unsigned int frm, size_t vl);
// 64-bit signed integer -> float (vint64* -> vfloat64*).
vfloat64m1_t __riscv_vfcvt_f_x_v_f64m1_rm_tu(vfloat64m1_t vd, vint64m1_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfcvt_f_x_v_f64m2_rm_tu(vfloat64m2_t vd, vint64m2_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfcvt_f_x_v_f64m4_rm_tu(vfloat64m4_t vd, vint64m4_t vs2,
                                             unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfcvt_f_x_v_f64m8_rm_tu(vfloat64m8_t vd, vint64m8_t vs2,
                                             unsigned int frm, size_t vl);
// 64-bit unsigned integer -> float (vuint64* -> vfloat64*).
vfloat64m1_t __riscv_vfcvt_f_xu_v_f64m1_rm_tu(vfloat64m1_t vd, vuint64m1_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfcvt_f_xu_v_f64m2_rm_tu(vfloat64m2_t vd, vuint64m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfcvt_f_xu_v_f64m4_rm_tu(vfloat64m4_t vd, vuint64m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfcvt_f_xu_v_f64m8_rm_tu(vfloat64m8_t vd, vuint64m8_t vs2,
                                              unsigned int frm, size_t vl);
// masked functions: `_rm_tum` variants (explicit rounding-mode argument),
// 16-bit elements.
// Signature shape: (vm, vd, vs2, frm, vl); the mask type is vbool<N>_t with
// N = SEW / LMUL (i16mf4 -> vbool64_t, i16m8 -> vbool2_t). This group has no
// `rtz` forms.
// NOTE(review): `_tum` presumably means tail-undisturbed / mask-agnostic and
// `frm` presumably carries a floating-point rounding-mode encoding -- confirm
// against the intrinsics naming rules.
//
// 16-bit float -> signed integer (vfloat16* -> vint16*).
vint16mf4_t __riscv_vfcvt_x_f_v_i16mf4_rm_tum(vbool64_t vm, vint16mf4_t vd,
                                              vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vint16mf2_t __riscv_vfcvt_x_f_v_i16mf2_rm_tum(vbool32_t vm, vint16mf2_t vd,
                                              vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vint16m1_t __riscv_vfcvt_x_f_v_i16m1_rm_tum(vbool16_t vm, vint16m1_t vd,
                                            vfloat16m1_t vs2, unsigned int frm,
                                            size_t vl);
vint16m2_t __riscv_vfcvt_x_f_v_i16m2_rm_tum(vbool8_t vm, vint16m2_t vd,
                                            vfloat16m2_t vs2, unsigned int frm,
                                            size_t vl);
vint16m4_t __riscv_vfcvt_x_f_v_i16m4_rm_tum(vbool4_t vm, vint16m4_t vd,
                                            vfloat16m4_t vs2, unsigned int frm,
                                            size_t vl);
vint16m8_t __riscv_vfcvt_x_f_v_i16m8_rm_tum(vbool2_t vm, vint16m8_t vd,
                                            vfloat16m8_t vs2, unsigned int frm,
                                            size_t vl);
// 16-bit float -> unsigned integer (vfloat16* -> vuint16*).
vuint16mf4_t __riscv_vfcvt_xu_f_v_u16mf4_rm_tum(vbool64_t vm, vuint16mf4_t vd,
                                                vfloat16mf4_t vs2,
                                                unsigned int frm, size_t vl);
vuint16mf2_t __riscv_vfcvt_xu_f_v_u16mf2_rm_tum(vbool32_t vm, vuint16mf2_t vd,
                                                vfloat16mf2_t vs2,
                                                unsigned int frm, size_t vl);
vuint16m1_t __riscv_vfcvt_xu_f_v_u16m1_rm_tum(vbool16_t vm, vuint16m1_t vd,
                                              vfloat16m1_t vs2,
                                              unsigned int frm, size_t vl);
vuint16m2_t __riscv_vfcvt_xu_f_v_u16m2_rm_tum(vbool8_t vm, vuint16m2_t vd,
                                              vfloat16m2_t vs2,
                                              unsigned int frm, size_t vl);
vuint16m4_t __riscv_vfcvt_xu_f_v_u16m4_rm_tum(vbool4_t vm, vuint16m4_t vd,
                                              vfloat16m4_t vs2,
                                              unsigned int frm, size_t vl);
vuint16m8_t __riscv_vfcvt_xu_f_v_u16m8_rm_tum(vbool2_t vm, vuint16m8_t vd,
                                              vfloat16m8_t vs2,
                                              unsigned int frm, size_t vl);
// 16-bit signed integer -> float (vint16* -> vfloat16*).
vfloat16mf4_t __riscv_vfcvt_f_x_v_f16mf4_rm_tum(vbool64_t vm, vfloat16mf4_t vd,
                                                vint16mf4_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfcvt_f_x_v_f16mf2_rm_tum(vbool32_t vm, vfloat16mf2_t vd,
                                                vint16mf2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfcvt_f_x_v_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                              vint16m1_t vs2, unsigned int frm,
                                              size_t vl);
vfloat16m2_t __riscv_vfcvt_f_x_v_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                              vint16m2_t vs2, unsigned int frm,
                                              size_t vl);
vfloat16m4_t __riscv_vfcvt_f_x_v_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                              vint16m4_t vs2, unsigned int frm,
                                              size_t vl);
vfloat16m8_t __riscv_vfcvt_f_x_v_f16m8_rm_tum(vbool2_t vm, vfloat16m8_t vd,
                                              vint16m8_t vs2, unsigned int frm,
                                              size_t vl);
// 16-bit unsigned integer -> float (vuint16* -> vfloat16*).
vfloat16mf4_t __riscv_vfcvt_f_xu_v_f16mf4_rm_tum(vbool64_t vm, vfloat16mf4_t vd,
                                                 vuint16mf4_t vs2,
                                                 unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfcvt_f_xu_v_f16mf2_rm_tum(vbool32_t vm, vfloat16mf2_t vd,
                                                 vuint16mf2_t vs2,
                                                 unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfcvt_f_xu_v_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                               vuint16m1_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfcvt_f_xu_v_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                               vuint16m2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfcvt_f_xu_v_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                               vuint16m4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfcvt_f_xu_v_f16m8_rm_tum(vbool2_t vm, vfloat16m8_t vd,
                                               vuint16m8_t vs2,
                                               unsigned int frm, size_t vl);
// Masked `_rm_tum` variants, 32-bit elements.
// Signature shape: (vm, vd, vs2, frm, vl); the mask type is vbool<N>_t with
// N = SEW / LMUL (i32mf2 -> vbool64_t, i32m8 -> vbool4_t).
//
// 32-bit float -> signed integer (vfloat32* -> vint32*).
vint32mf2_t __riscv_vfcvt_x_f_v_i32mf2_rm_tum(vbool64_t vm, vint32mf2_t vd,
                                              vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vint32m1_t __riscv_vfcvt_x_f_v_i32m1_rm_tum(vbool32_t vm, vint32m1_t vd,
                                            vfloat32m1_t vs2, unsigned int frm,
                                            size_t vl);
vint32m2_t __riscv_vfcvt_x_f_v_i32m2_rm_tum(vbool16_t vm, vint32m2_t vd,
                                            vfloat32m2_t vs2, unsigned int frm,
                                            size_t vl);
vint32m4_t __riscv_vfcvt_x_f_v_i32m4_rm_tum(vbool8_t vm, vint32m4_t vd,
                                            vfloat32m4_t vs2, unsigned int frm,
                                            size_t vl);
vint32m8_t __riscv_vfcvt_x_f_v_i32m8_rm_tum(vbool4_t vm, vint32m8_t vd,
                                            vfloat32m8_t vs2, unsigned int frm,
                                            size_t vl);
// 32-bit float -> unsigned integer (vfloat32* -> vuint32*).
vuint32mf2_t __riscv_vfcvt_xu_f_v_u32mf2_rm_tum(vbool64_t vm, vuint32mf2_t vd,
                                                vfloat32mf2_t vs2,
                                                unsigned int frm, size_t vl);
vuint32m1_t __riscv_vfcvt_xu_f_v_u32m1_rm_tum(vbool32_t vm, vuint32m1_t vd,
                                              vfloat32m1_t vs2,
                                              unsigned int frm, size_t vl);
vuint32m2_t __riscv_vfcvt_xu_f_v_u32m2_rm_tum(vbool16_t vm, vuint32m2_t vd,
                                              vfloat32m2_t vs2,
                                              unsigned int frm, size_t vl);
vuint32m4_t __riscv_vfcvt_xu_f_v_u32m4_rm_tum(vbool8_t vm, vuint32m4_t vd,
                                              vfloat32m4_t vs2,
                                              unsigned int frm, size_t vl);
vuint32m8_t __riscv_vfcvt_xu_f_v_u32m8_rm_tum(vbool4_t vm, vuint32m8_t vd,
                                              vfloat32m8_t vs2,
                                              unsigned int frm, size_t vl);
// 32-bit signed integer -> float (vint32* -> vfloat32*).
vfloat32mf2_t __riscv_vfcvt_f_x_v_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                                vint32mf2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfcvt_f_x_v_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                              vint32m1_t vs2, unsigned int frm,
                                              size_t vl);
vfloat32m2_t __riscv_vfcvt_f_x_v_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                              vint32m2_t vs2, unsigned int frm,
                                              size_t vl);
vfloat32m4_t __riscv_vfcvt_f_x_v_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                              vint32m4_t vs2, unsigned int frm,
                                              size_t vl);
vfloat32m8_t __riscv_vfcvt_f_x_v_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                              vint32m8_t vs2, unsigned int frm,
                                              size_t vl);
// 32-bit unsigned integer -> float (vuint32* -> vfloat32*).
vfloat32mf2_t __riscv_vfcvt_f_xu_v_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                                 vuint32mf2_t vs2,
                                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfcvt_f_xu_v_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                               vuint32m1_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfcvt_f_xu_v_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                               vuint32m2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfcvt_f_xu_v_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                               vuint32m4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfcvt_f_xu_v_f32m8_rm_tum(vbool4_t vm, vfloat32m8_t vd,
                                               vuint32m8_t vs2,
                                               unsigned int frm, size_t vl);
// Masked `_rm_tum` variants, 64-bit elements.
// Signature shape: (vm, vd, vs2, frm, vl); the mask type is vbool<N>_t with
// N = SEW / LMUL (i64m1 -> vbool64_t, i64m8 -> vbool8_t).
//
// 64-bit float -> signed integer (vfloat64* -> vint64*).
vint64m1_t __riscv_vfcvt_x_f_v_i64m1_rm_tum(vbool64_t vm, vint64m1_t vd,
                                            vfloat64m1_t vs2, unsigned int frm,
                                            size_t vl);
vint64m2_t __riscv_vfcvt_x_f_v_i64m2_rm_tum(vbool32_t vm, vint64m2_t vd,
                                            vfloat64m2_t vs2, unsigned int frm,
                                            size_t vl);
vint64m4_t __riscv_vfcvt_x_f_v_i64m4_rm_tum(vbool16_t vm, vint64m4_t vd,
                                            vfloat64m4_t vs2, unsigned int frm,
                                            size_t vl);
vint64m8_t __riscv_vfcvt_x_f_v_i64m8_rm_tum(vbool8_t vm, vint64m8_t vd,
                                            vfloat64m8_t vs2, unsigned int frm,
                                            size_t vl);
// 64-bit float -> unsigned integer (vfloat64* -> vuint64*).
vuint64m1_t __riscv_vfcvt_xu_f_v_u64m1_rm_tum(vbool64_t vm, vuint64m1_t vd,
                                              vfloat64m1_t vs2,
                                              unsigned int frm, size_t vl);
vuint64m2_t __riscv_vfcvt_xu_f_v_u64m2_rm_tum(vbool32_t vm, vuint64m2_t vd,
                                              vfloat64m2_t vs2,
                                              unsigned int frm, size_t vl);
vuint64m4_t __riscv_vfcvt_xu_f_v_u64m4_rm_tum(vbool16_t vm, vuint64m4_t vd,
                                              vfloat64m4_t vs2,
                                              unsigned int frm, size_t vl);
vuint64m8_t __riscv_vfcvt_xu_f_v_u64m8_rm_tum(vbool8_t vm, vuint64m8_t vd,
                                              vfloat64m8_t vs2,
                                              unsigned int frm, size_t vl);
// 64-bit signed integer -> float (vint64* -> vfloat64*).
vfloat64m1_t __riscv_vfcvt_f_x_v_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                              vint64m1_t vs2, unsigned int frm,
                                              size_t vl);
vfloat64m2_t __riscv_vfcvt_f_x_v_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                              vint64m2_t vs2, unsigned int frm,
                                              size_t vl);
vfloat64m4_t __riscv_vfcvt_f_x_v_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                              vint64m4_t vs2, unsigned int frm,
                                              size_t vl);
vfloat64m8_t __riscv_vfcvt_f_x_v_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                              vint64m8_t vs2, unsigned int frm,
                                              size_t vl);
// 64-bit unsigned integer -> float (vuint64* -> vfloat64*).
vfloat64m1_t __riscv_vfcvt_f_xu_v_f64m1_rm_tum(vbool64_t vm, vfloat64m1_t vd,
                                               vuint64m1_t vs2,
                                               unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfcvt_f_xu_v_f64m2_rm_tum(vbool32_t vm, vfloat64m2_t vd,
                                               vuint64m2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfcvt_f_xu_v_f64m4_rm_tum(vbool16_t vm, vfloat64m4_t vd,
                                               vuint64m4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfcvt_f_xu_v_f64m8_rm_tum(vbool8_t vm, vfloat64m8_t vd,
                                               vuint64m8_t vs2,
                                               unsigned int frm, size_t vl);
// masked functions, `_tumu` policy (tail undisturbed, mask undisturbed)
// vfcvt, explicit rounding-mode (`_rm`) form, `_tumu` policy suffix, 16-bit
// elements. Four families, each declared for LMUL mf4..m8:
//   x_f  : f16 -> i16      xu_f : f16 -> u16
//   f_x  : i16 -> f16      f_xu : u16 -> f16
// Source and destination always share the same SEW and LMUL.
// Each declaration takes the mask `vm`, a `vd` operand of the return type,
// the source vector `vs2`, `frm` and `vl`.
// The mask type is vboolN_t with N = SEW/LMUL (mf4 -> vbool64_t, ...,
// m8 -> vbool2_t).
vint16mf4_t __riscv_vfcvt_x_f_v_i16mf4_rm_tumu(vbool64_t vm, vint16mf4_t vd,
                                               vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vint16mf2_t __riscv_vfcvt_x_f_v_i16mf2_rm_tumu(vbool32_t vm, vint16mf2_t vd,
                                               vfloat16mf2_t vs2,
                                               unsigned int frm, size_t vl);
vint16m1_t __riscv_vfcvt_x_f_v_i16m1_rm_tumu(vbool16_t vm, vint16m1_t vd,
                                             vfloat16m1_t vs2, unsigned int frm,
                                             size_t vl);
vint16m2_t __riscv_vfcvt_x_f_v_i16m2_rm_tumu(vbool8_t vm, vint16m2_t vd,
                                             vfloat16m2_t vs2, unsigned int frm,
                                             size_t vl);
vint16m4_t __riscv_vfcvt_x_f_v_i16m4_rm_tumu(vbool4_t vm, vint16m4_t vd,
                                             vfloat16m4_t vs2, unsigned int frm,
                                             size_t vl);
vint16m8_t __riscv_vfcvt_x_f_v_i16m8_rm_tumu(vbool2_t vm, vint16m8_t vd,
                                             vfloat16m8_t vs2, unsigned int frm,
                                             size_t vl);
vuint16mf4_t __riscv_vfcvt_xu_f_v_u16mf4_rm_tumu(vbool64_t vm, vuint16mf4_t vd,
                                                 vfloat16mf4_t vs2,
                                                 unsigned int frm, size_t vl);
vuint16mf2_t __riscv_vfcvt_xu_f_v_u16mf2_rm_tumu(vbool32_t vm, vuint16mf2_t vd,
                                                 vfloat16mf2_t vs2,
                                                 unsigned int frm, size_t vl);
vuint16m1_t __riscv_vfcvt_xu_f_v_u16m1_rm_tumu(vbool16_t vm, vuint16m1_t vd,
                                               vfloat16m1_t vs2,
                                               unsigned int frm, size_t vl);
vuint16m2_t __riscv_vfcvt_xu_f_v_u16m2_rm_tumu(vbool8_t vm, vuint16m2_t vd,
                                               vfloat16m2_t vs2,
                                               unsigned int frm, size_t vl);
vuint16m4_t __riscv_vfcvt_xu_f_v_u16m4_rm_tumu(vbool4_t vm, vuint16m4_t vd,
                                               vfloat16m4_t vs2,
                                               unsigned int frm, size_t vl);
vuint16m8_t __riscv_vfcvt_xu_f_v_u16m8_rm_tumu(vbool2_t vm, vuint16m8_t vd,
                                               vfloat16m8_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfcvt_f_x_v_f16mf4_rm_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                                 vint16mf4_t vs2,
                                                 unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfcvt_f_x_v_f16mf2_rm_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                                 vint16mf2_t vs2,
                                                 unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfcvt_f_x_v_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                               vint16m1_t vs2, unsigned int frm,
                                               size_t vl);
vfloat16m2_t __riscv_vfcvt_f_x_v_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                               vint16m2_t vs2, unsigned int frm,
                                               size_t vl);
vfloat16m4_t __riscv_vfcvt_f_x_v_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                               vint16m4_t vs2, unsigned int frm,
                                               size_t vl);
vfloat16m8_t __riscv_vfcvt_f_x_v_f16m8_rm_tumu(vbool2_t vm, vfloat16m8_t vd,
                                               vint16m8_t vs2, unsigned int frm,
                                               size_t vl);
vfloat16mf4_t __riscv_vfcvt_f_xu_v_f16mf4_rm_tumu(vbool64_t vm,
                                                  vfloat16mf4_t vd,
                                                  vuint16mf4_t vs2,
                                                  unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfcvt_f_xu_v_f16mf2_rm_tumu(vbool32_t vm,
                                                  vfloat16mf2_t vd,
                                                  vuint16mf2_t vs2,
                                                  unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfcvt_f_xu_v_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                                vuint16m1_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfcvt_f_xu_v_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                                vuint16m2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfcvt_f_xu_v_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                                vuint16m4_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfcvt_f_xu_v_f16m8_rm_tumu(vbool2_t vm, vfloat16m8_t vd,
                                                vuint16m8_t vs2,
                                                unsigned int frm, size_t vl);
// vfcvt, explicit rounding-mode (`_rm`) form, `_tumu` policy suffix, 32-bit
// elements. Four families, each declared for LMUL mf2..m8:
//   x_f  : f32 -> i32      xu_f : f32 -> u32
//   f_x  : i32 -> f32      f_xu : u32 -> f32
// Source and destination always share the same SEW and LMUL.
// Each declaration takes the mask `vm`, a `vd` operand of the return type,
// the source vector `vs2`, `frm` and `vl`.
// The mask type is vboolN_t with N = SEW/LMUL (mf2 -> vbool64_t, ...,
// m8 -> vbool4_t).
vint32mf2_t __riscv_vfcvt_x_f_v_i32mf2_rm_tumu(vbool64_t vm, vint32mf2_t vd,
                                               vfloat32mf2_t vs2,
                                               unsigned int frm, size_t vl);
vint32m1_t __riscv_vfcvt_x_f_v_i32m1_rm_tumu(vbool32_t vm, vint32m1_t vd,
                                             vfloat32m1_t vs2, unsigned int frm,
                                             size_t vl);
vint32m2_t __riscv_vfcvt_x_f_v_i32m2_rm_tumu(vbool16_t vm, vint32m2_t vd,
                                             vfloat32m2_t vs2, unsigned int frm,
                                             size_t vl);
vint32m4_t __riscv_vfcvt_x_f_v_i32m4_rm_tumu(vbool8_t vm, vint32m4_t vd,
                                             vfloat32m4_t vs2, unsigned int frm,
                                             size_t vl);
vint32m8_t __riscv_vfcvt_x_f_v_i32m8_rm_tumu(vbool4_t vm, vint32m8_t vd,
                                             vfloat32m8_t vs2, unsigned int frm,
                                             size_t vl);
vuint32mf2_t __riscv_vfcvt_xu_f_v_u32mf2_rm_tumu(vbool64_t vm, vuint32mf2_t vd,
                                                 vfloat32mf2_t vs2,
                                                 unsigned int frm, size_t vl);
vuint32m1_t __riscv_vfcvt_xu_f_v_u32m1_rm_tumu(vbool32_t vm, vuint32m1_t vd,
                                               vfloat32m1_t vs2,
                                               unsigned int frm, size_t vl);
vuint32m2_t __riscv_vfcvt_xu_f_v_u32m2_rm_tumu(vbool16_t vm, vuint32m2_t vd,
                                               vfloat32m2_t vs2,
                                               unsigned int frm, size_t vl);
vuint32m4_t __riscv_vfcvt_xu_f_v_u32m4_rm_tumu(vbool8_t vm, vuint32m4_t vd,
                                               vfloat32m4_t vs2,
                                               unsigned int frm, size_t vl);
vuint32m8_t __riscv_vfcvt_xu_f_v_u32m8_rm_tumu(vbool4_t vm, vuint32m8_t vd,
                                               vfloat32m8_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfcvt_f_x_v_f32mf2_rm_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                                 vint32mf2_t vs2,
                                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfcvt_f_x_v_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                               vint32m1_t vs2, unsigned int frm,
                                               size_t vl);
vfloat32m2_t __riscv_vfcvt_f_x_v_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                               vint32m2_t vs2, unsigned int frm,
                                               size_t vl);
vfloat32m4_t __riscv_vfcvt_f_x_v_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                               vint32m4_t vs2, unsigned int frm,
                                               size_t vl);
vfloat32m8_t __riscv_vfcvt_f_x_v_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                               vint32m8_t vs2, unsigned int frm,
                                               size_t vl);
vfloat32mf2_t __riscv_vfcvt_f_xu_v_f32mf2_rm_tumu(vbool64_t vm,
                                                  vfloat32mf2_t vd,
                                                  vuint32mf2_t vs2,
                                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfcvt_f_xu_v_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                                vuint32m1_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfcvt_f_xu_v_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                                vuint32m2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfcvt_f_xu_v_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                                vuint32m4_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfcvt_f_xu_v_f32m8_rm_tumu(vbool4_t vm, vfloat32m8_t vd,
                                                vuint32m8_t vs2,
                                                unsigned int frm, size_t vl);
// vfcvt, explicit rounding-mode (`_rm`) form, `_tumu` policy suffix, 64-bit
// elements. Four families, each declared for LMUL m1..m8:
//   x_f  : f64 -> i64      xu_f : f64 -> u64
//   f_x  : i64 -> f64      f_xu : u64 -> f64
// Source and destination always share the same SEW and LMUL.
// Each declaration takes the mask `vm`, a `vd` operand of the return type,
// the source vector `vs2`, `frm` and `vl`.
// The mask type is vboolN_t with N = SEW/LMUL (m1 -> vbool64_t, ...,
// m8 -> vbool8_t).
vint64m1_t __riscv_vfcvt_x_f_v_i64m1_rm_tumu(vbool64_t vm, vint64m1_t vd,
                                             vfloat64m1_t vs2, unsigned int frm,
                                             size_t vl);
vint64m2_t __riscv_vfcvt_x_f_v_i64m2_rm_tumu(vbool32_t vm, vint64m2_t vd,
                                             vfloat64m2_t vs2, unsigned int frm,
                                             size_t vl);
vint64m4_t __riscv_vfcvt_x_f_v_i64m4_rm_tumu(vbool16_t vm, vint64m4_t vd,
                                             vfloat64m4_t vs2, unsigned int frm,
                                             size_t vl);
vint64m8_t __riscv_vfcvt_x_f_v_i64m8_rm_tumu(vbool8_t vm, vint64m8_t vd,
                                             vfloat64m8_t vs2, unsigned int frm,
                                             size_t vl);
vuint64m1_t __riscv_vfcvt_xu_f_v_u64m1_rm_tumu(vbool64_t vm, vuint64m1_t vd,
                                               vfloat64m1_t vs2,
                                               unsigned int frm, size_t vl);
vuint64m2_t __riscv_vfcvt_xu_f_v_u64m2_rm_tumu(vbool32_t vm, vuint64m2_t vd,
                                               vfloat64m2_t vs2,
                                               unsigned int frm, size_t vl);
vuint64m4_t __riscv_vfcvt_xu_f_v_u64m4_rm_tumu(vbool16_t vm, vuint64m4_t vd,
                                               vfloat64m4_t vs2,
                                               unsigned int frm, size_t vl);
vuint64m8_t __riscv_vfcvt_xu_f_v_u64m8_rm_tumu(vbool8_t vm, vuint64m8_t vd,
                                               vfloat64m8_t vs2,
                                               unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfcvt_f_x_v_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                               vint64m1_t vs2, unsigned int frm,
                                               size_t vl);
vfloat64m2_t __riscv_vfcvt_f_x_v_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                               vint64m2_t vs2, unsigned int frm,
                                               size_t vl);
vfloat64m4_t __riscv_vfcvt_f_x_v_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                               vint64m4_t vs2, unsigned int frm,
                                               size_t vl);
vfloat64m8_t __riscv_vfcvt_f_x_v_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                               vint64m8_t vs2, unsigned int frm,
                                               size_t vl);
vfloat64m1_t __riscv_vfcvt_f_xu_v_f64m1_rm_tumu(vbool64_t vm, vfloat64m1_t vd,
                                                vuint64m1_t vs2,
                                                unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfcvt_f_xu_v_f64m2_rm_tumu(vbool32_t vm, vfloat64m2_t vd,
                                                vuint64m2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfcvt_f_xu_v_f64m4_rm_tumu(vbool16_t vm, vfloat64m4_t vd,
                                                vuint64m4_t vs2,
                                                unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfcvt_f_xu_v_f64m8_rm_tumu(vbool8_t vm, vfloat64m8_t vd,
                                                vuint64m8_t vs2,
                                                unsigned int frm, size_t vl);
// masked functions, `_mu` policy (tail agnostic, mask undisturbed)
// vfcvt, explicit rounding-mode (`_rm`) form, `_mu` policy suffix, 16-bit
// elements. Four families, each declared for LMUL mf4..m8:
//   x_f  : f16 -> i16      xu_f : f16 -> u16
//   f_x  : i16 -> f16      f_xu : u16 -> f16
// Source and destination always share the same SEW and LMUL.
// Each declaration takes the mask `vm`, a `vd` operand of the return type,
// the source vector `vs2`, `frm` and `vl`.
// The mask type is vboolN_t with N = SEW/LMUL (mf4 -> vbool64_t, ...,
// m8 -> vbool2_t).
vint16mf4_t __riscv_vfcvt_x_f_v_i16mf4_rm_mu(vbool64_t vm, vint16mf4_t vd,
                                             vfloat16mf4_t vs2,
                                             unsigned int frm, size_t vl);
vint16mf2_t __riscv_vfcvt_x_f_v_i16mf2_rm_mu(vbool32_t vm, vint16mf2_t vd,
                                             vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vint16m1_t __riscv_vfcvt_x_f_v_i16m1_rm_mu(vbool16_t vm, vint16m1_t vd,
                                           vfloat16m1_t vs2, unsigned int frm,
                                           size_t vl);
vint16m2_t __riscv_vfcvt_x_f_v_i16m2_rm_mu(vbool8_t vm, vint16m2_t vd,
                                           vfloat16m2_t vs2, unsigned int frm,
                                           size_t vl);
vint16m4_t __riscv_vfcvt_x_f_v_i16m4_rm_mu(vbool4_t vm, vint16m4_t vd,
                                           vfloat16m4_t vs2, unsigned int frm,
                                           size_t vl);
vint16m8_t __riscv_vfcvt_x_f_v_i16m8_rm_mu(vbool2_t vm, vint16m8_t vd,
                                           vfloat16m8_t vs2, unsigned int frm,
                                           size_t vl);
vuint16mf4_t __riscv_vfcvt_xu_f_v_u16mf4_rm_mu(vbool64_t vm, vuint16mf4_t vd,
                                               vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vuint16mf2_t __riscv_vfcvt_xu_f_v_u16mf2_rm_mu(vbool32_t vm, vuint16mf2_t vd,
                                               vfloat16mf2_t vs2,
                                               unsigned int frm, size_t vl);
vuint16m1_t __riscv_vfcvt_xu_f_v_u16m1_rm_mu(vbool16_t vm, vuint16m1_t vd,
                                             vfloat16m1_t vs2, unsigned int frm,
                                             size_t vl);
vuint16m2_t __riscv_vfcvt_xu_f_v_u16m2_rm_mu(vbool8_t vm, vuint16m2_t vd,
                                             vfloat16m2_t vs2, unsigned int frm,
                                             size_t vl);
vuint16m4_t __riscv_vfcvt_xu_f_v_u16m4_rm_mu(vbool4_t vm, vuint16m4_t vd,
                                             vfloat16m4_t vs2, unsigned int frm,
                                             size_t vl);
vuint16m8_t __riscv_vfcvt_xu_f_v_u16m8_rm_mu(vbool2_t vm, vuint16m8_t vd,
                                             vfloat16m8_t vs2, unsigned int frm,
                                             size_t vl);
vfloat16mf4_t __riscv_vfcvt_f_x_v_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                               vint16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfcvt_f_x_v_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                               vint16mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfcvt_f_x_v_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                             vint16m1_t vs2, unsigned int frm,
                                             size_t vl);
vfloat16m2_t __riscv_vfcvt_f_x_v_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                             vint16m2_t vs2, unsigned int frm,
                                             size_t vl);
vfloat16m4_t __riscv_vfcvt_f_x_v_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                             vint16m4_t vs2, unsigned int frm,
                                             size_t vl);
vfloat16m8_t __riscv_vfcvt_f_x_v_f16m8_rm_mu(vbool2_t vm, vfloat16m8_t vd,
                                             vint16m8_t vs2, unsigned int frm,
                                             size_t vl);
vfloat16mf4_t __riscv_vfcvt_f_xu_v_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                                vuint16mf4_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfcvt_f_xu_v_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                                vuint16mf2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfcvt_f_xu_v_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                              vuint16m1_t vs2, unsigned int frm,
                                              size_t vl);
vfloat16m2_t __riscv_vfcvt_f_xu_v_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                              vuint16m2_t vs2, unsigned int frm,
                                              size_t vl);
vfloat16m4_t __riscv_vfcvt_f_xu_v_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                              vuint16m4_t vs2, unsigned int frm,
                                              size_t vl);
vfloat16m8_t __riscv_vfcvt_f_xu_v_f16m8_rm_mu(vbool2_t vm, vfloat16m8_t vd,
                                              vuint16m8_t vs2, unsigned int frm,
                                              size_t vl);
// vfcvt, explicit rounding-mode (`_rm`) form, `_mu` policy suffix, 32-bit
// elements. Four families, each declared for LMUL mf2..m8:
//   x_f  : f32 -> i32      xu_f : f32 -> u32
//   f_x  : i32 -> f32      f_xu : u32 -> f32
// Source and destination always share the same SEW and LMUL.
// Each declaration takes the mask `vm`, a `vd` operand of the return type,
// the source vector `vs2`, `frm` and `vl`.
// The mask type is vboolN_t with N = SEW/LMUL (mf2 -> vbool64_t, ...,
// m8 -> vbool4_t).
vint32mf2_t __riscv_vfcvt_x_f_v_i32mf2_rm_mu(vbool64_t vm, vint32mf2_t vd,
                                             vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vint32m1_t __riscv_vfcvt_x_f_v_i32m1_rm_mu(vbool32_t vm, vint32m1_t vd,
                                           vfloat32m1_t vs2, unsigned int frm,
                                           size_t vl);
vint32m2_t __riscv_vfcvt_x_f_v_i32m2_rm_mu(vbool16_t vm, vint32m2_t vd,
                                           vfloat32m2_t vs2, unsigned int frm,
                                           size_t vl);
vint32m4_t __riscv_vfcvt_x_f_v_i32m4_rm_mu(vbool8_t vm, vint32m4_t vd,
                                           vfloat32m4_t vs2, unsigned int frm,
                                           size_t vl);
vint32m8_t __riscv_vfcvt_x_f_v_i32m8_rm_mu(vbool4_t vm, vint32m8_t vd,
                                           vfloat32m8_t vs2, unsigned int frm,
                                           size_t vl);
vuint32mf2_t __riscv_vfcvt_xu_f_v_u32mf2_rm_mu(vbool64_t vm, vuint32mf2_t vd,
                                               vfloat32mf2_t vs2,
                                               unsigned int frm, size_t vl);
vuint32m1_t __riscv_vfcvt_xu_f_v_u32m1_rm_mu(vbool32_t vm, vuint32m1_t vd,
                                             vfloat32m1_t vs2, unsigned int frm,
                                             size_t vl);
vuint32m2_t __riscv_vfcvt_xu_f_v_u32m2_rm_mu(vbool16_t vm, vuint32m2_t vd,
                                             vfloat32m2_t vs2, unsigned int frm,
                                             size_t vl);
vuint32m4_t __riscv_vfcvt_xu_f_v_u32m4_rm_mu(vbool8_t vm, vuint32m4_t vd,
                                             vfloat32m4_t vs2, unsigned int frm,
                                             size_t vl);
vuint32m8_t __riscv_vfcvt_xu_f_v_u32m8_rm_mu(vbool4_t vm, vuint32m8_t vd,
                                             vfloat32m8_t vs2, unsigned int frm,
                                             size_t vl);
vfloat32mf2_t __riscv_vfcvt_f_x_v_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                               vint32mf2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfcvt_f_x_v_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                             vint32m1_t vs2, unsigned int frm,
                                             size_t vl);
vfloat32m2_t __riscv_vfcvt_f_x_v_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                             vint32m2_t vs2, unsigned int frm,
                                             size_t vl);
vfloat32m4_t __riscv_vfcvt_f_x_v_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                             vint32m4_t vs2, unsigned int frm,
                                             size_t vl);
vfloat32m8_t __riscv_vfcvt_f_x_v_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                             vint32m8_t vs2, unsigned int frm,
                                             size_t vl);
vfloat32mf2_t __riscv_vfcvt_f_xu_v_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                                vuint32mf2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfcvt_f_xu_v_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                              vuint32m1_t vs2, unsigned int frm,
                                              size_t vl);
vfloat32m2_t __riscv_vfcvt_f_xu_v_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                              vuint32m2_t vs2, unsigned int frm,
                                              size_t vl);
vfloat32m4_t __riscv_vfcvt_f_xu_v_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                              vuint32m4_t vs2, unsigned int frm,
                                              size_t vl);
vfloat32m8_t __riscv_vfcvt_f_xu_v_f32m8_rm_mu(vbool4_t vm, vfloat32m8_t vd,
                                              vuint32m8_t vs2, unsigned int frm,
                                              size_t vl);
// vfcvt, explicit rounding-mode (`_rm`) form, `_mu` policy suffix, 64-bit
// elements. Four families, each declared for LMUL m1..m8:
//   x_f  : f64 -> i64      xu_f : f64 -> u64
//   f_x  : i64 -> f64      f_xu : u64 -> f64
// Source and destination always share the same SEW and LMUL.
// Each declaration takes the mask `vm`, a `vd` operand of the return type,
// the source vector `vs2`, `frm` and `vl`.
// The mask type is vboolN_t with N = SEW/LMUL (m1 -> vbool64_t, ...,
// m8 -> vbool8_t).
vint64m1_t __riscv_vfcvt_x_f_v_i64m1_rm_mu(vbool64_t vm, vint64m1_t vd,
                                           vfloat64m1_t vs2, unsigned int frm,
                                           size_t vl);
vint64m2_t __riscv_vfcvt_x_f_v_i64m2_rm_mu(vbool32_t vm, vint64m2_t vd,
                                           vfloat64m2_t vs2, unsigned int frm,
                                           size_t vl);
vint64m4_t __riscv_vfcvt_x_f_v_i64m4_rm_mu(vbool16_t vm, vint64m4_t vd,
                                           vfloat64m4_t vs2, unsigned int frm,
                                           size_t vl);
vint64m8_t __riscv_vfcvt_x_f_v_i64m8_rm_mu(vbool8_t vm, vint64m8_t vd,
                                           vfloat64m8_t vs2, unsigned int frm,
                                           size_t vl);
vuint64m1_t __riscv_vfcvt_xu_f_v_u64m1_rm_mu(vbool64_t vm, vuint64m1_t vd,
                                             vfloat64m1_t vs2, unsigned int frm,
                                             size_t vl);
vuint64m2_t __riscv_vfcvt_xu_f_v_u64m2_rm_mu(vbool32_t vm, vuint64m2_t vd,
                                             vfloat64m2_t vs2, unsigned int frm,
                                             size_t vl);
vuint64m4_t __riscv_vfcvt_xu_f_v_u64m4_rm_mu(vbool16_t vm, vuint64m4_t vd,
                                             vfloat64m4_t vs2, unsigned int frm,
                                             size_t vl);
vuint64m8_t __riscv_vfcvt_xu_f_v_u64m8_rm_mu(vbool8_t vm, vuint64m8_t vd,
                                             vfloat64m8_t vs2, unsigned int frm,
                                             size_t vl);
vfloat64m1_t __riscv_vfcvt_f_x_v_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                             vint64m1_t vs2, unsigned int frm,
                                             size_t vl);
vfloat64m2_t __riscv_vfcvt_f_x_v_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                             vint64m2_t vs2, unsigned int frm,
                                             size_t vl);
vfloat64m4_t __riscv_vfcvt_f_x_v_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                             vint64m4_t vs2, unsigned int frm,
                                             size_t vl);
vfloat64m8_t __riscv_vfcvt_f_x_v_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                             vint64m8_t vs2, unsigned int frm,
                                             size_t vl);
vfloat64m1_t __riscv_vfcvt_f_xu_v_f64m1_rm_mu(vbool64_t vm, vfloat64m1_t vd,
                                              vuint64m1_t vs2, unsigned int frm,
                                              size_t vl);
vfloat64m2_t __riscv_vfcvt_f_xu_v_f64m2_rm_mu(vbool32_t vm, vfloat64m2_t vd,
                                              vuint64m2_t vs2, unsigned int frm,
                                              size_t vl);
vfloat64m4_t __riscv_vfcvt_f_xu_v_f64m4_rm_mu(vbool16_t vm, vfloat64m4_t vd,
                                              vuint64m4_t vs2, unsigned int frm,
                                              size_t vl);
vfloat64m8_t __riscv_vfcvt_f_xu_v_f64m8_rm_mu(vbool8_t vm, vfloat64m8_t vd,
                                              vuint64m8_t vs2, unsigned int frm,
                                              size_t vl);

Widening Floating-Point/Integer Type-Convert Intrinsics

// vfwcvt, unmasked `_tu` policy suffix, 8-bit integer -> f16:
//   f_x  : i8 -> f16       f_xu : u8 -> f16
// Widening: the source `vs2` has half the element width and half the LMUL
// of the result (e.g. vint8mf8_t -> vfloat16mf4_t, vint8m4_t -> vfloat16m8_t).
// Each declaration takes a `vd` operand of the return type, the source `vs2`
// and `vl`; there is no mask and no `frm` argument in these forms.
vfloat16mf4_t __riscv_vfwcvt_f_x_v_f16mf4_tu(vfloat16mf4_t vd, vint8mf8_t vs2,
                                             size_t vl);
vfloat16mf2_t __riscv_vfwcvt_f_x_v_f16mf2_tu(vfloat16mf2_t vd, vint8mf4_t vs2,
                                             size_t vl);
vfloat16m1_t __riscv_vfwcvt_f_x_v_f16m1_tu(vfloat16m1_t vd, vint8mf2_t vs2,
                                           size_t vl);
vfloat16m2_t __riscv_vfwcvt_f_x_v_f16m2_tu(vfloat16m2_t vd, vint8m1_t vs2,
                                           size_t vl);
vfloat16m4_t __riscv_vfwcvt_f_x_v_f16m4_tu(vfloat16m4_t vd, vint8m2_t vs2,
                                           size_t vl);
vfloat16m8_t __riscv_vfwcvt_f_x_v_f16m8_tu(vfloat16m8_t vd, vint8m4_t vs2,
                                           size_t vl);
vfloat16mf4_t __riscv_vfwcvt_f_xu_v_f16mf4_tu(vfloat16mf4_t vd, vuint8mf8_t vs2,
                                              size_t vl);
vfloat16mf2_t __riscv_vfwcvt_f_xu_v_f16mf2_tu(vfloat16mf2_t vd, vuint8mf4_t vs2,
                                              size_t vl);
vfloat16m1_t __riscv_vfwcvt_f_xu_v_f16m1_tu(vfloat16m1_t vd, vuint8mf2_t vs2,
                                            size_t vl);
vfloat16m2_t __riscv_vfwcvt_f_xu_v_f16m2_tu(vfloat16m2_t vd, vuint8m1_t vs2,
                                            size_t vl);
vfloat16m4_t __riscv_vfwcvt_f_xu_v_f16m4_tu(vfloat16m4_t vd, vuint8m2_t vs2,
                                            size_t vl);
vfloat16m8_t __riscv_vfwcvt_f_xu_v_f16m8_tu(vfloat16m8_t vd, vuint8m4_t vs2,
                                            size_t vl);
// vfwcvt, unmasked `_tu` policy suffix, f16 -> 32-bit integer:
//   x_f  : f16 -> i32      xu_f : f16 -> u32
// Each result type is declared twice: a plain form and an `_rtz_` form
// (round-towards-zero conversion per the RVV spec).
// Widening: the source `vs2` has half the element width and half the LMUL
// of the result (e.g. vfloat16mf4_t -> vint32mf2_t, vfloat16m4_t -> vint32m8_t).
// Each declaration takes a `vd` operand of the return type, the source `vs2`
// and `vl`; there is no mask and no `frm` argument in these forms.
vint32mf2_t __riscv_vfwcvt_x_f_v_i32mf2_tu(vint32mf2_t vd, vfloat16mf4_t vs2,
                                           size_t vl);
vint32mf2_t __riscv_vfwcvt_rtz_x_f_v_i32mf2_tu(vint32mf2_t vd,
                                               vfloat16mf4_t vs2, size_t vl);
vint32m1_t __riscv_vfwcvt_x_f_v_i32m1_tu(vint32m1_t vd, vfloat16mf2_t vs2,
                                         size_t vl);
vint32m1_t __riscv_vfwcvt_rtz_x_f_v_i32m1_tu(vint32m1_t vd, vfloat16mf2_t vs2,
                                             size_t vl);
vint32m2_t __riscv_vfwcvt_x_f_v_i32m2_tu(vint32m2_t vd, vfloat16m1_t vs2,
                                         size_t vl);
vint32m2_t __riscv_vfwcvt_rtz_x_f_v_i32m2_tu(vint32m2_t vd, vfloat16m1_t vs2,
                                             size_t vl);
vint32m4_t __riscv_vfwcvt_x_f_v_i32m4_tu(vint32m4_t vd, vfloat16m2_t vs2,
                                         size_t vl);
vint32m4_t __riscv_vfwcvt_rtz_x_f_v_i32m4_tu(vint32m4_t vd, vfloat16m2_t vs2,
                                             size_t vl);
vint32m8_t __riscv_vfwcvt_x_f_v_i32m8_tu(vint32m8_t vd, vfloat16m4_t vs2,
                                         size_t vl);
vint32m8_t __riscv_vfwcvt_rtz_x_f_v_i32m8_tu(vint32m8_t vd, vfloat16m4_t vs2,
                                             size_t vl);
vuint32mf2_t __riscv_vfwcvt_xu_f_v_u32mf2_tu(vuint32mf2_t vd, vfloat16mf4_t vs2,
                                             size_t vl);
vuint32mf2_t __riscv_vfwcvt_rtz_xu_f_v_u32mf2_tu(vuint32mf2_t vd,
                                                 vfloat16mf4_t vs2, size_t vl);
vuint32m1_t __riscv_vfwcvt_xu_f_v_u32m1_tu(vuint32m1_t vd, vfloat16mf2_t vs2,
                                           size_t vl);
vuint32m1_t __riscv_vfwcvt_rtz_xu_f_v_u32m1_tu(vuint32m1_t vd,
                                               vfloat16mf2_t vs2, size_t vl);
vuint32m2_t __riscv_vfwcvt_xu_f_v_u32m2_tu(vuint32m2_t vd, vfloat16m1_t vs2,
                                           size_t vl);
vuint32m2_t __riscv_vfwcvt_rtz_xu_f_v_u32m2_tu(vuint32m2_t vd, vfloat16m1_t vs2,
                                               size_t vl);
vuint32m4_t __riscv_vfwcvt_xu_f_v_u32m4_tu(vuint32m4_t vd, vfloat16m2_t vs2,
                                           size_t vl);
vuint32m4_t __riscv_vfwcvt_rtz_xu_f_v_u32m4_tu(vuint32m4_t vd, vfloat16m2_t vs2,
                                               size_t vl);
vuint32m8_t __riscv_vfwcvt_xu_f_v_u32m8_tu(vuint32m8_t vd, vfloat16m4_t vs2,
                                           size_t vl);
vuint32m8_t __riscv_vfwcvt_rtz_xu_f_v_u32m8_tu(vuint32m8_t vd, vfloat16m4_t vs2,
                                               size_t vl);
// vfwcvt, unmasked `_tu` policy suffix, 16-bit source -> f32:
//   f_x  : i16 -> f32      f_xu : u16 -> f32      f_f : f16 -> f32
// Widening: the source `vs2` has half the element width and half the LMUL
// of the result (e.g. vint16mf4_t -> vfloat32mf2_t, vfloat16m4_t ->
// vfloat32m8_t).
// Each declaration takes a `vd` operand of the return type, the source `vs2`
// and `vl`; there is no mask and no `frm` argument in these forms.
vfloat32mf2_t __riscv_vfwcvt_f_x_v_f32mf2_tu(vfloat32mf2_t vd, vint16mf4_t vs2,
                                             size_t vl);
vfloat32m1_t __riscv_vfwcvt_f_x_v_f32m1_tu(vfloat32m1_t vd, vint16mf2_t vs2,
                                           size_t vl);
vfloat32m2_t __riscv_vfwcvt_f_x_v_f32m2_tu(vfloat32m2_t vd, vint16m1_t vs2,
                                           size_t vl);
vfloat32m4_t __riscv_vfwcvt_f_x_v_f32m4_tu(vfloat32m4_t vd, vint16m2_t vs2,
                                           size_t vl);
vfloat32m8_t __riscv_vfwcvt_f_x_v_f32m8_tu(vfloat32m8_t vd, vint16m4_t vs2,
                                           size_t vl);
vfloat32mf2_t __riscv_vfwcvt_f_xu_v_f32mf2_tu(vfloat32mf2_t vd,
                                              vuint16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwcvt_f_xu_v_f32m1_tu(vfloat32m1_t vd, vuint16mf2_t vs2,
                                            size_t vl);
vfloat32m2_t __riscv_vfwcvt_f_xu_v_f32m2_tu(vfloat32m2_t vd, vuint16m1_t vs2,
                                            size_t vl);
vfloat32m4_t __riscv_vfwcvt_f_xu_v_f32m4_tu(vfloat32m4_t vd, vuint16m2_t vs2,
                                            size_t vl);
vfloat32m8_t __riscv_vfwcvt_f_xu_v_f32m8_tu(vfloat32m8_t vd, vuint16m4_t vs2,
                                            size_t vl);
vfloat32mf2_t __riscv_vfwcvt_f_f_v_f32mf2_tu(vfloat32mf2_t vd,
                                             vfloat16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwcvt_f_f_v_f32m1_tu(vfloat32m1_t vd, vfloat16mf2_t vs2,
                                           size_t vl);
vfloat32m2_t __riscv_vfwcvt_f_f_v_f32m2_tu(vfloat32m2_t vd, vfloat16m1_t vs2,
                                           size_t vl);
vfloat32m4_t __riscv_vfwcvt_f_f_v_f32m4_tu(vfloat32m4_t vd, vfloat16m2_t vs2,
                                           size_t vl);
vfloat32m8_t __riscv_vfwcvt_f_f_v_f32m8_tu(vfloat32m8_t vd, vfloat16m4_t vs2,
                                           size_t vl);
vint64m1_t __riscv_vfwcvt_x_f_v_i64m1_tu(vint64m1_t vd, vfloat32mf2_t vs2,
                                         size_t vl);
vint64m1_t __riscv_vfwcvt_rtz_x_f_v_i64m1_tu(vint64m1_t vd, vfloat32mf2_t vs2,
                                             size_t vl);
vint64m2_t __riscv_vfwcvt_x_f_v_i64m2_tu(vint64m2_t vd, vfloat32m1_t vs2,
                                         size_t vl);
vint64m2_t __riscv_vfwcvt_rtz_x_f_v_i64m2_tu(vint64m2_t vd, vfloat32m1_t vs2,
                                             size_t vl);
vint64m4_t __riscv_vfwcvt_x_f_v_i64m4_tu(vint64m4_t vd, vfloat32m2_t vs2,
                                         size_t vl);
vint64m4_t __riscv_vfwcvt_rtz_x_f_v_i64m4_tu(vint64m4_t vd, vfloat32m2_t vs2,
                                             size_t vl);
vint64m8_t __riscv_vfwcvt_x_f_v_i64m8_tu(vint64m8_t vd, vfloat32m4_t vs2,
                                         size_t vl);
vint64m8_t __riscv_vfwcvt_rtz_x_f_v_i64m8_tu(vint64m8_t vd, vfloat32m4_t vs2,
                                             size_t vl);
vuint64m1_t __riscv_vfwcvt_xu_f_v_u64m1_tu(vuint64m1_t vd, vfloat32mf2_t vs2,
                                           size_t vl);
vuint64m1_t __riscv_vfwcvt_rtz_xu_f_v_u64m1_tu(vuint64m1_t vd,
                                               vfloat32mf2_t vs2, size_t vl);
vuint64m2_t __riscv_vfwcvt_xu_f_v_u64m2_tu(vuint64m2_t vd, vfloat32m1_t vs2,
                                           size_t vl);
vuint64m2_t __riscv_vfwcvt_rtz_xu_f_v_u64m2_tu(vuint64m2_t vd, vfloat32m1_t vs2,
                                               size_t vl);
vuint64m4_t __riscv_vfwcvt_xu_f_v_u64m4_tu(vuint64m4_t vd, vfloat32m2_t vs2,
                                           size_t vl);
vuint64m4_t __riscv_vfwcvt_rtz_xu_f_v_u64m4_tu(vuint64m4_t vd, vfloat32m2_t vs2,
                                               size_t vl);
vuint64m8_t __riscv_vfwcvt_xu_f_v_u64m8_tu(vuint64m8_t vd, vfloat32m4_t vs2,
                                           size_t vl);
vuint64m8_t __riscv_vfwcvt_rtz_xu_f_v_u64m8_tu(vuint64m8_t vd, vfloat32m4_t vs2,
                                               size_t vl);
vfloat64m1_t __riscv_vfwcvt_f_x_v_f64m1_tu(vfloat64m1_t vd, vint32mf2_t vs2,
                                           size_t vl);
vfloat64m2_t __riscv_vfwcvt_f_x_v_f64m2_tu(vfloat64m2_t vd, vint32m1_t vs2,
                                           size_t vl);
vfloat64m4_t __riscv_vfwcvt_f_x_v_f64m4_tu(vfloat64m4_t vd, vint32m2_t vs2,
                                           size_t vl);
vfloat64m8_t __riscv_vfwcvt_f_x_v_f64m8_tu(vfloat64m8_t vd, vint32m4_t vs2,
                                           size_t vl);
vfloat64m1_t __riscv_vfwcvt_f_xu_v_f64m1_tu(vfloat64m1_t vd, vuint32mf2_t vs2,
                                            size_t vl);
vfloat64m2_t __riscv_vfwcvt_f_xu_v_f64m2_tu(vfloat64m2_t vd, vuint32m1_t vs2,
                                            size_t vl);
vfloat64m4_t __riscv_vfwcvt_f_xu_v_f64m4_tu(vfloat64m4_t vd, vuint32m2_t vs2,
                                            size_t vl);
vfloat64m8_t __riscv_vfwcvt_f_xu_v_f64m8_tu(vfloat64m8_t vd, vuint32m4_t vs2,
                                            size_t vl);
vfloat64m1_t __riscv_vfwcvt_f_f_v_f64m1_tu(vfloat64m1_t vd, vfloat32mf2_t vs2,
                                           size_t vl);
vfloat64m2_t __riscv_vfwcvt_f_f_v_f64m2_tu(vfloat64m2_t vd, vfloat32m1_t vs2,
                                           size_t vl);
vfloat64m4_t __riscv_vfwcvt_f_f_v_f64m4_tu(vfloat64m4_t vd, vfloat32m2_t vs2,
                                           size_t vl);
vfloat64m8_t __riscv_vfwcvt_f_f_v_f64m8_tu(vfloat64m8_t vd, vfloat32m4_t vs2,
                                           size_t vl);
// masked functions (_tum: tail undisturbed, mask agnostic)
vfloat16mf4_t __riscv_vfwcvt_f_x_v_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                              vint8mf8_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfwcvt_f_x_v_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                              vint8mf4_t vs2, size_t vl);
vfloat16m1_t __riscv_vfwcvt_f_x_v_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                            vint8mf2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfwcvt_f_x_v_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                            vint8m1_t vs2, size_t vl);
vfloat16m4_t __riscv_vfwcvt_f_x_v_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                            vint8m2_t vs2, size_t vl);
vfloat16m8_t __riscv_vfwcvt_f_x_v_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                            vint8m4_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfwcvt_f_xu_v_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                               vuint8mf8_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfwcvt_f_xu_v_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                               vuint8mf4_t vs2, size_t vl);
vfloat16m1_t __riscv_vfwcvt_f_xu_v_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                             vuint8mf2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfwcvt_f_xu_v_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                             vuint8m1_t vs2, size_t vl);
vfloat16m4_t __riscv_vfwcvt_f_xu_v_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                             vuint8m2_t vs2, size_t vl);
vfloat16m8_t __riscv_vfwcvt_f_xu_v_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                             vuint8m4_t vs2, size_t vl);
vint32mf2_t __riscv_vfwcvt_x_f_v_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                            vfloat16mf4_t vs2, size_t vl);
vint32mf2_t __riscv_vfwcvt_rtz_x_f_v_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                                vfloat16mf4_t vs2, size_t vl);
vint32m1_t __riscv_vfwcvt_x_f_v_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                          vfloat16mf2_t vs2, size_t vl);
vint32m1_t __riscv_vfwcvt_rtz_x_f_v_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                              vfloat16mf2_t vs2, size_t vl);
vint32m2_t __riscv_vfwcvt_x_f_v_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                          vfloat16m1_t vs2, size_t vl);
vint32m2_t __riscv_vfwcvt_rtz_x_f_v_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                              vfloat16m1_t vs2, size_t vl);
vint32m4_t __riscv_vfwcvt_x_f_v_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                          vfloat16m2_t vs2, size_t vl);
vint32m4_t __riscv_vfwcvt_rtz_x_f_v_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                              vfloat16m2_t vs2, size_t vl);
vint32m8_t __riscv_vfwcvt_x_f_v_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                          vfloat16m4_t vs2, size_t vl);
vint32m8_t __riscv_vfwcvt_rtz_x_f_v_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                              vfloat16m4_t vs2, size_t vl);
vuint32mf2_t __riscv_vfwcvt_xu_f_v_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                              vfloat16mf4_t vs2, size_t vl);
vuint32mf2_t __riscv_vfwcvt_rtz_xu_f_v_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                                  vfloat16mf4_t vs2, size_t vl);
vuint32m1_t __riscv_vfwcvt_xu_f_v_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                            vfloat16mf2_t vs2, size_t vl);
vuint32m1_t __riscv_vfwcvt_rtz_xu_f_v_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                                vfloat16mf2_t vs2, size_t vl);
vuint32m2_t __riscv_vfwcvt_xu_f_v_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                            vfloat16m1_t vs2, size_t vl);
vuint32m2_t __riscv_vfwcvt_rtz_xu_f_v_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                                vfloat16m1_t vs2, size_t vl);
vuint32m4_t __riscv_vfwcvt_xu_f_v_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                            vfloat16m2_t vs2, size_t vl);
vuint32m4_t __riscv_vfwcvt_rtz_xu_f_v_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                                vfloat16m2_t vs2, size_t vl);
vuint32m8_t __riscv_vfwcvt_xu_f_v_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                            vfloat16m4_t vs2, size_t vl);
vuint32m8_t __riscv_vfwcvt_rtz_xu_f_v_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                                vfloat16m4_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfwcvt_f_x_v_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                              vint16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwcvt_f_x_v_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                            vint16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwcvt_f_x_v_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                            vint16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwcvt_f_x_v_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                            vint16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwcvt_f_x_v_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                            vint16m4_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfwcvt_f_xu_v_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                               vuint16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwcvt_f_xu_v_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                             vuint16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwcvt_f_xu_v_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                             vuint16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwcvt_f_xu_v_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                             vuint16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwcvt_f_xu_v_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                             vuint16m4_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfwcvt_f_f_v_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwcvt_f_f_v_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwcvt_f_f_v_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwcvt_f_f_v_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwcvt_f_f_v_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat16m4_t vs2, size_t vl);
vint64m1_t __riscv_vfwcvt_x_f_v_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                          vfloat32mf2_t vs2, size_t vl);
vint64m1_t __riscv_vfwcvt_rtz_x_f_v_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                              vfloat32mf2_t vs2, size_t vl);
vint64m2_t __riscv_vfwcvt_x_f_v_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                          vfloat32m1_t vs2, size_t vl);
vint64m2_t __riscv_vfwcvt_rtz_x_f_v_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                              vfloat32m1_t vs2, size_t vl);
vint64m4_t __riscv_vfwcvt_x_f_v_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                          vfloat32m2_t vs2, size_t vl);
vint64m4_t __riscv_vfwcvt_rtz_x_f_v_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                              vfloat32m2_t vs2, size_t vl);
vint64m8_t __riscv_vfwcvt_x_f_v_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                          vfloat32m4_t vs2, size_t vl);
vint64m8_t __riscv_vfwcvt_rtz_x_f_v_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                              vfloat32m4_t vs2, size_t vl);
vuint64m1_t __riscv_vfwcvt_xu_f_v_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                            vfloat32mf2_t vs2, size_t vl);
vuint64m1_t __riscv_vfwcvt_rtz_xu_f_v_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                                vfloat32mf2_t vs2, size_t vl);
vuint64m2_t __riscv_vfwcvt_xu_f_v_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                            vfloat32m1_t vs2, size_t vl);
vuint64m2_t __riscv_vfwcvt_rtz_xu_f_v_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                                vfloat32m1_t vs2, size_t vl);
vuint64m4_t __riscv_vfwcvt_xu_f_v_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                            vfloat32m2_t vs2, size_t vl);
vuint64m4_t __riscv_vfwcvt_rtz_xu_f_v_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                                vfloat32m2_t vs2, size_t vl);
vuint64m8_t __riscv_vfwcvt_xu_f_v_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                            vfloat32m4_t vs2, size_t vl);
vuint64m8_t __riscv_vfwcvt_rtz_xu_f_v_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                                vfloat32m4_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwcvt_f_x_v_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                            vint32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwcvt_f_x_v_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                            vint32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwcvt_f_x_v_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                            vint32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwcvt_f_x_v_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                            vint32m4_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwcvt_f_xu_v_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                             vuint32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwcvt_f_xu_v_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                             vuint32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwcvt_f_xu_v_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                             vuint32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwcvt_f_xu_v_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                             vuint32m4_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwcvt_f_f_v_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwcvt_f_f_v_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwcvt_f_f_v_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwcvt_f_f_v_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat32m4_t vs2, size_t vl);
// masked functions (_tumu: tail undisturbed, mask undisturbed)
vfloat16mf4_t __riscv_vfwcvt_f_x_v_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                               vint8mf8_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfwcvt_f_x_v_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                               vint8mf4_t vs2, size_t vl);
vfloat16m1_t __riscv_vfwcvt_f_x_v_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                             vint8mf2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfwcvt_f_x_v_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                             vint8m1_t vs2, size_t vl);
vfloat16m4_t __riscv_vfwcvt_f_x_v_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                             vint8m2_t vs2, size_t vl);
vfloat16m8_t __riscv_vfwcvt_f_x_v_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                             vint8m4_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfwcvt_f_xu_v_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                                vuint8mf8_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfwcvt_f_xu_v_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                                vuint8mf4_t vs2, size_t vl);
vfloat16m1_t __riscv_vfwcvt_f_xu_v_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                              vuint8mf2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfwcvt_f_xu_v_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                              vuint8m1_t vs2, size_t vl);
vfloat16m4_t __riscv_vfwcvt_f_xu_v_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                              vuint8m2_t vs2, size_t vl);
vfloat16m8_t __riscv_vfwcvt_f_xu_v_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                              vuint8m4_t vs2, size_t vl);
vint32mf2_t __riscv_vfwcvt_x_f_v_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                             vfloat16mf4_t vs2, size_t vl);
vint32mf2_t __riscv_vfwcvt_rtz_x_f_v_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                                 vfloat16mf4_t vs2, size_t vl);
vint32m1_t __riscv_vfwcvt_x_f_v_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                           vfloat16mf2_t vs2, size_t vl);
vint32m1_t __riscv_vfwcvt_rtz_x_f_v_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                               vfloat16mf2_t vs2, size_t vl);
vint32m2_t __riscv_vfwcvt_x_f_v_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                           vfloat16m1_t vs2, size_t vl);
vint32m2_t __riscv_vfwcvt_rtz_x_f_v_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                               vfloat16m1_t vs2, size_t vl);
vint32m4_t __riscv_vfwcvt_x_f_v_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                           vfloat16m2_t vs2, size_t vl);
vint32m4_t __riscv_vfwcvt_rtz_x_f_v_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                               vfloat16m2_t vs2, size_t vl);
vint32m8_t __riscv_vfwcvt_x_f_v_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                           vfloat16m4_t vs2, size_t vl);
vint32m8_t __riscv_vfwcvt_rtz_x_f_v_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                               vfloat16m4_t vs2, size_t vl);
vuint32mf2_t __riscv_vfwcvt_xu_f_v_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                               vfloat16mf4_t vs2, size_t vl);
vuint32mf2_t __riscv_vfwcvt_rtz_xu_f_v_u32mf2_tumu(vbool64_t vm,
                                                   vuint32mf2_t vd,
                                                   vfloat16mf4_t vs2,
                                                   size_t vl);
vuint32m1_t __riscv_vfwcvt_xu_f_v_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                             vfloat16mf2_t vs2, size_t vl);
vuint32m1_t __riscv_vfwcvt_rtz_xu_f_v_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                                 vfloat16mf2_t vs2, size_t vl);
vuint32m2_t __riscv_vfwcvt_xu_f_v_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                             vfloat16m1_t vs2, size_t vl);
vuint32m2_t __riscv_vfwcvt_rtz_xu_f_v_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                                 vfloat16m1_t vs2, size_t vl);
vuint32m4_t __riscv_vfwcvt_xu_f_v_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                             vfloat16m2_t vs2, size_t vl);
vuint32m4_t __riscv_vfwcvt_rtz_xu_f_v_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                                 vfloat16m2_t vs2, size_t vl);
vuint32m8_t __riscv_vfwcvt_xu_f_v_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                             vfloat16m4_t vs2, size_t vl);
vuint32m8_t __riscv_vfwcvt_rtz_xu_f_v_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                                 vfloat16m4_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfwcvt_f_x_v_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                               vint16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwcvt_f_x_v_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                             vint16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwcvt_f_x_v_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                             vint16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwcvt_f_x_v_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                             vint16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwcvt_f_x_v_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                             vint16m4_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfwcvt_f_xu_v_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                                vuint16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwcvt_f_xu_v_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                              vuint16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwcvt_f_xu_v_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                              vuint16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwcvt_f_xu_v_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                              vuint16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwcvt_f_xu_v_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                              vuint16m4_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfwcvt_f_f_v_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                               vfloat16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwcvt_f_f_v_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                             vfloat16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwcvt_f_f_v_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                             vfloat16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwcvt_f_f_v_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                             vfloat16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwcvt_f_f_v_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                             vfloat16m4_t vs2, size_t vl);
vint64m1_t __riscv_vfwcvt_x_f_v_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                           vfloat32mf2_t vs2, size_t vl);
vint64m1_t __riscv_vfwcvt_rtz_x_f_v_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                               vfloat32mf2_t vs2, size_t vl);
vint64m2_t __riscv_vfwcvt_x_f_v_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                           vfloat32m1_t vs2, size_t vl);
vint64m2_t __riscv_vfwcvt_rtz_x_f_v_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                               vfloat32m1_t vs2, size_t vl);
vint64m4_t __riscv_vfwcvt_x_f_v_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                           vfloat32m2_t vs2, size_t vl);
vint64m4_t __riscv_vfwcvt_rtz_x_f_v_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                               vfloat32m2_t vs2, size_t vl);
vint64m8_t __riscv_vfwcvt_x_f_v_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                           vfloat32m4_t vs2, size_t vl);
vint64m8_t __riscv_vfwcvt_rtz_x_f_v_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                               vfloat32m4_t vs2, size_t vl);
vuint64m1_t __riscv_vfwcvt_xu_f_v_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                             vfloat32mf2_t vs2, size_t vl);
vuint64m1_t __riscv_vfwcvt_rtz_xu_f_v_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                                 vfloat32mf2_t vs2, size_t vl);
vuint64m2_t __riscv_vfwcvt_xu_f_v_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                             vfloat32m1_t vs2, size_t vl);
vuint64m2_t __riscv_vfwcvt_rtz_xu_f_v_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                                 vfloat32m1_t vs2, size_t vl);
vuint64m4_t __riscv_vfwcvt_xu_f_v_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                             vfloat32m2_t vs2, size_t vl);
vuint64m4_t __riscv_vfwcvt_rtz_xu_f_v_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                                 vfloat32m2_t vs2, size_t vl);
vuint64m8_t __riscv_vfwcvt_xu_f_v_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                             vfloat32m4_t vs2, size_t vl);
vuint64m8_t __riscv_vfwcvt_rtz_xu_f_v_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                                 vfloat32m4_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwcvt_f_x_v_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                             vint32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwcvt_f_x_v_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                             vint32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwcvt_f_x_v_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                             vint32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwcvt_f_x_v_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                             vint32m4_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwcvt_f_xu_v_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                              vuint32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwcvt_f_xu_v_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                              vuint32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwcvt_f_xu_v_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                              vuint32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwcvt_f_xu_v_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                              vuint32m4_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwcvt_f_f_v_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                             vfloat32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwcvt_f_f_v_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                             vfloat32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwcvt_f_f_v_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                             vfloat32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwcvt_f_f_v_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                             vfloat32m4_t vs2, size_t vl);
// masked functions, _mu suffix (leading vm mask argument)
vfloat16mf4_t __riscv_vfwcvt_f_x_v_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                             vint8mf8_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfwcvt_f_x_v_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                             vint8mf4_t vs2, size_t vl);
vfloat16m1_t __riscv_vfwcvt_f_x_v_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                           vint8mf2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfwcvt_f_x_v_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                           vint8m1_t vs2, size_t vl);
vfloat16m4_t __riscv_vfwcvt_f_x_v_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                           vint8m2_t vs2, size_t vl);
vfloat16m8_t __riscv_vfwcvt_f_x_v_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                           vint8m4_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfwcvt_f_xu_v_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                              vuint8mf8_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfwcvt_f_xu_v_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                              vuint8mf4_t vs2, size_t vl);
vfloat16m1_t __riscv_vfwcvt_f_xu_v_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                            vuint8mf2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfwcvt_f_xu_v_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                            vuint8m1_t vs2, size_t vl);
vfloat16m4_t __riscv_vfwcvt_f_xu_v_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                            vuint8m2_t vs2, size_t vl);
vfloat16m8_t __riscv_vfwcvt_f_xu_v_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                            vuint8m4_t vs2, size_t vl);
vint32mf2_t __riscv_vfwcvt_x_f_v_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                           vfloat16mf4_t vs2, size_t vl);
vint32mf2_t __riscv_vfwcvt_rtz_x_f_v_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                               vfloat16mf4_t vs2, size_t vl);
vint32m1_t __riscv_vfwcvt_x_f_v_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                         vfloat16mf2_t vs2, size_t vl);
vint32m1_t __riscv_vfwcvt_rtz_x_f_v_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                             vfloat16mf2_t vs2, size_t vl);
vint32m2_t __riscv_vfwcvt_x_f_v_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                         vfloat16m1_t vs2, size_t vl);
vint32m2_t __riscv_vfwcvt_rtz_x_f_v_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                             vfloat16m1_t vs2, size_t vl);
vint32m4_t __riscv_vfwcvt_x_f_v_i32m4_mu(vbool8_t vm, vint32m4_t vd,
                                         vfloat16m2_t vs2, size_t vl);
vint32m4_t __riscv_vfwcvt_rtz_x_f_v_i32m4_mu(vbool8_t vm, vint32m4_t vd,
                                             vfloat16m2_t vs2, size_t vl);
vint32m8_t __riscv_vfwcvt_x_f_v_i32m8_mu(vbool4_t vm, vint32m8_t vd,
                                         vfloat16m4_t vs2, size_t vl);
vint32m8_t __riscv_vfwcvt_rtz_x_f_v_i32m8_mu(vbool4_t vm, vint32m8_t vd,
                                             vfloat16m4_t vs2, size_t vl);
vuint32mf2_t __riscv_vfwcvt_xu_f_v_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                             vfloat16mf4_t vs2, size_t vl);
vuint32mf2_t __riscv_vfwcvt_rtz_xu_f_v_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                                 vfloat16mf4_t vs2, size_t vl);
vuint32m1_t __riscv_vfwcvt_xu_f_v_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                           vfloat16mf2_t vs2, size_t vl);
vuint32m1_t __riscv_vfwcvt_rtz_xu_f_v_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                               vfloat16mf2_t vs2, size_t vl);
vuint32m2_t __riscv_vfwcvt_xu_f_v_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                           vfloat16m1_t vs2, size_t vl);
vuint32m2_t __riscv_vfwcvt_rtz_xu_f_v_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                               vfloat16m1_t vs2, size_t vl);
vuint32m4_t __riscv_vfwcvt_xu_f_v_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                           vfloat16m2_t vs2, size_t vl);
vuint32m4_t __riscv_vfwcvt_rtz_xu_f_v_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                               vfloat16m2_t vs2, size_t vl);
vuint32m8_t __riscv_vfwcvt_xu_f_v_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                           vfloat16m4_t vs2, size_t vl);
vuint32m8_t __riscv_vfwcvt_rtz_xu_f_v_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                               vfloat16m4_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfwcvt_f_x_v_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                             vint16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwcvt_f_x_v_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                           vint16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwcvt_f_x_v_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                           vint16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwcvt_f_x_v_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                           vint16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwcvt_f_x_v_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                           vint16m4_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfwcvt_f_xu_v_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                              vuint16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwcvt_f_xu_v_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                            vuint16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwcvt_f_xu_v_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                            vuint16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwcvt_f_xu_v_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                            vuint16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwcvt_f_xu_v_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                            vuint16m4_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfwcvt_f_f_v_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwcvt_f_f_v_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwcvt_f_f_v_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwcvt_f_f_v_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwcvt_f_f_v_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat16m4_t vs2, size_t vl);
vint64m1_t __riscv_vfwcvt_x_f_v_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                         vfloat32mf2_t vs2, size_t vl);
vint64m1_t __riscv_vfwcvt_rtz_x_f_v_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                             vfloat32mf2_t vs2, size_t vl);
vint64m2_t __riscv_vfwcvt_x_f_v_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                         vfloat32m1_t vs2, size_t vl);
vint64m2_t __riscv_vfwcvt_rtz_x_f_v_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                             vfloat32m1_t vs2, size_t vl);
vint64m4_t __riscv_vfwcvt_x_f_v_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                         vfloat32m2_t vs2, size_t vl);
vint64m4_t __riscv_vfwcvt_rtz_x_f_v_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                             vfloat32m2_t vs2, size_t vl);
vint64m8_t __riscv_vfwcvt_x_f_v_i64m8_mu(vbool8_t vm, vint64m8_t vd,
                                         vfloat32m4_t vs2, size_t vl);
vint64m8_t __riscv_vfwcvt_rtz_x_f_v_i64m8_mu(vbool8_t vm, vint64m8_t vd,
                                             vfloat32m4_t vs2, size_t vl);
vuint64m1_t __riscv_vfwcvt_xu_f_v_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                           vfloat32mf2_t vs2, size_t vl);
vuint64m1_t __riscv_vfwcvt_rtz_xu_f_v_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                               vfloat32mf2_t vs2, size_t vl);
vuint64m2_t __riscv_vfwcvt_xu_f_v_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                           vfloat32m1_t vs2, size_t vl);
vuint64m2_t __riscv_vfwcvt_rtz_xu_f_v_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                               vfloat32m1_t vs2, size_t vl);
vuint64m4_t __riscv_vfwcvt_xu_f_v_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                           vfloat32m2_t vs2, size_t vl);
vuint64m4_t __riscv_vfwcvt_rtz_xu_f_v_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                               vfloat32m2_t vs2, size_t vl);
vuint64m8_t __riscv_vfwcvt_xu_f_v_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                           vfloat32m4_t vs2, size_t vl);
vuint64m8_t __riscv_vfwcvt_rtz_xu_f_v_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                               vfloat32m4_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwcvt_f_x_v_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                           vint32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwcvt_f_x_v_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                           vint32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwcvt_f_x_v_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                           vint32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwcvt_f_x_v_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                           vint32m4_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwcvt_f_xu_v_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                            vuint32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwcvt_f_xu_v_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                            vuint32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwcvt_f_xu_v_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                            vuint32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwcvt_f_xu_v_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                            vuint32m4_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwcvt_f_f_v_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwcvt_f_f_v_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwcvt_f_f_v_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwcvt_f_f_v_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat32m4_t vs2, size_t vl);
// unmasked functions, _rm_tu suffix (no vm mask argument, explicit frm argument)
// NOTE(review): frm presumably selects the floating-point rounding mode for
// the conversion -- confirm against the intrinsics specification.
vint32mf2_t __riscv_vfwcvt_x_f_v_i32mf2_rm_tu(vint32mf2_t vd, vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vint32m1_t __riscv_vfwcvt_x_f_v_i32m1_rm_tu(vint32m1_t vd, vfloat16mf2_t vs2,
                                            unsigned int frm, size_t vl);
vint32m2_t __riscv_vfwcvt_x_f_v_i32m2_rm_tu(vint32m2_t vd, vfloat16m1_t vs2,
                                            unsigned int frm, size_t vl);
vint32m4_t __riscv_vfwcvt_x_f_v_i32m4_rm_tu(vint32m4_t vd, vfloat16m2_t vs2,
                                            unsigned int frm, size_t vl);
vint32m8_t __riscv_vfwcvt_x_f_v_i32m8_rm_tu(vint32m8_t vd, vfloat16m4_t vs2,
                                            unsigned int frm, size_t vl);
vuint32mf2_t __riscv_vfwcvt_xu_f_v_u32mf2_rm_tu(vuint32mf2_t vd,
                                                vfloat16mf4_t vs2,
                                                unsigned int frm, size_t vl);
vuint32m1_t __riscv_vfwcvt_xu_f_v_u32m1_rm_tu(vuint32m1_t vd, vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vuint32m2_t __riscv_vfwcvt_xu_f_v_u32m2_rm_tu(vuint32m2_t vd, vfloat16m1_t vs2,
                                              unsigned int frm, size_t vl);
vuint32m4_t __riscv_vfwcvt_xu_f_v_u32m4_rm_tu(vuint32m4_t vd, vfloat16m2_t vs2,
                                              unsigned int frm, size_t vl);
vuint32m8_t __riscv_vfwcvt_xu_f_v_u32m8_rm_tu(vuint32m8_t vd, vfloat16m4_t vs2,
                                              unsigned int frm, size_t vl);
vint64m1_t __riscv_vfwcvt_x_f_v_i64m1_rm_tu(vint64m1_t vd, vfloat32mf2_t vs2,
                                            unsigned int frm, size_t vl);
vint64m2_t __riscv_vfwcvt_x_f_v_i64m2_rm_tu(vint64m2_t vd, vfloat32m1_t vs2,
                                            unsigned int frm, size_t vl);
vint64m4_t __riscv_vfwcvt_x_f_v_i64m4_rm_tu(vint64m4_t vd, vfloat32m2_t vs2,
                                            unsigned int frm, size_t vl);
vint64m8_t __riscv_vfwcvt_x_f_v_i64m8_rm_tu(vint64m8_t vd, vfloat32m4_t vs2,
                                            unsigned int frm, size_t vl);
vuint64m1_t __riscv_vfwcvt_xu_f_v_u64m1_rm_tu(vuint64m1_t vd, vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vuint64m2_t __riscv_vfwcvt_xu_f_v_u64m2_rm_tu(vuint64m2_t vd, vfloat32m1_t vs2,
                                              unsigned int frm, size_t vl);
vuint64m4_t __riscv_vfwcvt_xu_f_v_u64m4_rm_tu(vuint64m4_t vd, vfloat32m2_t vs2,
                                              unsigned int frm, size_t vl);
vuint64m8_t __riscv_vfwcvt_xu_f_v_u64m8_rm_tu(vuint64m8_t vd, vfloat32m4_t vs2,
                                              unsigned int frm, size_t vl);
// masked functions, _rm_tum suffix (leading vm mask argument, explicit frm argument)
vint32mf2_t __riscv_vfwcvt_x_f_v_i32mf2_rm_tum(vbool64_t vm, vint32mf2_t vd,
                                               vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vint32m1_t __riscv_vfwcvt_x_f_v_i32m1_rm_tum(vbool32_t vm, vint32m1_t vd,
                                             vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vint32m2_t __riscv_vfwcvt_x_f_v_i32m2_rm_tum(vbool16_t vm, vint32m2_t vd,
                                             vfloat16m1_t vs2, unsigned int frm,
                                             size_t vl);
vint32m4_t __riscv_vfwcvt_x_f_v_i32m4_rm_tum(vbool8_t vm, vint32m4_t vd,
                                             vfloat16m2_t vs2, unsigned int frm,
                                             size_t vl);
vint32m8_t __riscv_vfwcvt_x_f_v_i32m8_rm_tum(vbool4_t vm, vint32m8_t vd,
                                             vfloat16m4_t vs2, unsigned int frm,
                                             size_t vl);
vuint32mf2_t __riscv_vfwcvt_xu_f_v_u32mf2_rm_tum(vbool64_t vm, vuint32mf2_t vd,
                                                 vfloat16mf4_t vs2,
                                                 unsigned int frm, size_t vl);
vuint32m1_t __riscv_vfwcvt_xu_f_v_u32m1_rm_tum(vbool32_t vm, vuint32m1_t vd,
                                               vfloat16mf2_t vs2,
                                               unsigned int frm, size_t vl);
vuint32m2_t __riscv_vfwcvt_xu_f_v_u32m2_rm_tum(vbool16_t vm, vuint32m2_t vd,
                                               vfloat16m1_t vs2,
                                               unsigned int frm, size_t vl);
vuint32m4_t __riscv_vfwcvt_xu_f_v_u32m4_rm_tum(vbool8_t vm, vuint32m4_t vd,
                                               vfloat16m2_t vs2,
                                               unsigned int frm, size_t vl);
vuint32m8_t __riscv_vfwcvt_xu_f_v_u32m8_rm_tum(vbool4_t vm, vuint32m8_t vd,
                                               vfloat16m4_t vs2,
                                               unsigned int frm, size_t vl);
vint64m1_t __riscv_vfwcvt_x_f_v_i64m1_rm_tum(vbool64_t vm, vint64m1_t vd,
                                             vfloat32mf2_t vs2,
                                             unsigned int frm, size_t vl);
vint64m2_t __riscv_vfwcvt_x_f_v_i64m2_rm_tum(vbool32_t vm, vint64m2_t vd,
                                             vfloat32m1_t vs2, unsigned int frm,
                                             size_t vl);
vint64m4_t __riscv_vfwcvt_x_f_v_i64m4_rm_tum(vbool16_t vm, vint64m4_t vd,
                                             vfloat32m2_t vs2, unsigned int frm,
                                             size_t vl);
vint64m8_t __riscv_vfwcvt_x_f_v_i64m8_rm_tum(vbool8_t vm, vint64m8_t vd,
                                             vfloat32m4_t vs2, unsigned int frm,
                                             size_t vl);
vuint64m1_t __riscv_vfwcvt_xu_f_v_u64m1_rm_tum(vbool64_t vm, vuint64m1_t vd,
                                               vfloat32mf2_t vs2,
                                               unsigned int frm, size_t vl);
vuint64m2_t __riscv_vfwcvt_xu_f_v_u64m2_rm_tum(vbool32_t vm, vuint64m2_t vd,
                                               vfloat32m1_t vs2,
                                               unsigned int frm, size_t vl);
vuint64m4_t __riscv_vfwcvt_xu_f_v_u64m4_rm_tum(vbool16_t vm, vuint64m4_t vd,
                                               vfloat32m2_t vs2,
                                               unsigned int frm, size_t vl);
vuint64m8_t __riscv_vfwcvt_xu_f_v_u64m8_rm_tum(vbool8_t vm, vuint64m8_t vd,
                                               vfloat32m4_t vs2,
                                               unsigned int frm, size_t vl);
// masked functions, _rm_tumu suffix (leading vm mask argument, explicit frm argument)
vint32mf2_t __riscv_vfwcvt_x_f_v_i32mf2_rm_tumu(vbool64_t vm, vint32mf2_t vd,
                                                vfloat16mf4_t vs2,
                                                unsigned int frm, size_t vl);
vint32m1_t __riscv_vfwcvt_x_f_v_i32m1_rm_tumu(vbool32_t vm, vint32m1_t vd,
                                              vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vint32m2_t __riscv_vfwcvt_x_f_v_i32m2_rm_tumu(vbool16_t vm, vint32m2_t vd,
                                              vfloat16m1_t vs2,
                                              unsigned int frm, size_t vl);
vint32m4_t __riscv_vfwcvt_x_f_v_i32m4_rm_tumu(vbool8_t vm, vint32m4_t vd,
                                              vfloat16m2_t vs2,
                                              unsigned int frm, size_t vl);
vint32m8_t __riscv_vfwcvt_x_f_v_i32m8_rm_tumu(vbool4_t vm, vint32m8_t vd,
                                              vfloat16m4_t vs2,
                                              unsigned int frm, size_t vl);
vuint32mf2_t __riscv_vfwcvt_xu_f_v_u32mf2_rm_tumu(vbool64_t vm, vuint32mf2_t vd,
                                                  vfloat16mf4_t vs2,
                                                  unsigned int frm, size_t vl);
vuint32m1_t __riscv_vfwcvt_xu_f_v_u32m1_rm_tumu(vbool32_t vm, vuint32m1_t vd,
                                                vfloat16mf2_t vs2,
                                                unsigned int frm, size_t vl);
vuint32m2_t __riscv_vfwcvt_xu_f_v_u32m2_rm_tumu(vbool16_t vm, vuint32m2_t vd,
                                                vfloat16m1_t vs2,
                                                unsigned int frm, size_t vl);
vuint32m4_t __riscv_vfwcvt_xu_f_v_u32m4_rm_tumu(vbool8_t vm, vuint32m4_t vd,
                                                vfloat16m2_t vs2,
                                                unsigned int frm, size_t vl);
vuint32m8_t __riscv_vfwcvt_xu_f_v_u32m8_rm_tumu(vbool4_t vm, vuint32m8_t vd,
                                                vfloat16m4_t vs2,
                                                unsigned int frm, size_t vl);
vint64m1_t __riscv_vfwcvt_x_f_v_i64m1_rm_tumu(vbool64_t vm, vint64m1_t vd,
                                              vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vint64m2_t __riscv_vfwcvt_x_f_v_i64m2_rm_tumu(vbool32_t vm, vint64m2_t vd,
                                              vfloat32m1_t vs2,
                                              unsigned int frm, size_t vl);
vint64m4_t __riscv_vfwcvt_x_f_v_i64m4_rm_tumu(vbool16_t vm, vint64m4_t vd,
                                              vfloat32m2_t vs2,
                                              unsigned int frm, size_t vl);
vint64m8_t __riscv_vfwcvt_x_f_v_i64m8_rm_tumu(vbool8_t vm, vint64m8_t vd,
                                              vfloat32m4_t vs2,
                                              unsigned int frm, size_t vl);
vuint64m1_t __riscv_vfwcvt_xu_f_v_u64m1_rm_tumu(vbool64_t vm, vuint64m1_t vd,
                                                vfloat32mf2_t vs2,
                                                unsigned int frm, size_t vl);
vuint64m2_t __riscv_vfwcvt_xu_f_v_u64m2_rm_tumu(vbool32_t vm, vuint64m2_t vd,
                                                vfloat32m1_t vs2,
                                                unsigned int frm, size_t vl);
vuint64m4_t __riscv_vfwcvt_xu_f_v_u64m4_rm_tumu(vbool16_t vm, vuint64m4_t vd,
                                                vfloat32m2_t vs2,
                                                unsigned int frm, size_t vl);
vuint64m8_t __riscv_vfwcvt_xu_f_v_u64m8_rm_tumu(vbool8_t vm, vuint64m8_t vd,
                                                vfloat32m4_t vs2,
                                                unsigned int frm, size_t vl);
// masked functions, _rm_mu suffix (leading vm mask argument, explicit frm argument)
vint32mf2_t __riscv_vfwcvt_x_f_v_i32mf2_rm_mu(vbool64_t vm, vint32mf2_t vd,
                                              vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vint32m1_t __riscv_vfwcvt_x_f_v_i32m1_rm_mu(vbool32_t vm, vint32m1_t vd,
                                            vfloat16mf2_t vs2, unsigned int frm,
                                            size_t vl);
vint32m2_t __riscv_vfwcvt_x_f_v_i32m2_rm_mu(vbool16_t vm, vint32m2_t vd,
                                            vfloat16m1_t vs2, unsigned int frm,
                                            size_t vl);
vint32m4_t __riscv_vfwcvt_x_f_v_i32m4_rm_mu(vbool8_t vm, vint32m4_t vd,
                                            vfloat16m2_t vs2, unsigned int frm,
                                            size_t vl);
vint32m8_t __riscv_vfwcvt_x_f_v_i32m8_rm_mu(vbool4_t vm, vint32m8_t vd,
                                            vfloat16m4_t vs2, unsigned int frm,
                                            size_t vl);
vuint32mf2_t __riscv_vfwcvt_xu_f_v_u32mf2_rm_mu(vbool64_t vm, vuint32mf2_t vd,
                                                vfloat16mf4_t vs2,
                                                unsigned int frm, size_t vl);
vuint32m1_t __riscv_vfwcvt_xu_f_v_u32m1_rm_mu(vbool32_t vm, vuint32m1_t vd,
                                              vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vuint32m2_t __riscv_vfwcvt_xu_f_v_u32m2_rm_mu(vbool16_t vm, vuint32m2_t vd,
                                              vfloat16m1_t vs2,
                                              unsigned int frm, size_t vl);
vuint32m4_t __riscv_vfwcvt_xu_f_v_u32m4_rm_mu(vbool8_t vm, vuint32m4_t vd,
                                              vfloat16m2_t vs2,
                                              unsigned int frm, size_t vl);
vuint32m8_t __riscv_vfwcvt_xu_f_v_u32m8_rm_mu(vbool4_t vm, vuint32m8_t vd,
                                              vfloat16m4_t vs2,
                                              unsigned int frm, size_t vl);
vint64m1_t __riscv_vfwcvt_x_f_v_i64m1_rm_mu(vbool64_t vm, vint64m1_t vd,
                                            vfloat32mf2_t vs2, unsigned int frm,
                                            size_t vl);
vint64m2_t __riscv_vfwcvt_x_f_v_i64m2_rm_mu(vbool32_t vm, vint64m2_t vd,
                                            vfloat32m1_t vs2, unsigned int frm,
                                            size_t vl);
vint64m4_t __riscv_vfwcvt_x_f_v_i64m4_rm_mu(vbool16_t vm, vint64m4_t vd,
                                            vfloat32m2_t vs2, unsigned int frm,
                                            size_t vl);
vint64m8_t __riscv_vfwcvt_x_f_v_i64m8_rm_mu(vbool8_t vm, vint64m8_t vd,
                                            vfloat32m4_t vs2, unsigned int frm,
                                            size_t vl);
vuint64m1_t __riscv_vfwcvt_xu_f_v_u64m1_rm_mu(vbool64_t vm, vuint64m1_t vd,
                                              vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vuint64m2_t __riscv_vfwcvt_xu_f_v_u64m2_rm_mu(vbool32_t vm, vuint64m2_t vd,
                                              vfloat32m1_t vs2,
                                              unsigned int frm, size_t vl);
vuint64m4_t __riscv_vfwcvt_xu_f_v_u64m4_rm_mu(vbool16_t vm, vuint64m4_t vd,
                                              vfloat32m2_t vs2,
                                              unsigned int frm, size_t vl);
vuint64m8_t __riscv_vfwcvt_xu_f_v_u64m8_rm_mu(vbool8_t vm, vuint64m8_t vd,
                                              vfloat32m4_t vs2,
                                              unsigned int frm, size_t vl);

Narrowing Floating-Point/Integer Type-Convert Intrinsics

vint8mf8_t __riscv_vfncvt_x_f_w_i8mf8_tu(vint8mf8_t vd, vfloat16mf4_t vs2,
                                         size_t vl);
vint8mf8_t __riscv_vfncvt_rtz_x_f_w_i8mf8_tu(vint8mf8_t vd, vfloat16mf4_t vs2,
                                             size_t vl);
vint8mf4_t __riscv_vfncvt_x_f_w_i8mf4_tu(vint8mf4_t vd, vfloat16mf2_t vs2,
                                         size_t vl);
vint8mf4_t __riscv_vfncvt_rtz_x_f_w_i8mf4_tu(vint8mf4_t vd, vfloat16mf2_t vs2,
                                             size_t vl);
vint8mf2_t __riscv_vfncvt_x_f_w_i8mf2_tu(vint8mf2_t vd, vfloat16m1_t vs2,
                                         size_t vl);
vint8mf2_t __riscv_vfncvt_rtz_x_f_w_i8mf2_tu(vint8mf2_t vd, vfloat16m1_t vs2,
                                             size_t vl);
vint8m1_t __riscv_vfncvt_x_f_w_i8m1_tu(vint8m1_t vd, vfloat16m2_t vs2,
                                       size_t vl);
vint8m1_t __riscv_vfncvt_rtz_x_f_w_i8m1_tu(vint8m1_t vd, vfloat16m2_t vs2,
                                           size_t vl);
vint8m2_t __riscv_vfncvt_x_f_w_i8m2_tu(vint8m2_t vd, vfloat16m4_t vs2,
                                       size_t vl);
vint8m2_t __riscv_vfncvt_rtz_x_f_w_i8m2_tu(vint8m2_t vd, vfloat16m4_t vs2,
                                           size_t vl);
vint8m4_t __riscv_vfncvt_x_f_w_i8m4_tu(vint8m4_t vd, vfloat16m8_t vs2,
                                       size_t vl);
vint8m4_t __riscv_vfncvt_rtz_x_f_w_i8m4_tu(vint8m4_t vd, vfloat16m8_t vs2,
                                           size_t vl);
vuint8mf8_t __riscv_vfncvt_xu_f_w_u8mf8_tu(vuint8mf8_t vd, vfloat16mf4_t vs2,
                                           size_t vl);
vuint8mf8_t __riscv_vfncvt_rtz_xu_f_w_u8mf8_tu(vuint8mf8_t vd,
                                               vfloat16mf4_t vs2, size_t vl);
vuint8mf4_t __riscv_vfncvt_xu_f_w_u8mf4_tu(vuint8mf4_t vd, vfloat16mf2_t vs2,
                                           size_t vl);
vuint8mf4_t __riscv_vfncvt_rtz_xu_f_w_u8mf4_tu(vuint8mf4_t vd,
                                               vfloat16mf2_t vs2, size_t vl);
vuint8mf2_t __riscv_vfncvt_xu_f_w_u8mf2_tu(vuint8mf2_t vd, vfloat16m1_t vs2,
                                           size_t vl);
vuint8mf2_t __riscv_vfncvt_rtz_xu_f_w_u8mf2_tu(vuint8mf2_t vd, vfloat16m1_t vs2,
                                               size_t vl);
vuint8m1_t __riscv_vfncvt_xu_f_w_u8m1_tu(vuint8m1_t vd, vfloat16m2_t vs2,
                                         size_t vl);
vuint8m1_t __riscv_vfncvt_rtz_xu_f_w_u8m1_tu(vuint8m1_t vd, vfloat16m2_t vs2,
                                             size_t vl);
vuint8m2_t __riscv_vfncvt_xu_f_w_u8m2_tu(vuint8m2_t vd, vfloat16m4_t vs2,
                                         size_t vl);
vuint8m2_t __riscv_vfncvt_rtz_xu_f_w_u8m2_tu(vuint8m2_t vd, vfloat16m4_t vs2,
                                             size_t vl);
vuint8m4_t __riscv_vfncvt_xu_f_w_u8m4_tu(vuint8m4_t vd, vfloat16m8_t vs2,
                                         size_t vl);
vuint8m4_t __riscv_vfncvt_rtz_xu_f_w_u8m4_tu(vuint8m4_t vd, vfloat16m8_t vs2,
                                             size_t vl);
vint16mf4_t __riscv_vfncvt_x_f_w_i16mf4_tu(vint16mf4_t vd, vfloat32mf2_t vs2,
                                           size_t vl);
vint16mf4_t __riscv_vfncvt_rtz_x_f_w_i16mf4_tu(vint16mf4_t vd,
                                               vfloat32mf2_t vs2, size_t vl);
vint16mf2_t __riscv_vfncvt_x_f_w_i16mf2_tu(vint16mf2_t vd, vfloat32m1_t vs2,
                                           size_t vl);
vint16mf2_t __riscv_vfncvt_rtz_x_f_w_i16mf2_tu(vint16mf2_t vd, vfloat32m1_t vs2,
                                               size_t vl);
vint16m1_t __riscv_vfncvt_x_f_w_i16m1_tu(vint16m1_t vd, vfloat32m2_t vs2,
                                         size_t vl);
vint16m1_t __riscv_vfncvt_rtz_x_f_w_i16m1_tu(vint16m1_t vd, vfloat32m2_t vs2,
                                             size_t vl);
vint16m2_t __riscv_vfncvt_x_f_w_i16m2_tu(vint16m2_t vd, vfloat32m4_t vs2,
                                         size_t vl);
vint16m2_t __riscv_vfncvt_rtz_x_f_w_i16m2_tu(vint16m2_t vd, vfloat32m4_t vs2,
                                             size_t vl);
vint16m4_t __riscv_vfncvt_x_f_w_i16m4_tu(vint16m4_t vd, vfloat32m8_t vs2,
                                         size_t vl);
vint16m4_t __riscv_vfncvt_rtz_x_f_w_i16m4_tu(vint16m4_t vd, vfloat32m8_t vs2,
                                             size_t vl);
vuint16mf4_t __riscv_vfncvt_xu_f_w_u16mf4_tu(vuint16mf4_t vd, vfloat32mf2_t vs2,
                                             size_t vl);
vuint16mf4_t __riscv_vfncvt_rtz_xu_f_w_u16mf4_tu(vuint16mf4_t vd,
                                                 vfloat32mf2_t vs2, size_t vl);
vuint16mf2_t __riscv_vfncvt_xu_f_w_u16mf2_tu(vuint16mf2_t vd, vfloat32m1_t vs2,
                                             size_t vl);
vuint16mf2_t __riscv_vfncvt_rtz_xu_f_w_u16mf2_tu(vuint16mf2_t vd,
                                                 vfloat32m1_t vs2, size_t vl);
vuint16m1_t __riscv_vfncvt_xu_f_w_u16m1_tu(vuint16m1_t vd, vfloat32m2_t vs2,
                                           size_t vl);
vuint16m1_t __riscv_vfncvt_rtz_xu_f_w_u16m1_tu(vuint16m1_t vd, vfloat32m2_t vs2,
                                               size_t vl);
vuint16m2_t __riscv_vfncvt_xu_f_w_u16m2_tu(vuint16m2_t vd, vfloat32m4_t vs2,
                                           size_t vl);
vuint16m2_t __riscv_vfncvt_rtz_xu_f_w_u16m2_tu(vuint16m2_t vd, vfloat32m4_t vs2,
                                               size_t vl);
vuint16m4_t __riscv_vfncvt_xu_f_w_u16m4_tu(vuint16m4_t vd, vfloat32m8_t vs2,
                                           size_t vl);
vuint16m4_t __riscv_vfncvt_rtz_xu_f_w_u16m4_tu(vuint16m4_t vd, vfloat32m8_t vs2,
                                               size_t vl);
// vfncvt_f_x_w (vint32 source) and vfncvt_f_xu_w (vuint32 source), _tu
// variants (no mask operand): 32-bit integer vector (vs2) -> vfloat16 result
// at half the source LMUL. vd has the result type.
vfloat16mf4_t __riscv_vfncvt_f_x_w_f16mf4_tu(vfloat16mf4_t vd, vint32mf2_t vs2,
                                             size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_x_w_f16mf2_tu(vfloat16mf2_t vd, vint32m1_t vs2,
                                             size_t vl);
vfloat16m1_t __riscv_vfncvt_f_x_w_f16m1_tu(vfloat16m1_t vd, vint32m2_t vs2,
                                           size_t vl);
vfloat16m2_t __riscv_vfncvt_f_x_w_f16m2_tu(vfloat16m2_t vd, vint32m4_t vs2,
                                           size_t vl);
vfloat16m4_t __riscv_vfncvt_f_x_w_f16m4_tu(vfloat16m4_t vd, vint32m8_t vs2,
                                           size_t vl);
vfloat16mf4_t __riscv_vfncvt_f_xu_w_f16mf4_tu(vfloat16mf4_t vd,
                                              vuint32mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_xu_w_f16mf2_tu(vfloat16mf2_t vd, vuint32m1_t vs2,
                                              size_t vl);
vfloat16m1_t __riscv_vfncvt_f_xu_w_f16m1_tu(vfloat16m1_t vd, vuint32m2_t vs2,
                                            size_t vl);
vfloat16m2_t __riscv_vfncvt_f_xu_w_f16m2_tu(vfloat16m2_t vd, vuint32m4_t vs2,
                                            size_t vl);
vfloat16m4_t __riscv_vfncvt_f_xu_w_f16m4_tu(vfloat16m4_t vd, vuint32m8_t vs2,
                                            size_t vl);
// vfncvt_f_f_w / vfncvt_rod_f_f_w, _tu variants (no mask operand):
// vfloat32 source (vs2) -> vfloat16 result at half the source LMUL.
// vd has the result type.
// NOTE(review): `rod` presumably means round-towards-odd, as in the ISA
// mnemonic vfncvt.rod.f.f.w -- confirm against the RVV spec.
vfloat16mf4_t __riscv_vfncvt_f_f_w_f16mf4_tu(vfloat16mf4_t vd,
                                             vfloat32mf2_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfncvt_rod_f_f_w_f16mf4_tu(vfloat16mf4_t vd,
                                                 vfloat32mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_f_w_f16mf2_tu(vfloat16mf2_t vd, vfloat32m1_t vs2,
                                             size_t vl);
vfloat16mf2_t __riscv_vfncvt_rod_f_f_w_f16mf2_tu(vfloat16mf2_t vd,
                                                 vfloat32m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_f_w_f16m1_tu(vfloat16m1_t vd, vfloat32m2_t vs2,
                                           size_t vl);
vfloat16m1_t __riscv_vfncvt_rod_f_f_w_f16m1_tu(vfloat16m1_t vd,
                                               vfloat32m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_f_w_f16m2_tu(vfloat16m2_t vd, vfloat32m4_t vs2,
                                           size_t vl);
vfloat16m2_t __riscv_vfncvt_rod_f_f_w_f16m2_tu(vfloat16m2_t vd,
                                               vfloat32m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_f_w_f16m4_tu(vfloat16m4_t vd, vfloat32m8_t vs2,
                                           size_t vl);
vfloat16m4_t __riscv_vfncvt_rod_f_f_w_f16m4_tu(vfloat16m4_t vd,
                                               vfloat32m8_t vs2, size_t vl);
// vfncvt_x_f_w / vfncvt_rtz_x_f_w (vint32 result) followed by
// vfncvt_xu_f_w / vfncvt_rtz_xu_f_w (vuint32 result), _tu variants (no mask
// operand): vfloat64 source (vs2) -> 32-bit integer result at half the source
// LMUL (m1->mf2, m2->m1, m4->m2, m8->m4). vd has the result type.
// NOTE(review): `rtz` presumably means round-towards-zero -- confirm against
// the RVV spec.
vint32mf2_t __riscv_vfncvt_x_f_w_i32mf2_tu(vint32mf2_t vd, vfloat64m1_t vs2,
                                           size_t vl);
vint32mf2_t __riscv_vfncvt_rtz_x_f_w_i32mf2_tu(vint32mf2_t vd, vfloat64m1_t vs2,
                                               size_t vl);
vint32m1_t __riscv_vfncvt_x_f_w_i32m1_tu(vint32m1_t vd, vfloat64m2_t vs2,
                                         size_t vl);
vint32m1_t __riscv_vfncvt_rtz_x_f_w_i32m1_tu(vint32m1_t vd, vfloat64m2_t vs2,
                                             size_t vl);
vint32m2_t __riscv_vfncvt_x_f_w_i32m2_tu(vint32m2_t vd, vfloat64m4_t vs2,
                                         size_t vl);
vint32m2_t __riscv_vfncvt_rtz_x_f_w_i32m2_tu(vint32m2_t vd, vfloat64m4_t vs2,
                                             size_t vl);
vint32m4_t __riscv_vfncvt_x_f_w_i32m4_tu(vint32m4_t vd, vfloat64m8_t vs2,
                                         size_t vl);
vint32m4_t __riscv_vfncvt_rtz_x_f_w_i32m4_tu(vint32m4_t vd, vfloat64m8_t vs2,
                                             size_t vl);
vuint32mf2_t __riscv_vfncvt_xu_f_w_u32mf2_tu(vuint32mf2_t vd, vfloat64m1_t vs2,
                                             size_t vl);
vuint32mf2_t __riscv_vfncvt_rtz_xu_f_w_u32mf2_tu(vuint32mf2_t vd,
                                                 vfloat64m1_t vs2, size_t vl);
vuint32m1_t __riscv_vfncvt_xu_f_w_u32m1_tu(vuint32m1_t vd, vfloat64m2_t vs2,
                                           size_t vl);
vuint32m1_t __riscv_vfncvt_rtz_xu_f_w_u32m1_tu(vuint32m1_t vd, vfloat64m2_t vs2,
                                               size_t vl);
vuint32m2_t __riscv_vfncvt_xu_f_w_u32m2_tu(vuint32m2_t vd, vfloat64m4_t vs2,
                                           size_t vl);
vuint32m2_t __riscv_vfncvt_rtz_xu_f_w_u32m2_tu(vuint32m2_t vd, vfloat64m4_t vs2,
                                               size_t vl);
vuint32m4_t __riscv_vfncvt_xu_f_w_u32m4_tu(vuint32m4_t vd, vfloat64m8_t vs2,
                                           size_t vl);
vuint32m4_t __riscv_vfncvt_rtz_xu_f_w_u32m4_tu(vuint32m4_t vd, vfloat64m8_t vs2,
                                               size_t vl);
// vfncvt_f_x_w (vint64 source) and vfncvt_f_xu_w (vuint64 source), _tu
// variants (no mask operand): 64-bit integer vector (vs2) -> vfloat32 result
// at half the source LMUL. vd has the result type.
vfloat32mf2_t __riscv_vfncvt_f_x_w_f32mf2_tu(vfloat32mf2_t vd, vint64m1_t vs2,
                                             size_t vl);
vfloat32m1_t __riscv_vfncvt_f_x_w_f32m1_tu(vfloat32m1_t vd, vint64m2_t vs2,
                                           size_t vl);
vfloat32m2_t __riscv_vfncvt_f_x_w_f32m2_tu(vfloat32m2_t vd, vint64m4_t vs2,
                                           size_t vl);
vfloat32m4_t __riscv_vfncvt_f_x_w_f32m4_tu(vfloat32m4_t vd, vint64m8_t vs2,
                                           size_t vl);
vfloat32mf2_t __riscv_vfncvt_f_xu_w_f32mf2_tu(vfloat32mf2_t vd, vuint64m1_t vs2,
                                              size_t vl);
vfloat32m1_t __riscv_vfncvt_f_xu_w_f32m1_tu(vfloat32m1_t vd, vuint64m2_t vs2,
                                            size_t vl);
vfloat32m2_t __riscv_vfncvt_f_xu_w_f32m2_tu(vfloat32m2_t vd, vuint64m4_t vs2,
                                            size_t vl);
vfloat32m4_t __riscv_vfncvt_f_xu_w_f32m4_tu(vfloat32m4_t vd, vuint64m8_t vs2,
                                            size_t vl);
// vfncvt_f_f_w / vfncvt_rod_f_f_w, _tu variants (no mask operand):
// vfloat64 source (vs2) -> vfloat32 result at half the source LMUL.
// vd has the result type.
// NOTE(review): `rod` presumably means round-towards-odd -- confirm against
// the RVV spec.
vfloat32mf2_t __riscv_vfncvt_f_f_w_f32mf2_tu(vfloat32mf2_t vd, vfloat64m1_t vs2,
                                             size_t vl);
vfloat32mf2_t __riscv_vfncvt_rod_f_f_w_f32mf2_tu(vfloat32mf2_t vd,
                                                 vfloat64m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_f_w_f32m1_tu(vfloat32m1_t vd, vfloat64m2_t vs2,
                                           size_t vl);
vfloat32m1_t __riscv_vfncvt_rod_f_f_w_f32m1_tu(vfloat32m1_t vd,
                                               vfloat64m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_f_w_f32m2_tu(vfloat32m2_t vd, vfloat64m4_t vs2,
                                           size_t vl);
vfloat32m2_t __riscv_vfncvt_rod_f_f_w_f32m2_tu(vfloat32m2_t vd,
                                               vfloat64m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_f_w_f32m4_tu(vfloat32m4_t vd, vfloat64m8_t vs2,
                                           size_t vl);
vfloat32m4_t __riscv_vfncvt_rod_f_f_w_f32m4_tu(vfloat32m4_t vd,
                                               vfloat64m8_t vs2, size_t vl);
// masked functions, _tum policy (tail undisturbed, mask agnostic)
// vfncvt_x_f_w / vfncvt_rtz_x_f_w (vint8 result) followed by
// vfncvt_xu_f_w / vfncvt_rtz_xu_f_w (vuint8 result), _tum variants:
// vfloat16 source (vs2) -> 8-bit integer result at half the source LMUL
// (mf4->mf8 ... m8->m4). vm is the leading mask operand (vbool64_t for mf8
// down to vbool2_t for m4); vd has the result type.
// NOTE(review): `rtz` presumably means round-towards-zero -- confirm against
// the RVV spec.
vint8mf8_t __riscv_vfncvt_x_f_w_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                          vfloat16mf4_t vs2, size_t vl);
vint8mf8_t __riscv_vfncvt_rtz_x_f_w_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                              vfloat16mf4_t vs2, size_t vl);
vint8mf4_t __riscv_vfncvt_x_f_w_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                          vfloat16mf2_t vs2, size_t vl);
vint8mf4_t __riscv_vfncvt_rtz_x_f_w_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                              vfloat16mf2_t vs2, size_t vl);
vint8mf2_t __riscv_vfncvt_x_f_w_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                          vfloat16m1_t vs2, size_t vl);
vint8mf2_t __riscv_vfncvt_rtz_x_f_w_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                              vfloat16m1_t vs2, size_t vl);
vint8m1_t __riscv_vfncvt_x_f_w_i8m1_tum(vbool8_t vm, vint8m1_t vd,
                                        vfloat16m2_t vs2, size_t vl);
vint8m1_t __riscv_vfncvt_rtz_x_f_w_i8m1_tum(vbool8_t vm, vint8m1_t vd,
                                            vfloat16m2_t vs2, size_t vl);
vint8m2_t __riscv_vfncvt_x_f_w_i8m2_tum(vbool4_t vm, vint8m2_t vd,
                                        vfloat16m4_t vs2, size_t vl);
vint8m2_t __riscv_vfncvt_rtz_x_f_w_i8m2_tum(vbool4_t vm, vint8m2_t vd,
                                            vfloat16m4_t vs2, size_t vl);
vint8m4_t __riscv_vfncvt_x_f_w_i8m4_tum(vbool2_t vm, vint8m4_t vd,
                                        vfloat16m8_t vs2, size_t vl);
vint8m4_t __riscv_vfncvt_rtz_x_f_w_i8m4_tum(vbool2_t vm, vint8m4_t vd,
                                            vfloat16m8_t vs2, size_t vl);
vuint8mf8_t __riscv_vfncvt_xu_f_w_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                            vfloat16mf4_t vs2, size_t vl);
vuint8mf8_t __riscv_vfncvt_rtz_xu_f_w_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                                vfloat16mf4_t vs2, size_t vl);
vuint8mf4_t __riscv_vfncvt_xu_f_w_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                            vfloat16mf2_t vs2, size_t vl);
vuint8mf4_t __riscv_vfncvt_rtz_xu_f_w_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                                vfloat16mf2_t vs2, size_t vl);
vuint8mf2_t __riscv_vfncvt_xu_f_w_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                            vfloat16m1_t vs2, size_t vl);
vuint8mf2_t __riscv_vfncvt_rtz_xu_f_w_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                                vfloat16m1_t vs2, size_t vl);
vuint8m1_t __riscv_vfncvt_xu_f_w_u8m1_tum(vbool8_t vm, vuint8m1_t vd,
                                          vfloat16m2_t vs2, size_t vl);
vuint8m1_t __riscv_vfncvt_rtz_xu_f_w_u8m1_tum(vbool8_t vm, vuint8m1_t vd,
                                              vfloat16m2_t vs2, size_t vl);
vuint8m2_t __riscv_vfncvt_xu_f_w_u8m2_tum(vbool4_t vm, vuint8m2_t vd,
                                          vfloat16m4_t vs2, size_t vl);
vuint8m2_t __riscv_vfncvt_rtz_xu_f_w_u8m2_tum(vbool4_t vm, vuint8m2_t vd,
                                              vfloat16m4_t vs2, size_t vl);
vuint8m4_t __riscv_vfncvt_xu_f_w_u8m4_tum(vbool2_t vm, vuint8m4_t vd,
                                          vfloat16m8_t vs2, size_t vl);
vuint8m4_t __riscv_vfncvt_rtz_xu_f_w_u8m4_tum(vbool2_t vm, vuint8m4_t vd,
                                              vfloat16m8_t vs2, size_t vl);
// vfncvt_x_f_w / vfncvt_rtz_x_f_w (vint16 result) followed by
// vfncvt_xu_f_w / vfncvt_rtz_xu_f_w (vuint16 result), _tum variants:
// vfloat32 source (vs2) -> 16-bit integer result at half the source LMUL.
// vm is the leading mask operand (vbool64_t for mf4 down to vbool4_t for m4);
// vd has the result type.
// NOTE(review): `rtz` presumably means round-towards-zero -- confirm against
// the RVV spec.
vint16mf4_t __riscv_vfncvt_x_f_w_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                            vfloat32mf2_t vs2, size_t vl);
vint16mf4_t __riscv_vfncvt_rtz_x_f_w_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                                vfloat32mf2_t vs2, size_t vl);
vint16mf2_t __riscv_vfncvt_x_f_w_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                            vfloat32m1_t vs2, size_t vl);
vint16mf2_t __riscv_vfncvt_rtz_x_f_w_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                                vfloat32m1_t vs2, size_t vl);
vint16m1_t __riscv_vfncvt_x_f_w_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                          vfloat32m2_t vs2, size_t vl);
vint16m1_t __riscv_vfncvt_rtz_x_f_w_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                              vfloat32m2_t vs2, size_t vl);
vint16m2_t __riscv_vfncvt_x_f_w_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                          vfloat32m4_t vs2, size_t vl);
vint16m2_t __riscv_vfncvt_rtz_x_f_w_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                              vfloat32m4_t vs2, size_t vl);
vint16m4_t __riscv_vfncvt_x_f_w_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                          vfloat32m8_t vs2, size_t vl);
vint16m4_t __riscv_vfncvt_rtz_x_f_w_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                              vfloat32m8_t vs2, size_t vl);
vuint16mf4_t __riscv_vfncvt_xu_f_w_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                              vfloat32mf2_t vs2, size_t vl);
vuint16mf4_t __riscv_vfncvt_rtz_xu_f_w_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                                  vfloat32mf2_t vs2, size_t vl);
vuint16mf2_t __riscv_vfncvt_xu_f_w_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                              vfloat32m1_t vs2, size_t vl);
vuint16mf2_t __riscv_vfncvt_rtz_xu_f_w_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                                  vfloat32m1_t vs2, size_t vl);
vuint16m1_t __riscv_vfncvt_xu_f_w_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                            vfloat32m2_t vs2, size_t vl);
vuint16m1_t __riscv_vfncvt_rtz_xu_f_w_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                                vfloat32m2_t vs2, size_t vl);
vuint16m2_t __riscv_vfncvt_xu_f_w_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                            vfloat32m4_t vs2, size_t vl);
vuint16m2_t __riscv_vfncvt_rtz_xu_f_w_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                                vfloat32m4_t vs2, size_t vl);
vuint16m4_t __riscv_vfncvt_xu_f_w_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                            vfloat32m8_t vs2, size_t vl);
vuint16m4_t __riscv_vfncvt_rtz_xu_f_w_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                                vfloat32m8_t vs2, size_t vl);
// vfncvt_f_x_w (vint32 source) and vfncvt_f_xu_w (vuint32 source), _tum
// variants: 32-bit integer vector (vs2) -> vfloat16 result at half the source
// LMUL. vm is the leading mask operand; vd has the result type.
vfloat16mf4_t __riscv_vfncvt_f_x_w_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                              vint32mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_x_w_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                              vint32m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_x_w_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                            vint32m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_x_w_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                            vint32m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_x_w_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                            vint32m8_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfncvt_f_xu_w_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                               vuint32mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_xu_w_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                               vuint32m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_xu_w_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                             vuint32m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_xu_w_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                             vuint32m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_xu_w_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                             vuint32m8_t vs2, size_t vl);
// vfncvt_f_f_w / vfncvt_rod_f_f_w, _tum variants: vfloat32 source (vs2) ->
// vfloat16 result at half the source LMUL. vm is the leading mask operand;
// vd has the result type.
// NOTE(review): `rod` presumably means round-towards-odd -- confirm against
// the RVV spec.
vfloat16mf4_t __riscv_vfncvt_f_f_w_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                              vfloat32mf2_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfncvt_rod_f_f_w_f16mf4_tum(vbool64_t vm,
                                                  vfloat16mf4_t vd,
                                                  vfloat32mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_f_w_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                              vfloat32m1_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfncvt_rod_f_f_w_f16mf2_tum(vbool32_t vm,
                                                  vfloat16mf2_t vd,
                                                  vfloat32m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_f_w_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                            vfloat32m2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfncvt_rod_f_f_w_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                                vfloat32m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_f_w_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                            vfloat32m4_t vs2, size_t vl);
vfloat16m2_t __riscv_vfncvt_rod_f_f_w_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                                vfloat32m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_f_w_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                            vfloat32m8_t vs2, size_t vl);
vfloat16m4_t __riscv_vfncvt_rod_f_f_w_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                                vfloat32m8_t vs2, size_t vl);
// vfncvt_x_f_w / vfncvt_rtz_x_f_w (vint32 result) followed by
// vfncvt_xu_f_w / vfncvt_rtz_xu_f_w (vuint32 result), _tum variants:
// vfloat64 source (vs2) -> 32-bit integer result at half the source LMUL.
// vm is the leading mask operand (vbool64_t for mf2 down to vbool8_t for m4);
// vd has the result type.
// NOTE(review): `rtz` presumably means round-towards-zero -- confirm against
// the RVV spec.
vint32mf2_t __riscv_vfncvt_x_f_w_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                            vfloat64m1_t vs2, size_t vl);
vint32mf2_t __riscv_vfncvt_rtz_x_f_w_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                                vfloat64m1_t vs2, size_t vl);
vint32m1_t __riscv_vfncvt_x_f_w_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                          vfloat64m2_t vs2, size_t vl);
vint32m1_t __riscv_vfncvt_rtz_x_f_w_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                              vfloat64m2_t vs2, size_t vl);
vint32m2_t __riscv_vfncvt_x_f_w_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                          vfloat64m4_t vs2, size_t vl);
vint32m2_t __riscv_vfncvt_rtz_x_f_w_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                              vfloat64m4_t vs2, size_t vl);
vint32m4_t __riscv_vfncvt_x_f_w_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                          vfloat64m8_t vs2, size_t vl);
vint32m4_t __riscv_vfncvt_rtz_x_f_w_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                              vfloat64m8_t vs2, size_t vl);
vuint32mf2_t __riscv_vfncvt_xu_f_w_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                              vfloat64m1_t vs2, size_t vl);
vuint32mf2_t __riscv_vfncvt_rtz_xu_f_w_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                                  vfloat64m1_t vs2, size_t vl);
vuint32m1_t __riscv_vfncvt_xu_f_w_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                            vfloat64m2_t vs2, size_t vl);
vuint32m1_t __riscv_vfncvt_rtz_xu_f_w_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                                vfloat64m2_t vs2, size_t vl);
vuint32m2_t __riscv_vfncvt_xu_f_w_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                            vfloat64m4_t vs2, size_t vl);
vuint32m2_t __riscv_vfncvt_rtz_xu_f_w_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                                vfloat64m4_t vs2, size_t vl);
vuint32m4_t __riscv_vfncvt_xu_f_w_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                            vfloat64m8_t vs2, size_t vl);
vuint32m4_t __riscv_vfncvt_rtz_xu_f_w_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                                vfloat64m8_t vs2, size_t vl);
// vfncvt_f_x_w (vint64 source) and vfncvt_f_xu_w (vuint64 source), _tum
// variants: 64-bit integer vector (vs2) -> vfloat32 result at half the source
// LMUL. vm is the leading mask operand; vd has the result type.
vfloat32mf2_t __riscv_vfncvt_f_x_w_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                              vint64m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_x_w_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                            vint64m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_x_w_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                            vint64m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_x_w_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                            vint64m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfncvt_f_xu_w_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                               vuint64m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_xu_w_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                             vuint64m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_xu_w_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                             vuint64m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_xu_w_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                             vuint64m8_t vs2, size_t vl);
// vfncvt_f_f_w / vfncvt_rod_f_f_w, _tum variants: vfloat64 source (vs2) ->
// vfloat32 result at half the source LMUL. vm is the leading mask operand;
// vd has the result type.
// NOTE(review): `rod` presumably means round-towards-odd -- confirm against
// the RVV spec.
vfloat32mf2_t __riscv_vfncvt_f_f_w_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat64m1_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfncvt_rod_f_f_w_f32mf2_tum(vbool64_t vm,
                                                  vfloat32mf2_t vd,
                                                  vfloat64m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_f_w_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat64m2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfncvt_rod_f_f_w_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                                vfloat64m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_f_w_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat64m4_t vs2, size_t vl);
vfloat32m2_t __riscv_vfncvt_rod_f_f_w_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                                vfloat64m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_f_w_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat64m8_t vs2, size_t vl);
vfloat32m4_t __riscv_vfncvt_rod_f_f_w_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                                vfloat64m8_t vs2, size_t vl);
// masked functions, _tumu policy (tail undisturbed, mask undisturbed)
// vfncvt_x_f_w / vfncvt_rtz_x_f_w (vint8 result) followed by
// vfncvt_xu_f_w / vfncvt_rtz_xu_f_w (vuint8 result), _tumu variants:
// vfloat16 source (vs2) -> 8-bit integer result at half the source LMUL
// (mf4->mf8 ... m8->m4). vm is the leading mask operand (vbool64_t for mf8
// down to vbool2_t for m4); vd has the result type.
// NOTE(review): `rtz` presumably means round-towards-zero -- confirm against
// the RVV spec.
vint8mf8_t __riscv_vfncvt_x_f_w_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                           vfloat16mf4_t vs2, size_t vl);
vint8mf8_t __riscv_vfncvt_rtz_x_f_w_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                               vfloat16mf4_t vs2, size_t vl);
vint8mf4_t __riscv_vfncvt_x_f_w_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                           vfloat16mf2_t vs2, size_t vl);
vint8mf4_t __riscv_vfncvt_rtz_x_f_w_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                               vfloat16mf2_t vs2, size_t vl);
vint8mf2_t __riscv_vfncvt_x_f_w_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                           vfloat16m1_t vs2, size_t vl);
vint8mf2_t __riscv_vfncvt_rtz_x_f_w_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                               vfloat16m1_t vs2, size_t vl);
vint8m1_t __riscv_vfncvt_x_f_w_i8m1_tumu(vbool8_t vm, vint8m1_t vd,
                                         vfloat16m2_t vs2, size_t vl);
vint8m1_t __riscv_vfncvt_rtz_x_f_w_i8m1_tumu(vbool8_t vm, vint8m1_t vd,
                                             vfloat16m2_t vs2, size_t vl);
vint8m2_t __riscv_vfncvt_x_f_w_i8m2_tumu(vbool4_t vm, vint8m2_t vd,
                                         vfloat16m4_t vs2, size_t vl);
vint8m2_t __riscv_vfncvt_rtz_x_f_w_i8m2_tumu(vbool4_t vm, vint8m2_t vd,
                                             vfloat16m4_t vs2, size_t vl);
vint8m4_t __riscv_vfncvt_x_f_w_i8m4_tumu(vbool2_t vm, vint8m4_t vd,
                                         vfloat16m8_t vs2, size_t vl);
vint8m4_t __riscv_vfncvt_rtz_x_f_w_i8m4_tumu(vbool2_t vm, vint8m4_t vd,
                                             vfloat16m8_t vs2, size_t vl);
vuint8mf8_t __riscv_vfncvt_xu_f_w_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                             vfloat16mf4_t vs2, size_t vl);
vuint8mf8_t __riscv_vfncvt_rtz_xu_f_w_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                                 vfloat16mf4_t vs2, size_t vl);
vuint8mf4_t __riscv_vfncvt_xu_f_w_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                             vfloat16mf2_t vs2, size_t vl);
vuint8mf4_t __riscv_vfncvt_rtz_xu_f_w_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                                 vfloat16mf2_t vs2, size_t vl);
vuint8mf2_t __riscv_vfncvt_xu_f_w_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                             vfloat16m1_t vs2, size_t vl);
vuint8mf2_t __riscv_vfncvt_rtz_xu_f_w_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                                 vfloat16m1_t vs2, size_t vl);
vuint8m1_t __riscv_vfncvt_xu_f_w_u8m1_tumu(vbool8_t vm, vuint8m1_t vd,
                                           vfloat16m2_t vs2, size_t vl);
vuint8m1_t __riscv_vfncvt_rtz_xu_f_w_u8m1_tumu(vbool8_t vm, vuint8m1_t vd,
                                               vfloat16m2_t vs2, size_t vl);
vuint8m2_t __riscv_vfncvt_xu_f_w_u8m2_tumu(vbool4_t vm, vuint8m2_t vd,
                                           vfloat16m4_t vs2, size_t vl);
vuint8m2_t __riscv_vfncvt_rtz_xu_f_w_u8m2_tumu(vbool4_t vm, vuint8m2_t vd,
                                               vfloat16m4_t vs2, size_t vl);
vuint8m4_t __riscv_vfncvt_xu_f_w_u8m4_tumu(vbool2_t vm, vuint8m4_t vd,
                                           vfloat16m8_t vs2, size_t vl);
vuint8m4_t __riscv_vfncvt_rtz_xu_f_w_u8m4_tumu(vbool2_t vm, vuint8m4_t vd,
                                               vfloat16m8_t vs2, size_t vl);
// vfncvt_x_f_w / vfncvt_rtz_x_f_w (vint16 result) followed by
// vfncvt_xu_f_w / vfncvt_rtz_xu_f_w (vuint16 result), _tumu variants:
// vfloat32 source (vs2) -> 16-bit integer result at half the source LMUL.
// vm is the leading mask operand (vbool64_t for mf4 down to vbool4_t for m4);
// vd has the result type.
// NOTE(review): `rtz` presumably means round-towards-zero -- confirm against
// the RVV spec.
vint16mf4_t __riscv_vfncvt_x_f_w_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                             vfloat32mf2_t vs2, size_t vl);
vint16mf4_t __riscv_vfncvt_rtz_x_f_w_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                                 vfloat32mf2_t vs2, size_t vl);
vint16mf2_t __riscv_vfncvt_x_f_w_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                             vfloat32m1_t vs2, size_t vl);
vint16mf2_t __riscv_vfncvt_rtz_x_f_w_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                                 vfloat32m1_t vs2, size_t vl);
vint16m1_t __riscv_vfncvt_x_f_w_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                           vfloat32m2_t vs2, size_t vl);
vint16m1_t __riscv_vfncvt_rtz_x_f_w_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                               vfloat32m2_t vs2, size_t vl);
vint16m2_t __riscv_vfncvt_x_f_w_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                           vfloat32m4_t vs2, size_t vl);
vint16m2_t __riscv_vfncvt_rtz_x_f_w_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                               vfloat32m4_t vs2, size_t vl);
vint16m4_t __riscv_vfncvt_x_f_w_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                           vfloat32m8_t vs2, size_t vl);
vint16m4_t __riscv_vfncvt_rtz_x_f_w_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                               vfloat32m8_t vs2, size_t vl);
vuint16mf4_t __riscv_vfncvt_xu_f_w_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                               vfloat32mf2_t vs2, size_t vl);
vuint16mf4_t __riscv_vfncvt_rtz_xu_f_w_u16mf4_tumu(vbool64_t vm,
                                                   vuint16mf4_t vd,
                                                   vfloat32mf2_t vs2,
                                                   size_t vl);
vuint16mf2_t __riscv_vfncvt_xu_f_w_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                               vfloat32m1_t vs2, size_t vl);
vuint16mf2_t __riscv_vfncvt_rtz_xu_f_w_u16mf2_tumu(vbool32_t vm,
                                                   vuint16mf2_t vd,
                                                   vfloat32m1_t vs2, size_t vl);
vuint16m1_t __riscv_vfncvt_xu_f_w_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                             vfloat32m2_t vs2, size_t vl);
vuint16m1_t __riscv_vfncvt_rtz_xu_f_w_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                                 vfloat32m2_t vs2, size_t vl);
vuint16m2_t __riscv_vfncvt_xu_f_w_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                             vfloat32m4_t vs2, size_t vl);
vuint16m2_t __riscv_vfncvt_rtz_xu_f_w_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                                 vfloat32m4_t vs2, size_t vl);
vuint16m4_t __riscv_vfncvt_xu_f_w_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                             vfloat32m8_t vs2, size_t vl);
vuint16m4_t __riscv_vfncvt_rtz_xu_f_w_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                                 vfloat32m8_t vs2, size_t vl);
// vfncvt_f_x_w (vint32 source) and vfncvt_f_xu_w (vuint32 source), _tumu
// variants: 32-bit integer vector (vs2) -> vfloat16 result at half the source
// LMUL. vm is the leading mask operand; vd has the result type.
vfloat16mf4_t __riscv_vfncvt_f_x_w_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                               vint32mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_x_w_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                               vint32m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_x_w_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                             vint32m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_x_w_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                             vint32m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_x_w_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                             vint32m8_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfncvt_f_xu_w_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                                vuint32mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_xu_w_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                                vuint32m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_xu_w_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                              vuint32m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_xu_w_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                              vuint32m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_xu_w_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                              vuint32m8_t vs2, size_t vl);
// vfncvt_f_f_w / vfncvt_rod_f_f_w, _tumu variants: vfloat32 source (vs2) ->
// vfloat16 result at half the source LMUL. vm is the leading mask operand;
// vd has the result type.
// NOTE(review): `rod` presumably means round-towards-odd -- confirm against
// the RVV spec.
vfloat16mf4_t __riscv_vfncvt_f_f_w_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                               vfloat32mf2_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfncvt_rod_f_f_w_f16mf4_tumu(vbool64_t vm,
                                                   vfloat16mf4_t vd,
                                                   vfloat32mf2_t vs2,
                                                   size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_f_w_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                               vfloat32m1_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfncvt_rod_f_f_w_f16mf2_tumu(vbool32_t vm,
                                                   vfloat16mf2_t vd,
                                                   vfloat32m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_f_w_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                             vfloat32m2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfncvt_rod_f_f_w_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                                 vfloat32m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_f_w_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                             vfloat32m4_t vs2, size_t vl);
vfloat16m2_t __riscv_vfncvt_rod_f_f_w_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                                 vfloat32m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_f_w_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                             vfloat32m8_t vs2, size_t vl);
vfloat16m4_t __riscv_vfncvt_rod_f_f_w_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                                 vfloat32m8_t vs2, size_t vl);
// `_tumu` forms of __riscv_vfncvt_x_f_w and __riscv_vfncvt_rtz_x_f_w that
// return vint32 vectors (i32mf2 .. i32m4) from a vfloat64 source `vs2`.
// Parameter shape: (vboolN_t vm, vd of the result type, vs2, size_t vl);
// vs2's LMUL suffix is one step above the result's (mf2<-m1 ... m4<-m8).
// NOTE(review): `rtz` presumably selects round-toward-zero -- confirm against
// the RVV intrinsics specification.
vint32mf2_t __riscv_vfncvt_x_f_w_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                             vfloat64m1_t vs2, size_t vl);
vint32mf2_t __riscv_vfncvt_rtz_x_f_w_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                                 vfloat64m1_t vs2, size_t vl);
vint32m1_t __riscv_vfncvt_x_f_w_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                           vfloat64m2_t vs2, size_t vl);
vint32m1_t __riscv_vfncvt_rtz_x_f_w_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                               vfloat64m2_t vs2, size_t vl);
vint32m2_t __riscv_vfncvt_x_f_w_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                           vfloat64m4_t vs2, size_t vl);
vint32m2_t __riscv_vfncvt_rtz_x_f_w_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                               vfloat64m4_t vs2, size_t vl);
vint32m4_t __riscv_vfncvt_x_f_w_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                           vfloat64m8_t vs2, size_t vl);
vint32m4_t __riscv_vfncvt_rtz_x_f_w_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                               vfloat64m8_t vs2, size_t vl);
// `_tumu` forms of __riscv_vfncvt_xu_f_w and __riscv_vfncvt_rtz_xu_f_w that
// return vuint32 vectors (u32mf2 .. u32m4) from a vfloat64 source `vs2`.
// Parameter shape: (vboolN_t vm, vd of the result type, vs2, size_t vl);
// vs2's LMUL suffix is one step above the result's (mf2<-m1 ... m4<-m8).
// NOTE(review): `rtz` presumably selects round-toward-zero -- confirm against
// the RVV intrinsics specification.
vuint32mf2_t __riscv_vfncvt_xu_f_w_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                               vfloat64m1_t vs2, size_t vl);
vuint32mf2_t __riscv_vfncvt_rtz_xu_f_w_u32mf2_tumu(vbool64_t vm,
                                                   vuint32mf2_t vd,
                                                   vfloat64m1_t vs2, size_t vl);
vuint32m1_t __riscv_vfncvt_xu_f_w_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                             vfloat64m2_t vs2, size_t vl);
vuint32m1_t __riscv_vfncvt_rtz_xu_f_w_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                                 vfloat64m2_t vs2, size_t vl);
vuint32m2_t __riscv_vfncvt_xu_f_w_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                             vfloat64m4_t vs2, size_t vl);
vuint32m2_t __riscv_vfncvt_rtz_xu_f_w_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                                 vfloat64m4_t vs2, size_t vl);
vuint32m4_t __riscv_vfncvt_xu_f_w_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                             vfloat64m8_t vs2, size_t vl);
vuint32m4_t __riscv_vfncvt_rtz_xu_f_w_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                                 vfloat64m8_t vs2, size_t vl);
// `_tumu` forms of __riscv_vfncvt_f_x_w that return vfloat32 vectors
// (f32mf2 .. f32m4) from a vint64 source `vs2`.
// Parameter shape: (vboolN_t vm, vd of the result type, vs2, size_t vl);
// vs2's LMUL suffix is one step above the result's (mf2<-m1 ... m4<-m8).
vfloat32mf2_t __riscv_vfncvt_f_x_w_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                               vint64m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_x_w_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                             vint64m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_x_w_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                             vint64m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_x_w_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                             vint64m8_t vs2, size_t vl);
// `_tumu` forms of __riscv_vfncvt_f_xu_w that return vfloat32 vectors
// (f32mf2 .. f32m4) from a vuint64 source `vs2`.
// Parameter shape: (vboolN_t vm, vd of the result type, vs2, size_t vl);
// vs2's LMUL suffix is one step above the result's (mf2<-m1 ... m4<-m8).
vfloat32mf2_t __riscv_vfncvt_f_xu_w_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                                vuint64m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_xu_w_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                              vuint64m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_xu_w_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                              vuint64m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_xu_w_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                              vuint64m8_t vs2, size_t vl);
// `_tumu` forms of __riscv_vfncvt_f_f_w and __riscv_vfncvt_rod_f_f_w that
// return vfloat32 vectors (f32mf2 .. f32m4) from a vfloat64 source `vs2`.
// Parameter shape: (vboolN_t vm, vd of the result type, vs2, size_t vl);
// vs2's LMUL suffix is one step above the result's (mf2<-m1 ... m4<-m8).
// NOTE(review): the `rod` variant's rounding behaviour is not stated in this
// listing -- confirm against the RVV intrinsics specification.
vfloat32mf2_t __riscv_vfncvt_f_f_w_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                               vfloat64m1_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfncvt_rod_f_f_w_f32mf2_tumu(vbool64_t vm,
                                                   vfloat32mf2_t vd,
                                                   vfloat64m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_f_w_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                             vfloat64m2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfncvt_rod_f_f_w_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                                 vfloat64m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_f_w_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                             vfloat64m4_t vs2, size_t vl);
vfloat32m2_t __riscv_vfncvt_rod_f_f_w_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                                 vfloat64m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_f_w_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                             vfloat64m8_t vs2, size_t vl);
vfloat32m4_t __riscv_vfncvt_rod_f_f_w_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                                 vfloat64m8_t vs2, size_t vl);
// masked functions
// `_mu` forms of __riscv_vfncvt_x_f_w and __riscv_vfncvt_rtz_x_f_w that return
// vint8 vectors (i8mf8 .. i8m4) from a vfloat16 source `vs2`.
// Parameter shape: (vboolN_t vm, vd of the result type, vs2, size_t vl);
// vs2's LMUL suffix is one step above the result's (mf8<-mf4 ... m4<-m8).
// NOTE(review): the `_mu` policy and `rtz` rounding semantics are not stated
// in this listing -- confirm against the RVV intrinsics specification.
vint8mf8_t __riscv_vfncvt_x_f_w_i8mf8_mu(vbool64_t vm, vint8mf8_t vd,
                                         vfloat16mf4_t vs2, size_t vl);
vint8mf8_t __riscv_vfncvt_rtz_x_f_w_i8mf8_mu(vbool64_t vm, vint8mf8_t vd,
                                             vfloat16mf4_t vs2, size_t vl);
vint8mf4_t __riscv_vfncvt_x_f_w_i8mf4_mu(vbool32_t vm, vint8mf4_t vd,
                                         vfloat16mf2_t vs2, size_t vl);
vint8mf4_t __riscv_vfncvt_rtz_x_f_w_i8mf4_mu(vbool32_t vm, vint8mf4_t vd,
                                             vfloat16mf2_t vs2, size_t vl);
vint8mf2_t __riscv_vfncvt_x_f_w_i8mf2_mu(vbool16_t vm, vint8mf2_t vd,
                                         vfloat16m1_t vs2, size_t vl);
vint8mf2_t __riscv_vfncvt_rtz_x_f_w_i8mf2_mu(vbool16_t vm, vint8mf2_t vd,
                                             vfloat16m1_t vs2, size_t vl);
vint8m1_t __riscv_vfncvt_x_f_w_i8m1_mu(vbool8_t vm, vint8m1_t vd,
                                       vfloat16m2_t vs2, size_t vl);
vint8m1_t __riscv_vfncvt_rtz_x_f_w_i8m1_mu(vbool8_t vm, vint8m1_t vd,
                                           vfloat16m2_t vs2, size_t vl);
vint8m2_t __riscv_vfncvt_x_f_w_i8m2_mu(vbool4_t vm, vint8m2_t vd,
                                       vfloat16m4_t vs2, size_t vl);
vint8m2_t __riscv_vfncvt_rtz_x_f_w_i8m2_mu(vbool4_t vm, vint8m2_t vd,
                                           vfloat16m4_t vs2, size_t vl);
vint8m4_t __riscv_vfncvt_x_f_w_i8m4_mu(vbool2_t vm, vint8m4_t vd,
                                       vfloat16m8_t vs2, size_t vl);
vint8m4_t __riscv_vfncvt_rtz_x_f_w_i8m4_mu(vbool2_t vm, vint8m4_t vd,
                                           vfloat16m8_t vs2, size_t vl);
// `_mu` forms of __riscv_vfncvt_xu_f_w and __riscv_vfncvt_rtz_xu_f_w that
// return vuint8 vectors (u8mf8 .. u8m4) from a vfloat16 source `vs2`.
// Parameter shape: (vboolN_t vm, vd of the result type, vs2, size_t vl);
// vs2's LMUL suffix is one step above the result's (mf8<-mf4 ... m4<-m8).
// NOTE(review): the `_mu` policy and `rtz` rounding semantics are not stated
// in this listing -- confirm against the RVV intrinsics specification.
vuint8mf8_t __riscv_vfncvt_xu_f_w_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                           vfloat16mf4_t vs2, size_t vl);
vuint8mf8_t __riscv_vfncvt_rtz_xu_f_w_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                               vfloat16mf4_t vs2, size_t vl);
vuint8mf4_t __riscv_vfncvt_xu_f_w_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                           vfloat16mf2_t vs2, size_t vl);
vuint8mf4_t __riscv_vfncvt_rtz_xu_f_w_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                               vfloat16mf2_t vs2, size_t vl);
vuint8mf2_t __riscv_vfncvt_xu_f_w_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                           vfloat16m1_t vs2, size_t vl);
vuint8mf2_t __riscv_vfncvt_rtz_xu_f_w_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                               vfloat16m1_t vs2, size_t vl);
vuint8m1_t __riscv_vfncvt_xu_f_w_u8m1_mu(vbool8_t vm, vuint8m1_t vd,
                                         vfloat16m2_t vs2, size_t vl);
vuint8m1_t __riscv_vfncvt_rtz_xu_f_w_u8m1_mu(vbool8_t vm, vuint8m1_t vd,
                                             vfloat16m2_t vs2, size_t vl);
vuint8m2_t __riscv_vfncvt_xu_f_w_u8m2_mu(vbool4_t vm, vuint8m2_t vd,
                                         vfloat16m4_t vs2, size_t vl);
vuint8m2_t __riscv_vfncvt_rtz_xu_f_w_u8m2_mu(vbool4_t vm, vuint8m2_t vd,
                                             vfloat16m4_t vs2, size_t vl);
vuint8m4_t __riscv_vfncvt_xu_f_w_u8m4_mu(vbool2_t vm, vuint8m4_t vd,
                                         vfloat16m8_t vs2, size_t vl);
vuint8m4_t __riscv_vfncvt_rtz_xu_f_w_u8m4_mu(vbool2_t vm, vuint8m4_t vd,
                                             vfloat16m8_t vs2, size_t vl);
// `_mu` forms of __riscv_vfncvt_x_f_w and __riscv_vfncvt_rtz_x_f_w that return
// vint16 vectors (i16mf4 .. i16m4) from a vfloat32 source `vs2`.
// Parameter shape: (vboolN_t vm, vd of the result type, vs2, size_t vl);
// vs2's LMUL suffix is one step above the result's (mf4<-mf2 ... m4<-m8).
// NOTE(review): the `_mu` policy and `rtz` rounding semantics are not stated
// in this listing -- confirm against the RVV intrinsics specification.
vint16mf4_t __riscv_vfncvt_x_f_w_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                           vfloat32mf2_t vs2, size_t vl);
vint16mf4_t __riscv_vfncvt_rtz_x_f_w_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                               vfloat32mf2_t vs2, size_t vl);
vint16mf2_t __riscv_vfncvt_x_f_w_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                           vfloat32m1_t vs2, size_t vl);
vint16mf2_t __riscv_vfncvt_rtz_x_f_w_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                               vfloat32m1_t vs2, size_t vl);
vint16m1_t __riscv_vfncvt_x_f_w_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                         vfloat32m2_t vs2, size_t vl);
vint16m1_t __riscv_vfncvt_rtz_x_f_w_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                             vfloat32m2_t vs2, size_t vl);
vint16m2_t __riscv_vfncvt_x_f_w_i16m2_mu(vbool8_t vm, vint16m2_t vd,
                                         vfloat32m4_t vs2, size_t vl);
vint16m2_t __riscv_vfncvt_rtz_x_f_w_i16m2_mu(vbool8_t vm, vint16m2_t vd,
                                             vfloat32m4_t vs2, size_t vl);
vint16m4_t __riscv_vfncvt_x_f_w_i16m4_mu(vbool4_t vm, vint16m4_t vd,
                                         vfloat32m8_t vs2, size_t vl);
vint16m4_t __riscv_vfncvt_rtz_x_f_w_i16m4_mu(vbool4_t vm, vint16m4_t vd,
                                             vfloat32m8_t vs2, size_t vl);
// `_mu` forms of __riscv_vfncvt_xu_f_w and __riscv_vfncvt_rtz_xu_f_w that
// return vuint16 vectors (u16mf4 .. u16m4) from a vfloat32 source `vs2`.
// Parameter shape: (vboolN_t vm, vd of the result type, vs2, size_t vl);
// vs2's LMUL suffix is one step above the result's (mf4<-mf2 ... m4<-m8).
// NOTE(review): the `_mu` policy and `rtz` rounding semantics are not stated
// in this listing -- confirm against the RVV intrinsics specification.
vuint16mf4_t __riscv_vfncvt_xu_f_w_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                             vfloat32mf2_t vs2, size_t vl);
vuint16mf4_t __riscv_vfncvt_rtz_xu_f_w_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                                 vfloat32mf2_t vs2, size_t vl);
vuint16mf2_t __riscv_vfncvt_xu_f_w_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                             vfloat32m1_t vs2, size_t vl);
vuint16mf2_t __riscv_vfncvt_rtz_xu_f_w_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                                 vfloat32m1_t vs2, size_t vl);
vuint16m1_t __riscv_vfncvt_xu_f_w_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                           vfloat32m2_t vs2, size_t vl);
vuint16m1_t __riscv_vfncvt_rtz_xu_f_w_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                               vfloat32m2_t vs2, size_t vl);
vuint16m2_t __riscv_vfncvt_xu_f_w_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                           vfloat32m4_t vs2, size_t vl);
vuint16m2_t __riscv_vfncvt_rtz_xu_f_w_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                               vfloat32m4_t vs2, size_t vl);
vuint16m4_t __riscv_vfncvt_xu_f_w_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                           vfloat32m8_t vs2, size_t vl);
vuint16m4_t __riscv_vfncvt_rtz_xu_f_w_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                               vfloat32m8_t vs2, size_t vl);
// `_mu` forms of __riscv_vfncvt_f_x_w that return vfloat16 vectors
// (f16mf4 .. f16m4) from a vint32 source `vs2`.
// Parameter shape: (vboolN_t vm, vd of the result type, vs2, size_t vl);
// vs2's LMUL suffix is one step above the result's (mf4<-mf2 ... m4<-m8).
vfloat16mf4_t __riscv_vfncvt_f_x_w_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                             vint32mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_x_w_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                             vint32m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_x_w_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                           vint32m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_x_w_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                           vint32m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_x_w_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                           vint32m8_t vs2, size_t vl);
// `_mu` forms of __riscv_vfncvt_f_xu_w that return vfloat16 vectors
// (f16mf4 .. f16m4) from a vuint32 source `vs2`.
// Parameter shape: (vboolN_t vm, vd of the result type, vs2, size_t vl);
// vs2's LMUL suffix is one step above the result's (mf4<-mf2 ... m4<-m8).
vfloat16mf4_t __riscv_vfncvt_f_xu_w_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                              vuint32mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_xu_w_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                              vuint32m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_xu_w_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                            vuint32m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_xu_w_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                            vuint32m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_xu_w_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                            vuint32m8_t vs2, size_t vl);
// `_mu` forms of __riscv_vfncvt_f_f_w and __riscv_vfncvt_rod_f_f_w that return
// vfloat16 vectors (f16mf4 .. f16m4) from a vfloat32 source `vs2`.
// Parameter shape: (vboolN_t vm, vd of the result type, vs2, size_t vl);
// vs2's LMUL suffix is one step above the result's (mf4<-mf2 ... m4<-m8).
// NOTE(review): the `rod` variant's rounding behaviour is not stated in this
// listing -- confirm against the RVV intrinsics specification.
vfloat16mf4_t __riscv_vfncvt_f_f_w_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                             vfloat32mf2_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfncvt_rod_f_f_w_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                                 vfloat32mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_f_w_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                             vfloat32m1_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfncvt_rod_f_f_w_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                                 vfloat32m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_f_w_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                           vfloat32m2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfncvt_rod_f_f_w_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                               vfloat32m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_f_w_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                           vfloat32m4_t vs2, size_t vl);
vfloat16m2_t __riscv_vfncvt_rod_f_f_w_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                               vfloat32m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_f_w_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                           vfloat32m8_t vs2, size_t vl);
vfloat16m4_t __riscv_vfncvt_rod_f_f_w_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                               vfloat32m8_t vs2, size_t vl);
// `_mu` forms of __riscv_vfncvt_x_f_w and __riscv_vfncvt_rtz_x_f_w that return
// vint32 vectors (i32mf2 .. i32m4) from a vfloat64 source `vs2`.
// Parameter shape: (vboolN_t vm, vd of the result type, vs2, size_t vl);
// vs2's LMUL suffix is one step above the result's (mf2<-m1 ... m4<-m8).
// NOTE(review): the `_mu` policy and `rtz` rounding semantics are not stated
// in this listing -- confirm against the RVV intrinsics specification.
vint32mf2_t __riscv_vfncvt_x_f_w_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                           vfloat64m1_t vs2, size_t vl);
vint32mf2_t __riscv_vfncvt_rtz_x_f_w_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                               vfloat64m1_t vs2, size_t vl);
vint32m1_t __riscv_vfncvt_x_f_w_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                         vfloat64m2_t vs2, size_t vl);
vint32m1_t __riscv_vfncvt_rtz_x_f_w_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                             vfloat64m2_t vs2, size_t vl);
vint32m2_t __riscv_vfncvt_x_f_w_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                         vfloat64m4_t vs2, size_t vl);
vint32m2_t __riscv_vfncvt_rtz_x_f_w_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                             vfloat64m4_t vs2, size_t vl);
vint32m4_t __riscv_vfncvt_x_f_w_i32m4_mu(vbool8_t vm, vint32m4_t vd,
                                         vfloat64m8_t vs2, size_t vl);
vint32m4_t __riscv_vfncvt_rtz_x_f_w_i32m4_mu(vbool8_t vm, vint32m4_t vd,
                                             vfloat64m8_t vs2, size_t vl);
// `_mu` forms of __riscv_vfncvt_xu_f_w and __riscv_vfncvt_rtz_xu_f_w that
// return vuint32 vectors (u32mf2 .. u32m4) from a vfloat64 source `vs2`.
// Parameter shape: (vboolN_t vm, vd of the result type, vs2, size_t vl);
// vs2's LMUL suffix is one step above the result's (mf2<-m1 ... m4<-m8).
// NOTE(review): the `_mu` policy and `rtz` rounding semantics are not stated
// in this listing -- confirm against the RVV intrinsics specification.
vuint32mf2_t __riscv_vfncvt_xu_f_w_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                             vfloat64m1_t vs2, size_t vl);
vuint32mf2_t __riscv_vfncvt_rtz_xu_f_w_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                                 vfloat64m1_t vs2, size_t vl);
vuint32m1_t __riscv_vfncvt_xu_f_w_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                           vfloat64m2_t vs2, size_t vl);
vuint32m1_t __riscv_vfncvt_rtz_xu_f_w_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                               vfloat64m2_t vs2, size_t vl);
vuint32m2_t __riscv_vfncvt_xu_f_w_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                           vfloat64m4_t vs2, size_t vl);
vuint32m2_t __riscv_vfncvt_rtz_xu_f_w_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                               vfloat64m4_t vs2, size_t vl);
vuint32m4_t __riscv_vfncvt_xu_f_w_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                           vfloat64m8_t vs2, size_t vl);
vuint32m4_t __riscv_vfncvt_rtz_xu_f_w_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                               vfloat64m8_t vs2, size_t vl);
// `_mu` forms of __riscv_vfncvt_f_x_w that return vfloat32 vectors
// (f32mf2 .. f32m4) from a vint64 source `vs2`.
// Parameter shape: (vboolN_t vm, vd of the result type, vs2, size_t vl);
// vs2's LMUL suffix is one step above the result's (mf2<-m1 ... m4<-m8).
vfloat32mf2_t __riscv_vfncvt_f_x_w_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                             vint64m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_x_w_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                           vint64m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_x_w_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                           vint64m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_x_w_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                           vint64m8_t vs2, size_t vl);
// `_mu` forms of __riscv_vfncvt_f_xu_w that return vfloat32 vectors
// (f32mf2 .. f32m4) from a vuint64 source `vs2`.
// Parameter shape: (vboolN_t vm, vd of the result type, vs2, size_t vl);
// vs2's LMUL suffix is one step above the result's (mf2<-m1 ... m4<-m8).
vfloat32mf2_t __riscv_vfncvt_f_xu_w_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                              vuint64m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_xu_w_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                            vuint64m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_xu_w_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                            vuint64m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_xu_w_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                            vuint64m8_t vs2, size_t vl);
// `_mu` forms of __riscv_vfncvt_f_f_w and __riscv_vfncvt_rod_f_f_w that return
// vfloat32 vectors (f32mf2 .. f32m4) from a vfloat64 source `vs2`.
// Parameter shape: (vboolN_t vm, vd of the result type, vs2, size_t vl);
// vs2's LMUL suffix is one step above the result's (mf2<-m1 ... m4<-m8).
// NOTE(review): the `rod` variant's rounding behaviour is not stated in this
// listing -- confirm against the RVV intrinsics specification.
vfloat32mf2_t __riscv_vfncvt_f_f_w_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat64m1_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfncvt_rod_f_f_w_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                                 vfloat64m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_f_w_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat64m2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfncvt_rod_f_f_w_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                               vfloat64m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_f_w_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat64m4_t vs2, size_t vl);
vfloat32m2_t __riscv_vfncvt_rod_f_f_w_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                               vfloat64m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_f_w_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat64m8_t vs2, size_t vl);
vfloat32m4_t __riscv_vfncvt_rod_f_f_w_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                               vfloat64m8_t vs2, size_t vl);
// `_rm_tu` forms of __riscv_vfncvt_x_f_w that return vint8 vectors
// (i8mf8 .. i8m4) from a vfloat16 source `vs2`.
// These take NO mask parameter, even though they directly follow the `_mu`
// declarations listed under the earlier `// masked functions` comment.
// Parameter shape: (vd of the result type, vs2, unsigned int frm, size_t vl);
// vs2's LMUL suffix is one step above the result's (mf8<-mf4 ... m4<-m8).
// NOTE(review): `frm` is presumably the explicit rounding-mode selector
// implied by the `_rm` suffix -- confirm accepted values against the RVV
// intrinsics specification.
vint8mf8_t __riscv_vfncvt_x_f_w_i8mf8_rm_tu(vint8mf8_t vd, vfloat16mf4_t vs2,
                                            unsigned int frm, size_t vl);
vint8mf4_t __riscv_vfncvt_x_f_w_i8mf4_rm_tu(vint8mf4_t vd, vfloat16mf2_t vs2,
                                            unsigned int frm, size_t vl);
vint8mf2_t __riscv_vfncvt_x_f_w_i8mf2_rm_tu(vint8mf2_t vd, vfloat16m1_t vs2,
                                            unsigned int frm, size_t vl);
vint8m1_t __riscv_vfncvt_x_f_w_i8m1_rm_tu(vint8m1_t vd, vfloat16m2_t vs2,
                                          unsigned int frm, size_t vl);
vint8m2_t __riscv_vfncvt_x_f_w_i8m2_rm_tu(vint8m2_t vd, vfloat16m4_t vs2,
                                          unsigned int frm, size_t vl);
vint8m4_t __riscv_vfncvt_x_f_w_i8m4_rm_tu(vint8m4_t vd, vfloat16m8_t vs2,
                                          unsigned int frm, size_t vl);
// `_rm_tu` forms of __riscv_vfncvt_xu_f_w that return vuint8 vectors
// (u8mf8 .. u8m4) from a vfloat16 source `vs2`. No mask parameter.
// Parameter shape: (vd of the result type, vs2, unsigned int frm, size_t vl);
// vs2's LMUL suffix is one step above the result's (mf8<-mf4 ... m4<-m8).
// NOTE(review): `frm` is presumably the explicit rounding-mode selector
// implied by the `_rm` suffix -- confirm against the RVV intrinsics spec.
vuint8mf8_t __riscv_vfncvt_xu_f_w_u8mf8_rm_tu(vuint8mf8_t vd, vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vuint8mf4_t __riscv_vfncvt_xu_f_w_u8mf4_rm_tu(vuint8mf4_t vd, vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vuint8mf2_t __riscv_vfncvt_xu_f_w_u8mf2_rm_tu(vuint8mf2_t vd, vfloat16m1_t vs2,
                                              unsigned int frm, size_t vl);
vuint8m1_t __riscv_vfncvt_xu_f_w_u8m1_rm_tu(vuint8m1_t vd, vfloat16m2_t vs2,
                                            unsigned int frm, size_t vl);
vuint8m2_t __riscv_vfncvt_xu_f_w_u8m2_rm_tu(vuint8m2_t vd, vfloat16m4_t vs2,
                                            unsigned int frm, size_t vl);
vuint8m4_t __riscv_vfncvt_xu_f_w_u8m4_rm_tu(vuint8m4_t vd, vfloat16m8_t vs2,
                                            unsigned int frm, size_t vl);
// `_rm_tu` forms of __riscv_vfncvt_x_f_w that return vint16 vectors
// (i16mf4 .. i16m4) from a vfloat32 source `vs2`. No mask parameter.
// Parameter shape: (vd of the result type, vs2, unsigned int frm, size_t vl);
// vs2's LMUL suffix is one step above the result's (mf4<-mf2 ... m4<-m8).
// NOTE(review): `frm` is presumably the explicit rounding-mode selector
// implied by the `_rm` suffix -- confirm against the RVV intrinsics spec.
vint16mf4_t __riscv_vfncvt_x_f_w_i16mf4_rm_tu(vint16mf4_t vd, vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vint16mf2_t __riscv_vfncvt_x_f_w_i16mf2_rm_tu(vint16mf2_t vd, vfloat32m1_t vs2,
                                              unsigned int frm, size_t vl);
vint16m1_t __riscv_vfncvt_x_f_w_i16m1_rm_tu(vint16m1_t vd, vfloat32m2_t vs2,
                                            unsigned int frm, size_t vl);
vint16m2_t __riscv_vfncvt_x_f_w_i16m2_rm_tu(vint16m2_t vd, vfloat32m4_t vs2,
                                            unsigned int frm, size_t vl);
vint16m4_t __riscv_vfncvt_x_f_w_i16m4_rm_tu(vint16m4_t vd, vfloat32m8_t vs2,
                                            unsigned int frm, size_t vl);
// `_rm_tu` forms of __riscv_vfncvt_xu_f_w that return vuint16 vectors
// (u16mf4 .. u16m4) from a vfloat32 source `vs2`. No mask parameter.
// Parameter shape: (vd of the result type, vs2, unsigned int frm, size_t vl);
// vs2's LMUL suffix is one step above the result's (mf4<-mf2 ... m4<-m8).
// NOTE(review): `frm` is presumably the explicit rounding-mode selector
// implied by the `_rm` suffix -- confirm against the RVV intrinsics spec.
vuint16mf4_t __riscv_vfncvt_xu_f_w_u16mf4_rm_tu(vuint16mf4_t vd,
                                                vfloat32mf2_t vs2,
                                                unsigned int frm, size_t vl);
vuint16mf2_t __riscv_vfncvt_xu_f_w_u16mf2_rm_tu(vuint16mf2_t vd,
                                                vfloat32m1_t vs2,
                                                unsigned int frm, size_t vl);
vuint16m1_t __riscv_vfncvt_xu_f_w_u16m1_rm_tu(vuint16m1_t vd, vfloat32m2_t vs2,
                                              unsigned int frm, size_t vl);
vuint16m2_t __riscv_vfncvt_xu_f_w_u16m2_rm_tu(vuint16m2_t vd, vfloat32m4_t vs2,
                                              unsigned int frm, size_t vl);
vuint16m4_t __riscv_vfncvt_xu_f_w_u16m4_rm_tu(vuint16m4_t vd, vfloat32m8_t vs2,
                                              unsigned int frm, size_t vl);
// `_rm_tu` forms of __riscv_vfncvt_f_x_w that return vfloat16 vectors
// (f16mf4 .. f16m4) from a vint32 source `vs2`. No mask parameter.
// Parameter shape: (vd of the result type, vs2, unsigned int frm, size_t vl);
// vs2's LMUL suffix is one step above the result's (mf4<-mf2 ... m4<-m8).
// NOTE(review): `frm` is presumably the explicit rounding-mode selector
// implied by the `_rm` suffix -- confirm against the RVV intrinsics spec.
vfloat16mf4_t __riscv_vfncvt_f_x_w_f16mf4_rm_tu(vfloat16mf4_t vd,
                                                vint32mf2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_x_w_f16mf2_rm_tu(vfloat16mf2_t vd,
                                                vint32m1_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_x_w_f16m1_rm_tu(vfloat16m1_t vd, vint32m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_x_w_f16m2_rm_tu(vfloat16m2_t vd, vint32m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_x_w_f16m4_rm_tu(vfloat16m4_t vd, vint32m8_t vs2,
                                              unsigned int frm, size_t vl);
// `_rm_tu` forms of __riscv_vfncvt_f_xu_w that return vfloat16 vectors
// (f16mf4 .. f16m4) from a vuint32 source `vs2`. No mask parameter.
// Parameter shape: (vd of the result type, vs2, unsigned int frm, size_t vl);
// vs2's LMUL suffix is one step above the result's (mf4<-mf2 ... m4<-m8).
// NOTE(review): `frm` is presumably the explicit rounding-mode selector
// implied by the `_rm` suffix -- confirm against the RVV intrinsics spec.
vfloat16mf4_t __riscv_vfncvt_f_xu_w_f16mf4_rm_tu(vfloat16mf4_t vd,
                                                 vuint32mf2_t vs2,
                                                 unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_xu_w_f16mf2_rm_tu(vfloat16mf2_t vd,
                                                 vuint32m1_t vs2,
                                                 unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_xu_w_f16m1_rm_tu(vfloat16m1_t vd, vuint32m2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_xu_w_f16m2_rm_tu(vfloat16m2_t vd, vuint32m4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_xu_w_f16m4_rm_tu(vfloat16m4_t vd, vuint32m8_t vs2,
                                               unsigned int frm, size_t vl);
// `_rm_tu` forms of __riscv_vfncvt_f_f_w that return vfloat16 vectors
// (f16mf4 .. f16m4) from a vfloat32 source `vs2`. No mask parameter, and no
// `rod` counterpart is declared in this `_rm_tu` group.
// Parameter shape: (vd of the result type, vs2, unsigned int frm, size_t vl);
// vs2's LMUL suffix is one step above the result's (mf4<-mf2 ... m4<-m8).
// NOTE(review): `frm` is presumably the explicit rounding-mode selector
// implied by the `_rm` suffix -- confirm against the RVV intrinsics spec.
vfloat16mf4_t __riscv_vfncvt_f_f_w_f16mf4_rm_tu(vfloat16mf4_t vd,
                                                vfloat32mf2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_f_w_f16mf2_rm_tu(vfloat16mf2_t vd,
                                                vfloat32m1_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_f_w_f16m1_rm_tu(vfloat16m1_t vd, vfloat32m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_f_w_f16m2_rm_tu(vfloat16m2_t vd, vfloat32m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_f_w_f16m4_rm_tu(vfloat16m4_t vd, vfloat32m8_t vs2,
                                              unsigned int frm, size_t vl);
// `_rm_tu` forms of __riscv_vfncvt_x_f_w that return vint32 vectors
// (i32mf2 .. i32m4) from a vfloat64 source `vs2`. No mask parameter.
// Parameter shape: (vd of the result type, vs2, unsigned int frm, size_t vl);
// vs2's LMUL suffix is one step above the result's (mf2<-m1 ... m4<-m8).
// NOTE(review): `frm` is presumably the explicit rounding-mode selector
// implied by the `_rm` suffix -- confirm against the RVV intrinsics spec.
vint32mf2_t __riscv_vfncvt_x_f_w_i32mf2_rm_tu(vint32mf2_t vd, vfloat64m1_t vs2,
                                              unsigned int frm, size_t vl);
vint32m1_t __riscv_vfncvt_x_f_w_i32m1_rm_tu(vint32m1_t vd, vfloat64m2_t vs2,
                                            unsigned int frm, size_t vl);
vint32m2_t __riscv_vfncvt_x_f_w_i32m2_rm_tu(vint32m2_t vd, vfloat64m4_t vs2,
                                            unsigned int frm, size_t vl);
vint32m4_t __riscv_vfncvt_x_f_w_i32m4_rm_tu(vint32m4_t vd, vfloat64m8_t vs2,
                                            unsigned int frm, size_t vl);
// `_rm_tu` forms of __riscv_vfncvt_xu_f_w that return vuint32 vectors
// (u32mf2 .. u32m4) from a vfloat64 source `vs2`. No mask parameter.
// Parameter shape: (vd of the result type, vs2, unsigned int frm, size_t vl);
// vs2's LMUL suffix is one step above the result's (mf2<-m1 ... m4<-m8).
// NOTE(review): `frm` is presumably the explicit rounding-mode selector
// implied by the `_rm` suffix -- confirm against the RVV intrinsics spec.
vuint32mf2_t __riscv_vfncvt_xu_f_w_u32mf2_rm_tu(vuint32mf2_t vd,
                                                vfloat64m1_t vs2,
                                                unsigned int frm, size_t vl);
vuint32m1_t __riscv_vfncvt_xu_f_w_u32m1_rm_tu(vuint32m1_t vd, vfloat64m2_t vs2,
                                              unsigned int frm, size_t vl);
vuint32m2_t __riscv_vfncvt_xu_f_w_u32m2_rm_tu(vuint32m2_t vd, vfloat64m4_t vs2,
                                              unsigned int frm, size_t vl);
vuint32m4_t __riscv_vfncvt_xu_f_w_u32m4_rm_tu(vuint32m4_t vd, vfloat64m8_t vs2,
                                              unsigned int frm, size_t vl);
// `_rm_tu` forms of __riscv_vfncvt_f_x_w that return vfloat32 vectors
// (f32mf2 .. f32m4) from a vint64 source `vs2`. No mask parameter.
// Parameter shape: (vd of the result type, vs2, unsigned int frm, size_t vl);
// vs2's LMUL suffix is one step above the result's (mf2<-m1 ... m4<-m8).
// NOTE(review): `frm` is presumably the explicit rounding-mode selector
// implied by the `_rm` suffix -- confirm against the RVV intrinsics spec.
vfloat32mf2_t __riscv_vfncvt_f_x_w_f32mf2_rm_tu(vfloat32mf2_t vd,
                                                vint64m1_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_x_w_f32m1_rm_tu(vfloat32m1_t vd, vint64m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_x_w_f32m2_rm_tu(vfloat32m2_t vd, vint64m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_x_w_f32m4_rm_tu(vfloat32m4_t vd, vint64m8_t vs2,
                                              unsigned int frm, size_t vl);
// `_rm_tu` forms of __riscv_vfncvt_f_xu_w that return vfloat32 vectors
// (f32mf2 .. f32m4) from a vuint64 source `vs2`. No mask parameter.
// Parameter shape: (vd of the result type, vs2, unsigned int frm, size_t vl);
// vs2's LMUL suffix is one step above the result's (mf2<-m1 ... m4<-m8).
// NOTE(review): `frm` is presumably the explicit rounding-mode selector
// implied by the `_rm` suffix -- confirm against the RVV intrinsics spec.
vfloat32mf2_t __riscv_vfncvt_f_xu_w_f32mf2_rm_tu(vfloat32mf2_t vd,
                                                 vuint64m1_t vs2,
                                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_xu_w_f32m1_rm_tu(vfloat32m1_t vd, vuint64m2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_xu_w_f32m2_rm_tu(vfloat32m2_t vd, vuint64m4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_xu_w_f32m4_rm_tu(vfloat32m4_t vd, vuint64m8_t vs2,
                                               unsigned int frm, size_t vl);
// `_rm_tu` forms of __riscv_vfncvt_f_f_w that return vfloat32 vectors
// (f32mf2 .. f32m4) from a vfloat64 source `vs2`. No mask parameter, and no
// `rod` counterpart is declared in this `_rm_tu` group.
// Parameter shape: (vd of the result type, vs2, unsigned int frm, size_t vl);
// vs2's LMUL suffix is one step above the result's (mf2<-m1 ... m4<-m8).
// NOTE(review): `frm` is presumably the explicit rounding-mode selector
// implied by the `_rm` suffix -- confirm against the RVV intrinsics spec.
vfloat32mf2_t __riscv_vfncvt_f_f_w_f32mf2_rm_tu(vfloat32mf2_t vd,
                                                vfloat64m1_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_f_w_f32m1_rm_tu(vfloat32m1_t vd, vfloat64m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_f_w_f32m2_rm_tu(vfloat32m2_t vd, vfloat64m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_f_w_f32m4_rm_tu(vfloat32m4_t vd, vfloat64m8_t vs2,
                                              unsigned int frm, size_t vl);
// masked functions: `_rm_tum` variants of the narrowing conversions
// (x_f_w, xu_f_w, f_x_w, f_xu_w, f_f_w). Each prototype takes a mask `vm`, an
// operand `vd` of the result type, a source `vs2` whose element width is twice
// the result's, an `unsigned int frm`, and a `size_t vl`.
// NOTE(review): `_tum` presumably means tail-undisturbed with mask-agnostic
// inactive elements, and `frm` presumably is the rounding mode implied by the
// `_rm` infix -- confirm against the RVV intrinsics policy naming.
vint8mf8_t __riscv_vfncvt_x_f_w_i8mf8_rm_tum(vbool64_t vm, vint8mf8_t vd,
                                             vfloat16mf4_t vs2,
                                             unsigned int frm, size_t vl);
vint8mf4_t __riscv_vfncvt_x_f_w_i8mf4_rm_tum(vbool32_t vm, vint8mf4_t vd,
                                             vfloat16mf2_t vs2,
                                             unsigned int frm, size_t vl);
vint8mf2_t __riscv_vfncvt_x_f_w_i8mf2_rm_tum(vbool16_t vm, vint8mf2_t vd,
                                             vfloat16m1_t vs2, unsigned int frm,
                                             size_t vl);
vint8m1_t __riscv_vfncvt_x_f_w_i8m1_rm_tum(vbool8_t vm, vint8m1_t vd,
                                           vfloat16m2_t vs2, unsigned int frm,
                                           size_t vl);
vint8m2_t __riscv_vfncvt_x_f_w_i8m2_rm_tum(vbool4_t vm, vint8m2_t vd,
                                           vfloat16m4_t vs2, unsigned int frm,
                                           size_t vl);
vint8m4_t __riscv_vfncvt_x_f_w_i8m4_rm_tum(vbool2_t vm, vint8m4_t vd,
                                           vfloat16m8_t vs2, unsigned int frm,
                                           size_t vl);
vuint8mf8_t __riscv_vfncvt_xu_f_w_u8mf8_rm_tum(vbool64_t vm, vuint8mf8_t vd,
                                               vfloat16mf4_t vs2,
                                               unsigned int frm, size_t vl);
vuint8mf4_t __riscv_vfncvt_xu_f_w_u8mf4_rm_tum(vbool32_t vm, vuint8mf4_t vd,
                                               vfloat16mf2_t vs2,
                                               unsigned int frm, size_t vl);
vuint8mf2_t __riscv_vfncvt_xu_f_w_u8mf2_rm_tum(vbool16_t vm, vuint8mf2_t vd,
                                               vfloat16m1_t vs2,
                                               unsigned int frm, size_t vl);
vuint8m1_t __riscv_vfncvt_xu_f_w_u8m1_rm_tum(vbool8_t vm, vuint8m1_t vd,
                                             vfloat16m2_t vs2, unsigned int frm,
                                             size_t vl);
vuint8m2_t __riscv_vfncvt_xu_f_w_u8m2_rm_tum(vbool4_t vm, vuint8m2_t vd,
                                             vfloat16m4_t vs2, unsigned int frm,
                                             size_t vl);
vuint8m4_t __riscv_vfncvt_xu_f_w_u8m4_rm_tum(vbool2_t vm, vuint8m4_t vd,
                                             vfloat16m8_t vs2, unsigned int frm,
                                             size_t vl);
vint16mf4_t __riscv_vfncvt_x_f_w_i16mf4_rm_tum(vbool64_t vm, vint16mf4_t vd,
                                               vfloat32mf2_t vs2,
                                               unsigned int frm, size_t vl);
vint16mf2_t __riscv_vfncvt_x_f_w_i16mf2_rm_tum(vbool32_t vm, vint16mf2_t vd,
                                               vfloat32m1_t vs2,
                                               unsigned int frm, size_t vl);
vint16m1_t __riscv_vfncvt_x_f_w_i16m1_rm_tum(vbool16_t vm, vint16m1_t vd,
                                             vfloat32m2_t vs2, unsigned int frm,
                                             size_t vl);
vint16m2_t __riscv_vfncvt_x_f_w_i16m2_rm_tum(vbool8_t vm, vint16m2_t vd,
                                             vfloat32m4_t vs2, unsigned int frm,
                                             size_t vl);
vint16m4_t __riscv_vfncvt_x_f_w_i16m4_rm_tum(vbool4_t vm, vint16m4_t vd,
                                             vfloat32m8_t vs2, unsigned int frm,
                                             size_t vl);
vuint16mf4_t __riscv_vfncvt_xu_f_w_u16mf4_rm_tum(vbool64_t vm, vuint16mf4_t vd,
                                                 vfloat32mf2_t vs2,
                                                 unsigned int frm, size_t vl);
vuint16mf2_t __riscv_vfncvt_xu_f_w_u16mf2_rm_tum(vbool32_t vm, vuint16mf2_t vd,
                                                 vfloat32m1_t vs2,
                                                 unsigned int frm, size_t vl);
vuint16m1_t __riscv_vfncvt_xu_f_w_u16m1_rm_tum(vbool16_t vm, vuint16m1_t vd,
                                               vfloat32m2_t vs2,
                                               unsigned int frm, size_t vl);
vuint16m2_t __riscv_vfncvt_xu_f_w_u16m2_rm_tum(vbool8_t vm, vuint16m2_t vd,
                                               vfloat32m4_t vs2,
                                               unsigned int frm, size_t vl);
vuint16m4_t __riscv_vfncvt_xu_f_w_u16m4_rm_tum(vbool4_t vm, vuint16m4_t vd,
                                               vfloat32m8_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfncvt_f_x_w_f16mf4_rm_tum(vbool64_t vm, vfloat16mf4_t vd,
                                                 vint32mf2_t vs2,
                                                 unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_x_w_f16mf2_rm_tum(vbool32_t vm, vfloat16mf2_t vd,
                                                 vint32m1_t vs2,
                                                 unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_x_w_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                               vint32m2_t vs2, unsigned int frm,
                                               size_t vl);
vfloat16m2_t __riscv_vfncvt_f_x_w_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                               vint32m4_t vs2, unsigned int frm,
                                               size_t vl);
vfloat16m4_t __riscv_vfncvt_f_x_w_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                               vint32m8_t vs2, unsigned int frm,
                                               size_t vl);
vfloat16mf4_t __riscv_vfncvt_f_xu_w_f16mf4_rm_tum(vbool64_t vm,
                                                  vfloat16mf4_t vd,
                                                  vuint32mf2_t vs2,
                                                  unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_xu_w_f16mf2_rm_tum(vbool32_t vm,
                                                  vfloat16mf2_t vd,
                                                  vuint32m1_t vs2,
                                                  unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_xu_w_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                                vuint32m2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_xu_w_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                                vuint32m4_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_xu_w_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                                vuint32m8_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfncvt_f_f_w_f16mf4_rm_tum(vbool64_t vm, vfloat16mf4_t vd,
                                                 vfloat32mf2_t vs2,
                                                 unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_f_w_f16mf2_rm_tum(vbool32_t vm, vfloat16mf2_t vd,
                                                 vfloat32m1_t vs2,
                                                 unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_f_w_f16m1_rm_tum(vbool16_t vm, vfloat16m1_t vd,
                                               vfloat32m2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_f_w_f16m2_rm_tum(vbool8_t vm, vfloat16m2_t vd,
                                               vfloat32m4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_f_w_f16m4_rm_tum(vbool4_t vm, vfloat16m4_t vd,
                                               vfloat32m8_t vs2,
                                               unsigned int frm, size_t vl);
vint32mf2_t __riscv_vfncvt_x_f_w_i32mf2_rm_tum(vbool64_t vm, vint32mf2_t vd,
                                               vfloat64m1_t vs2,
                                               unsigned int frm, size_t vl);
vint32m1_t __riscv_vfncvt_x_f_w_i32m1_rm_tum(vbool32_t vm, vint32m1_t vd,
                                             vfloat64m2_t vs2, unsigned int frm,
                                             size_t vl);
vint32m2_t __riscv_vfncvt_x_f_w_i32m2_rm_tum(vbool16_t vm, vint32m2_t vd,
                                             vfloat64m4_t vs2, unsigned int frm,
                                             size_t vl);
vint32m4_t __riscv_vfncvt_x_f_w_i32m4_rm_tum(vbool8_t vm, vint32m4_t vd,
                                             vfloat64m8_t vs2, unsigned int frm,
                                             size_t vl);
vuint32mf2_t __riscv_vfncvt_xu_f_w_u32mf2_rm_tum(vbool64_t vm, vuint32mf2_t vd,
                                                 vfloat64m1_t vs2,
                                                 unsigned int frm, size_t vl);
vuint32m1_t __riscv_vfncvt_xu_f_w_u32m1_rm_tum(vbool32_t vm, vuint32m1_t vd,
                                               vfloat64m2_t vs2,
                                               unsigned int frm, size_t vl);
vuint32m2_t __riscv_vfncvt_xu_f_w_u32m2_rm_tum(vbool16_t vm, vuint32m2_t vd,
                                               vfloat64m4_t vs2,
                                               unsigned int frm, size_t vl);
vuint32m4_t __riscv_vfncvt_xu_f_w_u32m4_rm_tum(vbool8_t vm, vuint32m4_t vd,
                                               vfloat64m8_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfncvt_f_x_w_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                                 vint64m1_t vs2,
                                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_x_w_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                               vint64m2_t vs2, unsigned int frm,
                                               size_t vl);
vfloat32m2_t __riscv_vfncvt_f_x_w_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                               vint64m4_t vs2, unsigned int frm,
                                               size_t vl);
vfloat32m4_t __riscv_vfncvt_f_x_w_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                               vint64m8_t vs2, unsigned int frm,
                                               size_t vl);
vfloat32mf2_t __riscv_vfncvt_f_xu_w_f32mf2_rm_tum(vbool64_t vm,
                                                  vfloat32mf2_t vd,
                                                  vuint64m1_t vs2,
                                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_xu_w_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                                vuint64m2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_xu_w_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                                vuint64m4_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_xu_w_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                                vuint64m8_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfncvt_f_f_w_f32mf2_rm_tum(vbool64_t vm, vfloat32mf2_t vd,
                                                 vfloat64m1_t vs2,
                                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_f_w_f32m1_rm_tum(vbool32_t vm, vfloat32m1_t vd,
                                               vfloat64m2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_f_w_f32m2_rm_tum(vbool16_t vm, vfloat32m2_t vd,
                                               vfloat64m4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_f_w_f32m4_rm_tum(vbool8_t vm, vfloat32m4_t vd,
                                               vfloat64m8_t vs2,
                                               unsigned int frm, size_t vl);
// masked functions: `_rm_tumu` variants of the narrowing conversions
// (x_f_w, xu_f_w, f_x_w, f_xu_w, f_f_w). Each prototype takes a mask `vm`, an
// operand `vd` of the result type, a source `vs2` whose element width is twice
// the result's, an `unsigned int frm`, and a `size_t vl`.
// NOTE(review): `_tumu` presumably means tail-undisturbed and mask-undisturbed
// (both tail and inactive elements taken from `vd`), and `frm` presumably is
// the rounding mode implied by the `_rm` infix -- confirm against the RVV
// intrinsics policy naming.
vint8mf8_t __riscv_vfncvt_x_f_w_i8mf8_rm_tumu(vbool64_t vm, vint8mf8_t vd,
                                              vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vint8mf4_t __riscv_vfncvt_x_f_w_i8mf4_rm_tumu(vbool32_t vm, vint8mf4_t vd,
                                              vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vint8mf2_t __riscv_vfncvt_x_f_w_i8mf2_rm_tumu(vbool16_t vm, vint8mf2_t vd,
                                              vfloat16m1_t vs2,
                                              unsigned int frm, size_t vl);
vint8m1_t __riscv_vfncvt_x_f_w_i8m1_rm_tumu(vbool8_t vm, vint8m1_t vd,
                                            vfloat16m2_t vs2, unsigned int frm,
                                            size_t vl);
vint8m2_t __riscv_vfncvt_x_f_w_i8m2_rm_tumu(vbool4_t vm, vint8m2_t vd,
                                            vfloat16m4_t vs2, unsigned int frm,
                                            size_t vl);
vint8m4_t __riscv_vfncvt_x_f_w_i8m4_rm_tumu(vbool2_t vm, vint8m4_t vd,
                                            vfloat16m8_t vs2, unsigned int frm,
                                            size_t vl);
vuint8mf8_t __riscv_vfncvt_xu_f_w_u8mf8_rm_tumu(vbool64_t vm, vuint8mf8_t vd,
                                                vfloat16mf4_t vs2,
                                                unsigned int frm, size_t vl);
vuint8mf4_t __riscv_vfncvt_xu_f_w_u8mf4_rm_tumu(vbool32_t vm, vuint8mf4_t vd,
                                                vfloat16mf2_t vs2,
                                                unsigned int frm, size_t vl);
vuint8mf2_t __riscv_vfncvt_xu_f_w_u8mf2_rm_tumu(vbool16_t vm, vuint8mf2_t vd,
                                                vfloat16m1_t vs2,
                                                unsigned int frm, size_t vl);
vuint8m1_t __riscv_vfncvt_xu_f_w_u8m1_rm_tumu(vbool8_t vm, vuint8m1_t vd,
                                              vfloat16m2_t vs2,
                                              unsigned int frm, size_t vl);
vuint8m2_t __riscv_vfncvt_xu_f_w_u8m2_rm_tumu(vbool4_t vm, vuint8m2_t vd,
                                              vfloat16m4_t vs2,
                                              unsigned int frm, size_t vl);
vuint8m4_t __riscv_vfncvt_xu_f_w_u8m4_rm_tumu(vbool2_t vm, vuint8m4_t vd,
                                              vfloat16m8_t vs2,
                                              unsigned int frm, size_t vl);
vint16mf4_t __riscv_vfncvt_x_f_w_i16mf4_rm_tumu(vbool64_t vm, vint16mf4_t vd,
                                                vfloat32mf2_t vs2,
                                                unsigned int frm, size_t vl);
vint16mf2_t __riscv_vfncvt_x_f_w_i16mf2_rm_tumu(vbool32_t vm, vint16mf2_t vd,
                                                vfloat32m1_t vs2,
                                                unsigned int frm, size_t vl);
vint16m1_t __riscv_vfncvt_x_f_w_i16m1_rm_tumu(vbool16_t vm, vint16m1_t vd,
                                              vfloat32m2_t vs2,
                                              unsigned int frm, size_t vl);
vint16m2_t __riscv_vfncvt_x_f_w_i16m2_rm_tumu(vbool8_t vm, vint16m2_t vd,
                                              vfloat32m4_t vs2,
                                              unsigned int frm, size_t vl);
vint16m4_t __riscv_vfncvt_x_f_w_i16m4_rm_tumu(vbool4_t vm, vint16m4_t vd,
                                              vfloat32m8_t vs2,
                                              unsigned int frm, size_t vl);
vuint16mf4_t __riscv_vfncvt_xu_f_w_u16mf4_rm_tumu(vbool64_t vm, vuint16mf4_t vd,
                                                  vfloat32mf2_t vs2,
                                                  unsigned int frm, size_t vl);
vuint16mf2_t __riscv_vfncvt_xu_f_w_u16mf2_rm_tumu(vbool32_t vm, vuint16mf2_t vd,
                                                  vfloat32m1_t vs2,
                                                  unsigned int frm, size_t vl);
vuint16m1_t __riscv_vfncvt_xu_f_w_u16m1_rm_tumu(vbool16_t vm, vuint16m1_t vd,
                                                vfloat32m2_t vs2,
                                                unsigned int frm, size_t vl);
vuint16m2_t __riscv_vfncvt_xu_f_w_u16m2_rm_tumu(vbool8_t vm, vuint16m2_t vd,
                                                vfloat32m4_t vs2,
                                                unsigned int frm, size_t vl);
vuint16m4_t __riscv_vfncvt_xu_f_w_u16m4_rm_tumu(vbool4_t vm, vuint16m4_t vd,
                                                vfloat32m8_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfncvt_f_x_w_f16mf4_rm_tumu(vbool64_t vm,
                                                  vfloat16mf4_t vd,
                                                  vint32mf2_t vs2,
                                                  unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_x_w_f16mf2_rm_tumu(vbool32_t vm,
                                                  vfloat16mf2_t vd,
                                                  vint32m1_t vs2,
                                                  unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_x_w_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                                vint32m2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_x_w_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                                vint32m4_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_x_w_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                                vint32m8_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfncvt_f_xu_w_f16mf4_rm_tumu(vbool64_t vm,
                                                   vfloat16mf4_t vd,
                                                   vuint32mf2_t vs2,
                                                   unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_xu_w_f16mf2_rm_tumu(vbool32_t vm,
                                                   vfloat16mf2_t vd,
                                                   vuint32m1_t vs2,
                                                   unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_xu_w_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                                 vuint32m2_t vs2,
                                                 unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_xu_w_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                                 vuint32m4_t vs2,
                                                 unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_xu_w_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                                 vuint32m8_t vs2,
                                                 unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfncvt_f_f_w_f16mf4_rm_tumu(vbool64_t vm,
                                                  vfloat16mf4_t vd,
                                                  vfloat32mf2_t vs2,
                                                  unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_f_w_f16mf2_rm_tumu(vbool32_t vm,
                                                  vfloat16mf2_t vd,
                                                  vfloat32m1_t vs2,
                                                  unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_f_w_f16m1_rm_tumu(vbool16_t vm, vfloat16m1_t vd,
                                                vfloat32m2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_f_w_f16m2_rm_tumu(vbool8_t vm, vfloat16m2_t vd,
                                                vfloat32m4_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_f_w_f16m4_rm_tumu(vbool4_t vm, vfloat16m4_t vd,
                                                vfloat32m8_t vs2,
                                                unsigned int frm, size_t vl);
vint32mf2_t __riscv_vfncvt_x_f_w_i32mf2_rm_tumu(vbool64_t vm, vint32mf2_t vd,
                                                vfloat64m1_t vs2,
                                                unsigned int frm, size_t vl);
vint32m1_t __riscv_vfncvt_x_f_w_i32m1_rm_tumu(vbool32_t vm, vint32m1_t vd,
                                              vfloat64m2_t vs2,
                                              unsigned int frm, size_t vl);
vint32m2_t __riscv_vfncvt_x_f_w_i32m2_rm_tumu(vbool16_t vm, vint32m2_t vd,
                                              vfloat64m4_t vs2,
                                              unsigned int frm, size_t vl);
vint32m4_t __riscv_vfncvt_x_f_w_i32m4_rm_tumu(vbool8_t vm, vint32m4_t vd,
                                              vfloat64m8_t vs2,
                                              unsigned int frm, size_t vl);
vuint32mf2_t __riscv_vfncvt_xu_f_w_u32mf2_rm_tumu(vbool64_t vm, vuint32mf2_t vd,
                                                  vfloat64m1_t vs2,
                                                  unsigned int frm, size_t vl);
vuint32m1_t __riscv_vfncvt_xu_f_w_u32m1_rm_tumu(vbool32_t vm, vuint32m1_t vd,
                                                vfloat64m2_t vs2,
                                                unsigned int frm, size_t vl);
vuint32m2_t __riscv_vfncvt_xu_f_w_u32m2_rm_tumu(vbool16_t vm, vuint32m2_t vd,
                                                vfloat64m4_t vs2,
                                                unsigned int frm, size_t vl);
vuint32m4_t __riscv_vfncvt_xu_f_w_u32m4_rm_tumu(vbool8_t vm, vuint32m4_t vd,
                                                vfloat64m8_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfncvt_f_x_w_f32mf2_rm_tumu(vbool64_t vm,
                                                  vfloat32mf2_t vd,
                                                  vint64m1_t vs2,
                                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_x_w_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                                vint64m2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_x_w_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                                vint64m4_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_x_w_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                                vint64m8_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfncvt_f_xu_w_f32mf2_rm_tumu(vbool64_t vm,
                                                   vfloat32mf2_t vd,
                                                   vuint64m1_t vs2,
                                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_xu_w_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                                 vuint64m2_t vs2,
                                                 unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_xu_w_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                                 vuint64m4_t vs2,
                                                 unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_xu_w_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                                 vuint64m8_t vs2,
                                                 unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfncvt_f_f_w_f32mf2_rm_tumu(vbool64_t vm,
                                                  vfloat32mf2_t vd,
                                                  vfloat64m1_t vs2,
                                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_f_w_f32m1_rm_tumu(vbool32_t vm, vfloat32m1_t vd,
                                                vfloat64m2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_f_w_f32m2_rm_tumu(vbool16_t vm, vfloat32m2_t vd,
                                                vfloat64m4_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_f_w_f32m4_rm_tumu(vbool8_t vm, vfloat32m4_t vd,
                                                vfloat64m8_t vs2,
                                                unsigned int frm, size_t vl);
// masked functions
// __riscv_vfncvt_x_f_w_i8<lmul>_rm_mu: one prototype per result LMUL
// (mf8 .. m4). Each takes a mask `vm`, an operand `vd` of the result type, a
// source `vs2` of float16 elements at twice the result's LMUL, an
// `unsigned int frm`, and the vector length `vl`; the mask type is
// vbool<N>_t with N = result SEW / LMUL.
// NOTE(review): by the RVV intrinsic naming convention this is the narrowing
// float-to-signed-integer convert (float16 -> int8), `frm` selects the
// rounding mode, and `_mu` means mask-undisturbed with `vd` supplying the
// masked-off elements -- confirm against the RVV intrinsic specification.
vint8mf8_t __riscv_vfncvt_x_f_w_i8mf8_rm_mu(vbool64_t vm, vint8mf8_t vd,
                                            vfloat16mf4_t vs2, unsigned int frm,
                                            size_t vl);
vint8mf4_t __riscv_vfncvt_x_f_w_i8mf4_rm_mu(vbool32_t vm, vint8mf4_t vd,
                                            vfloat16mf2_t vs2, unsigned int frm,
                                            size_t vl);
vint8mf2_t __riscv_vfncvt_x_f_w_i8mf2_rm_mu(vbool16_t vm, vint8mf2_t vd,
                                            vfloat16m1_t vs2, unsigned int frm,
                                            size_t vl);
vint8m1_t __riscv_vfncvt_x_f_w_i8m1_rm_mu(vbool8_t vm, vint8m1_t vd,
                                          vfloat16m2_t vs2, unsigned int frm,
                                          size_t vl);
vint8m2_t __riscv_vfncvt_x_f_w_i8m2_rm_mu(vbool4_t vm, vint8m2_t vd,
                                          vfloat16m4_t vs2, unsigned int frm,
                                          size_t vl);
vint8m4_t __riscv_vfncvt_x_f_w_i8m4_rm_mu(vbool2_t vm, vint8m4_t vd,
                                          vfloat16m8_t vs2, unsigned int frm,
                                          size_t vl);
// __riscv_vfncvt_xu_f_w_u8<lmul>_rm_mu: one prototype per result LMUL
// (mf8 .. m4). Each takes a mask `vm`, an operand `vd` of the result type, a
// source `vs2` of float16 elements at twice the result's LMUL, an
// `unsigned int frm`, and the vector length `vl`; the mask type is
// vbool<N>_t with N = result SEW / LMUL.
// NOTE(review): by the RVV intrinsic naming convention this is the narrowing
// float-to-unsigned-integer convert (float16 -> uint8), `frm` selects the
// rounding mode, and `_mu` means mask-undisturbed with `vd` supplying the
// masked-off elements -- confirm against the RVV intrinsic specification.
vuint8mf8_t __riscv_vfncvt_xu_f_w_u8mf8_rm_mu(vbool64_t vm, vuint8mf8_t vd,
                                              vfloat16mf4_t vs2,
                                              unsigned int frm, size_t vl);
vuint8mf4_t __riscv_vfncvt_xu_f_w_u8mf4_rm_mu(vbool32_t vm, vuint8mf4_t vd,
                                              vfloat16mf2_t vs2,
                                              unsigned int frm, size_t vl);
vuint8mf2_t __riscv_vfncvt_xu_f_w_u8mf2_rm_mu(vbool16_t vm, vuint8mf2_t vd,
                                              vfloat16m1_t vs2,
                                              unsigned int frm, size_t vl);
vuint8m1_t __riscv_vfncvt_xu_f_w_u8m1_rm_mu(vbool8_t vm, vuint8m1_t vd,
                                            vfloat16m2_t vs2, unsigned int frm,
                                            size_t vl);
vuint8m2_t __riscv_vfncvt_xu_f_w_u8m2_rm_mu(vbool4_t vm, vuint8m2_t vd,
                                            vfloat16m4_t vs2, unsigned int frm,
                                            size_t vl);
vuint8m4_t __riscv_vfncvt_xu_f_w_u8m4_rm_mu(vbool2_t vm, vuint8m4_t vd,
                                            vfloat16m8_t vs2, unsigned int frm,
                                            size_t vl);
// __riscv_vfncvt_x_f_w_i16<lmul>_rm_mu: one prototype per result LMUL
// (mf4 .. m4). Each takes a mask `vm`, an operand `vd` of the result type, a
// source `vs2` of float32 elements at twice the result's LMUL, an
// `unsigned int frm`, and the vector length `vl`; the mask type is
// vbool<N>_t with N = result SEW / LMUL.
// NOTE(review): by the RVV intrinsic naming convention this is the narrowing
// float-to-signed-integer convert (float32 -> int16), `frm` selects the
// rounding mode, and `_mu` means mask-undisturbed with `vd` supplying the
// masked-off elements -- confirm against the RVV intrinsic specification.
vint16mf4_t __riscv_vfncvt_x_f_w_i16mf4_rm_mu(vbool64_t vm, vint16mf4_t vd,
                                              vfloat32mf2_t vs2,
                                              unsigned int frm, size_t vl);
vint16mf2_t __riscv_vfncvt_x_f_w_i16mf2_rm_mu(vbool32_t vm, vint16mf2_t vd,
                                              vfloat32m1_t vs2,
                                              unsigned int frm, size_t vl);
vint16m1_t __riscv_vfncvt_x_f_w_i16m1_rm_mu(vbool16_t vm, vint16m1_t vd,
                                            vfloat32m2_t vs2, unsigned int frm,
                                            size_t vl);
vint16m2_t __riscv_vfncvt_x_f_w_i16m2_rm_mu(vbool8_t vm, vint16m2_t vd,
                                            vfloat32m4_t vs2, unsigned int frm,
                                            size_t vl);
vint16m4_t __riscv_vfncvt_x_f_w_i16m4_rm_mu(vbool4_t vm, vint16m4_t vd,
                                            vfloat32m8_t vs2, unsigned int frm,
                                            size_t vl);
// __riscv_vfncvt_xu_f_w_u16<lmul>_rm_mu: one prototype per result LMUL
// (mf4 .. m4). Each takes a mask `vm`, an operand `vd` of the result type, a
// source `vs2` of float32 elements at twice the result's LMUL, an
// `unsigned int frm`, and the vector length `vl`; the mask type is
// vbool<N>_t with N = result SEW / LMUL.
// NOTE(review): by the RVV intrinsic naming convention this is the narrowing
// float-to-unsigned-integer convert (float32 -> uint16), `frm` selects the
// rounding mode, and `_mu` means mask-undisturbed with `vd` supplying the
// masked-off elements -- confirm against the RVV intrinsic specification.
vuint16mf4_t __riscv_vfncvt_xu_f_w_u16mf4_rm_mu(vbool64_t vm, vuint16mf4_t vd,
                                                vfloat32mf2_t vs2,
                                                unsigned int frm, size_t vl);
vuint16mf2_t __riscv_vfncvt_xu_f_w_u16mf2_rm_mu(vbool32_t vm, vuint16mf2_t vd,
                                                vfloat32m1_t vs2,
                                                unsigned int frm, size_t vl);
vuint16m1_t __riscv_vfncvt_xu_f_w_u16m1_rm_mu(vbool16_t vm, vuint16m1_t vd,
                                              vfloat32m2_t vs2,
                                              unsigned int frm, size_t vl);
vuint16m2_t __riscv_vfncvt_xu_f_w_u16m2_rm_mu(vbool8_t vm, vuint16m2_t vd,
                                              vfloat32m4_t vs2,
                                              unsigned int frm, size_t vl);
vuint16m4_t __riscv_vfncvt_xu_f_w_u16m4_rm_mu(vbool4_t vm, vuint16m4_t vd,
                                              vfloat32m8_t vs2,
                                              unsigned int frm, size_t vl);
// __riscv_vfncvt_f_x_w_f16<lmul>_rm_mu: one prototype per result LMUL
// (mf4 .. m4). Each takes a mask `vm`, an operand `vd` of the result type, a
// source `vs2` of signed 32-bit elements at twice the result's LMUL, an
// `unsigned int frm`, and the vector length `vl`; the mask type is
// vbool<N>_t with N = result SEW / LMUL.
// NOTE(review): by the RVV intrinsic naming convention this is the narrowing
// signed-integer-to-float convert (int32 -> float16), `frm` selects the
// rounding mode, and `_mu` means mask-undisturbed with `vd` supplying the
// masked-off elements -- confirm against the RVV intrinsic specification.
vfloat16mf4_t __riscv_vfncvt_f_x_w_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                                vint32mf2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_x_w_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                                vint32m1_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_x_w_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                              vint32m2_t vs2, unsigned int frm,
                                              size_t vl);
vfloat16m2_t __riscv_vfncvt_f_x_w_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                              vint32m4_t vs2, unsigned int frm,
                                              size_t vl);
vfloat16m4_t __riscv_vfncvt_f_x_w_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                              vint32m8_t vs2, unsigned int frm,
                                              size_t vl);
// __riscv_vfncvt_f_xu_w_f16<lmul>_rm_mu: one prototype per result LMUL
// (mf4 .. m4). Each takes a mask `vm`, an operand `vd` of the result type, a
// source `vs2` of unsigned 32-bit elements at twice the result's LMUL, an
// `unsigned int frm`, and the vector length `vl`; the mask type is
// vbool<N>_t with N = result SEW / LMUL.
// NOTE(review): by the RVV intrinsic naming convention this is the narrowing
// unsigned-integer-to-float convert (uint32 -> float16), `frm` selects the
// rounding mode, and `_mu` means mask-undisturbed with `vd` supplying the
// masked-off elements -- confirm against the RVV intrinsic specification.
vfloat16mf4_t __riscv_vfncvt_f_xu_w_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                                 vuint32mf2_t vs2,
                                                 unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_xu_w_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                                 vuint32m1_t vs2,
                                                 unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_xu_w_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                               vuint32m2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_xu_w_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                               vuint32m4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_xu_w_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                               vuint32m8_t vs2,
                                               unsigned int frm, size_t vl);
// __riscv_vfncvt_f_f_w_f16<lmul>_rm_mu: one prototype per result LMUL
// (mf4 .. m4). Each takes a mask `vm`, an operand `vd` of the result type, a
// source `vs2` of float32 elements at twice the result's LMUL, an
// `unsigned int frm`, and the vector length `vl`; the mask type is
// vbool<N>_t with N = result SEW / LMUL.
// NOTE(review): by the RVV intrinsic naming convention this is the narrowing
// float-to-float convert (float32 -> float16), `frm` selects the rounding
// mode, and `_mu` means mask-undisturbed with `vd` supplying the masked-off
// elements -- confirm against the RVV intrinsic specification.
vfloat16mf4_t __riscv_vfncvt_f_f_w_f16mf4_rm_mu(vbool64_t vm, vfloat16mf4_t vd,
                                                vfloat32mf2_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_f_w_f16mf2_rm_mu(vbool32_t vm, vfloat16mf2_t vd,
                                                vfloat32m1_t vs2,
                                                unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_f_w_f16m1_rm_mu(vbool16_t vm, vfloat16m1_t vd,
                                              vfloat32m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_f_w_f16m2_rm_mu(vbool8_t vm, vfloat16m2_t vd,
                                              vfloat32m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_f_w_f16m4_rm_mu(vbool4_t vm, vfloat16m4_t vd,
                                              vfloat32m8_t vs2,
                                              unsigned int frm, size_t vl);
// __riscv_vfncvt_x_f_w_i32<lmul>_rm_mu: one prototype per result LMUL
// (mf2, m1, m2, m4). Each takes a mask `vm`, an operand `vd` of the result
// type, a source `vs2` of float64 elements at twice the result's LMUL, an
// `unsigned int frm`, and the vector length `vl`; the mask type is
// vbool<N>_t with N = result SEW / LMUL.
// NOTE(review): by the RVV intrinsic naming convention this is the narrowing
// float-to-signed-integer convert (float64 -> int32), `frm` selects the
// rounding mode, and `_mu` means mask-undisturbed with `vd` supplying the
// masked-off elements -- confirm against the RVV intrinsic specification.
vint32mf2_t __riscv_vfncvt_x_f_w_i32mf2_rm_mu(vbool64_t vm, vint32mf2_t vd,
                                              vfloat64m1_t vs2,
                                              unsigned int frm, size_t vl);
vint32m1_t __riscv_vfncvt_x_f_w_i32m1_rm_mu(vbool32_t vm, vint32m1_t vd,
                                            vfloat64m2_t vs2, unsigned int frm,
                                            size_t vl);
vint32m2_t __riscv_vfncvt_x_f_w_i32m2_rm_mu(vbool16_t vm, vint32m2_t vd,
                                            vfloat64m4_t vs2, unsigned int frm,
                                            size_t vl);
vint32m4_t __riscv_vfncvt_x_f_w_i32m4_rm_mu(vbool8_t vm, vint32m4_t vd,
                                            vfloat64m8_t vs2, unsigned int frm,
                                            size_t vl);
// __riscv_vfncvt_xu_f_w_u32<lmul>_rm_mu: one prototype per result LMUL
// (mf2, m1, m2, m4). Each takes a mask `vm`, an operand `vd` of the result
// type, a source `vs2` of float64 elements at twice the result's LMUL, an
// `unsigned int frm`, and the vector length `vl`; the mask type is
// vbool<N>_t with N = result SEW / LMUL.
// NOTE(review): by the RVV intrinsic naming convention this is the narrowing
// float-to-unsigned-integer convert (float64 -> uint32), `frm` selects the
// rounding mode, and `_mu` means mask-undisturbed with `vd` supplying the
// masked-off elements -- confirm against the RVV intrinsic specification.
vuint32mf2_t __riscv_vfncvt_xu_f_w_u32mf2_rm_mu(vbool64_t vm, vuint32mf2_t vd,
                                                vfloat64m1_t vs2,
                                                unsigned int frm, size_t vl);
vuint32m1_t __riscv_vfncvt_xu_f_w_u32m1_rm_mu(vbool32_t vm, vuint32m1_t vd,
                                              vfloat64m2_t vs2,
                                              unsigned int frm, size_t vl);
vuint32m2_t __riscv_vfncvt_xu_f_w_u32m2_rm_mu(vbool16_t vm, vuint32m2_t vd,
                                              vfloat64m4_t vs2,
                                              unsigned int frm, size_t vl);
vuint32m4_t __riscv_vfncvt_xu_f_w_u32m4_rm_mu(vbool8_t vm, vuint32m4_t vd,
                                              vfloat64m8_t vs2,
                                              unsigned int frm, size_t vl);
// __riscv_vfncvt_f_x_w_f32<lmul>_rm_mu: one prototype per result LMUL
// (mf2, m1, m2, m4). Each takes a mask `vm`, an operand `vd` of the result
// type, a source `vs2` of signed 64-bit elements at twice the result's LMUL,
// an `unsigned int frm`, and the vector length `vl`; the mask type is
// vbool<N>_t with N = result SEW / LMUL.
// NOTE(review): by the RVV intrinsic naming convention this is the narrowing
// signed-integer-to-float convert (int64 -> float32), `frm` selects the
// rounding mode, and `_mu` means mask-undisturbed with `vd` supplying the
// masked-off elements -- confirm against the RVV intrinsic specification.
vfloat32mf2_t __riscv_vfncvt_f_x_w_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                                vint64m1_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_x_w_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                              vint64m2_t vs2, unsigned int frm,
                                              size_t vl);
vfloat32m2_t __riscv_vfncvt_f_x_w_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                              vint64m4_t vs2, unsigned int frm,
                                              size_t vl);
vfloat32m4_t __riscv_vfncvt_f_x_w_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                              vint64m8_t vs2, unsigned int frm,
                                              size_t vl);
// __riscv_vfncvt_f_xu_w_f32<lmul>_rm_mu: one prototype per result LMUL
// (mf2, m1, m2, m4). Each takes a mask `vm`, an operand `vd` of the result
// type, a source `vs2` of unsigned 64-bit elements at twice the result's LMUL,
// an `unsigned int frm`, and the vector length `vl`; the mask type is
// vbool<N>_t with N = result SEW / LMUL.
// NOTE(review): by the RVV intrinsic naming convention this is the narrowing
// unsigned-integer-to-float convert (uint64 -> float32), `frm` selects the
// rounding mode, and `_mu` means mask-undisturbed with `vd` supplying the
// masked-off elements -- confirm against the RVV intrinsic specification.
vfloat32mf2_t __riscv_vfncvt_f_xu_w_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                                 vuint64m1_t vs2,
                                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_xu_w_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                               vuint64m2_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_xu_w_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                               vuint64m4_t vs2,
                                               unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_xu_w_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                               vuint64m8_t vs2,
                                               unsigned int frm, size_t vl);
// __riscv_vfncvt_f_f_w_f32<lmul>_rm_mu: one prototype per result LMUL
// (mf2, m1, m2, m4). Each takes a mask `vm`, an operand `vd` of the result
// type, a source `vs2` of float64 elements at twice the result's LMUL, an
// `unsigned int frm`, and the vector length `vl`; the mask type is
// vbool<N>_t with N = result SEW / LMUL.
// NOTE(review): by the RVV intrinsic naming convention this is the narrowing
// float-to-float convert (float64 -> float32), `frm` selects the rounding
// mode, and `_mu` means mask-undisturbed with `vd` supplying the masked-off
// elements -- confirm against the RVV intrinsic specification.
vfloat32mf2_t __riscv_vfncvt_f_f_w_f32mf2_rm_mu(vbool64_t vm, vfloat32mf2_t vd,
                                                vfloat64m1_t vs2,
                                                unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_f_w_f32m1_rm_mu(vbool32_t vm, vfloat32m1_t vd,
                                              vfloat64m2_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_f_w_f32m2_rm_mu(vbool16_t vm, vfloat32m2_t vd,
                                              vfloat64m4_t vs2,
                                              unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_f_w_f32m4_rm_mu(vbool8_t vm, vfloat32m4_t vd,
                                              vfloat64m8_t vs2,
                                              unsigned int frm, size_t vl);