Vector Floating-Point Intrinsics

Vector Single-Width Floating-Point Add/Subtract Intrinsics

// __riscv_vfadd_tu: overloaded floating-point add, unmasked `_tu`
// (tail-undisturbed) policy variant of the RVV intrinsics naming scheme.
// vd is the destination operand whose tail elements are preserved; vl is the
// number of elements to process.
// Every element type / LMUL pair has two overloads:
//   - vector-vector: (vd, vs2, vs1, vl)
//   - vector-scalar: (vd, vs2, rs1, vl)
vfloat16mf4_t __riscv_vfadd_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                               vfloat16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vfadd_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfadd_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                               vfloat16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vfadd_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfadd_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                              vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfadd_tu(vfloat16m1_t vd, vfloat16m1_t vs2, _Float16 rs1,
                              size_t vl);
vfloat16m2_t __riscv_vfadd_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                              vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfadd_tu(vfloat16m2_t vd, vfloat16m2_t vs2, _Float16 rs1,
                              size_t vl);
vfloat16m4_t __riscv_vfadd_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                              vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfadd_tu(vfloat16m4_t vd, vfloat16m4_t vs2, _Float16 rs1,
                              size_t vl);
vfloat16m8_t __riscv_vfadd_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                              vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfadd_tu(vfloat16m8_t vd, vfloat16m8_t vs2, _Float16 rs1,
                              size_t vl);
vfloat32mf2_t __riscv_vfadd_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                               vfloat32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfadd_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2, float rs1,
                               size_t vl);
vfloat32m1_t __riscv_vfadd_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                              vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfadd_tu(vfloat32m1_t vd, vfloat32m1_t vs2, float rs1,
                              size_t vl);
vfloat32m2_t __riscv_vfadd_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                              vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfadd_tu(vfloat32m2_t vd, vfloat32m2_t vs2, float rs1,
                              size_t vl);
vfloat32m4_t __riscv_vfadd_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                              vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfadd_tu(vfloat32m4_t vd, vfloat32m4_t vs2, float rs1,
                              size_t vl);
vfloat32m8_t __riscv_vfadd_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                              vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfadd_tu(vfloat32m8_t vd, vfloat32m8_t vs2, float rs1,
                              size_t vl);
vfloat64m1_t __riscv_vfadd_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                              vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfadd_tu(vfloat64m1_t vd, vfloat64m1_t vs2, double rs1,
                              size_t vl);
vfloat64m2_t __riscv_vfadd_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                              vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfadd_tu(vfloat64m2_t vd, vfloat64m2_t vs2, double rs1,
                              size_t vl);
vfloat64m4_t __riscv_vfadd_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                              vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfadd_tu(vfloat64m4_t vd, vfloat64m4_t vs2, double rs1,
                              size_t vl);
vfloat64m8_t __riscv_vfadd_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                              vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfadd_tu(vfloat64m8_t vd, vfloat64m8_t vs2, double rs1,
                              size_t vl);
// __riscv_vfsub_tu: overloaded floating-point subtract, unmasked `_tu`
// (tail-undisturbed) policy variant. Per the RVV vfsub definition the result
// is vs2 - vs1 (vector-vector) or vs2 - rs1 (vector-scalar).
// vd is the destination operand whose tail elements are preserved; vl is the
// number of elements to process.
// Every element type / LMUL pair has a vector-vector and a vector-scalar
// overload.
vfloat16mf4_t __riscv_vfsub_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                               vfloat16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vfsub_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfsub_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                               vfloat16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vfsub_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfsub_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                              vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfsub_tu(vfloat16m1_t vd, vfloat16m1_t vs2, _Float16 rs1,
                              size_t vl);
vfloat16m2_t __riscv_vfsub_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                              vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfsub_tu(vfloat16m2_t vd, vfloat16m2_t vs2, _Float16 rs1,
                              size_t vl);
vfloat16m4_t __riscv_vfsub_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                              vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfsub_tu(vfloat16m4_t vd, vfloat16m4_t vs2, _Float16 rs1,
                              size_t vl);
vfloat16m8_t __riscv_vfsub_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                              vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfsub_tu(vfloat16m8_t vd, vfloat16m8_t vs2, _Float16 rs1,
                              size_t vl);
vfloat32mf2_t __riscv_vfsub_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                               vfloat32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfsub_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2, float rs1,
                               size_t vl);
vfloat32m1_t __riscv_vfsub_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                              vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfsub_tu(vfloat32m1_t vd, vfloat32m1_t vs2, float rs1,
                              size_t vl);
vfloat32m2_t __riscv_vfsub_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                              vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfsub_tu(vfloat32m2_t vd, vfloat32m2_t vs2, float rs1,
                              size_t vl);
vfloat32m4_t __riscv_vfsub_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                              vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfsub_tu(vfloat32m4_t vd, vfloat32m4_t vs2, float rs1,
                              size_t vl);
vfloat32m8_t __riscv_vfsub_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                              vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfsub_tu(vfloat32m8_t vd, vfloat32m8_t vs2, float rs1,
                              size_t vl);
vfloat64m1_t __riscv_vfsub_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                              vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfsub_tu(vfloat64m1_t vd, vfloat64m1_t vs2, double rs1,
                              size_t vl);
vfloat64m2_t __riscv_vfsub_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                              vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfsub_tu(vfloat64m2_t vd, vfloat64m2_t vs2, double rs1,
                              size_t vl);
vfloat64m4_t __riscv_vfsub_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                              vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfsub_tu(vfloat64m4_t vd, vfloat64m4_t vs2, double rs1,
                              size_t vl);
vfloat64m8_t __riscv_vfsub_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                              vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfsub_tu(vfloat64m8_t vd, vfloat64m8_t vs2, double rs1,
                              size_t vl);
// __riscv_vfrsub_tu: overloaded floating-point reverse subtract, unmasked
// `_tu` (tail-undisturbed) policy variant. Per the RVV vfrsub definition the
// operands are swapped relative to vfsub: the result is rs1 - vs2.
// Only the vector-scalar form exists, one overload per element type / LMUL.
// vd is the destination operand whose tail elements are preserved; vl is the
// number of elements to process.
vfloat16mf4_t __riscv_vfrsub_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfrsub_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfrsub_tu(vfloat16m1_t vd, vfloat16m1_t vs2, _Float16 rs1,
                               size_t vl);
vfloat16m2_t __riscv_vfrsub_tu(vfloat16m2_t vd, vfloat16m2_t vs2, _Float16 rs1,
                               size_t vl);
vfloat16m4_t __riscv_vfrsub_tu(vfloat16m4_t vd, vfloat16m4_t vs2, _Float16 rs1,
                               size_t vl);
vfloat16m8_t __riscv_vfrsub_tu(vfloat16m8_t vd, vfloat16m8_t vs2, _Float16 rs1,
                               size_t vl);
vfloat32mf2_t __riscv_vfrsub_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2, float rs1,
                                size_t vl);
vfloat32m1_t __riscv_vfrsub_tu(vfloat32m1_t vd, vfloat32m1_t vs2, float rs1,
                               size_t vl);
vfloat32m2_t __riscv_vfrsub_tu(vfloat32m2_t vd, vfloat32m2_t vs2, float rs1,
                               size_t vl);
vfloat32m4_t __riscv_vfrsub_tu(vfloat32m4_t vd, vfloat32m4_t vs2, float rs1,
                               size_t vl);
vfloat32m8_t __riscv_vfrsub_tu(vfloat32m8_t vd, vfloat32m8_t vs2, float rs1,
                               size_t vl);
vfloat64m1_t __riscv_vfrsub_tu(vfloat64m1_t vd, vfloat64m1_t vs2, double rs1,
                               size_t vl);
vfloat64m2_t __riscv_vfrsub_tu(vfloat64m2_t vd, vfloat64m2_t vs2, double rs1,
                               size_t vl);
vfloat64m4_t __riscv_vfrsub_tu(vfloat64m4_t vd, vfloat64m4_t vs2, double rs1,
                               size_t vl);
vfloat64m8_t __riscv_vfrsub_tu(vfloat64m8_t vd, vfloat64m8_t vs2, double rs1,
                               size_t vl);
// __riscv_vfneg_tu: overloaded floating-point negate, unmasked `_tu`
// (tail-undisturbed) policy variant. Takes a single source vector vs; one
// overload per element type / LMUL.
// vd is the destination operand whose tail elements are preserved; vl is the
// number of elements to process.
vfloat16mf4_t __riscv_vfneg_tu(vfloat16mf4_t vd, vfloat16mf4_t vs, size_t vl);
vfloat16mf2_t __riscv_vfneg_tu(vfloat16mf2_t vd, vfloat16mf2_t vs, size_t vl);
vfloat16m1_t __riscv_vfneg_tu(vfloat16m1_t vd, vfloat16m1_t vs, size_t vl);
vfloat16m2_t __riscv_vfneg_tu(vfloat16m2_t vd, vfloat16m2_t vs, size_t vl);
vfloat16m4_t __riscv_vfneg_tu(vfloat16m4_t vd, vfloat16m4_t vs, size_t vl);
vfloat16m8_t __riscv_vfneg_tu(vfloat16m8_t vd, vfloat16m8_t vs, size_t vl);
vfloat32mf2_t __riscv_vfneg_tu(vfloat32mf2_t vd, vfloat32mf2_t vs, size_t vl);
vfloat32m1_t __riscv_vfneg_tu(vfloat32m1_t vd, vfloat32m1_t vs, size_t vl);
vfloat32m2_t __riscv_vfneg_tu(vfloat32m2_t vd, vfloat32m2_t vs, size_t vl);
vfloat32m4_t __riscv_vfneg_tu(vfloat32m4_t vd, vfloat32m4_t vs, size_t vl);
vfloat32m8_t __riscv_vfneg_tu(vfloat32m8_t vd, vfloat32m8_t vs, size_t vl);
vfloat64m1_t __riscv_vfneg_tu(vfloat64m1_t vd, vfloat64m1_t vs, size_t vl);
vfloat64m2_t __riscv_vfneg_tu(vfloat64m2_t vd, vfloat64m2_t vs, size_t vl);
vfloat64m4_t __riscv_vfneg_tu(vfloat64m4_t vd, vfloat64m4_t vs, size_t vl);
vfloat64m8_t __riscv_vfneg_tu(vfloat64m8_t vd, vfloat64m8_t vs, size_t vl);
// masked functions, `_tum` policy (tail-undisturbed, mask-agnostic)
//
// __riscv_vfadd_tum: overloaded floating-point add under mask vm.
// The mask type is vboolN_t with N = SEW / LMUL of the vector type
// (e.g. vfloat16mf4_t -> vbool64_t, vfloat32m1_t -> vbool32_t).
// vd is the destination operand whose tail elements are preserved; vl is the
// number of elements to process.
// Every element type / LMUL pair has a vector-vector (vs2, vs1) and a
// vector-scalar (vs2, rs1) overload.
vfloat16mf4_t __riscv_vfadd_tum(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                size_t vl);
vfloat16mf4_t __riscv_vfadd_tum(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfadd_tum(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                size_t vl);
vfloat16mf2_t __riscv_vfadd_tum(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfadd_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                               vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfadd_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfadd_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                               vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfadd_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfadd_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                               vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfadd_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfadd_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                               vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfadd_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                               _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfadd_tum(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                size_t vl);
vfloat32mf2_t __riscv_vfadd_tum(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfadd_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                               vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfadd_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                               float rs1, size_t vl);
vfloat32m2_t __riscv_vfadd_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                               vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfadd_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                               float rs1, size_t vl);
vfloat32m4_t __riscv_vfadd_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                               vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfadd_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                               float rs1, size_t vl);
vfloat32m8_t __riscv_vfadd_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                               vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfadd_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                               float rs1, size_t vl);
vfloat64m1_t __riscv_vfadd_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                               vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfadd_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                               double rs1, size_t vl);
vfloat64m2_t __riscv_vfadd_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                               vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfadd_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                               double rs1, size_t vl);
vfloat64m4_t __riscv_vfadd_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                               vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfadd_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                               double rs1, size_t vl);
vfloat64m8_t __riscv_vfadd_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                               vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfadd_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                               double rs1, size_t vl);
// __riscv_vfsub_tum: overloaded floating-point subtract under mask vm,
// `_tum` policy (tail-undisturbed, mask-agnostic). Per the RVV vfsub
// definition the result is vs2 - vs1 (vector-vector) or vs2 - rs1
// (vector-scalar).
// The mask type is vboolN_t with N = SEW / LMUL of the vector type.
// vd is the destination operand whose tail elements are preserved; vl is the
// number of elements to process.
vfloat16mf4_t __riscv_vfsub_tum(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                size_t vl);
vfloat16mf4_t __riscv_vfsub_tum(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfsub_tum(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                size_t vl);
vfloat16mf2_t __riscv_vfsub_tum(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfsub_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                               vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfsub_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfsub_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                               vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfsub_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfsub_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                               vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfsub_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfsub_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                               vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfsub_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                               _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfsub_tum(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                size_t vl);
vfloat32mf2_t __riscv_vfsub_tum(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfsub_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                               vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfsub_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                               float rs1, size_t vl);
vfloat32m2_t __riscv_vfsub_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                               vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfsub_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                               float rs1, size_t vl);
vfloat32m4_t __riscv_vfsub_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                               vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfsub_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                               float rs1, size_t vl);
vfloat32m8_t __riscv_vfsub_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                               vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfsub_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                               float rs1, size_t vl);
vfloat64m1_t __riscv_vfsub_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                               vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfsub_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                               double rs1, size_t vl);
vfloat64m2_t __riscv_vfsub_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                               vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfsub_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                               double rs1, size_t vl);
vfloat64m4_t __riscv_vfsub_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                               vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfsub_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                               double rs1, size_t vl);
vfloat64m8_t __riscv_vfsub_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                               vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfsub_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                               double rs1, size_t vl);
// __riscv_vfrsub_tum: overloaded floating-point reverse subtract under mask
// vm, `_tum` policy (tail-undisturbed, mask-agnostic). Per the RVV vfrsub
// definition the result is rs1 - vs2. Only the vector-scalar form exists.
// The mask type is vboolN_t with N = SEW / LMUL of the vector type.
// vd is the destination operand whose tail elements are preserved; vl is the
// number of elements to process.
vfloat16mf4_t __riscv_vfrsub_tum(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfrsub_tum(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfrsub_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfrsub_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfrsub_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfrsub_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfrsub_tum(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfrsub_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                float rs1, size_t vl);
vfloat32m2_t __riscv_vfrsub_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                float rs1, size_t vl);
vfloat32m4_t __riscv_vfrsub_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                float rs1, size_t vl);
vfloat32m8_t __riscv_vfrsub_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                float rs1, size_t vl);
vfloat64m1_t __riscv_vfrsub_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                double rs1, size_t vl);
vfloat64m2_t __riscv_vfrsub_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                double rs1, size_t vl);
vfloat64m4_t __riscv_vfrsub_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                double rs1, size_t vl);
vfloat64m8_t __riscv_vfrsub_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                double rs1, size_t vl);
// __riscv_vfneg_tum: overloaded floating-point negate under mask vm, `_tum`
// policy (tail-undisturbed, mask-agnostic). Takes a single source vector vs;
// one overload per element type / LMUL.
// The mask type is vboolN_t with N = SEW / LMUL of the vector type.
// vd is the destination operand whose tail elements are preserved; vl is the
// number of elements to process.
vfloat16mf4_t __riscv_vfneg_tum(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs, size_t vl);
vfloat16mf2_t __riscv_vfneg_tum(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs, size_t vl);
vfloat16m1_t __riscv_vfneg_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs,
                               size_t vl);
vfloat16m2_t __riscv_vfneg_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs,
                               size_t vl);
vfloat16m4_t __riscv_vfneg_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs,
                               size_t vl);
vfloat16m8_t __riscv_vfneg_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs,
                               size_t vl);
vfloat32mf2_t __riscv_vfneg_tum(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs, size_t vl);
vfloat32m1_t __riscv_vfneg_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs,
                               size_t vl);
vfloat32m2_t __riscv_vfneg_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs,
                               size_t vl);
vfloat32m4_t __riscv_vfneg_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs,
                               size_t vl);
vfloat32m8_t __riscv_vfneg_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs,
                               size_t vl);
vfloat64m1_t __riscv_vfneg_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs,
                               size_t vl);
vfloat64m2_t __riscv_vfneg_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs,
                               size_t vl);
vfloat64m4_t __riscv_vfneg_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs,
                               size_t vl);
vfloat64m8_t __riscv_vfneg_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs,
                               size_t vl);
// masked functions, `_tumu` policy (tail-undisturbed, mask-undisturbed)
//
// __riscv_vfadd_tumu: overloaded floating-point add under mask vm.
// The mask type is vboolN_t with N = SEW / LMUL of the vector type
// (e.g. vfloat16mf4_t -> vbool64_t, vfloat32m1_t -> vbool32_t).
// vd is the destination operand whose tail and masked-off elements are
// preserved; vl is the number of elements to process.
// Every element type / LMUL pair has a vector-vector (vs2, vs1) and a
// vector-scalar (vs2, rs1) overload.
vfloat16mf4_t __riscv_vfadd_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                 size_t vl);
vfloat16mf4_t __riscv_vfadd_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfadd_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                 size_t vl);
vfloat16mf2_t __riscv_vfadd_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfadd_tumu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfadd_tumu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfadd_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfadd_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfadd_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfadd_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfadd_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfadd_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfadd_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                 size_t vl);
vfloat32mf2_t __riscv_vfadd_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfadd_tumu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfadd_tumu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                float rs1, size_t vl);
vfloat32m2_t __riscv_vfadd_tumu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfadd_tumu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                float rs1, size_t vl);
vfloat32m4_t __riscv_vfadd_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfadd_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                float rs1, size_t vl);
vfloat32m8_t __riscv_vfadd_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfadd_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                float rs1, size_t vl);
vfloat64m1_t __riscv_vfadd_tumu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfadd_tumu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                double rs1, size_t vl);
vfloat64m2_t __riscv_vfadd_tumu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfadd_tumu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                double rs1, size_t vl);
vfloat64m4_t __riscv_vfadd_tumu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfadd_tumu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                double rs1, size_t vl);
vfloat64m8_t __riscv_vfadd_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfadd_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                double rs1, size_t vl);
// __riscv_vfsub_tumu: overloaded floating-point subtract under mask vm,
// `_tumu` policy (tail-undisturbed, mask-undisturbed). Per the RVV vfsub
// definition the result is vs2 - vs1 (vector-vector) or vs2 - rs1
// (vector-scalar).
// The mask type is vboolN_t with N = SEW / LMUL of the vector type.
// vd is the destination operand whose tail and masked-off elements are
// preserved; vl is the number of elements to process.
vfloat16mf4_t __riscv_vfsub_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                 size_t vl);
vfloat16mf4_t __riscv_vfsub_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfsub_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                 size_t vl);
vfloat16mf2_t __riscv_vfsub_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfsub_tumu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfsub_tumu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfsub_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfsub_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfsub_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfsub_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfsub_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfsub_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfsub_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                 size_t vl);
vfloat32mf2_t __riscv_vfsub_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfsub_tumu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfsub_tumu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                float rs1, size_t vl);
vfloat32m2_t __riscv_vfsub_tumu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfsub_tumu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                float rs1, size_t vl);
vfloat32m4_t __riscv_vfsub_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfsub_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                float rs1, size_t vl);
vfloat32m8_t __riscv_vfsub_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfsub_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                float rs1, size_t vl);
vfloat64m1_t __riscv_vfsub_tumu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfsub_tumu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                double rs1, size_t vl);
vfloat64m2_t __riscv_vfsub_tumu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfsub_tumu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                double rs1, size_t vl);
vfloat64m4_t __riscv_vfsub_tumu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfsub_tumu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                double rs1, size_t vl);
vfloat64m8_t __riscv_vfsub_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfsub_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                double rs1, size_t vl);
// __riscv_vfrsub_tumu: overloaded floating-point reverse subtract under mask
// vm, `_tumu` policy (tail-undisturbed, mask-undisturbed). Per the RVV vfrsub
// definition the result is rs1 - vs2. Only the vector-scalar form exists.
// The mask type is vboolN_t with N = SEW / LMUL of the vector type.
// vd is the destination operand whose tail and masked-off elements are
// preserved; vl is the number of elements to process.
vfloat16mf4_t __riscv_vfrsub_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfrsub_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfrsub_tumu(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat16m1_t vs2, _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfrsub_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                 _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfrsub_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                 _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfrsub_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                 _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfrsub_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfrsub_tumu(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat32m1_t vs2, float rs1, size_t vl);
vfloat32m2_t __riscv_vfrsub_tumu(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat32m2_t vs2, float rs1, size_t vl);
vfloat32m4_t __riscv_vfrsub_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                 float rs1, size_t vl);
vfloat32m8_t __riscv_vfrsub_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                 float rs1, size_t vl);
vfloat64m1_t __riscv_vfrsub_tumu(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat64m1_t vs2, double rs1, size_t vl);
vfloat64m2_t __riscv_vfrsub_tumu(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat64m2_t vs2, double rs1, size_t vl);
vfloat64m4_t __riscv_vfrsub_tumu(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat64m4_t vs2, double rs1, size_t vl);
vfloat64m8_t __riscv_vfrsub_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                 double rs1, size_t vl);
// __riscv_vfneg_tumu: overloaded floating-point negate under mask vm,
// `_tumu` policy (tail-undisturbed, mask-undisturbed). Takes a single source
// vector vs; one overload per element type / LMUL.
// The mask type is vboolN_t with N = SEW / LMUL of the vector type.
// vd is the destination operand whose tail and masked-off elements are
// preserved; vl is the number of elements to process.
vfloat16mf4_t __riscv_vfneg_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs, size_t vl);
vfloat16mf2_t __riscv_vfneg_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs, size_t vl);
vfloat16m1_t __riscv_vfneg_tumu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs,
                                size_t vl);
vfloat16m2_t __riscv_vfneg_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs,
                                size_t vl);
vfloat16m4_t __riscv_vfneg_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs,
                                size_t vl);
vfloat16m8_t __riscv_vfneg_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs,
                                size_t vl);
vfloat32mf2_t __riscv_vfneg_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs, size_t vl);
vfloat32m1_t __riscv_vfneg_tumu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs,
                                size_t vl);
vfloat32m2_t __riscv_vfneg_tumu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs,
                                size_t vl);
vfloat32m4_t __riscv_vfneg_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs,
                                size_t vl);
vfloat32m8_t __riscv_vfneg_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs,
                                size_t vl);
vfloat64m1_t __riscv_vfneg_tumu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs,
                                size_t vl);
vfloat64m2_t __riscv_vfneg_tumu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs,
                                size_t vl);
vfloat64m4_t __riscv_vfneg_tumu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs,
                                size_t vl);
vfloat64m8_t __riscv_vfneg_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs,
                                size_t vl);
// masked functions: _mu variants (no frm argument)
// __riscv_vfadd_mu overloads. Every vector type appears twice:
//   - vector-vector form: second source is the vector `vs1`;
//   - vector-scalar form: second source is the scalar `rs1`, typed
//     _Float16 / float / double to match the element type.
// All forms take a mask `vm`, a `vd` operand of the result type, the first
// source `vs2`, and the vector length `vl`. No `frm` argument in this group.
// NOTE(review): `_mu` presumably selects the mask-undisturbed policy, with
// `vd` supplying the masked-off elements -- confirm against the RVV
// intrinsics spec.

// float16 element types
vfloat16mf4_t __riscv_vfadd_mu(vbool64_t vm, vfloat16mf4_t vd,
                               vfloat16mf4_t vs2, vfloat16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vfadd_mu(vbool64_t vm, vfloat16mf4_t vd,
                               vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfadd_mu(vbool32_t vm, vfloat16mf2_t vd,
                               vfloat16mf2_t vs2, vfloat16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vfadd_mu(vbool32_t vm, vfloat16mf2_t vd,
                               vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfadd_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                              vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfadd_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                              _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfadd_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                              vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfadd_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                              _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfadd_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                              vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfadd_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                              _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfadd_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                              vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfadd_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                              _Float16 rs1, size_t vl);
// float32 element types
vfloat32mf2_t __riscv_vfadd_mu(vbool64_t vm, vfloat32mf2_t vd,
                               vfloat32mf2_t vs2, vfloat32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfadd_mu(vbool64_t vm, vfloat32mf2_t vd,
                               vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfadd_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                              vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfadd_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                              float rs1, size_t vl);
vfloat32m2_t __riscv_vfadd_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                              vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfadd_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                              float rs1, size_t vl);
vfloat32m4_t __riscv_vfadd_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                              vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfadd_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                              float rs1, size_t vl);
vfloat32m8_t __riscv_vfadd_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                              vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfadd_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                              float rs1, size_t vl);
// float64 element types
vfloat64m1_t __riscv_vfadd_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                              vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfadd_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                              double rs1, size_t vl);
vfloat64m2_t __riscv_vfadd_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                              vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfadd_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                              double rs1, size_t vl);
vfloat64m4_t __riscv_vfadd_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                              vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfadd_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                              double rs1, size_t vl);
vfloat64m8_t __riscv_vfadd_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                              vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfadd_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                              double rs1, size_t vl);
// __riscv_vfsub_mu overloads. Every vector type appears twice:
//   - vector-vector form: second source is the vector `vs1`;
//   - vector-scalar form: second source is the scalar `rs1`, typed
//     _Float16 / float / double to match the element type.
// All forms take a mask `vm`, a `vd` operand of the result type, the first
// source `vs2`, and the vector length `vl`. No `frm` argument in this group.
// NOTE(review): operand order of the subtraction (presumably vs2 - vs1 /
// vs2 - rs1) is not visible in the prototypes -- confirm against the RVV spec.

// float16 element types
vfloat16mf4_t __riscv_vfsub_mu(vbool64_t vm, vfloat16mf4_t vd,
                               vfloat16mf4_t vs2, vfloat16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vfsub_mu(vbool64_t vm, vfloat16mf4_t vd,
                               vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfsub_mu(vbool32_t vm, vfloat16mf2_t vd,
                               vfloat16mf2_t vs2, vfloat16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vfsub_mu(vbool32_t vm, vfloat16mf2_t vd,
                               vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfsub_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                              vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfsub_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                              _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfsub_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                              vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfsub_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                              _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfsub_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                              vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfsub_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                              _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfsub_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                              vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfsub_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                              _Float16 rs1, size_t vl);
// float32 element types
vfloat32mf2_t __riscv_vfsub_mu(vbool64_t vm, vfloat32mf2_t vd,
                               vfloat32mf2_t vs2, vfloat32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfsub_mu(vbool64_t vm, vfloat32mf2_t vd,
                               vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfsub_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                              vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfsub_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                              float rs1, size_t vl);
vfloat32m2_t __riscv_vfsub_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                              vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfsub_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                              float rs1, size_t vl);
vfloat32m4_t __riscv_vfsub_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                              vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfsub_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                              float rs1, size_t vl);
vfloat32m8_t __riscv_vfsub_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                              vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfsub_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                              float rs1, size_t vl);
// float64 element types
vfloat64m1_t __riscv_vfsub_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                              vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfsub_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                              double rs1, size_t vl);
vfloat64m2_t __riscv_vfsub_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                              vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfsub_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                              double rs1, size_t vl);
vfloat64m4_t __riscv_vfsub_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                              vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfsub_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                              double rs1, size_t vl);
vfloat64m8_t __riscv_vfsub_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                              vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfsub_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                              double rs1, size_t vl);
// __riscv_vfrsub_mu overloads: one declaration per vector type, and only a
// vector-scalar form is listed (scalar `rs1` typed _Float16 / float / double
// to match the element type; there is no `vs1` overload).
// Each takes a mask `vm`, a `vd` operand of the result type, the vector
// source `vs2`, the scalar `rs1`, and the vector length `vl`.
// NOTE(review): "rsub" presumably means reverse subtract (rs1 - vs2) --
// confirm against the RVV spec.

// float16 element types
vfloat16mf4_t __riscv_vfrsub_mu(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfrsub_mu(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfrsub_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfrsub_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfrsub_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfrsub_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                               _Float16 rs1, size_t vl);
// float32 element types
vfloat32mf2_t __riscv_vfrsub_mu(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfrsub_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                               float rs1, size_t vl);
vfloat32m2_t __riscv_vfrsub_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                               float rs1, size_t vl);
vfloat32m4_t __riscv_vfrsub_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                               float rs1, size_t vl);
vfloat32m8_t __riscv_vfrsub_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                               float rs1, size_t vl);
// float64 element types
vfloat64m1_t __riscv_vfrsub_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                               double rs1, size_t vl);
vfloat64m2_t __riscv_vfrsub_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                               double rs1, size_t vl);
vfloat64m4_t __riscv_vfrsub_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                               double rs1, size_t vl);
vfloat64m8_t __riscv_vfrsub_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                               double rs1, size_t vl);
// __riscv_vfneg_mu overloads: one declaration per float16 / float32 /
// float64 vector type. Each takes a mask `vm`, a `vd` operand of the result
// type, a single source vector `vs`, and the vector length `vl`. Only this
// vector-source form is listed (no scalar operand, no `frm` argument).
// NOTE(review): `_mu` presumably selects the mask-undisturbed policy, with
// `vd` supplying the masked-off elements -- confirm against the RVV
// intrinsics spec.

// float16 element types
vfloat16mf4_t __riscv_vfneg_mu(vbool64_t vm, vfloat16mf4_t vd, vfloat16mf4_t vs,
                               size_t vl);
vfloat16mf2_t __riscv_vfneg_mu(vbool32_t vm, vfloat16mf2_t vd, vfloat16mf2_t vs,
                               size_t vl);
vfloat16m1_t __riscv_vfneg_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs,
                              size_t vl);
vfloat16m2_t __riscv_vfneg_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs,
                              size_t vl);
vfloat16m4_t __riscv_vfneg_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs,
                              size_t vl);
vfloat16m8_t __riscv_vfneg_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs,
                              size_t vl);
// float32 element types
vfloat32mf2_t __riscv_vfneg_mu(vbool64_t vm, vfloat32mf2_t vd, vfloat32mf2_t vs,
                               size_t vl);
vfloat32m1_t __riscv_vfneg_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs,
                              size_t vl);
vfloat32m2_t __riscv_vfneg_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs,
                              size_t vl);
vfloat32m4_t __riscv_vfneg_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs,
                              size_t vl);
vfloat32m8_t __riscv_vfneg_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs,
                              size_t vl);
// float64 element types
vfloat64m1_t __riscv_vfneg_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs,
                              size_t vl);
vfloat64m2_t __riscv_vfneg_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs,
                              size_t vl);
vfloat64m4_t __riscv_vfneg_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs,
                              size_t vl);
vfloat64m8_t __riscv_vfneg_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs,
                              size_t vl);
// unmasked functions with an explicit `frm` argument
//
// __riscv_vfadd_tu overloads that add `unsigned int frm` immediately before
// `vl`. These take no mask parameter. The same-named overloads at the start
// of this listing have the same parameters minus `frm`.
// Every vector type appears twice:
//   - vector-vector form: second source is the vector `vs1`;
//   - vector-scalar form: second source is the scalar `rs1`, typed
//     _Float16 / float / double to match the element type.
// NOTE(review): `frm` is presumably the floating-point rounding-mode
// selector -- confirm the accepted values against the RVV intrinsics spec.

// float16 element types
vfloat16mf4_t __riscv_vfadd_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                               vfloat16mf4_t vs1, unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfadd_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfadd_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                               vfloat16mf2_t vs1, unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfadd_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfadd_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                              vfloat16m1_t vs1, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfadd_tu(vfloat16m1_t vd, vfloat16m1_t vs2, _Float16 rs1,
                              unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfadd_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                              vfloat16m2_t vs1, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfadd_tu(vfloat16m2_t vd, vfloat16m2_t vs2, _Float16 rs1,
                              unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfadd_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                              vfloat16m4_t vs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfadd_tu(vfloat16m4_t vd, vfloat16m4_t vs2, _Float16 rs1,
                              unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfadd_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                              vfloat16m8_t vs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfadd_tu(vfloat16m8_t vd, vfloat16m8_t vs2, _Float16 rs1,
                              unsigned int frm, size_t vl);
// float32 element types
vfloat32mf2_t __riscv_vfadd_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                               vfloat32mf2_t vs1, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfadd_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2, float rs1,
                               unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfadd_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                              vfloat32m1_t vs1, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfadd_tu(vfloat32m1_t vd, vfloat32m1_t vs2, float rs1,
                              unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfadd_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                              vfloat32m2_t vs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfadd_tu(vfloat32m2_t vd, vfloat32m2_t vs2, float rs1,
                              unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfadd_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                              vfloat32m4_t vs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfadd_tu(vfloat32m4_t vd, vfloat32m4_t vs2, float rs1,
                              unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfadd_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                              vfloat32m8_t vs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfadd_tu(vfloat32m8_t vd, vfloat32m8_t vs2, float rs1,
                              unsigned int frm, size_t vl);
// float64 element types
vfloat64m1_t __riscv_vfadd_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                              vfloat64m1_t vs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfadd_tu(vfloat64m1_t vd, vfloat64m1_t vs2, double rs1,
                              unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfadd_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                              vfloat64m2_t vs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfadd_tu(vfloat64m2_t vd, vfloat64m2_t vs2, double rs1,
                              unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfadd_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                              vfloat64m4_t vs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfadd_tu(vfloat64m4_t vd, vfloat64m4_t vs2, double rs1,
                              unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfadd_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                              vfloat64m8_t vs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfadd_tu(vfloat64m8_t vd, vfloat64m8_t vs2, double rs1,
                              unsigned int frm, size_t vl);
// __riscv_vfsub_tu overloads with an explicit `unsigned int frm` argument
// placed immediately before `vl`. Unmasked: no mask parameter.
// Every vector type appears twice:
//   - vector-vector form: second source is the vector `vs1`;
//   - vector-scalar form: second source is the scalar `rs1`, typed
//     _Float16 / float / double to match the element type.
// All forms also take a `vd` operand of the result type and the first
// source `vs2`.
// NOTE(review): `frm` is presumably the floating-point rounding-mode
// selector -- confirm the accepted values against the RVV intrinsics spec.

// float16 element types
vfloat16mf4_t __riscv_vfsub_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                               vfloat16mf4_t vs1, unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfsub_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfsub_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                               vfloat16mf2_t vs1, unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfsub_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfsub_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                              vfloat16m1_t vs1, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfsub_tu(vfloat16m1_t vd, vfloat16m1_t vs2, _Float16 rs1,
                              unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfsub_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                              vfloat16m2_t vs1, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfsub_tu(vfloat16m2_t vd, vfloat16m2_t vs2, _Float16 rs1,
                              unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfsub_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                              vfloat16m4_t vs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfsub_tu(vfloat16m4_t vd, vfloat16m4_t vs2, _Float16 rs1,
                              unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfsub_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                              vfloat16m8_t vs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfsub_tu(vfloat16m8_t vd, vfloat16m8_t vs2, _Float16 rs1,
                              unsigned int frm, size_t vl);
// float32 element types
vfloat32mf2_t __riscv_vfsub_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                               vfloat32mf2_t vs1, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfsub_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2, float rs1,
                               unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfsub_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                              vfloat32m1_t vs1, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfsub_tu(vfloat32m1_t vd, vfloat32m1_t vs2, float rs1,
                              unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfsub_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                              vfloat32m2_t vs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfsub_tu(vfloat32m2_t vd, vfloat32m2_t vs2, float rs1,
                              unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfsub_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                              vfloat32m4_t vs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfsub_tu(vfloat32m4_t vd, vfloat32m4_t vs2, float rs1,
                              unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfsub_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                              vfloat32m8_t vs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfsub_tu(vfloat32m8_t vd, vfloat32m8_t vs2, float rs1,
                              unsigned int frm, size_t vl);
// float64 element types
vfloat64m1_t __riscv_vfsub_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                              vfloat64m1_t vs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfsub_tu(vfloat64m1_t vd, vfloat64m1_t vs2, double rs1,
                              unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfsub_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                              vfloat64m2_t vs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfsub_tu(vfloat64m2_t vd, vfloat64m2_t vs2, double rs1,
                              unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfsub_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                              vfloat64m4_t vs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfsub_tu(vfloat64m4_t vd, vfloat64m4_t vs2, double rs1,
                              unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfsub_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                              vfloat64m8_t vs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfsub_tu(vfloat64m8_t vd, vfloat64m8_t vs2, double rs1,
                              unsigned int frm, size_t vl);
// __riscv_vfrsub_tu overloads with an explicit `unsigned int frm` argument
// placed immediately before `vl`. Unmasked: no mask parameter.
// One declaration per vector type; only a vector-scalar form is listed
// (scalar `rs1` typed _Float16 / float / double to match the element type).
// Each also takes a `vd` operand of the result type and the vector source
// `vs2`.
// NOTE(review): `frm` is presumably the floating-point rounding-mode
// selector, and "rsub" presumably means rs1 - vs2 -- confirm against the
// RVV specs.

// float16 element types
vfloat16mf4_t __riscv_vfrsub_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                _Float16 rs1, unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfrsub_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfrsub_tu(vfloat16m1_t vd, vfloat16m1_t vs2, _Float16 rs1,
                               unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfrsub_tu(vfloat16m2_t vd, vfloat16m2_t vs2, _Float16 rs1,
                               unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfrsub_tu(vfloat16m4_t vd, vfloat16m4_t vs2, _Float16 rs1,
                               unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfrsub_tu(vfloat16m8_t vd, vfloat16m8_t vs2, _Float16 rs1,
                               unsigned int frm, size_t vl);
// float32 element types
vfloat32mf2_t __riscv_vfrsub_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2, float rs1,
                                unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfrsub_tu(vfloat32m1_t vd, vfloat32m1_t vs2, float rs1,
                               unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfrsub_tu(vfloat32m2_t vd, vfloat32m2_t vs2, float rs1,
                               unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfrsub_tu(vfloat32m4_t vd, vfloat32m4_t vs2, float rs1,
                               unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfrsub_tu(vfloat32m8_t vd, vfloat32m8_t vs2, float rs1,
                               unsigned int frm, size_t vl);
// float64 element types
vfloat64m1_t __riscv_vfrsub_tu(vfloat64m1_t vd, vfloat64m1_t vs2, double rs1,
                               unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfrsub_tu(vfloat64m2_t vd, vfloat64m2_t vs2, double rs1,
                               unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfrsub_tu(vfloat64m4_t vd, vfloat64m4_t vs2, double rs1,
                               unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfrsub_tu(vfloat64m8_t vd, vfloat64m8_t vs2, double rs1,
                               unsigned int frm, size_t vl);
// masked functions: _tum variants with explicit frm argument
// __riscv_vfadd_tum overloads with an explicit `unsigned int frm` argument
// placed immediately before `vl`.
// Every vector type appears twice:
//   - vector-vector form: second source is the vector `vs1`;
//   - vector-scalar form: second source is the scalar `rs1`, typed
//     _Float16 / float / double to match the element type.
// All forms take a mask `vm`, a `vd` operand of the result type and the
// first source `vs2`.
// NOTE(review): `_tum` presumably selects the tail-undisturbed policy for a
// masked operation, and `frm` the floating-point rounding mode -- confirm
// against the RVV intrinsics spec.

// float16 element types
vfloat16mf4_t __riscv_vfadd_tum(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfadd_tum(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs2, _Float16 rs1,
                                unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfadd_tum(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfadd_tum(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs2, _Float16 rs1,
                                unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfadd_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                               vfloat16m1_t vs1, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfadd_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfadd_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                               vfloat16m2_t vs1, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfadd_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfadd_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                               vfloat16m4_t vs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfadd_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfadd_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                               vfloat16m8_t vs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfadd_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
// float32 element types
vfloat32mf2_t __riscv_vfadd_tum(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfadd_tum(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs2, float rs1, unsigned int frm,
                                size_t vl);
vfloat32m1_t __riscv_vfadd_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                               vfloat32m1_t vs1, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfadd_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                               float rs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfadd_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                               vfloat32m2_t vs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfadd_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                               float rs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfadd_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                               vfloat32m4_t vs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfadd_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                               float rs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfadd_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                               vfloat32m8_t vs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfadd_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                               float rs1, unsigned int frm, size_t vl);
// float64 element types
vfloat64m1_t __riscv_vfadd_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                               vfloat64m1_t vs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfadd_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                               double rs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfadd_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                               vfloat64m2_t vs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfadd_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                               double rs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfadd_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                               vfloat64m4_t vs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfadd_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                               double rs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfadd_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                               vfloat64m8_t vs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfadd_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                               double rs1, unsigned int frm, size_t vl);
// __riscv_vfsub_tum overloads with an explicit `unsigned int frm` argument
// placed immediately before `vl`.
// Every vector type appears twice:
//   - vector-vector form: second source is the vector `vs1`;
//   - vector-scalar form: second source is the scalar `rs1`, typed
//     _Float16 / float / double to match the element type.
// All forms take a mask `vm`, a `vd` operand of the result type and the
// first source `vs2`.
// NOTE(review): `_tum` presumably selects the tail-undisturbed policy for a
// masked operation, and `frm` the floating-point rounding mode -- confirm
// against the RVV intrinsics spec.

// float16 element types
vfloat16mf4_t __riscv_vfsub_tum(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfsub_tum(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs2, _Float16 rs1,
                                unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfsub_tum(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfsub_tum(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs2, _Float16 rs1,
                                unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfsub_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                               vfloat16m1_t vs1, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfsub_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfsub_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                               vfloat16m2_t vs1, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfsub_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfsub_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                               vfloat16m4_t vs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfsub_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfsub_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                               vfloat16m8_t vs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfsub_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
// float32 element types
vfloat32mf2_t __riscv_vfsub_tum(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfsub_tum(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs2, float rs1, unsigned int frm,
                                size_t vl);
vfloat32m1_t __riscv_vfsub_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                               vfloat32m1_t vs1, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfsub_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                               float rs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfsub_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                               vfloat32m2_t vs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfsub_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                               float rs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfsub_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                               vfloat32m4_t vs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfsub_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                               float rs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfsub_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                               vfloat32m8_t vs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfsub_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                               float rs1, unsigned int frm, size_t vl);
// float64 element types
vfloat64m1_t __riscv_vfsub_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                               vfloat64m1_t vs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfsub_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                               double rs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfsub_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                               vfloat64m2_t vs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfsub_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                               double rs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfsub_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                               vfloat64m4_t vs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfsub_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                               double rs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfsub_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                               vfloat64m8_t vs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfsub_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                               double rs1, unsigned int frm, size_t vl);
// __riscv_vfrsub_tum overloads with an explicit `unsigned int frm` argument
// placed immediately before `vl`.
// One declaration per vector type; only a vector-scalar form is listed
// (scalar `rs1` typed _Float16 / float / double to match the element type).
// Each takes a mask `vm`, a `vd` operand of the result type and the vector
// source `vs2`.
// NOTE(review): `_tum` presumably selects the tail-undisturbed policy for a
// masked operation, `frm` the floating-point rounding mode, and "rsub"
// rs1 - vs2 -- confirm against the RVV specs.

// float16 element types
vfloat16mf4_t __riscv_vfrsub_tum(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, _Float16 rs1,
                                 unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfrsub_tum(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, _Float16 rs1,
                                 unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfrsub_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfrsub_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfrsub_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfrsub_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                _Float16 rs1, unsigned int frm, size_t vl);
// float32 element types
vfloat32mf2_t __riscv_vfrsub_tum(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, float rs1, unsigned int frm,
                                 size_t vl);
vfloat32m1_t __riscv_vfrsub_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                float rs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfrsub_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                float rs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfrsub_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                float rs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfrsub_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                float rs1, unsigned int frm, size_t vl);
// float64 element types
vfloat64m1_t __riscv_vfrsub_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                double rs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfrsub_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                double rs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfrsub_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                double rs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfrsub_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                double rs1, unsigned int frm, size_t vl);
// masked functions (_tumu: tail undisturbed, mask undisturbed; explicit frm)
vfloat16mf4_t __riscv_vfadd_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                 unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfadd_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, _Float16 rs1,
                                 unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfadd_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                 unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfadd_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, _Float16 rs1,
                                 unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfadd_tumu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                vfloat16m1_t vs1, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfadd_tumu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfadd_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                vfloat16m2_t vs1, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfadd_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfadd_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                vfloat16m4_t vs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfadd_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfadd_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                vfloat16m8_t vs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfadd_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                _Float16 rs1, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfadd_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                 unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfadd_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, float rs1, unsigned int frm,
                                 size_t vl);
vfloat32m1_t __riscv_vfadd_tumu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                vfloat32m1_t vs1, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfadd_tumu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                float rs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfadd_tumu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                vfloat32m2_t vs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfadd_tumu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                float rs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfadd_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                vfloat32m4_t vs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfadd_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                float rs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfadd_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                vfloat32m8_t vs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfadd_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                float rs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfadd_tumu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                vfloat64m1_t vs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfadd_tumu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                double rs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfadd_tumu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                vfloat64m2_t vs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfadd_tumu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                double rs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfadd_tumu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                vfloat64m4_t vs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfadd_tumu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                double rs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfadd_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                vfloat64m8_t vs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfadd_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                double rs1, unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfsub_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                 unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfsub_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, _Float16 rs1,
                                 unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfsub_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                 unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfsub_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, _Float16 rs1,
                                 unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfsub_tumu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                vfloat16m1_t vs1, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfsub_tumu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfsub_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                vfloat16m2_t vs1, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfsub_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfsub_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                vfloat16m4_t vs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfsub_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfsub_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                vfloat16m8_t vs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfsub_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                _Float16 rs1, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfsub_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                 unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfsub_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, float rs1, unsigned int frm,
                                 size_t vl);
vfloat32m1_t __riscv_vfsub_tumu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                vfloat32m1_t vs1, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfsub_tumu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                float rs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfsub_tumu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                vfloat32m2_t vs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfsub_tumu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                float rs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfsub_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                vfloat32m4_t vs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfsub_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                float rs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfsub_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                vfloat32m8_t vs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfsub_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                float rs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfsub_tumu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                vfloat64m1_t vs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfsub_tumu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                double rs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfsub_tumu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                vfloat64m2_t vs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfsub_tumu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                double rs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfsub_tumu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                vfloat64m4_t vs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfsub_tumu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                double rs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfsub_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                vfloat64m8_t vs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfsub_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                double rs1, unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfrsub_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat16mf4_t vs2, _Float16 rs1,
                                  unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfrsub_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat16mf2_t vs2, _Float16 rs1,
                                  unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfrsub_tumu(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat16m1_t vs2, _Float16 rs1,
                                 unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfrsub_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                 _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfrsub_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                 _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfrsub_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                 _Float16 rs1, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfrsub_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat32mf2_t vs2, float rs1,
                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfrsub_tumu(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat32m1_t vs2, float rs1, unsigned int frm,
                                 size_t vl);
vfloat32m2_t __riscv_vfrsub_tumu(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat32m2_t vs2, float rs1, unsigned int frm,
                                 size_t vl);
vfloat32m4_t __riscv_vfrsub_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                 float rs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfrsub_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                 float rs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfrsub_tumu(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat64m1_t vs2, double rs1, unsigned int frm,
                                 size_t vl);
vfloat64m2_t __riscv_vfrsub_tumu(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat64m2_t vs2, double rs1, unsigned int frm,
                                 size_t vl);
vfloat64m4_t __riscv_vfrsub_tumu(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat64m4_t vs2, double rs1, unsigned int frm,
                                 size_t vl);
vfloat64m8_t __riscv_vfrsub_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                 double rs1, unsigned int frm, size_t vl);
// masked functions (_mu: tail agnostic, mask undisturbed; explicit frm)
vfloat16mf4_t __riscv_vfadd_mu(vbool64_t vm, vfloat16mf4_t vd,
                               vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                               unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfadd_mu(vbool64_t vm, vfloat16mf4_t vd,
                               vfloat16mf4_t vs2, _Float16 rs1,
                               unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfadd_mu(vbool32_t vm, vfloat16mf2_t vd,
                               vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                               unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfadd_mu(vbool32_t vm, vfloat16mf2_t vd,
                               vfloat16mf2_t vs2, _Float16 rs1,
                               unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfadd_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                              vfloat16m1_t vs1, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfadd_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                              _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfadd_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                              vfloat16m2_t vs1, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfadd_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                              _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfadd_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                              vfloat16m4_t vs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfadd_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                              _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfadd_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                              vfloat16m8_t vs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfadd_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                              _Float16 rs1, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfadd_mu(vbool64_t vm, vfloat32mf2_t vd,
                               vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfadd_mu(vbool64_t vm, vfloat32mf2_t vd,
                               vfloat32mf2_t vs2, float rs1, unsigned int frm,
                               size_t vl);
vfloat32m1_t __riscv_vfadd_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                              vfloat32m1_t vs1, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfadd_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                              float rs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfadd_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                              vfloat32m2_t vs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfadd_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                              float rs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfadd_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                              vfloat32m4_t vs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfadd_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                              float rs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfadd_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                              vfloat32m8_t vs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfadd_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                              float rs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfadd_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                              vfloat64m1_t vs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfadd_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                              double rs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfadd_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                              vfloat64m2_t vs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfadd_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                              double rs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfadd_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                              vfloat64m4_t vs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfadd_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                              double rs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfadd_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                              vfloat64m8_t vs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfadd_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                              double rs1, unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfsub_mu(vbool64_t vm, vfloat16mf4_t vd,
                               vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                               unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfsub_mu(vbool64_t vm, vfloat16mf4_t vd,
                               vfloat16mf4_t vs2, _Float16 rs1,
                               unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfsub_mu(vbool32_t vm, vfloat16mf2_t vd,
                               vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                               unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfsub_mu(vbool32_t vm, vfloat16mf2_t vd,
                               vfloat16mf2_t vs2, _Float16 rs1,
                               unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfsub_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                              vfloat16m1_t vs1, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfsub_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                              _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfsub_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                              vfloat16m2_t vs1, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfsub_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                              _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfsub_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                              vfloat16m4_t vs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfsub_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                              _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfsub_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                              vfloat16m8_t vs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfsub_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                              _Float16 rs1, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfsub_mu(vbool64_t vm, vfloat32mf2_t vd,
                               vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfsub_mu(vbool64_t vm, vfloat32mf2_t vd,
                               vfloat32mf2_t vs2, float rs1, unsigned int frm,
                               size_t vl);
vfloat32m1_t __riscv_vfsub_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                              vfloat32m1_t vs1, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfsub_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                              float rs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfsub_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                              vfloat32m2_t vs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfsub_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                              float rs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfsub_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                              vfloat32m4_t vs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfsub_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                              float rs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfsub_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                              vfloat32m8_t vs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfsub_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                              float rs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfsub_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                              vfloat64m1_t vs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfsub_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                              double rs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfsub_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                              vfloat64m2_t vs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfsub_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                              double rs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfsub_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                              vfloat64m4_t vs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfsub_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                              double rs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfsub_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                              vfloat64m8_t vs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfsub_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                              double rs1, unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfrsub_mu(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs2, _Float16 rs1,
                                unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfrsub_mu(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs2, _Float16 rs1,
                                unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfrsub_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfrsub_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfrsub_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfrsub_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfrsub_mu(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs2, float rs1, unsigned int frm,
                                size_t vl);
vfloat32m1_t __riscv_vfrsub_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                               float rs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfrsub_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                               float rs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfrsub_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                               float rs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfrsub_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                               float rs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfrsub_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                               double rs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfrsub_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                               double rs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfrsub_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                               double rs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfrsub_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                               double rs1, unsigned int frm, size_t vl);

Vector Widening Floating-Point Add/Subtract Intrinsics

vfloat32mf2_t __riscv_vfwadd_vv_tu(vfloat32mf2_t vd, vfloat16mf4_t vs2,
                                   vfloat16mf4_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfwadd_vf_tu(vfloat32mf2_t vd, vfloat16mf4_t vs2,
                                   _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfwadd_wv_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                   vfloat16mf4_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfwadd_wf_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                   _Float16 rs1, size_t vl);
vfloat32m1_t __riscv_vfwadd_vv_tu(vfloat32m1_t vd, vfloat16mf2_t vs2,
                                  vfloat16mf2_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwadd_vf_tu(vfloat32m1_t vd, vfloat16mf2_t vs2,
                                  _Float16 rs1, size_t vl);
vfloat32m1_t __riscv_vfwadd_wv_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                  vfloat16mf2_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwadd_wf_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                  _Float16 rs1, size_t vl);
vfloat32m2_t __riscv_vfwadd_vv_tu(vfloat32m2_t vd, vfloat16m1_t vs2,
                                  vfloat16m1_t vs1, size_t vl);
vfloat32m2_t __riscv_vfwadd_vf_tu(vfloat32m2_t vd, vfloat16m1_t vs2,
                                  _Float16 rs1, size_t vl);
vfloat32m2_t __riscv_vfwadd_wv_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                  vfloat16m1_t vs1, size_t vl);
vfloat32m2_t __riscv_vfwadd_wf_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                  _Float16 rs1, size_t vl);
vfloat32m4_t __riscv_vfwadd_vv_tu(vfloat32m4_t vd, vfloat16m2_t vs2,
                                  vfloat16m2_t vs1, size_t vl);
vfloat32m4_t __riscv_vfwadd_vf_tu(vfloat32m4_t vd, vfloat16m2_t vs2,
                                  _Float16 rs1, size_t vl);
vfloat32m4_t __riscv_vfwadd_wv_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                  vfloat16m2_t vs1, size_t vl);
vfloat32m4_t __riscv_vfwadd_wf_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                  _Float16 rs1, size_t vl);
vfloat32m8_t __riscv_vfwadd_vv_tu(vfloat32m8_t vd, vfloat16m4_t vs2,
                                  vfloat16m4_t vs1, size_t vl);
vfloat32m8_t __riscv_vfwadd_vf_tu(vfloat32m8_t vd, vfloat16m4_t vs2,
                                  _Float16 rs1, size_t vl);
vfloat32m8_t __riscv_vfwadd_wv_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                  vfloat16m4_t vs1, size_t vl);
vfloat32m8_t __riscv_vfwadd_wf_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                  _Float16 rs1, size_t vl);
vfloat64m1_t __riscv_vfwadd_vv_tu(vfloat64m1_t vd, vfloat32mf2_t vs2,
                                  vfloat32mf2_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwadd_vf_tu(vfloat64m1_t vd, vfloat32mf2_t vs2, float rs1,
                                  size_t vl);
vfloat64m1_t __riscv_vfwadd_wv_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                  vfloat32mf2_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwadd_wf_tu(vfloat64m1_t vd, vfloat64m1_t vs2, float rs1,
                                  size_t vl);
vfloat64m2_t __riscv_vfwadd_vv_tu(vfloat64m2_t vd, vfloat32m1_t vs2,
                                  vfloat32m1_t vs1, size_t vl);
vfloat64m2_t __riscv_vfwadd_vf_tu(vfloat64m2_t vd, vfloat32m1_t vs2, float rs1,
                                  size_t vl);
vfloat64m2_t __riscv_vfwadd_wv_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                  vfloat32m1_t vs1, size_t vl);
vfloat64m2_t __riscv_vfwadd_wf_tu(vfloat64m2_t vd, vfloat64m2_t vs2, float rs1,
                                  size_t vl);
vfloat64m4_t __riscv_vfwadd_vv_tu(vfloat64m4_t vd, vfloat32m2_t vs2,
                                  vfloat32m2_t vs1, size_t vl);
vfloat64m4_t __riscv_vfwadd_vf_tu(vfloat64m4_t vd, vfloat32m2_t vs2, float rs1,
                                  size_t vl);
vfloat64m4_t __riscv_vfwadd_wv_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                  vfloat32m2_t vs1, size_t vl);
vfloat64m4_t __riscv_vfwadd_wf_tu(vfloat64m4_t vd, vfloat64m4_t vs2, float rs1,
                                  size_t vl);
vfloat64m8_t __riscv_vfwadd_vv_tu(vfloat64m8_t vd, vfloat32m4_t vs2,
                                  vfloat32m4_t vs1, size_t vl);
vfloat64m8_t __riscv_vfwadd_vf_tu(vfloat64m8_t vd, vfloat32m4_t vs2, float rs1,
                                  size_t vl);
vfloat64m8_t __riscv_vfwadd_wv_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                  vfloat32m4_t vs1, size_t vl);
vfloat64m8_t __riscv_vfwadd_wf_tu(vfloat64m8_t vd, vfloat64m8_t vs2, float rs1,
                                  size_t vl);
vfloat32mf2_t __riscv_vfwsub_vv_tu(vfloat32mf2_t vd, vfloat16mf4_t vs2,
                                   vfloat16mf4_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfwsub_vf_tu(vfloat32mf2_t vd, vfloat16mf4_t vs2,
                                   _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfwsub_wv_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                   vfloat16mf4_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfwsub_wf_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                   _Float16 rs1, size_t vl);
vfloat32m1_t __riscv_vfwsub_vv_tu(vfloat32m1_t vd, vfloat16mf2_t vs2,
                                  vfloat16mf2_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwsub_vf_tu(vfloat32m1_t vd, vfloat16mf2_t vs2,
                                  _Float16 rs1, size_t vl);
vfloat32m1_t __riscv_vfwsub_wv_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                  vfloat16mf2_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwsub_wf_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                  _Float16 rs1, size_t vl);
vfloat32m2_t __riscv_vfwsub_vv_tu(vfloat32m2_t vd, vfloat16m1_t vs2,
                                  vfloat16m1_t vs1, size_t vl);
vfloat32m2_t __riscv_vfwsub_vf_tu(vfloat32m2_t vd, vfloat16m1_t vs2,
                                  _Float16 rs1, size_t vl);
vfloat32m2_t __riscv_vfwsub_wv_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                  vfloat16m1_t vs1, size_t vl);
vfloat32m2_t __riscv_vfwsub_wf_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                  _Float16 rs1, size_t vl);
vfloat32m4_t __riscv_vfwsub_vv_tu(vfloat32m4_t vd, vfloat16m2_t vs2,
                                  vfloat16m2_t vs1, size_t vl);
vfloat32m4_t __riscv_vfwsub_vf_tu(vfloat32m4_t vd, vfloat16m2_t vs2,
                                  _Float16 rs1, size_t vl);
vfloat32m4_t __riscv_vfwsub_wv_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                  vfloat16m2_t vs1, size_t vl);
vfloat32m4_t __riscv_vfwsub_wf_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                  _Float16 rs1, size_t vl);
vfloat32m8_t __riscv_vfwsub_vv_tu(vfloat32m8_t vd, vfloat16m4_t vs2,
                                  vfloat16m4_t vs1, size_t vl);
vfloat32m8_t __riscv_vfwsub_vf_tu(vfloat32m8_t vd, vfloat16m4_t vs2,
                                  _Float16 rs1, size_t vl);
vfloat32m8_t __riscv_vfwsub_wv_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                  vfloat16m4_t vs1, size_t vl);
vfloat32m8_t __riscv_vfwsub_wf_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                  _Float16 rs1, size_t vl);
vfloat64m1_t __riscv_vfwsub_vv_tu(vfloat64m1_t vd, vfloat32mf2_t vs2,
                                  vfloat32mf2_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwsub_vf_tu(vfloat64m1_t vd, vfloat32mf2_t vs2, float rs1,
                                  size_t vl);
vfloat64m1_t __riscv_vfwsub_wv_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                  vfloat32mf2_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwsub_wf_tu(vfloat64m1_t vd, vfloat64m1_t vs2, float rs1,
                                  size_t vl);
vfloat64m2_t __riscv_vfwsub_vv_tu(vfloat64m2_t vd, vfloat32m1_t vs2,
                                  vfloat32m1_t vs1, size_t vl);
vfloat64m2_t __riscv_vfwsub_vf_tu(vfloat64m2_t vd, vfloat32m1_t vs2, float rs1,
                                  size_t vl);
vfloat64m2_t __riscv_vfwsub_wv_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                  vfloat32m1_t vs1, size_t vl);
vfloat64m2_t __riscv_vfwsub_wf_tu(vfloat64m2_t vd, vfloat64m2_t vs2, float rs1,
                                  size_t vl);
vfloat64m4_t __riscv_vfwsub_vv_tu(vfloat64m4_t vd, vfloat32m2_t vs2,
                                  vfloat32m2_t vs1, size_t vl);
vfloat64m4_t __riscv_vfwsub_vf_tu(vfloat64m4_t vd, vfloat32m2_t vs2, float rs1,
                                  size_t vl);
vfloat64m4_t __riscv_vfwsub_wv_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                  vfloat32m2_t vs1, size_t vl);
vfloat64m4_t __riscv_vfwsub_wf_tu(vfloat64m4_t vd, vfloat64m4_t vs2, float rs1,
                                  size_t vl);
vfloat64m8_t __riscv_vfwsub_vv_tu(vfloat64m8_t vd, vfloat32m4_t vs2,
                                  vfloat32m4_t vs1, size_t vl);
vfloat64m8_t __riscv_vfwsub_vf_tu(vfloat64m8_t vd, vfloat32m4_t vs2, float rs1,
                                  size_t vl);
vfloat64m8_t __riscv_vfwsub_wv_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                  vfloat32m4_t vs1, size_t vl);
vfloat64m8_t __riscv_vfwsub_wf_tu(vfloat64m8_t vd, vfloat64m8_t vs2, float rs1,
                                  size_t vl);
// masked functions (_tum: tail-undisturbed, mask-agnostic policy)
vfloat32mf2_t __riscv_vfwadd_vv_tum(vbool64_t vm, vfloat32mf2_t vd,
                                    vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                    size_t vl);
vfloat32mf2_t __riscv_vfwadd_vf_tum(vbool64_t vm, vfloat32mf2_t vd,
                                    vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfwadd_wv_tum(vbool64_t vm, vfloat32mf2_t vd,
                                    vfloat32mf2_t vs2, vfloat16mf4_t vs1,
                                    size_t vl);
vfloat32mf2_t __riscv_vfwadd_wf_tum(vbool64_t vm, vfloat32mf2_t vd,
                                    vfloat32mf2_t vs2, _Float16 rs1, size_t vl);
vfloat32m1_t __riscv_vfwadd_vv_tum(vbool32_t vm, vfloat32m1_t vd,
                                   vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                   size_t vl);
vfloat32m1_t __riscv_vfwadd_vf_tum(vbool32_t vm, vfloat32m1_t vd,
                                   vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat32m1_t __riscv_vfwadd_wv_tum(vbool32_t vm, vfloat32m1_t vd,
                                   vfloat32m1_t vs2, vfloat16mf2_t vs1,
                                   size_t vl);
vfloat32m1_t __riscv_vfwadd_wf_tum(vbool32_t vm, vfloat32m1_t vd,
                                   vfloat32m1_t vs2, _Float16 rs1, size_t vl);
vfloat32m2_t __riscv_vfwadd_vv_tum(vbool16_t vm, vfloat32m2_t vd,
                                   vfloat16m1_t vs2, vfloat16m1_t vs1,
                                   size_t vl);
vfloat32m2_t __riscv_vfwadd_vf_tum(vbool16_t vm, vfloat32m2_t vd,
                                   vfloat16m1_t vs2, _Float16 rs1, size_t vl);
vfloat32m2_t __riscv_vfwadd_wv_tum(vbool16_t vm, vfloat32m2_t vd,
                                   vfloat32m2_t vs2, vfloat16m1_t vs1,
                                   size_t vl);
vfloat32m2_t __riscv_vfwadd_wf_tum(vbool16_t vm, vfloat32m2_t vd,
                                   vfloat32m2_t vs2, _Float16 rs1, size_t vl);
vfloat32m4_t __riscv_vfwadd_vv_tum(vbool8_t vm, vfloat32m4_t vd,
                                   vfloat16m2_t vs2, vfloat16m2_t vs1,
                                   size_t vl);
vfloat32m4_t __riscv_vfwadd_vf_tum(vbool8_t vm, vfloat32m4_t vd,
                                   vfloat16m2_t vs2, _Float16 rs1, size_t vl);
vfloat32m4_t __riscv_vfwadd_wv_tum(vbool8_t vm, vfloat32m4_t vd,
                                   vfloat32m4_t vs2, vfloat16m2_t vs1,
                                   size_t vl);
vfloat32m4_t __riscv_vfwadd_wf_tum(vbool8_t vm, vfloat32m4_t vd,
                                   vfloat32m4_t vs2, _Float16 rs1, size_t vl);
vfloat32m8_t __riscv_vfwadd_vv_tum(vbool4_t vm, vfloat32m8_t vd,
                                   vfloat16m4_t vs2, vfloat16m4_t vs1,
                                   size_t vl);
vfloat32m8_t __riscv_vfwadd_vf_tum(vbool4_t vm, vfloat32m8_t vd,
                                   vfloat16m4_t vs2, _Float16 rs1, size_t vl);
vfloat32m8_t __riscv_vfwadd_wv_tum(vbool4_t vm, vfloat32m8_t vd,
                                   vfloat32m8_t vs2, vfloat16m4_t vs1,
                                   size_t vl);
vfloat32m8_t __riscv_vfwadd_wf_tum(vbool4_t vm, vfloat32m8_t vd,
                                   vfloat32m8_t vs2, _Float16 rs1, size_t vl);
vfloat64m1_t __riscv_vfwadd_vv_tum(vbool64_t vm, vfloat64m1_t vd,
                                   vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                   size_t vl);
vfloat64m1_t __riscv_vfwadd_vf_tum(vbool64_t vm, vfloat64m1_t vd,
                                   vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat64m1_t __riscv_vfwadd_wv_tum(vbool64_t vm, vfloat64m1_t vd,
                                   vfloat64m1_t vs2, vfloat32mf2_t vs1,
                                   size_t vl);
vfloat64m1_t __riscv_vfwadd_wf_tum(vbool64_t vm, vfloat64m1_t vd,
                                   vfloat64m1_t vs2, float rs1, size_t vl);
vfloat64m2_t __riscv_vfwadd_vv_tum(vbool32_t vm, vfloat64m2_t vd,
                                   vfloat32m1_t vs2, vfloat32m1_t vs1,
                                   size_t vl);
vfloat64m2_t __riscv_vfwadd_vf_tum(vbool32_t vm, vfloat64m2_t vd,
                                   vfloat32m1_t vs2, float rs1, size_t vl);
vfloat64m2_t __riscv_vfwadd_wv_tum(vbool32_t vm, vfloat64m2_t vd,
                                   vfloat64m2_t vs2, vfloat32m1_t vs1,
                                   size_t vl);
vfloat64m2_t __riscv_vfwadd_wf_tum(vbool32_t vm, vfloat64m2_t vd,
                                   vfloat64m2_t vs2, float rs1, size_t vl);
vfloat64m4_t __riscv_vfwadd_vv_tum(vbool16_t vm, vfloat64m4_t vd,
                                   vfloat32m2_t vs2, vfloat32m2_t vs1,
                                   size_t vl);
vfloat64m4_t __riscv_vfwadd_vf_tum(vbool16_t vm, vfloat64m4_t vd,
                                   vfloat32m2_t vs2, float rs1, size_t vl);
vfloat64m4_t __riscv_vfwadd_wv_tum(vbool16_t vm, vfloat64m4_t vd,
                                   vfloat64m4_t vs2, vfloat32m2_t vs1,
                                   size_t vl);
vfloat64m4_t __riscv_vfwadd_wf_tum(vbool16_t vm, vfloat64m4_t vd,
                                   vfloat64m4_t vs2, float rs1, size_t vl);
vfloat64m8_t __riscv_vfwadd_vv_tum(vbool8_t vm, vfloat64m8_t vd,
                                   vfloat32m4_t vs2, vfloat32m4_t vs1,
                                   size_t vl);
vfloat64m8_t __riscv_vfwadd_vf_tum(vbool8_t vm, vfloat64m8_t vd,
                                   vfloat32m4_t vs2, float rs1, size_t vl);
vfloat64m8_t __riscv_vfwadd_wv_tum(vbool8_t vm, vfloat64m8_t vd,
                                   vfloat64m8_t vs2, vfloat32m4_t vs1,
                                   size_t vl);
vfloat64m8_t __riscv_vfwadd_wf_tum(vbool8_t vm, vfloat64m8_t vd,
                                   vfloat64m8_t vs2, float rs1, size_t vl);
vfloat32mf2_t __riscv_vfwsub_vv_tum(vbool64_t vm, vfloat32mf2_t vd,
                                    vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                    size_t vl);
vfloat32mf2_t __riscv_vfwsub_vf_tum(vbool64_t vm, vfloat32mf2_t vd,
                                    vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfwsub_wv_tum(vbool64_t vm, vfloat32mf2_t vd,
                                    vfloat32mf2_t vs2, vfloat16mf4_t vs1,
                                    size_t vl);
vfloat32mf2_t __riscv_vfwsub_wf_tum(vbool64_t vm, vfloat32mf2_t vd,
                                    vfloat32mf2_t vs2, _Float16 rs1, size_t vl);
vfloat32m1_t __riscv_vfwsub_vv_tum(vbool32_t vm, vfloat32m1_t vd,
                                   vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                   size_t vl);
vfloat32m1_t __riscv_vfwsub_vf_tum(vbool32_t vm, vfloat32m1_t vd,
                                   vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat32m1_t __riscv_vfwsub_wv_tum(vbool32_t vm, vfloat32m1_t vd,
                                   vfloat32m1_t vs2, vfloat16mf2_t vs1,
                                   size_t vl);
vfloat32m1_t __riscv_vfwsub_wf_tum(vbool32_t vm, vfloat32m1_t vd,
                                   vfloat32m1_t vs2, _Float16 rs1, size_t vl);
vfloat32m2_t __riscv_vfwsub_vv_tum(vbool16_t vm, vfloat32m2_t vd,
                                   vfloat16m1_t vs2, vfloat16m1_t vs1,
                                   size_t vl);
vfloat32m2_t __riscv_vfwsub_vf_tum(vbool16_t vm, vfloat32m2_t vd,
                                   vfloat16m1_t vs2, _Float16 rs1, size_t vl);
vfloat32m2_t __riscv_vfwsub_wv_tum(vbool16_t vm, vfloat32m2_t vd,
                                   vfloat32m2_t vs2, vfloat16m1_t vs1,
                                   size_t vl);
vfloat32m2_t __riscv_vfwsub_wf_tum(vbool16_t vm, vfloat32m2_t vd,
                                   vfloat32m2_t vs2, _Float16 rs1, size_t vl);
vfloat32m4_t __riscv_vfwsub_vv_tum(vbool8_t vm, vfloat32m4_t vd,
                                   vfloat16m2_t vs2, vfloat16m2_t vs1,
                                   size_t vl);
vfloat32m4_t __riscv_vfwsub_vf_tum(vbool8_t vm, vfloat32m4_t vd,
                                   vfloat16m2_t vs2, _Float16 rs1, size_t vl);
vfloat32m4_t __riscv_vfwsub_wv_tum(vbool8_t vm, vfloat32m4_t vd,
                                   vfloat32m4_t vs2, vfloat16m2_t vs1,
                                   size_t vl);
vfloat32m4_t __riscv_vfwsub_wf_tum(vbool8_t vm, vfloat32m4_t vd,
                                   vfloat32m4_t vs2, _Float16 rs1, size_t vl);
vfloat32m8_t __riscv_vfwsub_vv_tum(vbool4_t vm, vfloat32m8_t vd,
                                   vfloat16m4_t vs2, vfloat16m4_t vs1,
                                   size_t vl);
vfloat32m8_t __riscv_vfwsub_vf_tum(vbool4_t vm, vfloat32m8_t vd,
                                   vfloat16m4_t vs2, _Float16 rs1, size_t vl);
vfloat32m8_t __riscv_vfwsub_wv_tum(vbool4_t vm, vfloat32m8_t vd,
                                   vfloat32m8_t vs2, vfloat16m4_t vs1,
                                   size_t vl);
vfloat32m8_t __riscv_vfwsub_wf_tum(vbool4_t vm, vfloat32m8_t vd,
                                   vfloat32m8_t vs2, _Float16 rs1, size_t vl);
vfloat64m1_t __riscv_vfwsub_vv_tum(vbool64_t vm, vfloat64m1_t vd,
                                   vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                   size_t vl);
vfloat64m1_t __riscv_vfwsub_vf_tum(vbool64_t vm, vfloat64m1_t vd,
                                   vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat64m1_t __riscv_vfwsub_wv_tum(vbool64_t vm, vfloat64m1_t vd,
                                   vfloat64m1_t vs2, vfloat32mf2_t vs1,
                                   size_t vl);
vfloat64m1_t __riscv_vfwsub_wf_tum(vbool64_t vm, vfloat64m1_t vd,
                                   vfloat64m1_t vs2, float rs1, size_t vl);
vfloat64m2_t __riscv_vfwsub_vv_tum(vbool32_t vm, vfloat64m2_t vd,
                                   vfloat32m1_t vs2, vfloat32m1_t vs1,
                                   size_t vl);
vfloat64m2_t __riscv_vfwsub_vf_tum(vbool32_t vm, vfloat64m2_t vd,
                                   vfloat32m1_t vs2, float rs1, size_t vl);
vfloat64m2_t __riscv_vfwsub_wv_tum(vbool32_t vm, vfloat64m2_t vd,
                                   vfloat64m2_t vs2, vfloat32m1_t vs1,
                                   size_t vl);
vfloat64m2_t __riscv_vfwsub_wf_tum(vbool32_t vm, vfloat64m2_t vd,
                                   vfloat64m2_t vs2, float rs1, size_t vl);
vfloat64m4_t __riscv_vfwsub_vv_tum(vbool16_t vm, vfloat64m4_t vd,
                                   vfloat32m2_t vs2, vfloat32m2_t vs1,
                                   size_t vl);
vfloat64m4_t __riscv_vfwsub_vf_tum(vbool16_t vm, vfloat64m4_t vd,
                                   vfloat32m2_t vs2, float rs1, size_t vl);
vfloat64m4_t __riscv_vfwsub_wv_tum(vbool16_t vm, vfloat64m4_t vd,
                                   vfloat64m4_t vs2, vfloat32m2_t vs1,
                                   size_t vl);
vfloat64m4_t __riscv_vfwsub_wf_tum(vbool16_t vm, vfloat64m4_t vd,
                                   vfloat64m4_t vs2, float rs1, size_t vl);
vfloat64m8_t __riscv_vfwsub_vv_tum(vbool8_t vm, vfloat64m8_t vd,
                                   vfloat32m4_t vs2, vfloat32m4_t vs1,
                                   size_t vl);
vfloat64m8_t __riscv_vfwsub_vf_tum(vbool8_t vm, vfloat64m8_t vd,
                                   vfloat32m4_t vs2, float rs1, size_t vl);
vfloat64m8_t __riscv_vfwsub_wv_tum(vbool8_t vm, vfloat64m8_t vd,
                                   vfloat64m8_t vs2, vfloat32m4_t vs1,
                                   size_t vl);
vfloat64m8_t __riscv_vfwsub_wf_tum(vbool8_t vm, vfloat64m8_t vd,
                                   vfloat64m8_t vs2, float rs1, size_t vl);
// masked functions (_tumu: tail-undisturbed, mask-undisturbed policy)
vfloat32mf2_t __riscv_vfwadd_vv_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                     vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                     size_t vl);
vfloat32mf2_t __riscv_vfwadd_vf_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                     vfloat16mf4_t vs2, _Float16 rs1,
                                     size_t vl);
vfloat32mf2_t __riscv_vfwadd_wv_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                     vfloat32mf2_t vs2, vfloat16mf4_t vs1,
                                     size_t vl);
vfloat32mf2_t __riscv_vfwadd_wf_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                     vfloat32mf2_t vs2, _Float16 rs1,
                                     size_t vl);
vfloat32m1_t __riscv_vfwadd_vv_tumu(vbool32_t vm, vfloat32m1_t vd,
                                    vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                    size_t vl);
vfloat32m1_t __riscv_vfwadd_vf_tumu(vbool32_t vm, vfloat32m1_t vd,
                                    vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat32m1_t __riscv_vfwadd_wv_tumu(vbool32_t vm, vfloat32m1_t vd,
                                    vfloat32m1_t vs2, vfloat16mf2_t vs1,
                                    size_t vl);
vfloat32m1_t __riscv_vfwadd_wf_tumu(vbool32_t vm, vfloat32m1_t vd,
                                    vfloat32m1_t vs2, _Float16 rs1, size_t vl);
vfloat32m2_t __riscv_vfwadd_vv_tumu(vbool16_t vm, vfloat32m2_t vd,
                                    vfloat16m1_t vs2, vfloat16m1_t vs1,
                                    size_t vl);
vfloat32m2_t __riscv_vfwadd_vf_tumu(vbool16_t vm, vfloat32m2_t vd,
                                    vfloat16m1_t vs2, _Float16 rs1, size_t vl);
vfloat32m2_t __riscv_vfwadd_wv_tumu(vbool16_t vm, vfloat32m2_t vd,
                                    vfloat32m2_t vs2, vfloat16m1_t vs1,
                                    size_t vl);
vfloat32m2_t __riscv_vfwadd_wf_tumu(vbool16_t vm, vfloat32m2_t vd,
                                    vfloat32m2_t vs2, _Float16 rs1, size_t vl);
vfloat32m4_t __riscv_vfwadd_vv_tumu(vbool8_t vm, vfloat32m4_t vd,
                                    vfloat16m2_t vs2, vfloat16m2_t vs1,
                                    size_t vl);
vfloat32m4_t __riscv_vfwadd_vf_tumu(vbool8_t vm, vfloat32m4_t vd,
                                    vfloat16m2_t vs2, _Float16 rs1, size_t vl);
vfloat32m4_t __riscv_vfwadd_wv_tumu(vbool8_t vm, vfloat32m4_t vd,
                                    vfloat32m4_t vs2, vfloat16m2_t vs1,
                                    size_t vl);
vfloat32m4_t __riscv_vfwadd_wf_tumu(vbool8_t vm, vfloat32m4_t vd,
                                    vfloat32m4_t vs2, _Float16 rs1, size_t vl);
vfloat32m8_t __riscv_vfwadd_vv_tumu(vbool4_t vm, vfloat32m8_t vd,
                                    vfloat16m4_t vs2, vfloat16m4_t vs1,
                                    size_t vl);
vfloat32m8_t __riscv_vfwadd_vf_tumu(vbool4_t vm, vfloat32m8_t vd,
                                    vfloat16m4_t vs2, _Float16 rs1, size_t vl);
vfloat32m8_t __riscv_vfwadd_wv_tumu(vbool4_t vm, vfloat32m8_t vd,
                                    vfloat32m8_t vs2, vfloat16m4_t vs1,
                                    size_t vl);
vfloat32m8_t __riscv_vfwadd_wf_tumu(vbool4_t vm, vfloat32m8_t vd,
                                    vfloat32m8_t vs2, _Float16 rs1, size_t vl);
vfloat64m1_t __riscv_vfwadd_vv_tumu(vbool64_t vm, vfloat64m1_t vd,
                                    vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                    size_t vl);
vfloat64m1_t __riscv_vfwadd_vf_tumu(vbool64_t vm, vfloat64m1_t vd,
                                    vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat64m1_t __riscv_vfwadd_wv_tumu(vbool64_t vm, vfloat64m1_t vd,
                                    vfloat64m1_t vs2, vfloat32mf2_t vs1,
                                    size_t vl);
vfloat64m1_t __riscv_vfwadd_wf_tumu(vbool64_t vm, vfloat64m1_t vd,
                                    vfloat64m1_t vs2, float rs1, size_t vl);
vfloat64m2_t __riscv_vfwadd_vv_tumu(vbool32_t vm, vfloat64m2_t vd,
                                    vfloat32m1_t vs2, vfloat32m1_t vs1,
                                    size_t vl);
vfloat64m2_t __riscv_vfwadd_vf_tumu(vbool32_t vm, vfloat64m2_t vd,
                                    vfloat32m1_t vs2, float rs1, size_t vl);
vfloat64m2_t __riscv_vfwadd_wv_tumu(vbool32_t vm, vfloat64m2_t vd,
                                    vfloat64m2_t vs2, vfloat32m1_t vs1,
                                    size_t vl);
vfloat64m2_t __riscv_vfwadd_wf_tumu(vbool32_t vm, vfloat64m2_t vd,
                                    vfloat64m2_t vs2, float rs1, size_t vl);
vfloat64m4_t __riscv_vfwadd_vv_tumu(vbool16_t vm, vfloat64m4_t vd,
                                    vfloat32m2_t vs2, vfloat32m2_t vs1,
                                    size_t vl);
vfloat64m4_t __riscv_vfwadd_vf_tumu(vbool16_t vm, vfloat64m4_t vd,
                                    vfloat32m2_t vs2, float rs1, size_t vl);
vfloat64m4_t __riscv_vfwadd_wv_tumu(vbool16_t vm, vfloat64m4_t vd,
                                    vfloat64m4_t vs2, vfloat32m2_t vs1,
                                    size_t vl);
vfloat64m4_t __riscv_vfwadd_wf_tumu(vbool16_t vm, vfloat64m4_t vd,
                                    vfloat64m4_t vs2, float rs1, size_t vl);
vfloat64m8_t __riscv_vfwadd_vv_tumu(vbool8_t vm, vfloat64m8_t vd,
                                    vfloat32m4_t vs2, vfloat32m4_t vs1,
                                    size_t vl);
vfloat64m8_t __riscv_vfwadd_vf_tumu(vbool8_t vm, vfloat64m8_t vd,
                                    vfloat32m4_t vs2, float rs1, size_t vl);
vfloat64m8_t __riscv_vfwadd_wv_tumu(vbool8_t vm, vfloat64m8_t vd,
                                    vfloat64m8_t vs2, vfloat32m4_t vs1,
                                    size_t vl);
vfloat64m8_t __riscv_vfwadd_wf_tumu(vbool8_t vm, vfloat64m8_t vd,
                                    vfloat64m8_t vs2, float rs1, size_t vl);
vfloat32mf2_t __riscv_vfwsub_vv_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                     vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                     size_t vl);
vfloat32mf2_t __riscv_vfwsub_vf_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                     vfloat16mf4_t vs2, _Float16 rs1,
                                     size_t vl);
vfloat32mf2_t __riscv_vfwsub_wv_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                     vfloat32mf2_t vs2, vfloat16mf4_t vs1,
                                     size_t vl);
vfloat32mf2_t __riscv_vfwsub_wf_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                     vfloat32mf2_t vs2, _Float16 rs1,
                                     size_t vl);
vfloat32m1_t __riscv_vfwsub_vv_tumu(vbool32_t vm, vfloat32m1_t vd,
                                    vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                    size_t vl);
vfloat32m1_t __riscv_vfwsub_vf_tumu(vbool32_t vm, vfloat32m1_t vd,
                                    vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat32m1_t __riscv_vfwsub_wv_tumu(vbool32_t vm, vfloat32m1_t vd,
                                    vfloat32m1_t vs2, vfloat16mf2_t vs1,
                                    size_t vl);
vfloat32m1_t __riscv_vfwsub_wf_tumu(vbool32_t vm, vfloat32m1_t vd,
                                    vfloat32m1_t vs2, _Float16 rs1, size_t vl);
vfloat32m2_t __riscv_vfwsub_vv_tumu(vbool16_t vm, vfloat32m2_t vd,
                                    vfloat16m1_t vs2, vfloat16m1_t vs1,
                                    size_t vl);
vfloat32m2_t __riscv_vfwsub_vf_tumu(vbool16_t vm, vfloat32m2_t vd,
                                    vfloat16m1_t vs2, _Float16 rs1, size_t vl);
vfloat32m2_t __riscv_vfwsub_wv_tumu(vbool16_t vm, vfloat32m2_t vd,
                                    vfloat32m2_t vs2, vfloat16m1_t vs1,
                                    size_t vl);
vfloat32m2_t __riscv_vfwsub_wf_tumu(vbool16_t vm, vfloat32m2_t vd,
                                    vfloat32m2_t vs2, _Float16 rs1, size_t vl);
vfloat32m4_t __riscv_vfwsub_vv_tumu(vbool8_t vm, vfloat32m4_t vd,
                                    vfloat16m2_t vs2, vfloat16m2_t vs1,
                                    size_t vl);
vfloat32m4_t __riscv_vfwsub_vf_tumu(vbool8_t vm, vfloat32m4_t vd,
                                    vfloat16m2_t vs2, _Float16 rs1, size_t vl);
vfloat32m4_t __riscv_vfwsub_wv_tumu(vbool8_t vm, vfloat32m4_t vd,
                                    vfloat32m4_t vs2, vfloat16m2_t vs1,
                                    size_t vl);
vfloat32m4_t __riscv_vfwsub_wf_tumu(vbool8_t vm, vfloat32m4_t vd,
                                    vfloat32m4_t vs2, _Float16 rs1, size_t vl);
vfloat32m8_t __riscv_vfwsub_vv_tumu(vbool4_t vm, vfloat32m8_t vd,
                                    vfloat16m4_t vs2, vfloat16m4_t vs1,
                                    size_t vl);
vfloat32m8_t __riscv_vfwsub_vf_tumu(vbool4_t vm, vfloat32m8_t vd,
                                    vfloat16m4_t vs2, _Float16 rs1, size_t vl);
vfloat32m8_t __riscv_vfwsub_wv_tumu(vbool4_t vm, vfloat32m8_t vd,
                                    vfloat32m8_t vs2, vfloat16m4_t vs1,
                                    size_t vl);
vfloat32m8_t __riscv_vfwsub_wf_tumu(vbool4_t vm, vfloat32m8_t vd,
                                    vfloat32m8_t vs2, _Float16 rs1, size_t vl);
vfloat64m1_t __riscv_vfwsub_vv_tumu(vbool64_t vm, vfloat64m1_t vd,
                                    vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                    size_t vl);
vfloat64m1_t __riscv_vfwsub_vf_tumu(vbool64_t vm, vfloat64m1_t vd,
                                    vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat64m1_t __riscv_vfwsub_wv_tumu(vbool64_t vm, vfloat64m1_t vd,
                                    vfloat64m1_t vs2, vfloat32mf2_t vs1,
                                    size_t vl);
vfloat64m1_t __riscv_vfwsub_wf_tumu(vbool64_t vm, vfloat64m1_t vd,
                                    vfloat64m1_t vs2, float rs1, size_t vl);
vfloat64m2_t __riscv_vfwsub_vv_tumu(vbool32_t vm, vfloat64m2_t vd,
                                    vfloat32m1_t vs2, vfloat32m1_t vs1,
                                    size_t vl);
vfloat64m2_t __riscv_vfwsub_vf_tumu(vbool32_t vm, vfloat64m2_t vd,
                                    vfloat32m1_t vs2, float rs1, size_t vl);
vfloat64m2_t __riscv_vfwsub_wv_tumu(vbool32_t vm, vfloat64m2_t vd,
                                    vfloat64m2_t vs2, vfloat32m1_t vs1,
                                    size_t vl);
vfloat64m2_t __riscv_vfwsub_wf_tumu(vbool32_t vm, vfloat64m2_t vd,
                                    vfloat64m2_t vs2, float rs1, size_t vl);
vfloat64m4_t __riscv_vfwsub_vv_tumu(vbool16_t vm, vfloat64m4_t vd,
                                    vfloat32m2_t vs2, vfloat32m2_t vs1,
                                    size_t vl);
vfloat64m4_t __riscv_vfwsub_vf_tumu(vbool16_t vm, vfloat64m4_t vd,
                                    vfloat32m2_t vs2, float rs1, size_t vl);
vfloat64m4_t __riscv_vfwsub_wv_tumu(vbool16_t vm, vfloat64m4_t vd,
                                    vfloat64m4_t vs2, vfloat32m2_t vs1,
                                    size_t vl);
vfloat64m4_t __riscv_vfwsub_wf_tumu(vbool16_t vm, vfloat64m4_t vd,
                                    vfloat64m4_t vs2, float rs1, size_t vl);
vfloat64m8_t __riscv_vfwsub_vv_tumu(vbool8_t vm, vfloat64m8_t vd,
                                    vfloat32m4_t vs2, vfloat32m4_t vs1,
                                    size_t vl);
vfloat64m8_t __riscv_vfwsub_vf_tumu(vbool8_t vm, vfloat64m8_t vd,
                                    vfloat32m4_t vs2, float rs1, size_t vl);
vfloat64m8_t __riscv_vfwsub_wv_tumu(vbool8_t vm, vfloat64m8_t vd,
                                    vfloat64m8_t vs2, vfloat32m4_t vs1,
                                    size_t vl);
vfloat64m8_t __riscv_vfwsub_wf_tumu(vbool8_t vm, vfloat64m8_t vd,
                                    vfloat64m8_t vs2, float rs1, size_t vl);
// masked functions (_mu: tail-agnostic, mask-undisturbed policy)
vfloat32mf2_t __riscv_vfwadd_vv_mu(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                   size_t vl);
vfloat32mf2_t __riscv_vfwadd_vf_mu(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfwadd_wv_mu(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat32mf2_t vs2, vfloat16mf4_t vs1,
                                   size_t vl);
vfloat32mf2_t __riscv_vfwadd_wf_mu(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat32mf2_t vs2, _Float16 rs1, size_t vl);
vfloat32m1_t __riscv_vfwadd_vv_mu(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                  size_t vl);
vfloat32m1_t __riscv_vfwadd_vf_mu(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat32m1_t __riscv_vfwadd_wv_mu(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat32m1_t vs2, vfloat16mf2_t vs1,
                                  size_t vl);
vfloat32m1_t __riscv_vfwadd_wf_mu(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat32m1_t vs2, _Float16 rs1, size_t vl);
vfloat32m2_t __riscv_vfwadd_vv_mu(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat16m1_t vs2, vfloat16m1_t vs1,
                                  size_t vl);
vfloat32m2_t __riscv_vfwadd_vf_mu(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat16m1_t vs2, _Float16 rs1, size_t vl);
vfloat32m2_t __riscv_vfwadd_wv_mu(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat32m2_t vs2, vfloat16m1_t vs1,
                                  size_t vl);
vfloat32m2_t __riscv_vfwadd_wf_mu(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat32m2_t vs2, _Float16 rs1, size_t vl);
vfloat32m4_t __riscv_vfwadd_vv_mu(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat16m2_t vs2, vfloat16m2_t vs1,
                                  size_t vl);
vfloat32m4_t __riscv_vfwadd_vf_mu(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat16m2_t vs2, _Float16 rs1, size_t vl);
vfloat32m4_t __riscv_vfwadd_wv_mu(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat32m4_t vs2, vfloat16m2_t vs1,
                                  size_t vl);
vfloat32m4_t __riscv_vfwadd_wf_mu(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat32m4_t vs2, _Float16 rs1, size_t vl);
vfloat32m8_t __riscv_vfwadd_vv_mu(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat16m4_t vs2, vfloat16m4_t vs1,
                                  size_t vl);
vfloat32m8_t __riscv_vfwadd_vf_mu(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat16m4_t vs2, _Float16 rs1, size_t vl);
vfloat32m8_t __riscv_vfwadd_wv_mu(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat32m8_t vs2, vfloat16m4_t vs1,
                                  size_t vl);
vfloat32m8_t __riscv_vfwadd_wf_mu(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat32m8_t vs2, _Float16 rs1, size_t vl);
vfloat64m1_t __riscv_vfwadd_vv_mu(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                  size_t vl);
vfloat64m1_t __riscv_vfwadd_vf_mu(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat64m1_t __riscv_vfwadd_wv_mu(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat64m1_t vs2, vfloat32mf2_t vs1,
                                  size_t vl);
vfloat64m1_t __riscv_vfwadd_wf_mu(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat64m1_t vs2, float rs1, size_t vl);
vfloat64m2_t __riscv_vfwadd_vv_mu(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat32m1_t vs2, vfloat32m1_t vs1,
                                  size_t vl);
vfloat64m2_t __riscv_vfwadd_vf_mu(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat32m1_t vs2, float rs1, size_t vl);
vfloat64m2_t __riscv_vfwadd_wv_mu(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat64m2_t vs2, vfloat32m1_t vs1,
                                  size_t vl);
vfloat64m2_t __riscv_vfwadd_wf_mu(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat64m2_t vs2, float rs1, size_t vl);
vfloat64m4_t __riscv_vfwadd_vv_mu(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat32m2_t vs2, vfloat32m2_t vs1,
                                  size_t vl);
vfloat64m4_t __riscv_vfwadd_vf_mu(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat32m2_t vs2, float rs1, size_t vl);
vfloat64m4_t __riscv_vfwadd_wv_mu(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat64m4_t vs2, vfloat32m2_t vs1,
                                  size_t vl);
vfloat64m4_t __riscv_vfwadd_wf_mu(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat64m4_t vs2, float rs1, size_t vl);
vfloat64m8_t __riscv_vfwadd_vv_mu(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat32m4_t vs2, vfloat32m4_t vs1,
                                  size_t vl);
vfloat64m8_t __riscv_vfwadd_vf_mu(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat32m4_t vs2, float rs1, size_t vl);
vfloat64m8_t __riscv_vfwadd_wv_mu(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat64m8_t vs2, vfloat32m4_t vs1,
                                  size_t vl);
vfloat64m8_t __riscv_vfwadd_wf_mu(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat64m8_t vs2, float rs1, size_t vl);
vfloat32mf2_t __riscv_vfwsub_vv_mu(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                   size_t vl);
// __riscv_vfwsub_*_mu, float16 sources -> float32 results. Every prototype
// takes a leading mask `vm` and a `vd` of the result type; these variants have
// no `frm` argument.
//   _vv: narrow vs2, narrow vs1      _vf: narrow vs2, scalar rs1
//   _wv: wide   vs2, narrow vs1      _wf: wide   vs2, scalar rs1
// NOTE(review): `_mu` is the mask-undisturbed policy suffix in the RVV
// intrinsics naming scheme -- confirm against the intrinsics specification.
vfloat32mf2_t __riscv_vfwsub_vf_mu(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfwsub_wv_mu(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat32mf2_t vs2, vfloat16mf4_t vs1,
                                   size_t vl);
vfloat32mf2_t __riscv_vfwsub_wf_mu(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat32mf2_t vs2, _Float16 rs1, size_t vl);
vfloat32m1_t __riscv_vfwsub_vv_mu(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                  size_t vl);
vfloat32m1_t __riscv_vfwsub_vf_mu(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat32m1_t __riscv_vfwsub_wv_mu(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat32m1_t vs2, vfloat16mf2_t vs1,
                                  size_t vl);
vfloat32m1_t __riscv_vfwsub_wf_mu(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat32m1_t vs2, _Float16 rs1, size_t vl);
vfloat32m2_t __riscv_vfwsub_vv_mu(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat16m1_t vs2, vfloat16m1_t vs1,
                                  size_t vl);
vfloat32m2_t __riscv_vfwsub_vf_mu(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat16m1_t vs2, _Float16 rs1, size_t vl);
vfloat32m2_t __riscv_vfwsub_wv_mu(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat32m2_t vs2, vfloat16m1_t vs1,
                                  size_t vl);
vfloat32m2_t __riscv_vfwsub_wf_mu(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat32m2_t vs2, _Float16 rs1, size_t vl);
vfloat32m4_t __riscv_vfwsub_vv_mu(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat16m2_t vs2, vfloat16m2_t vs1,
                                  size_t vl);
vfloat32m4_t __riscv_vfwsub_vf_mu(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat16m2_t vs2, _Float16 rs1, size_t vl);
vfloat32m4_t __riscv_vfwsub_wv_mu(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat32m4_t vs2, vfloat16m2_t vs1,
                                  size_t vl);
vfloat32m4_t __riscv_vfwsub_wf_mu(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat32m4_t vs2, _Float16 rs1, size_t vl);
vfloat32m8_t __riscv_vfwsub_vv_mu(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat16m4_t vs2, vfloat16m4_t vs1,
                                  size_t vl);
vfloat32m8_t __riscv_vfwsub_vf_mu(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat16m4_t vs2, _Float16 rs1, size_t vl);
vfloat32m8_t __riscv_vfwsub_wv_mu(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat32m8_t vs2, vfloat16m4_t vs1,
                                  size_t vl);
vfloat32m8_t __riscv_vfwsub_wf_mu(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat32m8_t vs2, _Float16 rs1, size_t vl);
// __riscv_vfwsub_*_mu, float32 sources -> float64 results. Every prototype
// takes a leading mask `vm` and a `vd` of the result type; these variants have
// no `frm` argument. The scalar forms (_vf/_wf) take `float rs1`.
//   _vv/_vf: vs2 is a narrow (float32) vector
//   _wv/_wf: vs2 is already a wide (float64) vector
vfloat64m1_t __riscv_vfwsub_vv_mu(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                  size_t vl);
vfloat64m1_t __riscv_vfwsub_vf_mu(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat64m1_t __riscv_vfwsub_wv_mu(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat64m1_t vs2, vfloat32mf2_t vs1,
                                  size_t vl);
vfloat64m1_t __riscv_vfwsub_wf_mu(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat64m1_t vs2, float rs1, size_t vl);
vfloat64m2_t __riscv_vfwsub_vv_mu(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat32m1_t vs2, vfloat32m1_t vs1,
                                  size_t vl);
vfloat64m2_t __riscv_vfwsub_vf_mu(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat32m1_t vs2, float rs1, size_t vl);
vfloat64m2_t __riscv_vfwsub_wv_mu(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat64m2_t vs2, vfloat32m1_t vs1,
                                  size_t vl);
vfloat64m2_t __riscv_vfwsub_wf_mu(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat64m2_t vs2, float rs1, size_t vl);
vfloat64m4_t __riscv_vfwsub_vv_mu(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat32m2_t vs2, vfloat32m2_t vs1,
                                  size_t vl);
vfloat64m4_t __riscv_vfwsub_vf_mu(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat32m2_t vs2, float rs1, size_t vl);
vfloat64m4_t __riscv_vfwsub_wv_mu(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat64m4_t vs2, vfloat32m2_t vs1,
                                  size_t vl);
vfloat64m4_t __riscv_vfwsub_wf_mu(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat64m4_t vs2, float rs1, size_t vl);
vfloat64m8_t __riscv_vfwsub_vv_mu(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat32m4_t vs2, vfloat32m4_t vs1,
                                  size_t vl);
vfloat64m8_t __riscv_vfwsub_vf_mu(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat32m4_t vs2, float rs1, size_t vl);
vfloat64m8_t __riscv_vfwsub_wv_mu(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat64m8_t vs2, vfloat32m4_t vs1,
                                  size_t vl);
vfloat64m8_t __riscv_vfwsub_wf_mu(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat64m8_t vs2, float rs1, size_t vl);
// __riscv_vfwadd_*_tu with an explicit `unsigned int frm` argument, float16
// sources -> float32 results. Unmasked: no `vm` parameter; `vd` has the result
// type.
//   _vv: narrow vs2, narrow vs1      _vf: narrow vs2, scalar rs1
//   _wv: wide   vs2, narrow vs1      _wf: wide   vs2, scalar rs1
// NOTE(review): `frm` is presumably the floating-point rounding mode and `_tu`
// the tail-undisturbed policy suffix -- confirm against the RVV intrinsics
// specification.
vfloat32mf2_t __riscv_vfwadd_vv_tu(vfloat32mf2_t vd, vfloat16mf4_t vs2,
                                   vfloat16mf4_t vs1, unsigned int frm,
                                   size_t vl);
vfloat32mf2_t __riscv_vfwadd_vf_tu(vfloat32mf2_t vd, vfloat16mf4_t vs2,
                                   _Float16 rs1, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwadd_wv_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                   vfloat16mf4_t vs1, unsigned int frm,
                                   size_t vl);
vfloat32mf2_t __riscv_vfwadd_wf_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                   _Float16 rs1, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwadd_vv_tu(vfloat32m1_t vd, vfloat16mf2_t vs2,
                                  vfloat16mf2_t vs1, unsigned int frm,
                                  size_t vl);
vfloat32m1_t __riscv_vfwadd_vf_tu(vfloat32m1_t vd, vfloat16mf2_t vs2,
                                  _Float16 rs1, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwadd_wv_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                  vfloat16mf2_t vs1, unsigned int frm,
                                  size_t vl);
vfloat32m1_t __riscv_vfwadd_wf_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                  _Float16 rs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwadd_vv_tu(vfloat32m2_t vd, vfloat16m1_t vs2,
                                  vfloat16m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat32m2_t __riscv_vfwadd_vf_tu(vfloat32m2_t vd, vfloat16m1_t vs2,
                                  _Float16 rs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwadd_wv_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                  vfloat16m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat32m2_t __riscv_vfwadd_wf_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                  _Float16 rs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwadd_vv_tu(vfloat32m4_t vd, vfloat16m2_t vs2,
                                  vfloat16m2_t vs1, unsigned int frm,
                                  size_t vl);
vfloat32m4_t __riscv_vfwadd_vf_tu(vfloat32m4_t vd, vfloat16m2_t vs2,
                                  _Float16 rs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwadd_wv_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                  vfloat16m2_t vs1, unsigned int frm,
                                  size_t vl);
vfloat32m4_t __riscv_vfwadd_wf_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                  _Float16 rs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwadd_vv_tu(vfloat32m8_t vd, vfloat16m4_t vs2,
                                  vfloat16m4_t vs1, unsigned int frm,
                                  size_t vl);
vfloat32m8_t __riscv_vfwadd_vf_tu(vfloat32m8_t vd, vfloat16m4_t vs2,
                                  _Float16 rs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwadd_wv_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                  vfloat16m4_t vs1, unsigned int frm,
                                  size_t vl);
vfloat32m8_t __riscv_vfwadd_wf_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                  _Float16 rs1, unsigned int frm, size_t vl);
// __riscv_vfwadd_*_tu with an explicit `unsigned int frm` argument, float32
// sources -> float64 results. Unmasked: no `vm` parameter; `vd` has the result
// type. The scalar forms (_vf/_wf) take `float rs1`.
//   _vv/_vf: vs2 is a narrow (float32) vector
//   _wv/_wf: vs2 is already a wide (float64) vector
vfloat64m1_t __riscv_vfwadd_vv_tu(vfloat64m1_t vd, vfloat32mf2_t vs2,
                                  vfloat32mf2_t vs1, unsigned int frm,
                                  size_t vl);
vfloat64m1_t __riscv_vfwadd_vf_tu(vfloat64m1_t vd, vfloat32mf2_t vs2, float rs1,
                                  unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwadd_wv_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                  vfloat32mf2_t vs1, unsigned int frm,
                                  size_t vl);
vfloat64m1_t __riscv_vfwadd_wf_tu(vfloat64m1_t vd, vfloat64m1_t vs2, float rs1,
                                  unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwadd_vv_tu(vfloat64m2_t vd, vfloat32m1_t vs2,
                                  vfloat32m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat64m2_t __riscv_vfwadd_vf_tu(vfloat64m2_t vd, vfloat32m1_t vs2, float rs1,
                                  unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwadd_wv_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                  vfloat32m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat64m2_t __riscv_vfwadd_wf_tu(vfloat64m2_t vd, vfloat64m2_t vs2, float rs1,
                                  unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwadd_vv_tu(vfloat64m4_t vd, vfloat32m2_t vs2,
                                  vfloat32m2_t vs1, unsigned int frm,
                                  size_t vl);
vfloat64m4_t __riscv_vfwadd_vf_tu(vfloat64m4_t vd, vfloat32m2_t vs2, float rs1,
                                  unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwadd_wv_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                  vfloat32m2_t vs1, unsigned int frm,
                                  size_t vl);
vfloat64m4_t __riscv_vfwadd_wf_tu(vfloat64m4_t vd, vfloat64m4_t vs2, float rs1,
                                  unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwadd_vv_tu(vfloat64m8_t vd, vfloat32m4_t vs2,
                                  vfloat32m4_t vs1, unsigned int frm,
                                  size_t vl);
vfloat64m8_t __riscv_vfwadd_vf_tu(vfloat64m8_t vd, vfloat32m4_t vs2, float rs1,
                                  unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwadd_wv_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                  vfloat32m4_t vs1, unsigned int frm,
                                  size_t vl);
vfloat64m8_t __riscv_vfwadd_wf_tu(vfloat64m8_t vd, vfloat64m8_t vs2, float rs1,
                                  unsigned int frm, size_t vl);
// __riscv_vfwsub_*_tu with an explicit `unsigned int frm` argument, float16
// sources -> float32 results. Unmasked: no `vm` parameter; `vd` has the result
// type.
//   _vv: narrow vs2, narrow vs1      _vf: narrow vs2, scalar rs1
//   _wv: wide   vs2, narrow vs1      _wf: wide   vs2, scalar rs1
// NOTE(review): `frm` is presumably the floating-point rounding mode and `_tu`
// the tail-undisturbed policy suffix -- confirm against the RVV intrinsics
// specification.
vfloat32mf2_t __riscv_vfwsub_vv_tu(vfloat32mf2_t vd, vfloat16mf4_t vs2,
                                   vfloat16mf4_t vs1, unsigned int frm,
                                   size_t vl);
vfloat32mf2_t __riscv_vfwsub_vf_tu(vfloat32mf2_t vd, vfloat16mf4_t vs2,
                                   _Float16 rs1, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwsub_wv_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                   vfloat16mf4_t vs1, unsigned int frm,
                                   size_t vl);
vfloat32mf2_t __riscv_vfwsub_wf_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                   _Float16 rs1, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwsub_vv_tu(vfloat32m1_t vd, vfloat16mf2_t vs2,
                                  vfloat16mf2_t vs1, unsigned int frm,
                                  size_t vl);
vfloat32m1_t __riscv_vfwsub_vf_tu(vfloat32m1_t vd, vfloat16mf2_t vs2,
                                  _Float16 rs1, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwsub_wv_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                  vfloat16mf2_t vs1, unsigned int frm,
                                  size_t vl);
vfloat32m1_t __riscv_vfwsub_wf_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                  _Float16 rs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwsub_vv_tu(vfloat32m2_t vd, vfloat16m1_t vs2,
                                  vfloat16m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat32m2_t __riscv_vfwsub_vf_tu(vfloat32m2_t vd, vfloat16m1_t vs2,
                                  _Float16 rs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwsub_wv_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                  vfloat16m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat32m2_t __riscv_vfwsub_wf_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                  _Float16 rs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwsub_vv_tu(vfloat32m4_t vd, vfloat16m2_t vs2,
                                  vfloat16m2_t vs1, unsigned int frm,
                                  size_t vl);
vfloat32m4_t __riscv_vfwsub_vf_tu(vfloat32m4_t vd, vfloat16m2_t vs2,
                                  _Float16 rs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwsub_wv_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                  vfloat16m2_t vs1, unsigned int frm,
                                  size_t vl);
vfloat32m4_t __riscv_vfwsub_wf_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                  _Float16 rs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwsub_vv_tu(vfloat32m8_t vd, vfloat16m4_t vs2,
                                  vfloat16m4_t vs1, unsigned int frm,
                                  size_t vl);
vfloat32m8_t __riscv_vfwsub_vf_tu(vfloat32m8_t vd, vfloat16m4_t vs2,
                                  _Float16 rs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwsub_wv_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                  vfloat16m4_t vs1, unsigned int frm,
                                  size_t vl);
vfloat32m8_t __riscv_vfwsub_wf_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                  _Float16 rs1, unsigned int frm, size_t vl);
// __riscv_vfwsub_*_tu with an explicit `unsigned int frm` argument, float32
// sources -> float64 results. Unmasked: no `vm` parameter; `vd` has the result
// type. The scalar forms (_vf/_wf) take `float rs1`.
//   _vv/_vf: vs2 is a narrow (float32) vector
//   _wv/_wf: vs2 is already a wide (float64) vector
vfloat64m1_t __riscv_vfwsub_vv_tu(vfloat64m1_t vd, vfloat32mf2_t vs2,
                                  vfloat32mf2_t vs1, unsigned int frm,
                                  size_t vl);
vfloat64m1_t __riscv_vfwsub_vf_tu(vfloat64m1_t vd, vfloat32mf2_t vs2, float rs1,
                                  unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwsub_wv_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                  vfloat32mf2_t vs1, unsigned int frm,
                                  size_t vl);
vfloat64m1_t __riscv_vfwsub_wf_tu(vfloat64m1_t vd, vfloat64m1_t vs2, float rs1,
                                  unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwsub_vv_tu(vfloat64m2_t vd, vfloat32m1_t vs2,
                                  vfloat32m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat64m2_t __riscv_vfwsub_vf_tu(vfloat64m2_t vd, vfloat32m1_t vs2, float rs1,
                                  unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwsub_wv_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                  vfloat32m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat64m2_t __riscv_vfwsub_wf_tu(vfloat64m2_t vd, vfloat64m2_t vs2, float rs1,
                                  unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwsub_vv_tu(vfloat64m4_t vd, vfloat32m2_t vs2,
                                  vfloat32m2_t vs1, unsigned int frm,
                                  size_t vl);
vfloat64m4_t __riscv_vfwsub_vf_tu(vfloat64m4_t vd, vfloat32m2_t vs2, float rs1,
                                  unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwsub_wv_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                  vfloat32m2_t vs1, unsigned int frm,
                                  size_t vl);
vfloat64m4_t __riscv_vfwsub_wf_tu(vfloat64m4_t vd, vfloat64m4_t vs2, float rs1,
                                  unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwsub_vv_tu(vfloat64m8_t vd, vfloat32m4_t vs2,
                                  vfloat32m4_t vs1, unsigned int frm,
                                  size_t vl);
vfloat64m8_t __riscv_vfwsub_vf_tu(vfloat64m8_t vd, vfloat32m4_t vs2, float rs1,
                                  unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwsub_wv_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                  vfloat32m4_t vs1, unsigned int frm,
                                  size_t vl);
vfloat64m8_t __riscv_vfwsub_wf_tu(vfloat64m8_t vd, vfloat64m8_t vs2, float rs1,
                                  unsigned int frm, size_t vl);
// masked functions: _tum variants (each takes a leading `vm` mask operand)
// __riscv_vfwadd_*_tum with an explicit `unsigned int frm` argument, float16
// sources -> float32 results. Every prototype takes a leading mask `vm` and a
// `vd` of the result type.
//   _vv: narrow vs2, narrow vs1      _vf: narrow vs2, scalar rs1
//   _wv: wide   vs2, narrow vs1      _wf: wide   vs2, scalar rs1
// NOTE(review): `_tum` is presumably the tail-undisturbed / mask-agnostic
// policy suffix and `frm` the rounding mode -- confirm against the RVV
// intrinsics specification.
vfloat32mf2_t __riscv_vfwadd_vv_tum(vbool64_t vm, vfloat32mf2_t vd,
                                    vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                    unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwadd_vf_tum(vbool64_t vm, vfloat32mf2_t vd,
                                    vfloat16mf4_t vs2, _Float16 rs1,
                                    unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwadd_wv_tum(vbool64_t vm, vfloat32mf2_t vd,
                                    vfloat32mf2_t vs2, vfloat16mf4_t vs1,
                                    unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwadd_wf_tum(vbool64_t vm, vfloat32mf2_t vd,
                                    vfloat32mf2_t vs2, _Float16 rs1,
                                    unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwadd_vv_tum(vbool32_t vm, vfloat32m1_t vd,
                                   vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwadd_vf_tum(vbool32_t vm, vfloat32m1_t vd,
                                   vfloat16mf2_t vs2, _Float16 rs1,
                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwadd_wv_tum(vbool32_t vm, vfloat32m1_t vd,
                                   vfloat32m1_t vs2, vfloat16mf2_t vs1,
                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwadd_wf_tum(vbool32_t vm, vfloat32m1_t vd,
                                   vfloat32m1_t vs2, _Float16 rs1,
                                   unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwadd_vv_tum(vbool16_t vm, vfloat32m2_t vd,
                                   vfloat16m1_t vs2, vfloat16m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwadd_vf_tum(vbool16_t vm, vfloat32m2_t vd,
                                   vfloat16m1_t vs2, _Float16 rs1,
                                   unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwadd_wv_tum(vbool16_t vm, vfloat32m2_t vd,
                                   vfloat32m2_t vs2, vfloat16m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwadd_wf_tum(vbool16_t vm, vfloat32m2_t vd,
                                   vfloat32m2_t vs2, _Float16 rs1,
                                   unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwadd_vv_tum(vbool8_t vm, vfloat32m4_t vd,
                                   vfloat16m2_t vs2, vfloat16m2_t vs1,
                                   unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwadd_vf_tum(vbool8_t vm, vfloat32m4_t vd,
                                   vfloat16m2_t vs2, _Float16 rs1,
                                   unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwadd_wv_tum(vbool8_t vm, vfloat32m4_t vd,
                                   vfloat32m4_t vs2, vfloat16m2_t vs1,
                                   unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwadd_wf_tum(vbool8_t vm, vfloat32m4_t vd,
                                   vfloat32m4_t vs2, _Float16 rs1,
                                   unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwadd_vv_tum(vbool4_t vm, vfloat32m8_t vd,
                                   vfloat16m4_t vs2, vfloat16m4_t vs1,
                                   unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwadd_vf_tum(vbool4_t vm, vfloat32m8_t vd,
                                   vfloat16m4_t vs2, _Float16 rs1,
                                   unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwadd_wv_tum(vbool4_t vm, vfloat32m8_t vd,
                                   vfloat32m8_t vs2, vfloat16m4_t vs1,
                                   unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwadd_wf_tum(vbool4_t vm, vfloat32m8_t vd,
                                   vfloat32m8_t vs2, _Float16 rs1,
                                   unsigned int frm, size_t vl);
// __riscv_vfwadd_*_tum with an explicit `unsigned int frm` argument, float32
// sources -> float64 results. Every prototype takes a leading mask `vm` and a
// `vd` of the result type. The scalar forms (_vf/_wf) take `float rs1`.
//   _vv/_vf: vs2 is a narrow (float32) vector
//   _wv/_wf: vs2 is already a wide (float64) vector
vfloat64m1_t __riscv_vfwadd_vv_tum(vbool64_t vm, vfloat64m1_t vd,
                                   vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                   unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwadd_vf_tum(vbool64_t vm, vfloat64m1_t vd,
                                   vfloat32mf2_t vs2, float rs1,
                                   unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwadd_wv_tum(vbool64_t vm, vfloat64m1_t vd,
                                   vfloat64m1_t vs2, vfloat32mf2_t vs1,
                                   unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwadd_wf_tum(vbool64_t vm, vfloat64m1_t vd,
                                   vfloat64m1_t vs2, float rs1,
                                   unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwadd_vv_tum(vbool32_t vm, vfloat64m2_t vd,
                                   vfloat32m1_t vs2, vfloat32m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwadd_vf_tum(vbool32_t vm, vfloat64m2_t vd,
                                   vfloat32m1_t vs2, float rs1,
                                   unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwadd_wv_tum(vbool32_t vm, vfloat64m2_t vd,
                                   vfloat64m2_t vs2, vfloat32m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwadd_wf_tum(vbool32_t vm, vfloat64m2_t vd,
                                   vfloat64m2_t vs2, float rs1,
                                   unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwadd_vv_tum(vbool16_t vm, vfloat64m4_t vd,
                                   vfloat32m2_t vs2, vfloat32m2_t vs1,
                                   unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwadd_vf_tum(vbool16_t vm, vfloat64m4_t vd,
                                   vfloat32m2_t vs2, float rs1,
                                   unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwadd_wv_tum(vbool16_t vm, vfloat64m4_t vd,
                                   vfloat64m4_t vs2, vfloat32m2_t vs1,
                                   unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwadd_wf_tum(vbool16_t vm, vfloat64m4_t vd,
                                   vfloat64m4_t vs2, float rs1,
                                   unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwadd_vv_tum(vbool8_t vm, vfloat64m8_t vd,
                                   vfloat32m4_t vs2, vfloat32m4_t vs1,
                                   unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwadd_vf_tum(vbool8_t vm, vfloat64m8_t vd,
                                   vfloat32m4_t vs2, float rs1,
                                   unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwadd_wv_tum(vbool8_t vm, vfloat64m8_t vd,
                                   vfloat64m8_t vs2, vfloat32m4_t vs1,
                                   unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwadd_wf_tum(vbool8_t vm, vfloat64m8_t vd,
                                   vfloat64m8_t vs2, float rs1,
                                   unsigned int frm, size_t vl);
// __riscv_vfwsub_*_tum with an explicit `unsigned int frm` argument, float16
// sources -> float32 results. Every prototype takes a leading mask `vm` and a
// `vd` of the result type.
//   _vv: narrow vs2, narrow vs1      _vf: narrow vs2, scalar rs1
//   _wv: wide   vs2, narrow vs1      _wf: wide   vs2, scalar rs1
// NOTE(review): `_tum` is presumably the tail-undisturbed / mask-agnostic
// policy suffix and `frm` the rounding mode -- confirm against the RVV
// intrinsics specification.
vfloat32mf2_t __riscv_vfwsub_vv_tum(vbool64_t vm, vfloat32mf2_t vd,
                                    vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                    unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwsub_vf_tum(vbool64_t vm, vfloat32mf2_t vd,
                                    vfloat16mf4_t vs2, _Float16 rs1,
                                    unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwsub_wv_tum(vbool64_t vm, vfloat32mf2_t vd,
                                    vfloat32mf2_t vs2, vfloat16mf4_t vs1,
                                    unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwsub_wf_tum(vbool64_t vm, vfloat32mf2_t vd,
                                    vfloat32mf2_t vs2, _Float16 rs1,
                                    unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwsub_vv_tum(vbool32_t vm, vfloat32m1_t vd,
                                   vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwsub_vf_tum(vbool32_t vm, vfloat32m1_t vd,
                                   vfloat16mf2_t vs2, _Float16 rs1,
                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwsub_wv_tum(vbool32_t vm, vfloat32m1_t vd,
                                   vfloat32m1_t vs2, vfloat16mf2_t vs1,
                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwsub_wf_tum(vbool32_t vm, vfloat32m1_t vd,
                                   vfloat32m1_t vs2, _Float16 rs1,
                                   unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwsub_vv_tum(vbool16_t vm, vfloat32m2_t vd,
                                   vfloat16m1_t vs2, vfloat16m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwsub_vf_tum(vbool16_t vm, vfloat32m2_t vd,
                                   vfloat16m1_t vs2, _Float16 rs1,
                                   unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwsub_wv_tum(vbool16_t vm, vfloat32m2_t vd,
                                   vfloat32m2_t vs2, vfloat16m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwsub_wf_tum(vbool16_t vm, vfloat32m2_t vd,
                                   vfloat32m2_t vs2, _Float16 rs1,
                                   unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwsub_vv_tum(vbool8_t vm, vfloat32m4_t vd,
                                   vfloat16m2_t vs2, vfloat16m2_t vs1,
                                   unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwsub_vf_tum(vbool8_t vm, vfloat32m4_t vd,
                                   vfloat16m2_t vs2, _Float16 rs1,
                                   unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwsub_wv_tum(vbool8_t vm, vfloat32m4_t vd,
                                   vfloat32m4_t vs2, vfloat16m2_t vs1,
                                   unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwsub_wf_tum(vbool8_t vm, vfloat32m4_t vd,
                                   vfloat32m4_t vs2, _Float16 rs1,
                                   unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwsub_vv_tum(vbool4_t vm, vfloat32m8_t vd,
                                   vfloat16m4_t vs2, vfloat16m4_t vs1,
                                   unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwsub_vf_tum(vbool4_t vm, vfloat32m8_t vd,
                                   vfloat16m4_t vs2, _Float16 rs1,
                                   unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwsub_wv_tum(vbool4_t vm, vfloat32m8_t vd,
                                   vfloat32m8_t vs2, vfloat16m4_t vs1,
                                   unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwsub_wf_tum(vbool4_t vm, vfloat32m8_t vd,
                                   vfloat32m8_t vs2, _Float16 rs1,
                                   unsigned int frm, size_t vl);
// __riscv_vfwsub_*_tum with an explicit `unsigned int frm` argument, float32
// sources -> float64 results. Every prototype takes a leading mask `vm` and a
// `vd` of the result type. The scalar forms (_vf/_wf) take `float rs1`.
//   _vv/_vf: vs2 is a narrow (float32) vector
//   _wv/_wf: vs2 is already a wide (float64) vector
vfloat64m1_t __riscv_vfwsub_vv_tum(vbool64_t vm, vfloat64m1_t vd,
                                   vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                   unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwsub_vf_tum(vbool64_t vm, vfloat64m1_t vd,
                                   vfloat32mf2_t vs2, float rs1,
                                   unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwsub_wv_tum(vbool64_t vm, vfloat64m1_t vd,
                                   vfloat64m1_t vs2, vfloat32mf2_t vs1,
                                   unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwsub_wf_tum(vbool64_t vm, vfloat64m1_t vd,
                                   vfloat64m1_t vs2, float rs1,
                                   unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwsub_vv_tum(vbool32_t vm, vfloat64m2_t vd,
                                   vfloat32m1_t vs2, vfloat32m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwsub_vf_tum(vbool32_t vm, vfloat64m2_t vd,
                                   vfloat32m1_t vs2, float rs1,
                                   unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwsub_wv_tum(vbool32_t vm, vfloat64m2_t vd,
                                   vfloat64m2_t vs2, vfloat32m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwsub_wf_tum(vbool32_t vm, vfloat64m2_t vd,
                                   vfloat64m2_t vs2, float rs1,
                                   unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwsub_vv_tum(vbool16_t vm, vfloat64m4_t vd,
                                   vfloat32m2_t vs2, vfloat32m2_t vs1,
                                   unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwsub_vf_tum(vbool16_t vm, vfloat64m4_t vd,
                                   vfloat32m2_t vs2, float rs1,
                                   unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwsub_wv_tum(vbool16_t vm, vfloat64m4_t vd,
                                   vfloat64m4_t vs2, vfloat32m2_t vs1,
                                   unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwsub_wf_tum(vbool16_t vm, vfloat64m4_t vd,
                                   vfloat64m4_t vs2, float rs1,
                                   unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwsub_vv_tum(vbool8_t vm, vfloat64m8_t vd,
                                   vfloat32m4_t vs2, vfloat32m4_t vs1,
                                   unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwsub_vf_tum(vbool8_t vm, vfloat64m8_t vd,
                                   vfloat32m4_t vs2, float rs1,
                                   unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwsub_wv_tum(vbool8_t vm, vfloat64m8_t vd,
                                   vfloat64m8_t vs2, vfloat32m4_t vs1,
                                   unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwsub_wf_tum(vbool8_t vm, vfloat64m8_t vd,
                                   vfloat64m8_t vs2, float rs1,
                                   unsigned int frm, size_t vl);
// masked functions, _tumu policy (tail undisturbed, mask undisturbed)
vfloat32mf2_t __riscv_vfwadd_vv_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                     vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                     unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwadd_vf_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                     vfloat16mf4_t vs2, _Float16 rs1,
                                     unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwadd_wv_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                     vfloat32mf2_t vs2, vfloat16mf4_t vs1,
                                     unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwadd_wf_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                     vfloat32mf2_t vs2, _Float16 rs1,
                                     unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwadd_vv_tumu(vbool32_t vm, vfloat32m1_t vd,
                                    vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                    unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwadd_vf_tumu(vbool32_t vm, vfloat32m1_t vd,
                                    vfloat16mf2_t vs2, _Float16 rs1,
                                    unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwadd_wv_tumu(vbool32_t vm, vfloat32m1_t vd,
                                    vfloat32m1_t vs2, vfloat16mf2_t vs1,
                                    unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwadd_wf_tumu(vbool32_t vm, vfloat32m1_t vd,
                                    vfloat32m1_t vs2, _Float16 rs1,
                                    unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwadd_vv_tumu(vbool16_t vm, vfloat32m2_t vd,
                                    vfloat16m1_t vs2, vfloat16m1_t vs1,
                                    unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwadd_vf_tumu(vbool16_t vm, vfloat32m2_t vd,
                                    vfloat16m1_t vs2, _Float16 rs1,
                                    unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwadd_wv_tumu(vbool16_t vm, vfloat32m2_t vd,
                                    vfloat32m2_t vs2, vfloat16m1_t vs1,
                                    unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwadd_wf_tumu(vbool16_t vm, vfloat32m2_t vd,
                                    vfloat32m2_t vs2, _Float16 rs1,
                                    unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwadd_vv_tumu(vbool8_t vm, vfloat32m4_t vd,
                                    vfloat16m2_t vs2, vfloat16m2_t vs1,
                                    unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwadd_vf_tumu(vbool8_t vm, vfloat32m4_t vd,
                                    vfloat16m2_t vs2, _Float16 rs1,
                                    unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwadd_wv_tumu(vbool8_t vm, vfloat32m4_t vd,
                                    vfloat32m4_t vs2, vfloat16m2_t vs1,
                                    unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwadd_wf_tumu(vbool8_t vm, vfloat32m4_t vd,
                                    vfloat32m4_t vs2, _Float16 rs1,
                                    unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwadd_vv_tumu(vbool4_t vm, vfloat32m8_t vd,
                                    vfloat16m4_t vs2, vfloat16m4_t vs1,
                                    unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwadd_vf_tumu(vbool4_t vm, vfloat32m8_t vd,
                                    vfloat16m4_t vs2, _Float16 rs1,
                                    unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwadd_wv_tumu(vbool4_t vm, vfloat32m8_t vd,
                                    vfloat32m8_t vs2, vfloat16m4_t vs1,
                                    unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwadd_wf_tumu(vbool4_t vm, vfloat32m8_t vd,
                                    vfloat32m8_t vs2, _Float16 rs1,
                                    unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwadd_vv_tumu(vbool64_t vm, vfloat64m1_t vd,
                                    vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                    unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwadd_vf_tumu(vbool64_t vm, vfloat64m1_t vd,
                                    vfloat32mf2_t vs2, float rs1,
                                    unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwadd_wv_tumu(vbool64_t vm, vfloat64m1_t vd,
                                    vfloat64m1_t vs2, vfloat32mf2_t vs1,
                                    unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwadd_wf_tumu(vbool64_t vm, vfloat64m1_t vd,
                                    vfloat64m1_t vs2, float rs1,
                                    unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwadd_vv_tumu(vbool32_t vm, vfloat64m2_t vd,
                                    vfloat32m1_t vs2, vfloat32m1_t vs1,
                                    unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwadd_vf_tumu(vbool32_t vm, vfloat64m2_t vd,
                                    vfloat32m1_t vs2, float rs1,
                                    unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwadd_wv_tumu(vbool32_t vm, vfloat64m2_t vd,
                                    vfloat64m2_t vs2, vfloat32m1_t vs1,
                                    unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwadd_wf_tumu(vbool32_t vm, vfloat64m2_t vd,
                                    vfloat64m2_t vs2, float rs1,
                                    unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwadd_vv_tumu(vbool16_t vm, vfloat64m4_t vd,
                                    vfloat32m2_t vs2, vfloat32m2_t vs1,
                                    unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwadd_vf_tumu(vbool16_t vm, vfloat64m4_t vd,
                                    vfloat32m2_t vs2, float rs1,
                                    unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwadd_wv_tumu(vbool16_t vm, vfloat64m4_t vd,
                                    vfloat64m4_t vs2, vfloat32m2_t vs1,
                                    unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwadd_wf_tumu(vbool16_t vm, vfloat64m4_t vd,
                                    vfloat64m4_t vs2, float rs1,
                                    unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwadd_vv_tumu(vbool8_t vm, vfloat64m8_t vd,
                                    vfloat32m4_t vs2, vfloat32m4_t vs1,
                                    unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwadd_vf_tumu(vbool8_t vm, vfloat64m8_t vd,
                                    vfloat32m4_t vs2, float rs1,
                                    unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwadd_wv_tumu(vbool8_t vm, vfloat64m8_t vd,
                                    vfloat64m8_t vs2, vfloat32m4_t vs1,
                                    unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwadd_wf_tumu(vbool8_t vm, vfloat64m8_t vd,
                                    vfloat64m8_t vs2, float rs1,
                                    unsigned int frm, size_t vl);
// vfwsub, _tumu overloads. The _vv/_vf forms take vs2 at half the result's
// element width; the _wv/_wf forms take vs2 already in the result type.
// Every overload takes a mask (vm), a vd operand of the result type, an
// explicit frm argument and vl.
vfloat32mf2_t __riscv_vfwsub_vv_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                     vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                     unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwsub_vf_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                     vfloat16mf4_t vs2, _Float16 rs1,
                                     unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwsub_wv_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                     vfloat32mf2_t vs2, vfloat16mf4_t vs1,
                                     unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwsub_wf_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                     vfloat32mf2_t vs2, _Float16 rs1,
                                     unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwsub_vv_tumu(vbool32_t vm, vfloat32m1_t vd,
                                    vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                    unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwsub_vf_tumu(vbool32_t vm, vfloat32m1_t vd,
                                    vfloat16mf2_t vs2, _Float16 rs1,
                                    unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwsub_wv_tumu(vbool32_t vm, vfloat32m1_t vd,
                                    vfloat32m1_t vs2, vfloat16mf2_t vs1,
                                    unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwsub_wf_tumu(vbool32_t vm, vfloat32m1_t vd,
                                    vfloat32m1_t vs2, _Float16 rs1,
                                    unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwsub_vv_tumu(vbool16_t vm, vfloat32m2_t vd,
                                    vfloat16m1_t vs2, vfloat16m1_t vs1,
                                    unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwsub_vf_tumu(vbool16_t vm, vfloat32m2_t vd,
                                    vfloat16m1_t vs2, _Float16 rs1,
                                    unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwsub_wv_tumu(vbool16_t vm, vfloat32m2_t vd,
                                    vfloat32m2_t vs2, vfloat16m1_t vs1,
                                    unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwsub_wf_tumu(vbool16_t vm, vfloat32m2_t vd,
                                    vfloat32m2_t vs2, _Float16 rs1,
                                    unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwsub_vv_tumu(vbool8_t vm, vfloat32m4_t vd,
                                    vfloat16m2_t vs2, vfloat16m2_t vs1,
                                    unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwsub_vf_tumu(vbool8_t vm, vfloat32m4_t vd,
                                    vfloat16m2_t vs2, _Float16 rs1,
                                    unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwsub_wv_tumu(vbool8_t vm, vfloat32m4_t vd,
                                    vfloat32m4_t vs2, vfloat16m2_t vs1,
                                    unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwsub_wf_tumu(vbool8_t vm, vfloat32m4_t vd,
                                    vfloat32m4_t vs2, _Float16 rs1,
                                    unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwsub_vv_tumu(vbool4_t vm, vfloat32m8_t vd,
                                    vfloat16m4_t vs2, vfloat16m4_t vs1,
                                    unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwsub_vf_tumu(vbool4_t vm, vfloat32m8_t vd,
                                    vfloat16m4_t vs2, _Float16 rs1,
                                    unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwsub_wv_tumu(vbool4_t vm, vfloat32m8_t vd,
                                    vfloat32m8_t vs2, vfloat16m4_t vs1,
                                    unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwsub_wf_tumu(vbool4_t vm, vfloat32m8_t vd,
                                    vfloat32m8_t vs2, _Float16 rs1,
                                    unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwsub_vv_tumu(vbool64_t vm, vfloat64m1_t vd,
                                    vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                    unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwsub_vf_tumu(vbool64_t vm, vfloat64m1_t vd,
                                    vfloat32mf2_t vs2, float rs1,
                                    unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwsub_wv_tumu(vbool64_t vm, vfloat64m1_t vd,
                                    vfloat64m1_t vs2, vfloat32mf2_t vs1,
                                    unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwsub_wf_tumu(vbool64_t vm, vfloat64m1_t vd,
                                    vfloat64m1_t vs2, float rs1,
                                    unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwsub_vv_tumu(vbool32_t vm, vfloat64m2_t vd,
                                    vfloat32m1_t vs2, vfloat32m1_t vs1,
                                    unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwsub_vf_tumu(vbool32_t vm, vfloat64m2_t vd,
                                    vfloat32m1_t vs2, float rs1,
                                    unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwsub_wv_tumu(vbool32_t vm, vfloat64m2_t vd,
                                    vfloat64m2_t vs2, vfloat32m1_t vs1,
                                    unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwsub_wf_tumu(vbool32_t vm, vfloat64m2_t vd,
                                    vfloat64m2_t vs2, float rs1,
                                    unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwsub_vv_tumu(vbool16_t vm, vfloat64m4_t vd,
                                    vfloat32m2_t vs2, vfloat32m2_t vs1,
                                    unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwsub_vf_tumu(vbool16_t vm, vfloat64m4_t vd,
                                    vfloat32m2_t vs2, float rs1,
                                    unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwsub_wv_tumu(vbool16_t vm, vfloat64m4_t vd,
                                    vfloat64m4_t vs2, vfloat32m2_t vs1,
                                    unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwsub_wf_tumu(vbool16_t vm, vfloat64m4_t vd,
                                    vfloat64m4_t vs2, float rs1,
                                    unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwsub_vv_tumu(vbool8_t vm, vfloat64m8_t vd,
                                    vfloat32m4_t vs2, vfloat32m4_t vs1,
                                    unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwsub_vf_tumu(vbool8_t vm, vfloat64m8_t vd,
                                    vfloat32m4_t vs2, float rs1,
                                    unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwsub_wv_tumu(vbool8_t vm, vfloat64m8_t vd,
                                    vfloat64m8_t vs2, vfloat32m4_t vs1,
                                    unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwsub_wf_tumu(vbool8_t vm, vfloat64m8_t vd,
                                    vfloat64m8_t vs2, float rs1,
                                    unsigned int frm, size_t vl);
// masked functions, _mu policy (tail agnostic, mask undisturbed)
vfloat32mf2_t __riscv_vfwadd_vv_mu(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                   unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwadd_vf_mu(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat16mf4_t vs2, _Float16 rs1,
                                   unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwadd_wv_mu(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat32mf2_t vs2, vfloat16mf4_t vs1,
                                   unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwadd_wf_mu(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat32mf2_t vs2, _Float16 rs1,
                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwadd_vv_mu(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwadd_vf_mu(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat16mf2_t vs2, _Float16 rs1,
                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwadd_wv_mu(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat32m1_t vs2, vfloat16mf2_t vs1,
                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwadd_wf_mu(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat32m1_t vs2, _Float16 rs1,
                                  unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwadd_vv_mu(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat16m1_t vs2, vfloat16m1_t vs1,
                                  unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwadd_vf_mu(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat16m1_t vs2, _Float16 rs1,
                                  unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwadd_wv_mu(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat32m2_t vs2, vfloat16m1_t vs1,
                                  unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwadd_wf_mu(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat32m2_t vs2, _Float16 rs1,
                                  unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwadd_vv_mu(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat16m2_t vs2, vfloat16m2_t vs1,
                                  unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwadd_vf_mu(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat16m2_t vs2, _Float16 rs1,
                                  unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwadd_wv_mu(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat32m4_t vs2, vfloat16m2_t vs1,
                                  unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwadd_wf_mu(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat32m4_t vs2, _Float16 rs1,
                                  unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwadd_vv_mu(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat16m4_t vs2, vfloat16m4_t vs1,
                                  unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwadd_vf_mu(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat16m4_t vs2, _Float16 rs1,
                                  unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwadd_wv_mu(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat32m8_t vs2, vfloat16m4_t vs1,
                                  unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwadd_wf_mu(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat32m8_t vs2, _Float16 rs1,
                                  unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwadd_vv_mu(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                  unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwadd_vf_mu(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat32mf2_t vs2, float rs1,
                                  unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwadd_wv_mu(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat64m1_t vs2, vfloat32mf2_t vs1,
                                  unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwadd_wf_mu(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat64m1_t vs2, float rs1, unsigned int frm,
                                  size_t vl);
vfloat64m2_t __riscv_vfwadd_vv_mu(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat32m1_t vs2, vfloat32m1_t vs1,
                                  unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwadd_vf_mu(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat32m1_t vs2, float rs1, unsigned int frm,
                                  size_t vl);
vfloat64m2_t __riscv_vfwadd_wv_mu(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat64m2_t vs2, vfloat32m1_t vs1,
                                  unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwadd_wf_mu(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat64m2_t vs2, float rs1, unsigned int frm,
                                  size_t vl);
vfloat64m4_t __riscv_vfwadd_vv_mu(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat32m2_t vs2, vfloat32m2_t vs1,
                                  unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwadd_vf_mu(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat32m2_t vs2, float rs1, unsigned int frm,
                                  size_t vl);
vfloat64m4_t __riscv_vfwadd_wv_mu(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat64m4_t vs2, vfloat32m2_t vs1,
                                  unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwadd_wf_mu(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat64m4_t vs2, float rs1, unsigned int frm,
                                  size_t vl);
vfloat64m8_t __riscv_vfwadd_vv_mu(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat32m4_t vs2, vfloat32m4_t vs1,
                                  unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwadd_vf_mu(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat32m4_t vs2, float rs1, unsigned int frm,
                                  size_t vl);
vfloat64m8_t __riscv_vfwadd_wv_mu(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat64m8_t vs2, vfloat32m4_t vs1,
                                  unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwadd_wf_mu(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat64m8_t vs2, float rs1, unsigned int frm,
                                  size_t vl);
// vfwsub, _mu overloads. The _vv/_vf forms take vs2 at half the result's
// element width; the _wv/_wf forms take vs2 already in the result type.
// Every overload takes a mask (vm), a vd operand of the result type, an
// explicit frm argument and vl.
vfloat32mf2_t __riscv_vfwsub_vv_mu(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                   unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwsub_vf_mu(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat16mf4_t vs2, _Float16 rs1,
                                   unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwsub_wv_mu(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat32mf2_t vs2, vfloat16mf4_t vs1,
                                   unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwsub_wf_mu(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat32mf2_t vs2, _Float16 rs1,
                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwsub_vv_mu(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwsub_vf_mu(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat16mf2_t vs2, _Float16 rs1,
                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwsub_wv_mu(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat32m1_t vs2, vfloat16mf2_t vs1,
                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwsub_wf_mu(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat32m1_t vs2, _Float16 rs1,
                                  unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwsub_vv_mu(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat16m1_t vs2, vfloat16m1_t vs1,
                                  unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwsub_vf_mu(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat16m1_t vs2, _Float16 rs1,
                                  unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwsub_wv_mu(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat32m2_t vs2, vfloat16m1_t vs1,
                                  unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwsub_wf_mu(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat32m2_t vs2, _Float16 rs1,
                                  unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwsub_vv_mu(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat16m2_t vs2, vfloat16m2_t vs1,
                                  unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwsub_vf_mu(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat16m2_t vs2, _Float16 rs1,
                                  unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwsub_wv_mu(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat32m4_t vs2, vfloat16m2_t vs1,
                                  unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwsub_wf_mu(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat32m4_t vs2, _Float16 rs1,
                                  unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwsub_vv_mu(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat16m4_t vs2, vfloat16m4_t vs1,
                                  unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwsub_vf_mu(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat16m4_t vs2, _Float16 rs1,
                                  unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwsub_wv_mu(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat32m8_t vs2, vfloat16m4_t vs1,
                                  unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwsub_wf_mu(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat32m8_t vs2, _Float16 rs1,
                                  unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwsub_vv_mu(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                  unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwsub_vf_mu(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat32mf2_t vs2, float rs1,
                                  unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwsub_wv_mu(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat64m1_t vs2, vfloat32mf2_t vs1,
                                  unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwsub_wf_mu(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat64m1_t vs2, float rs1, unsigned int frm,
                                  size_t vl);
vfloat64m2_t __riscv_vfwsub_vv_mu(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat32m1_t vs2, vfloat32m1_t vs1,
                                  unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwsub_vf_mu(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat32m1_t vs2, float rs1, unsigned int frm,
                                  size_t vl);
vfloat64m2_t __riscv_vfwsub_wv_mu(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat64m2_t vs2, vfloat32m1_t vs1,
                                  unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwsub_wf_mu(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat64m2_t vs2, float rs1, unsigned int frm,
                                  size_t vl);
vfloat64m4_t __riscv_vfwsub_vv_mu(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat32m2_t vs2, vfloat32m2_t vs1,
                                  unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwsub_vf_mu(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat32m2_t vs2, float rs1, unsigned int frm,
                                  size_t vl);
vfloat64m4_t __riscv_vfwsub_wv_mu(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat64m4_t vs2, vfloat32m2_t vs1,
                                  unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwsub_wf_mu(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat64m4_t vs2, float rs1, unsigned int frm,
                                  size_t vl);
vfloat64m8_t __riscv_vfwsub_vv_mu(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat32m4_t vs2, vfloat32m4_t vs1,
                                  unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwsub_vf_mu(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat32m4_t vs2, float rs1, unsigned int frm,
                                  size_t vl);
vfloat64m8_t __riscv_vfwsub_wv_mu(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat64m8_t vs2, vfloat32m4_t vs1,
                                  unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwsub_wf_mu(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat64m8_t vs2, float rs1, unsigned int frm,
                                  size_t vl);

Vector Single-Width Floating-Point Multiply/Divide Intrinsics

// vfmul, _tu overloads: no vm mask operand and no frm argument in this group.
// The same name is declared twice per vector type: once with a vector second
// source (vs1) and once with a scalar second source (rs1). vd, vs2 and the
// return value all share one vector type.
vfloat16mf4_t __riscv_vfmul_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                               vfloat16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vfmul_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfmul_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                               vfloat16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vfmul_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfmul_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                              vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfmul_tu(vfloat16m1_t vd, vfloat16m1_t vs2, _Float16 rs1,
                              size_t vl);
vfloat16m2_t __riscv_vfmul_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                              vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfmul_tu(vfloat16m2_t vd, vfloat16m2_t vs2, _Float16 rs1,
                              size_t vl);
vfloat16m4_t __riscv_vfmul_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                              vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfmul_tu(vfloat16m4_t vd, vfloat16m4_t vs2, _Float16 rs1,
                              size_t vl);
vfloat16m8_t __riscv_vfmul_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                              vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfmul_tu(vfloat16m8_t vd, vfloat16m8_t vs2, _Float16 rs1,
                              size_t vl);
vfloat32mf2_t __riscv_vfmul_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                               vfloat32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfmul_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2, float rs1,
                               size_t vl);
vfloat32m1_t __riscv_vfmul_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                              vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfmul_tu(vfloat32m1_t vd, vfloat32m1_t vs2, float rs1,
                              size_t vl);
vfloat32m2_t __riscv_vfmul_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                              vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfmul_tu(vfloat32m2_t vd, vfloat32m2_t vs2, float rs1,
                              size_t vl);
vfloat32m4_t __riscv_vfmul_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                              vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfmul_tu(vfloat32m4_t vd, vfloat32m4_t vs2, float rs1,
                              size_t vl);
vfloat32m8_t __riscv_vfmul_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                              vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfmul_tu(vfloat32m8_t vd, vfloat32m8_t vs2, float rs1,
                              size_t vl);
vfloat64m1_t __riscv_vfmul_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                              vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfmul_tu(vfloat64m1_t vd, vfloat64m1_t vs2, double rs1,
                              size_t vl);
vfloat64m2_t __riscv_vfmul_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                              vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfmul_tu(vfloat64m2_t vd, vfloat64m2_t vs2, double rs1,
                              size_t vl);
vfloat64m4_t __riscv_vfmul_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                              vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfmul_tu(vfloat64m4_t vd, vfloat64m4_t vs2, double rs1,
                              size_t vl);
vfloat64m8_t __riscv_vfmul_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                              vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfmul_tu(vfloat64m8_t vd, vfloat64m8_t vs2, double rs1,
                              size_t vl);
// __riscv_vfdiv_tu overloads (no mask operand). Each element-width/LMUL type
// from vfloat16mf4_t through vfloat64m8_t gets two prototypes:
//   - vector-vector: (vd, vs2, vs1, vl)
//   - vector-scalar: (vd, vs2, rs1, vl), rs1 being the matching scalar type
//     (_Float16, float or double)
// The return type is always the type of vd.
// NOTE(review): operand order presumably follows vfdiv (vs2 / vs1 or
// vs2 / rs1) - confirm against the RVV spec.
vfloat16mf4_t __riscv_vfdiv_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                               vfloat16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vfdiv_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfdiv_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                               vfloat16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vfdiv_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfdiv_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                              vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfdiv_tu(vfloat16m1_t vd, vfloat16m1_t vs2, _Float16 rs1,
                              size_t vl);
vfloat16m2_t __riscv_vfdiv_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                              vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfdiv_tu(vfloat16m2_t vd, vfloat16m2_t vs2, _Float16 rs1,
                              size_t vl);
vfloat16m4_t __riscv_vfdiv_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                              vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfdiv_tu(vfloat16m4_t vd, vfloat16m4_t vs2, _Float16 rs1,
                              size_t vl);
vfloat16m8_t __riscv_vfdiv_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                              vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfdiv_tu(vfloat16m8_t vd, vfloat16m8_t vs2, _Float16 rs1,
                              size_t vl);
vfloat32mf2_t __riscv_vfdiv_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                               vfloat32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfdiv_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2, float rs1,
                               size_t vl);
vfloat32m1_t __riscv_vfdiv_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                              vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfdiv_tu(vfloat32m1_t vd, vfloat32m1_t vs2, float rs1,
                              size_t vl);
vfloat32m2_t __riscv_vfdiv_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                              vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfdiv_tu(vfloat32m2_t vd, vfloat32m2_t vs2, float rs1,
                              size_t vl);
vfloat32m4_t __riscv_vfdiv_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                              vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfdiv_tu(vfloat32m4_t vd, vfloat32m4_t vs2, float rs1,
                              size_t vl);
vfloat32m8_t __riscv_vfdiv_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                              vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfdiv_tu(vfloat32m8_t vd, vfloat32m8_t vs2, float rs1,
                              size_t vl);
vfloat64m1_t __riscv_vfdiv_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                              vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfdiv_tu(vfloat64m1_t vd, vfloat64m1_t vs2, double rs1,
                              size_t vl);
vfloat64m2_t __riscv_vfdiv_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                              vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfdiv_tu(vfloat64m2_t vd, vfloat64m2_t vs2, double rs1,
                              size_t vl);
vfloat64m4_t __riscv_vfdiv_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                              vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfdiv_tu(vfloat64m4_t vd, vfloat64m4_t vs2, double rs1,
                              size_t vl);
vfloat64m8_t __riscv_vfdiv_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                              vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfdiv_tu(vfloat64m8_t vd, vfloat64m8_t vs2, double rs1,
                              size_t vl);
// __riscv_vfrdiv_tu overloads (no mask operand). Only the vector-scalar form
// (vd, vs2, rs1, vl) is declared here: one prototype per element-width/LMUL
// type from vfloat16mf4_t through vfloat64m8_t, with rs1 being the matching
// scalar type (_Float16, float or double). The return type is the type of vd.
// NOTE(review): presumably the reverse divide (rs1 / vs2[i]) - confirm
// against the RVV spec.
vfloat16mf4_t __riscv_vfrdiv_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfrdiv_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfrdiv_tu(vfloat16m1_t vd, vfloat16m1_t vs2, _Float16 rs1,
                               size_t vl);
vfloat16m2_t __riscv_vfrdiv_tu(vfloat16m2_t vd, vfloat16m2_t vs2, _Float16 rs1,
                               size_t vl);
vfloat16m4_t __riscv_vfrdiv_tu(vfloat16m4_t vd, vfloat16m4_t vs2, _Float16 rs1,
                               size_t vl);
vfloat16m8_t __riscv_vfrdiv_tu(vfloat16m8_t vd, vfloat16m8_t vs2, _Float16 rs1,
                               size_t vl);
vfloat32mf2_t __riscv_vfrdiv_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2, float rs1,
                                size_t vl);
vfloat32m1_t __riscv_vfrdiv_tu(vfloat32m1_t vd, vfloat32m1_t vs2, float rs1,
                               size_t vl);
vfloat32m2_t __riscv_vfrdiv_tu(vfloat32m2_t vd, vfloat32m2_t vs2, float rs1,
                               size_t vl);
vfloat32m4_t __riscv_vfrdiv_tu(vfloat32m4_t vd, vfloat32m4_t vs2, float rs1,
                               size_t vl);
vfloat32m8_t __riscv_vfrdiv_tu(vfloat32m8_t vd, vfloat32m8_t vs2, float rs1,
                               size_t vl);
vfloat64m1_t __riscv_vfrdiv_tu(vfloat64m1_t vd, vfloat64m1_t vs2, double rs1,
                               size_t vl);
vfloat64m2_t __riscv_vfrdiv_tu(vfloat64m2_t vd, vfloat64m2_t vs2, double rs1,
                               size_t vl);
vfloat64m4_t __riscv_vfrdiv_tu(vfloat64m4_t vd, vfloat64m4_t vs2, double rs1,
                               size_t vl);
vfloat64m8_t __riscv_vfrdiv_tu(vfloat64m8_t vd, vfloat64m8_t vs2, double rs1,
                               size_t vl);
// masked functions: `_tum` overloads (mask `vm` is the first parameter)
// __riscv_vfmul_tum overloads. Same two forms per element-width/LMUL type
// (vfloat16mf4_t through vfloat64m8_t) as the unmasked listing, with a
// leading mask operand:
//   - vector-vector: (vm, vd, vs2, vs1, vl)
//   - vector-scalar: (vm, vd, vs2, rs1, vl)
// The mask type is vboolN_t with N = element width / LMUL, e.g.
// vfloat16mf4_t -> vbool64_t, vfloat32m1_t -> vbool32_t,
// vfloat64m8_t -> vbool8_t.
vfloat16mf4_t __riscv_vfmul_tum(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                size_t vl);
vfloat16mf4_t __riscv_vfmul_tum(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfmul_tum(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                size_t vl);
vfloat16mf2_t __riscv_vfmul_tum(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfmul_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                               vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfmul_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfmul_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                               vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfmul_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfmul_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                               vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfmul_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfmul_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                               vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfmul_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                               _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfmul_tum(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                size_t vl);
vfloat32mf2_t __riscv_vfmul_tum(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfmul_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                               vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfmul_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                               float rs1, size_t vl);
vfloat32m2_t __riscv_vfmul_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                               vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfmul_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                               float rs1, size_t vl);
vfloat32m4_t __riscv_vfmul_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                               vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfmul_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                               float rs1, size_t vl);
vfloat32m8_t __riscv_vfmul_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                               vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfmul_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                               float rs1, size_t vl);
vfloat64m1_t __riscv_vfmul_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                               vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfmul_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                               double rs1, size_t vl);
vfloat64m2_t __riscv_vfmul_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                               vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfmul_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                               double rs1, size_t vl);
vfloat64m4_t __riscv_vfmul_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                               vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfmul_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                               double rs1, size_t vl);
vfloat64m8_t __riscv_vfmul_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                               vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfmul_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                               double rs1, size_t vl);
// __riscv_vfdiv_tum overloads. For each element-width/LMUL type from
// vfloat16mf4_t through vfloat64m8_t there is a vector-vector form
// (vm, vd, vs2, vs1, vl) and a vector-scalar form (vm, vd, vs2, rs1, vl).
// The leading mask vm has type vboolN_t with N = element width / LMUL
// (e.g. vfloat16m8_t -> vbool2_t, vfloat64m1_t -> vbool64_t); the return
// type is the type of vd.
vfloat16mf4_t __riscv_vfdiv_tum(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                size_t vl);
vfloat16mf4_t __riscv_vfdiv_tum(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfdiv_tum(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                size_t vl);
vfloat16mf2_t __riscv_vfdiv_tum(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfdiv_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                               vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfdiv_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfdiv_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                               vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfdiv_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfdiv_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                               vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfdiv_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfdiv_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                               vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfdiv_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                               _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfdiv_tum(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                size_t vl);
vfloat32mf2_t __riscv_vfdiv_tum(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfdiv_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                               vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfdiv_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                               float rs1, size_t vl);
vfloat32m2_t __riscv_vfdiv_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                               vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfdiv_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                               float rs1, size_t vl);
vfloat32m4_t __riscv_vfdiv_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                               vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfdiv_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                               float rs1, size_t vl);
vfloat32m8_t __riscv_vfdiv_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                               vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfdiv_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                               float rs1, size_t vl);
vfloat64m1_t __riscv_vfdiv_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                               vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfdiv_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                               double rs1, size_t vl);
vfloat64m2_t __riscv_vfdiv_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                               vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfdiv_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                               double rs1, size_t vl);
vfloat64m4_t __riscv_vfdiv_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                               vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfdiv_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                               double rs1, size_t vl);
vfloat64m8_t __riscv_vfdiv_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                               vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfdiv_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                               double rs1, size_t vl);
// __riscv_vfrdiv_tum overloads. Only the vector-scalar form
// (vm, vd, vs2, rs1, vl) is declared here, one prototype per
// element-width/LMUL type from vfloat16mf4_t through vfloat64m8_t. The
// leading mask vm has type vboolN_t with N = element width / LMUL; rs1 is
// the matching scalar type (_Float16, float or double).
// NOTE(review): presumably the reverse divide (rs1 / vs2[i]) - confirm
// against the RVV spec.
vfloat16mf4_t __riscv_vfrdiv_tum(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfrdiv_tum(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfrdiv_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfrdiv_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfrdiv_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfrdiv_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfrdiv_tum(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfrdiv_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                float rs1, size_t vl);
vfloat32m2_t __riscv_vfrdiv_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                float rs1, size_t vl);
vfloat32m4_t __riscv_vfrdiv_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                float rs1, size_t vl);
vfloat32m8_t __riscv_vfrdiv_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                float rs1, size_t vl);
vfloat64m1_t __riscv_vfrdiv_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                double rs1, size_t vl);
vfloat64m2_t __riscv_vfrdiv_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                double rs1, size_t vl);
vfloat64m4_t __riscv_vfrdiv_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                double rs1, size_t vl);
vfloat64m8_t __riscv_vfrdiv_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                double rs1, size_t vl);
// masked functions: `_tumu` overloads (mask `vm` is the first parameter)
// __riscv_vfmul_tumu overloads. For each element-width/LMUL type from
// vfloat16mf4_t through vfloat64m8_t there is a vector-vector form
// (vm, vd, vs2, vs1, vl) and a vector-scalar form (vm, vd, vs2, rs1, vl).
// The leading mask vm has type vboolN_t with N = element width / LMUL
// (e.g. vfloat16mf4_t -> vbool64_t, vfloat32m8_t -> vbool4_t); the return
// type is the type of vd.
vfloat16mf4_t __riscv_vfmul_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                 size_t vl);
vfloat16mf4_t __riscv_vfmul_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfmul_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                 size_t vl);
vfloat16mf2_t __riscv_vfmul_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfmul_tumu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfmul_tumu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfmul_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfmul_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfmul_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfmul_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfmul_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfmul_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfmul_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                 size_t vl);
vfloat32mf2_t __riscv_vfmul_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfmul_tumu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfmul_tumu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                float rs1, size_t vl);
vfloat32m2_t __riscv_vfmul_tumu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfmul_tumu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                float rs1, size_t vl);
vfloat32m4_t __riscv_vfmul_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfmul_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                float rs1, size_t vl);
vfloat32m8_t __riscv_vfmul_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfmul_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                float rs1, size_t vl);
vfloat64m1_t __riscv_vfmul_tumu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfmul_tumu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                double rs1, size_t vl);
vfloat64m2_t __riscv_vfmul_tumu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfmul_tumu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                double rs1, size_t vl);
vfloat64m4_t __riscv_vfmul_tumu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfmul_tumu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                double rs1, size_t vl);
vfloat64m8_t __riscv_vfmul_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfmul_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                double rs1, size_t vl);
// __riscv_vfdiv_tumu overloads. For each element-width/LMUL type from
// vfloat16mf4_t through vfloat64m8_t there is a vector-vector form
// (vm, vd, vs2, vs1, vl) and a vector-scalar form (vm, vd, vs2, rs1, vl).
// The leading mask vm has type vboolN_t with N = element width / LMUL
// (e.g. vfloat16m1_t -> vbool16_t, vfloat64m2_t -> vbool32_t); the return
// type is the type of vd.
vfloat16mf4_t __riscv_vfdiv_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                 size_t vl);
vfloat16mf4_t __riscv_vfdiv_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfdiv_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                 size_t vl);
vfloat16mf2_t __riscv_vfdiv_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfdiv_tumu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfdiv_tumu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfdiv_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfdiv_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfdiv_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfdiv_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfdiv_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfdiv_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfdiv_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                 size_t vl);
vfloat32mf2_t __riscv_vfdiv_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfdiv_tumu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfdiv_tumu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                float rs1, size_t vl);
vfloat32m2_t __riscv_vfdiv_tumu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfdiv_tumu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                float rs1, size_t vl);
vfloat32m4_t __riscv_vfdiv_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfdiv_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                float rs1, size_t vl);
vfloat32m8_t __riscv_vfdiv_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfdiv_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                float rs1, size_t vl);
vfloat64m1_t __riscv_vfdiv_tumu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfdiv_tumu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                double rs1, size_t vl);
vfloat64m2_t __riscv_vfdiv_tumu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfdiv_tumu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                double rs1, size_t vl);
vfloat64m4_t __riscv_vfdiv_tumu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfdiv_tumu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                double rs1, size_t vl);
vfloat64m8_t __riscv_vfdiv_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfdiv_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                double rs1, size_t vl);
// __riscv_vfrdiv_tumu overloads. Only the vector-scalar form
// (vm, vd, vs2, rs1, vl) is declared here, one prototype per
// element-width/LMUL type from vfloat16mf4_t through vfloat64m8_t. The
// leading mask vm has type vboolN_t with N = element width / LMUL; rs1 is
// the matching scalar type (_Float16, float or double).
// NOTE(review): presumably the reverse divide (rs1 / vs2[i]) - confirm
// against the RVV spec.
vfloat16mf4_t __riscv_vfrdiv_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfrdiv_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfrdiv_tumu(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat16m1_t vs2, _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfrdiv_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                 _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfrdiv_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                 _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfrdiv_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                 _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfrdiv_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfrdiv_tumu(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat32m1_t vs2, float rs1, size_t vl);
vfloat32m2_t __riscv_vfrdiv_tumu(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat32m2_t vs2, float rs1, size_t vl);
vfloat32m4_t __riscv_vfrdiv_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                 float rs1, size_t vl);
vfloat32m8_t __riscv_vfrdiv_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                 float rs1, size_t vl);
vfloat64m1_t __riscv_vfrdiv_tumu(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat64m1_t vs2, double rs1, size_t vl);
vfloat64m2_t __riscv_vfrdiv_tumu(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat64m2_t vs2, double rs1, size_t vl);
vfloat64m4_t __riscv_vfrdiv_tumu(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat64m4_t vs2, double rs1, size_t vl);
vfloat64m8_t __riscv_vfrdiv_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                 double rs1, size_t vl);
// masked functions: _mu policy variants (mask operand vm, no frm argument)
// __riscv_vfmul_mu overloads: masked (vm), without an frm argument. Every
// listed type (f16 mf4..m8, f32 mf2..m8, f64 m1..m8) appears twice: a
// vector-vector form (vs1) and a vector-scalar form (rs1 of the element
// type). The mask type is paired with the data type (e.g. vbool64_t with
// vfloat16mf4_t, vbool2_t with vfloat16m8_t).
// NOTE(review): vfmul is presumably the element-wise floating-point multiply
// and _mu the mask-undisturbed policy -- confirm against the RVV spec.
vfloat16mf4_t __riscv_vfmul_mu(vbool64_t vm, vfloat16mf4_t vd,
                               vfloat16mf4_t vs2, vfloat16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vfmul_mu(vbool64_t vm, vfloat16mf4_t vd,
                               vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfmul_mu(vbool32_t vm, vfloat16mf2_t vd,
                               vfloat16mf2_t vs2, vfloat16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vfmul_mu(vbool32_t vm, vfloat16mf2_t vd,
                               vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfmul_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                              vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfmul_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                              _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfmul_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                              vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfmul_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                              _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfmul_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                              vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfmul_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                              _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfmul_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                              vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfmul_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                              _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfmul_mu(vbool64_t vm, vfloat32mf2_t vd,
                               vfloat32mf2_t vs2, vfloat32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfmul_mu(vbool64_t vm, vfloat32mf2_t vd,
                               vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfmul_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                              vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfmul_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                              float rs1, size_t vl);
vfloat32m2_t __riscv_vfmul_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                              vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfmul_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                              float rs1, size_t vl);
vfloat32m4_t __riscv_vfmul_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                              vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfmul_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                              float rs1, size_t vl);
vfloat32m8_t __riscv_vfmul_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                              vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfmul_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                              float rs1, size_t vl);
vfloat64m1_t __riscv_vfmul_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                              vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfmul_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                              double rs1, size_t vl);
vfloat64m2_t __riscv_vfmul_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                              vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfmul_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                              double rs1, size_t vl);
vfloat64m4_t __riscv_vfmul_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                              vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfmul_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                              double rs1, size_t vl);
vfloat64m8_t __riscv_vfmul_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                              vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfmul_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                              double rs1, size_t vl);
// __riscv_vfdiv_mu overloads: masked (vm), without an frm argument. Every
// listed type (f16 mf4..m8, f32 mf2..m8, f64 m1..m8) appears twice: a
// vector-vector form (vs1) and a vector-scalar form (rs1 of the element
// type).
// NOTE(review): vfdiv is presumably the element-wise floating-point divide
// (vs2 / vs1 or vs2 / rs1) and _mu the mask-undisturbed policy -- confirm
// against the RVV spec.
vfloat16mf4_t __riscv_vfdiv_mu(vbool64_t vm, vfloat16mf4_t vd,
                               vfloat16mf4_t vs2, vfloat16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vfdiv_mu(vbool64_t vm, vfloat16mf4_t vd,
                               vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfdiv_mu(vbool32_t vm, vfloat16mf2_t vd,
                               vfloat16mf2_t vs2, vfloat16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vfdiv_mu(vbool32_t vm, vfloat16mf2_t vd,
                               vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfdiv_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                              vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfdiv_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                              _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfdiv_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                              vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfdiv_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                              _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfdiv_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                              vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfdiv_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                              _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfdiv_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                              vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfdiv_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                              _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfdiv_mu(vbool64_t vm, vfloat32mf2_t vd,
                               vfloat32mf2_t vs2, vfloat32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfdiv_mu(vbool64_t vm, vfloat32mf2_t vd,
                               vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfdiv_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                              vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfdiv_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                              float rs1, size_t vl);
vfloat32m2_t __riscv_vfdiv_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                              vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfdiv_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                              float rs1, size_t vl);
vfloat32m4_t __riscv_vfdiv_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                              vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfdiv_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                              float rs1, size_t vl);
vfloat32m8_t __riscv_vfdiv_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                              vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfdiv_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                              float rs1, size_t vl);
vfloat64m1_t __riscv_vfdiv_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                              vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfdiv_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                              double rs1, size_t vl);
vfloat64m2_t __riscv_vfdiv_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                              vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfdiv_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                              double rs1, size_t vl);
vfloat64m4_t __riscv_vfdiv_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                              vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfdiv_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                              double rs1, size_t vl);
vfloat64m8_t __riscv_vfdiv_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                              vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfdiv_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                              double rs1, size_t vl);
// __riscv_vfrdiv_mu overloads: masked (vm), without an frm argument. Only a
// vector-scalar form exists (rs1 of the element type); there is no
// vector-vector (vs1) overload in this group.
// NOTE(review): vfrdiv is presumably the reversed divide (rs1 / vs2) and _mu
// the mask-undisturbed policy -- confirm against the RVV spec.
vfloat16mf4_t __riscv_vfrdiv_mu(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfrdiv_mu(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfrdiv_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfrdiv_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfrdiv_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfrdiv_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                               _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfrdiv_mu(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfrdiv_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                               float rs1, size_t vl);
vfloat32m2_t __riscv_vfrdiv_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                               float rs1, size_t vl);
vfloat32m4_t __riscv_vfrdiv_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                               float rs1, size_t vl);
vfloat32m8_t __riscv_vfrdiv_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                               float rs1, size_t vl);
vfloat64m1_t __riscv_vfrdiv_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                               double rs1, size_t vl);
vfloat64m2_t __riscv_vfrdiv_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                               double rs1, size_t vl);
vfloat64m4_t __riscv_vfrdiv_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                               double rs1, size_t vl);
vfloat64m8_t __riscv_vfrdiv_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                               double rs1, size_t vl);
// __riscv_vfmul_tu overloads with an explicit frm argument: unmasked (no vm
// parameter), in vector-vector (vs1) and vector-scalar (rs1) forms for every
// listed f16/f32/f64 type, with `unsigned int frm` placed just before vl.
// NOTE(review): frm is presumably the floating-point rounding-mode selector
// and _tu the tail-undisturbed policy -- confirm against the RVV intrinsics
// spec.
vfloat16mf4_t __riscv_vfmul_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                               vfloat16mf4_t vs1, unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmul_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmul_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                               vfloat16mf2_t vs1, unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmul_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmul_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                              vfloat16m1_t vs1, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmul_tu(vfloat16m1_t vd, vfloat16m1_t vs2, _Float16 rs1,
                              unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmul_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                              vfloat16m2_t vs1, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmul_tu(vfloat16m2_t vd, vfloat16m2_t vs2, _Float16 rs1,
                              unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmul_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                              vfloat16m4_t vs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmul_tu(vfloat16m4_t vd, vfloat16m4_t vs2, _Float16 rs1,
                              unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmul_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                              vfloat16m8_t vs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmul_tu(vfloat16m8_t vd, vfloat16m8_t vs2, _Float16 rs1,
                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmul_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                               vfloat32mf2_t vs1, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmul_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2, float rs1,
                               unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmul_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                              vfloat32m1_t vs1, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmul_tu(vfloat32m1_t vd, vfloat32m1_t vs2, float rs1,
                              unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmul_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                              vfloat32m2_t vs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmul_tu(vfloat32m2_t vd, vfloat32m2_t vs2, float rs1,
                              unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmul_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                              vfloat32m4_t vs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmul_tu(vfloat32m4_t vd, vfloat32m4_t vs2, float rs1,
                              unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmul_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                              vfloat32m8_t vs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmul_tu(vfloat32m8_t vd, vfloat32m8_t vs2, float rs1,
                              unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmul_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                              vfloat64m1_t vs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmul_tu(vfloat64m1_t vd, vfloat64m1_t vs2, double rs1,
                              unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmul_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                              vfloat64m2_t vs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmul_tu(vfloat64m2_t vd, vfloat64m2_t vs2, double rs1,
                              unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmul_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                              vfloat64m4_t vs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmul_tu(vfloat64m4_t vd, vfloat64m4_t vs2, double rs1,
                              unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmul_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                              vfloat64m8_t vs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmul_tu(vfloat64m8_t vd, vfloat64m8_t vs2, double rs1,
                              unsigned int frm, size_t vl);
// __riscv_vfdiv_tu overloads with an explicit frm argument: unmasked (no vm
// parameter), in vector-vector (vs1) and vector-scalar (rs1) forms for every
// listed f16/f32/f64 type, with `unsigned int frm` placed just before vl.
// NOTE(review): frm is presumably the floating-point rounding-mode selector
// and _tu the tail-undisturbed policy -- confirm against the RVV intrinsics
// spec.
vfloat16mf4_t __riscv_vfdiv_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                               vfloat16mf4_t vs1, unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfdiv_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfdiv_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                               vfloat16mf2_t vs1, unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfdiv_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfdiv_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                              vfloat16m1_t vs1, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfdiv_tu(vfloat16m1_t vd, vfloat16m1_t vs2, _Float16 rs1,
                              unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfdiv_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                              vfloat16m2_t vs1, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfdiv_tu(vfloat16m2_t vd, vfloat16m2_t vs2, _Float16 rs1,
                              unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfdiv_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                              vfloat16m4_t vs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfdiv_tu(vfloat16m4_t vd, vfloat16m4_t vs2, _Float16 rs1,
                              unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfdiv_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                              vfloat16m8_t vs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfdiv_tu(vfloat16m8_t vd, vfloat16m8_t vs2, _Float16 rs1,
                              unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfdiv_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                               vfloat32mf2_t vs1, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfdiv_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2, float rs1,
                               unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfdiv_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                              vfloat32m1_t vs1, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfdiv_tu(vfloat32m1_t vd, vfloat32m1_t vs2, float rs1,
                              unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfdiv_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                              vfloat32m2_t vs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfdiv_tu(vfloat32m2_t vd, vfloat32m2_t vs2, float rs1,
                              unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfdiv_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                              vfloat32m4_t vs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfdiv_tu(vfloat32m4_t vd, vfloat32m4_t vs2, float rs1,
                              unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfdiv_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                              vfloat32m8_t vs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfdiv_tu(vfloat32m8_t vd, vfloat32m8_t vs2, float rs1,
                              unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfdiv_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                              vfloat64m1_t vs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfdiv_tu(vfloat64m1_t vd, vfloat64m1_t vs2, double rs1,
                              unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfdiv_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                              vfloat64m2_t vs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfdiv_tu(vfloat64m2_t vd, vfloat64m2_t vs2, double rs1,
                              unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfdiv_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                              vfloat64m4_t vs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfdiv_tu(vfloat64m4_t vd, vfloat64m4_t vs2, double rs1,
                              unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfdiv_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                              vfloat64m8_t vs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfdiv_tu(vfloat64m8_t vd, vfloat64m8_t vs2, double rs1,
                              unsigned int frm, size_t vl);
// __riscv_vfrdiv_tu overloads with an explicit frm argument: unmasked (no vm
// parameter) and vector-scalar only (rs1 of the element type), with
// `unsigned int frm` placed just before vl.
// NOTE(review): vfrdiv is presumably the reversed divide (rs1 / vs2), frm the
// rounding-mode selector, and _tu the tail-undisturbed policy -- confirm
// against the RVV intrinsics spec.
vfloat16mf4_t __riscv_vfrdiv_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                _Float16 rs1, unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfrdiv_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfrdiv_tu(vfloat16m1_t vd, vfloat16m1_t vs2, _Float16 rs1,
                               unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfrdiv_tu(vfloat16m2_t vd, vfloat16m2_t vs2, _Float16 rs1,
                               unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfrdiv_tu(vfloat16m4_t vd, vfloat16m4_t vs2, _Float16 rs1,
                               unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfrdiv_tu(vfloat16m8_t vd, vfloat16m8_t vs2, _Float16 rs1,
                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfrdiv_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2, float rs1,
                                unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfrdiv_tu(vfloat32m1_t vd, vfloat32m1_t vs2, float rs1,
                               unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfrdiv_tu(vfloat32m2_t vd, vfloat32m2_t vs2, float rs1,
                               unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfrdiv_tu(vfloat32m4_t vd, vfloat32m4_t vs2, float rs1,
                               unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfrdiv_tu(vfloat32m8_t vd, vfloat32m8_t vs2, float rs1,
                               unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfrdiv_tu(vfloat64m1_t vd, vfloat64m1_t vs2, double rs1,
                               unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfrdiv_tu(vfloat64m2_t vd, vfloat64m2_t vs2, double rs1,
                               unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfrdiv_tu(vfloat64m4_t vd, vfloat64m4_t vs2, double rs1,
                               unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfrdiv_tu(vfloat64m8_t vd, vfloat64m8_t vs2, double rs1,
                               unsigned int frm, size_t vl);
// masked functions: _tum policy variants taking an explicit frm argument
// __riscv_vfmul_tum overloads with an explicit frm argument: masked (vm
// first), in vector-vector (vs1) and vector-scalar (rs1) forms for every
// listed f16/f32/f64 type, with `unsigned int frm` placed just before vl.
// NOTE(review): frm is presumably the rounding-mode selector and _tum the
// tail-undisturbed, mask-agnostic policy -- confirm against the RVV
// intrinsics spec.
vfloat16mf4_t __riscv_vfmul_tum(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmul_tum(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs2, _Float16 rs1,
                                unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmul_tum(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmul_tum(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs2, _Float16 rs1,
                                unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmul_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                               vfloat16m1_t vs1, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmul_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmul_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                               vfloat16m2_t vs1, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmul_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmul_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                               vfloat16m4_t vs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmul_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmul_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                               vfloat16m8_t vs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmul_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmul_tum(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmul_tum(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs2, float rs1, unsigned int frm,
                                size_t vl);
vfloat32m1_t __riscv_vfmul_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                               vfloat32m1_t vs1, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmul_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                               float rs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmul_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                               vfloat32m2_t vs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmul_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                               float rs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmul_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                               vfloat32m4_t vs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmul_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                               float rs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmul_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                               vfloat32m8_t vs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmul_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                               float rs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmul_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                               vfloat64m1_t vs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmul_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                               double rs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmul_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                               vfloat64m2_t vs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmul_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                               double rs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmul_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                               vfloat64m4_t vs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmul_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                               double rs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmul_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                               vfloat64m8_t vs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmul_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                               double rs1, unsigned int frm, size_t vl);
// __riscv_vfdiv_tum overloads with an explicit frm argument: masked (vm
// first), in vector-vector (vs1) and vector-scalar (rs1) forms for every
// listed f16/f32/f64 type, with `unsigned int frm` placed just before vl.
// NOTE(review): frm is presumably the rounding-mode selector and _tum the
// tail-undisturbed, mask-agnostic policy -- confirm against the RVV
// intrinsics spec.
vfloat16mf4_t __riscv_vfdiv_tum(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfdiv_tum(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs2, _Float16 rs1,
                                unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfdiv_tum(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfdiv_tum(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs2, _Float16 rs1,
                                unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfdiv_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                               vfloat16m1_t vs1, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfdiv_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfdiv_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                               vfloat16m2_t vs1, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfdiv_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfdiv_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                               vfloat16m4_t vs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfdiv_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfdiv_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                               vfloat16m8_t vs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfdiv_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfdiv_tum(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfdiv_tum(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs2, float rs1, unsigned int frm,
                                size_t vl);
vfloat32m1_t __riscv_vfdiv_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                               vfloat32m1_t vs1, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfdiv_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                               float rs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfdiv_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                               vfloat32m2_t vs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfdiv_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                               float rs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfdiv_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                               vfloat32m4_t vs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfdiv_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                               float rs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfdiv_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                               vfloat32m8_t vs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfdiv_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                               float rs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfdiv_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                               vfloat64m1_t vs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfdiv_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                               double rs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfdiv_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                               vfloat64m2_t vs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfdiv_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                               double rs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfdiv_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                               vfloat64m4_t vs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfdiv_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                               double rs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfdiv_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                               vfloat64m8_t vs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfdiv_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                               double rs1, unsigned int frm, size_t vl);
// __riscv_vfrdiv_tum overloads with an explicit frm argument: masked (vm
// first) and vector-scalar only (rs1 of the element type), with
// `unsigned int frm` placed just before vl.
// NOTE(review): vfrdiv is presumably the reversed divide (rs1 / vs2), frm the
// rounding-mode selector, and _tum the tail-undisturbed, mask-agnostic
// policy -- confirm against the RVV intrinsics spec.
vfloat16mf4_t __riscv_vfrdiv_tum(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, _Float16 rs1,
                                 unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfrdiv_tum(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, _Float16 rs1,
                                 unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfrdiv_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfrdiv_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfrdiv_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfrdiv_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                _Float16 rs1, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfrdiv_tum(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, float rs1, unsigned int frm,
                                 size_t vl);
vfloat32m1_t __riscv_vfrdiv_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                float rs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfrdiv_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                float rs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfrdiv_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                float rs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfrdiv_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                float rs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfrdiv_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                double rs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfrdiv_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                double rs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfrdiv_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                double rs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfrdiv_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                double rs1, unsigned int frm, size_t vl);
// masked functions
// __riscv_vfmul_tumu overloads. Every overload takes the mask `vm`, the
// operands `vd` and `vs2` (same vector type as the return value), a second
// source that is either a vector `vs1` or a scalar `rs1`, then `frm` and `vl`.
// Each vector type is listed twice: vector-vector form first, then
// vector-scalar form.
// NOTE(review): `frm` is presumably the floating-point rounding mode and the
// `_tumu` suffix presumably names the tail/mask policy -- confirm against the
// RVV intrinsics specification.
vfloat16mf4_t __riscv_vfmul_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                 unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmul_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, _Float16 rs1,
                                 unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmul_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                 unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmul_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, _Float16 rs1,
                                 unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmul_tumu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                vfloat16m1_t vs1, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmul_tumu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmul_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                vfloat16m2_t vs1, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmul_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmul_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                vfloat16m4_t vs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmul_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmul_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                vfloat16m8_t vs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmul_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                _Float16 rs1, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmul_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                 unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmul_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, float rs1, unsigned int frm,
                                 size_t vl);
vfloat32m1_t __riscv_vfmul_tumu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                vfloat32m1_t vs1, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmul_tumu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                float rs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmul_tumu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                vfloat32m2_t vs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmul_tumu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                float rs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmul_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                vfloat32m4_t vs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmul_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                float rs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmul_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                vfloat32m8_t vs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmul_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                float rs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmul_tumu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                vfloat64m1_t vs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmul_tumu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                double rs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmul_tumu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                vfloat64m2_t vs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmul_tumu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                double rs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmul_tumu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                vfloat64m4_t vs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmul_tumu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                double rs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmul_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                vfloat64m8_t vs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmul_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                double rs1, unsigned int frm, size_t vl);
// __riscv_vfdiv_tumu overloads. Every overload takes the mask `vm`, the
// operands `vd` and `vs2` (same vector type as the return value), a second
// source that is either a vector `vs1` or a scalar `rs1`, then `frm` and `vl`.
// Each vector type is listed twice: vector-vector form first, then
// vector-scalar form.
// NOTE(review): operand order of the division (presumably vs2 / vs1 or
// vs2 / rs1) and the meaning of `frm` are not shown here -- confirm in the
// RVV specification.
vfloat16mf4_t __riscv_vfdiv_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                 unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfdiv_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, _Float16 rs1,
                                 unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfdiv_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                 unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfdiv_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, _Float16 rs1,
                                 unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfdiv_tumu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                vfloat16m1_t vs1, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfdiv_tumu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfdiv_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                vfloat16m2_t vs1, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfdiv_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfdiv_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                vfloat16m4_t vs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfdiv_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfdiv_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                vfloat16m8_t vs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfdiv_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                _Float16 rs1, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfdiv_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                 unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfdiv_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, float rs1, unsigned int frm,
                                 size_t vl);
vfloat32m1_t __riscv_vfdiv_tumu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                vfloat32m1_t vs1, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfdiv_tumu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                float rs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfdiv_tumu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                vfloat32m2_t vs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfdiv_tumu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                float rs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfdiv_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                vfloat32m4_t vs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfdiv_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                float rs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfdiv_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                vfloat32m8_t vs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfdiv_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                float rs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfdiv_tumu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                vfloat64m1_t vs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfdiv_tumu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                double rs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfdiv_tumu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                vfloat64m2_t vs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfdiv_tumu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                double rs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfdiv_tumu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                vfloat64m4_t vs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfdiv_tumu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                double rs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfdiv_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                vfloat64m8_t vs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfdiv_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                double rs1, unsigned int frm, size_t vl);
// __riscv_vfrdiv_tumu overloads: one per vector type, vector-scalar form only
// (there is no `vs1` overload). Each takes the mask `vm`, the operands `vd`
// and `vs2` (same vector type as the return value), a scalar `rs1` of the
// matching element type (_Float16, float or double), then `frm` and `vl`.
// NOTE(review): presumably the "reverse" divide rs1 / vs2 -- confirm in the
// RVV specification.
vfloat16mf4_t __riscv_vfrdiv_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat16mf4_t vs2, _Float16 rs1,
                                  unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfrdiv_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat16mf2_t vs2, _Float16 rs1,
                                  unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfrdiv_tumu(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat16m1_t vs2, _Float16 rs1,
                                 unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfrdiv_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                 _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfrdiv_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                 _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfrdiv_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                 _Float16 rs1, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfrdiv_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat32mf2_t vs2, float rs1,
                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfrdiv_tumu(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat32m1_t vs2, float rs1, unsigned int frm,
                                 size_t vl);
vfloat32m2_t __riscv_vfrdiv_tumu(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat32m2_t vs2, float rs1, unsigned int frm,
                                 size_t vl);
vfloat32m4_t __riscv_vfrdiv_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                 float rs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfrdiv_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                 float rs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfrdiv_tumu(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat64m1_t vs2, double rs1, unsigned int frm,
                                 size_t vl);
vfloat64m2_t __riscv_vfrdiv_tumu(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat64m2_t vs2, double rs1, unsigned int frm,
                                 size_t vl);
vfloat64m4_t __riscv_vfrdiv_tumu(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat64m4_t vs2, double rs1, unsigned int frm,
                                 size_t vl);
vfloat64m8_t __riscv_vfrdiv_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                 double rs1, unsigned int frm, size_t vl);
// masked functions
// __riscv_vfmul_mu overloads. Every overload takes the mask `vm`, the
// operands `vd` and `vs2` (same vector type as the return value), a second
// source that is either a vector `vs1` or a scalar `rs1`, then `frm` and `vl`.
// Each vector type is listed twice: vector-vector form first, then
// vector-scalar form.
// NOTE(review): `frm` is presumably the floating-point rounding mode and the
// `_mu` suffix presumably names the mask policy -- confirm against the RVV
// intrinsics specification.
vfloat16mf4_t __riscv_vfmul_mu(vbool64_t vm, vfloat16mf4_t vd,
                               vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                               unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmul_mu(vbool64_t vm, vfloat16mf4_t vd,
                               vfloat16mf4_t vs2, _Float16 rs1,
                               unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmul_mu(vbool32_t vm, vfloat16mf2_t vd,
                               vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                               unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmul_mu(vbool32_t vm, vfloat16mf2_t vd,
                               vfloat16mf2_t vs2, _Float16 rs1,
                               unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmul_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                              vfloat16m1_t vs1, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmul_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                              _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmul_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                              vfloat16m2_t vs1, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmul_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                              _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmul_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                              vfloat16m4_t vs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmul_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                              _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmul_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                              vfloat16m8_t vs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmul_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                              _Float16 rs1, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmul_mu(vbool64_t vm, vfloat32mf2_t vd,
                               vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmul_mu(vbool64_t vm, vfloat32mf2_t vd,
                               vfloat32mf2_t vs2, float rs1, unsigned int frm,
                               size_t vl);
vfloat32m1_t __riscv_vfmul_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                              vfloat32m1_t vs1, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmul_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                              float rs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmul_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                              vfloat32m2_t vs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmul_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                              float rs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmul_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                              vfloat32m4_t vs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmul_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                              float rs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmul_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                              vfloat32m8_t vs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmul_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                              float rs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmul_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                              vfloat64m1_t vs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmul_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                              double rs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmul_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                              vfloat64m2_t vs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmul_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                              double rs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmul_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                              vfloat64m4_t vs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmul_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                              double rs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmul_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                              vfloat64m8_t vs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmul_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                              double rs1, unsigned int frm, size_t vl);
// __riscv_vfdiv_mu overloads. Every overload takes the mask `vm`, the
// operands `vd` and `vs2` (same vector type as the return value), a second
// source that is either a vector `vs1` or a scalar `rs1`, then `frm` and `vl`.
// Each vector type is listed twice: vector-vector form first, then
// vector-scalar form.
// NOTE(review): operand order of the division (presumably vs2 / vs1 or
// vs2 / rs1) and the meaning of `frm` are not shown here -- confirm in the
// RVV specification.
vfloat16mf4_t __riscv_vfdiv_mu(vbool64_t vm, vfloat16mf4_t vd,
                               vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                               unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfdiv_mu(vbool64_t vm, vfloat16mf4_t vd,
                               vfloat16mf4_t vs2, _Float16 rs1,
                               unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfdiv_mu(vbool32_t vm, vfloat16mf2_t vd,
                               vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                               unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfdiv_mu(vbool32_t vm, vfloat16mf2_t vd,
                               vfloat16mf2_t vs2, _Float16 rs1,
                               unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfdiv_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                              vfloat16m1_t vs1, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfdiv_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                              _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfdiv_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                              vfloat16m2_t vs1, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfdiv_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                              _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfdiv_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                              vfloat16m4_t vs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfdiv_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                              _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfdiv_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                              vfloat16m8_t vs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfdiv_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                              _Float16 rs1, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfdiv_mu(vbool64_t vm, vfloat32mf2_t vd,
                               vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfdiv_mu(vbool64_t vm, vfloat32mf2_t vd,
                               vfloat32mf2_t vs2, float rs1, unsigned int frm,
                               size_t vl);
vfloat32m1_t __riscv_vfdiv_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                              vfloat32m1_t vs1, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfdiv_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                              float rs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfdiv_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                              vfloat32m2_t vs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfdiv_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                              float rs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfdiv_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                              vfloat32m4_t vs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfdiv_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                              float rs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfdiv_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                              vfloat32m8_t vs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfdiv_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                              float rs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfdiv_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                              vfloat64m1_t vs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfdiv_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                              double rs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfdiv_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                              vfloat64m2_t vs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfdiv_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                              double rs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfdiv_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                              vfloat64m4_t vs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfdiv_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                              double rs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfdiv_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                              vfloat64m8_t vs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfdiv_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                              double rs1, unsigned int frm, size_t vl);
// __riscv_vfrdiv_mu overloads: one per vector type, vector-scalar form only
// (there is no `vs1` overload). Each takes the mask `vm`, the operands `vd`
// and `vs2` (same vector type as the return value), a scalar `rs1` of the
// matching element type (_Float16, float or double), then `frm` and `vl`.
// NOTE(review): presumably the "reverse" divide rs1 / vs2 -- confirm in the
// RVV specification.
vfloat16mf4_t __riscv_vfrdiv_mu(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs2, _Float16 rs1,
                                unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfrdiv_mu(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs2, _Float16 rs1,
                                unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfrdiv_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfrdiv_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfrdiv_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfrdiv_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfrdiv_mu(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs2, float rs1, unsigned int frm,
                                size_t vl);
vfloat32m1_t __riscv_vfrdiv_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                               float rs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfrdiv_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                               float rs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfrdiv_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                               float rs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfrdiv_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                               float rs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfrdiv_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                               double rs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfrdiv_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                               double rs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfrdiv_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                               double rs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfrdiv_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                               double rs1, unsigned int frm, size_t vl);

Vector Widening Floating-Point Multiply Intrinsics

// __riscv_vfwmul_tu overloads (no mask parameter). `vd` and the return value
// share one vector type whose element width is twice that of the sources:
// float16 sources give float32 results, float32 sources give float64 results.
// The second source is either a vector `vs1` (same type as `vs2`) or a scalar
// `rs1` of the source element type; `vl` is the last parameter. These
// overloads take no `frm` argument.
// NOTE(review): the `_tu` suffix presumably names the tail policy -- confirm
// against the RVV intrinsics specification.
vfloat32mf2_t __riscv_vfwmul_tu(vfloat32mf2_t vd, vfloat16mf4_t vs2,
                                vfloat16mf4_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfwmul_tu(vfloat32mf2_t vd, vfloat16mf4_t vs2,
                                _Float16 rs1, size_t vl);
vfloat32m1_t __riscv_vfwmul_tu(vfloat32m1_t vd, vfloat16mf2_t vs2,
                               vfloat16mf2_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwmul_tu(vfloat32m1_t vd, vfloat16mf2_t vs2, _Float16 rs1,
                               size_t vl);
vfloat32m2_t __riscv_vfwmul_tu(vfloat32m2_t vd, vfloat16m1_t vs2,
                               vfloat16m1_t vs1, size_t vl);
vfloat32m2_t __riscv_vfwmul_tu(vfloat32m2_t vd, vfloat16m1_t vs2, _Float16 rs1,
                               size_t vl);
vfloat32m4_t __riscv_vfwmul_tu(vfloat32m4_t vd, vfloat16m2_t vs2,
                               vfloat16m2_t vs1, size_t vl);
vfloat32m4_t __riscv_vfwmul_tu(vfloat32m4_t vd, vfloat16m2_t vs2, _Float16 rs1,
                               size_t vl);
vfloat32m8_t __riscv_vfwmul_tu(vfloat32m8_t vd, vfloat16m4_t vs2,
                               vfloat16m4_t vs1, size_t vl);
vfloat32m8_t __riscv_vfwmul_tu(vfloat32m8_t vd, vfloat16m4_t vs2, _Float16 rs1,
                               size_t vl);
vfloat64m1_t __riscv_vfwmul_tu(vfloat64m1_t vd, vfloat32mf2_t vs2,
                               vfloat32mf2_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwmul_tu(vfloat64m1_t vd, vfloat32mf2_t vs2, float rs1,
                               size_t vl);
vfloat64m2_t __riscv_vfwmul_tu(vfloat64m2_t vd, vfloat32m1_t vs2,
                               vfloat32m1_t vs1, size_t vl);
vfloat64m2_t __riscv_vfwmul_tu(vfloat64m2_t vd, vfloat32m1_t vs2, float rs1,
                               size_t vl);
vfloat64m4_t __riscv_vfwmul_tu(vfloat64m4_t vd, vfloat32m2_t vs2,
                               vfloat32m2_t vs1, size_t vl);
vfloat64m4_t __riscv_vfwmul_tu(vfloat64m4_t vd, vfloat32m2_t vs2, float rs1,
                               size_t vl);
vfloat64m8_t __riscv_vfwmul_tu(vfloat64m8_t vd, vfloat32m4_t vs2,
                               vfloat32m4_t vs1, size_t vl);
vfloat64m8_t __riscv_vfwmul_tu(vfloat64m8_t vd, vfloat32m4_t vs2, float rs1,
                               size_t vl);
// masked functions
// __riscv_vfwmul_tum overloads. Each takes the mask `vm` first; `vd` and the
// return value share one vector type whose element width is twice that of
// the sources (float16 -> float32, float32 -> float64). The second source is
// either a vector `vs1` (same type as `vs2`) or a scalar `rs1` of the source
// element type; `vl` is the last parameter. No `frm` argument is taken.
// NOTE(review): the `_tum` suffix presumably names the tail/mask policy --
// confirm against the RVV intrinsics specification.
vfloat32mf2_t __riscv_vfwmul_tum(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                 size_t vl);
vfloat32mf2_t __riscv_vfwmul_tum(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat32m1_t __riscv_vfwmul_tum(vbool32_t vm, vfloat32m1_t vd,
                                vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                size_t vl);
vfloat32m1_t __riscv_vfwmul_tum(vbool32_t vm, vfloat32m1_t vd,
                                vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat32m2_t __riscv_vfwmul_tum(vbool16_t vm, vfloat32m2_t vd, vfloat16m1_t vs2,
                                vfloat16m1_t vs1, size_t vl);
vfloat32m2_t __riscv_vfwmul_tum(vbool16_t vm, vfloat32m2_t vd, vfloat16m1_t vs2,
                                _Float16 rs1, size_t vl);
vfloat32m4_t __riscv_vfwmul_tum(vbool8_t vm, vfloat32m4_t vd, vfloat16m2_t vs2,
                                vfloat16m2_t vs1, size_t vl);
vfloat32m4_t __riscv_vfwmul_tum(vbool8_t vm, vfloat32m4_t vd, vfloat16m2_t vs2,
                                _Float16 rs1, size_t vl);
vfloat32m8_t __riscv_vfwmul_tum(vbool4_t vm, vfloat32m8_t vd, vfloat16m4_t vs2,
                                vfloat16m4_t vs1, size_t vl);
vfloat32m8_t __riscv_vfwmul_tum(vbool4_t vm, vfloat32m8_t vd, vfloat16m4_t vs2,
                                _Float16 rs1, size_t vl);
vfloat64m1_t __riscv_vfwmul_tum(vbool64_t vm, vfloat64m1_t vd,
                                vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                size_t vl);
vfloat64m1_t __riscv_vfwmul_tum(vbool64_t vm, vfloat64m1_t vd,
                                vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat64m2_t __riscv_vfwmul_tum(vbool32_t vm, vfloat64m2_t vd, vfloat32m1_t vs2,
                                vfloat32m1_t vs1, size_t vl);
vfloat64m2_t __riscv_vfwmul_tum(vbool32_t vm, vfloat64m2_t vd, vfloat32m1_t vs2,
                                float rs1, size_t vl);
vfloat64m4_t __riscv_vfwmul_tum(vbool16_t vm, vfloat64m4_t vd, vfloat32m2_t vs2,
                                vfloat32m2_t vs1, size_t vl);
vfloat64m4_t __riscv_vfwmul_tum(vbool16_t vm, vfloat64m4_t vd, vfloat32m2_t vs2,
                                float rs1, size_t vl);
vfloat64m8_t __riscv_vfwmul_tum(vbool8_t vm, vfloat64m8_t vd, vfloat32m4_t vs2,
                                vfloat32m4_t vs1, size_t vl);
vfloat64m8_t __riscv_vfwmul_tum(vbool8_t vm, vfloat64m8_t vd, vfloat32m4_t vs2,
                                float rs1, size_t vl);
// masked functions
// __riscv_vfwmul_tumu overloads. Each takes the mask `vm` first; `vd` and the
// return value share one vector type whose element width is twice that of
// the sources (float16 -> float32, float32 -> float64). The second source is
// either a vector `vs1` (same type as `vs2`) or a scalar `rs1` of the source
// element type; `vl` is the last parameter. No `frm` argument is taken.
// NOTE(review): the `_tumu` suffix presumably names the tail/mask policy --
// confirm against the RVV intrinsics specification.
vfloat32mf2_t __riscv_vfwmul_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                  size_t vl);
vfloat32mf2_t __riscv_vfwmul_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat32m1_t __riscv_vfwmul_tumu(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                 size_t vl);
vfloat32m1_t __riscv_vfwmul_tumu(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat32m2_t __riscv_vfwmul_tumu(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat16m1_t vs2, vfloat16m1_t vs1, size_t vl);
vfloat32m2_t __riscv_vfwmul_tumu(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat16m1_t vs2, _Float16 rs1, size_t vl);
vfloat32m4_t __riscv_vfwmul_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat16m2_t vs2,
                                 vfloat16m2_t vs1, size_t vl);
vfloat32m4_t __riscv_vfwmul_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat16m2_t vs2,
                                 _Float16 rs1, size_t vl);
vfloat32m8_t __riscv_vfwmul_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat16m4_t vs2,
                                 vfloat16m4_t vs1, size_t vl);
vfloat32m8_t __riscv_vfwmul_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat16m4_t vs2,
                                 _Float16 rs1, size_t vl);
vfloat64m1_t __riscv_vfwmul_tumu(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                 size_t vl);
vfloat64m1_t __riscv_vfwmul_tumu(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat64m2_t __riscv_vfwmul_tumu(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat32m1_t vs2, vfloat32m1_t vs1, size_t vl);
vfloat64m2_t __riscv_vfwmul_tumu(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat32m1_t vs2, float rs1, size_t vl);
vfloat64m4_t __riscv_vfwmul_tumu(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat32m2_t vs2, vfloat32m2_t vs1, size_t vl);
vfloat64m4_t __riscv_vfwmul_tumu(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat32m2_t vs2, float rs1, size_t vl);
vfloat64m8_t __riscv_vfwmul_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat32m4_t vs2,
                                 vfloat32m4_t vs1, size_t vl);
vfloat64m8_t __riscv_vfwmul_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat32m4_t vs2,
                                 float rs1, size_t vl);
// masked functions: _mu overloads (take a mask operand vm; no frm argument)
vfloat32mf2_t __riscv_vfwmul_mu(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                size_t vl);
vfloat32mf2_t __riscv_vfwmul_mu(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat32m1_t __riscv_vfwmul_mu(vbool32_t vm, vfloat32m1_t vd, vfloat16mf2_t vs2,
                               vfloat16mf2_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwmul_mu(vbool32_t vm, vfloat32m1_t vd, vfloat16mf2_t vs2,
                               _Float16 rs1, size_t vl);
vfloat32m2_t __riscv_vfwmul_mu(vbool16_t vm, vfloat32m2_t vd, vfloat16m1_t vs2,
                               vfloat16m1_t vs1, size_t vl);
vfloat32m2_t __riscv_vfwmul_mu(vbool16_t vm, vfloat32m2_t vd, vfloat16m1_t vs2,
                               _Float16 rs1, size_t vl);
vfloat32m4_t __riscv_vfwmul_mu(vbool8_t vm, vfloat32m4_t vd, vfloat16m2_t vs2,
                               vfloat16m2_t vs1, size_t vl);
vfloat32m4_t __riscv_vfwmul_mu(vbool8_t vm, vfloat32m4_t vd, vfloat16m2_t vs2,
                               _Float16 rs1, size_t vl);
vfloat32m8_t __riscv_vfwmul_mu(vbool4_t vm, vfloat32m8_t vd, vfloat16m4_t vs2,
                               vfloat16m4_t vs1, size_t vl);
vfloat32m8_t __riscv_vfwmul_mu(vbool4_t vm, vfloat32m8_t vd, vfloat16m4_t vs2,
                               _Float16 rs1, size_t vl);
vfloat64m1_t __riscv_vfwmul_mu(vbool64_t vm, vfloat64m1_t vd, vfloat32mf2_t vs2,
                               vfloat32mf2_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwmul_mu(vbool64_t vm, vfloat64m1_t vd, vfloat32mf2_t vs2,
                               float rs1, size_t vl);
vfloat64m2_t __riscv_vfwmul_mu(vbool32_t vm, vfloat64m2_t vd, vfloat32m1_t vs2,
                               vfloat32m1_t vs1, size_t vl);
vfloat64m2_t __riscv_vfwmul_mu(vbool32_t vm, vfloat64m2_t vd, vfloat32m1_t vs2,
                               float rs1, size_t vl);
vfloat64m4_t __riscv_vfwmul_mu(vbool16_t vm, vfloat64m4_t vd, vfloat32m2_t vs2,
                               vfloat32m2_t vs1, size_t vl);
vfloat64m4_t __riscv_vfwmul_mu(vbool16_t vm, vfloat64m4_t vd, vfloat32m2_t vs2,
                               float rs1, size_t vl);
vfloat64m8_t __riscv_vfwmul_mu(vbool8_t vm, vfloat64m8_t vd, vfloat32m4_t vs2,
                               vfloat32m4_t vs1, size_t vl);
vfloat64m8_t __riscv_vfwmul_mu(vbool8_t vm, vfloat64m8_t vd, vfloat32m4_t vs2,
                               float rs1, size_t vl);
vfloat32mf2_t __riscv_vfwmul_tu(vfloat32mf2_t vd, vfloat16mf4_t vs2,
                                vfloat16mf4_t vs1, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwmul_tu(vfloat32mf2_t vd, vfloat16mf4_t vs2,
                                _Float16 rs1, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmul_tu(vfloat32m1_t vd, vfloat16mf2_t vs2,
                               vfloat16mf2_t vs1, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmul_tu(vfloat32m1_t vd, vfloat16mf2_t vs2, _Float16 rs1,
                               unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmul_tu(vfloat32m2_t vd, vfloat16m1_t vs2,
                               vfloat16m1_t vs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmul_tu(vfloat32m2_t vd, vfloat16m1_t vs2, _Float16 rs1,
                               unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmul_tu(vfloat32m4_t vd, vfloat16m2_t vs2,
                               vfloat16m2_t vs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmul_tu(vfloat32m4_t vd, vfloat16m2_t vs2, _Float16 rs1,
                               unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmul_tu(vfloat32m8_t vd, vfloat16m4_t vs2,
                               vfloat16m4_t vs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmul_tu(vfloat32m8_t vd, vfloat16m4_t vs2, _Float16 rs1,
                               unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmul_tu(vfloat64m1_t vd, vfloat32mf2_t vs2,
                               vfloat32mf2_t vs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmul_tu(vfloat64m1_t vd, vfloat32mf2_t vs2, float rs1,
                               unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmul_tu(vfloat64m2_t vd, vfloat32m1_t vs2,
                               vfloat32m1_t vs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmul_tu(vfloat64m2_t vd, vfloat32m1_t vs2, float rs1,
                               unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmul_tu(vfloat64m4_t vd, vfloat32m2_t vs2,
                               vfloat32m2_t vs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmul_tu(vfloat64m4_t vd, vfloat32m2_t vs2, float rs1,
                               unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmul_tu(vfloat64m8_t vd, vfloat32m4_t vs2,
                               vfloat32m4_t vs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmul_tu(vfloat64m8_t vd, vfloat32m4_t vs2, float rs1,
                               unsigned int frm, size_t vl);
// masked functions: _tum overloads with an explicit frm argument
vfloat32mf2_t __riscv_vfwmul_tum(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                 unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwmul_tum(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat16mf4_t vs2, _Float16 rs1,
                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmul_tum(vbool32_t vm, vfloat32m1_t vd,
                                vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmul_tum(vbool32_t vm, vfloat32m1_t vd,
                                vfloat16mf2_t vs2, _Float16 rs1,
                                unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmul_tum(vbool16_t vm, vfloat32m2_t vd, vfloat16m1_t vs2,
                                vfloat16m1_t vs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmul_tum(vbool16_t vm, vfloat32m2_t vd, vfloat16m1_t vs2,
                                _Float16 rs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmul_tum(vbool8_t vm, vfloat32m4_t vd, vfloat16m2_t vs2,
                                vfloat16m2_t vs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmul_tum(vbool8_t vm, vfloat32m4_t vd, vfloat16m2_t vs2,
                                _Float16 rs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmul_tum(vbool4_t vm, vfloat32m8_t vd, vfloat16m4_t vs2,
                                vfloat16m4_t vs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmul_tum(vbool4_t vm, vfloat32m8_t vd, vfloat16m4_t vs2,
                                _Float16 rs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmul_tum(vbool64_t vm, vfloat64m1_t vd,
                                vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmul_tum(vbool64_t vm, vfloat64m1_t vd,
                                vfloat32mf2_t vs2, float rs1, unsigned int frm,
                                size_t vl);
vfloat64m2_t __riscv_vfwmul_tum(vbool32_t vm, vfloat64m2_t vd, vfloat32m1_t vs2,
                                vfloat32m1_t vs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmul_tum(vbool32_t vm, vfloat64m2_t vd, vfloat32m1_t vs2,
                                float rs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmul_tum(vbool16_t vm, vfloat64m4_t vd, vfloat32m2_t vs2,
                                vfloat32m2_t vs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmul_tum(vbool16_t vm, vfloat64m4_t vd, vfloat32m2_t vs2,
                                float rs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmul_tum(vbool8_t vm, vfloat64m8_t vd, vfloat32m4_t vs2,
                                vfloat32m4_t vs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmul_tum(vbool8_t vm, vfloat64m8_t vd, vfloat32m4_t vs2,
                                float rs1, unsigned int frm, size_t vl);
// masked functions: _tumu overloads with an explicit frm argument
vfloat32mf2_t __riscv_vfwmul_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                  unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwmul_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat16mf4_t vs2, _Float16 rs1,
                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmul_tumu(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmul_tumu(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat16mf2_t vs2, _Float16 rs1,
                                 unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmul_tumu(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat16m1_t vs2, vfloat16m1_t vs1,
                                 unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmul_tumu(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat16m1_t vs2, _Float16 rs1,
                                 unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmul_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat16m2_t vs2,
                                 vfloat16m2_t vs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmul_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat16m2_t vs2,
                                 _Float16 rs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmul_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat16m4_t vs2,
                                 vfloat16m4_t vs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmul_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat16m4_t vs2,
                                 _Float16 rs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmul_tumu(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                 unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmul_tumu(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat32mf2_t vs2, float rs1, unsigned int frm,
                                 size_t vl);
vfloat64m2_t __riscv_vfwmul_tumu(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat32m1_t vs2, vfloat32m1_t vs1,
                                 unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmul_tumu(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat32m1_t vs2, float rs1, unsigned int frm,
                                 size_t vl);
vfloat64m4_t __riscv_vfwmul_tumu(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat32m2_t vs2, vfloat32m2_t vs1,
                                 unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmul_tumu(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat32m2_t vs2, float rs1, unsigned int frm,
                                 size_t vl);
vfloat64m8_t __riscv_vfwmul_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat32m4_t vs2,
                                 vfloat32m4_t vs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmul_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat32m4_t vs2,
                                 float rs1, unsigned int frm, size_t vl);
// masked functions: _mu overloads with an explicit frm argument
vfloat32mf2_t __riscv_vfwmul_mu(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwmul_mu(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat16mf4_t vs2, _Float16 rs1,
                                unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmul_mu(vbool32_t vm, vfloat32m1_t vd, vfloat16mf2_t vs2,
                               vfloat16mf2_t vs1, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmul_mu(vbool32_t vm, vfloat32m1_t vd, vfloat16mf2_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmul_mu(vbool16_t vm, vfloat32m2_t vd, vfloat16m1_t vs2,
                               vfloat16m1_t vs1, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmul_mu(vbool16_t vm, vfloat32m2_t vd, vfloat16m1_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmul_mu(vbool8_t vm, vfloat32m4_t vd, vfloat16m2_t vs2,
                               vfloat16m2_t vs1, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmul_mu(vbool8_t vm, vfloat32m4_t vd, vfloat16m2_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmul_mu(vbool4_t vm, vfloat32m8_t vd, vfloat16m4_t vs2,
                               vfloat16m4_t vs1, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmul_mu(vbool4_t vm, vfloat32m8_t vd, vfloat16m4_t vs2,
                               _Float16 rs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmul_mu(vbool64_t vm, vfloat64m1_t vd, vfloat32mf2_t vs2,
                               vfloat32mf2_t vs1, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmul_mu(vbool64_t vm, vfloat64m1_t vd, vfloat32mf2_t vs2,
                               float rs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmul_mu(vbool32_t vm, vfloat64m2_t vd, vfloat32m1_t vs2,
                               vfloat32m1_t vs1, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmul_mu(vbool32_t vm, vfloat64m2_t vd, vfloat32m1_t vs2,
                               float rs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmul_mu(vbool16_t vm, vfloat64m4_t vd, vfloat32m2_t vs2,
                               vfloat32m2_t vs1, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmul_mu(vbool16_t vm, vfloat64m4_t vd, vfloat32m2_t vs2,
                               float rs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmul_mu(vbool8_t vm, vfloat64m8_t vd, vfloat32m4_t vs2,
                               vfloat32m4_t vs1, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmul_mu(vbool8_t vm, vfloat64m8_t vd, vfloat32m4_t vs2,
                               float rs1, unsigned int frm, size_t vl);

Vector Single-Width Floating-Point Fused Multiply-Add Intrinsics

vfloat16mf4_t __riscv_vfmacc_tu(vfloat16mf4_t vd, vfloat16mf4_t vs1,
                                vfloat16mf4_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfmacc_tu(vfloat16mf4_t vd, _Float16 rs1,
                                vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfmacc_tu(vfloat16mf2_t vd, vfloat16mf2_t vs1,
                                vfloat16mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfmacc_tu(vfloat16mf2_t vd, _Float16 rs1,
                                vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmacc_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                               vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmacc_tu(vfloat16m1_t vd, _Float16 rs1, vfloat16m1_t vs2,
                               size_t vl);
vfloat16m2_t __riscv_vfmacc_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                               vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmacc_tu(vfloat16m2_t vd, _Float16 rs1, vfloat16m2_t vs2,
                               size_t vl);
vfloat16m4_t __riscv_vfmacc_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                               vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmacc_tu(vfloat16m4_t vd, _Float16 rs1, vfloat16m4_t vs2,
                               size_t vl);
vfloat16m8_t __riscv_vfmacc_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                               vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmacc_tu(vfloat16m8_t vd, _Float16 rs1, vfloat16m8_t vs2,
                               size_t vl);
vfloat32mf2_t __riscv_vfmacc_tu(vfloat32mf2_t vd, vfloat32mf2_t vs1,
                                vfloat32mf2_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfmacc_tu(vfloat32mf2_t vd, float rs1, vfloat32mf2_t vs2,
                                size_t vl);
vfloat32m1_t __riscv_vfmacc_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                               vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmacc_tu(vfloat32m1_t vd, float rs1, vfloat32m1_t vs2,
                               size_t vl);
vfloat32m2_t __riscv_vfmacc_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                               vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmacc_tu(vfloat32m2_t vd, float rs1, vfloat32m2_t vs2,
                               size_t vl);
vfloat32m4_t __riscv_vfmacc_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                               vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmacc_tu(vfloat32m4_t vd, float rs1, vfloat32m4_t vs2,
                               size_t vl);
vfloat32m8_t __riscv_vfmacc_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                               vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmacc_tu(vfloat32m8_t vd, float rs1, vfloat32m8_t vs2,
                               size_t vl);
vfloat64m1_t __riscv_vfmacc_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                               vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmacc_tu(vfloat64m1_t vd, double rs1, vfloat64m1_t vs2,
                               size_t vl);
vfloat64m2_t __riscv_vfmacc_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                               vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmacc_tu(vfloat64m2_t vd, double rs1, vfloat64m2_t vs2,
                               size_t vl);
vfloat64m4_t __riscv_vfmacc_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                               vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmacc_tu(vfloat64m4_t vd, double rs1, vfloat64m4_t vs2,
                               size_t vl);
vfloat64m8_t __riscv_vfmacc_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                               vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmacc_tu(vfloat64m8_t vd, double rs1, vfloat64m8_t vs2,
                               size_t vl);
vfloat16mf4_t __riscv_vfnmacc_tu(vfloat16mf4_t vd, vfloat16mf4_t vs1,
                                 vfloat16mf4_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfnmacc_tu(vfloat16mf4_t vd, _Float16 rs1,
                                 vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmacc_tu(vfloat16mf2_t vd, vfloat16mf2_t vs1,
                                 vfloat16mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmacc_tu(vfloat16mf2_t vd, _Float16 rs1,
                                 vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmacc_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                                vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmacc_tu(vfloat16m1_t vd, _Float16 rs1, vfloat16m1_t vs2,
                                size_t vl);
vfloat16m2_t __riscv_vfnmacc_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                                vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfnmacc_tu(vfloat16m2_t vd, _Float16 rs1, vfloat16m2_t vs2,
                                size_t vl);
vfloat16m4_t __riscv_vfnmacc_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                                vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfnmacc_tu(vfloat16m4_t vd, _Float16 rs1, vfloat16m4_t vs2,
                                size_t vl);
vfloat16m8_t __riscv_vfnmacc_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                                vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfnmacc_tu(vfloat16m8_t vd, _Float16 rs1, vfloat16m8_t vs2,
                                size_t vl);
vfloat32mf2_t __riscv_vfnmacc_tu(vfloat32mf2_t vd, vfloat32mf2_t vs1,
                                 vfloat32mf2_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfnmacc_tu(vfloat32mf2_t vd, float rs1, vfloat32mf2_t vs2,
                                 size_t vl);
vfloat32m1_t __riscv_vfnmacc_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                                vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfnmacc_tu(vfloat32m1_t vd, float rs1, vfloat32m1_t vs2,
                                size_t vl);
vfloat32m2_t __riscv_vfnmacc_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                                vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfnmacc_tu(vfloat32m2_t vd, float rs1, vfloat32m2_t vs2,
                                size_t vl);
vfloat32m4_t __riscv_vfnmacc_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                                vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfnmacc_tu(vfloat32m4_t vd, float rs1, vfloat32m4_t vs2,
                                size_t vl);
vfloat32m8_t __riscv_vfnmacc_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                                vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfnmacc_tu(vfloat32m8_t vd, float rs1, vfloat32m8_t vs2,
                                size_t vl);
vfloat64m1_t __riscv_vfnmacc_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                                vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfnmacc_tu(vfloat64m1_t vd, double rs1, vfloat64m1_t vs2,
                                size_t vl);
vfloat64m2_t __riscv_vfnmacc_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                                vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfnmacc_tu(vfloat64m2_t vd, double rs1, vfloat64m2_t vs2,
                                size_t vl);
vfloat64m4_t __riscv_vfnmacc_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                                vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfnmacc_tu(vfloat64m4_t vd, double rs1, vfloat64m4_t vs2,
                                size_t vl);
vfloat64m8_t __riscv_vfnmacc_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                                vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfnmacc_tu(vfloat64m8_t vd, double rs1, vfloat64m8_t vs2,
                                size_t vl);
vfloat16mf4_t __riscv_vfmsac_tu(vfloat16mf4_t vd, vfloat16mf4_t vs1,
                                vfloat16mf4_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfmsac_tu(vfloat16mf4_t vd, _Float16 rs1,
                                vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfmsac_tu(vfloat16mf2_t vd, vfloat16mf2_t vs1,
                                vfloat16mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfmsac_tu(vfloat16mf2_t vd, _Float16 rs1,
                                vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmsac_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                               vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmsac_tu(vfloat16m1_t vd, _Float16 rs1, vfloat16m1_t vs2,
                               size_t vl);
vfloat16m2_t __riscv_vfmsac_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                               vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmsac_tu(vfloat16m2_t vd, _Float16 rs1, vfloat16m2_t vs2,
                               size_t vl);
vfloat16m4_t __riscv_vfmsac_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                               vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmsac_tu(vfloat16m4_t vd, _Float16 rs1, vfloat16m4_t vs2,
                               size_t vl);
vfloat16m8_t __riscv_vfmsac_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                               vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmsac_tu(vfloat16m8_t vd, _Float16 rs1, vfloat16m8_t vs2,
                               size_t vl);
vfloat32mf2_t __riscv_vfmsac_tu(vfloat32mf2_t vd, vfloat32mf2_t vs1,
                                vfloat32mf2_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfmsac_tu(vfloat32mf2_t vd, float rs1, vfloat32mf2_t vs2,
                                size_t vl);
vfloat32m1_t __riscv_vfmsac_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                               vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmsac_tu(vfloat32m1_t vd, float rs1, vfloat32m1_t vs2,
                               size_t vl);
vfloat32m2_t __riscv_vfmsac_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                               vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmsac_tu(vfloat32m2_t vd, float rs1, vfloat32m2_t vs2,
                               size_t vl);
vfloat32m4_t __riscv_vfmsac_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                               vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmsac_tu(vfloat32m4_t vd, float rs1, vfloat32m4_t vs2,
                               size_t vl);
vfloat32m8_t __riscv_vfmsac_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                               vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmsac_tu(vfloat32m8_t vd, float rs1, vfloat32m8_t vs2,
                               size_t vl);
vfloat64m1_t __riscv_vfmsac_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                               vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmsac_tu(vfloat64m1_t vd, double rs1, vfloat64m1_t vs2,
                               size_t vl);
vfloat64m2_t __riscv_vfmsac_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                               vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmsac_tu(vfloat64m2_t vd, double rs1, vfloat64m2_t vs2,
                               size_t vl);
vfloat64m4_t __riscv_vfmsac_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                               vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmsac_tu(vfloat64m4_t vd, double rs1, vfloat64m4_t vs2,
                               size_t vl);
vfloat64m8_t __riscv_vfmsac_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                               vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmsac_tu(vfloat64m8_t vd, double rs1, vfloat64m8_t vs2,
                               size_t vl);
vfloat16mf4_t __riscv_vfnmsac_tu(vfloat16mf4_t vd, vfloat16mf4_t vs1,
                                 vfloat16mf4_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfnmsac_tu(vfloat16mf4_t vd, _Float16 rs1,
                                 vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmsac_tu(vfloat16mf2_t vd, vfloat16mf2_t vs1,
                                 vfloat16mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmsac_tu(vfloat16mf2_t vd, _Float16 rs1,
                                 vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmsac_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                                vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmsac_tu(vfloat16m1_t vd, _Float16 rs1, vfloat16m1_t vs2,
                                size_t vl);
vfloat16m2_t __riscv_vfnmsac_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                                vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfnmsac_tu(vfloat16m2_t vd, _Float16 rs1, vfloat16m2_t vs2,
                                size_t vl);
vfloat16m4_t __riscv_vfnmsac_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                                vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfnmsac_tu(vfloat16m4_t vd, _Float16 rs1, vfloat16m4_t vs2,
                                size_t vl);
vfloat16m8_t __riscv_vfnmsac_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                                vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfnmsac_tu(vfloat16m8_t vd, _Float16 rs1, vfloat16m8_t vs2,
                                size_t vl);
vfloat32mf2_t __riscv_vfnmsac_tu(vfloat32mf2_t vd, vfloat32mf2_t vs1,
                                 vfloat32mf2_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfnmsac_tu(vfloat32mf2_t vd, float rs1, vfloat32mf2_t vs2,
                                 size_t vl);
vfloat32m1_t __riscv_vfnmsac_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                                vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfnmsac_tu(vfloat32m1_t vd, float rs1, vfloat32m1_t vs2,
                                size_t vl);
vfloat32m2_t __riscv_vfnmsac_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                                vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfnmsac_tu(vfloat32m2_t vd, float rs1, vfloat32m2_t vs2,
                                size_t vl);
vfloat32m4_t __riscv_vfnmsac_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                                vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfnmsac_tu(vfloat32m4_t vd, float rs1, vfloat32m4_t vs2,
                                size_t vl);
vfloat32m8_t __riscv_vfnmsac_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                                vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfnmsac_tu(vfloat32m8_t vd, float rs1, vfloat32m8_t vs2,
                                size_t vl);
vfloat64m1_t __riscv_vfnmsac_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                                vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfnmsac_tu(vfloat64m1_t vd, double rs1, vfloat64m1_t vs2,
                                size_t vl);
vfloat64m2_t __riscv_vfnmsac_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                                vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfnmsac_tu(vfloat64m2_t vd, double rs1, vfloat64m2_t vs2,
                                size_t vl);
vfloat64m4_t __riscv_vfnmsac_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                                vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfnmsac_tu(vfloat64m4_t vd, double rs1, vfloat64m4_t vs2,
                                size_t vl);
vfloat64m8_t __riscv_vfnmsac_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                                vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfnmsac_tu(vfloat64m8_t vd, double rs1, vfloat64m8_t vs2,
                                size_t vl);
vfloat16mf4_t __riscv_vfmadd_tu(vfloat16mf4_t vd, vfloat16mf4_t vs1,
                                vfloat16mf4_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfmadd_tu(vfloat16mf4_t vd, _Float16 rs1,
                                vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfmadd_tu(vfloat16mf2_t vd, vfloat16mf2_t vs1,
                                vfloat16mf2_t vs2, size_t vl);
// __riscv_vfmadd_tu overloads (continued). Each vector type is listed twice:
// a vector-vector form taking `vs1` and a vector-scalar form taking `rs1`
// (_Float16, float or double, matching the element width). The return type is
// always the type of `vd`; `vl` is passed as size_t.
// NOTE(review): per the RVV spec vfmadd presumably computes
// vd = (vd * vs1|rs1) + vs2, and `_tu` presumably selects the
// tail-undisturbed policy -- confirm against the spec.
vfloat16mf2_t __riscv_vfmadd_tu(vfloat16mf2_t vd, _Float16 rs1,
                                vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmadd_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                               vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmadd_tu(vfloat16m1_t vd, _Float16 rs1, vfloat16m1_t vs2,
                               size_t vl);
vfloat16m2_t __riscv_vfmadd_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                               vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmadd_tu(vfloat16m2_t vd, _Float16 rs1, vfloat16m2_t vs2,
                               size_t vl);
vfloat16m4_t __riscv_vfmadd_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                               vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmadd_tu(vfloat16m4_t vd, _Float16 rs1, vfloat16m4_t vs2,
                               size_t vl);
vfloat16m8_t __riscv_vfmadd_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                               vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmadd_tu(vfloat16m8_t vd, _Float16 rs1, vfloat16m8_t vs2,
                               size_t vl);
vfloat32mf2_t __riscv_vfmadd_tu(vfloat32mf2_t vd, vfloat32mf2_t vs1,
                                vfloat32mf2_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfmadd_tu(vfloat32mf2_t vd, float rs1, vfloat32mf2_t vs2,
                                size_t vl);
vfloat32m1_t __riscv_vfmadd_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                               vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmadd_tu(vfloat32m1_t vd, float rs1, vfloat32m1_t vs2,
                               size_t vl);
vfloat32m2_t __riscv_vfmadd_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                               vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmadd_tu(vfloat32m2_t vd, float rs1, vfloat32m2_t vs2,
                               size_t vl);
vfloat32m4_t __riscv_vfmadd_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                               vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmadd_tu(vfloat32m4_t vd, float rs1, vfloat32m4_t vs2,
                               size_t vl);
vfloat32m8_t __riscv_vfmadd_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                               vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmadd_tu(vfloat32m8_t vd, float rs1, vfloat32m8_t vs2,
                               size_t vl);
vfloat64m1_t __riscv_vfmadd_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                               vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmadd_tu(vfloat64m1_t vd, double rs1, vfloat64m1_t vs2,
                               size_t vl);
vfloat64m2_t __riscv_vfmadd_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                               vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmadd_tu(vfloat64m2_t vd, double rs1, vfloat64m2_t vs2,
                               size_t vl);
vfloat64m4_t __riscv_vfmadd_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                               vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmadd_tu(vfloat64m4_t vd, double rs1, vfloat64m4_t vs2,
                               size_t vl);
vfloat64m8_t __riscv_vfmadd_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                               vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmadd_tu(vfloat64m8_t vd, double rs1, vfloat64m8_t vs2,
                               size_t vl);
// __riscv_vfnmadd_tu overloads for the float16/float32/float64 vector types
// listed below. Each vector type has a vector-vector form (`vs1`) and a
// vector-scalar form (`rs1`); the return type is always the type of `vd`.
// NOTE(review): per the RVV spec vfnmadd presumably computes
// vd = -(vd * vs1|rs1) - vs2, and `_tu` presumably selects the
// tail-undisturbed policy -- confirm against the spec.
vfloat16mf4_t __riscv_vfnmadd_tu(vfloat16mf4_t vd, vfloat16mf4_t vs1,
                                 vfloat16mf4_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfnmadd_tu(vfloat16mf4_t vd, _Float16 rs1,
                                 vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmadd_tu(vfloat16mf2_t vd, vfloat16mf2_t vs1,
                                 vfloat16mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmadd_tu(vfloat16mf2_t vd, _Float16 rs1,
                                 vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmadd_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                                vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmadd_tu(vfloat16m1_t vd, _Float16 rs1, vfloat16m1_t vs2,
                                size_t vl);
vfloat16m2_t __riscv_vfnmadd_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                                vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfnmadd_tu(vfloat16m2_t vd, _Float16 rs1, vfloat16m2_t vs2,
                                size_t vl);
vfloat16m4_t __riscv_vfnmadd_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                                vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfnmadd_tu(vfloat16m4_t vd, _Float16 rs1, vfloat16m4_t vs2,
                                size_t vl);
vfloat16m8_t __riscv_vfnmadd_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                                vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfnmadd_tu(vfloat16m8_t vd, _Float16 rs1, vfloat16m8_t vs2,
                                size_t vl);
vfloat32mf2_t __riscv_vfnmadd_tu(vfloat32mf2_t vd, vfloat32mf2_t vs1,
                                 vfloat32mf2_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfnmadd_tu(vfloat32mf2_t vd, float rs1, vfloat32mf2_t vs2,
                                 size_t vl);
vfloat32m1_t __riscv_vfnmadd_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                                vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfnmadd_tu(vfloat32m1_t vd, float rs1, vfloat32m1_t vs2,
                                size_t vl);
vfloat32m2_t __riscv_vfnmadd_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                                vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfnmadd_tu(vfloat32m2_t vd, float rs1, vfloat32m2_t vs2,
                                size_t vl);
vfloat32m4_t __riscv_vfnmadd_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                                vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfnmadd_tu(vfloat32m4_t vd, float rs1, vfloat32m4_t vs2,
                                size_t vl);
vfloat32m8_t __riscv_vfnmadd_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                                vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfnmadd_tu(vfloat32m8_t vd, float rs1, vfloat32m8_t vs2,
                                size_t vl);
vfloat64m1_t __riscv_vfnmadd_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                                vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfnmadd_tu(vfloat64m1_t vd, double rs1, vfloat64m1_t vs2,
                                size_t vl);
vfloat64m2_t __riscv_vfnmadd_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                                vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfnmadd_tu(vfloat64m2_t vd, double rs1, vfloat64m2_t vs2,
                                size_t vl);
vfloat64m4_t __riscv_vfnmadd_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                                vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfnmadd_tu(vfloat64m4_t vd, double rs1, vfloat64m4_t vs2,
                                size_t vl);
vfloat64m8_t __riscv_vfnmadd_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                                vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfnmadd_tu(vfloat64m8_t vd, double rs1, vfloat64m8_t vs2,
                                size_t vl);
// __riscv_vfmsub_tu overloads for the float16/float32/float64 vector types
// listed below. Each vector type has a vector-vector form (`vs1`) and a
// vector-scalar form (`rs1`); the return type is always the type of `vd`.
// NOTE(review): per the RVV spec vfmsub presumably computes
// vd = (vd * vs1|rs1) - vs2, and `_tu` presumably selects the
// tail-undisturbed policy -- confirm against the spec.
vfloat16mf4_t __riscv_vfmsub_tu(vfloat16mf4_t vd, vfloat16mf4_t vs1,
                                vfloat16mf4_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfmsub_tu(vfloat16mf4_t vd, _Float16 rs1,
                                vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfmsub_tu(vfloat16mf2_t vd, vfloat16mf2_t vs1,
                                vfloat16mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfmsub_tu(vfloat16mf2_t vd, _Float16 rs1,
                                vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmsub_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                               vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmsub_tu(vfloat16m1_t vd, _Float16 rs1, vfloat16m1_t vs2,
                               size_t vl);
vfloat16m2_t __riscv_vfmsub_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                               vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmsub_tu(vfloat16m2_t vd, _Float16 rs1, vfloat16m2_t vs2,
                               size_t vl);
vfloat16m4_t __riscv_vfmsub_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                               vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmsub_tu(vfloat16m4_t vd, _Float16 rs1, vfloat16m4_t vs2,
                               size_t vl);
vfloat16m8_t __riscv_vfmsub_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                               vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmsub_tu(vfloat16m8_t vd, _Float16 rs1, vfloat16m8_t vs2,
                               size_t vl);
vfloat32mf2_t __riscv_vfmsub_tu(vfloat32mf2_t vd, vfloat32mf2_t vs1,
                                vfloat32mf2_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfmsub_tu(vfloat32mf2_t vd, float rs1, vfloat32mf2_t vs2,
                                size_t vl);
vfloat32m1_t __riscv_vfmsub_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                               vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmsub_tu(vfloat32m1_t vd, float rs1, vfloat32m1_t vs2,
                               size_t vl);
vfloat32m2_t __riscv_vfmsub_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                               vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmsub_tu(vfloat32m2_t vd, float rs1, vfloat32m2_t vs2,
                               size_t vl);
vfloat32m4_t __riscv_vfmsub_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                               vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmsub_tu(vfloat32m4_t vd, float rs1, vfloat32m4_t vs2,
                               size_t vl);
vfloat32m8_t __riscv_vfmsub_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                               vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmsub_tu(vfloat32m8_t vd, float rs1, vfloat32m8_t vs2,
                               size_t vl);
vfloat64m1_t __riscv_vfmsub_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                               vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmsub_tu(vfloat64m1_t vd, double rs1, vfloat64m1_t vs2,
                               size_t vl);
vfloat64m2_t __riscv_vfmsub_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                               vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmsub_tu(vfloat64m2_t vd, double rs1, vfloat64m2_t vs2,
                               size_t vl);
vfloat64m4_t __riscv_vfmsub_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                               vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmsub_tu(vfloat64m4_t vd, double rs1, vfloat64m4_t vs2,
                               size_t vl);
vfloat64m8_t __riscv_vfmsub_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                               vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmsub_tu(vfloat64m8_t vd, double rs1, vfloat64m8_t vs2,
                               size_t vl);
// __riscv_vfnmsub_tu overloads for the float16/float32/float64 vector types
// listed below. Each vector type has a vector-vector form (`vs1`) and a
// vector-scalar form (`rs1`); the return type is always the type of `vd`.
// NOTE(review): per the RVV spec vfnmsub presumably computes
// vd = -(vd * vs1|rs1) + vs2, and `_tu` presumably selects the
// tail-undisturbed policy -- confirm against the spec.
vfloat16mf4_t __riscv_vfnmsub_tu(vfloat16mf4_t vd, vfloat16mf4_t vs1,
                                 vfloat16mf4_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfnmsub_tu(vfloat16mf4_t vd, _Float16 rs1,
                                 vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmsub_tu(vfloat16mf2_t vd, vfloat16mf2_t vs1,
                                 vfloat16mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmsub_tu(vfloat16mf2_t vd, _Float16 rs1,
                                 vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmsub_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                                vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmsub_tu(vfloat16m1_t vd, _Float16 rs1, vfloat16m1_t vs2,
                                size_t vl);
vfloat16m2_t __riscv_vfnmsub_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                                vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfnmsub_tu(vfloat16m2_t vd, _Float16 rs1, vfloat16m2_t vs2,
                                size_t vl);
vfloat16m4_t __riscv_vfnmsub_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                                vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfnmsub_tu(vfloat16m4_t vd, _Float16 rs1, vfloat16m4_t vs2,
                                size_t vl);
vfloat16m8_t __riscv_vfnmsub_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                                vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfnmsub_tu(vfloat16m8_t vd, _Float16 rs1, vfloat16m8_t vs2,
                                size_t vl);
vfloat32mf2_t __riscv_vfnmsub_tu(vfloat32mf2_t vd, vfloat32mf2_t vs1,
                                 vfloat32mf2_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfnmsub_tu(vfloat32mf2_t vd, float rs1, vfloat32mf2_t vs2,
                                 size_t vl);
vfloat32m1_t __riscv_vfnmsub_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                                vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfnmsub_tu(vfloat32m1_t vd, float rs1, vfloat32m1_t vs2,
                                size_t vl);
vfloat32m2_t __riscv_vfnmsub_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                                vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfnmsub_tu(vfloat32m2_t vd, float rs1, vfloat32m2_t vs2,
                                size_t vl);
vfloat32m4_t __riscv_vfnmsub_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                                vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfnmsub_tu(vfloat32m4_t vd, float rs1, vfloat32m4_t vs2,
                                size_t vl);
vfloat32m8_t __riscv_vfnmsub_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                                vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfnmsub_tu(vfloat32m8_t vd, float rs1, vfloat32m8_t vs2,
                                size_t vl);
vfloat64m1_t __riscv_vfnmsub_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                                vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfnmsub_tu(vfloat64m1_t vd, double rs1, vfloat64m1_t vs2,
                                size_t vl);
vfloat64m2_t __riscv_vfnmsub_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                                vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfnmsub_tu(vfloat64m2_t vd, double rs1, vfloat64m2_t vs2,
                                size_t vl);
vfloat64m4_t __riscv_vfnmsub_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                                vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfnmsub_tu(vfloat64m4_t vd, double rs1, vfloat64m4_t vs2,
                                size_t vl);
vfloat64m8_t __riscv_vfnmsub_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                                vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfnmsub_tu(vfloat64m8_t vd, double rs1, vfloat64m8_t vs2,
                                size_t vl);
// masked functions
// __riscv_vfmacc_tum overloads: masked forms taking a leading `vm` mask
// argument (vbool2_t .. vbool64_t, paired with the data type as listed),
// followed by `vd`, a vector (`vs1`) or scalar (`rs1`) operand, `vs2` and
// `vl`. The return type is always the type of `vd`.
// NOTE(review): per the RVV spec vfmacc presumably computes
// vd = (vs1|rs1 * vs2) + vd, and `_tum` presumably selects the
// tail-undisturbed, mask-agnostic policy -- confirm against the spec.
vfloat16mf4_t __riscv_vfmacc_tum(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                 size_t vl);
vfloat16mf4_t __riscv_vfmacc_tum(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                 vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfmacc_tum(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                 size_t vl);
vfloat16mf2_t __riscv_vfmacc_tum(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                 vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmacc_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs1,
                                vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmacc_tum(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmacc_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                                vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmacc_tum(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmacc_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                                vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmacc_tum(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmacc_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                                vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmacc_tum(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfmacc_tum(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                 size_t vl);
vfloat32mf2_t __riscv_vfmacc_tum(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                 vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmacc_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs1,
                                vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmacc_tum(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmacc_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs1,
                                vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmacc_tum(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmacc_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                                vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmacc_tum(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmacc_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                                vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmacc_tum(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmacc_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs1,
                                vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmacc_tum(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmacc_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs1,
                                vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmacc_tum(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmacc_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs1,
                                vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmacc_tum(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmacc_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                                vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmacc_tum(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                vfloat64m8_t vs2, size_t vl);
// __riscv_vfnmacc_tum overloads: masked forms taking a leading `vm` mask
// argument (vbool2_t .. vbool64_t, paired with the data type as listed),
// followed by `vd`, a vector (`vs1`) or scalar (`rs1`) operand, `vs2` and
// `vl`. The return type is always the type of `vd`.
// NOTE(review): per the RVV spec vfnmacc presumably computes
// vd = -(vs1|rs1 * vs2) - vd, and `_tum` presumably selects the
// tail-undisturbed, mask-agnostic policy -- confirm against the spec.
vfloat16mf4_t __riscv_vfnmacc_tum(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                  size_t vl);
vfloat16mf4_t __riscv_vfnmacc_tum(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                  vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmacc_tum(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                  size_t vl);
vfloat16mf2_t __riscv_vfnmacc_tum(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                  vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmacc_tum(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat16m1_t vs1, vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmacc_tum(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                 vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfnmacc_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                                 vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfnmacc_tum(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                 vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfnmacc_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                                 vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfnmacc_tum(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                 vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfnmacc_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                                 vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfnmacc_tum(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                 vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfnmacc_tum(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                  size_t vl);
vfloat32mf2_t __riscv_vfnmacc_tum(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                  vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfnmacc_tum(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat32m1_t vs1, vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfnmacc_tum(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                 vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfnmacc_tum(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat32m2_t vs1, vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfnmacc_tum(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                 vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfnmacc_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                                 vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfnmacc_tum(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                 vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfnmacc_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                                 vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfnmacc_tum(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                 vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfnmacc_tum(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat64m1_t vs1, vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfnmacc_tum(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                 vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfnmacc_tum(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat64m2_t vs1, vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfnmacc_tum(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                 vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfnmacc_tum(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat64m4_t vs1, vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfnmacc_tum(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                 vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfnmacc_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                                 vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfnmacc_tum(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                 vfloat64m8_t vs2, size_t vl);
// __riscv_vfmsac_tum overloads: masked forms taking a leading `vm` mask
// argument (vbool2_t .. vbool64_t, paired with the data type as listed),
// followed by `vd`, a vector (`vs1`) or scalar (`rs1`) operand, `vs2` and
// `vl`. The return type is always the type of `vd`.
// NOTE(review): per the RVV spec vfmsac presumably computes
// vd = (vs1|rs1 * vs2) - vd, and `_tum` presumably selects the
// tail-undisturbed, mask-agnostic policy -- confirm against the spec.
vfloat16mf4_t __riscv_vfmsac_tum(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                 size_t vl);
vfloat16mf4_t __riscv_vfmsac_tum(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                 vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfmsac_tum(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                 size_t vl);
vfloat16mf2_t __riscv_vfmsac_tum(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                 vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmsac_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs1,
                                vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmsac_tum(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmsac_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                                vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmsac_tum(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmsac_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                                vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmsac_tum(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmsac_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                                vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmsac_tum(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfmsac_tum(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                 size_t vl);
vfloat32mf2_t __riscv_vfmsac_tum(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                 vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmsac_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs1,
                                vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmsac_tum(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmsac_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs1,
                                vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmsac_tum(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmsac_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                                vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmsac_tum(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmsac_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                                vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmsac_tum(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmsac_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs1,
                                vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmsac_tum(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmsac_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs1,
                                vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmsac_tum(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmsac_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs1,
                                vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmsac_tum(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmsac_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                                vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmsac_tum(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                vfloat64m8_t vs2, size_t vl);
// __riscv_vfnmsac_tum overloads: masked forms taking a leading `vm` mask
// argument (vbool2_t .. vbool64_t, paired with the data type as listed),
// followed by `vd`, a vector (`vs1`) or scalar (`rs1`) operand, `vs2` and
// `vl`. The return type is always the type of `vd`.
// NOTE(review): per the RVV spec vfnmsac presumably computes
// vd = -(vs1|rs1 * vs2) + vd, and `_tum` presumably selects the
// tail-undisturbed, mask-agnostic policy -- confirm against the spec.
vfloat16mf4_t __riscv_vfnmsac_tum(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                  size_t vl);
vfloat16mf4_t __riscv_vfnmsac_tum(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                  vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmsac_tum(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                  size_t vl);
vfloat16mf2_t __riscv_vfnmsac_tum(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                  vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmsac_tum(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat16m1_t vs1, vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmsac_tum(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                 vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfnmsac_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                                 vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfnmsac_tum(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                 vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfnmsac_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                                 vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfnmsac_tum(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                 vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfnmsac_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                                 vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfnmsac_tum(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                 vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfnmsac_tum(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                  size_t vl);
vfloat32mf2_t __riscv_vfnmsac_tum(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                  vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfnmsac_tum(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat32m1_t vs1, vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfnmsac_tum(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                 vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfnmsac_tum(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat32m2_t vs1, vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfnmsac_tum(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                 vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfnmsac_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                                 vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfnmsac_tum(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                 vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfnmsac_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                                 vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfnmsac_tum(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                 vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfnmsac_tum(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat64m1_t vs1, vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfnmsac_tum(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                 vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfnmsac_tum(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat64m2_t vs1, vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfnmsac_tum(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                 vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfnmsac_tum(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat64m4_t vs1, vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfnmsac_tum(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                 vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfnmsac_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                                 vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfnmsac_tum(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                 vfloat64m8_t vs2, size_t vl);
// __riscv_vfmadd_tum overloads: masked forms taking a leading `vm` mask
// argument (vbool2_t .. vbool64_t, paired with the data type as listed),
// followed by `vd`, a vector (`vs1`) or scalar (`rs1`) operand, `vs2` and
// `vl`. The return type is always the type of `vd`.
// NOTE(review): per the RVV spec vfmadd presumably computes
// vd = (vd * vs1|rs1) + vs2, and `_tum` presumably selects the
// tail-undisturbed, mask-agnostic policy -- confirm against the spec.
vfloat16mf4_t __riscv_vfmadd_tum(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                 size_t vl);
vfloat16mf4_t __riscv_vfmadd_tum(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                 vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfmadd_tum(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                 size_t vl);
vfloat16mf2_t __riscv_vfmadd_tum(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                 vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmadd_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs1,
                                vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmadd_tum(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmadd_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                                vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmadd_tum(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmadd_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                                vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmadd_tum(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmadd_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                                vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmadd_tum(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfmadd_tum(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                 size_t vl);
vfloat32mf2_t __riscv_vfmadd_tum(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                 vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmadd_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs1,
                                vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmadd_tum(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmadd_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs1,
                                vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmadd_tum(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmadd_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                                vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmadd_tum(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmadd_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                                vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmadd_tum(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmadd_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs1,
                                vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmadd_tum(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmadd_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs1,
                                vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmadd_tum(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmadd_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs1,
                                vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmadd_tum(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmadd_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                                vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmadd_tum(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                vfloat64m8_t vs2, size_t vl);
// __riscv_vfnmadd_tum: overloaded prototypes for the `_tum` variant of vfnmadd.
// Each vector type (vfloat16/32/64 at the listed LMULs) has two overloads:
//   - vector-vector: (vm, vd, vs1, vs2, vl)
//   - vector-scalar: (vm, vd, rs1, vs2, vl), where rs1 is _Float16, float or
//     double to match the element width.
// The return type always equals the type of `vd`; the mask type `vm`
// (vboolN_t) is paired with the vector type as listed.
// NOTE(review): presumably computes vd = -(vs1 * vd) - vs2 with `vd` also
// supplying the undisturbed tail elements -- confirm against the RVV spec.
vfloat16mf4_t __riscv_vfnmadd_tum(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                  size_t vl);
vfloat16mf4_t __riscv_vfnmadd_tum(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                  vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmadd_tum(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                  size_t vl);
vfloat16mf2_t __riscv_vfnmadd_tum(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                  vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmadd_tum(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat16m1_t vs1, vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmadd_tum(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                 vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfnmadd_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                                 vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfnmadd_tum(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                 vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfnmadd_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                                 vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfnmadd_tum(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                 vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfnmadd_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                                 vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfnmadd_tum(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                 vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfnmadd_tum(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                  size_t vl);
vfloat32mf2_t __riscv_vfnmadd_tum(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                  vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfnmadd_tum(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat32m1_t vs1, vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfnmadd_tum(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                 vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfnmadd_tum(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat32m2_t vs1, vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfnmadd_tum(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                 vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfnmadd_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                                 vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfnmadd_tum(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                 vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfnmadd_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                                 vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfnmadd_tum(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                 vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfnmadd_tum(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat64m1_t vs1, vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfnmadd_tum(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                 vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfnmadd_tum(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat64m2_t vs1, vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfnmadd_tum(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                 vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfnmadd_tum(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat64m4_t vs1, vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfnmadd_tum(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                 vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfnmadd_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                                 vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfnmadd_tum(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                 vfloat64m8_t vs2, size_t vl);
// __riscv_vfmsub_tum: overloaded prototypes for the `_tum` variant of vfmsub.
// Each vector type (vfloat16/32/64 at the listed LMULs) has two overloads:
//   - vector-vector: (vm, vd, vs1, vs2, vl)
//   - vector-scalar: (vm, vd, rs1, vs2, vl), where rs1 is _Float16, float or
//     double to match the element width.
// The return type always equals the type of `vd`; the mask type `vm`
// (vboolN_t) is paired with the vector type as listed.
// NOTE(review): presumably computes vd = (vs1 * vd) - vs2 with `vd` also
// supplying the undisturbed tail elements -- confirm against the RVV spec.
vfloat16mf4_t __riscv_vfmsub_tum(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                 size_t vl);
vfloat16mf4_t __riscv_vfmsub_tum(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                 vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfmsub_tum(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                 size_t vl);
vfloat16mf2_t __riscv_vfmsub_tum(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                 vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmsub_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs1,
                                vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmsub_tum(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmsub_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                                vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmsub_tum(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmsub_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                                vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmsub_tum(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmsub_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                                vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmsub_tum(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfmsub_tum(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                 size_t vl);
vfloat32mf2_t __riscv_vfmsub_tum(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                 vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmsub_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs1,
                                vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmsub_tum(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmsub_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs1,
                                vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmsub_tum(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmsub_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                                vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmsub_tum(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmsub_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                                vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmsub_tum(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmsub_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs1,
                                vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmsub_tum(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmsub_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs1,
                                vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmsub_tum(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmsub_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs1,
                                vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmsub_tum(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmsub_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                                vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmsub_tum(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                vfloat64m8_t vs2, size_t vl);
// __riscv_vfnmsub_tum: overloaded prototypes for the `_tum` variant of vfnmsub.
// Each vector type (vfloat16/32/64 at the listed LMULs) has two overloads:
//   - vector-vector: (vm, vd, vs1, vs2, vl)
//   - vector-scalar: (vm, vd, rs1, vs2, vl), where rs1 is _Float16, float or
//     double to match the element width.
// The return type always equals the type of `vd`; the mask type `vm`
// (vboolN_t) is paired with the vector type as listed.
// NOTE(review): presumably computes vd = -(vs1 * vd) + vs2 with `vd` also
// supplying the undisturbed tail elements -- confirm against the RVV spec.
vfloat16mf4_t __riscv_vfnmsub_tum(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                  size_t vl);
vfloat16mf4_t __riscv_vfnmsub_tum(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                  vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmsub_tum(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                  size_t vl);
vfloat16mf2_t __riscv_vfnmsub_tum(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                  vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmsub_tum(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat16m1_t vs1, vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmsub_tum(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                 vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfnmsub_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                                 vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfnmsub_tum(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                 vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfnmsub_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                                 vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfnmsub_tum(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                 vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfnmsub_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                                 vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfnmsub_tum(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                 vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfnmsub_tum(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                  size_t vl);
vfloat32mf2_t __riscv_vfnmsub_tum(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                  vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfnmsub_tum(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat32m1_t vs1, vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfnmsub_tum(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                 vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfnmsub_tum(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat32m2_t vs1, vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfnmsub_tum(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                 vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfnmsub_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                                 vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfnmsub_tum(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                 vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfnmsub_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                                 vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfnmsub_tum(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                 vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfnmsub_tum(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat64m1_t vs1, vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfnmsub_tum(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                 vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfnmsub_tum(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat64m2_t vs1, vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfnmsub_tum(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                 vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfnmsub_tum(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat64m4_t vs1, vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfnmsub_tum(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                 vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfnmsub_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                                 vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfnmsub_tum(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                 vfloat64m8_t vs2, size_t vl);
// masked functions (_tumu policy variants)
// __riscv_vfmacc_tumu: overloaded prototypes for the `_tumu` variant of vfmacc.
// Each vector type (vfloat16/32/64 at the listed LMULs) has two overloads:
//   - vector-vector: (vm, vd, vs1, vs2, vl)
//   - vector-scalar: (vm, vd, rs1, vs2, vl), where rs1 is _Float16, float or
//     double to match the element width.
// The return type always equals the type of `vd`; the mask type `vm`
// (vboolN_t) is paired with the vector type as listed.
// NOTE(review): presumably computes vd = (vs1 * vs2) + vd, leaving tail and
// masked-off elements of `vd` undisturbed -- confirm against the RVV spec.
vfloat16mf4_t __riscv_vfmacc_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                  size_t vl);
vfloat16mf4_t __riscv_vfmacc_tumu(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                  vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfmacc_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                  size_t vl);
vfloat16mf2_t __riscv_vfmacc_tumu(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                  vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmacc_tumu(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat16m1_t vs1, vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmacc_tumu(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                 vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmacc_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                                 vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmacc_tumu(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                 vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmacc_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                                 vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmacc_tumu(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                 vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmacc_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                                 vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmacc_tumu(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                 vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfmacc_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                  size_t vl);
vfloat32mf2_t __riscv_vfmacc_tumu(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                  vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmacc_tumu(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat32m1_t vs1, vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmacc_tumu(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                 vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmacc_tumu(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat32m2_t vs1, vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmacc_tumu(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                 vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmacc_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                                 vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmacc_tumu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                 vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmacc_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                                 vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmacc_tumu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                 vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmacc_tumu(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat64m1_t vs1, vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmacc_tumu(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                 vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmacc_tumu(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat64m2_t vs1, vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmacc_tumu(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                 vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmacc_tumu(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat64m4_t vs1, vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmacc_tumu(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                 vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmacc_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                                 vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmacc_tumu(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                 vfloat64m8_t vs2, size_t vl);
// __riscv_vfnmacc_tumu: overloaded prototypes for the `_tumu` variant of
// vfnmacc.
// Each vector type (vfloat16/32/64 at the listed LMULs) has two overloads:
//   - vector-vector: (vm, vd, vs1, vs2, vl)
//   - vector-scalar: (vm, vd, rs1, vs2, vl), where rs1 is _Float16, float or
//     double to match the element width.
// The return type always equals the type of `vd`; the mask type `vm`
// (vboolN_t) is paired with the vector type as listed.
// NOTE(review): presumably computes vd = -(vs1 * vs2) - vd, leaving tail and
// masked-off elements of `vd` undisturbed -- confirm against the RVV spec.
vfloat16mf4_t __riscv_vfnmacc_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                   vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                   size_t vl);
vfloat16mf4_t __riscv_vfnmacc_tumu(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                   vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmacc_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                   vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                   size_t vl);
vfloat16mf2_t __riscv_vfnmacc_tumu(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                   vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmacc_tumu(vbool16_t vm, vfloat16m1_t vd,
                                  vfloat16m1_t vs1, vfloat16m1_t vs2,
                                  size_t vl);
vfloat16m1_t __riscv_vfnmacc_tumu(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                  vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfnmacc_tumu(vbool8_t vm, vfloat16m2_t vd,
                                  vfloat16m2_t vs1, vfloat16m2_t vs2,
                                  size_t vl);
vfloat16m2_t __riscv_vfnmacc_tumu(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                  vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfnmacc_tumu(vbool4_t vm, vfloat16m4_t vd,
                                  vfloat16m4_t vs1, vfloat16m4_t vs2,
                                  size_t vl);
vfloat16m4_t __riscv_vfnmacc_tumu(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                  vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfnmacc_tumu(vbool2_t vm, vfloat16m8_t vd,
                                  vfloat16m8_t vs1, vfloat16m8_t vs2,
                                  size_t vl);
vfloat16m8_t __riscv_vfnmacc_tumu(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                  vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfnmacc_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                   size_t vl);
vfloat32mf2_t __riscv_vfnmacc_tumu(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                   vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfnmacc_tumu(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat32m1_t vs1, vfloat32m1_t vs2,
                                  size_t vl);
vfloat32m1_t __riscv_vfnmacc_tumu(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                  vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfnmacc_tumu(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat32m2_t vs1, vfloat32m2_t vs2,
                                  size_t vl);
vfloat32m2_t __riscv_vfnmacc_tumu(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                  vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfnmacc_tumu(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat32m4_t vs1, vfloat32m4_t vs2,
                                  size_t vl);
vfloat32m4_t __riscv_vfnmacc_tumu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                  vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfnmacc_tumu(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat32m8_t vs1, vfloat32m8_t vs2,
                                  size_t vl);
vfloat32m8_t __riscv_vfnmacc_tumu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                  vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfnmacc_tumu(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat64m1_t vs1, vfloat64m1_t vs2,
                                  size_t vl);
vfloat64m1_t __riscv_vfnmacc_tumu(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                  vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfnmacc_tumu(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat64m2_t vs1, vfloat64m2_t vs2,
                                  size_t vl);
vfloat64m2_t __riscv_vfnmacc_tumu(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                  vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfnmacc_tumu(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat64m4_t vs1, vfloat64m4_t vs2,
                                  size_t vl);
vfloat64m4_t __riscv_vfnmacc_tumu(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                  vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfnmacc_tumu(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat64m8_t vs1, vfloat64m8_t vs2,
                                  size_t vl);
vfloat64m8_t __riscv_vfnmacc_tumu(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                  vfloat64m8_t vs2, size_t vl);
// __riscv_vfmsac_tumu: overloaded prototypes for the `_tumu` variant of vfmsac.
// Each vector type (vfloat16/32/64 at the listed LMULs) has two overloads:
//   - vector-vector: (vm, vd, vs1, vs2, vl)
//   - vector-scalar: (vm, vd, rs1, vs2, vl), where rs1 is _Float16, float or
//     double to match the element width.
// The return type always equals the type of `vd`; the mask type `vm`
// (vboolN_t) is paired with the vector type as listed.
// NOTE(review): presumably computes vd = (vs1 * vs2) - vd, leaving tail and
// masked-off elements of `vd` undisturbed -- confirm against the RVV spec.
vfloat16mf4_t __riscv_vfmsac_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                  size_t vl);
vfloat16mf4_t __riscv_vfmsac_tumu(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                  vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfmsac_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                  size_t vl);
vfloat16mf2_t __riscv_vfmsac_tumu(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                  vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmsac_tumu(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat16m1_t vs1, vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmsac_tumu(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                 vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmsac_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                                 vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmsac_tumu(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                 vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmsac_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                                 vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmsac_tumu(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                 vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmsac_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                                 vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmsac_tumu(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                 vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfmsac_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                  size_t vl);
vfloat32mf2_t __riscv_vfmsac_tumu(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                  vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmsac_tumu(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat32m1_t vs1, vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmsac_tumu(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                 vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmsac_tumu(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat32m2_t vs1, vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmsac_tumu(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                 vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmsac_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                                 vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmsac_tumu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                 vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmsac_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                                 vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmsac_tumu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                 vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmsac_tumu(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat64m1_t vs1, vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmsac_tumu(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                 vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmsac_tumu(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat64m2_t vs1, vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmsac_tumu(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                 vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmsac_tumu(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat64m4_t vs1, vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmsac_tumu(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                 vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmsac_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                                 vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmsac_tumu(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                 vfloat64m8_t vs2, size_t vl);
// __riscv_vfnmsac_tumu: overloaded prototypes for the `_tumu` variant of
// vfnmsac.
// The overloads come in two shapes per vector type (vfloat16/32/64 at the
// listed LMULs):
//   - vector-vector: (vm, vd, vs1, vs2, vl)
//   - vector-scalar: (vm, vd, rs1, vs2, vl), where rs1 is _Float16, float or
//     double to match the element width.
// The return type always equals the type of `vd`; the mask type `vm`
// (vboolN_t) is paired with the vector type as listed.
// NOTE(review): presumably computes vd = -(vs1 * vs2) + vd, leaving tail and
// masked-off elements of `vd` undisturbed -- confirm against the RVV spec.
vfloat16mf4_t __riscv_vfnmsac_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                   vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                   size_t vl);
vfloat16mf4_t __riscv_vfnmsac_tumu(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                   vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmsac_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                   vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                   size_t vl);
vfloat16mf2_t __riscv_vfnmsac_tumu(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                   vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmsac_tumu(vbool16_t vm, vfloat16m1_t vd,
                                  vfloat16m1_t vs1, vfloat16m1_t vs2,
                                  size_t vl);
vfloat16m1_t __riscv_vfnmsac_tumu(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                  vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfnmsac_tumu(vbool8_t vm, vfloat16m2_t vd,
                                  vfloat16m2_t vs1, vfloat16m2_t vs2,
                                  size_t vl);
vfloat16m2_t __riscv_vfnmsac_tumu(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                  vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfnmsac_tumu(vbool4_t vm, vfloat16m4_t vd,
                                  vfloat16m4_t vs1, vfloat16m4_t vs2,
                                  size_t vl);
vfloat16m4_t __riscv_vfnmsac_tumu(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                  vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfnmsac_tumu(vbool2_t vm, vfloat16m8_t vd,
                                  vfloat16m8_t vs1, vfloat16m8_t vs2,
                                  size_t vl);
vfloat16m8_t __riscv_vfnmsac_tumu(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                  vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfnmsac_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                   size_t vl);
vfloat32mf2_t __riscv_vfnmsac_tumu(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                   vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfnmsac_tumu(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat32m1_t vs1, vfloat32m1_t vs2,
                                  size_t vl);
vfloat32m1_t __riscv_vfnmsac_tumu(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                  vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfnmsac_tumu(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat32m2_t vs1, vfloat32m2_t vs2,
                                  size_t vl);
vfloat32m2_t __riscv_vfnmsac_tumu(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                  vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfnmsac_tumu(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat32m4_t vs1, vfloat32m4_t vs2,
                                  size_t vl);
vfloat32m4_t __riscv_vfnmsac_tumu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                  vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfnmsac_tumu(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat32m8_t vs1, vfloat32m8_t vs2,
                                  size_t vl);
vfloat32m8_t __riscv_vfnmsac_tumu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                  vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfnmsac_tumu(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat64m1_t vs1, vfloat64m1_t vs2,
                                  size_t vl);
vfloat64m1_t __riscv_vfnmsac_tumu(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                  vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfnmsac_tumu(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat64m2_t vs1, vfloat64m2_t vs2,
                                  size_t vl);
vfloat64m2_t __riscv_vfnmsac_tumu(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                  vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfnmsac_tumu(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat64m4_t vs1, vfloat64m4_t vs2,
                                  size_t vl);
vfloat64m4_t __riscv_vfnmsac_tumu(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                  vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfnmsac_tumu(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat64m8_t vs1, vfloat64m8_t vs2,
                                  size_t vl);
vfloat64m8_t __riscv_vfnmsac_tumu(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                  vfloat64m8_t vs2, size_t vl);
// __riscv_vfmadd_tumu -- overloaded prototypes for the `_tumu` policy variant.
// Each element type/LMUL pair has two overloads: a vector-vector form taking
// `vs1` and a vector-scalar form taking `rs1` (_Float16, float or double,
// matching the element width). Every overload takes the mask `vm` first and
// `size_t vl` last, and returns the same vector type as `vd`.
// Covered: vfloat16 mf4..m8, vfloat32 mf2..m8, vfloat64 m1..m8.
// NOTE(review): this listing shows signatures only. Per the RISC-V "V" spec
// vfmadd should compute vd[i] = (vd[i] * vs1[i]) + vs2[i], and `_tumu`
// should mean tail-undisturbed, mask-undisturbed -- confirm against the spec.
vfloat16mf4_t __riscv_vfmadd_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                  size_t vl);
vfloat16mf4_t __riscv_vfmadd_tumu(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                  vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfmadd_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                  size_t vl);
vfloat16mf2_t __riscv_vfmadd_tumu(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                  vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmadd_tumu(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat16m1_t vs1, vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmadd_tumu(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                 vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmadd_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                                 vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmadd_tumu(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                 vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmadd_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                                 vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmadd_tumu(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                 vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmadd_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                                 vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmadd_tumu(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                 vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfmadd_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                  size_t vl);
vfloat32mf2_t __riscv_vfmadd_tumu(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                  vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmadd_tumu(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat32m1_t vs1, vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmadd_tumu(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                 vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmadd_tumu(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat32m2_t vs1, vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmadd_tumu(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                 vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmadd_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                                 vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmadd_tumu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                 vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmadd_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                                 vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmadd_tumu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                 vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmadd_tumu(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat64m1_t vs1, vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmadd_tumu(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                 vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmadd_tumu(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat64m2_t vs1, vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmadd_tumu(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                 vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmadd_tumu(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat64m4_t vs1, vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmadd_tumu(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                 vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmadd_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                                 vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmadd_tumu(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                 vfloat64m8_t vs2, size_t vl);
// __riscv_vfnmadd_tumu -- overloaded prototypes for the `_tumu` policy
// variant. Each element type/LMUL pair has two overloads: a vector-vector
// form taking `vs1` and a vector-scalar form taking `rs1` (_Float16, float or
// double, matching the element width). Every overload takes the mask `vm`
// first and `size_t vl` last, and returns the same vector type as `vd`.
// Covered: vfloat16 mf4..m8, vfloat32 mf2..m8, vfloat64 m1..m8.
// NOTE(review): this listing shows signatures only. Per the RISC-V "V" spec
// vfnmadd should compute vd[i] = -(vd[i] * vs1[i]) - vs2[i], and `_tumu`
// should mean tail-undisturbed, mask-undisturbed -- confirm against the spec.
vfloat16mf4_t __riscv_vfnmadd_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                   vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                   size_t vl);
vfloat16mf4_t __riscv_vfnmadd_tumu(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                   vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmadd_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                   vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                   size_t vl);
vfloat16mf2_t __riscv_vfnmadd_tumu(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                   vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmadd_tumu(vbool16_t vm, vfloat16m1_t vd,
                                  vfloat16m1_t vs1, vfloat16m1_t vs2,
                                  size_t vl);
vfloat16m1_t __riscv_vfnmadd_tumu(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                  vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfnmadd_tumu(vbool8_t vm, vfloat16m2_t vd,
                                  vfloat16m2_t vs1, vfloat16m2_t vs2,
                                  size_t vl);
vfloat16m2_t __riscv_vfnmadd_tumu(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                  vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfnmadd_tumu(vbool4_t vm, vfloat16m4_t vd,
                                  vfloat16m4_t vs1, vfloat16m4_t vs2,
                                  size_t vl);
vfloat16m4_t __riscv_vfnmadd_tumu(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                  vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfnmadd_tumu(vbool2_t vm, vfloat16m8_t vd,
                                  vfloat16m8_t vs1, vfloat16m8_t vs2,
                                  size_t vl);
vfloat16m8_t __riscv_vfnmadd_tumu(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                  vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfnmadd_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                   size_t vl);
vfloat32mf2_t __riscv_vfnmadd_tumu(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                   vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfnmadd_tumu(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat32m1_t vs1, vfloat32m1_t vs2,
                                  size_t vl);
vfloat32m1_t __riscv_vfnmadd_tumu(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                  vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfnmadd_tumu(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat32m2_t vs1, vfloat32m2_t vs2,
                                  size_t vl);
vfloat32m2_t __riscv_vfnmadd_tumu(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                  vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfnmadd_tumu(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat32m4_t vs1, vfloat32m4_t vs2,
                                  size_t vl);
vfloat32m4_t __riscv_vfnmadd_tumu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                  vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfnmadd_tumu(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat32m8_t vs1, vfloat32m8_t vs2,
                                  size_t vl);
vfloat32m8_t __riscv_vfnmadd_tumu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                  vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfnmadd_tumu(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat64m1_t vs1, vfloat64m1_t vs2,
                                  size_t vl);
vfloat64m1_t __riscv_vfnmadd_tumu(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                  vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfnmadd_tumu(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat64m2_t vs1, vfloat64m2_t vs2,
                                  size_t vl);
vfloat64m2_t __riscv_vfnmadd_tumu(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                  vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfnmadd_tumu(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat64m4_t vs1, vfloat64m4_t vs2,
                                  size_t vl);
vfloat64m4_t __riscv_vfnmadd_tumu(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                  vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfnmadd_tumu(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat64m8_t vs1, vfloat64m8_t vs2,
                                  size_t vl);
vfloat64m8_t __riscv_vfnmadd_tumu(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                  vfloat64m8_t vs2, size_t vl);
// __riscv_vfmsub_tumu -- overloaded prototypes for the `_tumu` policy variant.
// Each element type/LMUL pair has two overloads: a vector-vector form taking
// `vs1` and a vector-scalar form taking `rs1` (_Float16, float or double,
// matching the element width). Every overload takes the mask `vm` first and
// `size_t vl` last, and returns the same vector type as `vd`.
// Covered: vfloat16 mf4..m8, vfloat32 mf2..m8, vfloat64 m1..m8.
// NOTE(review): this listing shows signatures only. Per the RISC-V "V" spec
// vfmsub should compute vd[i] = (vd[i] * vs1[i]) - vs2[i], and `_tumu`
// should mean tail-undisturbed, mask-undisturbed -- confirm against the spec.
vfloat16mf4_t __riscv_vfmsub_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                  size_t vl);
vfloat16mf4_t __riscv_vfmsub_tumu(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                  vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfmsub_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                  size_t vl);
vfloat16mf2_t __riscv_vfmsub_tumu(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                  vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmsub_tumu(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat16m1_t vs1, vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmsub_tumu(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                 vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmsub_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                                 vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmsub_tumu(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                 vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmsub_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                                 vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmsub_tumu(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                 vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmsub_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                                 vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmsub_tumu(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                 vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfmsub_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                  size_t vl);
vfloat32mf2_t __riscv_vfmsub_tumu(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                  vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmsub_tumu(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat32m1_t vs1, vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmsub_tumu(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                 vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmsub_tumu(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat32m2_t vs1, vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmsub_tumu(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                 vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmsub_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                                 vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmsub_tumu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                 vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmsub_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                                 vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmsub_tumu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                 vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmsub_tumu(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat64m1_t vs1, vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmsub_tumu(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                 vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmsub_tumu(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat64m2_t vs1, vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmsub_tumu(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                 vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmsub_tumu(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat64m4_t vs1, vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmsub_tumu(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                 vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmsub_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                                 vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmsub_tumu(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                 vfloat64m8_t vs2, size_t vl);
// __riscv_vfnmsub_tumu -- overloaded prototypes for the `_tumu` policy
// variant. Each element type/LMUL pair has two overloads: a vector-vector
// form taking `vs1` and a vector-scalar form taking `rs1` (_Float16, float or
// double, matching the element width). Every overload takes the mask `vm`
// first and `size_t vl` last, and returns the same vector type as `vd`.
// Covered: vfloat16 mf4..m8, vfloat32 mf2..m8, vfloat64 m1..m8.
// NOTE(review): this listing shows signatures only. Per the RISC-V "V" spec
// vfnmsub should compute vd[i] = -(vd[i] * vs1[i]) + vs2[i], and `_tumu`
// should mean tail-undisturbed, mask-undisturbed -- confirm against the spec.
vfloat16mf4_t __riscv_vfnmsub_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                   vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                   size_t vl);
vfloat16mf4_t __riscv_vfnmsub_tumu(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                   vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmsub_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                   vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                   size_t vl);
vfloat16mf2_t __riscv_vfnmsub_tumu(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                   vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmsub_tumu(vbool16_t vm, vfloat16m1_t vd,
                                  vfloat16m1_t vs1, vfloat16m1_t vs2,
                                  size_t vl);
vfloat16m1_t __riscv_vfnmsub_tumu(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                  vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfnmsub_tumu(vbool8_t vm, vfloat16m2_t vd,
                                  vfloat16m2_t vs1, vfloat16m2_t vs2,
                                  size_t vl);
vfloat16m2_t __riscv_vfnmsub_tumu(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                  vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfnmsub_tumu(vbool4_t vm, vfloat16m4_t vd,
                                  vfloat16m4_t vs1, vfloat16m4_t vs2,
                                  size_t vl);
vfloat16m4_t __riscv_vfnmsub_tumu(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                  vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfnmsub_tumu(vbool2_t vm, vfloat16m8_t vd,
                                  vfloat16m8_t vs1, vfloat16m8_t vs2,
                                  size_t vl);
vfloat16m8_t __riscv_vfnmsub_tumu(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                  vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfnmsub_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                   size_t vl);
vfloat32mf2_t __riscv_vfnmsub_tumu(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                   vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfnmsub_tumu(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat32m1_t vs1, vfloat32m1_t vs2,
                                  size_t vl);
vfloat32m1_t __riscv_vfnmsub_tumu(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                  vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfnmsub_tumu(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat32m2_t vs1, vfloat32m2_t vs2,
                                  size_t vl);
vfloat32m2_t __riscv_vfnmsub_tumu(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                  vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfnmsub_tumu(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat32m4_t vs1, vfloat32m4_t vs2,
                                  size_t vl);
vfloat32m4_t __riscv_vfnmsub_tumu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                  vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfnmsub_tumu(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat32m8_t vs1, vfloat32m8_t vs2,
                                  size_t vl);
vfloat32m8_t __riscv_vfnmsub_tumu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                  vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfnmsub_tumu(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat64m1_t vs1, vfloat64m1_t vs2,
                                  size_t vl);
vfloat64m1_t __riscv_vfnmsub_tumu(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                  vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfnmsub_tumu(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat64m2_t vs1, vfloat64m2_t vs2,
                                  size_t vl);
vfloat64m2_t __riscv_vfnmsub_tumu(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                  vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfnmsub_tumu(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat64m4_t vs1, vfloat64m4_t vs2,
                                  size_t vl);
vfloat64m4_t __riscv_vfnmsub_tumu(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                  vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfnmsub_tumu(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat64m8_t vs1, vfloat64m8_t vs2,
                                  size_t vl);
vfloat64m8_t __riscv_vfnmsub_tumu(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                  vfloat64m8_t vs2, size_t vl);
// masked functions (`_mu` policy variants)
// __riscv_vfmacc_mu -- overloaded prototypes for the `_mu` policy variant.
// Each element type/LMUL pair has two overloads: a vector-vector form taking
// `vs1` and a vector-scalar form taking `rs1` (_Float16, float or double,
// matching the element width). Every overload takes the mask `vm` first and
// `size_t vl` last, and returns the same vector type as `vd`.
// Covered: vfloat16 mf4..m8, vfloat32 mf2..m8, vfloat64 m1..m8.
// NOTE(review): this listing shows signatures only. Per the RISC-V "V" spec
// vfmacc should compute vd[i] = (vs1[i] * vs2[i]) + vd[i], and `_mu` should
// mean tail-agnostic, mask-undisturbed -- confirm against the spec.
vfloat16mf4_t __riscv_vfmacc_mu(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                size_t vl);
vfloat16mf4_t __riscv_vfmacc_mu(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfmacc_mu(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                size_t vl);
vfloat16mf2_t __riscv_vfmacc_mu(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmacc_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs1,
                               vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmacc_mu(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                               vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmacc_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                               vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmacc_mu(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                               vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmacc_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                               vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmacc_mu(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                               vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmacc_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                               vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmacc_mu(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                               vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfmacc_mu(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                size_t vl);
vfloat32mf2_t __riscv_vfmacc_mu(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmacc_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs1,
                               vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmacc_mu(vbool32_t vm, vfloat32m1_t vd, float rs1,
                               vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmacc_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs1,
                               vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmacc_mu(vbool16_t vm, vfloat32m2_t vd, float rs1,
                               vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmacc_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                               vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmacc_mu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                               vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmacc_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                               vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmacc_mu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                               vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmacc_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs1,
                               vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmacc_mu(vbool64_t vm, vfloat64m1_t vd, double rs1,
                               vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmacc_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs1,
                               vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmacc_mu(vbool32_t vm, vfloat64m2_t vd, double rs1,
                               vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmacc_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs1,
                               vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmacc_mu(vbool16_t vm, vfloat64m4_t vd, double rs1,
                               vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmacc_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                               vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmacc_mu(vbool8_t vm, vfloat64m8_t vd, double rs1,
                               vfloat64m8_t vs2, size_t vl);
// __riscv_vfnmacc_mu -- overloaded prototypes for the `_mu` policy variant.
// Each element type/LMUL pair has two overloads: a vector-vector form taking
// `vs1` and a vector-scalar form taking `rs1` (_Float16, float or double,
// matching the element width). Every overload takes the mask `vm` first and
// `size_t vl` last, and returns the same vector type as `vd`.
// Covered: vfloat16 mf4..m8, vfloat32 mf2..m8, vfloat64 m1..m8.
// NOTE(review): this listing shows signatures only. Per the RISC-V "V" spec
// vfnmacc should compute vd[i] = -(vs1[i] * vs2[i]) - vd[i], and `_mu` should
// mean tail-agnostic, mask-undisturbed -- confirm against the spec.
vfloat16mf4_t __riscv_vfnmacc_mu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                 size_t vl);
vfloat16mf4_t __riscv_vfnmacc_mu(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                 vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmacc_mu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                 size_t vl);
vfloat16mf2_t __riscv_vfnmacc_mu(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                 vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmacc_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs1,
                                vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmacc_mu(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfnmacc_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                                vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfnmacc_mu(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfnmacc_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                                vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfnmacc_mu(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfnmacc_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                                vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfnmacc_mu(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfnmacc_mu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                 size_t vl);
vfloat32mf2_t __riscv_vfnmacc_mu(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                 vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfnmacc_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs1,
                                vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfnmacc_mu(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfnmacc_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs1,
                                vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfnmacc_mu(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfnmacc_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                                vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfnmacc_mu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfnmacc_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                                vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfnmacc_mu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfnmacc_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs1,
                                vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfnmacc_mu(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfnmacc_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs1,
                                vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfnmacc_mu(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfnmacc_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs1,
                                vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfnmacc_mu(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfnmacc_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                                vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfnmacc_mu(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                vfloat64m8_t vs2, size_t vl);
// __riscv_vfmsac_mu -- overloaded prototypes for the `_mu` policy variant.
// Each element type/LMUL pair has two overloads: a vector-vector form taking
// `vs1` and a vector-scalar form taking `rs1` (_Float16, float or double,
// matching the element width). Every overload takes the mask `vm` first and
// `size_t vl` last, and returns the same vector type as `vd`.
// Covered: vfloat16 mf4..m8, vfloat32 mf2..m8, vfloat64 m1..m8.
// NOTE(review): this listing shows signatures only. Per the RISC-V "V" spec
// vfmsac should compute vd[i] = (vs1[i] * vs2[i]) - vd[i], and `_mu` should
// mean tail-agnostic, mask-undisturbed -- confirm against the spec.
vfloat16mf4_t __riscv_vfmsac_mu(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                size_t vl);
vfloat16mf4_t __riscv_vfmsac_mu(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfmsac_mu(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                size_t vl);
vfloat16mf2_t __riscv_vfmsac_mu(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmsac_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs1,
                               vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmsac_mu(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                               vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmsac_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                               vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmsac_mu(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                               vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmsac_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                               vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmsac_mu(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                               vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmsac_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                               vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmsac_mu(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                               vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfmsac_mu(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                size_t vl);
vfloat32mf2_t __riscv_vfmsac_mu(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmsac_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs1,
                               vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmsac_mu(vbool32_t vm, vfloat32m1_t vd, float rs1,
                               vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmsac_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs1,
                               vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmsac_mu(vbool16_t vm, vfloat32m2_t vd, float rs1,
                               vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmsac_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                               vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmsac_mu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                               vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmsac_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                               vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmsac_mu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                               vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmsac_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs1,
                               vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmsac_mu(vbool64_t vm, vfloat64m1_t vd, double rs1,
                               vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmsac_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs1,
                               vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmsac_mu(vbool32_t vm, vfloat64m2_t vd, double rs1,
                               vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmsac_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs1,
                               vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmsac_mu(vbool16_t vm, vfloat64m4_t vd, double rs1,
                               vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmsac_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                               vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmsac_mu(vbool8_t vm, vfloat64m8_t vd, double rs1,
                               vfloat64m8_t vs2, size_t vl);
// __riscv_vfnmsac_mu: overloaded declarations for vfloat16mf4_t through
// vfloat64m8_t. Each vector type has two forms: vector-vector (vs1 is a
// vector) and vector-scalar (rs1 is a _Float16/float/double scalar).
//   vm  - mask operand (vboolN_t)
//   vd  - vector operand; the return type always matches its type
//   vs2 - second vector operand
//   vl  - size_t length argument
// NOTE(review): semantics are not stated in this listing. Per the RISC-V V
// spec, vfnmsac presumably computes -(vs1 * vs2) + vd, and the `_mu` suffix
// presumably selects the mask-undisturbed policy (inactive elements keep
// the value from vd) - confirm against the intrinsics spec.
vfloat16mf4_t __riscv_vfnmsac_mu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                 size_t vl);
vfloat16mf4_t __riscv_vfnmsac_mu(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                 vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmsac_mu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                 size_t vl);
vfloat16mf2_t __riscv_vfnmsac_mu(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                 vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmsac_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs1,
                                vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmsac_mu(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfnmsac_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                                vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfnmsac_mu(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfnmsac_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                                vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfnmsac_mu(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfnmsac_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                                vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfnmsac_mu(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfnmsac_mu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                 size_t vl);
vfloat32mf2_t __riscv_vfnmsac_mu(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                 vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfnmsac_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs1,
                                vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfnmsac_mu(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfnmsac_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs1,
                                vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfnmsac_mu(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfnmsac_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                                vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfnmsac_mu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfnmsac_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                                vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfnmsac_mu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfnmsac_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs1,
                                vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfnmsac_mu(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfnmsac_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs1,
                                vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfnmsac_mu(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfnmsac_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs1,
                                vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfnmsac_mu(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfnmsac_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                                vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfnmsac_mu(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                vfloat64m8_t vs2, size_t vl);
// __riscv_vfmadd_mu: overloaded declarations for vfloat16mf4_t through
// vfloat64m8_t. Each vector type has two forms: vector-vector (vs1 is a
// vector) and vector-scalar (rs1 is a _Float16/float/double scalar).
//   vm  - mask operand (vboolN_t)
//   vd  - vector operand; the return type always matches its type
//   vs2 - second vector operand
//   vl  - size_t length argument
// NOTE(review): semantics are not stated in this listing. Per the RISC-V V
// spec, vfmadd presumably computes (vs1 * vd) + vs2, and the `_mu` suffix
// presumably selects the mask-undisturbed policy (inactive elements keep
// the value from vd) - confirm against the intrinsics spec.
vfloat16mf4_t __riscv_vfmadd_mu(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                size_t vl);
vfloat16mf4_t __riscv_vfmadd_mu(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfmadd_mu(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                size_t vl);
vfloat16mf2_t __riscv_vfmadd_mu(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmadd_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs1,
                               vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmadd_mu(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                               vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmadd_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                               vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmadd_mu(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                               vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmadd_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                               vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmadd_mu(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                               vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmadd_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                               vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmadd_mu(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                               vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfmadd_mu(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                size_t vl);
vfloat32mf2_t __riscv_vfmadd_mu(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmadd_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs1,
                               vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmadd_mu(vbool32_t vm, vfloat32m1_t vd, float rs1,
                               vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmadd_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs1,
                               vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmadd_mu(vbool16_t vm, vfloat32m2_t vd, float rs1,
                               vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmadd_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                               vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmadd_mu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                               vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmadd_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                               vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmadd_mu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                               vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmadd_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs1,
                               vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmadd_mu(vbool64_t vm, vfloat64m1_t vd, double rs1,
                               vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmadd_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs1,
                               vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmadd_mu(vbool32_t vm, vfloat64m2_t vd, double rs1,
                               vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmadd_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs1,
                               vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmadd_mu(vbool16_t vm, vfloat64m4_t vd, double rs1,
                               vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmadd_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                               vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmadd_mu(vbool8_t vm, vfloat64m8_t vd, double rs1,
                               vfloat64m8_t vs2, size_t vl);
// __riscv_vfnmadd_mu: overloaded declarations for vfloat16mf4_t through
// vfloat64m8_t. Each vector type has two forms: vector-vector (vs1 is a
// vector) and vector-scalar (rs1 is a _Float16/float/double scalar).
//   vm  - mask operand (vboolN_t)
//   vd  - vector operand; the return type always matches its type
//   vs2 - second vector operand
//   vl  - size_t length argument
// NOTE(review): semantics are not stated in this listing. Per the RISC-V V
// spec, vfnmadd presumably computes -(vs1 * vd) - vs2, and the `_mu` suffix
// presumably selects the mask-undisturbed policy (inactive elements keep
// the value from vd) - confirm against the intrinsics spec.
vfloat16mf4_t __riscv_vfnmadd_mu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                 size_t vl);
vfloat16mf4_t __riscv_vfnmadd_mu(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                 vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmadd_mu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                 size_t vl);
vfloat16mf2_t __riscv_vfnmadd_mu(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                 vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmadd_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs1,
                                vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmadd_mu(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfnmadd_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                                vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfnmadd_mu(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfnmadd_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                                vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfnmadd_mu(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfnmadd_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                                vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfnmadd_mu(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfnmadd_mu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                 size_t vl);
vfloat32mf2_t __riscv_vfnmadd_mu(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                 vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfnmadd_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs1,
                                vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfnmadd_mu(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfnmadd_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs1,
                                vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfnmadd_mu(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfnmadd_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                                vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfnmadd_mu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfnmadd_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                                vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfnmadd_mu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfnmadd_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs1,
                                vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfnmadd_mu(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfnmadd_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs1,
                                vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfnmadd_mu(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfnmadd_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs1,
                                vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfnmadd_mu(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfnmadd_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                                vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfnmadd_mu(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                vfloat64m8_t vs2, size_t vl);
// __riscv_vfmsub_mu: overloaded declarations for vfloat16mf4_t through
// vfloat64m8_t. Each vector type has two forms: vector-vector (vs1 is a
// vector) and vector-scalar (rs1 is a _Float16/float/double scalar).
//   vm  - mask operand (vboolN_t)
//   vd  - vector operand; the return type always matches its type
//   vs2 - second vector operand
//   vl  - size_t length argument
// NOTE(review): semantics are not stated in this listing. Per the RISC-V V
// spec, vfmsub presumably computes (vs1 * vd) - vs2, and the `_mu` suffix
// presumably selects the mask-undisturbed policy (inactive elements keep
// the value from vd) - confirm against the intrinsics spec.
vfloat16mf4_t __riscv_vfmsub_mu(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                size_t vl);
vfloat16mf4_t __riscv_vfmsub_mu(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfmsub_mu(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                size_t vl);
vfloat16mf2_t __riscv_vfmsub_mu(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmsub_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs1,
                               vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfmsub_mu(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                               vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmsub_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                               vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfmsub_mu(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                               vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmsub_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                               vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfmsub_mu(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                               vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmsub_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                               vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfmsub_mu(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                               vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfmsub_mu(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                size_t vl);
vfloat32mf2_t __riscv_vfmsub_mu(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmsub_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs1,
                               vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfmsub_mu(vbool32_t vm, vfloat32m1_t vd, float rs1,
                               vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmsub_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs1,
                               vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfmsub_mu(vbool16_t vm, vfloat32m2_t vd, float rs1,
                               vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmsub_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                               vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfmsub_mu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                               vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmsub_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                               vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfmsub_mu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                               vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmsub_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs1,
                               vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfmsub_mu(vbool64_t vm, vfloat64m1_t vd, double rs1,
                               vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmsub_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs1,
                               vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfmsub_mu(vbool32_t vm, vfloat64m2_t vd, double rs1,
                               vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmsub_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs1,
                               vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfmsub_mu(vbool16_t vm, vfloat64m4_t vd, double rs1,
                               vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmsub_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                               vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfmsub_mu(vbool8_t vm, vfloat64m8_t vd, double rs1,
                               vfloat64m8_t vs2, size_t vl);
// __riscv_vfnmsub_mu: overloaded declarations for vfloat16mf4_t through
// vfloat64m8_t. Each vector type has two forms: vector-vector (vs1 is a
// vector) and vector-scalar (rs1 is a _Float16/float/double scalar).
//   vm  - mask operand (vboolN_t)
//   vd  - vector operand; the return type always matches its type
//   vs2 - second vector operand
//   vl  - size_t length argument
// NOTE(review): semantics are not stated in this listing. Per the RISC-V V
// spec, vfnmsub presumably computes -(vs1 * vd) + vs2, and the `_mu` suffix
// presumably selects the mask-undisturbed policy (inactive elements keep
// the value from vd) - confirm against the intrinsics spec.
vfloat16mf4_t __riscv_vfnmsub_mu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                 size_t vl);
vfloat16mf4_t __riscv_vfnmsub_mu(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                 vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfnmsub_mu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                 size_t vl);
vfloat16mf2_t __riscv_vfnmsub_mu(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                 vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmsub_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs1,
                                vfloat16m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfnmsub_mu(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfnmsub_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                                vfloat16m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfnmsub_mu(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfnmsub_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                                vfloat16m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfnmsub_mu(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfnmsub_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                                vfloat16m8_t vs2, size_t vl);
vfloat16m8_t __riscv_vfnmsub_mu(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfnmsub_mu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                 size_t vl);
vfloat32mf2_t __riscv_vfnmsub_mu(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                 vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfnmsub_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs1,
                                vfloat32m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfnmsub_mu(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfnmsub_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs1,
                                vfloat32m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfnmsub_mu(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfnmsub_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                                vfloat32m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfnmsub_mu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfnmsub_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                                vfloat32m8_t vs2, size_t vl);
vfloat32m8_t __riscv_vfnmsub_mu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfnmsub_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs1,
                                vfloat64m1_t vs2, size_t vl);
vfloat64m1_t __riscv_vfnmsub_mu(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfnmsub_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs1,
                                vfloat64m2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfnmsub_mu(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfnmsub_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs1,
                                vfloat64m4_t vs2, size_t vl);
vfloat64m4_t __riscv_vfnmsub_mu(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfnmsub_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                                vfloat64m8_t vs2, size_t vl);
vfloat64m8_t __riscv_vfnmsub_mu(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                vfloat64m8_t vs2, size_t vl);
// __riscv_vfmacc_tu (with explicit `frm` argument): overloaded declarations
// for vfloat16mf4_t through vfloat64m8_t. Each vector type has two forms:
// vector-vector (vs1 is a vector) and vector-scalar (rs1 is a
// _Float16/float/double scalar). These overloads take no mask argument.
//   vd  - vector operand; the return type always matches its type
//   vs2 - second vector operand
//   frm - unsigned int argument placed immediately before vl
//   vl  - size_t length argument
// NOTE(review): semantics are not stated in this listing. Per the RISC-V V
// spec, vfmacc presumably computes (vs1 * vs2) + vd; `frm` is presumably the
// floating-point rounding mode, and the `_tu` suffix presumably selects the
// tail-undisturbed policy (tail elements keep the value from vd) - confirm
// against the intrinsics spec.
vfloat16mf4_t __riscv_vfmacc_tu(vfloat16mf4_t vd, vfloat16mf4_t vs1,
                                vfloat16mf4_t vs2, unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmacc_tu(vfloat16mf4_t vd, _Float16 rs1,
                                vfloat16mf4_t vs2, unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmacc_tu(vfloat16mf2_t vd, vfloat16mf2_t vs1,
                                vfloat16mf2_t vs2, unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmacc_tu(vfloat16mf2_t vd, _Float16 rs1,
                                vfloat16mf2_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmacc_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                               vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmacc_tu(vfloat16m1_t vd, _Float16 rs1, vfloat16m1_t vs2,
                               unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmacc_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                               vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmacc_tu(vfloat16m2_t vd, _Float16 rs1, vfloat16m2_t vs2,
                               unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmacc_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                               vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmacc_tu(vfloat16m4_t vd, _Float16 rs1, vfloat16m4_t vs2,
                               unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmacc_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                               vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmacc_tu(vfloat16m8_t vd, _Float16 rs1, vfloat16m8_t vs2,
                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmacc_tu(vfloat32mf2_t vd, vfloat32mf2_t vs1,
                                vfloat32mf2_t vs2, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmacc_tu(vfloat32mf2_t vd, float rs1, vfloat32mf2_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmacc_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                               vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmacc_tu(vfloat32m1_t vd, float rs1, vfloat32m1_t vs2,
                               unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmacc_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                               vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmacc_tu(vfloat32m2_t vd, float rs1, vfloat32m2_t vs2,
                               unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmacc_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                               vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmacc_tu(vfloat32m4_t vd, float rs1, vfloat32m4_t vs2,
                               unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmacc_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                               vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmacc_tu(vfloat32m8_t vd, float rs1, vfloat32m8_t vs2,
                               unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmacc_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                               vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmacc_tu(vfloat64m1_t vd, double rs1, vfloat64m1_t vs2,
                               unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmacc_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                               vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmacc_tu(vfloat64m2_t vd, double rs1, vfloat64m2_t vs2,
                               unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmacc_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                               vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmacc_tu(vfloat64m4_t vd, double rs1, vfloat64m4_t vs2,
                               unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmacc_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                               vfloat64m8_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmacc_tu(vfloat64m8_t vd, double rs1, vfloat64m8_t vs2,
                               unsigned int frm, size_t vl);
// __riscv_vfnmacc_tu (with explicit `frm` argument): overloaded declarations
// for vfloat16mf4_t through vfloat64m8_t. Each vector type has two forms:
// vector-vector (vs1 is a vector) and vector-scalar (rs1 is a
// _Float16/float/double scalar). These overloads take no mask argument.
//   vd  - vector operand; the return type always matches its type
//   vs2 - second vector operand
//   frm - unsigned int argument placed immediately before vl
//   vl  - size_t length argument
// NOTE(review): semantics are not stated in this listing. Per the RISC-V V
// spec, vfnmacc presumably computes -(vs1 * vs2) - vd; `frm` is presumably
// the floating-point rounding mode, and the `_tu` suffix presumably selects
// the tail-undisturbed policy (tail elements keep the value from vd) -
// confirm against the intrinsics spec.
vfloat16mf4_t __riscv_vfnmacc_tu(vfloat16mf4_t vd, vfloat16mf4_t vs1,
                                 vfloat16mf4_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16mf4_t __riscv_vfnmacc_tu(vfloat16mf4_t vd, _Float16 rs1,
                                 vfloat16mf4_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16mf2_t __riscv_vfnmacc_tu(vfloat16mf2_t vd, vfloat16mf2_t vs1,
                                 vfloat16mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16mf2_t __riscv_vfnmacc_tu(vfloat16mf2_t vd, _Float16 rs1,
                                 vfloat16mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16m1_t __riscv_vfnmacc_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                                vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmacc_tu(vfloat16m1_t vd, _Float16 rs1, vfloat16m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmacc_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                                vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmacc_tu(vfloat16m2_t vd, _Float16 rs1, vfloat16m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmacc_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                                vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmacc_tu(vfloat16m4_t vd, _Float16 rs1, vfloat16m4_t vs2,
                                unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmacc_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                                vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmacc_tu(vfloat16m8_t vd, _Float16 rs1, vfloat16m8_t vs2,
                                unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmacc_tu(vfloat32mf2_t vd, vfloat32mf2_t vs1,
                                 vfloat32mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat32mf2_t __riscv_vfnmacc_tu(vfloat32mf2_t vd, float rs1, vfloat32mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmacc_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                                vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmacc_tu(vfloat32m1_t vd, float rs1, vfloat32m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmacc_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                                vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmacc_tu(vfloat32m2_t vd, float rs1, vfloat32m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmacc_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                                vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmacc_tu(vfloat32m4_t vd, float rs1, vfloat32m4_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmacc_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                                vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmacc_tu(vfloat32m8_t vd, float rs1, vfloat32m8_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmacc_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                                vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmacc_tu(vfloat64m1_t vd, double rs1, vfloat64m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmacc_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                                vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmacc_tu(vfloat64m2_t vd, double rs1, vfloat64m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmacc_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                                vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmacc_tu(vfloat64m4_t vd, double rs1, vfloat64m4_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmacc_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                                vfloat64m8_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmacc_tu(vfloat64m8_t vd, double rs1, vfloat64m8_t vs2,
                                unsigned int frm, size_t vl);
// __riscv_vfmsac_tu (with explicit `frm` argument): overloaded declarations
// starting at vfloat16mf4_t; the list continues below with wider types.
// Each vector type has two forms: vector-vector (vs1 is a vector) and
// vector-scalar (rs1 is a _Float16/float scalar for the types shown here).
// These overloads take no mask argument.
//   vd  - vector operand; the return type always matches its type
//   vs2 - second vector operand
//   frm - unsigned int argument placed immediately before vl
//   vl  - size_t length argument
// NOTE(review): semantics are not stated in this listing. Per the RISC-V V
// spec, vfmsac presumably computes (vs1 * vs2) - vd; `frm` is presumably the
// floating-point rounding mode, and the `_tu` suffix presumably selects the
// tail-undisturbed policy (tail elements keep the value from vd) - confirm
// against the intrinsics spec.
vfloat16mf4_t __riscv_vfmsac_tu(vfloat16mf4_t vd, vfloat16mf4_t vs1,
                                vfloat16mf4_t vs2, unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmsac_tu(vfloat16mf4_t vd, _Float16 rs1,
                                vfloat16mf4_t vs2, unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmsac_tu(vfloat16mf2_t vd, vfloat16mf2_t vs1,
                                vfloat16mf2_t vs2, unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmsac_tu(vfloat16mf2_t vd, _Float16 rs1,
                                vfloat16mf2_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmsac_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                               vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmsac_tu(vfloat16m1_t vd, _Float16 rs1, vfloat16m1_t vs2,
                               unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmsac_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                               vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmsac_tu(vfloat16m2_t vd, _Float16 rs1, vfloat16m2_t vs2,
                               unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmsac_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                               vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmsac_tu(vfloat16m4_t vd, _Float16 rs1, vfloat16m4_t vs2,
                               unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmsac_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                               vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmsac_tu(vfloat16m8_t vd, _Float16 rs1, vfloat16m8_t vs2,
                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmsac_tu(vfloat32mf2_t vd, vfloat32mf2_t vs1,
                                vfloat32mf2_t vs2, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmsac_tu(vfloat32mf2_t vd, float rs1, vfloat32mf2_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmsac_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                               vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmsac_tu(vfloat32m1_t vd, float rs1, vfloat32m1_t vs2,
                               unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmsac_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                               vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmsac_tu(vfloat32m2_t vd, float rs1, vfloat32m2_t vs2,
                               unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmsac_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                               vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmsac_tu(vfloat32m4_t vd, float rs1, vfloat32m4_t vs2,
                               unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmsac_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                               vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmsac_tu(vfloat32m8_t vd, float rs1, vfloat32m8_t vs2,
                               unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmsac_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                               vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmsac_tu(vfloat64m1_t vd, double rs1, vfloat64m1_t vs2,
                               unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmsac_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                               vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmsac_tu(vfloat64m2_t vd, double rs1, vfloat64m2_t vs2,
                               unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmsac_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                               vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmsac_tu(vfloat64m4_t vd, double rs1, vfloat64m4_t vs2,
                               unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmsac_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                               vfloat64m8_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmsac_tu(vfloat64m8_t vd, double rs1, vfloat64m8_t vs2,
                               unsigned int frm, size_t vl);
// __riscv_vfnmsac_tu: overloaded on the vector type of `vd` (float16 mf4..m8,
// float32 mf2..m8, float64 m1..m8). Each type has a vector-vector form (vs1)
// and a vector-scalar form (rs1: _Float16 / float / double, matching the
// element width). All take `frm` and `vl` last and return the type of `vd`.
// NOTE(review): presumably RVV vfnmsac, vd = -(vs1 * vs2) + vd, with `_tu`
// meaning tail-undisturbed and `frm` the rounding mode; confirm against the
// V extension spec.
vfloat16mf4_t __riscv_vfnmsac_tu(vfloat16mf4_t vd, vfloat16mf4_t vs1,
                                 vfloat16mf4_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16mf4_t __riscv_vfnmsac_tu(vfloat16mf4_t vd, _Float16 rs1,
                                 vfloat16mf4_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16mf2_t __riscv_vfnmsac_tu(vfloat16mf2_t vd, vfloat16mf2_t vs1,
                                 vfloat16mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16mf2_t __riscv_vfnmsac_tu(vfloat16mf2_t vd, _Float16 rs1,
                                 vfloat16mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16m1_t __riscv_vfnmsac_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                                vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmsac_tu(vfloat16m1_t vd, _Float16 rs1, vfloat16m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmsac_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                                vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmsac_tu(vfloat16m2_t vd, _Float16 rs1, vfloat16m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmsac_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                                vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmsac_tu(vfloat16m4_t vd, _Float16 rs1, vfloat16m4_t vs2,
                                unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmsac_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                                vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmsac_tu(vfloat16m8_t vd, _Float16 rs1, vfloat16m8_t vs2,
                                unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmsac_tu(vfloat32mf2_t vd, vfloat32mf2_t vs1,
                                 vfloat32mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat32mf2_t __riscv_vfnmsac_tu(vfloat32mf2_t vd, float rs1, vfloat32mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmsac_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                                vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmsac_tu(vfloat32m1_t vd, float rs1, vfloat32m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmsac_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                                vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmsac_tu(vfloat32m2_t vd, float rs1, vfloat32m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmsac_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                                vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmsac_tu(vfloat32m4_t vd, float rs1, vfloat32m4_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmsac_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                                vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmsac_tu(vfloat32m8_t vd, float rs1, vfloat32m8_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmsac_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                                vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmsac_tu(vfloat64m1_t vd, double rs1, vfloat64m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmsac_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                                vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmsac_tu(vfloat64m2_t vd, double rs1, vfloat64m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmsac_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                                vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmsac_tu(vfloat64m4_t vd, double rs1, vfloat64m4_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmsac_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                                vfloat64m8_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmsac_tu(vfloat64m8_t vd, double rs1, vfloat64m8_t vs2,
                                unsigned int frm, size_t vl);
// __riscv_vfmadd_tu: overloaded on the vector type of `vd` (float16 mf4..m8,
// float32 mf2..m8, float64 m1..m8). Each type has a vector-vector form (vs1)
// and a vector-scalar form (rs1: _Float16 / float / double, matching the
// element width). All take `frm` and `vl` last and return the type of `vd`.
// NOTE(review): presumably RVV vfmadd, vd = (vs1 * vd) + vs2 (vd is the
// multiplicand here, unlike the *acc/*sac forms), with `_tu` meaning
// tail-undisturbed and `frm` the rounding mode; confirm against the V
// extension spec.
vfloat16mf4_t __riscv_vfmadd_tu(vfloat16mf4_t vd, vfloat16mf4_t vs1,
                                vfloat16mf4_t vs2, unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmadd_tu(vfloat16mf4_t vd, _Float16 rs1,
                                vfloat16mf4_t vs2, unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmadd_tu(vfloat16mf2_t vd, vfloat16mf2_t vs1,
                                vfloat16mf2_t vs2, unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmadd_tu(vfloat16mf2_t vd, _Float16 rs1,
                                vfloat16mf2_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmadd_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                               vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmadd_tu(vfloat16m1_t vd, _Float16 rs1, vfloat16m1_t vs2,
                               unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmadd_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                               vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmadd_tu(vfloat16m2_t vd, _Float16 rs1, vfloat16m2_t vs2,
                               unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmadd_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                               vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmadd_tu(vfloat16m4_t vd, _Float16 rs1, vfloat16m4_t vs2,
                               unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmadd_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                               vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmadd_tu(vfloat16m8_t vd, _Float16 rs1, vfloat16m8_t vs2,
                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmadd_tu(vfloat32mf2_t vd, vfloat32mf2_t vs1,
                                vfloat32mf2_t vs2, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmadd_tu(vfloat32mf2_t vd, float rs1, vfloat32mf2_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmadd_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                               vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmadd_tu(vfloat32m1_t vd, float rs1, vfloat32m1_t vs2,
                               unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmadd_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                               vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmadd_tu(vfloat32m2_t vd, float rs1, vfloat32m2_t vs2,
                               unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmadd_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                               vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmadd_tu(vfloat32m4_t vd, float rs1, vfloat32m4_t vs2,
                               unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmadd_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                               vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmadd_tu(vfloat32m8_t vd, float rs1, vfloat32m8_t vs2,
                               unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmadd_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                               vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmadd_tu(vfloat64m1_t vd, double rs1, vfloat64m1_t vs2,
                               unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmadd_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                               vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmadd_tu(vfloat64m2_t vd, double rs1, vfloat64m2_t vs2,
                               unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmadd_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                               vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmadd_tu(vfloat64m4_t vd, double rs1, vfloat64m4_t vs2,
                               unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmadd_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                               vfloat64m8_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmadd_tu(vfloat64m8_t vd, double rs1, vfloat64m8_t vs2,
                               unsigned int frm, size_t vl);
// __riscv_vfnmadd_tu: overloaded on the vector type of `vd` (float16 mf4..m8,
// float32 mf2..m8, float64 m1..m8). Each type has a vector-vector form (vs1)
// and a vector-scalar form (rs1: _Float16 / float / double, matching the
// element width). All take `frm` and `vl` last and return the type of `vd`.
// NOTE(review): presumably RVV vfnmadd, vd = -(vs1 * vd) - vs2, with `_tu`
// meaning tail-undisturbed and `frm` the rounding mode; confirm against the
// V extension spec.
vfloat16mf4_t __riscv_vfnmadd_tu(vfloat16mf4_t vd, vfloat16mf4_t vs1,
                                 vfloat16mf4_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16mf4_t __riscv_vfnmadd_tu(vfloat16mf4_t vd, _Float16 rs1,
                                 vfloat16mf4_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16mf2_t __riscv_vfnmadd_tu(vfloat16mf2_t vd, vfloat16mf2_t vs1,
                                 vfloat16mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16mf2_t __riscv_vfnmadd_tu(vfloat16mf2_t vd, _Float16 rs1,
                                 vfloat16mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16m1_t __riscv_vfnmadd_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                                vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmadd_tu(vfloat16m1_t vd, _Float16 rs1, vfloat16m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmadd_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                                vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmadd_tu(vfloat16m2_t vd, _Float16 rs1, vfloat16m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmadd_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                                vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmadd_tu(vfloat16m4_t vd, _Float16 rs1, vfloat16m4_t vs2,
                                unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmadd_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                                vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmadd_tu(vfloat16m8_t vd, _Float16 rs1, vfloat16m8_t vs2,
                                unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmadd_tu(vfloat32mf2_t vd, vfloat32mf2_t vs1,
                                 vfloat32mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat32mf2_t __riscv_vfnmadd_tu(vfloat32mf2_t vd, float rs1, vfloat32mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmadd_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                                vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmadd_tu(vfloat32m1_t vd, float rs1, vfloat32m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmadd_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                                vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmadd_tu(vfloat32m2_t vd, float rs1, vfloat32m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmadd_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                                vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmadd_tu(vfloat32m4_t vd, float rs1, vfloat32m4_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmadd_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                                vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmadd_tu(vfloat32m8_t vd, float rs1, vfloat32m8_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmadd_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                                vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmadd_tu(vfloat64m1_t vd, double rs1, vfloat64m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmadd_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                                vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmadd_tu(vfloat64m2_t vd, double rs1, vfloat64m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmadd_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                                vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmadd_tu(vfloat64m4_t vd, double rs1, vfloat64m4_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmadd_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                                vfloat64m8_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmadd_tu(vfloat64m8_t vd, double rs1, vfloat64m8_t vs2,
                                unsigned int frm, size_t vl);
// __riscv_vfmsub_tu: overloaded on the vector type of `vd` (float16 mf4..m8,
// float32 mf2..m8, float64 m1..m8). Each type has a vector-vector form (vs1)
// and a vector-scalar form (rs1: _Float16 / float / double, matching the
// element width). All take `frm` and `vl` last and return the type of `vd`.
// NOTE(review): presumably RVV vfmsub, vd = (vs1 * vd) - vs2, with `_tu`
// meaning tail-undisturbed and `frm` the rounding mode; confirm against the
// V extension spec.
vfloat16mf4_t __riscv_vfmsub_tu(vfloat16mf4_t vd, vfloat16mf4_t vs1,
                                vfloat16mf4_t vs2, unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmsub_tu(vfloat16mf4_t vd, _Float16 rs1,
                                vfloat16mf4_t vs2, unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmsub_tu(vfloat16mf2_t vd, vfloat16mf2_t vs1,
                                vfloat16mf2_t vs2, unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmsub_tu(vfloat16mf2_t vd, _Float16 rs1,
                                vfloat16mf2_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmsub_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                               vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmsub_tu(vfloat16m1_t vd, _Float16 rs1, vfloat16m1_t vs2,
                               unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmsub_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                               vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmsub_tu(vfloat16m2_t vd, _Float16 rs1, vfloat16m2_t vs2,
                               unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmsub_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                               vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmsub_tu(vfloat16m4_t vd, _Float16 rs1, vfloat16m4_t vs2,
                               unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmsub_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                               vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmsub_tu(vfloat16m8_t vd, _Float16 rs1, vfloat16m8_t vs2,
                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmsub_tu(vfloat32mf2_t vd, vfloat32mf2_t vs1,
                                vfloat32mf2_t vs2, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmsub_tu(vfloat32mf2_t vd, float rs1, vfloat32mf2_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmsub_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                               vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmsub_tu(vfloat32m1_t vd, float rs1, vfloat32m1_t vs2,
                               unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmsub_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                               vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmsub_tu(vfloat32m2_t vd, float rs1, vfloat32m2_t vs2,
                               unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmsub_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                               vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmsub_tu(vfloat32m4_t vd, float rs1, vfloat32m4_t vs2,
                               unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmsub_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                               vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmsub_tu(vfloat32m8_t vd, float rs1, vfloat32m8_t vs2,
                               unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmsub_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                               vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmsub_tu(vfloat64m1_t vd, double rs1, vfloat64m1_t vs2,
                               unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmsub_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                               vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmsub_tu(vfloat64m2_t vd, double rs1, vfloat64m2_t vs2,
                               unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmsub_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                               vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmsub_tu(vfloat64m4_t vd, double rs1, vfloat64m4_t vs2,
                               unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmsub_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                               vfloat64m8_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmsub_tu(vfloat64m8_t vd, double rs1, vfloat64m8_t vs2,
                               unsigned int frm, size_t vl);
// __riscv_vfnmsub_tu: overloaded on the vector type of `vd` (float16 mf4..m8,
// float32 mf2..m8, float64 m1..m8). Each type has a vector-vector form (vs1)
// and a vector-scalar form (rs1: _Float16 / float / double, matching the
// element width). All take `frm` and `vl` last and return the type of `vd`.
// NOTE(review): presumably RVV vfnmsub, vd = -(vs1 * vd) + vs2, with `_tu`
// meaning tail-undisturbed and `frm` the rounding mode; confirm against the
// V extension spec.
vfloat16mf4_t __riscv_vfnmsub_tu(vfloat16mf4_t vd, vfloat16mf4_t vs1,
                                 vfloat16mf4_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16mf4_t __riscv_vfnmsub_tu(vfloat16mf4_t vd, _Float16 rs1,
                                 vfloat16mf4_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16mf2_t __riscv_vfnmsub_tu(vfloat16mf2_t vd, vfloat16mf2_t vs1,
                                 vfloat16mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16mf2_t __riscv_vfnmsub_tu(vfloat16mf2_t vd, _Float16 rs1,
                                 vfloat16mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16m1_t __riscv_vfnmsub_tu(vfloat16m1_t vd, vfloat16m1_t vs1,
                                vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmsub_tu(vfloat16m1_t vd, _Float16 rs1, vfloat16m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmsub_tu(vfloat16m2_t vd, vfloat16m2_t vs1,
                                vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmsub_tu(vfloat16m2_t vd, _Float16 rs1, vfloat16m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmsub_tu(vfloat16m4_t vd, vfloat16m4_t vs1,
                                vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmsub_tu(vfloat16m4_t vd, _Float16 rs1, vfloat16m4_t vs2,
                                unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmsub_tu(vfloat16m8_t vd, vfloat16m8_t vs1,
                                vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmsub_tu(vfloat16m8_t vd, _Float16 rs1, vfloat16m8_t vs2,
                                unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmsub_tu(vfloat32mf2_t vd, vfloat32mf2_t vs1,
                                 vfloat32mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat32mf2_t __riscv_vfnmsub_tu(vfloat32mf2_t vd, float rs1, vfloat32mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmsub_tu(vfloat32m1_t vd, vfloat32m1_t vs1,
                                vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmsub_tu(vfloat32m1_t vd, float rs1, vfloat32m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmsub_tu(vfloat32m2_t vd, vfloat32m2_t vs1,
                                vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmsub_tu(vfloat32m2_t vd, float rs1, vfloat32m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmsub_tu(vfloat32m4_t vd, vfloat32m4_t vs1,
                                vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmsub_tu(vfloat32m4_t vd, float rs1, vfloat32m4_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmsub_tu(vfloat32m8_t vd, vfloat32m8_t vs1,
                                vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmsub_tu(vfloat32m8_t vd, float rs1, vfloat32m8_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmsub_tu(vfloat64m1_t vd, vfloat64m1_t vs1,
                                vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmsub_tu(vfloat64m1_t vd, double rs1, vfloat64m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmsub_tu(vfloat64m2_t vd, vfloat64m2_t vs1,
                                vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmsub_tu(vfloat64m2_t vd, double rs1, vfloat64m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmsub_tu(vfloat64m4_t vd, vfloat64m4_t vs1,
                                vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmsub_tu(vfloat64m4_t vd, double rs1, vfloat64m4_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmsub_tu(vfloat64m8_t vd, vfloat64m8_t vs1,
                                vfloat64m8_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmsub_tu(vfloat64m8_t vd, double rs1, vfloat64m8_t vs2,
                                unsigned int frm, size_t vl);
// masked functions
// __riscv_vfmacc_tum overloads with an explicit `frm` argument, covering
// vfloat16 (mf4..m8), vfloat32 (mf2..m8) and vfloat64 (m1..m8). Each type has
// a vector-vector form (vs1) and a vector-scalar form (rs1: _Float16 / float /
// double). The first argument is the mask vm of type vboolN_t, where N is the
// element width divided by LMUL (e.g. vfloat16mf4_t pairs with vbool64_t).
// The return type always matches the type of vd; vl is passed as size_t.
// NOTE(review): per the RISC-V V spec vfmacc computes +(vs1 * vs2) + vd; the
// `_tum` suffix presumably means tail-undisturbed / mask-agnostic and `frm`
// the rounding mode -- none of this is shown here; confirm against the specs.
vfloat16mf4_t __riscv_vfmacc_tum(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmacc_tum(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                 vfloat16mf4_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16mf2_t __riscv_vfmacc_tum(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmacc_tum(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                 vfloat16mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16m1_t __riscv_vfmacc_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs1,
                                vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmacc_tum(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmacc_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                                vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmacc_tum(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmacc_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                                vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmacc_tum(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmacc_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                                vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmacc_tum(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmacc_tum(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmacc_tum(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                 vfloat32mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat32m1_t __riscv_vfmacc_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs1,
                                vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmacc_tum(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmacc_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs1,
                                vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmacc_tum(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmacc_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                                vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmacc_tum(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmacc_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                                vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmacc_tum(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmacc_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs1,
                                vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmacc_tum(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmacc_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs1,
                                vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmacc_tum(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmacc_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs1,
                                vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmacc_tum(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmacc_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                                vfloat64m8_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmacc_tum(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                vfloat64m8_t vs2, unsigned int frm, size_t vl);
// __riscv_vfnmacc_tum overloads with an explicit `frm` argument, covering
// vfloat16 (mf4..m8), vfloat32 (mf2..m8) and vfloat64 (m1..m8). Each type has
// a vector-vector form (vs1) and a vector-scalar form (rs1: _Float16 / float /
// double). The first argument is the mask vm of type vboolN_t, where N is the
// element width divided by LMUL (e.g. vfloat32m1_t pairs with vbool32_t).
// The return type always matches the type of vd; vl is passed as size_t.
// NOTE(review): per the RISC-V V spec vfnmacc computes -(vs1 * vs2) - vd; the
// `_tum` suffix presumably means tail-undisturbed / mask-agnostic and `frm`
// the rounding mode -- none of this is shown here; confirm against the specs.
vfloat16mf4_t __riscv_vfnmacc_tum(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfnmacc_tum(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                  vfloat16mf4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16mf2_t __riscv_vfnmacc_tum(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmacc_tum(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                  vfloat16mf2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16m1_t __riscv_vfnmacc_tum(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat16m1_t vs1, vfloat16m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmacc_tum(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                 vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmacc_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                                 vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmacc_tum(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                 vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmacc_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                                 vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmacc_tum(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                 vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmacc_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                                 vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmacc_tum(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                 vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmacc_tum(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmacc_tum(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                  vfloat32mf2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m1_t __riscv_vfnmacc_tum(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat32m1_t vs1, vfloat32m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmacc_tum(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                 vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmacc_tum(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat32m2_t vs1, vfloat32m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmacc_tum(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                 vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmacc_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                                 vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmacc_tum(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                 vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmacc_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                                 vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmacc_tum(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                 vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmacc_tum(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat64m1_t vs1, vfloat64m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmacc_tum(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                 vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmacc_tum(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat64m2_t vs1, vfloat64m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmacc_tum(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                 vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmacc_tum(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat64m4_t vs1, vfloat64m4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmacc_tum(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                 vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmacc_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                                 vfloat64m8_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmacc_tum(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                 vfloat64m8_t vs2, unsigned int frm, size_t vl);
// __riscv_vfmsac_tum overloads with an explicit `frm` argument, covering
// vfloat16 (mf4..m8), vfloat32 (mf2..m8) and vfloat64 (m1..m8). Each type has
// a vector-vector form (vs1) and a vector-scalar form (rs1: _Float16 / float /
// double). The first argument is the mask vm of type vboolN_t, where N is the
// element width divided by LMUL (e.g. vfloat64m8_t pairs with vbool8_t).
// The return type always matches the type of vd; vl is passed as size_t.
// NOTE(review): per the RISC-V V spec vfmsac computes +(vs1 * vs2) - vd; the
// `_tum` suffix presumably means tail-undisturbed / mask-agnostic and `frm`
// the rounding mode -- none of this is shown here; confirm against the specs.
vfloat16mf4_t __riscv_vfmsac_tum(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmsac_tum(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                 vfloat16mf4_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16mf2_t __riscv_vfmsac_tum(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmsac_tum(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                 vfloat16mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16m1_t __riscv_vfmsac_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs1,
                                vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmsac_tum(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmsac_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                                vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmsac_tum(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmsac_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                                vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmsac_tum(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmsac_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                                vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmsac_tum(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmsac_tum(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmsac_tum(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                 vfloat32mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat32m1_t __riscv_vfmsac_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs1,
                                vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmsac_tum(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmsac_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs1,
                                vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmsac_tum(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmsac_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                                vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmsac_tum(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmsac_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                                vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmsac_tum(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmsac_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs1,
                                vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmsac_tum(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmsac_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs1,
                                vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmsac_tum(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmsac_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs1,
                                vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmsac_tum(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmsac_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                                vfloat64m8_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmsac_tum(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                vfloat64m8_t vs2, unsigned int frm, size_t vl);
// __riscv_vfnmsac_tum overloads with an explicit `frm` argument, covering
// vfloat16 (mf4..m8), vfloat32 (mf2..m8) and vfloat64 (m1..m8). Each type has
// a vector-vector form (vs1) and a vector-scalar form (rs1: _Float16 / float /
// double). The first argument is the mask vm of type vboolN_t, where N is the
// element width divided by LMUL (e.g. vfloat16m8_t pairs with vbool2_t).
// The return type always matches the type of vd; vl is passed as size_t.
// NOTE(review): per the RISC-V V spec vfnmsac computes -(vs1 * vs2) + vd; the
// `_tum` suffix presumably means tail-undisturbed / mask-agnostic and `frm`
// the rounding mode -- none of this is shown here; confirm against the specs.
vfloat16mf4_t __riscv_vfnmsac_tum(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfnmsac_tum(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                  vfloat16mf4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16mf2_t __riscv_vfnmsac_tum(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmsac_tum(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                  vfloat16mf2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16m1_t __riscv_vfnmsac_tum(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat16m1_t vs1, vfloat16m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmsac_tum(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                 vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmsac_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                                 vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmsac_tum(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                 vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmsac_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                                 vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmsac_tum(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                 vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmsac_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                                 vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmsac_tum(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                 vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmsac_tum(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmsac_tum(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                  vfloat32mf2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m1_t __riscv_vfnmsac_tum(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat32m1_t vs1, vfloat32m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmsac_tum(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                 vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmsac_tum(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat32m2_t vs1, vfloat32m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmsac_tum(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                 vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmsac_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                                 vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmsac_tum(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                 vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmsac_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                                 vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmsac_tum(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                 vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmsac_tum(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat64m1_t vs1, vfloat64m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmsac_tum(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                 vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmsac_tum(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat64m2_t vs1, vfloat64m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmsac_tum(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                 vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmsac_tum(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat64m4_t vs1, vfloat64m4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmsac_tum(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                 vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmsac_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                                 vfloat64m8_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmsac_tum(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                 vfloat64m8_t vs2, unsigned int frm, size_t vl);
// __riscv_vfmadd_tum overloads with an explicit `frm` argument, covering
// vfloat16 (mf4..m8), vfloat32 (mf2..m8) and vfloat64 (m1..m8). Each type has
// a vector-vector form (vs1) and a vector-scalar form (rs1: _Float16 / float /
// double). The first argument is the mask vm of type vboolN_t, where N is the
// element width divided by LMUL (e.g. vfloat32mf2_t pairs with vbool64_t).
// The return type always matches the type of vd; vl is passed as size_t.
// NOTE(review): per the RISC-V V spec vfmadd computes +(vs1 * vd) + vs2; the
// `_tum` suffix presumably means tail-undisturbed / mask-agnostic and `frm`
// the rounding mode -- none of this is shown here; confirm against the specs.
vfloat16mf4_t __riscv_vfmadd_tum(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmadd_tum(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                 vfloat16mf4_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16mf2_t __riscv_vfmadd_tum(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmadd_tum(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                 vfloat16mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16m1_t __riscv_vfmadd_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs1,
                                vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmadd_tum(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmadd_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                                vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmadd_tum(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmadd_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                                vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmadd_tum(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmadd_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                                vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmadd_tum(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmadd_tum(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmadd_tum(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                 vfloat32mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat32m1_t __riscv_vfmadd_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs1,
                                vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmadd_tum(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmadd_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs1,
                                vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmadd_tum(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmadd_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                                vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmadd_tum(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmadd_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                                vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmadd_tum(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmadd_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs1,
                                vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmadd_tum(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmadd_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs1,
                                vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmadd_tum(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmadd_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs1,
                                vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmadd_tum(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmadd_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                                vfloat64m8_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmadd_tum(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                vfloat64m8_t vs2, unsigned int frm, size_t vl);
// __riscv_vfnmadd_tum overloads with an explicit `frm` argument, covering
// vfloat16 (mf4..m8), vfloat32 (mf2..m8) and vfloat64 (m1..m8). Each type has
// a vector-vector form (vs1) and a vector-scalar form (rs1: _Float16 / float /
// double). The first argument is the mask vm of type vboolN_t, where N is the
// element width divided by LMUL (e.g. vfloat64m1_t pairs with vbool64_t).
// The return type always matches the type of vd; vl is passed as size_t.
// NOTE(review): per the RISC-V V spec vfnmadd computes -(vs1 * vd) - vs2; the
// `_tum` suffix presumably means tail-undisturbed / mask-agnostic and `frm`
// the rounding mode -- none of this is shown here; confirm against the specs.
vfloat16mf4_t __riscv_vfnmadd_tum(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfnmadd_tum(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                  vfloat16mf4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16mf2_t __riscv_vfnmadd_tum(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmadd_tum(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                  vfloat16mf2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16m1_t __riscv_vfnmadd_tum(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat16m1_t vs1, vfloat16m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmadd_tum(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                 vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmadd_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                                 vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmadd_tum(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                 vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmadd_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                                 vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmadd_tum(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                 vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmadd_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                                 vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmadd_tum(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                 vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmadd_tum(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmadd_tum(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                  vfloat32mf2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m1_t __riscv_vfnmadd_tum(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat32m1_t vs1, vfloat32m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmadd_tum(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                 vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmadd_tum(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat32m2_t vs1, vfloat32m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmadd_tum(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                 vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmadd_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                                 vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmadd_tum(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                 vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmadd_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                                 vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmadd_tum(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                 vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmadd_tum(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat64m1_t vs1, vfloat64m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmadd_tum(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                 vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmadd_tum(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat64m2_t vs1, vfloat64m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmadd_tum(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                 vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmadd_tum(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat64m4_t vs1, vfloat64m4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmadd_tum(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                 vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmadd_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                                 vfloat64m8_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmadd_tum(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                 vfloat64m8_t vs2, unsigned int frm, size_t vl);
// __riscv_vfmsub_tum: overloaded masked prototypes taking an explicit rounding
// mode. Every float16/float32/float64 LMUL listed below has two forms:
// vector-vector (vs1) and vector-scalar (rs1). Arguments: mask vm, vd (same
// type as the result), vs1/rs1, vs2, rounding mode frm, vector length vl.
// NOTE(review): per the RVV ISA spec vfmsub computes vd = (vs1 * vd) - vs2 and
// the _tum suffix means tail-undisturbed, mask-agnostic -- confirm.
vfloat16mf4_t __riscv_vfmsub_tum(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmsub_tum(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                 vfloat16mf4_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16mf2_t __riscv_vfmsub_tum(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmsub_tum(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                 vfloat16mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16m1_t __riscv_vfmsub_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs1,
                                vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmsub_tum(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmsub_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                                vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmsub_tum(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmsub_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                                vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmsub_tum(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmsub_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                                vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmsub_tum(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmsub_tum(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmsub_tum(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                 vfloat32mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat32m1_t __riscv_vfmsub_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs1,
                                vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmsub_tum(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmsub_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs1,
                                vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmsub_tum(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmsub_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                                vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmsub_tum(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmsub_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                                vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmsub_tum(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmsub_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs1,
                                vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmsub_tum(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmsub_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs1,
                                vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmsub_tum(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmsub_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs1,
                                vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmsub_tum(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmsub_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                                vfloat64m8_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmsub_tum(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                vfloat64m8_t vs2, unsigned int frm, size_t vl);
// __riscv_vfnmsub_tum: overloaded masked prototypes taking an explicit
// rounding mode. Every float16/float32/float64 LMUL listed below has two
// forms: vector-vector (vs1) and vector-scalar (rs1). Arguments: mask vm, vd
// (same type as the result), vs1/rs1, vs2, rounding mode frm, vector length vl.
// NOTE(review): per the RVV ISA spec vfnmsub computes vd = -(vs1 * vd) + vs2
// and the _tum suffix means tail-undisturbed, mask-agnostic -- confirm.
vfloat16mf4_t __riscv_vfnmsub_tum(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfnmsub_tum(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                  vfloat16mf4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16mf2_t __riscv_vfnmsub_tum(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmsub_tum(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                  vfloat16mf2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16m1_t __riscv_vfnmsub_tum(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat16m1_t vs1, vfloat16m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmsub_tum(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                 vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmsub_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                                 vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmsub_tum(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                 vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmsub_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                                 vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmsub_tum(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                 vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmsub_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                                 vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmsub_tum(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                 vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmsub_tum(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmsub_tum(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                  vfloat32mf2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m1_t __riscv_vfnmsub_tum(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat32m1_t vs1, vfloat32m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmsub_tum(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                 vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmsub_tum(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat32m2_t vs1, vfloat32m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmsub_tum(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                 vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmsub_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                                 vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmsub_tum(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                 vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmsub_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                                 vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmsub_tum(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                 vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmsub_tum(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat64m1_t vs1, vfloat64m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmsub_tum(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                 vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmsub_tum(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat64m2_t vs1, vfloat64m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmsub_tum(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                 vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmsub_tum(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat64m4_t vs1, vfloat64m4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmsub_tum(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                 vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmsub_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                                 vfloat64m8_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmsub_tum(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                 vfloat64m8_t vs2, unsigned int frm, size_t vl);
// masked functions (_tumu policy variants)
// __riscv_vfmacc_tumu: overloaded masked prototypes taking an explicit
// rounding mode. Every float16/float32/float64 LMUL listed below has two
// forms: vector-vector (vs1) and vector-scalar (rs1). Arguments: mask vm, vd
// (same type as the result), vs1/rs1, vs2, rounding mode frm, vector length vl.
// NOTE(review): per the RVV ISA spec vfmacc computes vd = (vs1 * vs2) + vd and
// the _tumu suffix means tail-undisturbed, mask-undisturbed -- confirm.
vfloat16mf4_t __riscv_vfmacc_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmacc_tumu(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                  vfloat16mf4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16mf2_t __riscv_vfmacc_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmacc_tumu(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                  vfloat16mf2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16m1_t __riscv_vfmacc_tumu(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat16m1_t vs1, vfloat16m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmacc_tumu(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                 vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmacc_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                                 vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmacc_tumu(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                 vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmacc_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                                 vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmacc_tumu(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                 vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmacc_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                                 vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmacc_tumu(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                 vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmacc_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmacc_tumu(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                  vfloat32mf2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m1_t __riscv_vfmacc_tumu(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat32m1_t vs1, vfloat32m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmacc_tumu(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                 vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmacc_tumu(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat32m2_t vs1, vfloat32m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmacc_tumu(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                 vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmacc_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                                 vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmacc_tumu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                 vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmacc_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                                 vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmacc_tumu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                 vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmacc_tumu(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat64m1_t vs1, vfloat64m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmacc_tumu(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                 vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmacc_tumu(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat64m2_t vs1, vfloat64m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmacc_tumu(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                 vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmacc_tumu(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat64m4_t vs1, vfloat64m4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmacc_tumu(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                 vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmacc_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                                 vfloat64m8_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmacc_tumu(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                 vfloat64m8_t vs2, unsigned int frm, size_t vl);
// __riscv_vfnmacc_tumu: overloaded masked prototypes taking an explicit
// rounding mode. Every float16/float32/float64 LMUL listed below has two
// forms: vector-vector (vs1) and vector-scalar (rs1). Arguments: mask vm, vd
// (same type as the result), vs1/rs1, vs2, rounding mode frm, vector length vl.
// NOTE(review): per the RVV ISA spec vfnmacc computes vd = -(vs1 * vs2) - vd
// and the _tumu suffix means tail-undisturbed, mask-undisturbed -- confirm.
vfloat16mf4_t __riscv_vfnmacc_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                   vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                   unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfnmacc_tumu(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                   vfloat16mf4_t vs2, unsigned int frm,
                                   size_t vl);
vfloat16mf2_t __riscv_vfnmacc_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                   vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                   unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmacc_tumu(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                   vfloat16mf2_t vs2, unsigned int frm,
                                   size_t vl);
vfloat16m1_t __riscv_vfnmacc_tumu(vbool16_t vm, vfloat16m1_t vd,
                                  vfloat16m1_t vs1, vfloat16m1_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmacc_tumu(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                  vfloat16m1_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16m2_t __riscv_vfnmacc_tumu(vbool8_t vm, vfloat16m2_t vd,
                                  vfloat16m2_t vs1, vfloat16m2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmacc_tumu(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                  vfloat16m2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16m4_t __riscv_vfnmacc_tumu(vbool4_t vm, vfloat16m4_t vd,
                                  vfloat16m4_t vs1, vfloat16m4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmacc_tumu(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                  vfloat16m4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16m8_t __riscv_vfnmacc_tumu(vbool2_t vm, vfloat16m8_t vd,
                                  vfloat16m8_t vs1, vfloat16m8_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmacc_tumu(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                  vfloat16m8_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32mf2_t __riscv_vfnmacc_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                   unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmacc_tumu(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                   vfloat32mf2_t vs2, unsigned int frm,
                                   size_t vl);
vfloat32m1_t __riscv_vfnmacc_tumu(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat32m1_t vs1, vfloat32m1_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmacc_tumu(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                  vfloat32m1_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m2_t __riscv_vfnmacc_tumu(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat32m2_t vs1, vfloat32m2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmacc_tumu(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                  vfloat32m2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m4_t __riscv_vfnmacc_tumu(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat32m4_t vs1, vfloat32m4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmacc_tumu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                  vfloat32m4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m8_t __riscv_vfnmacc_tumu(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat32m8_t vs1, vfloat32m8_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmacc_tumu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                  vfloat32m8_t vs2, unsigned int frm,
                                  size_t vl);
vfloat64m1_t __riscv_vfnmacc_tumu(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat64m1_t vs1, vfloat64m1_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmacc_tumu(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                  vfloat64m1_t vs2, unsigned int frm,
                                  size_t vl);
vfloat64m2_t __riscv_vfnmacc_tumu(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat64m2_t vs1, vfloat64m2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmacc_tumu(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                  vfloat64m2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat64m4_t __riscv_vfnmacc_tumu(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat64m4_t vs1, vfloat64m4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmacc_tumu(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                  vfloat64m4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat64m8_t __riscv_vfnmacc_tumu(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat64m8_t vs1, vfloat64m8_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmacc_tumu(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                  vfloat64m8_t vs2, unsigned int frm,
                                  size_t vl);
// __riscv_vfmsac_tumu: overloaded masked prototypes taking an explicit
// rounding mode. Every float16/float32/float64 LMUL listed below has two
// forms: vector-vector (vs1) and vector-scalar (rs1). Arguments: mask vm, vd
// (same type as the result), vs1/rs1, vs2, rounding mode frm, vector length vl.
// NOTE(review): per the RVV ISA spec vfmsac computes vd = (vs1 * vs2) - vd and
// the _tumu suffix means tail-undisturbed, mask-undisturbed -- confirm.
vfloat16mf4_t __riscv_vfmsac_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmsac_tumu(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                  vfloat16mf4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16mf2_t __riscv_vfmsac_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmsac_tumu(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                  vfloat16mf2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16m1_t __riscv_vfmsac_tumu(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat16m1_t vs1, vfloat16m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmsac_tumu(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                 vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmsac_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                                 vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmsac_tumu(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                 vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmsac_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                                 vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmsac_tumu(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                 vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmsac_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                                 vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmsac_tumu(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                 vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmsac_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmsac_tumu(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                  vfloat32mf2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m1_t __riscv_vfmsac_tumu(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat32m1_t vs1, vfloat32m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmsac_tumu(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                 vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmsac_tumu(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat32m2_t vs1, vfloat32m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmsac_tumu(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                 vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmsac_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                                 vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmsac_tumu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                 vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmsac_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                                 vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmsac_tumu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                 vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmsac_tumu(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat64m1_t vs1, vfloat64m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmsac_tumu(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                 vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmsac_tumu(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat64m2_t vs1, vfloat64m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmsac_tumu(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                 vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmsac_tumu(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat64m4_t vs1, vfloat64m4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmsac_tumu(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                 vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmsac_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                                 vfloat64m8_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmsac_tumu(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                 vfloat64m8_t vs2, unsigned int frm, size_t vl);
// __riscv_vfnmsac_tumu: overloaded masked prototypes taking an explicit
// rounding mode. Every float16/float32/float64 LMUL listed below has two
// forms: vector-vector (vs1) and vector-scalar (rs1). Arguments: mask vm, vd
// (same type as the result), vs1/rs1, vs2, rounding mode frm, vector length vl.
// NOTE(review): per the RVV ISA spec vfnmsac computes vd = -(vs1 * vs2) + vd
// and the _tumu suffix means tail-undisturbed, mask-undisturbed -- confirm.
vfloat16mf4_t __riscv_vfnmsac_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                   vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                   unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfnmsac_tumu(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                   vfloat16mf4_t vs2, unsigned int frm,
                                   size_t vl);
vfloat16mf2_t __riscv_vfnmsac_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                   vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                   unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmsac_tumu(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                   vfloat16mf2_t vs2, unsigned int frm,
                                   size_t vl);
vfloat16m1_t __riscv_vfnmsac_tumu(vbool16_t vm, vfloat16m1_t vd,
                                  vfloat16m1_t vs1, vfloat16m1_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmsac_tumu(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                  vfloat16m1_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16m2_t __riscv_vfnmsac_tumu(vbool8_t vm, vfloat16m2_t vd,
                                  vfloat16m2_t vs1, vfloat16m2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmsac_tumu(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                  vfloat16m2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16m4_t __riscv_vfnmsac_tumu(vbool4_t vm, vfloat16m4_t vd,
                                  vfloat16m4_t vs1, vfloat16m4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmsac_tumu(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                  vfloat16m4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16m8_t __riscv_vfnmsac_tumu(vbool2_t vm, vfloat16m8_t vd,
                                  vfloat16m8_t vs1, vfloat16m8_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmsac_tumu(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                  vfloat16m8_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32mf2_t __riscv_vfnmsac_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                   unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmsac_tumu(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                   vfloat32mf2_t vs2, unsigned int frm,
                                   size_t vl);
vfloat32m1_t __riscv_vfnmsac_tumu(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat32m1_t vs1, vfloat32m1_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmsac_tumu(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                  vfloat32m1_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m2_t __riscv_vfnmsac_tumu(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat32m2_t vs1, vfloat32m2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmsac_tumu(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                  vfloat32m2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m4_t __riscv_vfnmsac_tumu(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat32m4_t vs1, vfloat32m4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmsac_tumu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                  vfloat32m4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m8_t __riscv_vfnmsac_tumu(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat32m8_t vs1, vfloat32m8_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmsac_tumu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                  vfloat32m8_t vs2, unsigned int frm,
                                  size_t vl);
vfloat64m1_t __riscv_vfnmsac_tumu(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat64m1_t vs1, vfloat64m1_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmsac_tumu(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                  vfloat64m1_t vs2, unsigned int frm,
                                  size_t vl);
vfloat64m2_t __riscv_vfnmsac_tumu(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat64m2_t vs1, vfloat64m2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmsac_tumu(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                  vfloat64m2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat64m4_t __riscv_vfnmsac_tumu(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat64m4_t vs1, vfloat64m4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmsac_tumu(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                  vfloat64m4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat64m8_t __riscv_vfnmsac_tumu(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat64m8_t vs1, vfloat64m8_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmsac_tumu(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                  vfloat64m8_t vs2, unsigned int frm,
                                  size_t vl);
// __riscv_vfmadd_tumu: overloaded masked prototypes taking an explicit
// rounding mode, in vector-vector (vs1) and vector-scalar (rs1) forms.
// Arguments: mask vm, vd (same type as the result), vs1/rs1, vs2, rounding
// mode frm, vector length vl.
// NOTE(review): per the RVV ISA spec vfmadd computes vd = (vs1 * vd) + vs2 and
// the _tumu suffix means tail-undisturbed, mask-undisturbed -- confirm.
vfloat16mf4_t __riscv_vfmadd_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmadd_tumu(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                  vfloat16mf4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16mf2_t __riscv_vfmadd_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmadd_tumu(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                  vfloat16mf2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16m1_t __riscv_vfmadd_tumu(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat16m1_t vs1, vfloat16m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmadd_tumu(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                 vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmadd_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                                 vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmadd_tumu(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                 vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmadd_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                                 vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmadd_tumu(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                 vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmadd_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                                 vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmadd_tumu(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                 vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmadd_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmadd_tumu(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                  vfloat32mf2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m1_t __riscv_vfmadd_tumu(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat32m1_t vs1, vfloat32m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmadd_tumu(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                 vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmadd_tumu(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat32m2_t vs1, vfloat32m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmadd_tumu(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                 vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmadd_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                                 vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmadd_tumu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                 vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmadd_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                                 vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmadd_tumu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                 vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmadd_tumu(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat64m1_t vs1, vfloat64m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmadd_tumu(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                 vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmadd_tumu(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat64m2_t vs1, vfloat64m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmadd_tumu(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                 vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmadd_tumu(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat64m4_t vs1, vfloat64m4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmadd_tumu(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                 vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmadd_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                                 vfloat64m8_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmadd_tumu(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                 vfloat64m8_t vs2, unsigned int frm, size_t vl);
// __riscv_vfnmadd_tumu: overloaded declarations, one pair per vfloat16/32/64
// vector type listed below. In each pair the first overload takes a vector
// operand `vs1` and the second a scalar `rs1` (_Float16, float or double,
// matching the element width of the vector type). Every overload also takes a
// mask `vm`, a vector `vd` (whose type is also the return type), a vector
// `vs2`, an `unsigned int frm` and a `size_t vl`.
// NOTE(review): per the RISC-V V spec, vfnmadd is presumably
// vd[i] = -(vs1[i] * vd[i]) - vs2[i]; `_tumu` presumably selects the
// tail-undisturbed, mask-undisturbed policy and `frm` presumably carries the
// floating-point rounding mode - confirm against the spec.
vfloat16mf4_t __riscv_vfnmadd_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                   vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                   unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfnmadd_tumu(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                   vfloat16mf4_t vs2, unsigned int frm,
                                   size_t vl);
vfloat16mf2_t __riscv_vfnmadd_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                   vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                   unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmadd_tumu(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                   vfloat16mf2_t vs2, unsigned int frm,
                                   size_t vl);
vfloat16m1_t __riscv_vfnmadd_tumu(vbool16_t vm, vfloat16m1_t vd,
                                  vfloat16m1_t vs1, vfloat16m1_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmadd_tumu(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                  vfloat16m1_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16m2_t __riscv_vfnmadd_tumu(vbool8_t vm, vfloat16m2_t vd,
                                  vfloat16m2_t vs1, vfloat16m2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmadd_tumu(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                  vfloat16m2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16m4_t __riscv_vfnmadd_tumu(vbool4_t vm, vfloat16m4_t vd,
                                  vfloat16m4_t vs1, vfloat16m4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmadd_tumu(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                  vfloat16m4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16m8_t __riscv_vfnmadd_tumu(vbool2_t vm, vfloat16m8_t vd,
                                  vfloat16m8_t vs1, vfloat16m8_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmadd_tumu(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                  vfloat16m8_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32mf2_t __riscv_vfnmadd_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                   unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmadd_tumu(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                   vfloat32mf2_t vs2, unsigned int frm,
                                   size_t vl);
vfloat32m1_t __riscv_vfnmadd_tumu(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat32m1_t vs1, vfloat32m1_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmadd_tumu(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                  vfloat32m1_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m2_t __riscv_vfnmadd_tumu(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat32m2_t vs1, vfloat32m2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmadd_tumu(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                  vfloat32m2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m4_t __riscv_vfnmadd_tumu(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat32m4_t vs1, vfloat32m4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmadd_tumu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                  vfloat32m4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m8_t __riscv_vfnmadd_tumu(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat32m8_t vs1, vfloat32m8_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmadd_tumu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                  vfloat32m8_t vs2, unsigned int frm,
                                  size_t vl);
vfloat64m1_t __riscv_vfnmadd_tumu(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat64m1_t vs1, vfloat64m1_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmadd_tumu(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                  vfloat64m1_t vs2, unsigned int frm,
                                  size_t vl);
vfloat64m2_t __riscv_vfnmadd_tumu(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat64m2_t vs1, vfloat64m2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmadd_tumu(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                  vfloat64m2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat64m4_t __riscv_vfnmadd_tumu(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat64m4_t vs1, vfloat64m4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmadd_tumu(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                  vfloat64m4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat64m8_t __riscv_vfnmadd_tumu(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat64m8_t vs1, vfloat64m8_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmadd_tumu(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                  vfloat64m8_t vs2, unsigned int frm,
                                  size_t vl);
// __riscv_vfmsub_tumu: overloaded declarations, one pair per vfloat16/32/64
// vector type listed below. In each pair the first overload takes a vector
// operand `vs1` and the second a scalar `rs1` (_Float16, float or double,
// matching the element width of the vector type). Every overload also takes a
// mask `vm`, a vector `vd` (whose type is also the return type), a vector
// `vs2`, an `unsigned int frm` and a `size_t vl`.
// NOTE(review): per the RISC-V V spec, vfmsub is presumably
// vd[i] = +(vs1[i] * vd[i]) - vs2[i]; `_tumu` presumably selects the
// tail-undisturbed, mask-undisturbed policy and `frm` presumably carries the
// floating-point rounding mode - confirm against the spec.
vfloat16mf4_t __riscv_vfmsub_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmsub_tumu(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                  vfloat16mf4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16mf2_t __riscv_vfmsub_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmsub_tumu(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                  vfloat16mf2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16m1_t __riscv_vfmsub_tumu(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat16m1_t vs1, vfloat16m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmsub_tumu(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                 vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmsub_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                                 vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmsub_tumu(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                 vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmsub_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                                 vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmsub_tumu(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                 vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmsub_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                                 vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmsub_tumu(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                 vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmsub_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmsub_tumu(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                  vfloat32mf2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m1_t __riscv_vfmsub_tumu(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat32m1_t vs1, vfloat32m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmsub_tumu(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                 vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmsub_tumu(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat32m2_t vs1, vfloat32m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmsub_tumu(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                 vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmsub_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                                 vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmsub_tumu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                 vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmsub_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                                 vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmsub_tumu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                 vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmsub_tumu(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat64m1_t vs1, vfloat64m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmsub_tumu(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                 vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmsub_tumu(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat64m2_t vs1, vfloat64m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmsub_tumu(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                 vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmsub_tumu(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat64m4_t vs1, vfloat64m4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmsub_tumu(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                 vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmsub_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                                 vfloat64m8_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmsub_tumu(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                 vfloat64m8_t vs2, unsigned int frm, size_t vl);
// __riscv_vfnmsub_tumu: overloaded declarations, one pair per vfloat16/32/64
// vector type listed below. In each pair the first overload takes a vector
// operand `vs1` and the second a scalar `rs1` (_Float16, float or double,
// matching the element width of the vector type). Every overload also takes a
// mask `vm`, a vector `vd` (whose type is also the return type), a vector
// `vs2`, an `unsigned int frm` and a `size_t vl`.
// NOTE(review): per the RISC-V V spec, vfnmsub is presumably
// vd[i] = -(vs1[i] * vd[i]) + vs2[i]; `_tumu` presumably selects the
// tail-undisturbed, mask-undisturbed policy and `frm` presumably carries the
// floating-point rounding mode - confirm against the spec.
vfloat16mf4_t __riscv_vfnmsub_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                   vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                   unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfnmsub_tumu(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                   vfloat16mf4_t vs2, unsigned int frm,
                                   size_t vl);
vfloat16mf2_t __riscv_vfnmsub_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                   vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                   unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmsub_tumu(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                   vfloat16mf2_t vs2, unsigned int frm,
                                   size_t vl);
vfloat16m1_t __riscv_vfnmsub_tumu(vbool16_t vm, vfloat16m1_t vd,
                                  vfloat16m1_t vs1, vfloat16m1_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmsub_tumu(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                  vfloat16m1_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16m2_t __riscv_vfnmsub_tumu(vbool8_t vm, vfloat16m2_t vd,
                                  vfloat16m2_t vs1, vfloat16m2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmsub_tumu(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                  vfloat16m2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16m4_t __riscv_vfnmsub_tumu(vbool4_t vm, vfloat16m4_t vd,
                                  vfloat16m4_t vs1, vfloat16m4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmsub_tumu(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                  vfloat16m4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16m8_t __riscv_vfnmsub_tumu(vbool2_t vm, vfloat16m8_t vd,
                                  vfloat16m8_t vs1, vfloat16m8_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmsub_tumu(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                  vfloat16m8_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32mf2_t __riscv_vfnmsub_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                   unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmsub_tumu(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                   vfloat32mf2_t vs2, unsigned int frm,
                                   size_t vl);
vfloat32m1_t __riscv_vfnmsub_tumu(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat32m1_t vs1, vfloat32m1_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmsub_tumu(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                  vfloat32m1_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m2_t __riscv_vfnmsub_tumu(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat32m2_t vs1, vfloat32m2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmsub_tumu(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                  vfloat32m2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m4_t __riscv_vfnmsub_tumu(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat32m4_t vs1, vfloat32m4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmsub_tumu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                  vfloat32m4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m8_t __riscv_vfnmsub_tumu(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat32m8_t vs1, vfloat32m8_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmsub_tumu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                  vfloat32m8_t vs2, unsigned int frm,
                                  size_t vl);
vfloat64m1_t __riscv_vfnmsub_tumu(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat64m1_t vs1, vfloat64m1_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmsub_tumu(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                  vfloat64m1_t vs2, unsigned int frm,
                                  size_t vl);
vfloat64m2_t __riscv_vfnmsub_tumu(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat64m2_t vs1, vfloat64m2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmsub_tumu(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                  vfloat64m2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat64m4_t __riscv_vfnmsub_tumu(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat64m4_t vs1, vfloat64m4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmsub_tumu(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                  vfloat64m4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat64m8_t __riscv_vfnmsub_tumu(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat64m8_t vs1, vfloat64m8_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmsub_tumu(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                  vfloat64m8_t vs2, unsigned int frm,
                                  size_t vl);
// masked functions
// __riscv_vfmacc_mu: overloaded declarations, one pair per vfloat16/32/64
// vector type listed below. In each pair the first overload takes a vector
// operand `vs1` and the second a scalar `rs1` (_Float16, float or double,
// matching the element width of the vector type). Every overload also takes a
// mask `vm`, a vector `vd` (whose type is also the return type), a vector
// `vs2`, an `unsigned int frm` and a `size_t vl`.
// NOTE(review): per the RISC-V V spec, vfmacc is presumably
// vd[i] = +(vs1[i] * vs2[i]) + vd[i]; `_mu` presumably selects the
// mask-undisturbed policy (tail left agnostic) and `frm` presumably carries
// the floating-point rounding mode - confirm against the spec.
vfloat16mf4_t __riscv_vfmacc_mu(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmacc_mu(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                vfloat16mf4_t vs2, unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmacc_mu(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmacc_mu(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                vfloat16mf2_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmacc_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs1,
                               vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmacc_mu(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                               vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmacc_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                               vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmacc_mu(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                               vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmacc_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                               vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmacc_mu(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                               vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmacc_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                               vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmacc_mu(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                               vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmacc_mu(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmacc_mu(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                vfloat32mf2_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmacc_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs1,
                               vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmacc_mu(vbool32_t vm, vfloat32m1_t vd, float rs1,
                               vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmacc_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs1,
                               vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmacc_mu(vbool16_t vm, vfloat32m2_t vd, float rs1,
                               vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmacc_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                               vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmacc_mu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                               vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmacc_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                               vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmacc_mu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                               vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmacc_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs1,
                               vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmacc_mu(vbool64_t vm, vfloat64m1_t vd, double rs1,
                               vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmacc_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs1,
                               vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmacc_mu(vbool32_t vm, vfloat64m2_t vd, double rs1,
                               vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmacc_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs1,
                               vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmacc_mu(vbool16_t vm, vfloat64m4_t vd, double rs1,
                               vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmacc_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                               vfloat64m8_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmacc_mu(vbool8_t vm, vfloat64m8_t vd, double rs1,
                               vfloat64m8_t vs2, unsigned int frm, size_t vl);
// __riscv_vfnmacc_mu: overloaded declarations, one pair per vfloat16/32/64
// vector type listed below. In each pair the first overload takes a vector
// operand `vs1` and the second a scalar `rs1` (_Float16, float or double,
// matching the element width of the vector type). Every overload also takes a
// mask `vm`, a vector `vd` (whose type is also the return type), a vector
// `vs2`, an `unsigned int frm` and a `size_t vl`.
// NOTE(review): per the RISC-V V spec, vfnmacc is presumably
// vd[i] = -(vs1[i] * vs2[i]) - vd[i]; `_mu` presumably selects the
// mask-undisturbed policy (tail left agnostic) and `frm` presumably carries
// the floating-point rounding mode - confirm against the spec.
vfloat16mf4_t __riscv_vfnmacc_mu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfnmacc_mu(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                 vfloat16mf4_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16mf2_t __riscv_vfnmacc_mu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmacc_mu(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                 vfloat16mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16m1_t __riscv_vfnmacc_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs1,
                                vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmacc_mu(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmacc_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                                vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmacc_mu(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmacc_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                                vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmacc_mu(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmacc_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                                vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmacc_mu(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmacc_mu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmacc_mu(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                 vfloat32mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat32m1_t __riscv_vfnmacc_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs1,
                                vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmacc_mu(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmacc_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs1,
                                vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmacc_mu(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmacc_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                                vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmacc_mu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmacc_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                                vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmacc_mu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmacc_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs1,
                                vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmacc_mu(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmacc_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs1,
                                vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmacc_mu(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmacc_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs1,
                                vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmacc_mu(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmacc_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                                vfloat64m8_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmacc_mu(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                vfloat64m8_t vs2, unsigned int frm, size_t vl);
// __riscv_vfmsac_mu: overloaded declarations, listed per vector type with the
// vector-operand (`vs1`) form first and the scalar-operand (`rs1`: _Float16,
// float or double) form second. Each overload shown takes a mask `vm`, a
// vector `vd` (whose type is also the return type), a vector `vs2`, an
// `unsigned int frm` and a `size_t vl`.
// NOTE(review): per the RISC-V V spec, vfmsac is presumably
// vd[i] = +(vs1[i] * vs2[i]) - vd[i]; `_mu` presumably selects the
// mask-undisturbed policy (tail left agnostic) and `frm` presumably carries
// the floating-point rounding mode - confirm against the spec.
vfloat16mf4_t __riscv_vfmsac_mu(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmsac_mu(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                vfloat16mf4_t vs2, unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmsac_mu(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmsac_mu(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                vfloat16mf2_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmsac_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs1,
                               vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmsac_mu(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                               vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmsac_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                               vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmsac_mu(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                               vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmsac_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                               vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmsac_mu(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                               vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmsac_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                               vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmsac_mu(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                               vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmsac_mu(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmsac_mu(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                vfloat32mf2_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmsac_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs1,
                               vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmsac_mu(vbool32_t vm, vfloat32m1_t vd, float rs1,
                               vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmsac_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs1,
                               vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmsac_mu(vbool16_t vm, vfloat32m2_t vd, float rs1,
                               vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmsac_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                               vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmsac_mu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                               vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmsac_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                               vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmsac_mu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                               vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmsac_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs1,
                               vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmsac_mu(vbool64_t vm, vfloat64m1_t vd, double rs1,
                               vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmsac_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs1,
                               vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmsac_mu(vbool32_t vm, vfloat64m2_t vd, double rs1,
                               vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmsac_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs1,
                               vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmsac_mu(vbool16_t vm, vfloat64m4_t vd, double rs1,
                               vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmsac_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                               vfloat64m8_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmsac_mu(vbool8_t vm, vfloat64m8_t vd, double rs1,
                               vfloat64m8_t vs2, unsigned int frm, size_t vl);
/*
 * __riscv_vfnmsac_mu overloads with an explicit frm argument.
 *
 * For every result type from vfloat16mf4_t through vfloat64m8_t there is a
 * vector-vector form (vs1) and a vector-scalar form (rs1: _Float16, float or
 * double to match the element type). Arguments: vm is the mask (vboolN_t
 * paired with the result type), vd has the same type as the return value,
 * vs2 is a vector operand, frm is an unsigned int and vl a size_t.
 *
 * NOTE(review): per the RVV ISA spec vfnmsac is expected to compute
 * vd = -(vs1 * vs2) + vd, `_mu` to mean masked-off elements keep vd, frm to
 * select the rounding mode and vl the element count; none of this is visible
 * in the prototypes themselves - confirm against the spec.
 */
vfloat16mf4_t __riscv_vfnmsac_mu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfnmsac_mu(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                 vfloat16mf4_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16mf2_t __riscv_vfnmsac_mu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmsac_mu(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                 vfloat16mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16m1_t __riscv_vfnmsac_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs1,
                                vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmsac_mu(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmsac_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                                vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmsac_mu(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmsac_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                                vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmsac_mu(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmsac_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                                vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmsac_mu(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmsac_mu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmsac_mu(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                 vfloat32mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat32m1_t __riscv_vfnmsac_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs1,
                                vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmsac_mu(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmsac_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs1,
                                vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmsac_mu(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmsac_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                                vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmsac_mu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmsac_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                                vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmsac_mu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmsac_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs1,
                                vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmsac_mu(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmsac_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs1,
                                vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmsac_mu(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmsac_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs1,
                                vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmsac_mu(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmsac_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                                vfloat64m8_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmsac_mu(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                vfloat64m8_t vs2, unsigned int frm, size_t vl);
/*
 * __riscv_vfmadd_mu overloads with an explicit frm argument.
 *
 * For every result type from vfloat16mf4_t through vfloat64m8_t there is a
 * vector-vector form (vs1) and a vector-scalar form (rs1: _Float16, float or
 * double to match the element type). Arguments: vm is the mask (vboolN_t
 * paired with the result type), vd has the same type as the return value,
 * vs2 is a vector operand, frm is an unsigned int and vl a size_t.
 *
 * NOTE(review): per the RVV ISA spec vfmadd is expected to compute
 * vd = (vs1 * vd) + vs2 (vd is a multiplicand, unlike the *acc/*sac forms),
 * `_mu` to mean masked-off elements keep vd, frm to select the rounding mode
 * and vl the element count; none of this is visible in the prototypes
 * themselves - confirm against the spec.
 */
vfloat16mf4_t __riscv_vfmadd_mu(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmadd_mu(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                vfloat16mf4_t vs2, unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmadd_mu(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmadd_mu(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                vfloat16mf2_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmadd_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs1,
                               vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmadd_mu(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                               vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmadd_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                               vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmadd_mu(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                               vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmadd_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                               vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmadd_mu(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                               vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmadd_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                               vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmadd_mu(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                               vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmadd_mu(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmadd_mu(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                vfloat32mf2_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmadd_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs1,
                               vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmadd_mu(vbool32_t vm, vfloat32m1_t vd, float rs1,
                               vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmadd_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs1,
                               vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmadd_mu(vbool16_t vm, vfloat32m2_t vd, float rs1,
                               vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmadd_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                               vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmadd_mu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                               vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmadd_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                               vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmadd_mu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                               vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmadd_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs1,
                               vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmadd_mu(vbool64_t vm, vfloat64m1_t vd, double rs1,
                               vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmadd_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs1,
                               vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmadd_mu(vbool32_t vm, vfloat64m2_t vd, double rs1,
                               vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmadd_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs1,
                               vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmadd_mu(vbool16_t vm, vfloat64m4_t vd, double rs1,
                               vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmadd_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                               vfloat64m8_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmadd_mu(vbool8_t vm, vfloat64m8_t vd, double rs1,
                               vfloat64m8_t vs2, unsigned int frm, size_t vl);
/*
 * __riscv_vfnmadd_mu overloads with an explicit frm argument.
 *
 * For every result type from vfloat16mf4_t through vfloat64m8_t there is a
 * vector-vector form (vs1) and a vector-scalar form (rs1: _Float16, float or
 * double to match the element type). Arguments: vm is the mask (vboolN_t
 * paired with the result type), vd has the same type as the return value,
 * vs2 is a vector operand, frm is an unsigned int and vl a size_t.
 *
 * NOTE(review): per the RVV ISA spec vfnmadd is expected to compute
 * vd = -(vs1 * vd) - vs2, `_mu` to mean masked-off elements keep vd, frm to
 * select the rounding mode and vl the element count; none of this is visible
 * in the prototypes themselves - confirm against the spec.
 */
vfloat16mf4_t __riscv_vfnmadd_mu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfnmadd_mu(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                 vfloat16mf4_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16mf2_t __riscv_vfnmadd_mu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmadd_mu(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                 vfloat16mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16m1_t __riscv_vfnmadd_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs1,
                                vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmadd_mu(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmadd_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                                vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmadd_mu(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmadd_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                                vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmadd_mu(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmadd_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                                vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmadd_mu(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmadd_mu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmadd_mu(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                 vfloat32mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat32m1_t __riscv_vfnmadd_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs1,
                                vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmadd_mu(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmadd_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs1,
                                vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmadd_mu(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmadd_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                                vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmadd_mu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmadd_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                                vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmadd_mu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmadd_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs1,
                                vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmadd_mu(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmadd_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs1,
                                vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmadd_mu(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmadd_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs1,
                                vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmadd_mu(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmadd_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                                vfloat64m8_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmadd_mu(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                vfloat64m8_t vs2, unsigned int frm, size_t vl);
/*
 * __riscv_vfmsub_mu overloads with an explicit frm argument.
 *
 * For every result type from vfloat16mf4_t through vfloat64m8_t there is a
 * vector-vector form (vs1) and a vector-scalar form (rs1: _Float16, float or
 * double to match the element type). Arguments: vm is the mask (vboolN_t
 * paired with the result type), vd has the same type as the return value,
 * vs2 is a vector operand, frm is an unsigned int and vl a size_t.
 *
 * NOTE(review): per the RVV ISA spec vfmsub is expected to compute
 * vd = (vs1 * vd) - vs2, `_mu` to mean masked-off elements keep vd, frm to
 * select the rounding mode and vl the element count; none of this is visible
 * in the prototypes themselves - confirm against the spec.
 */
vfloat16mf4_t __riscv_vfmsub_mu(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfmsub_mu(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                vfloat16mf4_t vs2, unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmsub_mu(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfmsub_mu(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                vfloat16mf2_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmsub_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs1,
                               vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfmsub_mu(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                               vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmsub_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                               vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfmsub_mu(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                               vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmsub_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                               vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfmsub_mu(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                               vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmsub_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                               vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfmsub_mu(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                               vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmsub_mu(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfmsub_mu(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                vfloat32mf2_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmsub_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs1,
                               vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfmsub_mu(vbool32_t vm, vfloat32m1_t vd, float rs1,
                               vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmsub_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs1,
                               vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfmsub_mu(vbool16_t vm, vfloat32m2_t vd, float rs1,
                               vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmsub_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                               vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfmsub_mu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                               vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmsub_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                               vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfmsub_mu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                               vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmsub_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs1,
                               vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfmsub_mu(vbool64_t vm, vfloat64m1_t vd, double rs1,
                               vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmsub_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs1,
                               vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfmsub_mu(vbool32_t vm, vfloat64m2_t vd, double rs1,
                               vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmsub_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs1,
                               vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfmsub_mu(vbool16_t vm, vfloat64m4_t vd, double rs1,
                               vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmsub_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                               vfloat64m8_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfmsub_mu(vbool8_t vm, vfloat64m8_t vd, double rs1,
                               vfloat64m8_t vs2, unsigned int frm, size_t vl);
/*
 * __riscv_vfnmsub_mu overloads with an explicit frm argument.
 *
 * For every result type from vfloat16mf4_t through vfloat64m8_t there is a
 * vector-vector form (vs1) and a vector-scalar form (rs1: _Float16, float or
 * double to match the element type). Arguments: vm is the mask (vboolN_t
 * paired with the result type), vd has the same type as the return value,
 * vs2 is a vector operand, frm is an unsigned int and vl a size_t.
 *
 * NOTE(review): per the RVV ISA spec vfnmsub is expected to compute
 * vd = -(vs1 * vd) + vs2, `_mu` to mean masked-off elements keep vd, frm to
 * select the rounding mode and vl the element count; none of this is visible
 * in the prototypes themselves - confirm against the spec.
 */
vfloat16mf4_t __riscv_vfnmsub_mu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfnmsub_mu(vbool64_t vm, vfloat16mf4_t vd, _Float16 rs1,
                                 vfloat16mf4_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16mf2_t __riscv_vfnmsub_mu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfnmsub_mu(vbool32_t vm, vfloat16mf2_t vd, _Float16 rs1,
                                 vfloat16mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16m1_t __riscv_vfnmsub_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs1,
                                vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfnmsub_mu(vbool16_t vm, vfloat16m1_t vd, _Float16 rs1,
                                vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmsub_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs1,
                                vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfnmsub_mu(vbool8_t vm, vfloat16m2_t vd, _Float16 rs1,
                                vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmsub_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs1,
                                vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfnmsub_mu(vbool4_t vm, vfloat16m4_t vd, _Float16 rs1,
                                vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmsub_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs1,
                                vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfnmsub_mu(vbool2_t vm, vfloat16m8_t vd, _Float16 rs1,
                                vfloat16m8_t vs2, unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmsub_mu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfnmsub_mu(vbool64_t vm, vfloat32mf2_t vd, float rs1,
                                 vfloat32mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat32m1_t __riscv_vfnmsub_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs1,
                                vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfnmsub_mu(vbool32_t vm, vfloat32m1_t vd, float rs1,
                                vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmsub_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs1,
                                vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfnmsub_mu(vbool16_t vm, vfloat32m2_t vd, float rs1,
                                vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmsub_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs1,
                                vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfnmsub_mu(vbool8_t vm, vfloat32m4_t vd, float rs1,
                                vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmsub_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs1,
                                vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfnmsub_mu(vbool4_t vm, vfloat32m8_t vd, float rs1,
                                vfloat32m8_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmsub_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs1,
                                vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfnmsub_mu(vbool64_t vm, vfloat64m1_t vd, double rs1,
                                vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmsub_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs1,
                                vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfnmsub_mu(vbool32_t vm, vfloat64m2_t vd, double rs1,
                                vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmsub_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs1,
                                vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfnmsub_mu(vbool16_t vm, vfloat64m4_t vd, double rs1,
                                vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmsub_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs1,
                                vfloat64m8_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfnmsub_mu(vbool8_t vm, vfloat64m8_t vd, double rs1,
                                vfloat64m8_t vs2, unsigned int frm, size_t vl);

Vector Widening Floating-Point Fused Multiply-Add Intrinsics

/*
 * __riscv_vfwmacc_tu overloads (widening fused multiply-add).
 *
 * The result/accumulator vd has twice the element width of the source
 * operands: float16 sources produce float32 results (mf2..m8) and float32
 * sources produce float64 results (m1..m8). Each result type has a
 * vector-vector form (vs1) and a vector-scalar form whose scalar operand is
 * named rs1 (_Float16 or float), matching the scalar naming used by the
 * single-width fused multiply-add overloads. vs2 is a vector operand of the
 * narrow type and vl is a size_t.
 *
 * NOTE(review): per the RVV ISA spec vfwmacc is expected to compute
 * vd = (vs1 * vs2) + vd, `_tu` to mean tail elements keep vd, and vl to be
 * the element count; none of this is visible in the prototypes themselves -
 * confirm against the spec.
 */
vfloat32mf2_t __riscv_vfwmacc_tu(vfloat32mf2_t vd, vfloat16mf4_t vs1,
                                 vfloat16mf4_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfwmacc_tu(vfloat32mf2_t vd, _Float16 rs1,
                                 vfloat16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwmacc_tu(vfloat32m1_t vd, vfloat16mf2_t vs1,
                                vfloat16mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwmacc_tu(vfloat32m1_t vd, _Float16 rs1,
                                vfloat16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwmacc_tu(vfloat32m2_t vd, vfloat16m1_t vs1,
                                vfloat16m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwmacc_tu(vfloat32m2_t vd, _Float16 rs1, vfloat16m1_t vs2,
                                size_t vl);
vfloat32m4_t __riscv_vfwmacc_tu(vfloat32m4_t vd, vfloat16m2_t vs1,
                                vfloat16m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwmacc_tu(vfloat32m4_t vd, _Float16 rs1, vfloat16m2_t vs2,
                                size_t vl);
vfloat32m8_t __riscv_vfwmacc_tu(vfloat32m8_t vd, vfloat16m4_t vs1,
                                vfloat16m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwmacc_tu(vfloat32m8_t vd, _Float16 rs1, vfloat16m4_t vs2,
                                size_t vl);
vfloat64m1_t __riscv_vfwmacc_tu(vfloat64m1_t vd, vfloat32mf2_t vs1,
                                vfloat32mf2_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwmacc_tu(vfloat64m1_t vd, float rs1, vfloat32mf2_t vs2,
                                size_t vl);
vfloat64m2_t __riscv_vfwmacc_tu(vfloat64m2_t vd, vfloat32m1_t vs1,
                                vfloat32m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwmacc_tu(vfloat64m2_t vd, float rs1, vfloat32m1_t vs2,
                                size_t vl);
vfloat64m4_t __riscv_vfwmacc_tu(vfloat64m4_t vd, vfloat32m2_t vs1,
                                vfloat32m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwmacc_tu(vfloat64m4_t vd, float rs1, vfloat32m2_t vs2,
                                size_t vl);
vfloat64m8_t __riscv_vfwmacc_tu(vfloat64m8_t vd, vfloat32m4_t vs1,
                                vfloat32m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwmacc_tu(vfloat64m8_t vd, float rs1, vfloat32m4_t vs2,
                                size_t vl);
// __riscv_vfwnmacc_tu: overloaded widening prototypes without a mask operand.
// vd has the same type as the return value; vs1 and vs2 use the element type
// of half the width (float16 -> float32, float32 -> float64). Each result
// type has two overloads: vs1 as a vector, and vs1 as a scalar
// (_Float16 / float).
// NOTE(review): presumably vd = -(vs1 * vs2) - vd at the widened width, per
// the RVV "V" extension spec — confirm against the spec.
vfloat32mf2_t __riscv_vfwnmacc_tu(vfloat32mf2_t vd, vfloat16mf4_t vs1,
                                  vfloat16mf4_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfwnmacc_tu(vfloat32mf2_t vd, _Float16 vs1,
                                  vfloat16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwnmacc_tu(vfloat32m1_t vd, vfloat16mf2_t vs1,
                                 vfloat16mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwnmacc_tu(vfloat32m1_t vd, _Float16 vs1,
                                 vfloat16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwnmacc_tu(vfloat32m2_t vd, vfloat16m1_t vs1,
                                 vfloat16m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwnmacc_tu(vfloat32m2_t vd, _Float16 vs1,
                                 vfloat16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwnmacc_tu(vfloat32m4_t vd, vfloat16m2_t vs1,
                                 vfloat16m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwnmacc_tu(vfloat32m4_t vd, _Float16 vs1,
                                 vfloat16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwnmacc_tu(vfloat32m8_t vd, vfloat16m4_t vs1,
                                 vfloat16m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwnmacc_tu(vfloat32m8_t vd, _Float16 vs1,
                                 vfloat16m4_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwnmacc_tu(vfloat64m1_t vd, vfloat32mf2_t vs1,
                                 vfloat32mf2_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwnmacc_tu(vfloat64m1_t vd, float vs1, vfloat32mf2_t vs2,
                                 size_t vl);
vfloat64m2_t __riscv_vfwnmacc_tu(vfloat64m2_t vd, vfloat32m1_t vs1,
                                 vfloat32m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwnmacc_tu(vfloat64m2_t vd, float vs1, vfloat32m1_t vs2,
                                 size_t vl);
vfloat64m4_t __riscv_vfwnmacc_tu(vfloat64m4_t vd, vfloat32m2_t vs1,
                                 vfloat32m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwnmacc_tu(vfloat64m4_t vd, float vs1, vfloat32m2_t vs2,
                                 size_t vl);
vfloat64m8_t __riscv_vfwnmacc_tu(vfloat64m8_t vd, vfloat32m4_t vs1,
                                 vfloat32m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwnmacc_tu(vfloat64m8_t vd, float vs1, vfloat32m4_t vs2,
                                 size_t vl);
// __riscv_vfwmsac_tu: overloaded widening prototypes without a mask operand.
// vd has the same type as the return value; vs1 and vs2 use the element type
// of half the width (float16 -> float32, float32 -> float64). Each result
// type has two overloads: vs1 as a vector, and vs1 as a scalar
// (_Float16 / float).
// NOTE(review): presumably vd = (vs1 * vs2) - vd at the widened width, per
// the RVV "V" extension spec — confirm against the spec.
vfloat32mf2_t __riscv_vfwmsac_tu(vfloat32mf2_t vd, vfloat16mf4_t vs1,
                                 vfloat16mf4_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfwmsac_tu(vfloat32mf2_t vd, _Float16 vs1,
                                 vfloat16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwmsac_tu(vfloat32m1_t vd, vfloat16mf2_t vs1,
                                vfloat16mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwmsac_tu(vfloat32m1_t vd, _Float16 vs1,
                                vfloat16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwmsac_tu(vfloat32m2_t vd, vfloat16m1_t vs1,
                                vfloat16m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwmsac_tu(vfloat32m2_t vd, _Float16 vs1, vfloat16m1_t vs2,
                                size_t vl);
vfloat32m4_t __riscv_vfwmsac_tu(vfloat32m4_t vd, vfloat16m2_t vs1,
                                vfloat16m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwmsac_tu(vfloat32m4_t vd, _Float16 vs1, vfloat16m2_t vs2,
                                size_t vl);
vfloat32m8_t __riscv_vfwmsac_tu(vfloat32m8_t vd, vfloat16m4_t vs1,
                                vfloat16m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwmsac_tu(vfloat32m8_t vd, _Float16 vs1, vfloat16m4_t vs2,
                                size_t vl);
vfloat64m1_t __riscv_vfwmsac_tu(vfloat64m1_t vd, vfloat32mf2_t vs1,
                                vfloat32mf2_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwmsac_tu(vfloat64m1_t vd, float vs1, vfloat32mf2_t vs2,
                                size_t vl);
vfloat64m2_t __riscv_vfwmsac_tu(vfloat64m2_t vd, vfloat32m1_t vs1,
                                vfloat32m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwmsac_tu(vfloat64m2_t vd, float vs1, vfloat32m1_t vs2,
                                size_t vl);
vfloat64m4_t __riscv_vfwmsac_tu(vfloat64m4_t vd, vfloat32m2_t vs1,
                                vfloat32m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwmsac_tu(vfloat64m4_t vd, float vs1, vfloat32m2_t vs2,
                                size_t vl);
vfloat64m8_t __riscv_vfwmsac_tu(vfloat64m8_t vd, vfloat32m4_t vs1,
                                vfloat32m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwmsac_tu(vfloat64m8_t vd, float vs1, vfloat32m4_t vs2,
                                size_t vl);
// __riscv_vfwnmsac_tu: overloaded widening prototypes without a mask operand.
// vd has the same type as the return value; vs1 and vs2 use the element type
// of half the width (float16 -> float32, float32 -> float64). Each result
// type has two overloads: vs1 as a vector, and vs1 as a scalar
// (_Float16 / float).
// NOTE(review): presumably vd = -(vs1 * vs2) + vd at the widened width, per
// the RVV "V" extension spec — confirm against the spec.
vfloat32mf2_t __riscv_vfwnmsac_tu(vfloat32mf2_t vd, vfloat16mf4_t vs1,
                                  vfloat16mf4_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfwnmsac_tu(vfloat32mf2_t vd, _Float16 vs1,
                                  vfloat16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwnmsac_tu(vfloat32m1_t vd, vfloat16mf2_t vs1,
                                 vfloat16mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwnmsac_tu(vfloat32m1_t vd, _Float16 vs1,
                                 vfloat16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwnmsac_tu(vfloat32m2_t vd, vfloat16m1_t vs1,
                                 vfloat16m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwnmsac_tu(vfloat32m2_t vd, _Float16 vs1,
                                 vfloat16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwnmsac_tu(vfloat32m4_t vd, vfloat16m2_t vs1,
                                 vfloat16m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwnmsac_tu(vfloat32m4_t vd, _Float16 vs1,
                                 vfloat16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwnmsac_tu(vfloat32m8_t vd, vfloat16m4_t vs1,
                                 vfloat16m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwnmsac_tu(vfloat32m8_t vd, _Float16 vs1,
                                 vfloat16m4_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwnmsac_tu(vfloat64m1_t vd, vfloat32mf2_t vs1,
                                 vfloat32mf2_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwnmsac_tu(vfloat64m1_t vd, float vs1, vfloat32mf2_t vs2,
                                 size_t vl);
vfloat64m2_t __riscv_vfwnmsac_tu(vfloat64m2_t vd, vfloat32m1_t vs1,
                                 vfloat32m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwnmsac_tu(vfloat64m2_t vd, float vs1, vfloat32m1_t vs2,
                                 size_t vl);
vfloat64m4_t __riscv_vfwnmsac_tu(vfloat64m4_t vd, vfloat32m2_t vs1,
                                 vfloat32m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwnmsac_tu(vfloat64m4_t vd, float vs1, vfloat32m2_t vs2,
                                 size_t vl);
vfloat64m8_t __riscv_vfwnmsac_tu(vfloat64m8_t vd, vfloat32m4_t vs1,
                                 vfloat32m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwnmsac_tu(vfloat64m8_t vd, float vs1, vfloat32m4_t vs2,
                                 size_t vl);
// masked functions (_tum variants: tail-undisturbed, mask-agnostic policy)
// __riscv_vfwmacc_tum: overloaded widening prototypes taking a mask. vm (a
// vboolN_t) comes first, followed by vd, which has the same type as the
// return value. vs1 and vs2 use the element type of half the width
// (float16 -> float32, float32 -> float64); vs1 is either a vector or a
// scalar (_Float16 / float).
// NOTE(review): presumably vd = (vs1 * vs2) + vd at the widened width, per
// the RVV "V" extension spec — confirm against the spec.
vfloat32mf2_t __riscv_vfwmacc_tum(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                  size_t vl);
vfloat32mf2_t __riscv_vfwmacc_tum(vbool64_t vm, vfloat32mf2_t vd, _Float16 vs1,
                                  vfloat16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwmacc_tum(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                 size_t vl);
vfloat32m1_t __riscv_vfwmacc_tum(vbool32_t vm, vfloat32m1_t vd, _Float16 vs1,
                                 vfloat16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwmacc_tum(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat16m1_t vs1, vfloat16m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwmacc_tum(vbool16_t vm, vfloat32m2_t vd, _Float16 vs1,
                                 vfloat16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwmacc_tum(vbool8_t vm, vfloat32m4_t vd, vfloat16m2_t vs1,
                                 vfloat16m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwmacc_tum(vbool8_t vm, vfloat32m4_t vd, _Float16 vs1,
                                 vfloat16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwmacc_tum(vbool4_t vm, vfloat32m8_t vd, vfloat16m4_t vs1,
                                 vfloat16m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwmacc_tum(vbool4_t vm, vfloat32m8_t vd, _Float16 vs1,
                                 vfloat16m4_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwmacc_tum(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                 size_t vl);
vfloat64m1_t __riscv_vfwmacc_tum(vbool64_t vm, vfloat64m1_t vd, float vs1,
                                 vfloat32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwmacc_tum(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat32m1_t vs1, vfloat32m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwmacc_tum(vbool32_t vm, vfloat64m2_t vd, float vs1,
                                 vfloat32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwmacc_tum(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat32m2_t vs1, vfloat32m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwmacc_tum(vbool16_t vm, vfloat64m4_t vd, float vs1,
                                 vfloat32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwmacc_tum(vbool8_t vm, vfloat64m8_t vd, vfloat32m4_t vs1,
                                 vfloat32m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwmacc_tum(vbool8_t vm, vfloat64m8_t vd, float vs1,
                                 vfloat32m4_t vs2, size_t vl);
// __riscv_vfwnmacc_tum: overloaded widening prototypes taking a mask. vm (a
// vboolN_t) comes first, followed by vd, which has the same type as the
// return value. vs1 and vs2 use the element type of half the width
// (float16 -> float32, float32 -> float64); vs1 is either a vector or a
// scalar (_Float16 / float).
// NOTE(review): presumably vd = -(vs1 * vs2) - vd at the widened width, per
// the RVV "V" extension spec — confirm against the spec.
vfloat32mf2_t __riscv_vfwnmacc_tum(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                   size_t vl);
vfloat32mf2_t __riscv_vfwnmacc_tum(vbool64_t vm, vfloat32mf2_t vd, _Float16 vs1,
                                   vfloat16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwnmacc_tum(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                  size_t vl);
vfloat32m1_t __riscv_vfwnmacc_tum(vbool32_t vm, vfloat32m1_t vd, _Float16 vs1,
                                  vfloat16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwnmacc_tum(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat16m1_t vs1, vfloat16m1_t vs2,
                                  size_t vl);
vfloat32m2_t __riscv_vfwnmacc_tum(vbool16_t vm, vfloat32m2_t vd, _Float16 vs1,
                                  vfloat16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwnmacc_tum(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat16m2_t vs1, vfloat16m2_t vs2,
                                  size_t vl);
vfloat32m4_t __riscv_vfwnmacc_tum(vbool8_t vm, vfloat32m4_t vd, _Float16 vs1,
                                  vfloat16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwnmacc_tum(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat16m4_t vs1, vfloat16m4_t vs2,
                                  size_t vl);
vfloat32m8_t __riscv_vfwnmacc_tum(vbool4_t vm, vfloat32m8_t vd, _Float16 vs1,
                                  vfloat16m4_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwnmacc_tum(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                  size_t vl);
vfloat64m1_t __riscv_vfwnmacc_tum(vbool64_t vm, vfloat64m1_t vd, float vs1,
                                  vfloat32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwnmacc_tum(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat32m1_t vs1, vfloat32m1_t vs2,
                                  size_t vl);
vfloat64m2_t __riscv_vfwnmacc_tum(vbool32_t vm, vfloat64m2_t vd, float vs1,
                                  vfloat32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwnmacc_tum(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat32m2_t vs1, vfloat32m2_t vs2,
                                  size_t vl);
vfloat64m4_t __riscv_vfwnmacc_tum(vbool16_t vm, vfloat64m4_t vd, float vs1,
                                  vfloat32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwnmacc_tum(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat32m4_t vs1, vfloat32m4_t vs2,
                                  size_t vl);
vfloat64m8_t __riscv_vfwnmacc_tum(vbool8_t vm, vfloat64m8_t vd, float vs1,
                                  vfloat32m4_t vs2, size_t vl);
// __riscv_vfwmsac_tum: overloaded widening prototypes taking a mask. vm (a
// vboolN_t) comes first, followed by vd, which has the same type as the
// return value. vs1 and vs2 use the element type of half the width
// (float16 -> float32, float32 -> float64); vs1 is either a vector or a
// scalar (_Float16 / float).
// NOTE(review): presumably vd = (vs1 * vs2) - vd at the widened width, per
// the RVV "V" extension spec — confirm against the spec.
vfloat32mf2_t __riscv_vfwmsac_tum(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                  size_t vl);
vfloat32mf2_t __riscv_vfwmsac_tum(vbool64_t vm, vfloat32mf2_t vd, _Float16 vs1,
                                  vfloat16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwmsac_tum(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                 size_t vl);
vfloat32m1_t __riscv_vfwmsac_tum(vbool32_t vm, vfloat32m1_t vd, _Float16 vs1,
                                 vfloat16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwmsac_tum(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat16m1_t vs1, vfloat16m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwmsac_tum(vbool16_t vm, vfloat32m2_t vd, _Float16 vs1,
                                 vfloat16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwmsac_tum(vbool8_t vm, vfloat32m4_t vd, vfloat16m2_t vs1,
                                 vfloat16m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwmsac_tum(vbool8_t vm, vfloat32m4_t vd, _Float16 vs1,
                                 vfloat16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwmsac_tum(vbool4_t vm, vfloat32m8_t vd, vfloat16m4_t vs1,
                                 vfloat16m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwmsac_tum(vbool4_t vm, vfloat32m8_t vd, _Float16 vs1,
                                 vfloat16m4_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwmsac_tum(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                 size_t vl);
vfloat64m1_t __riscv_vfwmsac_tum(vbool64_t vm, vfloat64m1_t vd, float vs1,
                                 vfloat32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwmsac_tum(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat32m1_t vs1, vfloat32m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwmsac_tum(vbool32_t vm, vfloat64m2_t vd, float vs1,
                                 vfloat32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwmsac_tum(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat32m2_t vs1, vfloat32m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwmsac_tum(vbool16_t vm, vfloat64m4_t vd, float vs1,
                                 vfloat32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwmsac_tum(vbool8_t vm, vfloat64m8_t vd, vfloat32m4_t vs1,
                                 vfloat32m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwmsac_tum(vbool8_t vm, vfloat64m8_t vd, float vs1,
                                 vfloat32m4_t vs2, size_t vl);
// __riscv_vfwnmsac_tum: overloaded widening prototypes taking a mask. vm (a
// vboolN_t) comes first, followed by vd, which has the same type as the
// return value. vs1 and vs2 use the element type of half the width
// (float16 -> float32, float32 -> float64); vs1 is either a vector or a
// scalar (_Float16 / float).
// NOTE(review): presumably vd = -(vs1 * vs2) + vd at the widened width, per
// the RVV "V" extension spec — confirm against the spec.
vfloat32mf2_t __riscv_vfwnmsac_tum(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                   size_t vl);
vfloat32mf2_t __riscv_vfwnmsac_tum(vbool64_t vm, vfloat32mf2_t vd, _Float16 vs1,
                                   vfloat16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwnmsac_tum(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                  size_t vl);
vfloat32m1_t __riscv_vfwnmsac_tum(vbool32_t vm, vfloat32m1_t vd, _Float16 vs1,
                                  vfloat16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwnmsac_tum(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat16m1_t vs1, vfloat16m1_t vs2,
                                  size_t vl);
vfloat32m2_t __riscv_vfwnmsac_tum(vbool16_t vm, vfloat32m2_t vd, _Float16 vs1,
                                  vfloat16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwnmsac_tum(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat16m2_t vs1, vfloat16m2_t vs2,
                                  size_t vl);
vfloat32m4_t __riscv_vfwnmsac_tum(vbool8_t vm, vfloat32m4_t vd, _Float16 vs1,
                                  vfloat16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwnmsac_tum(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat16m4_t vs1, vfloat16m4_t vs2,
                                  size_t vl);
vfloat32m8_t __riscv_vfwnmsac_tum(vbool4_t vm, vfloat32m8_t vd, _Float16 vs1,
                                  vfloat16m4_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwnmsac_tum(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                  size_t vl);
vfloat64m1_t __riscv_vfwnmsac_tum(vbool64_t vm, vfloat64m1_t vd, float vs1,
                                  vfloat32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwnmsac_tum(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat32m1_t vs1, vfloat32m1_t vs2,
                                  size_t vl);
vfloat64m2_t __riscv_vfwnmsac_tum(vbool32_t vm, vfloat64m2_t vd, float vs1,
                                  vfloat32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwnmsac_tum(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat32m2_t vs1, vfloat32m2_t vs2,
                                  size_t vl);
vfloat64m4_t __riscv_vfwnmsac_tum(vbool16_t vm, vfloat64m4_t vd, float vs1,
                                  vfloat32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwnmsac_tum(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat32m4_t vs1, vfloat32m4_t vs2,
                                  size_t vl);
vfloat64m8_t __riscv_vfwnmsac_tum(vbool8_t vm, vfloat64m8_t vd, float vs1,
                                  vfloat32m4_t vs2, size_t vl);
// masked functions (_tumu variants: tail-undisturbed, mask-undisturbed policy)
// __riscv_vfwmacc_tumu: overloaded widening prototypes taking a mask. vm (a
// vboolN_t) comes first, followed by vd, which has the same type as the
// return value. vs1 and vs2 use the element type of half the width
// (float16 -> float32, float32 -> float64); vs1 is either a vector or a
// scalar (_Float16 / float).
// NOTE(review): presumably vd = (vs1 * vs2) + vd at the widened width, per
// the RVV "V" extension spec — confirm against the spec.
vfloat32mf2_t __riscv_vfwmacc_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                   size_t vl);
vfloat32mf2_t __riscv_vfwmacc_tumu(vbool64_t vm, vfloat32mf2_t vd, _Float16 vs1,
                                   vfloat16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwmacc_tumu(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                  size_t vl);
vfloat32m1_t __riscv_vfwmacc_tumu(vbool32_t vm, vfloat32m1_t vd, _Float16 vs1,
                                  vfloat16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwmacc_tumu(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat16m1_t vs1, vfloat16m1_t vs2,
                                  size_t vl);
vfloat32m2_t __riscv_vfwmacc_tumu(vbool16_t vm, vfloat32m2_t vd, _Float16 vs1,
                                  vfloat16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwmacc_tumu(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat16m2_t vs1, vfloat16m2_t vs2,
                                  size_t vl);
vfloat32m4_t __riscv_vfwmacc_tumu(vbool8_t vm, vfloat32m4_t vd, _Float16 vs1,
                                  vfloat16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwmacc_tumu(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat16m4_t vs1, vfloat16m4_t vs2,
                                  size_t vl);
vfloat32m8_t __riscv_vfwmacc_tumu(vbool4_t vm, vfloat32m8_t vd, _Float16 vs1,
                                  vfloat16m4_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwmacc_tumu(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                  size_t vl);
vfloat64m1_t __riscv_vfwmacc_tumu(vbool64_t vm, vfloat64m1_t vd, float vs1,
                                  vfloat32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwmacc_tumu(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat32m1_t vs1, vfloat32m1_t vs2,
                                  size_t vl);
vfloat64m2_t __riscv_vfwmacc_tumu(vbool32_t vm, vfloat64m2_t vd, float vs1,
                                  vfloat32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwmacc_tumu(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat32m2_t vs1, vfloat32m2_t vs2,
                                  size_t vl);
vfloat64m4_t __riscv_vfwmacc_tumu(vbool16_t vm, vfloat64m4_t vd, float vs1,
                                  vfloat32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwmacc_tumu(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat32m4_t vs1, vfloat32m4_t vs2,
                                  size_t vl);
vfloat64m8_t __riscv_vfwmacc_tumu(vbool8_t vm, vfloat64m8_t vd, float vs1,
                                  vfloat32m4_t vs2, size_t vl);
// __riscv_vfwnmacc_tumu: overloaded widening prototypes taking a mask. vm (a
// vboolN_t) comes first, followed by vd, which has the same type as the
// return value. vs1 and vs2 use the element type of half the width
// (float16 -> float32, float32 -> float64); vs1 is either a vector or a
// scalar (_Float16 / float).
// NOTE(review): presumably vd = -(vs1 * vs2) - vd at the widened width, per
// the RVV "V" extension spec — confirm against the spec.
vfloat32mf2_t __riscv_vfwnmacc_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                    vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                    size_t vl);
vfloat32mf2_t __riscv_vfwnmacc_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                    _Float16 vs1, vfloat16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwnmacc_tumu(vbool32_t vm, vfloat32m1_t vd,
                                   vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                   size_t vl);
vfloat32m1_t __riscv_vfwnmacc_tumu(vbool32_t vm, vfloat32m1_t vd, _Float16 vs1,
                                   vfloat16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwnmacc_tumu(vbool16_t vm, vfloat32m2_t vd,
                                   vfloat16m1_t vs1, vfloat16m1_t vs2,
                                   size_t vl);
vfloat32m2_t __riscv_vfwnmacc_tumu(vbool16_t vm, vfloat32m2_t vd, _Float16 vs1,
                                   vfloat16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwnmacc_tumu(vbool8_t vm, vfloat32m4_t vd,
                                   vfloat16m2_t vs1, vfloat16m2_t vs2,
                                   size_t vl);
vfloat32m4_t __riscv_vfwnmacc_tumu(vbool8_t vm, vfloat32m4_t vd, _Float16 vs1,
                                   vfloat16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwnmacc_tumu(vbool4_t vm, vfloat32m8_t vd,
                                   vfloat16m4_t vs1, vfloat16m4_t vs2,
                                   size_t vl);
vfloat32m8_t __riscv_vfwnmacc_tumu(vbool4_t vm, vfloat32m8_t vd, _Float16 vs1,
                                   vfloat16m4_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwnmacc_tumu(vbool64_t vm, vfloat64m1_t vd,
                                   vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                   size_t vl);
vfloat64m1_t __riscv_vfwnmacc_tumu(vbool64_t vm, vfloat64m1_t vd, float vs1,
                                   vfloat32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwnmacc_tumu(vbool32_t vm, vfloat64m2_t vd,
                                   vfloat32m1_t vs1, vfloat32m1_t vs2,
                                   size_t vl);
vfloat64m2_t __riscv_vfwnmacc_tumu(vbool32_t vm, vfloat64m2_t vd, float vs1,
                                   vfloat32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwnmacc_tumu(vbool16_t vm, vfloat64m4_t vd,
                                   vfloat32m2_t vs1, vfloat32m2_t vs2,
                                   size_t vl);
vfloat64m4_t __riscv_vfwnmacc_tumu(vbool16_t vm, vfloat64m4_t vd, float vs1,
                                   vfloat32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwnmacc_tumu(vbool8_t vm, vfloat64m8_t vd,
                                   vfloat32m4_t vs1, vfloat32m4_t vs2,
                                   size_t vl);
vfloat64m8_t __riscv_vfwnmacc_tumu(vbool8_t vm, vfloat64m8_t vd, float vs1,
                                   vfloat32m4_t vs2, size_t vl);
// __riscv_vfwmsac_tumu: overloaded widening prototypes taking a mask. vm (a
// vboolN_t) comes first, followed by vd, which has the same type as the
// return value. vs1 and vs2 use the element type of half the width
// (float16 -> float32, float32 -> float64); vs1 is either a vector or a
// scalar (_Float16 / float).
// NOTE(review): presumably vd = (vs1 * vs2) - vd at the widened width, per
// the RVV "V" extension spec — confirm against the spec.
vfloat32mf2_t __riscv_vfwmsac_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                   size_t vl);
vfloat32mf2_t __riscv_vfwmsac_tumu(vbool64_t vm, vfloat32mf2_t vd, _Float16 vs1,
                                   vfloat16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwmsac_tumu(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                  size_t vl);
vfloat32m1_t __riscv_vfwmsac_tumu(vbool32_t vm, vfloat32m1_t vd, _Float16 vs1,
                                  vfloat16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwmsac_tumu(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat16m1_t vs1, vfloat16m1_t vs2,
                                  size_t vl);
vfloat32m2_t __riscv_vfwmsac_tumu(vbool16_t vm, vfloat32m2_t vd, _Float16 vs1,
                                  vfloat16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwmsac_tumu(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat16m2_t vs1, vfloat16m2_t vs2,
                                  size_t vl);
vfloat32m4_t __riscv_vfwmsac_tumu(vbool8_t vm, vfloat32m4_t vd, _Float16 vs1,
                                  vfloat16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwmsac_tumu(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat16m4_t vs1, vfloat16m4_t vs2,
                                  size_t vl);
vfloat32m8_t __riscv_vfwmsac_tumu(vbool4_t vm, vfloat32m8_t vd, _Float16 vs1,
                                  vfloat16m4_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwmsac_tumu(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                  size_t vl);
vfloat64m1_t __riscv_vfwmsac_tumu(vbool64_t vm, vfloat64m1_t vd, float vs1,
                                  vfloat32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwmsac_tumu(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat32m1_t vs1, vfloat32m1_t vs2,
                                  size_t vl);
vfloat64m2_t __riscv_vfwmsac_tumu(vbool32_t vm, vfloat64m2_t vd, float vs1,
                                  vfloat32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwmsac_tumu(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat32m2_t vs1, vfloat32m2_t vs2,
                                  size_t vl);
vfloat64m4_t __riscv_vfwmsac_tumu(vbool16_t vm, vfloat64m4_t vd, float vs1,
                                  vfloat32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwmsac_tumu(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat32m4_t vs1, vfloat32m4_t vs2,
                                  size_t vl);
vfloat64m8_t __riscv_vfwmsac_tumu(vbool8_t vm, vfloat64m8_t vd, float vs1,
                                  vfloat32m4_t vs2, size_t vl);
// __riscv_vfwnmsac_tumu: overloaded widening prototypes taking a mask. vm (a
// vboolN_t) comes first, followed by vd, which has the same type as the
// return value. vs1 and vs2 use the element type of half the width
// (float16 -> float32, float32 -> float64); vs1 is either a vector or a
// scalar (_Float16 / float).
// NOTE(review): presumably vd = -(vs1 * vs2) + vd at the widened width, per
// the RVV "V" extension spec — confirm against the spec.
vfloat32mf2_t __riscv_vfwnmsac_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                    vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                    size_t vl);
vfloat32mf2_t __riscv_vfwnmsac_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                    _Float16 vs1, vfloat16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwnmsac_tumu(vbool32_t vm, vfloat32m1_t vd,
                                   vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                   size_t vl);
vfloat32m1_t __riscv_vfwnmsac_tumu(vbool32_t vm, vfloat32m1_t vd, _Float16 vs1,
                                   vfloat16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwnmsac_tumu(vbool16_t vm, vfloat32m2_t vd,
                                   vfloat16m1_t vs1, vfloat16m1_t vs2,
                                   size_t vl);
vfloat32m2_t __riscv_vfwnmsac_tumu(vbool16_t vm, vfloat32m2_t vd, _Float16 vs1,
                                   vfloat16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwnmsac_tumu(vbool8_t vm, vfloat32m4_t vd,
                                   vfloat16m2_t vs1, vfloat16m2_t vs2,
                                   size_t vl);
vfloat32m4_t __riscv_vfwnmsac_tumu(vbool8_t vm, vfloat32m4_t vd, _Float16 vs1,
                                   vfloat16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwnmsac_tumu(vbool4_t vm, vfloat32m8_t vd,
                                   vfloat16m4_t vs1, vfloat16m4_t vs2,
                                   size_t vl);
vfloat32m8_t __riscv_vfwnmsac_tumu(vbool4_t vm, vfloat32m8_t vd, _Float16 vs1,
                                   vfloat16m4_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwnmsac_tumu(vbool64_t vm, vfloat64m1_t vd,
                                   vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                   size_t vl);
vfloat64m1_t __riscv_vfwnmsac_tumu(vbool64_t vm, vfloat64m1_t vd, float vs1,
                                   vfloat32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwnmsac_tumu(vbool32_t vm, vfloat64m2_t vd,
                                   vfloat32m1_t vs1, vfloat32m1_t vs2,
                                   size_t vl);
vfloat64m2_t __riscv_vfwnmsac_tumu(vbool32_t vm, vfloat64m2_t vd, float vs1,
                                   vfloat32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwnmsac_tumu(vbool16_t vm, vfloat64m4_t vd,
                                   vfloat32m2_t vs1, vfloat32m2_t vs2,
                                   size_t vl);
vfloat64m4_t __riscv_vfwnmsac_tumu(vbool16_t vm, vfloat64m4_t vd, float vs1,
                                   vfloat32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwnmsac_tumu(vbool8_t vm, vfloat64m8_t vd,
                                   vfloat32m4_t vs1, vfloat32m4_t vs2,
                                   size_t vl);
vfloat64m8_t __riscv_vfwnmsac_tumu(vbool8_t vm, vfloat64m8_t vd, float vs1,
                                   vfloat32m4_t vs2, size_t vl);
// masked functions (_mu policy variants)
// __riscv_vfwmacc_mu overloads: masked by vm, no rounding-mode argument.
// The return type matches vd, whose elements are twice as wide as those of
// vs2 (f16 -> f32, f32 -> f64). Each type combination appears twice: vs1 as a
// vector, then vs1 as a scalar (_Float16 or float).
// NOTE(review): per the RVV spec vfwmacc should compute
// vd = +(vs1 * vs2) + vd, and _mu should be the mask-undisturbed policy --
// confirm against the spec.
vfloat32mf2_t __riscv_vfwmacc_mu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                 size_t vl);
vfloat32mf2_t __riscv_vfwmacc_mu(vbool64_t vm, vfloat32mf2_t vd, _Float16 vs1,
                                 vfloat16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwmacc_mu(vbool32_t vm, vfloat32m1_t vd,
                                vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                size_t vl);
vfloat32m1_t __riscv_vfwmacc_mu(vbool32_t vm, vfloat32m1_t vd, _Float16 vs1,
                                vfloat16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwmacc_mu(vbool16_t vm, vfloat32m2_t vd, vfloat16m1_t vs1,
                                vfloat16m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwmacc_mu(vbool16_t vm, vfloat32m2_t vd, _Float16 vs1,
                                vfloat16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwmacc_mu(vbool8_t vm, vfloat32m4_t vd, vfloat16m2_t vs1,
                                vfloat16m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwmacc_mu(vbool8_t vm, vfloat32m4_t vd, _Float16 vs1,
                                vfloat16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwmacc_mu(vbool4_t vm, vfloat32m8_t vd, vfloat16m4_t vs1,
                                vfloat16m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwmacc_mu(vbool4_t vm, vfloat32m8_t vd, _Float16 vs1,
                                vfloat16m4_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwmacc_mu(vbool64_t vm, vfloat64m1_t vd,
                                vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                size_t vl);
vfloat64m1_t __riscv_vfwmacc_mu(vbool64_t vm, vfloat64m1_t vd, float vs1,
                                vfloat32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwmacc_mu(vbool32_t vm, vfloat64m2_t vd, vfloat32m1_t vs1,
                                vfloat32m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwmacc_mu(vbool32_t vm, vfloat64m2_t vd, float vs1,
                                vfloat32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwmacc_mu(vbool16_t vm, vfloat64m4_t vd, vfloat32m2_t vs1,
                                vfloat32m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwmacc_mu(vbool16_t vm, vfloat64m4_t vd, float vs1,
                                vfloat32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwmacc_mu(vbool8_t vm, vfloat64m8_t vd, vfloat32m4_t vs1,
                                vfloat32m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwmacc_mu(vbool8_t vm, vfloat64m8_t vd, float vs1,
                                vfloat32m4_t vs2, size_t vl);
// __riscv_vfwnmacc_mu overloads: masked by vm, no rounding-mode argument.
// The return type matches vd, whose elements are twice as wide as those of
// vs2 (f16 -> f32, f32 -> f64). Each type combination appears twice: vs1 as a
// vector, then vs1 as a scalar (_Float16 or float).
// NOTE(review): per the RVV spec vfwnmacc should compute
// vd = -(vs1 * vs2) - vd, and _mu should be the mask-undisturbed policy --
// confirm against the spec.
vfloat32mf2_t __riscv_vfwnmacc_mu(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                  size_t vl);
vfloat32mf2_t __riscv_vfwnmacc_mu(vbool64_t vm, vfloat32mf2_t vd, _Float16 vs1,
                                  vfloat16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwnmacc_mu(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                 size_t vl);
vfloat32m1_t __riscv_vfwnmacc_mu(vbool32_t vm, vfloat32m1_t vd, _Float16 vs1,
                                 vfloat16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwnmacc_mu(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat16m1_t vs1, vfloat16m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwnmacc_mu(vbool16_t vm, vfloat32m2_t vd, _Float16 vs1,
                                 vfloat16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwnmacc_mu(vbool8_t vm, vfloat32m4_t vd, vfloat16m2_t vs1,
                                 vfloat16m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwnmacc_mu(vbool8_t vm, vfloat32m4_t vd, _Float16 vs1,
                                 vfloat16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwnmacc_mu(vbool4_t vm, vfloat32m8_t vd, vfloat16m4_t vs1,
                                 vfloat16m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwnmacc_mu(vbool4_t vm, vfloat32m8_t vd, _Float16 vs1,
                                 vfloat16m4_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwnmacc_mu(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                 size_t vl);
vfloat64m1_t __riscv_vfwnmacc_mu(vbool64_t vm, vfloat64m1_t vd, float vs1,
                                 vfloat32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwnmacc_mu(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat32m1_t vs1, vfloat32m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwnmacc_mu(vbool32_t vm, vfloat64m2_t vd, float vs1,
                                 vfloat32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwnmacc_mu(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat32m2_t vs1, vfloat32m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwnmacc_mu(vbool16_t vm, vfloat64m4_t vd, float vs1,
                                 vfloat32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwnmacc_mu(vbool8_t vm, vfloat64m8_t vd, vfloat32m4_t vs1,
                                 vfloat32m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwnmacc_mu(vbool8_t vm, vfloat64m8_t vd, float vs1,
                                 vfloat32m4_t vs2, size_t vl);
// __riscv_vfwmsac_mu overloads: masked by vm, no rounding-mode argument.
// The return type matches vd, whose elements are twice as wide as those of
// vs2 (f16 -> f32, f32 -> f64). Each type combination appears twice: vs1 as a
// vector, then vs1 as a scalar (_Float16 or float).
// NOTE(review): per the RVV spec vfwmsac should compute
// vd = +(vs1 * vs2) - vd, and _mu should be the mask-undisturbed policy --
// confirm against the spec.
vfloat32mf2_t __riscv_vfwmsac_mu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                 size_t vl);
vfloat32mf2_t __riscv_vfwmsac_mu(vbool64_t vm, vfloat32mf2_t vd, _Float16 vs1,
                                 vfloat16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwmsac_mu(vbool32_t vm, vfloat32m1_t vd,
                                vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                size_t vl);
vfloat32m1_t __riscv_vfwmsac_mu(vbool32_t vm, vfloat32m1_t vd, _Float16 vs1,
                                vfloat16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwmsac_mu(vbool16_t vm, vfloat32m2_t vd, vfloat16m1_t vs1,
                                vfloat16m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwmsac_mu(vbool16_t vm, vfloat32m2_t vd, _Float16 vs1,
                                vfloat16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwmsac_mu(vbool8_t vm, vfloat32m4_t vd, vfloat16m2_t vs1,
                                vfloat16m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwmsac_mu(vbool8_t vm, vfloat32m4_t vd, _Float16 vs1,
                                vfloat16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwmsac_mu(vbool4_t vm, vfloat32m8_t vd, vfloat16m4_t vs1,
                                vfloat16m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwmsac_mu(vbool4_t vm, vfloat32m8_t vd, _Float16 vs1,
                                vfloat16m4_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwmsac_mu(vbool64_t vm, vfloat64m1_t vd,
                                vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                size_t vl);
vfloat64m1_t __riscv_vfwmsac_mu(vbool64_t vm, vfloat64m1_t vd, float vs1,
                                vfloat32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwmsac_mu(vbool32_t vm, vfloat64m2_t vd, vfloat32m1_t vs1,
                                vfloat32m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwmsac_mu(vbool32_t vm, vfloat64m2_t vd, float vs1,
                                vfloat32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwmsac_mu(vbool16_t vm, vfloat64m4_t vd, vfloat32m2_t vs1,
                                vfloat32m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwmsac_mu(vbool16_t vm, vfloat64m4_t vd, float vs1,
                                vfloat32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwmsac_mu(vbool8_t vm, vfloat64m8_t vd, vfloat32m4_t vs1,
                                vfloat32m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwmsac_mu(vbool8_t vm, vfloat64m8_t vd, float vs1,
                                vfloat32m4_t vs2, size_t vl);
// __riscv_vfwnmsac_mu overloads: masked by vm, no rounding-mode argument.
// The return type matches vd, whose elements are twice as wide as those of
// vs2 (f16 -> f32, f32 -> f64). Each type combination appears twice: vs1 as a
// vector, then vs1 as a scalar (_Float16 or float).
// NOTE(review): per the RVV spec vfwnmsac should compute
// vd = -(vs1 * vs2) + vd, and _mu should be the mask-undisturbed policy --
// confirm against the spec.
vfloat32mf2_t __riscv_vfwnmsac_mu(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                  size_t vl);
vfloat32mf2_t __riscv_vfwnmsac_mu(vbool64_t vm, vfloat32mf2_t vd, _Float16 vs1,
                                  vfloat16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwnmsac_mu(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                 size_t vl);
vfloat32m1_t __riscv_vfwnmsac_mu(vbool32_t vm, vfloat32m1_t vd, _Float16 vs1,
                                 vfloat16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwnmsac_mu(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat16m1_t vs1, vfloat16m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwnmsac_mu(vbool16_t vm, vfloat32m2_t vd, _Float16 vs1,
                                 vfloat16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwnmsac_mu(vbool8_t vm, vfloat32m4_t vd, vfloat16m2_t vs1,
                                 vfloat16m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwnmsac_mu(vbool8_t vm, vfloat32m4_t vd, _Float16 vs1,
                                 vfloat16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwnmsac_mu(vbool4_t vm, vfloat32m8_t vd, vfloat16m4_t vs1,
                                 vfloat16m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwnmsac_mu(vbool4_t vm, vfloat32m8_t vd, _Float16 vs1,
                                 vfloat16m4_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwnmsac_mu(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                 size_t vl);
vfloat64m1_t __riscv_vfwnmsac_mu(vbool64_t vm, vfloat64m1_t vd, float vs1,
                                 vfloat32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwnmsac_mu(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat32m1_t vs1, vfloat32m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwnmsac_mu(vbool32_t vm, vfloat64m2_t vd, float vs1,
                                 vfloat32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwnmsac_mu(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat32m2_t vs1, vfloat32m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwnmsac_mu(vbool16_t vm, vfloat64m4_t vd, float vs1,
                                 vfloat32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwnmsac_mu(vbool8_t vm, vfloat64m8_t vd, vfloat32m4_t vs1,
                                 vfloat32m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwnmsac_mu(vbool8_t vm, vfloat64m8_t vd, float vs1,
                                 vfloat32m4_t vs2, size_t vl);
// __riscv_vfwmacc_tu overloads with an explicit rounding-mode argument:
// unmasked (no vm parameter), with `unsigned int frm` placed just before vl.
// The return type matches vd, whose elements are twice as wide as those of
// vs2 (f16 -> f32, f32 -> f64). Each type combination appears twice: vs1 as a
// vector, then vs1 as a scalar (_Float16 or float).
// NOTE(review): per the RVV spec vfwmacc should compute
// vd = +(vs1 * vs2) + vd, _tu should be the tail-undisturbed policy, and frm
// presumably takes a floating-point rounding-mode value -- confirm.
vfloat32mf2_t __riscv_vfwmacc_tu(vfloat32mf2_t vd, vfloat16mf4_t vs1,
                                 vfloat16mf4_t vs2, unsigned int frm,
                                 size_t vl);
vfloat32mf2_t __riscv_vfwmacc_tu(vfloat32mf2_t vd, _Float16 vs1,
                                 vfloat16mf4_t vs2, unsigned int frm,
                                 size_t vl);
vfloat32m1_t __riscv_vfwmacc_tu(vfloat32m1_t vd, vfloat16mf2_t vs1,
                                vfloat16mf2_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmacc_tu(vfloat32m1_t vd, _Float16 vs1,
                                vfloat16mf2_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmacc_tu(vfloat32m2_t vd, vfloat16m1_t vs1,
                                vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmacc_tu(vfloat32m2_t vd, _Float16 vs1, vfloat16m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmacc_tu(vfloat32m4_t vd, vfloat16m2_t vs1,
                                vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmacc_tu(vfloat32m4_t vd, _Float16 vs1, vfloat16m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmacc_tu(vfloat32m8_t vd, vfloat16m4_t vs1,
                                vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmacc_tu(vfloat32m8_t vd, _Float16 vs1, vfloat16m4_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmacc_tu(vfloat64m1_t vd, vfloat32mf2_t vs1,
                                vfloat32mf2_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmacc_tu(vfloat64m1_t vd, float vs1, vfloat32mf2_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmacc_tu(vfloat64m2_t vd, vfloat32m1_t vs1,
                                vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmacc_tu(vfloat64m2_t vd, float vs1, vfloat32m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmacc_tu(vfloat64m4_t vd, vfloat32m2_t vs1,
                                vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmacc_tu(vfloat64m4_t vd, float vs1, vfloat32m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmacc_tu(vfloat64m8_t vd, vfloat32m4_t vs1,
                                vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmacc_tu(vfloat64m8_t vd, float vs1, vfloat32m4_t vs2,
                                unsigned int frm, size_t vl);
// __riscv_vfwnmacc_tu overloads with an explicit rounding-mode argument:
// unmasked (no vm parameter), with `unsigned int frm` placed just before vl.
// The return type matches vd, whose elements are twice as wide as those of
// vs2 (f16 -> f32, f32 -> f64). Each type combination appears twice: vs1 as a
// vector, then vs1 as a scalar (_Float16 or float).
// NOTE(review): per the RVV spec vfwnmacc should compute
// vd = -(vs1 * vs2) - vd, and _tu should be the tail-undisturbed policy --
// confirm against the spec.
vfloat32mf2_t __riscv_vfwnmacc_tu(vfloat32mf2_t vd, vfloat16mf4_t vs1,
                                  vfloat16mf4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32mf2_t __riscv_vfwnmacc_tu(vfloat32mf2_t vd, _Float16 vs1,
                                  vfloat16mf4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m1_t __riscv_vfwnmacc_tu(vfloat32m1_t vd, vfloat16mf2_t vs1,
                                 vfloat16mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat32m1_t __riscv_vfwnmacc_tu(vfloat32m1_t vd, _Float16 vs1,
                                 vfloat16mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat32m2_t __riscv_vfwnmacc_tu(vfloat32m2_t vd, vfloat16m1_t vs1,
                                 vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwnmacc_tu(vfloat32m2_t vd, _Float16 vs1,
                                 vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwnmacc_tu(vfloat32m4_t vd, vfloat16m2_t vs1,
                                 vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwnmacc_tu(vfloat32m4_t vd, _Float16 vs1,
                                 vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwnmacc_tu(vfloat32m8_t vd, vfloat16m4_t vs1,
                                 vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwnmacc_tu(vfloat32m8_t vd, _Float16 vs1,
                                 vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwnmacc_tu(vfloat64m1_t vd, vfloat32mf2_t vs1,
                                 vfloat32mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat64m1_t __riscv_vfwnmacc_tu(vfloat64m1_t vd, float vs1, vfloat32mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwnmacc_tu(vfloat64m2_t vd, vfloat32m1_t vs1,
                                 vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwnmacc_tu(vfloat64m2_t vd, float vs1, vfloat32m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwnmacc_tu(vfloat64m4_t vd, vfloat32m2_t vs1,
                                 vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwnmacc_tu(vfloat64m4_t vd, float vs1, vfloat32m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwnmacc_tu(vfloat64m8_t vd, vfloat32m4_t vs1,
                                 vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwnmacc_tu(vfloat64m8_t vd, float vs1, vfloat32m4_t vs2,
                                 unsigned int frm, size_t vl);
// __riscv_vfwmsac_tu overloads with an explicit rounding-mode argument:
// unmasked (no vm parameter), with `unsigned int frm` placed just before vl.
// The return type matches vd, whose elements are twice as wide as those of
// vs2 (f16 -> f32, f32 -> f64). Each type combination appears twice: vs1 as a
// vector, then vs1 as a scalar (_Float16 or float).
// NOTE(review): per the RVV spec vfwmsac should compute
// vd = +(vs1 * vs2) - vd, and _tu should be the tail-undisturbed policy --
// confirm against the spec.
vfloat32mf2_t __riscv_vfwmsac_tu(vfloat32mf2_t vd, vfloat16mf4_t vs1,
                                 vfloat16mf4_t vs2, unsigned int frm,
                                 size_t vl);
vfloat32mf2_t __riscv_vfwmsac_tu(vfloat32mf2_t vd, _Float16 vs1,
                                 vfloat16mf4_t vs2, unsigned int frm,
                                 size_t vl);
vfloat32m1_t __riscv_vfwmsac_tu(vfloat32m1_t vd, vfloat16mf2_t vs1,
                                vfloat16mf2_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmsac_tu(vfloat32m1_t vd, _Float16 vs1,
                                vfloat16mf2_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmsac_tu(vfloat32m2_t vd, vfloat16m1_t vs1,
                                vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmsac_tu(vfloat32m2_t vd, _Float16 vs1, vfloat16m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmsac_tu(vfloat32m4_t vd, vfloat16m2_t vs1,
                                vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmsac_tu(vfloat32m4_t vd, _Float16 vs1, vfloat16m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmsac_tu(vfloat32m8_t vd, vfloat16m4_t vs1,
                                vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmsac_tu(vfloat32m8_t vd, _Float16 vs1, vfloat16m4_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmsac_tu(vfloat64m1_t vd, vfloat32mf2_t vs1,
                                vfloat32mf2_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmsac_tu(vfloat64m1_t vd, float vs1, vfloat32mf2_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmsac_tu(vfloat64m2_t vd, vfloat32m1_t vs1,
                                vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmsac_tu(vfloat64m2_t vd, float vs1, vfloat32m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmsac_tu(vfloat64m4_t vd, vfloat32m2_t vs1,
                                vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmsac_tu(vfloat64m4_t vd, float vs1, vfloat32m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmsac_tu(vfloat64m8_t vd, vfloat32m4_t vs1,
                                vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmsac_tu(vfloat64m8_t vd, float vs1, vfloat32m4_t vs2,
                                unsigned int frm, size_t vl);
// __riscv_vfwnmsac_tu overloads with an explicit rounding-mode argument:
// unmasked (no vm parameter), with `unsigned int frm` placed just before vl.
// The return type matches vd, whose elements are twice as wide as those of
// vs2 (f16 -> f32, f32 -> f64). Each type combination appears twice: vs1 as a
// vector, then vs1 as a scalar (_Float16 or float).
// NOTE(review): per the RVV spec vfwnmsac should compute
// vd = -(vs1 * vs2) + vd, and _tu should be the tail-undisturbed policy --
// confirm against the spec.
vfloat32mf2_t __riscv_vfwnmsac_tu(vfloat32mf2_t vd, vfloat16mf4_t vs1,
                                  vfloat16mf4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32mf2_t __riscv_vfwnmsac_tu(vfloat32mf2_t vd, _Float16 vs1,
                                  vfloat16mf4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m1_t __riscv_vfwnmsac_tu(vfloat32m1_t vd, vfloat16mf2_t vs1,
                                 vfloat16mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat32m1_t __riscv_vfwnmsac_tu(vfloat32m1_t vd, _Float16 vs1,
                                 vfloat16mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat32m2_t __riscv_vfwnmsac_tu(vfloat32m2_t vd, vfloat16m1_t vs1,
                                 vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwnmsac_tu(vfloat32m2_t vd, _Float16 vs1,
                                 vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwnmsac_tu(vfloat32m4_t vd, vfloat16m2_t vs1,
                                 vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwnmsac_tu(vfloat32m4_t vd, _Float16 vs1,
                                 vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwnmsac_tu(vfloat32m8_t vd, vfloat16m4_t vs1,
                                 vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwnmsac_tu(vfloat32m8_t vd, _Float16 vs1,
                                 vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwnmsac_tu(vfloat64m1_t vd, vfloat32mf2_t vs1,
                                 vfloat32mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat64m1_t __riscv_vfwnmsac_tu(vfloat64m1_t vd, float vs1, vfloat32mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwnmsac_tu(vfloat64m2_t vd, vfloat32m1_t vs1,
                                 vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwnmsac_tu(vfloat64m2_t vd, float vs1, vfloat32m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwnmsac_tu(vfloat64m4_t vd, vfloat32m2_t vs1,
                                 vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwnmsac_tu(vfloat64m4_t vd, float vs1, vfloat32m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwnmsac_tu(vfloat64m8_t vd, vfloat32m4_t vs1,
                                 vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwnmsac_tu(vfloat64m8_t vd, float vs1, vfloat32m4_t vs2,
                                 unsigned int frm, size_t vl);
// masked functions (_tum policy variants with explicit rounding mode frm)
// __riscv_vfwmacc_tum overloads with an explicit rounding-mode argument:
// masked by vm, with `unsigned int frm` placed just before vl.
// The return type matches vd, whose elements are twice as wide as those of
// vs2 (f16 -> f32, f32 -> f64). Each type combination appears twice: vs1 as a
// vector, then vs1 as a scalar (_Float16 or float).
// NOTE(review): per the RVV spec vfwmacc should compute
// vd = +(vs1 * vs2) + vd, and _tum should be the tail-undisturbed,
// mask-agnostic policy -- confirm against the spec.
vfloat32mf2_t __riscv_vfwmacc_tum(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwmacc_tum(vbool64_t vm, vfloat32mf2_t vd, _Float16 vs1,
                                  vfloat16mf4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m1_t __riscv_vfwmacc_tum(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmacc_tum(vbool32_t vm, vfloat32m1_t vd, _Float16 vs1,
                                 vfloat16mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat32m2_t __riscv_vfwmacc_tum(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat16m1_t vs1, vfloat16m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmacc_tum(vbool16_t vm, vfloat32m2_t vd, _Float16 vs1,
                                 vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmacc_tum(vbool8_t vm, vfloat32m4_t vd, vfloat16m2_t vs1,
                                 vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmacc_tum(vbool8_t vm, vfloat32m4_t vd, _Float16 vs1,
                                 vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmacc_tum(vbool4_t vm, vfloat32m8_t vd, vfloat16m4_t vs1,
                                 vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmacc_tum(vbool4_t vm, vfloat32m8_t vd, _Float16 vs1,
                                 vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmacc_tum(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmacc_tum(vbool64_t vm, vfloat64m1_t vd, float vs1,
                                 vfloat32mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat64m2_t __riscv_vfwmacc_tum(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat32m1_t vs1, vfloat32m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmacc_tum(vbool32_t vm, vfloat64m2_t vd, float vs1,
                                 vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmacc_tum(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat32m2_t vs1, vfloat32m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmacc_tum(vbool16_t vm, vfloat64m4_t vd, float vs1,
                                 vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmacc_tum(vbool8_t vm, vfloat64m8_t vd, vfloat32m4_t vs1,
                                 vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmacc_tum(vbool8_t vm, vfloat64m8_t vd, float vs1,
                                 vfloat32m4_t vs2, unsigned int frm, size_t vl);
// __riscv_vfwnmacc_tum overloads with an explicit rounding-mode argument:
// masked by vm, with `unsigned int frm` placed just before vl.
// The return type matches vd, whose elements are twice as wide as those of
// vs2 (f16 -> f32, f32 -> f64). Each type combination appears twice: vs1 as a
// vector, then vs1 as a scalar (_Float16 or float).
// NOTE(review): per the RVV spec vfwnmacc should compute
// vd = -(vs1 * vs2) - vd, and _tum should be the tail-undisturbed,
// mask-agnostic policy -- confirm against the spec.
vfloat32mf2_t __riscv_vfwnmacc_tum(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                   unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwnmacc_tum(vbool64_t vm, vfloat32mf2_t vd, _Float16 vs1,
                                   vfloat16mf4_t vs2, unsigned int frm,
                                   size_t vl);
vfloat32m1_t __riscv_vfwnmacc_tum(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwnmacc_tum(vbool32_t vm, vfloat32m1_t vd, _Float16 vs1,
                                  vfloat16mf2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m2_t __riscv_vfwnmacc_tum(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat16m1_t vs1, vfloat16m1_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwnmacc_tum(vbool16_t vm, vfloat32m2_t vd, _Float16 vs1,
                                  vfloat16m1_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m4_t __riscv_vfwnmacc_tum(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat16m2_t vs1, vfloat16m2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwnmacc_tum(vbool8_t vm, vfloat32m4_t vd, _Float16 vs1,
                                  vfloat16m2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m8_t __riscv_vfwnmacc_tum(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat16m4_t vs1, vfloat16m4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwnmacc_tum(vbool4_t vm, vfloat32m8_t vd, _Float16 vs1,
                                  vfloat16m4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat64m1_t __riscv_vfwnmacc_tum(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwnmacc_tum(vbool64_t vm, vfloat64m1_t vd, float vs1,
                                  vfloat32mf2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat64m2_t __riscv_vfwnmacc_tum(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat32m1_t vs1, vfloat32m1_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwnmacc_tum(vbool32_t vm, vfloat64m2_t vd, float vs1,
                                  vfloat32m1_t vs2, unsigned int frm,
                                  size_t vl);
vfloat64m4_t __riscv_vfwnmacc_tum(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat32m2_t vs1, vfloat32m2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwnmacc_tum(vbool16_t vm, vfloat64m4_t vd, float vs1,
                                  vfloat32m2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat64m8_t __riscv_vfwnmacc_tum(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat32m4_t vs1, vfloat32m4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwnmacc_tum(vbool8_t vm, vfloat64m8_t vd, float vs1,
                                  vfloat32m4_t vs2, unsigned int frm,
                                  size_t vl);
// __riscv_vfwmsac_tum overloads with an explicit rounding-mode argument:
// masked by vm, with `unsigned int frm` placed just before vl.
// The return type matches vd, whose elements are twice as wide as those of
// vs2 (f16 -> f32, f32 -> f64). Each type combination appears twice: vs1 as a
// vector, then vs1 as a scalar (_Float16 or float).
// NOTE(review): per the RVV spec vfwmsac should compute
// vd = +(vs1 * vs2) - vd, and _tum should be the tail-undisturbed,
// mask-agnostic policy -- confirm against the spec.
vfloat32mf2_t __riscv_vfwmsac_tum(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwmsac_tum(vbool64_t vm, vfloat32mf2_t vd, _Float16 vs1,
                                  vfloat16mf4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m1_t __riscv_vfwmsac_tum(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmsac_tum(vbool32_t vm, vfloat32m1_t vd, _Float16 vs1,
                                 vfloat16mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat32m2_t __riscv_vfwmsac_tum(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat16m1_t vs1, vfloat16m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmsac_tum(vbool16_t vm, vfloat32m2_t vd, _Float16 vs1,
                                 vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmsac_tum(vbool8_t vm, vfloat32m4_t vd, vfloat16m2_t vs1,
                                 vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmsac_tum(vbool8_t vm, vfloat32m4_t vd, _Float16 vs1,
                                 vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmsac_tum(vbool4_t vm, vfloat32m8_t vd, vfloat16m4_t vs1,
                                 vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmsac_tum(vbool4_t vm, vfloat32m8_t vd, _Float16 vs1,
                                 vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmsac_tum(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmsac_tum(vbool64_t vm, vfloat64m1_t vd, float vs1,
                                 vfloat32mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat64m2_t __riscv_vfwmsac_tum(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat32m1_t vs1, vfloat32m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmsac_tum(vbool32_t vm, vfloat64m2_t vd, float vs1,
                                 vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmsac_tum(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat32m2_t vs1, vfloat32m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmsac_tum(vbool16_t vm, vfloat64m4_t vd, float vs1,
                                 vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmsac_tum(vbool8_t vm, vfloat64m8_t vd, vfloat32m4_t vs1,
                                 vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmsac_tum(vbool8_t vm, vfloat64m8_t vd, float vs1,
                                 vfloat32m4_t vs2, unsigned int frm, size_t vl);
// __riscv_vfwnmsac_tum overloads with an explicit rounding-mode argument:
// masked by vm, with `unsigned int frm` placed just before vl.
// The return type matches vd, whose elements are twice as wide as those of
// vs2 (f16 -> f32, f32 -> f64). Each type combination appears twice: vs1 as a
// vector, then vs1 as a scalar (_Float16 or float).
// NOTE(review): per the RVV spec vfwnmsac should compute
// vd = -(vs1 * vs2) + vd, and _tum should be the tail-undisturbed,
// mask-agnostic policy -- confirm against the spec.
vfloat32mf2_t __riscv_vfwnmsac_tum(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                   unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwnmsac_tum(vbool64_t vm, vfloat32mf2_t vd, _Float16 vs1,
                                   vfloat16mf4_t vs2, unsigned int frm,
                                   size_t vl);
vfloat32m1_t __riscv_vfwnmsac_tum(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwnmsac_tum(vbool32_t vm, vfloat32m1_t vd, _Float16 vs1,
                                  vfloat16mf2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m2_t __riscv_vfwnmsac_tum(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat16m1_t vs1, vfloat16m1_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwnmsac_tum(vbool16_t vm, vfloat32m2_t vd, _Float16 vs1,
                                  vfloat16m1_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m4_t __riscv_vfwnmsac_tum(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat16m2_t vs1, vfloat16m2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwnmsac_tum(vbool8_t vm, vfloat32m4_t vd, _Float16 vs1,
                                  vfloat16m2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m8_t __riscv_vfwnmsac_tum(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat16m4_t vs1, vfloat16m4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwnmsac_tum(vbool4_t vm, vfloat32m8_t vd, _Float16 vs1,
                                  vfloat16m4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat64m1_t __riscv_vfwnmsac_tum(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwnmsac_tum(vbool64_t vm, vfloat64m1_t vd, float vs1,
                                  vfloat32mf2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat64m2_t __riscv_vfwnmsac_tum(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat32m1_t vs1, vfloat32m1_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwnmsac_tum(vbool32_t vm, vfloat64m2_t vd, float vs1,
                                  vfloat32m1_t vs2, unsigned int frm,
                                  size_t vl);
vfloat64m4_t __riscv_vfwnmsac_tum(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat32m2_t vs1, vfloat32m2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwnmsac_tum(vbool16_t vm, vfloat64m4_t vd, float vs1,
                                  vfloat32m2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat64m8_t __riscv_vfwnmsac_tum(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat32m4_t vs1, vfloat32m4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwnmsac_tum(vbool8_t vm, vfloat64m8_t vd, float vs1,
                                  vfloat32m4_t vs2, unsigned int frm,
                                  size_t vl);
// masked functions: __riscv_vfwmacc_tumu overloads taking an explicit `frm`.
// Results range from vfloat32mf2_t to vfloat64m8_t; vd has the same type as the
// return value, and vs1/vs2 use the element type half as wide (f16 sources for
// f32 results, f32 sources for f64 results). Each result type is declared
// twice: vs1 as a vector, then vs1 as a scalar (_Float16 or float).
// NOTE(review): the scalar operand is named `vs1` here, whereas the scalar
// overloads of __riscv_vfadd_tu earlier in this file use `rs1`.
// NOTE(review): `frm` is presumably the rounding-mode operand and `_tumu` the
// policy suffix -- confirm both against the RVV intrinsics specification.
vfloat32mf2_t __riscv_vfwmacc_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                   unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwmacc_tumu(vbool64_t vm, vfloat32mf2_t vd, _Float16 vs1,
                                   vfloat16mf4_t vs2, unsigned int frm,
                                   size_t vl);
vfloat32m1_t __riscv_vfwmacc_tumu(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmacc_tumu(vbool32_t vm, vfloat32m1_t vd, _Float16 vs1,
                                  vfloat16mf2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m2_t __riscv_vfwmacc_tumu(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat16m1_t vs1, vfloat16m1_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmacc_tumu(vbool16_t vm, vfloat32m2_t vd, _Float16 vs1,
                                  vfloat16m1_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m4_t __riscv_vfwmacc_tumu(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat16m2_t vs1, vfloat16m2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmacc_tumu(vbool8_t vm, vfloat32m4_t vd, _Float16 vs1,
                                  vfloat16m2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m8_t __riscv_vfwmacc_tumu(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat16m4_t vs1, vfloat16m4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmacc_tumu(vbool4_t vm, vfloat32m8_t vd, _Float16 vs1,
                                  vfloat16m4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat64m1_t __riscv_vfwmacc_tumu(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmacc_tumu(vbool64_t vm, vfloat64m1_t vd, float vs1,
                                  vfloat32mf2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat64m2_t __riscv_vfwmacc_tumu(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat32m1_t vs1, vfloat32m1_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmacc_tumu(vbool32_t vm, vfloat64m2_t vd, float vs1,
                                  vfloat32m1_t vs2, unsigned int frm,
                                  size_t vl);
vfloat64m4_t __riscv_vfwmacc_tumu(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat32m2_t vs1, vfloat32m2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmacc_tumu(vbool16_t vm, vfloat64m4_t vd, float vs1,
                                  vfloat32m2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat64m8_t __riscv_vfwmacc_tumu(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat32m4_t vs1, vfloat32m4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmacc_tumu(vbool8_t vm, vfloat64m8_t vd, float vs1,
                                  vfloat32m4_t vs2, unsigned int frm,
                                  size_t vl);
// __riscv_vfwnmacc_tumu overloads (masked, explicit `frm`).
// Results range from vfloat32mf2_t to vfloat64m8_t; vd has the same type as the
// return value, and vs1/vs2 use the element type half as wide. Each result
// type is declared twice: vs1 as a vector, then vs1 as a scalar (_Float16 or
// float).
// NOTE(review): the scalar operand is named `vs1` here, whereas the scalar
// overloads of __riscv_vfadd_tu earlier in this file use `rs1`.
vfloat32mf2_t __riscv_vfwnmacc_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                    vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                    unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwnmacc_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                    _Float16 vs1, vfloat16mf4_t vs2,
                                    unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwnmacc_tumu(vbool32_t vm, vfloat32m1_t vd,
                                   vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwnmacc_tumu(vbool32_t vm, vfloat32m1_t vd, _Float16 vs1,
                                   vfloat16mf2_t vs2, unsigned int frm,
                                   size_t vl);
vfloat32m2_t __riscv_vfwnmacc_tumu(vbool16_t vm, vfloat32m2_t vd,
                                   vfloat16m1_t vs1, vfloat16m1_t vs2,
                                   unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwnmacc_tumu(vbool16_t vm, vfloat32m2_t vd, _Float16 vs1,
                                   vfloat16m1_t vs2, unsigned int frm,
                                   size_t vl);
vfloat32m4_t __riscv_vfwnmacc_tumu(vbool8_t vm, vfloat32m4_t vd,
                                   vfloat16m2_t vs1, vfloat16m2_t vs2,
                                   unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwnmacc_tumu(vbool8_t vm, vfloat32m4_t vd, _Float16 vs1,
                                   vfloat16m2_t vs2, unsigned int frm,
                                   size_t vl);
vfloat32m8_t __riscv_vfwnmacc_tumu(vbool4_t vm, vfloat32m8_t vd,
                                   vfloat16m4_t vs1, vfloat16m4_t vs2,
                                   unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwnmacc_tumu(vbool4_t vm, vfloat32m8_t vd, _Float16 vs1,
                                   vfloat16m4_t vs2, unsigned int frm,
                                   size_t vl);
vfloat64m1_t __riscv_vfwnmacc_tumu(vbool64_t vm, vfloat64m1_t vd,
                                   vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                   unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwnmacc_tumu(vbool64_t vm, vfloat64m1_t vd, float vs1,
                                   vfloat32mf2_t vs2, unsigned int frm,
                                   size_t vl);
vfloat64m2_t __riscv_vfwnmacc_tumu(vbool32_t vm, vfloat64m2_t vd,
                                   vfloat32m1_t vs1, vfloat32m1_t vs2,
                                   unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwnmacc_tumu(vbool32_t vm, vfloat64m2_t vd, float vs1,
                                   vfloat32m1_t vs2, unsigned int frm,
                                   size_t vl);
vfloat64m4_t __riscv_vfwnmacc_tumu(vbool16_t vm, vfloat64m4_t vd,
                                   vfloat32m2_t vs1, vfloat32m2_t vs2,
                                   unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwnmacc_tumu(vbool16_t vm, vfloat64m4_t vd, float vs1,
                                   vfloat32m2_t vs2, unsigned int frm,
                                   size_t vl);
vfloat64m8_t __riscv_vfwnmacc_tumu(vbool8_t vm, vfloat64m8_t vd,
                                   vfloat32m4_t vs1, vfloat32m4_t vs2,
                                   unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwnmacc_tumu(vbool8_t vm, vfloat64m8_t vd, float vs1,
                                   vfloat32m4_t vs2, unsigned int frm,
                                   size_t vl);
// __riscv_vfwmsac_tumu overloads (masked, explicit `frm`).
// Results range from vfloat32mf2_t to vfloat64m8_t; vd has the same type as the
// return value, and vs1/vs2 use the element type half as wide. Each result
// type is declared twice: vs1 as a vector, then vs1 as a scalar (_Float16 or
// float).
// NOTE(review): the scalar operand is named `vs1` here, whereas the scalar
// overloads of __riscv_vfadd_tu earlier in this file use `rs1`.
vfloat32mf2_t __riscv_vfwmsac_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                   unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwmsac_tumu(vbool64_t vm, vfloat32mf2_t vd, _Float16 vs1,
                                   vfloat16mf4_t vs2, unsigned int frm,
                                   size_t vl);
vfloat32m1_t __riscv_vfwmsac_tumu(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmsac_tumu(vbool32_t vm, vfloat32m1_t vd, _Float16 vs1,
                                  vfloat16mf2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m2_t __riscv_vfwmsac_tumu(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat16m1_t vs1, vfloat16m1_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmsac_tumu(vbool16_t vm, vfloat32m2_t vd, _Float16 vs1,
                                  vfloat16m1_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m4_t __riscv_vfwmsac_tumu(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat16m2_t vs1, vfloat16m2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmsac_tumu(vbool8_t vm, vfloat32m4_t vd, _Float16 vs1,
                                  vfloat16m2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m8_t __riscv_vfwmsac_tumu(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat16m4_t vs1, vfloat16m4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmsac_tumu(vbool4_t vm, vfloat32m8_t vd, _Float16 vs1,
                                  vfloat16m4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat64m1_t __riscv_vfwmsac_tumu(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmsac_tumu(vbool64_t vm, vfloat64m1_t vd, float vs1,
                                  vfloat32mf2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat64m2_t __riscv_vfwmsac_tumu(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat32m1_t vs1, vfloat32m1_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmsac_tumu(vbool32_t vm, vfloat64m2_t vd, float vs1,
                                  vfloat32m1_t vs2, unsigned int frm,
                                  size_t vl);
vfloat64m4_t __riscv_vfwmsac_tumu(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat32m2_t vs1, vfloat32m2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmsac_tumu(vbool16_t vm, vfloat64m4_t vd, float vs1,
                                  vfloat32m2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat64m8_t __riscv_vfwmsac_tumu(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat32m4_t vs1, vfloat32m4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmsac_tumu(vbool8_t vm, vfloat64m8_t vd, float vs1,
                                  vfloat32m4_t vs2, unsigned int frm,
                                  size_t vl);
// __riscv_vfwnmsac_tumu overloads (masked, explicit `frm`).
// Results range from vfloat32mf2_t to vfloat64m8_t; vd has the same type as the
// return value, and vs1/vs2 use the element type half as wide. Each result
// type is declared twice: vs1 as a vector, then vs1 as a scalar (_Float16 or
// float).
// NOTE(review): the scalar operand is named `vs1` here, whereas the scalar
// overloads of __riscv_vfadd_tu earlier in this file use `rs1`.
vfloat32mf2_t __riscv_vfwnmsac_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                    vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                    unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwnmsac_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                    _Float16 vs1, vfloat16mf4_t vs2,
                                    unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwnmsac_tumu(vbool32_t vm, vfloat32m1_t vd,
                                   vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwnmsac_tumu(vbool32_t vm, vfloat32m1_t vd, _Float16 vs1,
                                   vfloat16mf2_t vs2, unsigned int frm,
                                   size_t vl);
vfloat32m2_t __riscv_vfwnmsac_tumu(vbool16_t vm, vfloat32m2_t vd,
                                   vfloat16m1_t vs1, vfloat16m1_t vs2,
                                   unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwnmsac_tumu(vbool16_t vm, vfloat32m2_t vd, _Float16 vs1,
                                   vfloat16m1_t vs2, unsigned int frm,
                                   size_t vl);
vfloat32m4_t __riscv_vfwnmsac_tumu(vbool8_t vm, vfloat32m4_t vd,
                                   vfloat16m2_t vs1, vfloat16m2_t vs2,
                                   unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwnmsac_tumu(vbool8_t vm, vfloat32m4_t vd, _Float16 vs1,
                                   vfloat16m2_t vs2, unsigned int frm,
                                   size_t vl);
vfloat32m8_t __riscv_vfwnmsac_tumu(vbool4_t vm, vfloat32m8_t vd,
                                   vfloat16m4_t vs1, vfloat16m4_t vs2,
                                   unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwnmsac_tumu(vbool4_t vm, vfloat32m8_t vd, _Float16 vs1,
                                   vfloat16m4_t vs2, unsigned int frm,
                                   size_t vl);
vfloat64m1_t __riscv_vfwnmsac_tumu(vbool64_t vm, vfloat64m1_t vd,
                                   vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                   unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwnmsac_tumu(vbool64_t vm, vfloat64m1_t vd, float vs1,
                                   vfloat32mf2_t vs2, unsigned int frm,
                                   size_t vl);
vfloat64m2_t __riscv_vfwnmsac_tumu(vbool32_t vm, vfloat64m2_t vd,
                                   vfloat32m1_t vs1, vfloat32m1_t vs2,
                                   unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwnmsac_tumu(vbool32_t vm, vfloat64m2_t vd, float vs1,
                                   vfloat32m1_t vs2, unsigned int frm,
                                   size_t vl);
vfloat64m4_t __riscv_vfwnmsac_tumu(vbool16_t vm, vfloat64m4_t vd,
                                   vfloat32m2_t vs1, vfloat32m2_t vs2,
                                   unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwnmsac_tumu(vbool16_t vm, vfloat64m4_t vd, float vs1,
                                   vfloat32m2_t vs2, unsigned int frm,
                                   size_t vl);
vfloat64m8_t __riscv_vfwnmsac_tumu(vbool8_t vm, vfloat64m8_t vd,
                                   vfloat32m4_t vs1, vfloat32m4_t vs2,
                                   unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwnmsac_tumu(vbool8_t vm, vfloat64m8_t vd, float vs1,
                                   vfloat32m4_t vs2, unsigned int frm,
                                   size_t vl);
// masked functions: __riscv_vfwmacc_mu overloads taking an explicit `frm`.
// Results range from vfloat32mf2_t to vfloat64m8_t; vd has the same type as the
// return value, and vs1/vs2 use the element type half as wide (f16 sources for
// f32 results, f32 sources for f64 results). Each result type is declared
// twice: vs1 as a vector, then vs1 as a scalar (_Float16 or float).
// NOTE(review): the scalar operand is named `vs1` here, whereas the scalar
// overloads of __riscv_vfadd_tu earlier in this file use `rs1`.
// NOTE(review): `frm` is presumably the rounding-mode operand and `_mu` the
// policy suffix -- confirm both against the RVV intrinsics specification.
vfloat32mf2_t __riscv_vfwmacc_mu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwmacc_mu(vbool64_t vm, vfloat32mf2_t vd, _Float16 vs1,
                                 vfloat16mf4_t vs2, unsigned int frm,
                                 size_t vl);
vfloat32m1_t __riscv_vfwmacc_mu(vbool32_t vm, vfloat32m1_t vd,
                                vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmacc_mu(vbool32_t vm, vfloat32m1_t vd, _Float16 vs1,
                                vfloat16mf2_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmacc_mu(vbool16_t vm, vfloat32m2_t vd, vfloat16m1_t vs1,
                                vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmacc_mu(vbool16_t vm, vfloat32m2_t vd, _Float16 vs1,
                                vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmacc_mu(vbool8_t vm, vfloat32m4_t vd, vfloat16m2_t vs1,
                                vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmacc_mu(vbool8_t vm, vfloat32m4_t vd, _Float16 vs1,
                                vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmacc_mu(vbool4_t vm, vfloat32m8_t vd, vfloat16m4_t vs1,
                                vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmacc_mu(vbool4_t vm, vfloat32m8_t vd, _Float16 vs1,
                                vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmacc_mu(vbool64_t vm, vfloat64m1_t vd,
                                vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmacc_mu(vbool64_t vm, vfloat64m1_t vd, float vs1,
                                vfloat32mf2_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmacc_mu(vbool32_t vm, vfloat64m2_t vd, vfloat32m1_t vs1,
                                vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmacc_mu(vbool32_t vm, vfloat64m2_t vd, float vs1,
                                vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmacc_mu(vbool16_t vm, vfloat64m4_t vd, vfloat32m2_t vs1,
                                vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmacc_mu(vbool16_t vm, vfloat64m4_t vd, float vs1,
                                vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmacc_mu(vbool8_t vm, vfloat64m8_t vd, vfloat32m4_t vs1,
                                vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmacc_mu(vbool8_t vm, vfloat64m8_t vd, float vs1,
                                vfloat32m4_t vs2, unsigned int frm, size_t vl);
// __riscv_vfwnmacc_mu overloads (masked, explicit `frm`).
// Results range from vfloat32mf2_t to vfloat64m8_t; vd has the same type as the
// return value, and vs1/vs2 use the element type half as wide. Each result
// type is declared twice: vs1 as a vector, then vs1 as a scalar (_Float16 or
// float).
// NOTE(review): the scalar operand is named `vs1` here, whereas the scalar
// overloads of __riscv_vfadd_tu earlier in this file use `rs1`.
vfloat32mf2_t __riscv_vfwnmacc_mu(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwnmacc_mu(vbool64_t vm, vfloat32mf2_t vd, _Float16 vs1,
                                  vfloat16mf4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m1_t __riscv_vfwnmacc_mu(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwnmacc_mu(vbool32_t vm, vfloat32m1_t vd, _Float16 vs1,
                                 vfloat16mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat32m2_t __riscv_vfwnmacc_mu(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat16m1_t vs1, vfloat16m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwnmacc_mu(vbool16_t vm, vfloat32m2_t vd, _Float16 vs1,
                                 vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwnmacc_mu(vbool8_t vm, vfloat32m4_t vd, vfloat16m2_t vs1,
                                 vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwnmacc_mu(vbool8_t vm, vfloat32m4_t vd, _Float16 vs1,
                                 vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwnmacc_mu(vbool4_t vm, vfloat32m8_t vd, vfloat16m4_t vs1,
                                 vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwnmacc_mu(vbool4_t vm, vfloat32m8_t vd, _Float16 vs1,
                                 vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwnmacc_mu(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwnmacc_mu(vbool64_t vm, vfloat64m1_t vd, float vs1,
                                 vfloat32mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat64m2_t __riscv_vfwnmacc_mu(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat32m1_t vs1, vfloat32m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwnmacc_mu(vbool32_t vm, vfloat64m2_t vd, float vs1,
                                 vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwnmacc_mu(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat32m2_t vs1, vfloat32m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwnmacc_mu(vbool16_t vm, vfloat64m4_t vd, float vs1,
                                 vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwnmacc_mu(vbool8_t vm, vfloat64m8_t vd, vfloat32m4_t vs1,
                                 vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwnmacc_mu(vbool8_t vm, vfloat64m8_t vd, float vs1,
                                 vfloat32m4_t vs2, unsigned int frm, size_t vl);
// __riscv_vfwmsac_mu overloads (masked, explicit `frm`).
// Results range from vfloat32mf2_t to vfloat64m8_t; vd has the same type as the
// return value, and vs1/vs2 use the element type half as wide. Each result
// type is declared twice: vs1 as a vector, then vs1 as a scalar (_Float16 or
// float).
// NOTE(review): the scalar operand is named `vs1` here, whereas the scalar
// overloads of __riscv_vfadd_tu earlier in this file use `rs1`.
vfloat32mf2_t __riscv_vfwmsac_mu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwmsac_mu(vbool64_t vm, vfloat32mf2_t vd, _Float16 vs1,
                                 vfloat16mf4_t vs2, unsigned int frm,
                                 size_t vl);
vfloat32m1_t __riscv_vfwmsac_mu(vbool32_t vm, vfloat32m1_t vd,
                                vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwmsac_mu(vbool32_t vm, vfloat32m1_t vd, _Float16 vs1,
                                vfloat16mf2_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmsac_mu(vbool16_t vm, vfloat32m2_t vd, vfloat16m1_t vs1,
                                vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwmsac_mu(vbool16_t vm, vfloat32m2_t vd, _Float16 vs1,
                                vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmsac_mu(vbool8_t vm, vfloat32m4_t vd, vfloat16m2_t vs1,
                                vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwmsac_mu(vbool8_t vm, vfloat32m4_t vd, _Float16 vs1,
                                vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmsac_mu(vbool4_t vm, vfloat32m8_t vd, vfloat16m4_t vs1,
                                vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwmsac_mu(vbool4_t vm, vfloat32m8_t vd, _Float16 vs1,
                                vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmsac_mu(vbool64_t vm, vfloat64m1_t vd,
                                vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwmsac_mu(vbool64_t vm, vfloat64m1_t vd, float vs1,
                                vfloat32mf2_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmsac_mu(vbool32_t vm, vfloat64m2_t vd, vfloat32m1_t vs1,
                                vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwmsac_mu(vbool32_t vm, vfloat64m2_t vd, float vs1,
                                vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmsac_mu(vbool16_t vm, vfloat64m4_t vd, vfloat32m2_t vs1,
                                vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwmsac_mu(vbool16_t vm, vfloat64m4_t vd, float vs1,
                                vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmsac_mu(vbool8_t vm, vfloat64m8_t vd, vfloat32m4_t vs1,
                                vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwmsac_mu(vbool8_t vm, vfloat64m8_t vd, float vs1,
                                vfloat32m4_t vs2, unsigned int frm, size_t vl);
// __riscv_vfwnmsac_mu overloads (masked, explicit `frm`).
// Results range from vfloat32mf2_t to vfloat64m8_t; vd has the same type as the
// return value, and vs1/vs2 use the element type half as wide. Each result
// type is declared twice: vs1 as a vector, then vs1 as a scalar (_Float16 or
// float).
// NOTE(review): the scalar operand is named `vs1` here, whereas the scalar
// overloads of __riscv_vfadd_tu earlier in this file use `rs1`.
vfloat32mf2_t __riscv_vfwnmsac_mu(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat16mf4_t vs1, vfloat16mf4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfwnmsac_mu(vbool64_t vm, vfloat32mf2_t vd, _Float16 vs1,
                                  vfloat16mf4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m1_t __riscv_vfwnmsac_mu(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat16mf2_t vs1, vfloat16mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwnmsac_mu(vbool32_t vm, vfloat32m1_t vd, _Float16 vs1,
                                 vfloat16mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat32m2_t __riscv_vfwnmsac_mu(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat16m1_t vs1, vfloat16m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfwnmsac_mu(vbool16_t vm, vfloat32m2_t vd, _Float16 vs1,
                                 vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwnmsac_mu(vbool8_t vm, vfloat32m4_t vd, vfloat16m2_t vs1,
                                 vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfwnmsac_mu(vbool8_t vm, vfloat32m4_t vd, _Float16 vs1,
                                 vfloat16m2_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwnmsac_mu(vbool4_t vm, vfloat32m8_t vd, vfloat16m4_t vs1,
                                 vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfwnmsac_mu(vbool4_t vm, vfloat32m8_t vd, _Float16 vs1,
                                 vfloat16m4_t vs2, unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwnmsac_mu(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat32mf2_t vs1, vfloat32mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwnmsac_mu(vbool64_t vm, vfloat64m1_t vd, float vs1,
                                 vfloat32mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat64m2_t __riscv_vfwnmsac_mu(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat32m1_t vs1, vfloat32m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfwnmsac_mu(vbool32_t vm, vfloat64m2_t vd, float vs1,
                                 vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwnmsac_mu(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat32m2_t vs1, vfloat32m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfwnmsac_mu(vbool16_t vm, vfloat64m4_t vd, float vs1,
                                 vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwnmsac_mu(vbool8_t vm, vfloat64m8_t vd, vfloat32m4_t vs1,
                                 vfloat32m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfwnmsac_mu(vbool8_t vm, vfloat64m8_t vd, float vs1,
                                 vfloat32m4_t vs2, unsigned int frm, size_t vl);

Vector Floating-Point Square-Root Intrinsics

// __riscv_vfsqrt_tu overloads, one per vector type from vfloat16mf4_t through
// vfloat64m8_t. vd, vs2 and the return value share the same type; these
// overloads take neither a mask nor a `frm` argument.
// NOTE(review): `_tu` is presumably the policy suffix -- confirm its meaning
// against the RVV intrinsics specification.
vfloat16mf4_t __riscv_vfsqrt_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfsqrt_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfsqrt_tu(vfloat16m1_t vd, vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfsqrt_tu(vfloat16m2_t vd, vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfsqrt_tu(vfloat16m4_t vd, vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfsqrt_tu(vfloat16m8_t vd, vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfsqrt_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfsqrt_tu(vfloat32m1_t vd, vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfsqrt_tu(vfloat32m2_t vd, vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfsqrt_tu(vfloat32m4_t vd, vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfsqrt_tu(vfloat32m8_t vd, vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfsqrt_tu(vfloat64m1_t vd, vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfsqrt_tu(vfloat64m2_t vd, vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfsqrt_tu(vfloat64m4_t vd, vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfsqrt_tu(vfloat64m8_t vd, vfloat64m8_t vs2, size_t vl);
// masked functions: __riscv_vfsqrt_tum overloads, one per vector type from
// vfloat16mf4_t through vfloat64m8_t. Each takes a mask vm ahead of vd and vs2;
// vd, vs2 and the return value share the same type, and vm's vboolN_t type
// varies with it. No `frm` argument is taken by these overloads.
vfloat16mf4_t __riscv_vfsqrt_tum(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfsqrt_tum(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfsqrt_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                size_t vl);
vfloat16m2_t __riscv_vfsqrt_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                size_t vl);
vfloat16m4_t __riscv_vfsqrt_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                size_t vl);
vfloat16m8_t __riscv_vfsqrt_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                size_t vl);
vfloat32mf2_t __riscv_vfsqrt_tum(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfsqrt_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                size_t vl);
vfloat32m2_t __riscv_vfsqrt_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                size_t vl);
vfloat32m4_t __riscv_vfsqrt_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                size_t vl);
vfloat32m8_t __riscv_vfsqrt_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                size_t vl);
vfloat64m1_t __riscv_vfsqrt_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                size_t vl);
vfloat64m2_t __riscv_vfsqrt_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                size_t vl);
vfloat64m4_t __riscv_vfsqrt_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                size_t vl);
vfloat64m8_t __riscv_vfsqrt_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                size_t vl);
// masked functions: __riscv_vfsqrt_tumu overloads, one per vector type from
// vfloat16mf4_t through vfloat64m8_t. Each takes a mask vm ahead of vd and vs2;
// vd, vs2 and the return value share the same type, and vm's vboolN_t type
// varies with it. No `frm` argument is taken by these overloads.
vfloat16mf4_t __riscv_vfsqrt_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfsqrt_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfsqrt_tumu(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfsqrt_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                 size_t vl);
vfloat16m4_t __riscv_vfsqrt_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                 size_t vl);
vfloat16m8_t __riscv_vfsqrt_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                 size_t vl);
vfloat32mf2_t __riscv_vfsqrt_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfsqrt_tumu(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfsqrt_tumu(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfsqrt_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                 size_t vl);
vfloat32m8_t __riscv_vfsqrt_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                 size_t vl);
vfloat64m1_t __riscv_vfsqrt_tumu(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfsqrt_tumu(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfsqrt_tumu(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfsqrt_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                 size_t vl);
// masked functions (_mu: tail agnostic, mask undisturbed)
vfloat16mf4_t __riscv_vfsqrt_mu(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfsqrt_mu(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfsqrt_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                               size_t vl);
vfloat16m2_t __riscv_vfsqrt_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                               size_t vl);
vfloat16m4_t __riscv_vfsqrt_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                               size_t vl);
vfloat16m8_t __riscv_vfsqrt_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                               size_t vl);
vfloat32mf2_t __riscv_vfsqrt_mu(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfsqrt_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                               size_t vl);
vfloat32m2_t __riscv_vfsqrt_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                               size_t vl);
vfloat32m4_t __riscv_vfsqrt_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                               size_t vl);
vfloat32m8_t __riscv_vfsqrt_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                               size_t vl);
vfloat64m1_t __riscv_vfsqrt_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                               size_t vl);
vfloat64m2_t __riscv_vfsqrt_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                               size_t vl);
vfloat64m4_t __riscv_vfsqrt_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                               size_t vl);
vfloat64m8_t __riscv_vfsqrt_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                               size_t vl);
vfloat16mf4_t __riscv_vfsqrt_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfsqrt_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfsqrt_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                               unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfsqrt_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                               unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfsqrt_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                               unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfsqrt_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfsqrt_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfsqrt_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                               unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfsqrt_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                               unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfsqrt_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                               unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfsqrt_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                               unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfsqrt_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                               unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfsqrt_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                               unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfsqrt_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                               unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfsqrt_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                               unsigned int frm, size_t vl);
// masked functions (_tum: tail undisturbed, mask agnostic), explicit rounding mode (frm)
vfloat16mf4_t __riscv_vfsqrt_tum(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16mf2_t __riscv_vfsqrt_tum(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16m1_t __riscv_vfsqrt_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfsqrt_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfsqrt_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfsqrt_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfsqrt_tum(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat32m1_t __riscv_vfsqrt_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfsqrt_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfsqrt_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfsqrt_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfsqrt_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfsqrt_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfsqrt_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfsqrt_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                unsigned int frm, size_t vl);
// masked functions (_tumu: tail undisturbed, mask undisturbed), explicit rounding mode (frm)
vfloat16mf4_t __riscv_vfsqrt_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat16mf4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16mf2_t __riscv_vfsqrt_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat16mf2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16m1_t __riscv_vfsqrt_tumu(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfsqrt_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfsqrt_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfsqrt_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfsqrt_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat32mf2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m1_t __riscv_vfsqrt_tumu(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfsqrt_tumu(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfsqrt_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfsqrt_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfsqrt_tumu(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfsqrt_tumu(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfsqrt_tumu(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfsqrt_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                 unsigned int frm, size_t vl);
// masked functions (_mu: tail agnostic, mask undisturbed), explicit rounding mode (frm)
vfloat16mf4_t __riscv_vfsqrt_mu(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs2, unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfsqrt_mu(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfsqrt_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                               unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfsqrt_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                               unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfsqrt_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                               unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfsqrt_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfsqrt_mu(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfsqrt_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                               unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfsqrt_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                               unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfsqrt_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                               unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfsqrt_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                               unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfsqrt_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                               unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfsqrt_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                               unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfsqrt_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                               unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfsqrt_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                               unsigned int frm, size_t vl);

Vector Floating-Point Reciprocal Square-Root Estimate Intrinsics

vfloat16mf4_t __riscv_vfrsqrt7_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                  size_t vl);
vfloat16mf2_t __riscv_vfrsqrt7_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                  size_t vl);
vfloat16m1_t __riscv_vfrsqrt7_tu(vfloat16m1_t vd, vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfrsqrt7_tu(vfloat16m2_t vd, vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfrsqrt7_tu(vfloat16m4_t vd, vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfrsqrt7_tu(vfloat16m8_t vd, vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfrsqrt7_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                  size_t vl);
vfloat32m1_t __riscv_vfrsqrt7_tu(vfloat32m1_t vd, vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfrsqrt7_tu(vfloat32m2_t vd, vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfrsqrt7_tu(vfloat32m4_t vd, vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfrsqrt7_tu(vfloat32m8_t vd, vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfrsqrt7_tu(vfloat64m1_t vd, vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfrsqrt7_tu(vfloat64m2_t vd, vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfrsqrt7_tu(vfloat64m4_t vd, vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfrsqrt7_tu(vfloat64m8_t vd, vfloat64m8_t vs2, size_t vl);
// masked functions (_tum: tail undisturbed, mask agnostic)
vfloat16mf4_t __riscv_vfrsqrt7_tum(vbool64_t vm, vfloat16mf4_t vd,
                                   vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfrsqrt7_tum(vbool32_t vm, vfloat16mf2_t vd,
                                   vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfrsqrt7_tum(vbool16_t vm, vfloat16m1_t vd,
                                  vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfrsqrt7_tum(vbool8_t vm, vfloat16m2_t vd,
                                  vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfrsqrt7_tum(vbool4_t vm, vfloat16m4_t vd,
                                  vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfrsqrt7_tum(vbool2_t vm, vfloat16m8_t vd,
                                  vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfrsqrt7_tum(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfrsqrt7_tum(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfrsqrt7_tum(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfrsqrt7_tum(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfrsqrt7_tum(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfrsqrt7_tum(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfrsqrt7_tum(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfrsqrt7_tum(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfrsqrt7_tum(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat64m8_t vs2, size_t vl);
// masked functions (_tumu: tail undisturbed, mask undisturbed)
vfloat16mf4_t __riscv_vfrsqrt7_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                    vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfrsqrt7_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                    vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfrsqrt7_tumu(vbool16_t vm, vfloat16m1_t vd,
                                   vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfrsqrt7_tumu(vbool8_t vm, vfloat16m2_t vd,
                                   vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfrsqrt7_tumu(vbool4_t vm, vfloat16m4_t vd,
                                   vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfrsqrt7_tumu(vbool2_t vm, vfloat16m8_t vd,
                                   vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfrsqrt7_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                    vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfrsqrt7_tumu(vbool32_t vm, vfloat32m1_t vd,
                                   vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfrsqrt7_tumu(vbool16_t vm, vfloat32m2_t vd,
                                   vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfrsqrt7_tumu(vbool8_t vm, vfloat32m4_t vd,
                                   vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfrsqrt7_tumu(vbool4_t vm, vfloat32m8_t vd,
                                   vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfrsqrt7_tumu(vbool64_t vm, vfloat64m1_t vd,
                                   vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfrsqrt7_tumu(vbool32_t vm, vfloat64m2_t vd,
                                   vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfrsqrt7_tumu(vbool16_t vm, vfloat64m4_t vd,
                                   vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfrsqrt7_tumu(vbool8_t vm, vfloat64m8_t vd,
                                   vfloat64m8_t vs2, size_t vl);
// masked functions (_mu: tail agnostic, mask undisturbed)
vfloat16mf4_t __riscv_vfrsqrt7_mu(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfrsqrt7_mu(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfrsqrt7_mu(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfrsqrt7_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                 size_t vl);
vfloat16m4_t __riscv_vfrsqrt7_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                 size_t vl);
vfloat16m8_t __riscv_vfrsqrt7_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                 size_t vl);
vfloat32mf2_t __riscv_vfrsqrt7_mu(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfrsqrt7_mu(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfrsqrt7_mu(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfrsqrt7_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                 size_t vl);
vfloat32m8_t __riscv_vfrsqrt7_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                 size_t vl);
vfloat64m1_t __riscv_vfrsqrt7_mu(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfrsqrt7_mu(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfrsqrt7_mu(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfrsqrt7_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                 size_t vl);

Vector Floating-Point Reciprocal Estimate Intrinsics

vfloat16mf4_t __riscv_vfrec7_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfrec7_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfrec7_tu(vfloat16m1_t vd, vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfrec7_tu(vfloat16m2_t vd, vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfrec7_tu(vfloat16m4_t vd, vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfrec7_tu(vfloat16m8_t vd, vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfrec7_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfrec7_tu(vfloat32m1_t vd, vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfrec7_tu(vfloat32m2_t vd, vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfrec7_tu(vfloat32m4_t vd, vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfrec7_tu(vfloat32m8_t vd, vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfrec7_tu(vfloat64m1_t vd, vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfrec7_tu(vfloat64m2_t vd, vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfrec7_tu(vfloat64m4_t vd, vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfrec7_tu(vfloat64m8_t vd, vfloat64m8_t vs2, size_t vl);
// masked functions (_tum: tail undisturbed, mask agnostic)
vfloat16mf4_t __riscv_vfrec7_tum(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfrec7_tum(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfrec7_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                size_t vl);
vfloat16m2_t __riscv_vfrec7_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                size_t vl);
vfloat16m4_t __riscv_vfrec7_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                size_t vl);
vfloat16m8_t __riscv_vfrec7_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                size_t vl);
vfloat32mf2_t __riscv_vfrec7_tum(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfrec7_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                size_t vl);
vfloat32m2_t __riscv_vfrec7_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                size_t vl);
vfloat32m4_t __riscv_vfrec7_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                size_t vl);
vfloat32m8_t __riscv_vfrec7_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                size_t vl);
vfloat64m1_t __riscv_vfrec7_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                size_t vl);
vfloat64m2_t __riscv_vfrec7_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                size_t vl);
vfloat64m4_t __riscv_vfrec7_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                size_t vl);
vfloat64m8_t __riscv_vfrec7_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                size_t vl);
// masked functions (_tumu: tail undisturbed, mask undisturbed)
vfloat16mf4_t __riscv_vfrec7_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfrec7_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfrec7_tumu(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfrec7_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                 size_t vl);
vfloat16m4_t __riscv_vfrec7_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                 size_t vl);
vfloat16m8_t __riscv_vfrec7_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                 size_t vl);
vfloat32mf2_t __riscv_vfrec7_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfrec7_tumu(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfrec7_tumu(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfrec7_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                 size_t vl);
vfloat32m8_t __riscv_vfrec7_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                 size_t vl);
vfloat64m1_t __riscv_vfrec7_tumu(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfrec7_tumu(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfrec7_tumu(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfrec7_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                 size_t vl);
// masked functions (_mu: tail agnostic, mask undisturbed)
vfloat16mf4_t __riscv_vfrec7_mu(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfrec7_mu(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfrec7_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                               size_t vl);
vfloat16m2_t __riscv_vfrec7_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                               size_t vl);
vfloat16m4_t __riscv_vfrec7_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                               size_t vl);
vfloat16m8_t __riscv_vfrec7_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                               size_t vl);
vfloat32mf2_t __riscv_vfrec7_mu(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfrec7_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                               size_t vl);
vfloat32m2_t __riscv_vfrec7_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                               size_t vl);
vfloat32m4_t __riscv_vfrec7_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                               size_t vl);
vfloat32m8_t __riscv_vfrec7_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                               size_t vl);
vfloat64m1_t __riscv_vfrec7_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                               size_t vl);
vfloat64m2_t __riscv_vfrec7_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                               size_t vl);
vfloat64m4_t __riscv_vfrec7_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                               size_t vl);
vfloat64m8_t __riscv_vfrec7_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                               size_t vl);
vfloat16mf4_t __riscv_vfrec7_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfrec7_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfrec7_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                               unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfrec7_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                               unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfrec7_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                               unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfrec7_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfrec7_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfrec7_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                               unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfrec7_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                               unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfrec7_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                               unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfrec7_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                               unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfrec7_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                               unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfrec7_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                               unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfrec7_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                               unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfrec7_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                               unsigned int frm, size_t vl);
// masked functions (_tum: tail undisturbed, mask agnostic), explicit rounding mode (frm)
vfloat16mf4_t __riscv_vfrec7_tum(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16mf2_t __riscv_vfrec7_tum(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat16m1_t __riscv_vfrec7_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfrec7_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfrec7_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfrec7_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfrec7_tum(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, unsigned int frm,
                                 size_t vl);
vfloat32m1_t __riscv_vfrec7_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfrec7_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfrec7_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfrec7_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfrec7_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfrec7_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfrec7_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfrec7_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                unsigned int frm, size_t vl);
// masked functions (_tumu: tail undisturbed, mask undisturbed), explicit rounding mode (frm)
vfloat16mf4_t __riscv_vfrec7_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat16mf4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16mf2_t __riscv_vfrec7_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat16mf2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16m1_t __riscv_vfrec7_tumu(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfrec7_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfrec7_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfrec7_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfrec7_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat32mf2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m1_t __riscv_vfrec7_tumu(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfrec7_tumu(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfrec7_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfrec7_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfrec7_tumu(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfrec7_tumu(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfrec7_tumu(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfrec7_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                 unsigned int frm, size_t vl);
// masked functions (_mu: tail agnostic, mask undisturbed)
vfloat16mf4_t __riscv_vfrec7_mu(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs2, unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfrec7_mu(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfrec7_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                               unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfrec7_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                               unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfrec7_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                               unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfrec7_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                               unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfrec7_mu(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfrec7_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                               unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfrec7_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                               unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfrec7_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                               unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfrec7_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                               unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfrec7_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                               unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfrec7_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                               unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfrec7_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                               unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfrec7_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                               unsigned int frm, size_t vl);

Vector Floating-Point MIN/MAX Intrinsics

vfloat16mf4_t __riscv_vfmin_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                               vfloat16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vfmin_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfmin_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                               vfloat16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vfmin_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfmin_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                              vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfmin_tu(vfloat16m1_t vd, vfloat16m1_t vs2, _Float16 rs1,
                              size_t vl);
vfloat16m2_t __riscv_vfmin_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                              vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfmin_tu(vfloat16m2_t vd, vfloat16m2_t vs2, _Float16 rs1,
                              size_t vl);
vfloat16m4_t __riscv_vfmin_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                              vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfmin_tu(vfloat16m4_t vd, vfloat16m4_t vs2, _Float16 rs1,
                              size_t vl);
vfloat16m8_t __riscv_vfmin_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                              vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfmin_tu(vfloat16m8_t vd, vfloat16m8_t vs2, _Float16 rs1,
                              size_t vl);
vfloat32mf2_t __riscv_vfmin_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                               vfloat32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfmin_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2, float rs1,
                               size_t vl);
vfloat32m1_t __riscv_vfmin_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                              vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfmin_tu(vfloat32m1_t vd, vfloat32m1_t vs2, float rs1,
                              size_t vl);
vfloat32m2_t __riscv_vfmin_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                              vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfmin_tu(vfloat32m2_t vd, vfloat32m2_t vs2, float rs1,
                              size_t vl);
vfloat32m4_t __riscv_vfmin_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                              vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfmin_tu(vfloat32m4_t vd, vfloat32m4_t vs2, float rs1,
                              size_t vl);
vfloat32m8_t __riscv_vfmin_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                              vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfmin_tu(vfloat32m8_t vd, vfloat32m8_t vs2, float rs1,
                              size_t vl);
vfloat64m1_t __riscv_vfmin_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                              vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfmin_tu(vfloat64m1_t vd, vfloat64m1_t vs2, double rs1,
                              size_t vl);
vfloat64m2_t __riscv_vfmin_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                              vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfmin_tu(vfloat64m2_t vd, vfloat64m2_t vs2, double rs1,
                              size_t vl);
vfloat64m4_t __riscv_vfmin_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                              vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfmin_tu(vfloat64m4_t vd, vfloat64m4_t vs2, double rs1,
                              size_t vl);
vfloat64m8_t __riscv_vfmin_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                              vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfmin_tu(vfloat64m8_t vd, vfloat64m8_t vs2, double rs1,
                              size_t vl);
vfloat16mf4_t __riscv_vfmax_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                               vfloat16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vfmax_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfmax_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                               vfloat16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vfmax_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfmax_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                              vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfmax_tu(vfloat16m1_t vd, vfloat16m1_t vs2, _Float16 rs1,
                              size_t vl);
vfloat16m2_t __riscv_vfmax_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                              vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfmax_tu(vfloat16m2_t vd, vfloat16m2_t vs2, _Float16 rs1,
                              size_t vl);
vfloat16m4_t __riscv_vfmax_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                              vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfmax_tu(vfloat16m4_t vd, vfloat16m4_t vs2, _Float16 rs1,
                              size_t vl);
vfloat16m8_t __riscv_vfmax_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                              vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfmax_tu(vfloat16m8_t vd, vfloat16m8_t vs2, _Float16 rs1,
                              size_t vl);
vfloat32mf2_t __riscv_vfmax_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                               vfloat32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfmax_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2, float rs1,
                               size_t vl);
vfloat32m1_t __riscv_vfmax_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                              vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfmax_tu(vfloat32m1_t vd, vfloat32m1_t vs2, float rs1,
                              size_t vl);
vfloat32m2_t __riscv_vfmax_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                              vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfmax_tu(vfloat32m2_t vd, vfloat32m2_t vs2, float rs1,
                              size_t vl);
vfloat32m4_t __riscv_vfmax_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                              vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfmax_tu(vfloat32m4_t vd, vfloat32m4_t vs2, float rs1,
                              size_t vl);
vfloat32m8_t __riscv_vfmax_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                              vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfmax_tu(vfloat32m8_t vd, vfloat32m8_t vs2, float rs1,
                              size_t vl);
vfloat64m1_t __riscv_vfmax_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                              vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfmax_tu(vfloat64m1_t vd, vfloat64m1_t vs2, double rs1,
                              size_t vl);
vfloat64m2_t __riscv_vfmax_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                              vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfmax_tu(vfloat64m2_t vd, vfloat64m2_t vs2, double rs1,
                              size_t vl);
vfloat64m4_t __riscv_vfmax_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                              vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfmax_tu(vfloat64m4_t vd, vfloat64m4_t vs2, double rs1,
                              size_t vl);
vfloat64m8_t __riscv_vfmax_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                              vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfmax_tu(vfloat64m8_t vd, vfloat64m8_t vs2, double rs1,
                              size_t vl);
// masked functions (_tum: tail undisturbed, mask agnostic)
vfloat16mf4_t __riscv_vfmin_tum(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                size_t vl);
vfloat16mf4_t __riscv_vfmin_tum(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfmin_tum(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                size_t vl);
vfloat16mf2_t __riscv_vfmin_tum(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfmin_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                               vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfmin_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfmin_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                               vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfmin_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfmin_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                               vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfmin_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfmin_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                               vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfmin_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                               _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfmin_tum(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                size_t vl);
vfloat32mf2_t __riscv_vfmin_tum(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfmin_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                               vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfmin_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                               float rs1, size_t vl);
vfloat32m2_t __riscv_vfmin_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                               vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfmin_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                               float rs1, size_t vl);
vfloat32m4_t __riscv_vfmin_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                               vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfmin_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                               float rs1, size_t vl);
vfloat32m8_t __riscv_vfmin_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                               vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfmin_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                               float rs1, size_t vl);
vfloat64m1_t __riscv_vfmin_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                               vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfmin_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                               double rs1, size_t vl);
vfloat64m2_t __riscv_vfmin_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                               vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfmin_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                               double rs1, size_t vl);
vfloat64m4_t __riscv_vfmin_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                               vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfmin_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                               double rs1, size_t vl);
vfloat64m8_t __riscv_vfmin_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                               vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfmin_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                               double rs1, size_t vl);
vfloat16mf4_t __riscv_vfmax_tum(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                size_t vl);
vfloat16mf4_t __riscv_vfmax_tum(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfmax_tum(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                size_t vl);
vfloat16mf2_t __riscv_vfmax_tum(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfmax_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                               vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfmax_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfmax_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                               vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfmax_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfmax_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                               vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfmax_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfmax_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                               vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfmax_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                               _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfmax_tum(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                size_t vl);
vfloat32mf2_t __riscv_vfmax_tum(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfmax_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                               vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfmax_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                               float rs1, size_t vl);
vfloat32m2_t __riscv_vfmax_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                               vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfmax_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                               float rs1, size_t vl);
vfloat32m4_t __riscv_vfmax_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                               vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfmax_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                               float rs1, size_t vl);
vfloat32m8_t __riscv_vfmax_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                               vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfmax_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                               float rs1, size_t vl);
vfloat64m1_t __riscv_vfmax_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                               vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfmax_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                               double rs1, size_t vl);
vfloat64m2_t __riscv_vfmax_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                               vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfmax_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                               double rs1, size_t vl);
vfloat64m4_t __riscv_vfmax_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                               vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfmax_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                               double rs1, size_t vl);
vfloat64m8_t __riscv_vfmax_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                               vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfmax_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                               double rs1, size_t vl);
// masked functions (_tumu: tail undisturbed, mask undisturbed)
vfloat16mf4_t __riscv_vfmin_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                 size_t vl);
vfloat16mf4_t __riscv_vfmin_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfmin_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                 size_t vl);
vfloat16mf2_t __riscv_vfmin_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfmin_tumu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfmin_tumu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfmin_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfmin_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfmin_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfmin_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfmin_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfmin_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfmin_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                 size_t vl);
vfloat32mf2_t __riscv_vfmin_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfmin_tumu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfmin_tumu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                float rs1, size_t vl);
vfloat32m2_t __riscv_vfmin_tumu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfmin_tumu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                float rs1, size_t vl);
vfloat32m4_t __riscv_vfmin_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfmin_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                float rs1, size_t vl);
vfloat32m8_t __riscv_vfmin_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfmin_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                float rs1, size_t vl);
vfloat64m1_t __riscv_vfmin_tumu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfmin_tumu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                double rs1, size_t vl);
vfloat64m2_t __riscv_vfmin_tumu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfmin_tumu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                double rs1, size_t vl);
vfloat64m4_t __riscv_vfmin_tumu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfmin_tumu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                double rs1, size_t vl);
vfloat64m8_t __riscv_vfmin_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfmin_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                double rs1, size_t vl);
vfloat16mf4_t __riscv_vfmax_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                 size_t vl);
vfloat16mf4_t __riscv_vfmax_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfmax_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                 size_t vl);
vfloat16mf2_t __riscv_vfmax_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfmax_tumu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfmax_tumu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfmax_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfmax_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfmax_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfmax_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfmax_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfmax_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfmax_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                 size_t vl);
vfloat32mf2_t __riscv_vfmax_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfmax_tumu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfmax_tumu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                float rs1, size_t vl);
vfloat32m2_t __riscv_vfmax_tumu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfmax_tumu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                float rs1, size_t vl);
vfloat32m4_t __riscv_vfmax_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfmax_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                float rs1, size_t vl);
vfloat32m8_t __riscv_vfmax_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfmax_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                float rs1, size_t vl);
vfloat64m1_t __riscv_vfmax_tumu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfmax_tumu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                double rs1, size_t vl);
vfloat64m2_t __riscv_vfmax_tumu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfmax_tumu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                double rs1, size_t vl);
vfloat64m4_t __riscv_vfmax_tumu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfmax_tumu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                double rs1, size_t vl);
vfloat64m8_t __riscv_vfmax_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfmax_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                double rs1, size_t vl);
// masked functions (_mu policy: tail agnostic, mask undisturbed)
// __riscv_vfmin_mu: masked floating-point minimum overloads. Every element
// type/LMUL pair has a vector-vector form (vs2, vs1) and a vector-scalar form
// (vs2, rs1) whose scalar matches the element type (_Float16, float, double).
// The mask type is vboolN_t with N = SEW/LMUL (e.g. vfloat16mf4_t pairs with
// vbool64_t, vfloat32m8_t with vbool4_t); the result type equals that of vd.
// NOTE(review): "_mu" should denote tail-agnostic, mask-undisturbed, with vd
// supplying the masked-off elements -- confirm against the intrinsics spec.
vfloat16mf4_t __riscv_vfmin_mu(vbool64_t vm, vfloat16mf4_t vd,
                               vfloat16mf4_t vs2, vfloat16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vfmin_mu(vbool64_t vm, vfloat16mf4_t vd,
                               vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfmin_mu(vbool32_t vm, vfloat16mf2_t vd,
                               vfloat16mf2_t vs2, vfloat16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vfmin_mu(vbool32_t vm, vfloat16mf2_t vd,
                               vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfmin_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                              vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfmin_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                              _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfmin_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                              vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfmin_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                              _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfmin_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                              vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfmin_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                              _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfmin_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                              vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfmin_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                              _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfmin_mu(vbool64_t vm, vfloat32mf2_t vd,
                               vfloat32mf2_t vs2, vfloat32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfmin_mu(vbool64_t vm, vfloat32mf2_t vd,
                               vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfmin_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                              vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfmin_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                              float rs1, size_t vl);
vfloat32m2_t __riscv_vfmin_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                              vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfmin_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                              float rs1, size_t vl);
vfloat32m4_t __riscv_vfmin_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                              vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfmin_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                              float rs1, size_t vl);
vfloat32m8_t __riscv_vfmin_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                              vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfmin_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                              float rs1, size_t vl);
vfloat64m1_t __riscv_vfmin_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                              vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfmin_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                              double rs1, size_t vl);
vfloat64m2_t __riscv_vfmin_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                              vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfmin_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                              double rs1, size_t vl);
vfloat64m4_t __riscv_vfmin_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                              vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfmin_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                              double rs1, size_t vl);
vfloat64m8_t __riscv_vfmin_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                              vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfmin_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                              double rs1, size_t vl);
// __riscv_vfmax_mu: masked floating-point maximum overloads. Every element
// type/LMUL pair has a vector-vector form (vs2, vs1) and a vector-scalar form
// (vs2, rs1) whose scalar matches the element type (_Float16, float, double).
// The mask type is vboolN_t with N = SEW/LMUL (e.g. vfloat16m8_t pairs with
// vbool2_t, vfloat64m1_t with vbool64_t); the result type equals that of vd.
// NOTE(review): "_mu" should denote tail-agnostic, mask-undisturbed, with vd
// supplying the masked-off elements -- confirm against the intrinsics spec.
vfloat16mf4_t __riscv_vfmax_mu(vbool64_t vm, vfloat16mf4_t vd,
                               vfloat16mf4_t vs2, vfloat16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vfmax_mu(vbool64_t vm, vfloat16mf4_t vd,
                               vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfmax_mu(vbool32_t vm, vfloat16mf2_t vd,
                               vfloat16mf2_t vs2, vfloat16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vfmax_mu(vbool32_t vm, vfloat16mf2_t vd,
                               vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfmax_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                              vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfmax_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                              _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfmax_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                              vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfmax_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                              _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfmax_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                              vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfmax_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                              _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfmax_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                              vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfmax_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                              _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfmax_mu(vbool64_t vm, vfloat32mf2_t vd,
                               vfloat32mf2_t vs2, vfloat32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfmax_mu(vbool64_t vm, vfloat32mf2_t vd,
                               vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfmax_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                              vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfmax_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                              float rs1, size_t vl);
vfloat32m2_t __riscv_vfmax_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                              vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfmax_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                              float rs1, size_t vl);
vfloat32m4_t __riscv_vfmax_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                              vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfmax_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                              float rs1, size_t vl);
vfloat32m8_t __riscv_vfmax_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                              vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfmax_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                              float rs1, size_t vl);
vfloat64m1_t __riscv_vfmax_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                              vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfmax_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                              double rs1, size_t vl);
vfloat64m2_t __riscv_vfmax_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                              vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfmax_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                              double rs1, size_t vl);
vfloat64m4_t __riscv_vfmax_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                              vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfmax_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                              double rs1, size_t vl);
vfloat64m8_t __riscv_vfmax_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                              vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfmax_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                              double rs1, size_t vl);

Vector Floating-Point Sign-Injection Intrinsics

// __riscv_vfsgnj_tu: unmasked sign-injection overloads that take a vd operand
// ahead of the sources. Every element type/LMUL pair has a vector-vector form
// (vs2, vs1) and a vector-scalar form (vs2, rs1) whose scalar matches the
// element type (_Float16, float, double); the result type equals that of vd.
// NOTE(review): per the RVV ISA spec the result takes every bit except the
// sign from vs2 and the sign from vs1/rs1, and "_tu" (tail undisturbed) keeps
// tail elements from vd -- confirm against the spec.
vfloat16mf4_t __riscv_vfsgnj_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                vfloat16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vfsgnj_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfsgnj_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                vfloat16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vfsgnj_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfsgnj_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                               vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfsgnj_tu(vfloat16m1_t vd, vfloat16m1_t vs2, _Float16 rs1,
                               size_t vl);
vfloat16m2_t __riscv_vfsgnj_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                               vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfsgnj_tu(vfloat16m2_t vd, vfloat16m2_t vs2, _Float16 rs1,
                               size_t vl);
vfloat16m4_t __riscv_vfsgnj_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                               vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfsgnj_tu(vfloat16m4_t vd, vfloat16m4_t vs2, _Float16 rs1,
                               size_t vl);
vfloat16m8_t __riscv_vfsgnj_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                               vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfsgnj_tu(vfloat16m8_t vd, vfloat16m8_t vs2, _Float16 rs1,
                               size_t vl);
vfloat32mf2_t __riscv_vfsgnj_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                vfloat32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfsgnj_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2, float rs1,
                                size_t vl);
vfloat32m1_t __riscv_vfsgnj_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                               vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfsgnj_tu(vfloat32m1_t vd, vfloat32m1_t vs2, float rs1,
                               size_t vl);
vfloat32m2_t __riscv_vfsgnj_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                               vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfsgnj_tu(vfloat32m2_t vd, vfloat32m2_t vs2, float rs1,
                               size_t vl);
vfloat32m4_t __riscv_vfsgnj_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                               vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfsgnj_tu(vfloat32m4_t vd, vfloat32m4_t vs2, float rs1,
                               size_t vl);
vfloat32m8_t __riscv_vfsgnj_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                               vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfsgnj_tu(vfloat32m8_t vd, vfloat32m8_t vs2, float rs1,
                               size_t vl);
vfloat64m1_t __riscv_vfsgnj_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                               vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfsgnj_tu(vfloat64m1_t vd, vfloat64m1_t vs2, double rs1,
                               size_t vl);
vfloat64m2_t __riscv_vfsgnj_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                               vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfsgnj_tu(vfloat64m2_t vd, vfloat64m2_t vs2, double rs1,
                               size_t vl);
vfloat64m4_t __riscv_vfsgnj_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                               vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfsgnj_tu(vfloat64m4_t vd, vfloat64m4_t vs2, double rs1,
                               size_t vl);
vfloat64m8_t __riscv_vfsgnj_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                               vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfsgnj_tu(vfloat64m8_t vd, vfloat64m8_t vs2, double rs1,
                               size_t vl);
// __riscv_vfsgnjn_tu: unmasked negated-sign-injection overloads that take a vd
// operand ahead of the sources. Every element type/LMUL pair has a
// vector-vector form (vs2, vs1) and a vector-scalar form (vs2, rs1) whose
// scalar matches the element type; the result type equals that of vd.
// NOTE(review): per the RVV ISA spec the result takes every bit except the
// sign from vs2 and the inverted sign of vs1/rs1, and "_tu" (tail undisturbed)
// keeps tail elements from vd -- confirm against the spec.
vfloat16mf4_t __riscv_vfsgnjn_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                 vfloat16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vfsgnjn_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                 _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfsgnjn_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                 vfloat16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vfsgnjn_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                 _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfsgnjn_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfsgnjn_tu(vfloat16m1_t vd, vfloat16m1_t vs2, _Float16 rs1,
                                size_t vl);
vfloat16m2_t __riscv_vfsgnjn_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfsgnjn_tu(vfloat16m2_t vd, vfloat16m2_t vs2, _Float16 rs1,
                                size_t vl);
vfloat16m4_t __riscv_vfsgnjn_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfsgnjn_tu(vfloat16m4_t vd, vfloat16m4_t vs2, _Float16 rs1,
                                size_t vl);
vfloat16m8_t __riscv_vfsgnjn_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfsgnjn_tu(vfloat16m8_t vd, vfloat16m8_t vs2, _Float16 rs1,
                                size_t vl);
vfloat32mf2_t __riscv_vfsgnjn_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                 vfloat32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfsgnjn_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2, float rs1,
                                 size_t vl);
vfloat32m1_t __riscv_vfsgnjn_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfsgnjn_tu(vfloat32m1_t vd, vfloat32m1_t vs2, float rs1,
                                size_t vl);
vfloat32m2_t __riscv_vfsgnjn_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfsgnjn_tu(vfloat32m2_t vd, vfloat32m2_t vs2, float rs1,
                                size_t vl);
vfloat32m4_t __riscv_vfsgnjn_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfsgnjn_tu(vfloat32m4_t vd, vfloat32m4_t vs2, float rs1,
                                size_t vl);
vfloat32m8_t __riscv_vfsgnjn_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfsgnjn_tu(vfloat32m8_t vd, vfloat32m8_t vs2, float rs1,
                                size_t vl);
vfloat64m1_t __riscv_vfsgnjn_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfsgnjn_tu(vfloat64m1_t vd, vfloat64m1_t vs2, double rs1,
                                size_t vl);
vfloat64m2_t __riscv_vfsgnjn_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfsgnjn_tu(vfloat64m2_t vd, vfloat64m2_t vs2, double rs1,
                                size_t vl);
vfloat64m4_t __riscv_vfsgnjn_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfsgnjn_tu(vfloat64m4_t vd, vfloat64m4_t vs2, double rs1,
                                size_t vl);
vfloat64m8_t __riscv_vfsgnjn_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfsgnjn_tu(vfloat64m8_t vd, vfloat64m8_t vs2, double rs1,
                                size_t vl);
// __riscv_vfsgnjx_tu: unmasked XOR-sign-injection overloads that take a vd
// operand ahead of the sources. Every element type/LMUL pair has a
// vector-vector form (vs2, vs1) and a vector-scalar form (vs2, rs1) whose
// scalar matches the element type; the result type equals that of vd.
// NOTE(review): per the RVV ISA spec the result takes every bit except the
// sign from vs2 and a sign equal to the XOR of the vs2 and vs1/rs1 signs, and
// "_tu" (tail undisturbed) keeps tail elements from vd -- confirm.
vfloat16mf4_t __riscv_vfsgnjx_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                 vfloat16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vfsgnjx_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                 _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfsgnjx_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                 vfloat16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vfsgnjx_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                 _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfsgnjx_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfsgnjx_tu(vfloat16m1_t vd, vfloat16m1_t vs2, _Float16 rs1,
                                size_t vl);
vfloat16m2_t __riscv_vfsgnjx_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfsgnjx_tu(vfloat16m2_t vd, vfloat16m2_t vs2, _Float16 rs1,
                                size_t vl);
vfloat16m4_t __riscv_vfsgnjx_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfsgnjx_tu(vfloat16m4_t vd, vfloat16m4_t vs2, _Float16 rs1,
                                size_t vl);
vfloat16m8_t __riscv_vfsgnjx_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfsgnjx_tu(vfloat16m8_t vd, vfloat16m8_t vs2, _Float16 rs1,
                                size_t vl);
vfloat32mf2_t __riscv_vfsgnjx_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                 vfloat32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfsgnjx_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2, float rs1,
                                 size_t vl);
vfloat32m1_t __riscv_vfsgnjx_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfsgnjx_tu(vfloat32m1_t vd, vfloat32m1_t vs2, float rs1,
                                size_t vl);
vfloat32m2_t __riscv_vfsgnjx_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfsgnjx_tu(vfloat32m2_t vd, vfloat32m2_t vs2, float rs1,
                                size_t vl);
vfloat32m4_t __riscv_vfsgnjx_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfsgnjx_tu(vfloat32m4_t vd, vfloat32m4_t vs2, float rs1,
                                size_t vl);
vfloat32m8_t __riscv_vfsgnjx_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfsgnjx_tu(vfloat32m8_t vd, vfloat32m8_t vs2, float rs1,
                                size_t vl);
vfloat64m1_t __riscv_vfsgnjx_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfsgnjx_tu(vfloat64m1_t vd, vfloat64m1_t vs2, double rs1,
                                size_t vl);
vfloat64m2_t __riscv_vfsgnjx_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfsgnjx_tu(vfloat64m2_t vd, vfloat64m2_t vs2, double rs1,
                                size_t vl);
vfloat64m4_t __riscv_vfsgnjx_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfsgnjx_tu(vfloat64m4_t vd, vfloat64m4_t vs2, double rs1,
                                size_t vl);
vfloat64m8_t __riscv_vfsgnjx_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfsgnjx_tu(vfloat64m8_t vd, vfloat64m8_t vs2, double rs1,
                                size_t vl);
// masked functions (_tum policy: tail undisturbed, mask agnostic)
// __riscv_vfsgnj_tum: masked sign-injection overloads. Every element
// type/LMUL pair has a vector-vector form (vs2, vs1) and a vector-scalar form
// (vs2, rs1) whose scalar matches the element type (_Float16, float, double).
// The mask type is vboolN_t with N = SEW/LMUL (e.g. vfloat16mf4_t pairs with
// vbool64_t, vfloat64m8_t with vbool8_t); the result type equals that of vd.
// NOTE(review): per the RVV ISA spec the result takes every bit except the
// sign from vs2 and the sign from vs1/rs1; "_tum" should denote
// tail-undisturbed, mask-agnostic -- confirm against the intrinsics spec.
vfloat16mf4_t __riscv_vfsgnj_tum(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                 size_t vl);
vfloat16mf4_t __riscv_vfsgnj_tum(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfsgnj_tum(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                 size_t vl);
vfloat16mf2_t __riscv_vfsgnj_tum(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfsgnj_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfsgnj_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfsgnj_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfsgnj_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfsgnj_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfsgnj_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfsgnj_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfsgnj_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfsgnj_tum(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                 size_t vl);
vfloat32mf2_t __riscv_vfsgnj_tum(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfsgnj_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfsgnj_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                float rs1, size_t vl);
vfloat32m2_t __riscv_vfsgnj_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfsgnj_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                float rs1, size_t vl);
vfloat32m4_t __riscv_vfsgnj_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfsgnj_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                float rs1, size_t vl);
vfloat32m8_t __riscv_vfsgnj_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfsgnj_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                float rs1, size_t vl);
vfloat64m1_t __riscv_vfsgnj_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfsgnj_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                double rs1, size_t vl);
vfloat64m2_t __riscv_vfsgnj_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfsgnj_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                double rs1, size_t vl);
vfloat64m4_t __riscv_vfsgnj_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfsgnj_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                double rs1, size_t vl);
vfloat64m8_t __riscv_vfsgnj_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfsgnj_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                double rs1, size_t vl);
// __riscv_vfsgnjn_tum: masked negated-sign-injection overloads. Every element
// type/LMUL pair has a vector-vector form (vs2, vs1) and a vector-scalar form
// (vs2, rs1) whose scalar matches the element type (_Float16, float, double).
// The mask type is vboolN_t with N = SEW/LMUL (e.g. vfloat32mf2_t pairs with
// vbool64_t, vfloat16m8_t with vbool2_t); the result type equals that of vd.
// NOTE(review): per the RVV ISA spec the result takes every bit except the
// sign from vs2 and the inverted sign of vs1/rs1; "_tum" should denote
// tail-undisturbed, mask-agnostic -- confirm against the intrinsics spec.
vfloat16mf4_t __riscv_vfsgnjn_tum(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                  size_t vl);
vfloat16mf4_t __riscv_vfsgnjn_tum(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfsgnjn_tum(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                  size_t vl);
vfloat16mf2_t __riscv_vfsgnjn_tum(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfsgnjn_tum(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat16m1_t vs2, vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfsgnjn_tum(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat16m1_t vs2, _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfsgnjn_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                 vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfsgnjn_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                 _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfsgnjn_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                 vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfsgnjn_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                 _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfsgnjn_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                 vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfsgnjn_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                 _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfsgnjn_tum(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                  size_t vl);
vfloat32mf2_t __riscv_vfsgnjn_tum(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfsgnjn_tum(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat32m1_t vs2, vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfsgnjn_tum(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat32m1_t vs2, float rs1, size_t vl);
vfloat32m2_t __riscv_vfsgnjn_tum(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat32m2_t vs2, vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfsgnjn_tum(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat32m2_t vs2, float rs1, size_t vl);
vfloat32m4_t __riscv_vfsgnjn_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                 vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfsgnjn_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                 float rs1, size_t vl);
vfloat32m8_t __riscv_vfsgnjn_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                 vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfsgnjn_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                 float rs1, size_t vl);
vfloat64m1_t __riscv_vfsgnjn_tum(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat64m1_t vs2, vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfsgnjn_tum(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat64m1_t vs2, double rs1, size_t vl);
vfloat64m2_t __riscv_vfsgnjn_tum(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat64m2_t vs2, vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfsgnjn_tum(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat64m2_t vs2, double rs1, size_t vl);
vfloat64m4_t __riscv_vfsgnjn_tum(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat64m4_t vs2, vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfsgnjn_tum(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat64m4_t vs2, double rs1, size_t vl);
vfloat64m8_t __riscv_vfsgnjn_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                 vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfsgnjn_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                 double rs1, size_t vl);
// __riscv_vfsgnjx_tum: masked XOR-sign-injection overloads. Every element
// type/LMUL pair has a vector-vector form (vs2, vs1) and a vector-scalar form
// (vs2, rs1) whose scalar matches the element type (_Float16, float, double).
// The mask type is vboolN_t with N = SEW/LMUL (e.g. vfloat64m1_t pairs with
// vbool64_t, vfloat32m8_t with vbool4_t); the result type equals that of vd.
// NOTE(review): per the RVV ISA spec the result takes every bit except the
// sign from vs2 and a sign equal to the XOR of the vs2 and vs1/rs1 signs;
// "_tum" should denote tail-undisturbed, mask-agnostic -- confirm.
vfloat16mf4_t __riscv_vfsgnjx_tum(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                  size_t vl);
vfloat16mf4_t __riscv_vfsgnjx_tum(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfsgnjx_tum(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                  size_t vl);
vfloat16mf2_t __riscv_vfsgnjx_tum(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfsgnjx_tum(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat16m1_t vs2, vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfsgnjx_tum(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat16m1_t vs2, _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfsgnjx_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                 vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfsgnjx_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                 _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfsgnjx_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                 vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfsgnjx_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                 _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfsgnjx_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                 vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfsgnjx_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                 _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfsgnjx_tum(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                  size_t vl);
vfloat32mf2_t __riscv_vfsgnjx_tum(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfsgnjx_tum(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat32m1_t vs2, vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfsgnjx_tum(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat32m1_t vs2, float rs1, size_t vl);
vfloat32m2_t __riscv_vfsgnjx_tum(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat32m2_t vs2, vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfsgnjx_tum(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat32m2_t vs2, float rs1, size_t vl);
vfloat32m4_t __riscv_vfsgnjx_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                 vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfsgnjx_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                 float rs1, size_t vl);
vfloat32m8_t __riscv_vfsgnjx_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                 vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfsgnjx_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                 float rs1, size_t vl);
vfloat64m1_t __riscv_vfsgnjx_tum(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat64m1_t vs2, vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfsgnjx_tum(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat64m1_t vs2, double rs1, size_t vl);
vfloat64m2_t __riscv_vfsgnjx_tum(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat64m2_t vs2, vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfsgnjx_tum(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat64m2_t vs2, double rs1, size_t vl);
vfloat64m4_t __riscv_vfsgnjx_tum(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat64m4_t vs2, vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfsgnjx_tum(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat64m4_t vs2, double rs1, size_t vl);
vfloat64m8_t __riscv_vfsgnjx_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                 vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfsgnjx_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                 double rs1, size_t vl);
// masked functions, _tumu policy (tail undisturbed, mask undisturbed)
vfloat16mf4_t __riscv_vfsgnj_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                  size_t vl);
vfloat16mf4_t __riscv_vfsgnj_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfsgnj_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                  size_t vl);
vfloat16mf2_t __riscv_vfsgnj_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfsgnj_tumu(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat16m1_t vs2, vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfsgnj_tumu(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat16m1_t vs2, _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfsgnj_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                 vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfsgnj_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                 _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfsgnj_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                 vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfsgnj_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                 _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfsgnj_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                 vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfsgnj_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                 _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfsgnj_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                  size_t vl);
vfloat32mf2_t __riscv_vfsgnj_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfsgnj_tumu(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat32m1_t vs2, vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfsgnj_tumu(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat32m1_t vs2, float rs1, size_t vl);
vfloat32m2_t __riscv_vfsgnj_tumu(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat32m2_t vs2, vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfsgnj_tumu(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat32m2_t vs2, float rs1, size_t vl);
vfloat32m4_t __riscv_vfsgnj_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                 vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfsgnj_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                 float rs1, size_t vl);
vfloat32m8_t __riscv_vfsgnj_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                 vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfsgnj_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                 float rs1, size_t vl);
vfloat64m1_t __riscv_vfsgnj_tumu(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat64m1_t vs2, vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfsgnj_tumu(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat64m1_t vs2, double rs1, size_t vl);
vfloat64m2_t __riscv_vfsgnj_tumu(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat64m2_t vs2, vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfsgnj_tumu(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat64m2_t vs2, double rs1, size_t vl);
vfloat64m4_t __riscv_vfsgnj_tumu(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat64m4_t vs2, vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfsgnj_tumu(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat64m4_t vs2, double rs1, size_t vl);
vfloat64m8_t __riscv_vfsgnj_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                 vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfsgnj_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                 double rs1, size_t vl);
vfloat16mf4_t __riscv_vfsgnjn_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                   vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                   size_t vl);
vfloat16mf4_t __riscv_vfsgnjn_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                   vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfsgnjn_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                   vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                   size_t vl);
vfloat16mf2_t __riscv_vfsgnjn_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                   vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfsgnjn_tumu(vbool16_t vm, vfloat16m1_t vd,
                                  vfloat16m1_t vs2, vfloat16m1_t vs1,
                                  size_t vl);
vfloat16m1_t __riscv_vfsgnjn_tumu(vbool16_t vm, vfloat16m1_t vd,
                                  vfloat16m1_t vs2, _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfsgnjn_tumu(vbool8_t vm, vfloat16m2_t vd,
                                  vfloat16m2_t vs2, vfloat16m2_t vs1,
                                  size_t vl);
vfloat16m2_t __riscv_vfsgnjn_tumu(vbool8_t vm, vfloat16m2_t vd,
                                  vfloat16m2_t vs2, _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfsgnjn_tumu(vbool4_t vm, vfloat16m4_t vd,
                                  vfloat16m4_t vs2, vfloat16m4_t vs1,
                                  size_t vl);
vfloat16m4_t __riscv_vfsgnjn_tumu(vbool4_t vm, vfloat16m4_t vd,
                                  vfloat16m4_t vs2, _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfsgnjn_tumu(vbool2_t vm, vfloat16m8_t vd,
                                  vfloat16m8_t vs2, vfloat16m8_t vs1,
                                  size_t vl);
vfloat16m8_t __riscv_vfsgnjn_tumu(vbool2_t vm, vfloat16m8_t vd,
                                  vfloat16m8_t vs2, _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfsgnjn_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                   size_t vl);
vfloat32mf2_t __riscv_vfsgnjn_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfsgnjn_tumu(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat32m1_t vs2, vfloat32m1_t vs1,
                                  size_t vl);
vfloat32m1_t __riscv_vfsgnjn_tumu(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat32m1_t vs2, float rs1, size_t vl);
vfloat32m2_t __riscv_vfsgnjn_tumu(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat32m2_t vs2, vfloat32m2_t vs1,
                                  size_t vl);
vfloat32m2_t __riscv_vfsgnjn_tumu(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat32m2_t vs2, float rs1, size_t vl);
vfloat32m4_t __riscv_vfsgnjn_tumu(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat32m4_t vs2, vfloat32m4_t vs1,
                                  size_t vl);
vfloat32m4_t __riscv_vfsgnjn_tumu(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat32m4_t vs2, float rs1, size_t vl);
vfloat32m8_t __riscv_vfsgnjn_tumu(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat32m8_t vs2, vfloat32m8_t vs1,
                                  size_t vl);
vfloat32m8_t __riscv_vfsgnjn_tumu(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat32m8_t vs2, float rs1, size_t vl);
vfloat64m1_t __riscv_vfsgnjn_tumu(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat64m1_t vs2, vfloat64m1_t vs1,
                                  size_t vl);
vfloat64m1_t __riscv_vfsgnjn_tumu(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat64m1_t vs2, double rs1, size_t vl);
vfloat64m2_t __riscv_vfsgnjn_tumu(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat64m2_t vs2, vfloat64m2_t vs1,
                                  size_t vl);
vfloat64m2_t __riscv_vfsgnjn_tumu(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat64m2_t vs2, double rs1, size_t vl);
vfloat64m4_t __riscv_vfsgnjn_tumu(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat64m4_t vs2, vfloat64m4_t vs1,
                                  size_t vl);
vfloat64m4_t __riscv_vfsgnjn_tumu(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat64m4_t vs2, double rs1, size_t vl);
vfloat64m8_t __riscv_vfsgnjn_tumu(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat64m8_t vs2, vfloat64m8_t vs1,
                                  size_t vl);
vfloat64m8_t __riscv_vfsgnjn_tumu(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat64m8_t vs2, double rs1, size_t vl);
vfloat16mf4_t __riscv_vfsgnjx_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                   vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                   size_t vl);
vfloat16mf4_t __riscv_vfsgnjx_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                   vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfsgnjx_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                   vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                   size_t vl);
vfloat16mf2_t __riscv_vfsgnjx_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                   vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfsgnjx_tumu(vbool16_t vm, vfloat16m1_t vd,
                                  vfloat16m1_t vs2, vfloat16m1_t vs1,
                                  size_t vl);
vfloat16m1_t __riscv_vfsgnjx_tumu(vbool16_t vm, vfloat16m1_t vd,
                                  vfloat16m1_t vs2, _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfsgnjx_tumu(vbool8_t vm, vfloat16m2_t vd,
                                  vfloat16m2_t vs2, vfloat16m2_t vs1,
                                  size_t vl);
vfloat16m2_t __riscv_vfsgnjx_tumu(vbool8_t vm, vfloat16m2_t vd,
                                  vfloat16m2_t vs2, _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfsgnjx_tumu(vbool4_t vm, vfloat16m4_t vd,
                                  vfloat16m4_t vs2, vfloat16m4_t vs1,
                                  size_t vl);
vfloat16m4_t __riscv_vfsgnjx_tumu(vbool4_t vm, vfloat16m4_t vd,
                                  vfloat16m4_t vs2, _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfsgnjx_tumu(vbool2_t vm, vfloat16m8_t vd,
                                  vfloat16m8_t vs2, vfloat16m8_t vs1,
                                  size_t vl);
vfloat16m8_t __riscv_vfsgnjx_tumu(vbool2_t vm, vfloat16m8_t vd,
                                  vfloat16m8_t vs2, _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfsgnjx_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                   size_t vl);
vfloat32mf2_t __riscv_vfsgnjx_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfsgnjx_tumu(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat32m1_t vs2, vfloat32m1_t vs1,
                                  size_t vl);
vfloat32m1_t __riscv_vfsgnjx_tumu(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat32m1_t vs2, float rs1, size_t vl);
vfloat32m2_t __riscv_vfsgnjx_tumu(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat32m2_t vs2, vfloat32m2_t vs1,
                                  size_t vl);
vfloat32m2_t __riscv_vfsgnjx_tumu(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat32m2_t vs2, float rs1, size_t vl);
vfloat32m4_t __riscv_vfsgnjx_tumu(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat32m4_t vs2, vfloat32m4_t vs1,
                                  size_t vl);
vfloat32m4_t __riscv_vfsgnjx_tumu(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat32m4_t vs2, float rs1, size_t vl);
vfloat32m8_t __riscv_vfsgnjx_tumu(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat32m8_t vs2, vfloat32m8_t vs1,
                                  size_t vl);
vfloat32m8_t __riscv_vfsgnjx_tumu(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat32m8_t vs2, float rs1, size_t vl);
vfloat64m1_t __riscv_vfsgnjx_tumu(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat64m1_t vs2, vfloat64m1_t vs1,
                                  size_t vl);
vfloat64m1_t __riscv_vfsgnjx_tumu(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat64m1_t vs2, double rs1, size_t vl);
vfloat64m2_t __riscv_vfsgnjx_tumu(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat64m2_t vs2, vfloat64m2_t vs1,
                                  size_t vl);
vfloat64m2_t __riscv_vfsgnjx_tumu(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat64m2_t vs2, double rs1, size_t vl);
vfloat64m4_t __riscv_vfsgnjx_tumu(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat64m4_t vs2, vfloat64m4_t vs1,
                                  size_t vl);
vfloat64m4_t __riscv_vfsgnjx_tumu(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat64m4_t vs2, double rs1, size_t vl);
vfloat64m8_t __riscv_vfsgnjx_tumu(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat64m8_t vs2, vfloat64m8_t vs1,
                                  size_t vl);
vfloat64m8_t __riscv_vfsgnjx_tumu(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat64m8_t vs2, double rs1, size_t vl);
// masked functions, _mu policy (tail agnostic, mask undisturbed)
vfloat16mf4_t __riscv_vfsgnj_mu(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                size_t vl);
vfloat16mf4_t __riscv_vfsgnj_mu(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfsgnj_mu(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                size_t vl);
vfloat16mf2_t __riscv_vfsgnj_mu(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfsgnj_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                               vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfsgnj_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfsgnj_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                               vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfsgnj_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfsgnj_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                               vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfsgnj_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                               _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfsgnj_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                               vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfsgnj_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                               _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfsgnj_mu(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                size_t vl);
vfloat32mf2_t __riscv_vfsgnj_mu(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfsgnj_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                               vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfsgnj_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                               float rs1, size_t vl);
vfloat32m2_t __riscv_vfsgnj_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                               vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfsgnj_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                               float rs1, size_t vl);
vfloat32m4_t __riscv_vfsgnj_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                               vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfsgnj_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                               float rs1, size_t vl);
vfloat32m8_t __riscv_vfsgnj_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                               vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfsgnj_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                               float rs1, size_t vl);
vfloat64m1_t __riscv_vfsgnj_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                               vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfsgnj_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                               double rs1, size_t vl);
vfloat64m2_t __riscv_vfsgnj_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                               vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfsgnj_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                               double rs1, size_t vl);
vfloat64m4_t __riscv_vfsgnj_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                               vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfsgnj_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                               double rs1, size_t vl);
vfloat64m8_t __riscv_vfsgnj_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                               vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfsgnj_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                               double rs1, size_t vl);
vfloat16mf4_t __riscv_vfsgnjn_mu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                 size_t vl);
vfloat16mf4_t __riscv_vfsgnjn_mu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfsgnjn_mu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                 size_t vl);
vfloat16mf2_t __riscv_vfsgnjn_mu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfsgnjn_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfsgnjn_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfsgnjn_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfsgnjn_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfsgnjn_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfsgnjn_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfsgnjn_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfsgnjn_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfsgnjn_mu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                 size_t vl);
vfloat32mf2_t __riscv_vfsgnjn_mu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfsgnjn_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfsgnjn_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                float rs1, size_t vl);
vfloat32m2_t __riscv_vfsgnjn_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfsgnjn_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                float rs1, size_t vl);
vfloat32m4_t __riscv_vfsgnjn_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfsgnjn_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                float rs1, size_t vl);
vfloat32m8_t __riscv_vfsgnjn_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfsgnjn_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                float rs1, size_t vl);
vfloat64m1_t __riscv_vfsgnjn_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfsgnjn_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                double rs1, size_t vl);
vfloat64m2_t __riscv_vfsgnjn_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfsgnjn_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                double rs1, size_t vl);
vfloat64m4_t __riscv_vfsgnjn_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfsgnjn_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                double rs1, size_t vl);
vfloat64m8_t __riscv_vfsgnjn_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfsgnjn_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                double rs1, size_t vl);
vfloat16mf4_t __riscv_vfsgnjx_mu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, vfloat16mf4_t vs1,
                                 size_t vl);
vfloat16mf4_t __riscv_vfsgnjx_mu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfsgnjx_mu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, vfloat16mf2_t vs1,
                                 size_t vl);
vfloat16mf2_t __riscv_vfsgnjx_mu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfsgnjx_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfsgnjx_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfsgnjx_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfsgnjx_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfsgnjx_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfsgnjx_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfsgnjx_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfsgnjx_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfsgnjx_mu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, vfloat32mf2_t vs1,
                                 size_t vl);
vfloat32mf2_t __riscv_vfsgnjx_mu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfsgnjx_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfsgnjx_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                float rs1, size_t vl);
vfloat32m2_t __riscv_vfsgnjx_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfsgnjx_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                float rs1, size_t vl);
vfloat32m4_t __riscv_vfsgnjx_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfsgnjx_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                float rs1, size_t vl);
vfloat32m8_t __riscv_vfsgnjx_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfsgnjx_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                float rs1, size_t vl);
vfloat64m1_t __riscv_vfsgnjx_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfsgnjx_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                double rs1, size_t vl);
vfloat64m2_t __riscv_vfsgnjx_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfsgnjx_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                double rs1, size_t vl);
vfloat64m4_t __riscv_vfsgnjx_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfsgnjx_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                double rs1, size_t vl);
vfloat64m8_t __riscv_vfsgnjx_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfsgnjx_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                double rs1, size_t vl);

Vector Floating-Point Absolute Value Intrinsics

vfloat16mf4_t __riscv_vfabs_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfabs_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfabs_tu(vfloat16m1_t vd, vfloat16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfabs_tu(vfloat16m2_t vd, vfloat16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfabs_tu(vfloat16m4_t vd, vfloat16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfabs_tu(vfloat16m8_t vd, vfloat16m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfabs_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfabs_tu(vfloat32m1_t vd, vfloat32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfabs_tu(vfloat32m2_t vd, vfloat32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfabs_tu(vfloat32m4_t vd, vfloat32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfabs_tu(vfloat32m8_t vd, vfloat32m8_t vs2, size_t vl);
vfloat64m1_t __riscv_vfabs_tu(vfloat64m1_t vd, vfloat64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfabs_tu(vfloat64m2_t vd, vfloat64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfabs_tu(vfloat64m4_t vd, vfloat64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfabs_tu(vfloat64m8_t vd, vfloat64m8_t vs2, size_t vl);
// masked functions, _tum policy (tail undisturbed, mask agnostic)
vfloat16mf4_t __riscv_vfabs_tum(vbool64_t vm, vfloat16mf4_t vd,
                                vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfabs_tum(vbool32_t vm, vfloat16mf2_t vd,
                                vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfabs_tum(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                               size_t vl);
vfloat16m2_t __riscv_vfabs_tum(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                               size_t vl);
vfloat16m4_t __riscv_vfabs_tum(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                               size_t vl);
vfloat16m8_t __riscv_vfabs_tum(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                               size_t vl);
vfloat32mf2_t __riscv_vfabs_tum(vbool64_t vm, vfloat32mf2_t vd,
                                vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfabs_tum(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                               size_t vl);
vfloat32m2_t __riscv_vfabs_tum(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                               size_t vl);
vfloat32m4_t __riscv_vfabs_tum(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                               size_t vl);
vfloat32m8_t __riscv_vfabs_tum(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                               size_t vl);
vfloat64m1_t __riscv_vfabs_tum(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                               size_t vl);
vfloat64m2_t __riscv_vfabs_tum(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                               size_t vl);
vfloat64m4_t __riscv_vfabs_tum(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                               size_t vl);
vfloat64m8_t __riscv_vfabs_tum(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                               size_t vl);
// masked functions, _tumu policy (tail undisturbed, mask undisturbed)
vfloat16mf4_t __riscv_vfabs_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                 vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfabs_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                 vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfabs_tumu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                                size_t vl);
vfloat16m2_t __riscv_vfabs_tumu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                                size_t vl);
vfloat16m4_t __riscv_vfabs_tumu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                                size_t vl);
vfloat16m8_t __riscv_vfabs_tumu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                                size_t vl);
vfloat32mf2_t __riscv_vfabs_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                 vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfabs_tumu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                                size_t vl);
vfloat32m2_t __riscv_vfabs_tumu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                                size_t vl);
vfloat32m4_t __riscv_vfabs_tumu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                                size_t vl);
vfloat32m8_t __riscv_vfabs_tumu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                                size_t vl);
vfloat64m1_t __riscv_vfabs_tumu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                                size_t vl);
vfloat64m2_t __riscv_vfabs_tumu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                                size_t vl);
vfloat64m4_t __riscv_vfabs_tumu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                                size_t vl);
vfloat64m8_t __riscv_vfabs_tumu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                                size_t vl);
// masked functions
// Overloaded __riscv_vfabs_mu prototypes, one per float vector type
// (vfloat16mf4_t through vfloat64m8_t). Each takes a mask `vm`, a destination
// operand `vd`, the source `vs2` and `vl`, and returns the same vector type
// as `vd` and `vs2`.
// NOTE(review): the `_mu` suffix presumably selects the mask-undisturbed
// (tail-agnostic) policy -- confirm against the RVV specification.
vfloat16mf4_t __riscv_vfabs_mu(vbool64_t vm, vfloat16mf4_t vd,
                               vfloat16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfabs_mu(vbool32_t vm, vfloat16mf2_t vd,
                               vfloat16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfabs_mu(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                              size_t vl);
vfloat16m2_t __riscv_vfabs_mu(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                              size_t vl);
vfloat16m4_t __riscv_vfabs_mu(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                              size_t vl);
vfloat16m8_t __riscv_vfabs_mu(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                              size_t vl);
vfloat32mf2_t __riscv_vfabs_mu(vbool64_t vm, vfloat32mf2_t vd,
                               vfloat32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfabs_mu(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                              size_t vl);
vfloat32m2_t __riscv_vfabs_mu(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                              size_t vl);
vfloat32m4_t __riscv_vfabs_mu(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                              size_t vl);
vfloat32m8_t __riscv_vfabs_mu(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                              size_t vl);
vfloat64m1_t __riscv_vfabs_mu(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                              size_t vl);
vfloat64m2_t __riscv_vfabs_mu(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                              size_t vl);
vfloat64m4_t __riscv_vfabs_mu(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                              size_t vl);
vfloat64m8_t __riscv_vfabs_mu(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                              size_t vl);

Vector Floating-Point Compare Intrinsics

// masked functions
// Overloaded __riscv_vmfeq_mu prototypes. Every float vector type has a
// vector-vector form (`vs2`, `vs1`) and a vector-scalar form (`vs2`, `rs1`,
// where `rs1` is _Float16, float or double to match the element width).
// The mask `vm`, the operand `vd` and the return value share one vboolN_t type.
// NOTE(review): presumably the "equal" compare under the mask-undisturbed
// policy -- confirm against the RVV specification.
vbool64_t __riscv_vmfeq_mu(vbool64_t vm, vbool64_t vd, vfloat16mf4_t vs2,
                           vfloat16mf4_t vs1, size_t vl);
vbool64_t __riscv_vmfeq_mu(vbool64_t vm, vbool64_t vd, vfloat16mf4_t vs2,
                           _Float16 rs1, size_t vl);
vbool32_t __riscv_vmfeq_mu(vbool32_t vm, vbool32_t vd, vfloat16mf2_t vs2,
                           vfloat16mf2_t vs1, size_t vl);
vbool32_t __riscv_vmfeq_mu(vbool32_t vm, vbool32_t vd, vfloat16mf2_t vs2,
                           _Float16 rs1, size_t vl);
vbool16_t __riscv_vmfeq_mu(vbool16_t vm, vbool16_t vd, vfloat16m1_t vs2,
                           vfloat16m1_t vs1, size_t vl);
vbool16_t __riscv_vmfeq_mu(vbool16_t vm, vbool16_t vd, vfloat16m1_t vs2,
                           _Float16 rs1, size_t vl);
vbool8_t __riscv_vmfeq_mu(vbool8_t vm, vbool8_t vd, vfloat16m2_t vs2,
                          vfloat16m2_t vs1, size_t vl);
vbool8_t __riscv_vmfeq_mu(vbool8_t vm, vbool8_t vd, vfloat16m2_t vs2,
                          _Float16 rs1, size_t vl);
vbool4_t __riscv_vmfeq_mu(vbool4_t vm, vbool4_t vd, vfloat16m4_t vs2,
                          vfloat16m4_t vs1, size_t vl);
vbool4_t __riscv_vmfeq_mu(vbool4_t vm, vbool4_t vd, vfloat16m4_t vs2,
                          _Float16 rs1, size_t vl);
vbool2_t __riscv_vmfeq_mu(vbool2_t vm, vbool2_t vd, vfloat16m8_t vs2,
                          vfloat16m8_t vs1, size_t vl);
vbool2_t __riscv_vmfeq_mu(vbool2_t vm, vbool2_t vd, vfloat16m8_t vs2,
                          _Float16 rs1, size_t vl);
vbool64_t __riscv_vmfeq_mu(vbool64_t vm, vbool64_t vd, vfloat32mf2_t vs2,
                           vfloat32mf2_t vs1, size_t vl);
vbool64_t __riscv_vmfeq_mu(vbool64_t vm, vbool64_t vd, vfloat32mf2_t vs2,
                           float rs1, size_t vl);
vbool32_t __riscv_vmfeq_mu(vbool32_t vm, vbool32_t vd, vfloat32m1_t vs2,
                           vfloat32m1_t vs1, size_t vl);
vbool32_t __riscv_vmfeq_mu(vbool32_t vm, vbool32_t vd, vfloat32m1_t vs2,
                           float rs1, size_t vl);
vbool16_t __riscv_vmfeq_mu(vbool16_t vm, vbool16_t vd, vfloat32m2_t vs2,
                           vfloat32m2_t vs1, size_t vl);
vbool16_t __riscv_vmfeq_mu(vbool16_t vm, vbool16_t vd, vfloat32m2_t vs2,
                           float rs1, size_t vl);
vbool8_t __riscv_vmfeq_mu(vbool8_t vm, vbool8_t vd, vfloat32m4_t vs2,
                          vfloat32m4_t vs1, size_t vl);
vbool8_t __riscv_vmfeq_mu(vbool8_t vm, vbool8_t vd, vfloat32m4_t vs2, float rs1,
                          size_t vl);
vbool4_t __riscv_vmfeq_mu(vbool4_t vm, vbool4_t vd, vfloat32m8_t vs2,
                          vfloat32m8_t vs1, size_t vl);
vbool4_t __riscv_vmfeq_mu(vbool4_t vm, vbool4_t vd, vfloat32m8_t vs2, float rs1,
                          size_t vl);
vbool64_t __riscv_vmfeq_mu(vbool64_t vm, vbool64_t vd, vfloat64m1_t vs2,
                           vfloat64m1_t vs1, size_t vl);
vbool64_t __riscv_vmfeq_mu(vbool64_t vm, vbool64_t vd, vfloat64m1_t vs2,
                           double rs1, size_t vl);
vbool32_t __riscv_vmfeq_mu(vbool32_t vm, vbool32_t vd, vfloat64m2_t vs2,
                           vfloat64m2_t vs1, size_t vl);
vbool32_t __riscv_vmfeq_mu(vbool32_t vm, vbool32_t vd, vfloat64m2_t vs2,
                           double rs1, size_t vl);
vbool16_t __riscv_vmfeq_mu(vbool16_t vm, vbool16_t vd, vfloat64m4_t vs2,
                           vfloat64m4_t vs1, size_t vl);
vbool16_t __riscv_vmfeq_mu(vbool16_t vm, vbool16_t vd, vfloat64m4_t vs2,
                           double rs1, size_t vl);
vbool8_t __riscv_vmfeq_mu(vbool8_t vm, vbool8_t vd, vfloat64m8_t vs2,
                          vfloat64m8_t vs1, size_t vl);
vbool8_t __riscv_vmfeq_mu(vbool8_t vm, vbool8_t vd, vfloat64m8_t vs2,
                          double rs1, size_t vl);
// Overloaded __riscv_vmfne_mu prototypes. Every float vector type has a
// vector-vector form (`vs2`, `vs1`) and a vector-scalar form (`vs2`, `rs1`,
// where `rs1` is _Float16, float or double to match the element width).
// The mask `vm`, the operand `vd` and the return value share one vboolN_t type.
// NOTE(review): presumably the "not equal" compare under the mask-undisturbed
// policy -- confirm against the RVV specification.
vbool64_t __riscv_vmfne_mu(vbool64_t vm, vbool64_t vd, vfloat16mf4_t vs2,
                           vfloat16mf4_t vs1, size_t vl);
vbool64_t __riscv_vmfne_mu(vbool64_t vm, vbool64_t vd, vfloat16mf4_t vs2,
                           _Float16 rs1, size_t vl);
vbool32_t __riscv_vmfne_mu(vbool32_t vm, vbool32_t vd, vfloat16mf2_t vs2,
                           vfloat16mf2_t vs1, size_t vl);
vbool32_t __riscv_vmfne_mu(vbool32_t vm, vbool32_t vd, vfloat16mf2_t vs2,
                           _Float16 rs1, size_t vl);
vbool16_t __riscv_vmfne_mu(vbool16_t vm, vbool16_t vd, vfloat16m1_t vs2,
                           vfloat16m1_t vs1, size_t vl);
vbool16_t __riscv_vmfne_mu(vbool16_t vm, vbool16_t vd, vfloat16m1_t vs2,
                           _Float16 rs1, size_t vl);
vbool8_t __riscv_vmfne_mu(vbool8_t vm, vbool8_t vd, vfloat16m2_t vs2,
                          vfloat16m2_t vs1, size_t vl);
vbool8_t __riscv_vmfne_mu(vbool8_t vm, vbool8_t vd, vfloat16m2_t vs2,
                          _Float16 rs1, size_t vl);
vbool4_t __riscv_vmfne_mu(vbool4_t vm, vbool4_t vd, vfloat16m4_t vs2,
                          vfloat16m4_t vs1, size_t vl);
vbool4_t __riscv_vmfne_mu(vbool4_t vm, vbool4_t vd, vfloat16m4_t vs2,
                          _Float16 rs1, size_t vl);
vbool2_t __riscv_vmfne_mu(vbool2_t vm, vbool2_t vd, vfloat16m8_t vs2,
                          vfloat16m8_t vs1, size_t vl);
vbool2_t __riscv_vmfne_mu(vbool2_t vm, vbool2_t vd, vfloat16m8_t vs2,
                          _Float16 rs1, size_t vl);
vbool64_t __riscv_vmfne_mu(vbool64_t vm, vbool64_t vd, vfloat32mf2_t vs2,
                           vfloat32mf2_t vs1, size_t vl);
vbool64_t __riscv_vmfne_mu(vbool64_t vm, vbool64_t vd, vfloat32mf2_t vs2,
                           float rs1, size_t vl);
vbool32_t __riscv_vmfne_mu(vbool32_t vm, vbool32_t vd, vfloat32m1_t vs2,
                           vfloat32m1_t vs1, size_t vl);
vbool32_t __riscv_vmfne_mu(vbool32_t vm, vbool32_t vd, vfloat32m1_t vs2,
                           float rs1, size_t vl);
vbool16_t __riscv_vmfne_mu(vbool16_t vm, vbool16_t vd, vfloat32m2_t vs2,
                           vfloat32m2_t vs1, size_t vl);
vbool16_t __riscv_vmfne_mu(vbool16_t vm, vbool16_t vd, vfloat32m2_t vs2,
                           float rs1, size_t vl);
vbool8_t __riscv_vmfne_mu(vbool8_t vm, vbool8_t vd, vfloat32m4_t vs2,
                          vfloat32m4_t vs1, size_t vl);
vbool8_t __riscv_vmfne_mu(vbool8_t vm, vbool8_t vd, vfloat32m4_t vs2, float rs1,
                          size_t vl);
vbool4_t __riscv_vmfne_mu(vbool4_t vm, vbool4_t vd, vfloat32m8_t vs2,
                          vfloat32m8_t vs1, size_t vl);
vbool4_t __riscv_vmfne_mu(vbool4_t vm, vbool4_t vd, vfloat32m8_t vs2, float rs1,
                          size_t vl);
vbool64_t __riscv_vmfne_mu(vbool64_t vm, vbool64_t vd, vfloat64m1_t vs2,
                           vfloat64m1_t vs1, size_t vl);
vbool64_t __riscv_vmfne_mu(vbool64_t vm, vbool64_t vd, vfloat64m1_t vs2,
                           double rs1, size_t vl);
vbool32_t __riscv_vmfne_mu(vbool32_t vm, vbool32_t vd, vfloat64m2_t vs2,
                           vfloat64m2_t vs1, size_t vl);
vbool32_t __riscv_vmfne_mu(vbool32_t vm, vbool32_t vd, vfloat64m2_t vs2,
                           double rs1, size_t vl);
vbool16_t __riscv_vmfne_mu(vbool16_t vm, vbool16_t vd, vfloat64m4_t vs2,
                           vfloat64m4_t vs1, size_t vl);
vbool16_t __riscv_vmfne_mu(vbool16_t vm, vbool16_t vd, vfloat64m4_t vs2,
                           double rs1, size_t vl);
vbool8_t __riscv_vmfne_mu(vbool8_t vm, vbool8_t vd, vfloat64m8_t vs2,
                          vfloat64m8_t vs1, size_t vl);
vbool8_t __riscv_vmfne_mu(vbool8_t vm, vbool8_t vd, vfloat64m8_t vs2,
                          double rs1, size_t vl);
// Overloaded __riscv_vmflt_mu prototypes. Every float vector type has a
// vector-vector form (`vs2`, `vs1`) and a vector-scalar form (`vs2`, `rs1`,
// where `rs1` is _Float16, float or double to match the element width).
// The mask `vm`, the operand `vd` and the return value share one vboolN_t type.
// NOTE(review): presumably the "less than" compare under the mask-undisturbed
// policy -- confirm against the RVV specification.
vbool64_t __riscv_vmflt_mu(vbool64_t vm, vbool64_t vd, vfloat16mf4_t vs2,
                           vfloat16mf4_t vs1, size_t vl);
vbool64_t __riscv_vmflt_mu(vbool64_t vm, vbool64_t vd, vfloat16mf4_t vs2,
                           _Float16 rs1, size_t vl);
vbool32_t __riscv_vmflt_mu(vbool32_t vm, vbool32_t vd, vfloat16mf2_t vs2,
                           vfloat16mf2_t vs1, size_t vl);
vbool32_t __riscv_vmflt_mu(vbool32_t vm, vbool32_t vd, vfloat16mf2_t vs2,
                           _Float16 rs1, size_t vl);
vbool16_t __riscv_vmflt_mu(vbool16_t vm, vbool16_t vd, vfloat16m1_t vs2,
                           vfloat16m1_t vs1, size_t vl);
vbool16_t __riscv_vmflt_mu(vbool16_t vm, vbool16_t vd, vfloat16m1_t vs2,
                           _Float16 rs1, size_t vl);
vbool8_t __riscv_vmflt_mu(vbool8_t vm, vbool8_t vd, vfloat16m2_t vs2,
                          vfloat16m2_t vs1, size_t vl);
vbool8_t __riscv_vmflt_mu(vbool8_t vm, vbool8_t vd, vfloat16m2_t vs2,
                          _Float16 rs1, size_t vl);
vbool4_t __riscv_vmflt_mu(vbool4_t vm, vbool4_t vd, vfloat16m4_t vs2,
                          vfloat16m4_t vs1, size_t vl);
vbool4_t __riscv_vmflt_mu(vbool4_t vm, vbool4_t vd, vfloat16m4_t vs2,
                          _Float16 rs1, size_t vl);
vbool2_t __riscv_vmflt_mu(vbool2_t vm, vbool2_t vd, vfloat16m8_t vs2,
                          vfloat16m8_t vs1, size_t vl);
vbool2_t __riscv_vmflt_mu(vbool2_t vm, vbool2_t vd, vfloat16m8_t vs2,
                          _Float16 rs1, size_t vl);
vbool64_t __riscv_vmflt_mu(vbool64_t vm, vbool64_t vd, vfloat32mf2_t vs2,
                           vfloat32mf2_t vs1, size_t vl);
vbool64_t __riscv_vmflt_mu(vbool64_t vm, vbool64_t vd, vfloat32mf2_t vs2,
                           float rs1, size_t vl);
vbool32_t __riscv_vmflt_mu(vbool32_t vm, vbool32_t vd, vfloat32m1_t vs2,
                           vfloat32m1_t vs1, size_t vl);
vbool32_t __riscv_vmflt_mu(vbool32_t vm, vbool32_t vd, vfloat32m1_t vs2,
                           float rs1, size_t vl);
vbool16_t __riscv_vmflt_mu(vbool16_t vm, vbool16_t vd, vfloat32m2_t vs2,
                           vfloat32m2_t vs1, size_t vl);
vbool16_t __riscv_vmflt_mu(vbool16_t vm, vbool16_t vd, vfloat32m2_t vs2,
                           float rs1, size_t vl);
vbool8_t __riscv_vmflt_mu(vbool8_t vm, vbool8_t vd, vfloat32m4_t vs2,
                          vfloat32m4_t vs1, size_t vl);
vbool8_t __riscv_vmflt_mu(vbool8_t vm, vbool8_t vd, vfloat32m4_t vs2, float rs1,
                          size_t vl);
vbool4_t __riscv_vmflt_mu(vbool4_t vm, vbool4_t vd, vfloat32m8_t vs2,
                          vfloat32m8_t vs1, size_t vl);
vbool4_t __riscv_vmflt_mu(vbool4_t vm, vbool4_t vd, vfloat32m8_t vs2, float rs1,
                          size_t vl);
vbool64_t __riscv_vmflt_mu(vbool64_t vm, vbool64_t vd, vfloat64m1_t vs2,
                           vfloat64m1_t vs1, size_t vl);
vbool64_t __riscv_vmflt_mu(vbool64_t vm, vbool64_t vd, vfloat64m1_t vs2,
                           double rs1, size_t vl);
vbool32_t __riscv_vmflt_mu(vbool32_t vm, vbool32_t vd, vfloat64m2_t vs2,
                           vfloat64m2_t vs1, size_t vl);
vbool32_t __riscv_vmflt_mu(vbool32_t vm, vbool32_t vd, vfloat64m2_t vs2,
                           double rs1, size_t vl);
vbool16_t __riscv_vmflt_mu(vbool16_t vm, vbool16_t vd, vfloat64m4_t vs2,
                           vfloat64m4_t vs1, size_t vl);
vbool16_t __riscv_vmflt_mu(vbool16_t vm, vbool16_t vd, vfloat64m4_t vs2,
                           double rs1, size_t vl);
vbool8_t __riscv_vmflt_mu(vbool8_t vm, vbool8_t vd, vfloat64m8_t vs2,
                          vfloat64m8_t vs1, size_t vl);
vbool8_t __riscv_vmflt_mu(vbool8_t vm, vbool8_t vd, vfloat64m8_t vs2,
                          double rs1, size_t vl);
// Overloaded __riscv_vmfle_mu prototypes. Every float vector type has a
// vector-vector form (`vs2`, `vs1`) and a vector-scalar form (`vs2`, `rs1`,
// where `rs1` is _Float16, float or double to match the element width).
// The mask `vm`, the operand `vd` and the return value share one vboolN_t type.
// NOTE(review): presumably the "less than or equal" compare under the
// mask-undisturbed policy -- confirm against the RVV specification.
vbool64_t __riscv_vmfle_mu(vbool64_t vm, vbool64_t vd, vfloat16mf4_t vs2,
                           vfloat16mf4_t vs1, size_t vl);
vbool64_t __riscv_vmfle_mu(vbool64_t vm, vbool64_t vd, vfloat16mf4_t vs2,
                           _Float16 rs1, size_t vl);
vbool32_t __riscv_vmfle_mu(vbool32_t vm, vbool32_t vd, vfloat16mf2_t vs2,
                           vfloat16mf2_t vs1, size_t vl);
vbool32_t __riscv_vmfle_mu(vbool32_t vm, vbool32_t vd, vfloat16mf2_t vs2,
                           _Float16 rs1, size_t vl);
vbool16_t __riscv_vmfle_mu(vbool16_t vm, vbool16_t vd, vfloat16m1_t vs2,
                           vfloat16m1_t vs1, size_t vl);
vbool16_t __riscv_vmfle_mu(vbool16_t vm, vbool16_t vd, vfloat16m1_t vs2,
                           _Float16 rs1, size_t vl);
vbool8_t __riscv_vmfle_mu(vbool8_t vm, vbool8_t vd, vfloat16m2_t vs2,
                          vfloat16m2_t vs1, size_t vl);
vbool8_t __riscv_vmfle_mu(vbool8_t vm, vbool8_t vd, vfloat16m2_t vs2,
                          _Float16 rs1, size_t vl);
vbool4_t __riscv_vmfle_mu(vbool4_t vm, vbool4_t vd, vfloat16m4_t vs2,
                          vfloat16m4_t vs1, size_t vl);
vbool4_t __riscv_vmfle_mu(vbool4_t vm, vbool4_t vd, vfloat16m4_t vs2,
                          _Float16 rs1, size_t vl);
vbool2_t __riscv_vmfle_mu(vbool2_t vm, vbool2_t vd, vfloat16m8_t vs2,
                          vfloat16m8_t vs1, size_t vl);
vbool2_t __riscv_vmfle_mu(vbool2_t vm, vbool2_t vd, vfloat16m8_t vs2,
                          _Float16 rs1, size_t vl);
vbool64_t __riscv_vmfle_mu(vbool64_t vm, vbool64_t vd, vfloat32mf2_t vs2,
                           vfloat32mf2_t vs1, size_t vl);
vbool64_t __riscv_vmfle_mu(vbool64_t vm, vbool64_t vd, vfloat32mf2_t vs2,
                           float rs1, size_t vl);
vbool32_t __riscv_vmfle_mu(vbool32_t vm, vbool32_t vd, vfloat32m1_t vs2,
                           vfloat32m1_t vs1, size_t vl);
vbool32_t __riscv_vmfle_mu(vbool32_t vm, vbool32_t vd, vfloat32m1_t vs2,
                           float rs1, size_t vl);
vbool16_t __riscv_vmfle_mu(vbool16_t vm, vbool16_t vd, vfloat32m2_t vs2,
                           vfloat32m2_t vs1, size_t vl);
vbool16_t __riscv_vmfle_mu(vbool16_t vm, vbool16_t vd, vfloat32m2_t vs2,
                           float rs1, size_t vl);
vbool8_t __riscv_vmfle_mu(vbool8_t vm, vbool8_t vd, vfloat32m4_t vs2,
                          vfloat32m4_t vs1, size_t vl);
vbool8_t __riscv_vmfle_mu(vbool8_t vm, vbool8_t vd, vfloat32m4_t vs2, float rs1,
                          size_t vl);
vbool4_t __riscv_vmfle_mu(vbool4_t vm, vbool4_t vd, vfloat32m8_t vs2,
                          vfloat32m8_t vs1, size_t vl);
vbool4_t __riscv_vmfle_mu(vbool4_t vm, vbool4_t vd, vfloat32m8_t vs2, float rs1,
                          size_t vl);
vbool64_t __riscv_vmfle_mu(vbool64_t vm, vbool64_t vd, vfloat64m1_t vs2,
                           vfloat64m1_t vs1, size_t vl);
vbool64_t __riscv_vmfle_mu(vbool64_t vm, vbool64_t vd, vfloat64m1_t vs2,
                           double rs1, size_t vl);
vbool32_t __riscv_vmfle_mu(vbool32_t vm, vbool32_t vd, vfloat64m2_t vs2,
                           vfloat64m2_t vs1, size_t vl);
vbool32_t __riscv_vmfle_mu(vbool32_t vm, vbool32_t vd, vfloat64m2_t vs2,
                           double rs1, size_t vl);
vbool16_t __riscv_vmfle_mu(vbool16_t vm, vbool16_t vd, vfloat64m4_t vs2,
                           vfloat64m4_t vs1, size_t vl);
vbool16_t __riscv_vmfle_mu(vbool16_t vm, vbool16_t vd, vfloat64m4_t vs2,
                           double rs1, size_t vl);
vbool8_t __riscv_vmfle_mu(vbool8_t vm, vbool8_t vd, vfloat64m8_t vs2,
                          vfloat64m8_t vs1, size_t vl);
vbool8_t __riscv_vmfle_mu(vbool8_t vm, vbool8_t vd, vfloat64m8_t vs2,
                          double rs1, size_t vl);
// Overloaded __riscv_vmfgt_mu prototypes. Every float vector type has a
// vector-vector form (`vs2`, `vs1`) and a vector-scalar form (`vs2`, `rs1`,
// where `rs1` is _Float16, float or double to match the element width).
// The mask `vm`, the operand `vd` and the return value share one vboolN_t type.
// NOTE(review): presumably the "greater than" compare under the
// mask-undisturbed policy -- confirm against the RVV specification.
vbool64_t __riscv_vmfgt_mu(vbool64_t vm, vbool64_t vd, vfloat16mf4_t vs2,
                           vfloat16mf4_t vs1, size_t vl);
vbool64_t __riscv_vmfgt_mu(vbool64_t vm, vbool64_t vd, vfloat16mf4_t vs2,
                           _Float16 rs1, size_t vl);
vbool32_t __riscv_vmfgt_mu(vbool32_t vm, vbool32_t vd, vfloat16mf2_t vs2,
                           vfloat16mf2_t vs1, size_t vl);
vbool32_t __riscv_vmfgt_mu(vbool32_t vm, vbool32_t vd, vfloat16mf2_t vs2,
                           _Float16 rs1, size_t vl);
vbool16_t __riscv_vmfgt_mu(vbool16_t vm, vbool16_t vd, vfloat16m1_t vs2,
                           vfloat16m1_t vs1, size_t vl);
vbool16_t __riscv_vmfgt_mu(vbool16_t vm, vbool16_t vd, vfloat16m1_t vs2,
                           _Float16 rs1, size_t vl);
vbool8_t __riscv_vmfgt_mu(vbool8_t vm, vbool8_t vd, vfloat16m2_t vs2,
                          vfloat16m2_t vs1, size_t vl);
vbool8_t __riscv_vmfgt_mu(vbool8_t vm, vbool8_t vd, vfloat16m2_t vs2,
                          _Float16 rs1, size_t vl);
vbool4_t __riscv_vmfgt_mu(vbool4_t vm, vbool4_t vd, vfloat16m4_t vs2,
                          vfloat16m4_t vs1, size_t vl);
vbool4_t __riscv_vmfgt_mu(vbool4_t vm, vbool4_t vd, vfloat16m4_t vs2,
                          _Float16 rs1, size_t vl);
vbool2_t __riscv_vmfgt_mu(vbool2_t vm, vbool2_t vd, vfloat16m8_t vs2,
                          vfloat16m8_t vs1, size_t vl);
vbool2_t __riscv_vmfgt_mu(vbool2_t vm, vbool2_t vd, vfloat16m8_t vs2,
                          _Float16 rs1, size_t vl);
vbool64_t __riscv_vmfgt_mu(vbool64_t vm, vbool64_t vd, vfloat32mf2_t vs2,
                           vfloat32mf2_t vs1, size_t vl);
vbool64_t __riscv_vmfgt_mu(vbool64_t vm, vbool64_t vd, vfloat32mf2_t vs2,
                           float rs1, size_t vl);
vbool32_t __riscv_vmfgt_mu(vbool32_t vm, vbool32_t vd, vfloat32m1_t vs2,
                           vfloat32m1_t vs1, size_t vl);
vbool32_t __riscv_vmfgt_mu(vbool32_t vm, vbool32_t vd, vfloat32m1_t vs2,
                           float rs1, size_t vl);
vbool16_t __riscv_vmfgt_mu(vbool16_t vm, vbool16_t vd, vfloat32m2_t vs2,
                           vfloat32m2_t vs1, size_t vl);
vbool16_t __riscv_vmfgt_mu(vbool16_t vm, vbool16_t vd, vfloat32m2_t vs2,
                           float rs1, size_t vl);
vbool8_t __riscv_vmfgt_mu(vbool8_t vm, vbool8_t vd, vfloat32m4_t vs2,
                          vfloat32m4_t vs1, size_t vl);
vbool8_t __riscv_vmfgt_mu(vbool8_t vm, vbool8_t vd, vfloat32m4_t vs2, float rs1,
                          size_t vl);
vbool4_t __riscv_vmfgt_mu(vbool4_t vm, vbool4_t vd, vfloat32m8_t vs2,
                          vfloat32m8_t vs1, size_t vl);
vbool4_t __riscv_vmfgt_mu(vbool4_t vm, vbool4_t vd, vfloat32m8_t vs2, float rs1,
                          size_t vl);
vbool64_t __riscv_vmfgt_mu(vbool64_t vm, vbool64_t vd, vfloat64m1_t vs2,
                           vfloat64m1_t vs1, size_t vl);
vbool64_t __riscv_vmfgt_mu(vbool64_t vm, vbool64_t vd, vfloat64m1_t vs2,
                           double rs1, size_t vl);
vbool32_t __riscv_vmfgt_mu(vbool32_t vm, vbool32_t vd, vfloat64m2_t vs2,
                           vfloat64m2_t vs1, size_t vl);
vbool32_t __riscv_vmfgt_mu(vbool32_t vm, vbool32_t vd, vfloat64m2_t vs2,
                           double rs1, size_t vl);
vbool16_t __riscv_vmfgt_mu(vbool16_t vm, vbool16_t vd, vfloat64m4_t vs2,
                           vfloat64m4_t vs1, size_t vl);
vbool16_t __riscv_vmfgt_mu(vbool16_t vm, vbool16_t vd, vfloat64m4_t vs2,
                           double rs1, size_t vl);
vbool8_t __riscv_vmfgt_mu(vbool8_t vm, vbool8_t vd, vfloat64m8_t vs2,
                          vfloat64m8_t vs1, size_t vl);
vbool8_t __riscv_vmfgt_mu(vbool8_t vm, vbool8_t vd, vfloat64m8_t vs2,
                          double rs1, size_t vl);
// Overloaded __riscv_vmfge_mu prototypes. Every float vector type has a
// vector-vector form (`vs2`, `vs1`) and a vector-scalar form (`vs2`, `rs1`,
// where `rs1` is _Float16, float or double to match the element width).
// The mask `vm`, the operand `vd` and the return value share one vboolN_t type.
// NOTE(review): presumably the "greater than or equal" compare under the
// mask-undisturbed policy -- confirm against the RVV specification.
vbool64_t __riscv_vmfge_mu(vbool64_t vm, vbool64_t vd, vfloat16mf4_t vs2,
                           vfloat16mf4_t vs1, size_t vl);
vbool64_t __riscv_vmfge_mu(vbool64_t vm, vbool64_t vd, vfloat16mf4_t vs2,
                           _Float16 rs1, size_t vl);
vbool32_t __riscv_vmfge_mu(vbool32_t vm, vbool32_t vd, vfloat16mf2_t vs2,
                           vfloat16mf2_t vs1, size_t vl);
vbool32_t __riscv_vmfge_mu(vbool32_t vm, vbool32_t vd, vfloat16mf2_t vs2,
                           _Float16 rs1, size_t vl);
vbool16_t __riscv_vmfge_mu(vbool16_t vm, vbool16_t vd, vfloat16m1_t vs2,
                           vfloat16m1_t vs1, size_t vl);
vbool16_t __riscv_vmfge_mu(vbool16_t vm, vbool16_t vd, vfloat16m1_t vs2,
                           _Float16 rs1, size_t vl);
vbool8_t __riscv_vmfge_mu(vbool8_t vm, vbool8_t vd, vfloat16m2_t vs2,
                          vfloat16m2_t vs1, size_t vl);
vbool8_t __riscv_vmfge_mu(vbool8_t vm, vbool8_t vd, vfloat16m2_t vs2,
                          _Float16 rs1, size_t vl);
vbool4_t __riscv_vmfge_mu(vbool4_t vm, vbool4_t vd, vfloat16m4_t vs2,
                          vfloat16m4_t vs1, size_t vl);
vbool4_t __riscv_vmfge_mu(vbool4_t vm, vbool4_t vd, vfloat16m4_t vs2,
                          _Float16 rs1, size_t vl);
vbool2_t __riscv_vmfge_mu(vbool2_t vm, vbool2_t vd, vfloat16m8_t vs2,
                          vfloat16m8_t vs1, size_t vl);
vbool2_t __riscv_vmfge_mu(vbool2_t vm, vbool2_t vd, vfloat16m8_t vs2,
                          _Float16 rs1, size_t vl);
vbool64_t __riscv_vmfge_mu(vbool64_t vm, vbool64_t vd, vfloat32mf2_t vs2,
                           vfloat32mf2_t vs1, size_t vl);
vbool64_t __riscv_vmfge_mu(vbool64_t vm, vbool64_t vd, vfloat32mf2_t vs2,
                           float rs1, size_t vl);
vbool32_t __riscv_vmfge_mu(vbool32_t vm, vbool32_t vd, vfloat32m1_t vs2,
                           vfloat32m1_t vs1, size_t vl);
vbool32_t __riscv_vmfge_mu(vbool32_t vm, vbool32_t vd, vfloat32m1_t vs2,
                           float rs1, size_t vl);
vbool16_t __riscv_vmfge_mu(vbool16_t vm, vbool16_t vd, vfloat32m2_t vs2,
                           vfloat32m2_t vs1, size_t vl);
vbool16_t __riscv_vmfge_mu(vbool16_t vm, vbool16_t vd, vfloat32m2_t vs2,
                           float rs1, size_t vl);
vbool8_t __riscv_vmfge_mu(vbool8_t vm, vbool8_t vd, vfloat32m4_t vs2,
                          vfloat32m4_t vs1, size_t vl);
vbool8_t __riscv_vmfge_mu(vbool8_t vm, vbool8_t vd, vfloat32m4_t vs2, float rs1,
                          size_t vl);
vbool4_t __riscv_vmfge_mu(vbool4_t vm, vbool4_t vd, vfloat32m8_t vs2,
                          vfloat32m8_t vs1, size_t vl);
vbool4_t __riscv_vmfge_mu(vbool4_t vm, vbool4_t vd, vfloat32m8_t vs2, float rs1,
                          size_t vl);
vbool64_t __riscv_vmfge_mu(vbool64_t vm, vbool64_t vd, vfloat64m1_t vs2,
                           vfloat64m1_t vs1, size_t vl);
vbool64_t __riscv_vmfge_mu(vbool64_t vm, vbool64_t vd, vfloat64m1_t vs2,
                           double rs1, size_t vl);
vbool32_t __riscv_vmfge_mu(vbool32_t vm, vbool32_t vd, vfloat64m2_t vs2,
                           vfloat64m2_t vs1, size_t vl);
vbool32_t __riscv_vmfge_mu(vbool32_t vm, vbool32_t vd, vfloat64m2_t vs2,
                           double rs1, size_t vl);
vbool16_t __riscv_vmfge_mu(vbool16_t vm, vbool16_t vd, vfloat64m4_t vs2,
                           vfloat64m4_t vs1, size_t vl);
vbool16_t __riscv_vmfge_mu(vbool16_t vm, vbool16_t vd, vfloat64m4_t vs2,
                           double rs1, size_t vl);
vbool8_t __riscv_vmfge_mu(vbool8_t vm, vbool8_t vd, vfloat64m8_t vs2,
                          vfloat64m8_t vs1, size_t vl);
vbool8_t __riscv_vmfge_mu(vbool8_t vm, vbool8_t vd, vfloat64m8_t vs2,
                          double rs1, size_t vl);

Vector Floating-Point Classify Intrinsics

// Overloaded __riscv_vfclass_tu prototypes (no mask parameter). Each takes a
// destination operand `vd`, a float source `vs2` and `vl`. The result is the
// unsigned-integer vector type whose element width and LMUL suffix match the
// source, e.g. vfloat16mf4_t -> vuint16mf4_t.
// NOTE(review): the `_tu` suffix presumably selects the tail-undisturbed
// policy -- confirm against the RVV specification.
vuint16mf4_t __riscv_vfclass_tu(vuint16mf4_t vd, vfloat16mf4_t vs2, size_t vl);
vuint16mf2_t __riscv_vfclass_tu(vuint16mf2_t vd, vfloat16mf2_t vs2, size_t vl);
vuint16m1_t __riscv_vfclass_tu(vuint16m1_t vd, vfloat16m1_t vs2, size_t vl);
vuint16m2_t __riscv_vfclass_tu(vuint16m2_t vd, vfloat16m2_t vs2, size_t vl);
vuint16m4_t __riscv_vfclass_tu(vuint16m4_t vd, vfloat16m4_t vs2, size_t vl);
vuint16m8_t __riscv_vfclass_tu(vuint16m8_t vd, vfloat16m8_t vs2, size_t vl);
vuint32mf2_t __riscv_vfclass_tu(vuint32mf2_t vd, vfloat32mf2_t vs2, size_t vl);
vuint32m1_t __riscv_vfclass_tu(vuint32m1_t vd, vfloat32m1_t vs2, size_t vl);
vuint32m2_t __riscv_vfclass_tu(vuint32m2_t vd, vfloat32m2_t vs2, size_t vl);
vuint32m4_t __riscv_vfclass_tu(vuint32m4_t vd, vfloat32m4_t vs2, size_t vl);
vuint32m8_t __riscv_vfclass_tu(vuint32m8_t vd, vfloat32m8_t vs2, size_t vl);
vuint64m1_t __riscv_vfclass_tu(vuint64m1_t vd, vfloat64m1_t vs2, size_t vl);
vuint64m2_t __riscv_vfclass_tu(vuint64m2_t vd, vfloat64m2_t vs2, size_t vl);
vuint64m4_t __riscv_vfclass_tu(vuint64m4_t vd, vfloat64m4_t vs2, size_t vl);
vuint64m8_t __riscv_vfclass_tu(vuint64m8_t vd, vfloat64m8_t vs2, size_t vl);
// masked functions
// Overloaded __riscv_vfclass_tum prototypes. Each takes a mask `vm`, a
// destination operand `vd`, a float source `vs2` and `vl`. The result is the
// unsigned-integer vector type whose element width and LMUL suffix match the
// source, e.g. vfloat16mf4_t -> vuint16mf4_t.
// NOTE(review): the `_tum` suffix presumably selects the tail-undisturbed,
// mask-agnostic policy -- confirm against the RVV specification.
vuint16mf4_t __riscv_vfclass_tum(vbool64_t vm, vuint16mf4_t vd,
                                 vfloat16mf4_t vs2, size_t vl);
vuint16mf2_t __riscv_vfclass_tum(vbool32_t vm, vuint16mf2_t vd,
                                 vfloat16mf2_t vs2, size_t vl);
vuint16m1_t __riscv_vfclass_tum(vbool16_t vm, vuint16m1_t vd, vfloat16m1_t vs2,
                                size_t vl);
vuint16m2_t __riscv_vfclass_tum(vbool8_t vm, vuint16m2_t vd, vfloat16m2_t vs2,
                                size_t vl);
vuint16m4_t __riscv_vfclass_tum(vbool4_t vm, vuint16m4_t vd, vfloat16m4_t vs2,
                                size_t vl);
vuint16m8_t __riscv_vfclass_tum(vbool2_t vm, vuint16m8_t vd, vfloat16m8_t vs2,
                                size_t vl);
vuint32mf2_t __riscv_vfclass_tum(vbool64_t vm, vuint32mf2_t vd,
                                 vfloat32mf2_t vs2, size_t vl);
vuint32m1_t __riscv_vfclass_tum(vbool32_t vm, vuint32m1_t vd, vfloat32m1_t vs2,
                                size_t vl);
vuint32m2_t __riscv_vfclass_tum(vbool16_t vm, vuint32m2_t vd, vfloat32m2_t vs2,
                                size_t vl);
vuint32m4_t __riscv_vfclass_tum(vbool8_t vm, vuint32m4_t vd, vfloat32m4_t vs2,
                                size_t vl);
vuint32m8_t __riscv_vfclass_tum(vbool4_t vm, vuint32m8_t vd, vfloat32m8_t vs2,
                                size_t vl);
vuint64m1_t __riscv_vfclass_tum(vbool64_t vm, vuint64m1_t vd, vfloat64m1_t vs2,
                                size_t vl);
vuint64m2_t __riscv_vfclass_tum(vbool32_t vm, vuint64m2_t vd, vfloat64m2_t vs2,
                                size_t vl);
vuint64m4_t __riscv_vfclass_tum(vbool16_t vm, vuint64m4_t vd, vfloat64m4_t vs2,
                                size_t vl);
vuint64m8_t __riscv_vfclass_tum(vbool8_t vm, vuint64m8_t vd, vfloat64m8_t vs2,
                                size_t vl);
// masked functions
// Overloaded __riscv_vfclass_tumu prototypes. Each takes a mask `vm`, a
// destination operand `vd`, a float source `vs2` and `vl`. The result is the
// unsigned-integer vector type whose element width and LMUL suffix match the
// source, e.g. vfloat16mf4_t -> vuint16mf4_t.
// NOTE(review): the `_tumu` suffix presumably selects the tail-undisturbed,
// mask-undisturbed policy -- confirm against the RVV specification.
vuint16mf4_t __riscv_vfclass_tumu(vbool64_t vm, vuint16mf4_t vd,
                                  vfloat16mf4_t vs2, size_t vl);
vuint16mf2_t __riscv_vfclass_tumu(vbool32_t vm, vuint16mf2_t vd,
                                  vfloat16mf2_t vs2, size_t vl);
vuint16m1_t __riscv_vfclass_tumu(vbool16_t vm, vuint16m1_t vd, vfloat16m1_t vs2,
                                 size_t vl);
vuint16m2_t __riscv_vfclass_tumu(vbool8_t vm, vuint16m2_t vd, vfloat16m2_t vs2,
                                 size_t vl);
vuint16m4_t __riscv_vfclass_tumu(vbool4_t vm, vuint16m4_t vd, vfloat16m4_t vs2,
                                 size_t vl);
vuint16m8_t __riscv_vfclass_tumu(vbool2_t vm, vuint16m8_t vd, vfloat16m8_t vs2,
                                 size_t vl);
vuint32mf2_t __riscv_vfclass_tumu(vbool64_t vm, vuint32mf2_t vd,
                                  vfloat32mf2_t vs2, size_t vl);
vuint32m1_t __riscv_vfclass_tumu(vbool32_t vm, vuint32m1_t vd, vfloat32m1_t vs2,
                                 size_t vl);
vuint32m2_t __riscv_vfclass_tumu(vbool16_t vm, vuint32m2_t vd, vfloat32m2_t vs2,
                                 size_t vl);
vuint32m4_t __riscv_vfclass_tumu(vbool8_t vm, vuint32m4_t vd, vfloat32m4_t vs2,
                                 size_t vl);
vuint32m8_t __riscv_vfclass_tumu(vbool4_t vm, vuint32m8_t vd, vfloat32m8_t vs2,
                                 size_t vl);
vuint64m1_t __riscv_vfclass_tumu(vbool64_t vm, vuint64m1_t vd, vfloat64m1_t vs2,
                                 size_t vl);
vuint64m2_t __riscv_vfclass_tumu(vbool32_t vm, vuint64m2_t vd, vfloat64m2_t vs2,
                                 size_t vl);
vuint64m4_t __riscv_vfclass_tumu(vbool16_t vm, vuint64m4_t vd, vfloat64m4_t vs2,
                                 size_t vl);
vuint64m8_t __riscv_vfclass_tumu(vbool8_t vm, vuint64m8_t vd, vfloat64m8_t vs2,
                                 size_t vl);
// masked functions: __riscv_vfclass_mu overloads.
// Each overload takes a mask `vm`, a destination operand `vd` of the same
// type as the return value, a floating-point source `vs2` and the vector
// length `vl`. The result is an unsigned-integer vector with the same element
// width and LMUL as `vs2`; the mask type is vboolN_t with
// N = element width / LMUL (e.g. vbool64_t for 16mf4, vbool2_t for 16m8).
// NOTE(review): `_mu` presumably selects the mask-undisturbed (tail-agnostic)
// policy -- confirm against the RISC-V V specification.
vuint16mf4_t __riscv_vfclass_mu(vbool64_t vm, vuint16mf4_t vd,
                                vfloat16mf4_t vs2, size_t vl);
vuint16mf2_t __riscv_vfclass_mu(vbool32_t vm, vuint16mf2_t vd,
                                vfloat16mf2_t vs2, size_t vl);
vuint16m1_t __riscv_vfclass_mu(vbool16_t vm, vuint16m1_t vd, vfloat16m1_t vs2,
                               size_t vl);
vuint16m2_t __riscv_vfclass_mu(vbool8_t vm, vuint16m2_t vd, vfloat16m2_t vs2,
                               size_t vl);
vuint16m4_t __riscv_vfclass_mu(vbool4_t vm, vuint16m4_t vd, vfloat16m4_t vs2,
                               size_t vl);
vuint16m8_t __riscv_vfclass_mu(vbool2_t vm, vuint16m8_t vd, vfloat16m8_t vs2,
                               size_t vl);
vuint32mf2_t __riscv_vfclass_mu(vbool64_t vm, vuint32mf2_t vd,
                                vfloat32mf2_t vs2, size_t vl);
vuint32m1_t __riscv_vfclass_mu(vbool32_t vm, vuint32m1_t vd, vfloat32m1_t vs2,
                               size_t vl);
vuint32m2_t __riscv_vfclass_mu(vbool16_t vm, vuint32m2_t vd, vfloat32m2_t vs2,
                               size_t vl);
vuint32m4_t __riscv_vfclass_mu(vbool8_t vm, vuint32m4_t vd, vfloat32m4_t vs2,
                               size_t vl);
vuint32m8_t __riscv_vfclass_mu(vbool4_t vm, vuint32m8_t vd, vfloat32m8_t vs2,
                               size_t vl);
vuint64m1_t __riscv_vfclass_mu(vbool64_t vm, vuint64m1_t vd, vfloat64m1_t vs2,
                               size_t vl);
vuint64m2_t __riscv_vfclass_mu(vbool32_t vm, vuint64m2_t vd, vfloat64m2_t vs2,
                               size_t vl);
vuint64m4_t __riscv_vfclass_mu(vbool16_t vm, vuint64m4_t vd, vfloat64m4_t vs2,
                               size_t vl);
vuint64m8_t __riscv_vfclass_mu(vbool8_t vm, vuint64m8_t vd, vfloat64m8_t vs2,
                               size_t vl);

Vector Floating-Point Merge Intrinsics

// Overloads come in pairs per vector type:
//   __riscv_vmerge_tu  - vector-vector form, second source is the vector `vs1`
//   __riscv_vfmerge_tu - vector-scalar form, second source is the scalar `rs1`
//                        (_Float16, float or double, matching the element
//                        width)
// Both forms also take the destination operand `vd` (same type as the return
// value), the source `vs2`, the mask `v0` and the vector length `vl`.
// NOTE(review): `_tu` presumably denotes the tail-undisturbed policy, and
// which source a set bit of `v0` selects is not visible here -- confirm
// against the RISC-V V specification.
vfloat16mf4_t __riscv_vmerge_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                vfloat16mf4_t vs1, vbool64_t v0, size_t vl);
vfloat16mf4_t __riscv_vfmerge_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                 _Float16 rs1, vbool64_t v0, size_t vl);
vfloat16mf2_t __riscv_vmerge_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                vfloat16mf2_t vs1, vbool32_t v0, size_t vl);
vfloat16mf2_t __riscv_vfmerge_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                 _Float16 rs1, vbool32_t v0, size_t vl);
vfloat16m1_t __riscv_vmerge_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                               vfloat16m1_t vs1, vbool16_t v0, size_t vl);
vfloat16m1_t __riscv_vfmerge_tu(vfloat16m1_t vd, vfloat16m1_t vs2, _Float16 rs1,
                                vbool16_t v0, size_t vl);
vfloat16m2_t __riscv_vmerge_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                               vfloat16m2_t vs1, vbool8_t v0, size_t vl);
vfloat16m2_t __riscv_vfmerge_tu(vfloat16m2_t vd, vfloat16m2_t vs2, _Float16 rs1,
                                vbool8_t v0, size_t vl);
vfloat16m4_t __riscv_vmerge_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                               vfloat16m4_t vs1, vbool4_t v0, size_t vl);
vfloat16m4_t __riscv_vfmerge_tu(vfloat16m4_t vd, vfloat16m4_t vs2, _Float16 rs1,
                                vbool4_t v0, size_t vl);
vfloat16m8_t __riscv_vmerge_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                               vfloat16m8_t vs1, vbool2_t v0, size_t vl);
vfloat16m8_t __riscv_vfmerge_tu(vfloat16m8_t vd, vfloat16m8_t vs2, _Float16 rs1,
                                vbool2_t v0, size_t vl);
vfloat32mf2_t __riscv_vmerge_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                vfloat32mf2_t vs1, vbool64_t v0, size_t vl);
vfloat32mf2_t __riscv_vfmerge_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2, float rs1,
                                 vbool64_t v0, size_t vl);
vfloat32m1_t __riscv_vmerge_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                               vfloat32m1_t vs1, vbool32_t v0, size_t vl);
vfloat32m1_t __riscv_vfmerge_tu(vfloat32m1_t vd, vfloat32m1_t vs2, float rs1,
                                vbool32_t v0, size_t vl);
vfloat32m2_t __riscv_vmerge_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                               vfloat32m2_t vs1, vbool16_t v0, size_t vl);
vfloat32m2_t __riscv_vfmerge_tu(vfloat32m2_t vd, vfloat32m2_t vs2, float rs1,
                                vbool16_t v0, size_t vl);
vfloat32m4_t __riscv_vmerge_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                               vfloat32m4_t vs1, vbool8_t v0, size_t vl);
vfloat32m4_t __riscv_vfmerge_tu(vfloat32m4_t vd, vfloat32m4_t vs2, float rs1,
                                vbool8_t v0, size_t vl);
vfloat32m8_t __riscv_vmerge_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                               vfloat32m8_t vs1, vbool4_t v0, size_t vl);
vfloat32m8_t __riscv_vfmerge_tu(vfloat32m8_t vd, vfloat32m8_t vs2, float rs1,
                                vbool4_t v0, size_t vl);
vfloat64m1_t __riscv_vmerge_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                               vfloat64m1_t vs1, vbool64_t v0, size_t vl);
vfloat64m1_t __riscv_vfmerge_tu(vfloat64m1_t vd, vfloat64m1_t vs2, double rs1,
                                vbool64_t v0, size_t vl);
vfloat64m2_t __riscv_vmerge_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                               vfloat64m2_t vs1, vbool32_t v0, size_t vl);
vfloat64m2_t __riscv_vfmerge_tu(vfloat64m2_t vd, vfloat64m2_t vs2, double rs1,
                                vbool32_t v0, size_t vl);
vfloat64m4_t __riscv_vmerge_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                               vfloat64m4_t vs1, vbool16_t v0, size_t vl);
vfloat64m4_t __riscv_vfmerge_tu(vfloat64m4_t vd, vfloat64m4_t vs2, double rs1,
                                vbool16_t v0, size_t vl);
vfloat64m8_t __riscv_vmerge_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                               vfloat64m8_t vs1, vbool8_t v0, size_t vl);
vfloat64m8_t __riscv_vfmerge_tu(vfloat64m8_t vd, vfloat64m8_t vs2, double rs1,
                                vbool8_t v0, size_t vl);

Vector Floating-Point Move Intrinsics

// Overloads come in pairs per vector type:
//   __riscv_vmv_v_tu  - source is a vector `vs1` of the same type as `vd`
//   __riscv_vfmv_v_tu - source is a scalar `rs1` (_Float16, float or double,
//                       matching the element width)
// Both forms take the destination operand `vd` (same type as the return
// value) and the vector length `vl`; neither takes a mask.
// NOTE(review): `_tu` presumably denotes the tail-undisturbed policy --
// confirm against the RISC-V V specification.
vfloat16mf4_t __riscv_vmv_v_tu(vfloat16mf4_t vd, vfloat16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vfmv_v_tu(vfloat16mf4_t vd, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vmv_v_tu(vfloat16mf2_t vd, vfloat16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vfmv_v_tu(vfloat16mf2_t vd, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vmv_v_tu(vfloat16m1_t vd, vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfmv_v_tu(vfloat16m1_t vd, _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vmv_v_tu(vfloat16m2_t vd, vfloat16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vfmv_v_tu(vfloat16m2_t vd, _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vmv_v_tu(vfloat16m4_t vd, vfloat16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vfmv_v_tu(vfloat16m4_t vd, _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vmv_v_tu(vfloat16m8_t vd, vfloat16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vfmv_v_tu(vfloat16m8_t vd, _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vmv_v_tu(vfloat32mf2_t vd, vfloat32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vfmv_v_tu(vfloat32mf2_t vd, float rs1, size_t vl);
vfloat32m1_t __riscv_vmv_v_tu(vfloat32m1_t vd, vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfmv_v_tu(vfloat32m1_t vd, float rs1, size_t vl);
vfloat32m2_t __riscv_vmv_v_tu(vfloat32m2_t vd, vfloat32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vfmv_v_tu(vfloat32m2_t vd, float rs1, size_t vl);
vfloat32m4_t __riscv_vmv_v_tu(vfloat32m4_t vd, vfloat32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vfmv_v_tu(vfloat32m4_t vd, float rs1, size_t vl);
vfloat32m8_t __riscv_vmv_v_tu(vfloat32m8_t vd, vfloat32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vfmv_v_tu(vfloat32m8_t vd, float rs1, size_t vl);
vfloat64m1_t __riscv_vmv_v_tu(vfloat64m1_t vd, vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfmv_v_tu(vfloat64m1_t vd, double rs1, size_t vl);
vfloat64m2_t __riscv_vmv_v_tu(vfloat64m2_t vd, vfloat64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vfmv_v_tu(vfloat64m2_t vd, double rs1, size_t vl);
vfloat64m4_t __riscv_vmv_v_tu(vfloat64m4_t vd, vfloat64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vfmv_v_tu(vfloat64m4_t vd, double rs1, size_t vl);
vfloat64m8_t __riscv_vmv_v_tu(vfloat64m8_t vd, vfloat64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vfmv_v_tu(vfloat64m8_t vd, double rs1, size_t vl);

Single-Width Floating-Point/Integer Type-Convert Intrinsics

// 16-bit element conversions, `_tu` overloads (no mask operand). Every
// overload takes the destination operand `vd` (same type as the return
// value), the source `vs2` and the vector length `vl`; source and result
// share the same element width and LMUL.
// NOTE(review): `_tu` presumably denotes the tail-undisturbed policy and
// `rtz` round-towards-zero -- confirm against the RISC-V V specification.
// Floating-point -> signed integer (vfcvt_x / vfcvt_rtz_x).
vint16mf4_t __riscv_vfcvt_x_tu(vint16mf4_t vd, vfloat16mf4_t vs2, size_t vl);
vint16mf4_t __riscv_vfcvt_rtz_x_tu(vint16mf4_t vd, vfloat16mf4_t vs2,
                                   size_t vl);
vint16mf2_t __riscv_vfcvt_x_tu(vint16mf2_t vd, vfloat16mf2_t vs2, size_t vl);
vint16mf2_t __riscv_vfcvt_rtz_x_tu(vint16mf2_t vd, vfloat16mf2_t vs2,
                                   size_t vl);
vint16m1_t __riscv_vfcvt_x_tu(vint16m1_t vd, vfloat16m1_t vs2, size_t vl);
vint16m1_t __riscv_vfcvt_rtz_x_tu(vint16m1_t vd, vfloat16m1_t vs2, size_t vl);
vint16m2_t __riscv_vfcvt_x_tu(vint16m2_t vd, vfloat16m2_t vs2, size_t vl);
vint16m2_t __riscv_vfcvt_rtz_x_tu(vint16m2_t vd, vfloat16m2_t vs2, size_t vl);
vint16m4_t __riscv_vfcvt_x_tu(vint16m4_t vd, vfloat16m4_t vs2, size_t vl);
vint16m4_t __riscv_vfcvt_rtz_x_tu(vint16m4_t vd, vfloat16m4_t vs2, size_t vl);
vint16m8_t __riscv_vfcvt_x_tu(vint16m8_t vd, vfloat16m8_t vs2, size_t vl);
vint16m8_t __riscv_vfcvt_rtz_x_tu(vint16m8_t vd, vfloat16m8_t vs2, size_t vl);
// Floating-point -> unsigned integer (vfcvt_xu / vfcvt_rtz_xu).
vuint16mf4_t __riscv_vfcvt_xu_tu(vuint16mf4_t vd, vfloat16mf4_t vs2, size_t vl);
vuint16mf4_t __riscv_vfcvt_rtz_xu_tu(vuint16mf4_t vd, vfloat16mf4_t vs2,
                                     size_t vl);
vuint16mf2_t __riscv_vfcvt_xu_tu(vuint16mf2_t vd, vfloat16mf2_t vs2, size_t vl);
vuint16mf2_t __riscv_vfcvt_rtz_xu_tu(vuint16mf2_t vd, vfloat16mf2_t vs2,
                                     size_t vl);
vuint16m1_t __riscv_vfcvt_xu_tu(vuint16m1_t vd, vfloat16m1_t vs2, size_t vl);
vuint16m1_t __riscv_vfcvt_rtz_xu_tu(vuint16m1_t vd, vfloat16m1_t vs2,
                                    size_t vl);
vuint16m2_t __riscv_vfcvt_xu_tu(vuint16m2_t vd, vfloat16m2_t vs2, size_t vl);
vuint16m2_t __riscv_vfcvt_rtz_xu_tu(vuint16m2_t vd, vfloat16m2_t vs2,
                                    size_t vl);
vuint16m4_t __riscv_vfcvt_xu_tu(vuint16m4_t vd, vfloat16m4_t vs2, size_t vl);
vuint16m4_t __riscv_vfcvt_rtz_xu_tu(vuint16m4_t vd, vfloat16m4_t vs2,
                                    size_t vl);
vuint16m8_t __riscv_vfcvt_xu_tu(vuint16m8_t vd, vfloat16m8_t vs2, size_t vl);
vuint16m8_t __riscv_vfcvt_rtz_xu_tu(vuint16m8_t vd, vfloat16m8_t vs2,
                                    size_t vl);
// Signed integer -> floating-point (vfcvt_f).
vfloat16mf4_t __riscv_vfcvt_f_tu(vfloat16mf4_t vd, vint16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfcvt_f_tu(vfloat16mf2_t vd, vint16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfcvt_f_tu(vfloat16m1_t vd, vint16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfcvt_f_tu(vfloat16m2_t vd, vint16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfcvt_f_tu(vfloat16m4_t vd, vint16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfcvt_f_tu(vfloat16m8_t vd, vint16m8_t vs2, size_t vl);
// Unsigned integer -> floating-point (vfcvt_f).
vfloat16mf4_t __riscv_vfcvt_f_tu(vfloat16mf4_t vd, vuint16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfcvt_f_tu(vfloat16mf2_t vd, vuint16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfcvt_f_tu(vfloat16m1_t vd, vuint16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfcvt_f_tu(vfloat16m2_t vd, vuint16m2_t vs2, size_t vl);
vfloat16m4_t __riscv_vfcvt_f_tu(vfloat16m4_t vd, vuint16m4_t vs2, size_t vl);
vfloat16m8_t __riscv_vfcvt_f_tu(vfloat16m8_t vd, vuint16m8_t vs2, size_t vl);
// 32-bit element conversions, `_tu` overloads (no mask operand). Every
// overload takes the destination operand `vd` (same type as the return
// value), the source `vs2` and the vector length `vl`; source and result
// share the same element width and LMUL.
// Floating-point -> signed integer (vfcvt_x / vfcvt_rtz_x).
vint32mf2_t __riscv_vfcvt_x_tu(vint32mf2_t vd, vfloat32mf2_t vs2, size_t vl);
vint32mf2_t __riscv_vfcvt_rtz_x_tu(vint32mf2_t vd, vfloat32mf2_t vs2,
                                   size_t vl);
vint32m1_t __riscv_vfcvt_x_tu(vint32m1_t vd, vfloat32m1_t vs2, size_t vl);
vint32m1_t __riscv_vfcvt_rtz_x_tu(vint32m1_t vd, vfloat32m1_t vs2, size_t vl);
vint32m2_t __riscv_vfcvt_x_tu(vint32m2_t vd, vfloat32m2_t vs2, size_t vl);
vint32m2_t __riscv_vfcvt_rtz_x_tu(vint32m2_t vd, vfloat32m2_t vs2, size_t vl);
vint32m4_t __riscv_vfcvt_x_tu(vint32m4_t vd, vfloat32m4_t vs2, size_t vl);
vint32m4_t __riscv_vfcvt_rtz_x_tu(vint32m4_t vd, vfloat32m4_t vs2, size_t vl);
vint32m8_t __riscv_vfcvt_x_tu(vint32m8_t vd, vfloat32m8_t vs2, size_t vl);
vint32m8_t __riscv_vfcvt_rtz_x_tu(vint32m8_t vd, vfloat32m8_t vs2, size_t vl);
// Floating-point -> unsigned integer (vfcvt_xu / vfcvt_rtz_xu).
vuint32mf2_t __riscv_vfcvt_xu_tu(vuint32mf2_t vd, vfloat32mf2_t vs2, size_t vl);
vuint32mf2_t __riscv_vfcvt_rtz_xu_tu(vuint32mf2_t vd, vfloat32mf2_t vs2,
                                     size_t vl);
vuint32m1_t __riscv_vfcvt_xu_tu(vuint32m1_t vd, vfloat32m1_t vs2, size_t vl);
vuint32m1_t __riscv_vfcvt_rtz_xu_tu(vuint32m1_t vd, vfloat32m1_t vs2,
                                    size_t vl);
vuint32m2_t __riscv_vfcvt_xu_tu(vuint32m2_t vd, vfloat32m2_t vs2, size_t vl);
vuint32m2_t __riscv_vfcvt_rtz_xu_tu(vuint32m2_t vd, vfloat32m2_t vs2,
                                    size_t vl);
vuint32m4_t __riscv_vfcvt_xu_tu(vuint32m4_t vd, vfloat32m4_t vs2, size_t vl);
vuint32m4_t __riscv_vfcvt_rtz_xu_tu(vuint32m4_t vd, vfloat32m4_t vs2,
                                    size_t vl);
vuint32m8_t __riscv_vfcvt_xu_tu(vuint32m8_t vd, vfloat32m8_t vs2, size_t vl);
vuint32m8_t __riscv_vfcvt_rtz_xu_tu(vuint32m8_t vd, vfloat32m8_t vs2,
                                    size_t vl);
// Signed integer -> floating-point (vfcvt_f).
vfloat32mf2_t __riscv_vfcvt_f_tu(vfloat32mf2_t vd, vint32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfcvt_f_tu(vfloat32m1_t vd, vint32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfcvt_f_tu(vfloat32m2_t vd, vint32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfcvt_f_tu(vfloat32m4_t vd, vint32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfcvt_f_tu(vfloat32m8_t vd, vint32m8_t vs2, size_t vl);
// Unsigned integer -> floating-point (vfcvt_f).
vfloat32mf2_t __riscv_vfcvt_f_tu(vfloat32mf2_t vd, vuint32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfcvt_f_tu(vfloat32m1_t vd, vuint32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfcvt_f_tu(vfloat32m2_t vd, vuint32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfcvt_f_tu(vfloat32m4_t vd, vuint32m4_t vs2, size_t vl);
vfloat32m8_t __riscv_vfcvt_f_tu(vfloat32m8_t vd, vuint32m8_t vs2, size_t vl);
// 64-bit element conversions, `_tu` overloads (no mask operand). Every
// overload takes the destination operand `vd` (same type as the return
// value), the source `vs2` and the vector length `vl`; source and result
// share the same element width and LMUL.
// Floating-point -> signed integer (vfcvt_x / vfcvt_rtz_x).
vint64m1_t __riscv_vfcvt_x_tu(vint64m1_t vd, vfloat64m1_t vs2, size_t vl);
vint64m1_t __riscv_vfcvt_rtz_x_tu(vint64m1_t vd, vfloat64m1_t vs2, size_t vl);
vint64m2_t __riscv_vfcvt_x_tu(vint64m2_t vd, vfloat64m2_t vs2, size_t vl);
vint64m2_t __riscv_vfcvt_rtz_x_tu(vint64m2_t vd, vfloat64m2_t vs2, size_t vl);
vint64m4_t __riscv_vfcvt_x_tu(vint64m4_t vd, vfloat64m4_t vs2, size_t vl);
vint64m4_t __riscv_vfcvt_rtz_x_tu(vint64m4_t vd, vfloat64m4_t vs2, size_t vl);
vint64m8_t __riscv_vfcvt_x_tu(vint64m8_t vd, vfloat64m8_t vs2, size_t vl);
vint64m8_t __riscv_vfcvt_rtz_x_tu(vint64m8_t vd, vfloat64m8_t vs2, size_t vl);
// Floating-point -> unsigned integer (vfcvt_xu / vfcvt_rtz_xu).
vuint64m1_t __riscv_vfcvt_xu_tu(vuint64m1_t vd, vfloat64m1_t vs2, size_t vl);
vuint64m1_t __riscv_vfcvt_rtz_xu_tu(vuint64m1_t vd, vfloat64m1_t vs2,
                                    size_t vl);
vuint64m2_t __riscv_vfcvt_xu_tu(vuint64m2_t vd, vfloat64m2_t vs2, size_t vl);
vuint64m2_t __riscv_vfcvt_rtz_xu_tu(vuint64m2_t vd, vfloat64m2_t vs2,
                                    size_t vl);
vuint64m4_t __riscv_vfcvt_xu_tu(vuint64m4_t vd, vfloat64m4_t vs2, size_t vl);
vuint64m4_t __riscv_vfcvt_rtz_xu_tu(vuint64m4_t vd, vfloat64m4_t vs2,
                                    size_t vl);
vuint64m8_t __riscv_vfcvt_xu_tu(vuint64m8_t vd, vfloat64m8_t vs2, size_t vl);
vuint64m8_t __riscv_vfcvt_rtz_xu_tu(vuint64m8_t vd, vfloat64m8_t vs2,
                                    size_t vl);
// Signed integer -> floating-point (vfcvt_f).
vfloat64m1_t __riscv_vfcvt_f_tu(vfloat64m1_t vd, vint64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfcvt_f_tu(vfloat64m2_t vd, vint64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfcvt_f_tu(vfloat64m4_t vd, vint64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfcvt_f_tu(vfloat64m8_t vd, vint64m8_t vs2, size_t vl);
// Unsigned integer -> floating-point (vfcvt_f).
vfloat64m1_t __riscv_vfcvt_f_tu(vfloat64m1_t vd, vuint64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfcvt_f_tu(vfloat64m2_t vd, vuint64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfcvt_f_tu(vfloat64m4_t vd, vuint64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfcvt_f_tu(vfloat64m8_t vd, vuint64m8_t vs2, size_t vl);
// masked functions: `_tum` overloads of the vfcvt conversions, 16-bit
// elements. Compared with the `_tu` forms, each overload takes a leading mask
// operand `vm`; its type is vboolN_t with N = element width / LMUL
// (vbool64_t for mf4 down to vbool2_t for m8).
// NOTE(review): `_tum` presumably selects the tail-undisturbed,
// mask-agnostic policy -- confirm against the RISC-V V specification.
// Floating-point -> signed integer (vfcvt_x / vfcvt_rtz_x).
vint16mf4_t __riscv_vfcvt_x_tum(vbool64_t vm, vint16mf4_t vd, vfloat16mf4_t vs2,
                                size_t vl);
vint16mf4_t __riscv_vfcvt_rtz_x_tum(vbool64_t vm, vint16mf4_t vd,
                                    vfloat16mf4_t vs2, size_t vl);
vint16mf2_t __riscv_vfcvt_x_tum(vbool32_t vm, vint16mf2_t vd, vfloat16mf2_t vs2,
                                size_t vl);
vint16mf2_t __riscv_vfcvt_rtz_x_tum(vbool32_t vm, vint16mf2_t vd,
                                    vfloat16mf2_t vs2, size_t vl);
vint16m1_t __riscv_vfcvt_x_tum(vbool16_t vm, vint16m1_t vd, vfloat16m1_t vs2,
                               size_t vl);
vint16m1_t __riscv_vfcvt_rtz_x_tum(vbool16_t vm, vint16m1_t vd,
                                   vfloat16m1_t vs2, size_t vl);
vint16m2_t __riscv_vfcvt_x_tum(vbool8_t vm, vint16m2_t vd, vfloat16m2_t vs2,
                               size_t vl);
vint16m2_t __riscv_vfcvt_rtz_x_tum(vbool8_t vm, vint16m2_t vd, vfloat16m2_t vs2,
                                   size_t vl);
vint16m4_t __riscv_vfcvt_x_tum(vbool4_t vm, vint16m4_t vd, vfloat16m4_t vs2,
                               size_t vl);
vint16m4_t __riscv_vfcvt_rtz_x_tum(vbool4_t vm, vint16m4_t vd, vfloat16m4_t vs2,
                                   size_t vl);
vint16m8_t __riscv_vfcvt_x_tum(vbool2_t vm, vint16m8_t vd, vfloat16m8_t vs2,
                               size_t vl);
vint16m8_t __riscv_vfcvt_rtz_x_tum(vbool2_t vm, vint16m8_t vd, vfloat16m8_t vs2,
                                   size_t vl);
// Floating-point -> unsigned integer (vfcvt_xu / vfcvt_rtz_xu).
vuint16mf4_t __riscv_vfcvt_xu_tum(vbool64_t vm, vuint16mf4_t vd,
                                  vfloat16mf4_t vs2, size_t vl);
vuint16mf4_t __riscv_vfcvt_rtz_xu_tum(vbool64_t vm, vuint16mf4_t vd,
                                      vfloat16mf4_t vs2, size_t vl);
vuint16mf2_t __riscv_vfcvt_xu_tum(vbool32_t vm, vuint16mf2_t vd,
                                  vfloat16mf2_t vs2, size_t vl);
vuint16mf2_t __riscv_vfcvt_rtz_xu_tum(vbool32_t vm, vuint16mf2_t vd,
                                      vfloat16mf2_t vs2, size_t vl);
vuint16m1_t __riscv_vfcvt_xu_tum(vbool16_t vm, vuint16m1_t vd, vfloat16m1_t vs2,
                                 size_t vl);
vuint16m1_t __riscv_vfcvt_rtz_xu_tum(vbool16_t vm, vuint16m1_t vd,
                                     vfloat16m1_t vs2, size_t vl);
vuint16m2_t __riscv_vfcvt_xu_tum(vbool8_t vm, vuint16m2_t vd, vfloat16m2_t vs2,
                                 size_t vl);
vuint16m2_t __riscv_vfcvt_rtz_xu_tum(vbool8_t vm, vuint16m2_t vd,
                                     vfloat16m2_t vs2, size_t vl);
vuint16m4_t __riscv_vfcvt_xu_tum(vbool4_t vm, vuint16m4_t vd, vfloat16m4_t vs2,
                                 size_t vl);
vuint16m4_t __riscv_vfcvt_rtz_xu_tum(vbool4_t vm, vuint16m4_t vd,
                                     vfloat16m4_t vs2, size_t vl);
vuint16m8_t __riscv_vfcvt_xu_tum(vbool2_t vm, vuint16m8_t vd, vfloat16m8_t vs2,
                                 size_t vl);
vuint16m8_t __riscv_vfcvt_rtz_xu_tum(vbool2_t vm, vuint16m8_t vd,
                                     vfloat16m8_t vs2, size_t vl);
// Signed integer -> floating-point (vfcvt_f).
vfloat16mf4_t __riscv_vfcvt_f_tum(vbool64_t vm, vfloat16mf4_t vd,
                                  vint16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfcvt_f_tum(vbool32_t vm, vfloat16mf2_t vd,
                                  vint16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfcvt_f_tum(vbool16_t vm, vfloat16m1_t vd, vint16m1_t vs2,
                                 size_t vl);
vfloat16m2_t __riscv_vfcvt_f_tum(vbool8_t vm, vfloat16m2_t vd, vint16m2_t vs2,
                                 size_t vl);
vfloat16m4_t __riscv_vfcvt_f_tum(vbool4_t vm, vfloat16m4_t vd, vint16m4_t vs2,
                                 size_t vl);
vfloat16m8_t __riscv_vfcvt_f_tum(vbool2_t vm, vfloat16m8_t vd, vint16m8_t vs2,
                                 size_t vl);
// Unsigned integer -> floating-point (vfcvt_f).
vfloat16mf4_t __riscv_vfcvt_f_tum(vbool64_t vm, vfloat16mf4_t vd,
                                  vuint16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfcvt_f_tum(vbool32_t vm, vfloat16mf2_t vd,
                                  vuint16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfcvt_f_tum(vbool16_t vm, vfloat16m1_t vd, vuint16m1_t vs2,
                                 size_t vl);
vfloat16m2_t __riscv_vfcvt_f_tum(vbool8_t vm, vfloat16m2_t vd, vuint16m2_t vs2,
                                 size_t vl);
vfloat16m4_t __riscv_vfcvt_f_tum(vbool4_t vm, vfloat16m4_t vd, vuint16m4_t vs2,
                                 size_t vl);
vfloat16m8_t __riscv_vfcvt_f_tum(vbool2_t vm, vfloat16m8_t vd, vuint16m8_t vs2,
                                 size_t vl);
// `_tum` overloads of the vfcvt conversions, 32-bit elements. Each overload
// takes a mask `vm`, the destination operand `vd` (same type as the return
// value), the source `vs2` and the vector length `vl`. The mask type is
// vboolN_t with N = element width / LMUL (vbool64_t for mf2 down to vbool4_t
// for m8).
// Floating-point -> signed integer (vfcvt_x / vfcvt_rtz_x).
vint32mf2_t __riscv_vfcvt_x_tum(vbool64_t vm, vint32mf2_t vd, vfloat32mf2_t vs2,
                                size_t vl);
vint32mf2_t __riscv_vfcvt_rtz_x_tum(vbool64_t vm, vint32mf2_t vd,
                                    vfloat32mf2_t vs2, size_t vl);
vint32m1_t __riscv_vfcvt_x_tum(vbool32_t vm, vint32m1_t vd, vfloat32m1_t vs2,
                               size_t vl);
vint32m1_t __riscv_vfcvt_rtz_x_tum(vbool32_t vm, vint32m1_t vd,
                                   vfloat32m1_t vs2, size_t vl);
vint32m2_t __riscv_vfcvt_x_tum(vbool16_t vm, vint32m2_t vd, vfloat32m2_t vs2,
                               size_t vl);
vint32m2_t __riscv_vfcvt_rtz_x_tum(vbool16_t vm, vint32m2_t vd,
                                   vfloat32m2_t vs2, size_t vl);
vint32m4_t __riscv_vfcvt_x_tum(vbool8_t vm, vint32m4_t vd, vfloat32m4_t vs2,
                               size_t vl);
vint32m4_t __riscv_vfcvt_rtz_x_tum(vbool8_t vm, vint32m4_t vd, vfloat32m4_t vs2,
                                   size_t vl);
vint32m8_t __riscv_vfcvt_x_tum(vbool4_t vm, vint32m8_t vd, vfloat32m8_t vs2,
                               size_t vl);
vint32m8_t __riscv_vfcvt_rtz_x_tum(vbool4_t vm, vint32m8_t vd, vfloat32m8_t vs2,
                                   size_t vl);
// Floating-point -> unsigned integer (vfcvt_xu / vfcvt_rtz_xu).
vuint32mf2_t __riscv_vfcvt_xu_tum(vbool64_t vm, vuint32mf2_t vd,
                                  vfloat32mf2_t vs2, size_t vl);
vuint32mf2_t __riscv_vfcvt_rtz_xu_tum(vbool64_t vm, vuint32mf2_t vd,
                                      vfloat32mf2_t vs2, size_t vl);
vuint32m1_t __riscv_vfcvt_xu_tum(vbool32_t vm, vuint32m1_t vd, vfloat32m1_t vs2,
                                 size_t vl);
vuint32m1_t __riscv_vfcvt_rtz_xu_tum(vbool32_t vm, vuint32m1_t vd,
                                     vfloat32m1_t vs2, size_t vl);
vuint32m2_t __riscv_vfcvt_xu_tum(vbool16_t vm, vuint32m2_t vd, vfloat32m2_t vs2,
                                 size_t vl);
vuint32m2_t __riscv_vfcvt_rtz_xu_tum(vbool16_t vm, vuint32m2_t vd,
                                     vfloat32m2_t vs2, size_t vl);
vuint32m4_t __riscv_vfcvt_xu_tum(vbool8_t vm, vuint32m4_t vd, vfloat32m4_t vs2,
                                 size_t vl);
vuint32m4_t __riscv_vfcvt_rtz_xu_tum(vbool8_t vm, vuint32m4_t vd,
                                     vfloat32m4_t vs2, size_t vl);
vuint32m8_t __riscv_vfcvt_xu_tum(vbool4_t vm, vuint32m8_t vd, vfloat32m8_t vs2,
                                 size_t vl);
vuint32m8_t __riscv_vfcvt_rtz_xu_tum(vbool4_t vm, vuint32m8_t vd,
                                     vfloat32m8_t vs2, size_t vl);
// Signed integer -> floating-point (vfcvt_f).
vfloat32mf2_t __riscv_vfcvt_f_tum(vbool64_t vm, vfloat32mf2_t vd,
                                  vint32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfcvt_f_tum(vbool32_t vm, vfloat32m1_t vd, vint32m1_t vs2,
                                 size_t vl);
vfloat32m2_t __riscv_vfcvt_f_tum(vbool16_t vm, vfloat32m2_t vd, vint32m2_t vs2,
                                 size_t vl);
vfloat32m4_t __riscv_vfcvt_f_tum(vbool8_t vm, vfloat32m4_t vd, vint32m4_t vs2,
                                 size_t vl);
vfloat32m8_t __riscv_vfcvt_f_tum(vbool4_t vm, vfloat32m8_t vd, vint32m8_t vs2,
                                 size_t vl);
// Unsigned integer -> floating-point (vfcvt_f).
vfloat32mf2_t __riscv_vfcvt_f_tum(vbool64_t vm, vfloat32mf2_t vd,
                                  vuint32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfcvt_f_tum(vbool32_t vm, vfloat32m1_t vd, vuint32m1_t vs2,
                                 size_t vl);
vfloat32m2_t __riscv_vfcvt_f_tum(vbool16_t vm, vfloat32m2_t vd, vuint32m2_t vs2,
                                 size_t vl);
vfloat32m4_t __riscv_vfcvt_f_tum(vbool8_t vm, vfloat32m4_t vd, vuint32m4_t vs2,
                                 size_t vl);
vfloat32m8_t __riscv_vfcvt_f_tum(vbool4_t vm, vfloat32m8_t vd, vuint32m8_t vs2,
                                 size_t vl);
// `_tum` overloads of the vfcvt conversions, 64-bit elements. Each overload
// takes a mask `vm`, the destination operand `vd` (same type as the return
// value), the source `vs2` and the vector length `vl`. The mask type is
// vboolN_t with N = element width / LMUL (vbool64_t for m1 down to vbool8_t
// for m8).
// Floating-point -> signed integer (vfcvt_x / vfcvt_rtz_x).
vint64m1_t __riscv_vfcvt_x_tum(vbool64_t vm, vint64m1_t vd, vfloat64m1_t vs2,
                               size_t vl);
vint64m1_t __riscv_vfcvt_rtz_x_tum(vbool64_t vm, vint64m1_t vd,
                                   vfloat64m1_t vs2, size_t vl);
vint64m2_t __riscv_vfcvt_x_tum(vbool32_t vm, vint64m2_t vd, vfloat64m2_t vs2,
                               size_t vl);
vint64m2_t __riscv_vfcvt_rtz_x_tum(vbool32_t vm, vint64m2_t vd,
                                   vfloat64m2_t vs2, size_t vl);
vint64m4_t __riscv_vfcvt_x_tum(vbool16_t vm, vint64m4_t vd, vfloat64m4_t vs2,
                               size_t vl);
vint64m4_t __riscv_vfcvt_rtz_x_tum(vbool16_t vm, vint64m4_t vd,
                                   vfloat64m4_t vs2, size_t vl);
vint64m8_t __riscv_vfcvt_x_tum(vbool8_t vm, vint64m8_t vd, vfloat64m8_t vs2,
                               size_t vl);
vint64m8_t __riscv_vfcvt_rtz_x_tum(vbool8_t vm, vint64m8_t vd, vfloat64m8_t vs2,
                                   size_t vl);
// Floating-point -> unsigned integer (vfcvt_xu / vfcvt_rtz_xu).
vuint64m1_t __riscv_vfcvt_xu_tum(vbool64_t vm, vuint64m1_t vd, vfloat64m1_t vs2,
                                 size_t vl);
vuint64m1_t __riscv_vfcvt_rtz_xu_tum(vbool64_t vm, vuint64m1_t vd,
                                     vfloat64m1_t vs2, size_t vl);
vuint64m2_t __riscv_vfcvt_xu_tum(vbool32_t vm, vuint64m2_t vd, vfloat64m2_t vs2,
                                 size_t vl);
vuint64m2_t __riscv_vfcvt_rtz_xu_tum(vbool32_t vm, vuint64m2_t vd,
                                     vfloat64m2_t vs2, size_t vl);
vuint64m4_t __riscv_vfcvt_xu_tum(vbool16_t vm, vuint64m4_t vd, vfloat64m4_t vs2,
                                 size_t vl);
vuint64m4_t __riscv_vfcvt_rtz_xu_tum(vbool16_t vm, vuint64m4_t vd,
                                     vfloat64m4_t vs2, size_t vl);
vuint64m8_t __riscv_vfcvt_xu_tum(vbool8_t vm, vuint64m8_t vd, vfloat64m8_t vs2,
                                 size_t vl);
vuint64m8_t __riscv_vfcvt_rtz_xu_tum(vbool8_t vm, vuint64m8_t vd,
                                     vfloat64m8_t vs2, size_t vl);
// Signed integer -> floating-point (vfcvt_f).
vfloat64m1_t __riscv_vfcvt_f_tum(vbool64_t vm, vfloat64m1_t vd, vint64m1_t vs2,
                                 size_t vl);
vfloat64m2_t __riscv_vfcvt_f_tum(vbool32_t vm, vfloat64m2_t vd, vint64m2_t vs2,
                                 size_t vl);
vfloat64m4_t __riscv_vfcvt_f_tum(vbool16_t vm, vfloat64m4_t vd, vint64m4_t vs2,
                                 size_t vl);
vfloat64m8_t __riscv_vfcvt_f_tum(vbool8_t vm, vfloat64m8_t vd, vint64m8_t vs2,
                                 size_t vl);
// Unsigned integer -> floating-point (vfcvt_f).
vfloat64m1_t __riscv_vfcvt_f_tum(vbool64_t vm, vfloat64m1_t vd, vuint64m1_t vs2,
                                 size_t vl);
vfloat64m2_t __riscv_vfcvt_f_tum(vbool32_t vm, vfloat64m2_t vd, vuint64m2_t vs2,
                                 size_t vl);
vfloat64m4_t __riscv_vfcvt_f_tum(vbool16_t vm, vfloat64m4_t vd, vuint64m4_t vs2,
                                 size_t vl);
vfloat64m8_t __riscv_vfcvt_f_tum(vbool8_t vm, vfloat64m8_t vd, vuint64m8_t vs2,
                                 size_t vl);
// masked functions, _tumu suffix (tail-undisturbed, mask-undisturbed policy)
// _tumu overloads for 16-bit element types. Arguments: mask vm, vd (same type
// as the result), source vs2, and vl.
// vfloat16 -> vint16; each vfcvt_x form is followed by its vfcvt_rtz_x form.
vint16mf4_t __riscv_vfcvt_x_tumu(vbool64_t vm, vint16mf4_t vd,
                                 vfloat16mf4_t vs2, size_t vl);
vint16mf4_t __riscv_vfcvt_rtz_x_tumu(vbool64_t vm, vint16mf4_t vd,
                                     vfloat16mf4_t vs2, size_t vl);
vint16mf2_t __riscv_vfcvt_x_tumu(vbool32_t vm, vint16mf2_t vd,
                                 vfloat16mf2_t vs2, size_t vl);
vint16mf2_t __riscv_vfcvt_rtz_x_tumu(vbool32_t vm, vint16mf2_t vd,
                                     vfloat16mf2_t vs2, size_t vl);
vint16m1_t __riscv_vfcvt_x_tumu(vbool16_t vm, vint16m1_t vd, vfloat16m1_t vs2,
                                size_t vl);
vint16m1_t __riscv_vfcvt_rtz_x_tumu(vbool16_t vm, vint16m1_t vd,
                                    vfloat16m1_t vs2, size_t vl);
vint16m2_t __riscv_vfcvt_x_tumu(vbool8_t vm, vint16m2_t vd, vfloat16m2_t vs2,
                                size_t vl);
vint16m2_t __riscv_vfcvt_rtz_x_tumu(vbool8_t vm, vint16m2_t vd,
                                    vfloat16m2_t vs2, size_t vl);
vint16m4_t __riscv_vfcvt_x_tumu(vbool4_t vm, vint16m4_t vd, vfloat16m4_t vs2,
                                size_t vl);
vint16m4_t __riscv_vfcvt_rtz_x_tumu(vbool4_t vm, vint16m4_t vd,
                                    vfloat16m4_t vs2, size_t vl);
vint16m8_t __riscv_vfcvt_x_tumu(vbool2_t vm, vint16m8_t vd, vfloat16m8_t vs2,
                                size_t vl);
vint16m8_t __riscv_vfcvt_rtz_x_tumu(vbool2_t vm, vint16m8_t vd,
                                    vfloat16m8_t vs2, size_t vl);
// vfloat16 -> vuint16 (vfcvt_xu / vfcvt_rtz_xu pairs).
vuint16mf4_t __riscv_vfcvt_xu_tumu(vbool64_t vm, vuint16mf4_t vd,
                                   vfloat16mf4_t vs2, size_t vl);
vuint16mf4_t __riscv_vfcvt_rtz_xu_tumu(vbool64_t vm, vuint16mf4_t vd,
                                       vfloat16mf4_t vs2, size_t vl);
vuint16mf2_t __riscv_vfcvt_xu_tumu(vbool32_t vm, vuint16mf2_t vd,
                                   vfloat16mf2_t vs2, size_t vl);
vuint16mf2_t __riscv_vfcvt_rtz_xu_tumu(vbool32_t vm, vuint16mf2_t vd,
                                       vfloat16mf2_t vs2, size_t vl);
vuint16m1_t __riscv_vfcvt_xu_tumu(vbool16_t vm, vuint16m1_t vd,
                                  vfloat16m1_t vs2, size_t vl);
vuint16m1_t __riscv_vfcvt_rtz_xu_tumu(vbool16_t vm, vuint16m1_t vd,
                                      vfloat16m1_t vs2, size_t vl);
vuint16m2_t __riscv_vfcvt_xu_tumu(vbool8_t vm, vuint16m2_t vd, vfloat16m2_t vs2,
                                  size_t vl);
vuint16m2_t __riscv_vfcvt_rtz_xu_tumu(vbool8_t vm, vuint16m2_t vd,
                                      vfloat16m2_t vs2, size_t vl);
vuint16m4_t __riscv_vfcvt_xu_tumu(vbool4_t vm, vuint16m4_t vd, vfloat16m4_t vs2,
                                  size_t vl);
vuint16m4_t __riscv_vfcvt_rtz_xu_tumu(vbool4_t vm, vuint16m4_t vd,
                                      vfloat16m4_t vs2, size_t vl);
vuint16m8_t __riscv_vfcvt_xu_tumu(vbool2_t vm, vuint16m8_t vd, vfloat16m8_t vs2,
                                  size_t vl);
vuint16m8_t __riscv_vfcvt_rtz_xu_tumu(vbool2_t vm, vuint16m8_t vd,
                                      vfloat16m8_t vs2, size_t vl);
// vint16 -> vfloat16.
vfloat16mf4_t __riscv_vfcvt_f_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                   vint16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfcvt_f_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                   vint16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfcvt_f_tumu(vbool16_t vm, vfloat16m1_t vd, vint16m1_t vs2,
                                  size_t vl);
vfloat16m2_t __riscv_vfcvt_f_tumu(vbool8_t vm, vfloat16m2_t vd, vint16m2_t vs2,
                                  size_t vl);
vfloat16m4_t __riscv_vfcvt_f_tumu(vbool4_t vm, vfloat16m4_t vd, vint16m4_t vs2,
                                  size_t vl);
vfloat16m8_t __riscv_vfcvt_f_tumu(vbool2_t vm, vfloat16m8_t vd, vint16m8_t vs2,
                                  size_t vl);
// vuint16 -> vfloat16.
vfloat16mf4_t __riscv_vfcvt_f_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                   vuint16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfcvt_f_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                   vuint16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfcvt_f_tumu(vbool16_t vm, vfloat16m1_t vd,
                                  vuint16m1_t vs2, size_t vl);
vfloat16m2_t __riscv_vfcvt_f_tumu(vbool8_t vm, vfloat16m2_t vd, vuint16m2_t vs2,
                                  size_t vl);
vfloat16m4_t __riscv_vfcvt_f_tumu(vbool4_t vm, vfloat16m4_t vd, vuint16m4_t vs2,
                                  size_t vl);
vfloat16m8_t __riscv_vfcvt_f_tumu(vbool2_t vm, vfloat16m8_t vd, vuint16m8_t vs2,
                                  size_t vl);
// _tumu overloads for 32-bit element types. Arguments: mask vm, vd (same type
// as the result), source vs2, and vl.
// vfloat32 -> vint32; each vfcvt_x form is followed by its vfcvt_rtz_x form.
vint32mf2_t __riscv_vfcvt_x_tumu(vbool64_t vm, vint32mf2_t vd,
                                 vfloat32mf2_t vs2, size_t vl);
vint32mf2_t __riscv_vfcvt_rtz_x_tumu(vbool64_t vm, vint32mf2_t vd,
                                     vfloat32mf2_t vs2, size_t vl);
vint32m1_t __riscv_vfcvt_x_tumu(vbool32_t vm, vint32m1_t vd, vfloat32m1_t vs2,
                                size_t vl);
vint32m1_t __riscv_vfcvt_rtz_x_tumu(vbool32_t vm, vint32m1_t vd,
                                    vfloat32m1_t vs2, size_t vl);
vint32m2_t __riscv_vfcvt_x_tumu(vbool16_t vm, vint32m2_t vd, vfloat32m2_t vs2,
                                size_t vl);
vint32m2_t __riscv_vfcvt_rtz_x_tumu(vbool16_t vm, vint32m2_t vd,
                                    vfloat32m2_t vs2, size_t vl);
vint32m4_t __riscv_vfcvt_x_tumu(vbool8_t vm, vint32m4_t vd, vfloat32m4_t vs2,
                                size_t vl);
vint32m4_t __riscv_vfcvt_rtz_x_tumu(vbool8_t vm, vint32m4_t vd,
                                    vfloat32m4_t vs2, size_t vl);
vint32m8_t __riscv_vfcvt_x_tumu(vbool4_t vm, vint32m8_t vd, vfloat32m8_t vs2,
                                size_t vl);
vint32m8_t __riscv_vfcvt_rtz_x_tumu(vbool4_t vm, vint32m8_t vd,
                                    vfloat32m8_t vs2, size_t vl);
// vfloat32 -> vuint32 (vfcvt_xu / vfcvt_rtz_xu pairs).
vuint32mf2_t __riscv_vfcvt_xu_tumu(vbool64_t vm, vuint32mf2_t vd,
                                   vfloat32mf2_t vs2, size_t vl);
vuint32mf2_t __riscv_vfcvt_rtz_xu_tumu(vbool64_t vm, vuint32mf2_t vd,
                                       vfloat32mf2_t vs2, size_t vl);
vuint32m1_t __riscv_vfcvt_xu_tumu(vbool32_t vm, vuint32m1_t vd,
                                  vfloat32m1_t vs2, size_t vl);
vuint32m1_t __riscv_vfcvt_rtz_xu_tumu(vbool32_t vm, vuint32m1_t vd,
                                      vfloat32m1_t vs2, size_t vl);
vuint32m2_t __riscv_vfcvt_xu_tumu(vbool16_t vm, vuint32m2_t vd,
                                  vfloat32m2_t vs2, size_t vl);
vuint32m2_t __riscv_vfcvt_rtz_xu_tumu(vbool16_t vm, vuint32m2_t vd,
                                      vfloat32m2_t vs2, size_t vl);
vuint32m4_t __riscv_vfcvt_xu_tumu(vbool8_t vm, vuint32m4_t vd, vfloat32m4_t vs2,
                                  size_t vl);
vuint32m4_t __riscv_vfcvt_rtz_xu_tumu(vbool8_t vm, vuint32m4_t vd,
                                      vfloat32m4_t vs2, size_t vl);
vuint32m8_t __riscv_vfcvt_xu_tumu(vbool4_t vm, vuint32m8_t vd, vfloat32m8_t vs2,
                                  size_t vl);
vuint32m8_t __riscv_vfcvt_rtz_xu_tumu(vbool4_t vm, vuint32m8_t vd,
                                      vfloat32m8_t vs2, size_t vl);
// vint32 -> vfloat32.
vfloat32mf2_t __riscv_vfcvt_f_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                   vint32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfcvt_f_tumu(vbool32_t vm, vfloat32m1_t vd, vint32m1_t vs2,
                                  size_t vl);
vfloat32m2_t __riscv_vfcvt_f_tumu(vbool16_t vm, vfloat32m2_t vd, vint32m2_t vs2,
                                  size_t vl);
vfloat32m4_t __riscv_vfcvt_f_tumu(vbool8_t vm, vfloat32m4_t vd, vint32m4_t vs2,
                                  size_t vl);
vfloat32m8_t __riscv_vfcvt_f_tumu(vbool4_t vm, vfloat32m8_t vd, vint32m8_t vs2,
                                  size_t vl);
// vuint32 -> vfloat32.
vfloat32mf2_t __riscv_vfcvt_f_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                   vuint32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfcvt_f_tumu(vbool32_t vm, vfloat32m1_t vd,
                                  vuint32m1_t vs2, size_t vl);
vfloat32m2_t __riscv_vfcvt_f_tumu(vbool16_t vm, vfloat32m2_t vd,
                                  vuint32m2_t vs2, size_t vl);
vfloat32m4_t __riscv_vfcvt_f_tumu(vbool8_t vm, vfloat32m4_t vd, vuint32m4_t vs2,
                                  size_t vl);
vfloat32m8_t __riscv_vfcvt_f_tumu(vbool4_t vm, vfloat32m8_t vd, vuint32m8_t vs2,
                                  size_t vl);
// _tumu overloads for 64-bit element types. Arguments: mask vm, vd (same type
// as the result), source vs2, and vl.
// vfloat64 -> vint64; each vfcvt_x form is followed by its vfcvt_rtz_x form.
vint64m1_t __riscv_vfcvt_x_tumu(vbool64_t vm, vint64m1_t vd, vfloat64m1_t vs2,
                                size_t vl);
vint64m1_t __riscv_vfcvt_rtz_x_tumu(vbool64_t vm, vint64m1_t vd,
                                    vfloat64m1_t vs2, size_t vl);
vint64m2_t __riscv_vfcvt_x_tumu(vbool32_t vm, vint64m2_t vd, vfloat64m2_t vs2,
                                size_t vl);
vint64m2_t __riscv_vfcvt_rtz_x_tumu(vbool32_t vm, vint64m2_t vd,
                                    vfloat64m2_t vs2, size_t vl);
vint64m4_t __riscv_vfcvt_x_tumu(vbool16_t vm, vint64m4_t vd, vfloat64m4_t vs2,
                                size_t vl);
vint64m4_t __riscv_vfcvt_rtz_x_tumu(vbool16_t vm, vint64m4_t vd,
                                    vfloat64m4_t vs2, size_t vl);
vint64m8_t __riscv_vfcvt_x_tumu(vbool8_t vm, vint64m8_t vd, vfloat64m8_t vs2,
                                size_t vl);
vint64m8_t __riscv_vfcvt_rtz_x_tumu(vbool8_t vm, vint64m8_t vd,
                                    vfloat64m8_t vs2, size_t vl);
// vfloat64 -> vuint64 (vfcvt_xu / vfcvt_rtz_xu pairs).
vuint64m1_t __riscv_vfcvt_xu_tumu(vbool64_t vm, vuint64m1_t vd,
                                  vfloat64m1_t vs2, size_t vl);
vuint64m1_t __riscv_vfcvt_rtz_xu_tumu(vbool64_t vm, vuint64m1_t vd,
                                      vfloat64m1_t vs2, size_t vl);
vuint64m2_t __riscv_vfcvt_xu_tumu(vbool32_t vm, vuint64m2_t vd,
                                  vfloat64m2_t vs2, size_t vl);
vuint64m2_t __riscv_vfcvt_rtz_xu_tumu(vbool32_t vm, vuint64m2_t vd,
                                      vfloat64m2_t vs2, size_t vl);
vuint64m4_t __riscv_vfcvt_xu_tumu(vbool16_t vm, vuint64m4_t vd,
                                  vfloat64m4_t vs2, size_t vl);
vuint64m4_t __riscv_vfcvt_rtz_xu_tumu(vbool16_t vm, vuint64m4_t vd,
                                      vfloat64m4_t vs2, size_t vl);
vuint64m8_t __riscv_vfcvt_xu_tumu(vbool8_t vm, vuint64m8_t vd, vfloat64m8_t vs2,
                                  size_t vl);
vuint64m8_t __riscv_vfcvt_rtz_xu_tumu(vbool8_t vm, vuint64m8_t vd,
                                      vfloat64m8_t vs2, size_t vl);
// vint64 -> vfloat64.
vfloat64m1_t __riscv_vfcvt_f_tumu(vbool64_t vm, vfloat64m1_t vd, vint64m1_t vs2,
                                  size_t vl);
vfloat64m2_t __riscv_vfcvt_f_tumu(vbool32_t vm, vfloat64m2_t vd, vint64m2_t vs2,
                                  size_t vl);
vfloat64m4_t __riscv_vfcvt_f_tumu(vbool16_t vm, vfloat64m4_t vd, vint64m4_t vs2,
                                  size_t vl);
vfloat64m8_t __riscv_vfcvt_f_tumu(vbool8_t vm, vfloat64m8_t vd, vint64m8_t vs2,
                                  size_t vl);
// vuint64 -> vfloat64.
vfloat64m1_t __riscv_vfcvt_f_tumu(vbool64_t vm, vfloat64m1_t vd,
                                  vuint64m1_t vs2, size_t vl);
vfloat64m2_t __riscv_vfcvt_f_tumu(vbool32_t vm, vfloat64m2_t vd,
                                  vuint64m2_t vs2, size_t vl);
vfloat64m4_t __riscv_vfcvt_f_tumu(vbool16_t vm, vfloat64m4_t vd,
                                  vuint64m4_t vs2, size_t vl);
vfloat64m8_t __riscv_vfcvt_f_tumu(vbool8_t vm, vfloat64m8_t vd, vuint64m8_t vs2,
                                  size_t vl);
// masked functions, _mu suffix (tail-agnostic, mask-undisturbed policy)
// _mu overloads for 16-bit element types. Arguments: mask vm, vd (same type as
// the result), source vs2, and vl.
// vfloat16 -> vint16; each vfcvt_x form is followed by its vfcvt_rtz_x form.
vint16mf4_t __riscv_vfcvt_x_mu(vbool64_t vm, vint16mf4_t vd, vfloat16mf4_t vs2,
                               size_t vl);
vint16mf4_t __riscv_vfcvt_rtz_x_mu(vbool64_t vm, vint16mf4_t vd,
                                   vfloat16mf4_t vs2, size_t vl);
vint16mf2_t __riscv_vfcvt_x_mu(vbool32_t vm, vint16mf2_t vd, vfloat16mf2_t vs2,
                               size_t vl);
vint16mf2_t __riscv_vfcvt_rtz_x_mu(vbool32_t vm, vint16mf2_t vd,
                                   vfloat16mf2_t vs2, size_t vl);
vint16m1_t __riscv_vfcvt_x_mu(vbool16_t vm, vint16m1_t vd, vfloat16m1_t vs2,
                              size_t vl);
vint16m1_t __riscv_vfcvt_rtz_x_mu(vbool16_t vm, vint16m1_t vd, vfloat16m1_t vs2,
                                  size_t vl);
vint16m2_t __riscv_vfcvt_x_mu(vbool8_t vm, vint16m2_t vd, vfloat16m2_t vs2,
                              size_t vl);
vint16m2_t __riscv_vfcvt_rtz_x_mu(vbool8_t vm, vint16m2_t vd, vfloat16m2_t vs2,
                                  size_t vl);
vint16m4_t __riscv_vfcvt_x_mu(vbool4_t vm, vint16m4_t vd, vfloat16m4_t vs2,
                              size_t vl);
vint16m4_t __riscv_vfcvt_rtz_x_mu(vbool4_t vm, vint16m4_t vd, vfloat16m4_t vs2,
                                  size_t vl);
vint16m8_t __riscv_vfcvt_x_mu(vbool2_t vm, vint16m8_t vd, vfloat16m8_t vs2,
                              size_t vl);
vint16m8_t __riscv_vfcvt_rtz_x_mu(vbool2_t vm, vint16m8_t vd, vfloat16m8_t vs2,
                                  size_t vl);
// vfloat16 -> vuint16 (vfcvt_xu / vfcvt_rtz_xu pairs).
vuint16mf4_t __riscv_vfcvt_xu_mu(vbool64_t vm, vuint16mf4_t vd,
                                 vfloat16mf4_t vs2, size_t vl);
vuint16mf4_t __riscv_vfcvt_rtz_xu_mu(vbool64_t vm, vuint16mf4_t vd,
                                     vfloat16mf4_t vs2, size_t vl);
vuint16mf2_t __riscv_vfcvt_xu_mu(vbool32_t vm, vuint16mf2_t vd,
                                 vfloat16mf2_t vs2, size_t vl);
vuint16mf2_t __riscv_vfcvt_rtz_xu_mu(vbool32_t vm, vuint16mf2_t vd,
                                     vfloat16mf2_t vs2, size_t vl);
vuint16m1_t __riscv_vfcvt_xu_mu(vbool16_t vm, vuint16m1_t vd, vfloat16m1_t vs2,
                                size_t vl);
vuint16m1_t __riscv_vfcvt_rtz_xu_mu(vbool16_t vm, vuint16m1_t vd,
                                    vfloat16m1_t vs2, size_t vl);
vuint16m2_t __riscv_vfcvt_xu_mu(vbool8_t vm, vuint16m2_t vd, vfloat16m2_t vs2,
                                size_t vl);
vuint16m2_t __riscv_vfcvt_rtz_xu_mu(vbool8_t vm, vuint16m2_t vd,
                                    vfloat16m2_t vs2, size_t vl);
vuint16m4_t __riscv_vfcvt_xu_mu(vbool4_t vm, vuint16m4_t vd, vfloat16m4_t vs2,
                                size_t vl);
vuint16m4_t __riscv_vfcvt_rtz_xu_mu(vbool4_t vm, vuint16m4_t vd,
                                    vfloat16m4_t vs2, size_t vl);
vuint16m8_t __riscv_vfcvt_xu_mu(vbool2_t vm, vuint16m8_t vd, vfloat16m8_t vs2,
                                size_t vl);
vuint16m8_t __riscv_vfcvt_rtz_xu_mu(vbool2_t vm, vuint16m8_t vd,
                                    vfloat16m8_t vs2, size_t vl);
// vint16 -> vfloat16.
vfloat16mf4_t __riscv_vfcvt_f_mu(vbool64_t vm, vfloat16mf4_t vd,
                                 vint16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfcvt_f_mu(vbool32_t vm, vfloat16mf2_t vd,
                                 vint16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfcvt_f_mu(vbool16_t vm, vfloat16m1_t vd, vint16m1_t vs2,
                                size_t vl);
vfloat16m2_t __riscv_vfcvt_f_mu(vbool8_t vm, vfloat16m2_t vd, vint16m2_t vs2,
                                size_t vl);
vfloat16m4_t __riscv_vfcvt_f_mu(vbool4_t vm, vfloat16m4_t vd, vint16m4_t vs2,
                                size_t vl);
vfloat16m8_t __riscv_vfcvt_f_mu(vbool2_t vm, vfloat16m8_t vd, vint16m8_t vs2,
                                size_t vl);
// vuint16 -> vfloat16.
vfloat16mf4_t __riscv_vfcvt_f_mu(vbool64_t vm, vfloat16mf4_t vd,
                                 vuint16mf4_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfcvt_f_mu(vbool32_t vm, vfloat16mf2_t vd,
                                 vuint16mf2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfcvt_f_mu(vbool16_t vm, vfloat16m1_t vd, vuint16m1_t vs2,
                                size_t vl);
vfloat16m2_t __riscv_vfcvt_f_mu(vbool8_t vm, vfloat16m2_t vd, vuint16m2_t vs2,
                                size_t vl);
vfloat16m4_t __riscv_vfcvt_f_mu(vbool4_t vm, vfloat16m4_t vd, vuint16m4_t vs2,
                                size_t vl);
vfloat16m8_t __riscv_vfcvt_f_mu(vbool2_t vm, vfloat16m8_t vd, vuint16m8_t vs2,
                                size_t vl);
// _mu overloads for 32-bit element types. Arguments: mask vm, vd (same type as
// the result), source vs2, and vl.
// vfloat32 -> vint32; each vfcvt_x form is followed by its vfcvt_rtz_x form.
vint32mf2_t __riscv_vfcvt_x_mu(vbool64_t vm, vint32mf2_t vd, vfloat32mf2_t vs2,
                               size_t vl);
vint32mf2_t __riscv_vfcvt_rtz_x_mu(vbool64_t vm, vint32mf2_t vd,
                                   vfloat32mf2_t vs2, size_t vl);
vint32m1_t __riscv_vfcvt_x_mu(vbool32_t vm, vint32m1_t vd, vfloat32m1_t vs2,
                              size_t vl);
vint32m1_t __riscv_vfcvt_rtz_x_mu(vbool32_t vm, vint32m1_t vd, vfloat32m1_t vs2,
                                  size_t vl);
vint32m2_t __riscv_vfcvt_x_mu(vbool16_t vm, vint32m2_t vd, vfloat32m2_t vs2,
                              size_t vl);
vint32m2_t __riscv_vfcvt_rtz_x_mu(vbool16_t vm, vint32m2_t vd, vfloat32m2_t vs2,
                                  size_t vl);
vint32m4_t __riscv_vfcvt_x_mu(vbool8_t vm, vint32m4_t vd, vfloat32m4_t vs2,
                              size_t vl);
vint32m4_t __riscv_vfcvt_rtz_x_mu(vbool8_t vm, vint32m4_t vd, vfloat32m4_t vs2,
                                  size_t vl);
vint32m8_t __riscv_vfcvt_x_mu(vbool4_t vm, vint32m8_t vd, vfloat32m8_t vs2,
                              size_t vl);
vint32m8_t __riscv_vfcvt_rtz_x_mu(vbool4_t vm, vint32m8_t vd, vfloat32m8_t vs2,
                                  size_t vl);
// vfloat32 -> vuint32 (vfcvt_xu / vfcvt_rtz_xu pairs).
vuint32mf2_t __riscv_vfcvt_xu_mu(vbool64_t vm, vuint32mf2_t vd,
                                 vfloat32mf2_t vs2, size_t vl);
vuint32mf2_t __riscv_vfcvt_rtz_xu_mu(vbool64_t vm, vuint32mf2_t vd,
                                     vfloat32mf2_t vs2, size_t vl);
vuint32m1_t __riscv_vfcvt_xu_mu(vbool32_t vm, vuint32m1_t vd, vfloat32m1_t vs2,
                                size_t vl);
vuint32m1_t __riscv_vfcvt_rtz_xu_mu(vbool32_t vm, vuint32m1_t vd,
                                    vfloat32m1_t vs2, size_t vl);
vuint32m2_t __riscv_vfcvt_xu_mu(vbool16_t vm, vuint32m2_t vd, vfloat32m2_t vs2,
                                size_t vl);
vuint32m2_t __riscv_vfcvt_rtz_xu_mu(vbool16_t vm, vuint32m2_t vd,
                                    vfloat32m2_t vs2, size_t vl);
vuint32m4_t __riscv_vfcvt_xu_mu(vbool8_t vm, vuint32m4_t vd, vfloat32m4_t vs2,
                                size_t vl);
vuint32m4_t __riscv_vfcvt_rtz_xu_mu(vbool8_t vm, vuint32m4_t vd,
                                    vfloat32m4_t vs2, size_t vl);
vuint32m8_t __riscv_vfcvt_xu_mu(vbool4_t vm, vuint32m8_t vd, vfloat32m8_t vs2,
                                size_t vl);
vuint32m8_t __riscv_vfcvt_rtz_xu_mu(vbool4_t vm, vuint32m8_t vd,
                                    vfloat32m8_t vs2, size_t vl);
// vint32 -> vfloat32.
vfloat32mf2_t __riscv_vfcvt_f_mu(vbool64_t vm, vfloat32mf2_t vd,
                                 vint32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfcvt_f_mu(vbool32_t vm, vfloat32m1_t vd, vint32m1_t vs2,
                                size_t vl);
vfloat32m2_t __riscv_vfcvt_f_mu(vbool16_t vm, vfloat32m2_t vd, vint32m2_t vs2,
                                size_t vl);
vfloat32m4_t __riscv_vfcvt_f_mu(vbool8_t vm, vfloat32m4_t vd, vint32m4_t vs2,
                                size_t vl);
vfloat32m8_t __riscv_vfcvt_f_mu(vbool4_t vm, vfloat32m8_t vd, vint32m8_t vs2,
                                size_t vl);
// vuint32 -> vfloat32.
vfloat32mf2_t __riscv_vfcvt_f_mu(vbool64_t vm, vfloat32mf2_t vd,
                                 vuint32mf2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfcvt_f_mu(vbool32_t vm, vfloat32m1_t vd, vuint32m1_t vs2,
                                size_t vl);
vfloat32m2_t __riscv_vfcvt_f_mu(vbool16_t vm, vfloat32m2_t vd, vuint32m2_t vs2,
                                size_t vl);
vfloat32m4_t __riscv_vfcvt_f_mu(vbool8_t vm, vfloat32m4_t vd, vuint32m4_t vs2,
                                size_t vl);
vfloat32m8_t __riscv_vfcvt_f_mu(vbool4_t vm, vfloat32m8_t vd, vuint32m8_t vs2,
                                size_t vl);
// _mu overloads for 64-bit element types. Arguments: mask vm, vd (same type as
// the result), source vs2, and vl.
// vfloat64 -> vint64; each vfcvt_x form is followed by its vfcvt_rtz_x form.
vint64m1_t __riscv_vfcvt_x_mu(vbool64_t vm, vint64m1_t vd, vfloat64m1_t vs2,
                              size_t vl);
vint64m1_t __riscv_vfcvt_rtz_x_mu(vbool64_t vm, vint64m1_t vd, vfloat64m1_t vs2,
                                  size_t vl);
vint64m2_t __riscv_vfcvt_x_mu(vbool32_t vm, vint64m2_t vd, vfloat64m2_t vs2,
                              size_t vl);
vint64m2_t __riscv_vfcvt_rtz_x_mu(vbool32_t vm, vint64m2_t vd, vfloat64m2_t vs2,
                                  size_t vl);
vint64m4_t __riscv_vfcvt_x_mu(vbool16_t vm, vint64m4_t vd, vfloat64m4_t vs2,
                              size_t vl);
vint64m4_t __riscv_vfcvt_rtz_x_mu(vbool16_t vm, vint64m4_t vd, vfloat64m4_t vs2,
                                  size_t vl);
vint64m8_t __riscv_vfcvt_x_mu(vbool8_t vm, vint64m8_t vd, vfloat64m8_t vs2,
                              size_t vl);
vint64m8_t __riscv_vfcvt_rtz_x_mu(vbool8_t vm, vint64m8_t vd, vfloat64m8_t vs2,
                                  size_t vl);
// vfloat64 -> vuint64 (vfcvt_xu / vfcvt_rtz_xu pairs).
vuint64m1_t __riscv_vfcvt_xu_mu(vbool64_t vm, vuint64m1_t vd, vfloat64m1_t vs2,
                                size_t vl);
vuint64m1_t __riscv_vfcvt_rtz_xu_mu(vbool64_t vm, vuint64m1_t vd,
                                    vfloat64m1_t vs2, size_t vl);
vuint64m2_t __riscv_vfcvt_xu_mu(vbool32_t vm, vuint64m2_t vd, vfloat64m2_t vs2,
                                size_t vl);
vuint64m2_t __riscv_vfcvt_rtz_xu_mu(vbool32_t vm, vuint64m2_t vd,
                                    vfloat64m2_t vs2, size_t vl);
vuint64m4_t __riscv_vfcvt_xu_mu(vbool16_t vm, vuint64m4_t vd, vfloat64m4_t vs2,
                                size_t vl);
vuint64m4_t __riscv_vfcvt_rtz_xu_mu(vbool16_t vm, vuint64m4_t vd,
                                    vfloat64m4_t vs2, size_t vl);
vuint64m8_t __riscv_vfcvt_xu_mu(vbool8_t vm, vuint64m8_t vd, vfloat64m8_t vs2,
                                size_t vl);
vuint64m8_t __riscv_vfcvt_rtz_xu_mu(vbool8_t vm, vuint64m8_t vd,
                                    vfloat64m8_t vs2, size_t vl);
// vint64 -> vfloat64.
vfloat64m1_t __riscv_vfcvt_f_mu(vbool64_t vm, vfloat64m1_t vd, vint64m1_t vs2,
                                size_t vl);
vfloat64m2_t __riscv_vfcvt_f_mu(vbool32_t vm, vfloat64m2_t vd, vint64m2_t vs2,
                                size_t vl);
vfloat64m4_t __riscv_vfcvt_f_mu(vbool16_t vm, vfloat64m4_t vd, vint64m4_t vs2,
                                size_t vl);
vfloat64m8_t __riscv_vfcvt_f_mu(vbool8_t vm, vfloat64m8_t vd, vint64m8_t vs2,
                                size_t vl);
// vuint64 -> vfloat64.
vfloat64m1_t __riscv_vfcvt_f_mu(vbool64_t vm, vfloat64m1_t vd, vuint64m1_t vs2,
                                size_t vl);
vfloat64m2_t __riscv_vfcvt_f_mu(vbool32_t vm, vfloat64m2_t vd, vuint64m2_t vs2,
                                size_t vl);
vfloat64m4_t __riscv_vfcvt_f_mu(vbool16_t vm, vfloat64m4_t vd, vuint64m4_t vs2,
                                size_t vl);
vfloat64m8_t __riscv_vfcvt_f_mu(vbool8_t vm, vfloat64m8_t vd, vuint64m8_t vs2,
                                size_t vl);
// Unmasked _tu overloads that take an extra `unsigned int frm` argument (the
// rounding-mode operand per the RVV intrinsic specification). Unlike the
// masked groups these have no vm parameter; arguments are vd (same type as the
// result), source vs2, frm, and vl. No _rtz_ forms are listed in this group.
// 16-bit element types, vfloat16 -> vint16.
vint16mf4_t __riscv_vfcvt_x_tu(vint16mf4_t vd, vfloat16mf4_t vs2,
                               unsigned int frm, size_t vl);
vint16mf2_t __riscv_vfcvt_x_tu(vint16mf2_t vd, vfloat16mf2_t vs2,
                               unsigned int frm, size_t vl);
vint16m1_t __riscv_vfcvt_x_tu(vint16m1_t vd, vfloat16m1_t vs2, unsigned int frm,
                              size_t vl);
vint16m2_t __riscv_vfcvt_x_tu(vint16m2_t vd, vfloat16m2_t vs2, unsigned int frm,
                              size_t vl);
vint16m4_t __riscv_vfcvt_x_tu(vint16m4_t vd, vfloat16m4_t vs2, unsigned int frm,
                              size_t vl);
vint16m8_t __riscv_vfcvt_x_tu(vint16m8_t vd, vfloat16m8_t vs2, unsigned int frm,
                              size_t vl);
// vfloat16 -> vuint16.
vuint16mf4_t __riscv_vfcvt_xu_tu(vuint16mf4_t vd, vfloat16mf4_t vs2,
                                 unsigned int frm, size_t vl);
vuint16mf2_t __riscv_vfcvt_xu_tu(vuint16mf2_t vd, vfloat16mf2_t vs2,
                                 unsigned int frm, size_t vl);
vuint16m1_t __riscv_vfcvt_xu_tu(vuint16m1_t vd, vfloat16m1_t vs2,
                                unsigned int frm, size_t vl);
vuint16m2_t __riscv_vfcvt_xu_tu(vuint16m2_t vd, vfloat16m2_t vs2,
                                unsigned int frm, size_t vl);
vuint16m4_t __riscv_vfcvt_xu_tu(vuint16m4_t vd, vfloat16m4_t vs2,
                                unsigned int frm, size_t vl);
vuint16m8_t __riscv_vfcvt_xu_tu(vuint16m8_t vd, vfloat16m8_t vs2,
                                unsigned int frm, size_t vl);
// vint16 -> vfloat16.
vfloat16mf4_t __riscv_vfcvt_f_tu(vfloat16mf4_t vd, vint16mf4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfcvt_f_tu(vfloat16mf2_t vd, vint16mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfcvt_f_tu(vfloat16m1_t vd, vint16m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfcvt_f_tu(vfloat16m2_t vd, vint16m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfcvt_f_tu(vfloat16m4_t vd, vint16m4_t vs2,
                                unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfcvt_f_tu(vfloat16m8_t vd, vint16m8_t vs2,
                                unsigned int frm, size_t vl);
// vuint16 -> vfloat16.
vfloat16mf4_t __riscv_vfcvt_f_tu(vfloat16mf4_t vd, vuint16mf4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfcvt_f_tu(vfloat16mf2_t vd, vuint16mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfcvt_f_tu(vfloat16m1_t vd, vuint16m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfcvt_f_tu(vfloat16m2_t vd, vuint16m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfcvt_f_tu(vfloat16m4_t vd, vuint16m4_t vs2,
                                unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfcvt_f_tu(vfloat16m8_t vd, vuint16m8_t vs2,
                                unsigned int frm, size_t vl);
// Unmasked _tu overloads with an explicit `unsigned int frm` argument, 32-bit
// element types. Arguments: vd (same type as the result), source vs2, frm, vl.
// vfloat32 -> vint32.
vint32mf2_t __riscv_vfcvt_x_tu(vint32mf2_t vd, vfloat32mf2_t vs2,
                               unsigned int frm, size_t vl);
vint32m1_t __riscv_vfcvt_x_tu(vint32m1_t vd, vfloat32m1_t vs2, unsigned int frm,
                              size_t vl);
vint32m2_t __riscv_vfcvt_x_tu(vint32m2_t vd, vfloat32m2_t vs2, unsigned int frm,
                              size_t vl);
vint32m4_t __riscv_vfcvt_x_tu(vint32m4_t vd, vfloat32m4_t vs2, unsigned int frm,
                              size_t vl);
vint32m8_t __riscv_vfcvt_x_tu(vint32m8_t vd, vfloat32m8_t vs2, unsigned int frm,
                              size_t vl);
// vfloat32 -> vuint32.
vuint32mf2_t __riscv_vfcvt_xu_tu(vuint32mf2_t vd, vfloat32mf2_t vs2,
                                 unsigned int frm, size_t vl);
vuint32m1_t __riscv_vfcvt_xu_tu(vuint32m1_t vd, vfloat32m1_t vs2,
                                unsigned int frm, size_t vl);
vuint32m2_t __riscv_vfcvt_xu_tu(vuint32m2_t vd, vfloat32m2_t vs2,
                                unsigned int frm, size_t vl);
vuint32m4_t __riscv_vfcvt_xu_tu(vuint32m4_t vd, vfloat32m4_t vs2,
                                unsigned int frm, size_t vl);
vuint32m8_t __riscv_vfcvt_xu_tu(vuint32m8_t vd, vfloat32m8_t vs2,
                                unsigned int frm, size_t vl);
// vint32 -> vfloat32.
vfloat32mf2_t __riscv_vfcvt_f_tu(vfloat32mf2_t vd, vint32mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfcvt_f_tu(vfloat32m1_t vd, vint32m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfcvt_f_tu(vfloat32m2_t vd, vint32m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfcvt_f_tu(vfloat32m4_t vd, vint32m4_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfcvt_f_tu(vfloat32m8_t vd, vint32m8_t vs2,
                                unsigned int frm, size_t vl);
// vuint32 -> vfloat32.
vfloat32mf2_t __riscv_vfcvt_f_tu(vfloat32mf2_t vd, vuint32mf2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfcvt_f_tu(vfloat32m1_t vd, vuint32m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfcvt_f_tu(vfloat32m2_t vd, vuint32m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfcvt_f_tu(vfloat32m4_t vd, vuint32m4_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfcvt_f_tu(vfloat32m8_t vd, vuint32m8_t vs2,
                                unsigned int frm, size_t vl);
// Unmasked _tu overloads with an explicit `unsigned int frm` argument, 64-bit
// element types. Arguments: vd (same type as the result), source vs2, frm, vl.
// vfloat64 -> vint64.
vint64m1_t __riscv_vfcvt_x_tu(vint64m1_t vd, vfloat64m1_t vs2, unsigned int frm,
                              size_t vl);
vint64m2_t __riscv_vfcvt_x_tu(vint64m2_t vd, vfloat64m2_t vs2, unsigned int frm,
                              size_t vl);
vint64m4_t __riscv_vfcvt_x_tu(vint64m4_t vd, vfloat64m4_t vs2, unsigned int frm,
                              size_t vl);
vint64m8_t __riscv_vfcvt_x_tu(vint64m8_t vd, vfloat64m8_t vs2, unsigned int frm,
                              size_t vl);
// vfloat64 -> vuint64.
vuint64m1_t __riscv_vfcvt_xu_tu(vuint64m1_t vd, vfloat64m1_t vs2,
                                unsigned int frm, size_t vl);
vuint64m2_t __riscv_vfcvt_xu_tu(vuint64m2_t vd, vfloat64m2_t vs2,
                                unsigned int frm, size_t vl);
vuint64m4_t __riscv_vfcvt_xu_tu(vuint64m4_t vd, vfloat64m4_t vs2,
                                unsigned int frm, size_t vl);
vuint64m8_t __riscv_vfcvt_xu_tu(vuint64m8_t vd, vfloat64m8_t vs2,
                                unsigned int frm, size_t vl);
// vint64 -> vfloat64.
vfloat64m1_t __riscv_vfcvt_f_tu(vfloat64m1_t vd, vint64m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfcvt_f_tu(vfloat64m2_t vd, vint64m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfcvt_f_tu(vfloat64m4_t vd, vint64m4_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfcvt_f_tu(vfloat64m8_t vd, vint64m8_t vs2,
                                unsigned int frm, size_t vl);
// vuint64 -> vfloat64.
vfloat64m1_t __riscv_vfcvt_f_tu(vfloat64m1_t vd, vuint64m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfcvt_f_tu(vfloat64m2_t vd, vuint64m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfcvt_f_tu(vfloat64m4_t vd, vuint64m4_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfcvt_f_tu(vfloat64m8_t vd, vuint64m8_t vs2,
                                unsigned int frm, size_t vl);
// masked functions (_tum policy: tail undisturbed, mask agnostic)
vint16mf4_t __riscv_vfcvt_x_tum(vbool64_t vm, vint16mf4_t vd, vfloat16mf4_t vs2,
                                unsigned int frm, size_t vl);
vint16mf2_t __riscv_vfcvt_x_tum(vbool32_t vm, vint16mf2_t vd, vfloat16mf2_t vs2,
                                unsigned int frm, size_t vl);
vint16m1_t __riscv_vfcvt_x_tum(vbool16_t vm, vint16m1_t vd, vfloat16m1_t vs2,
                               unsigned int frm, size_t vl);
vint16m2_t __riscv_vfcvt_x_tum(vbool8_t vm, vint16m2_t vd, vfloat16m2_t vs2,
                               unsigned int frm, size_t vl);
vint16m4_t __riscv_vfcvt_x_tum(vbool4_t vm, vint16m4_t vd, vfloat16m4_t vs2,
                               unsigned int frm, size_t vl);
vint16m8_t __riscv_vfcvt_x_tum(vbool2_t vm, vint16m8_t vd, vfloat16m8_t vs2,
                               unsigned int frm, size_t vl);
vuint16mf4_t __riscv_vfcvt_xu_tum(vbool64_t vm, vuint16mf4_t vd,
                                  vfloat16mf4_t vs2, unsigned int frm,
                                  size_t vl);
vuint16mf2_t __riscv_vfcvt_xu_tum(vbool32_t vm, vuint16mf2_t vd,
                                  vfloat16mf2_t vs2, unsigned int frm,
                                  size_t vl);
vuint16m1_t __riscv_vfcvt_xu_tum(vbool16_t vm, vuint16m1_t vd, vfloat16m1_t vs2,
                                 unsigned int frm, size_t vl);
vuint16m2_t __riscv_vfcvt_xu_tum(vbool8_t vm, vuint16m2_t vd, vfloat16m2_t vs2,
                                 unsigned int frm, size_t vl);
vuint16m4_t __riscv_vfcvt_xu_tum(vbool4_t vm, vuint16m4_t vd, vfloat16m4_t vs2,
                                 unsigned int frm, size_t vl);
vuint16m8_t __riscv_vfcvt_xu_tum(vbool2_t vm, vuint16m8_t vd, vfloat16m8_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfcvt_f_tum(vbool64_t vm, vfloat16mf4_t vd,
                                  vint16mf4_t vs2, unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfcvt_f_tum(vbool32_t vm, vfloat16mf2_t vd,
                                  vint16mf2_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfcvt_f_tum(vbool16_t vm, vfloat16m1_t vd, vint16m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfcvt_f_tum(vbool8_t vm, vfloat16m2_t vd, vint16m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfcvt_f_tum(vbool4_t vm, vfloat16m4_t vd, vint16m4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfcvt_f_tum(vbool2_t vm, vfloat16m8_t vd, vint16m8_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfcvt_f_tum(vbool64_t vm, vfloat16mf4_t vd,
                                  vuint16mf4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16mf2_t __riscv_vfcvt_f_tum(vbool32_t vm, vfloat16mf2_t vd,
                                  vuint16mf2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16m1_t __riscv_vfcvt_f_tum(vbool16_t vm, vfloat16m1_t vd, vuint16m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfcvt_f_tum(vbool8_t vm, vfloat16m2_t vd, vuint16m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfcvt_f_tum(vbool4_t vm, vfloat16m4_t vd, vuint16m4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfcvt_f_tum(vbool2_t vm, vfloat16m8_t vd, vuint16m8_t vs2,
                                 unsigned int frm, size_t vl);
vint32mf2_t __riscv_vfcvt_x_tum(vbool64_t vm, vint32mf2_t vd, vfloat32mf2_t vs2,
                                unsigned int frm, size_t vl);
vint32m1_t __riscv_vfcvt_x_tum(vbool32_t vm, vint32m1_t vd, vfloat32m1_t vs2,
                               unsigned int frm, size_t vl);
vint32m2_t __riscv_vfcvt_x_tum(vbool16_t vm, vint32m2_t vd, vfloat32m2_t vs2,
                               unsigned int frm, size_t vl);
vint32m4_t __riscv_vfcvt_x_tum(vbool8_t vm, vint32m4_t vd, vfloat32m4_t vs2,
                               unsigned int frm, size_t vl);
vint32m8_t __riscv_vfcvt_x_tum(vbool4_t vm, vint32m8_t vd, vfloat32m8_t vs2,
                               unsigned int frm, size_t vl);
vuint32mf2_t __riscv_vfcvt_xu_tum(vbool64_t vm, vuint32mf2_t vd,
                                  vfloat32mf2_t vs2, unsigned int frm,
                                  size_t vl);
vuint32m1_t __riscv_vfcvt_xu_tum(vbool32_t vm, vuint32m1_t vd, vfloat32m1_t vs2,
                                 unsigned int frm, size_t vl);
vuint32m2_t __riscv_vfcvt_xu_tum(vbool16_t vm, vuint32m2_t vd, vfloat32m2_t vs2,
                                 unsigned int frm, size_t vl);
vuint32m4_t __riscv_vfcvt_xu_tum(vbool8_t vm, vuint32m4_t vd, vfloat32m4_t vs2,
                                 unsigned int frm, size_t vl);
vuint32m8_t __riscv_vfcvt_xu_tum(vbool4_t vm, vuint32m8_t vd, vfloat32m8_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfcvt_f_tum(vbool64_t vm, vfloat32mf2_t vd,
                                  vint32mf2_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfcvt_f_tum(vbool32_t vm, vfloat32m1_t vd, vint32m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfcvt_f_tum(vbool16_t vm, vfloat32m2_t vd, vint32m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfcvt_f_tum(vbool8_t vm, vfloat32m4_t vd, vint32m4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfcvt_f_tum(vbool4_t vm, vfloat32m8_t vd, vint32m8_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfcvt_f_tum(vbool64_t vm, vfloat32mf2_t vd,
                                  vuint32mf2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m1_t __riscv_vfcvt_f_tum(vbool32_t vm, vfloat32m1_t vd, vuint32m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfcvt_f_tum(vbool16_t vm, vfloat32m2_t vd, vuint32m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfcvt_f_tum(vbool8_t vm, vfloat32m4_t vd, vuint32m4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfcvt_f_tum(vbool4_t vm, vfloat32m8_t vd, vuint32m8_t vs2,
                                 unsigned int frm, size_t vl);
vint64m1_t __riscv_vfcvt_x_tum(vbool64_t vm, vint64m1_t vd, vfloat64m1_t vs2,
                               unsigned int frm, size_t vl);
vint64m2_t __riscv_vfcvt_x_tum(vbool32_t vm, vint64m2_t vd, vfloat64m2_t vs2,
                               unsigned int frm, size_t vl);
vint64m4_t __riscv_vfcvt_x_tum(vbool16_t vm, vint64m4_t vd, vfloat64m4_t vs2,
                               unsigned int frm, size_t vl);
vint64m8_t __riscv_vfcvt_x_tum(vbool8_t vm, vint64m8_t vd, vfloat64m8_t vs2,
                               unsigned int frm, size_t vl);
vuint64m1_t __riscv_vfcvt_xu_tum(vbool64_t vm, vuint64m1_t vd, vfloat64m1_t vs2,
                                 unsigned int frm, size_t vl);
vuint64m2_t __riscv_vfcvt_xu_tum(vbool32_t vm, vuint64m2_t vd, vfloat64m2_t vs2,
                                 unsigned int frm, size_t vl);
vuint64m4_t __riscv_vfcvt_xu_tum(vbool16_t vm, vuint64m4_t vd, vfloat64m4_t vs2,
                                 unsigned int frm, size_t vl);
vuint64m8_t __riscv_vfcvt_xu_tum(vbool8_t vm, vuint64m8_t vd, vfloat64m8_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfcvt_f_tum(vbool64_t vm, vfloat64m1_t vd, vint64m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfcvt_f_tum(vbool32_t vm, vfloat64m2_t vd, vint64m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfcvt_f_tum(vbool16_t vm, vfloat64m4_t vd, vint64m4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfcvt_f_tum(vbool8_t vm, vfloat64m8_t vd, vint64m8_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfcvt_f_tum(vbool64_t vm, vfloat64m1_t vd, vuint64m1_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfcvt_f_tum(vbool32_t vm, vfloat64m2_t vd, vuint64m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfcvt_f_tum(vbool16_t vm, vfloat64m4_t vd, vuint64m4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfcvt_f_tum(vbool8_t vm, vfloat64m8_t vd, vuint64m8_t vs2,
                                 unsigned int frm, size_t vl);
// masked functions (_tumu policy: tail undisturbed, mask undisturbed)
vint16mf4_t __riscv_vfcvt_x_tumu(vbool64_t vm, vint16mf4_t vd,
                                 vfloat16mf4_t vs2, unsigned int frm,
                                 size_t vl);
vint16mf2_t __riscv_vfcvt_x_tumu(vbool32_t vm, vint16mf2_t vd,
                                 vfloat16mf2_t vs2, unsigned int frm,
                                 size_t vl);
vint16m1_t __riscv_vfcvt_x_tumu(vbool16_t vm, vint16m1_t vd, vfloat16m1_t vs2,
                                unsigned int frm, size_t vl);
vint16m2_t __riscv_vfcvt_x_tumu(vbool8_t vm, vint16m2_t vd, vfloat16m2_t vs2,
                                unsigned int frm, size_t vl);
vint16m4_t __riscv_vfcvt_x_tumu(vbool4_t vm, vint16m4_t vd, vfloat16m4_t vs2,
                                unsigned int frm, size_t vl);
vint16m8_t __riscv_vfcvt_x_tumu(vbool2_t vm, vint16m8_t vd, vfloat16m8_t vs2,
                                unsigned int frm, size_t vl);
vuint16mf4_t __riscv_vfcvt_xu_tumu(vbool64_t vm, vuint16mf4_t vd,
                                   vfloat16mf4_t vs2, unsigned int frm,
                                   size_t vl);
vuint16mf2_t __riscv_vfcvt_xu_tumu(vbool32_t vm, vuint16mf2_t vd,
                                   vfloat16mf2_t vs2, unsigned int frm,
                                   size_t vl);
vuint16m1_t __riscv_vfcvt_xu_tumu(vbool16_t vm, vuint16m1_t vd,
                                  vfloat16m1_t vs2, unsigned int frm,
                                  size_t vl);
vuint16m2_t __riscv_vfcvt_xu_tumu(vbool8_t vm, vuint16m2_t vd, vfloat16m2_t vs2,
                                  unsigned int frm, size_t vl);
vuint16m4_t __riscv_vfcvt_xu_tumu(vbool4_t vm, vuint16m4_t vd, vfloat16m4_t vs2,
                                  unsigned int frm, size_t vl);
vuint16m8_t __riscv_vfcvt_xu_tumu(vbool2_t vm, vuint16m8_t vd, vfloat16m8_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfcvt_f_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                   vint16mf4_t vs2, unsigned int frm,
                                   size_t vl);
vfloat16mf2_t __riscv_vfcvt_f_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                   vint16mf2_t vs2, unsigned int frm,
                                   size_t vl);
vfloat16m1_t __riscv_vfcvt_f_tumu(vbool16_t vm, vfloat16m1_t vd, vint16m1_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfcvt_f_tumu(vbool8_t vm, vfloat16m2_t vd, vint16m2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfcvt_f_tumu(vbool4_t vm, vfloat16m4_t vd, vint16m4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfcvt_f_tumu(vbool2_t vm, vfloat16m8_t vd, vint16m8_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfcvt_f_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                   vuint16mf4_t vs2, unsigned int frm,
                                   size_t vl);
vfloat16mf2_t __riscv_vfcvt_f_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                   vuint16mf2_t vs2, unsigned int frm,
                                   size_t vl);
vfloat16m1_t __riscv_vfcvt_f_tumu(vbool16_t vm, vfloat16m1_t vd,
                                  vuint16m1_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfcvt_f_tumu(vbool8_t vm, vfloat16m2_t vd, vuint16m2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfcvt_f_tumu(vbool4_t vm, vfloat16m4_t vd, vuint16m4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfcvt_f_tumu(vbool2_t vm, vfloat16m8_t vd, vuint16m8_t vs2,
                                  unsigned int frm, size_t vl);
vint32mf2_t __riscv_vfcvt_x_tumu(vbool64_t vm, vint32mf2_t vd,
                                 vfloat32mf2_t vs2, unsigned int frm,
                                 size_t vl);
vint32m1_t __riscv_vfcvt_x_tumu(vbool32_t vm, vint32m1_t vd, vfloat32m1_t vs2,
                                unsigned int frm, size_t vl);
vint32m2_t __riscv_vfcvt_x_tumu(vbool16_t vm, vint32m2_t vd, vfloat32m2_t vs2,
                                unsigned int frm, size_t vl);
vint32m4_t __riscv_vfcvt_x_tumu(vbool8_t vm, vint32m4_t vd, vfloat32m4_t vs2,
                                unsigned int frm, size_t vl);
vint32m8_t __riscv_vfcvt_x_tumu(vbool4_t vm, vint32m8_t vd, vfloat32m8_t vs2,
                                unsigned int frm, size_t vl);
vuint32mf2_t __riscv_vfcvt_xu_tumu(vbool64_t vm, vuint32mf2_t vd,
                                   vfloat32mf2_t vs2, unsigned int frm,
                                   size_t vl);
vuint32m1_t __riscv_vfcvt_xu_tumu(vbool32_t vm, vuint32m1_t vd,
                                  vfloat32m1_t vs2, unsigned int frm,
                                  size_t vl);
vuint32m2_t __riscv_vfcvt_xu_tumu(vbool16_t vm, vuint32m2_t vd,
                                  vfloat32m2_t vs2, unsigned int frm,
                                  size_t vl);
vuint32m4_t __riscv_vfcvt_xu_tumu(vbool8_t vm, vuint32m4_t vd, vfloat32m4_t vs2,
                                  unsigned int frm, size_t vl);
vuint32m8_t __riscv_vfcvt_xu_tumu(vbool4_t vm, vuint32m8_t vd, vfloat32m8_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfcvt_f_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                   vint32mf2_t vs2, unsigned int frm,
                                   size_t vl);
vfloat32m1_t __riscv_vfcvt_f_tumu(vbool32_t vm, vfloat32m1_t vd, vint32m1_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfcvt_f_tumu(vbool16_t vm, vfloat32m2_t vd, vint32m2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfcvt_f_tumu(vbool8_t vm, vfloat32m4_t vd, vint32m4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfcvt_f_tumu(vbool4_t vm, vfloat32m8_t vd, vint32m8_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfcvt_f_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                   vuint32mf2_t vs2, unsigned int frm,
                                   size_t vl);
vfloat32m1_t __riscv_vfcvt_f_tumu(vbool32_t vm, vfloat32m1_t vd,
                                  vuint32m1_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfcvt_f_tumu(vbool16_t vm, vfloat32m2_t vd,
                                  vuint32m2_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfcvt_f_tumu(vbool8_t vm, vfloat32m4_t vd, vuint32m4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfcvt_f_tumu(vbool4_t vm, vfloat32m8_t vd, vuint32m8_t vs2,
                                  unsigned int frm, size_t vl);
vint64m1_t __riscv_vfcvt_x_tumu(vbool64_t vm, vint64m1_t vd, vfloat64m1_t vs2,
                                unsigned int frm, size_t vl);
vint64m2_t __riscv_vfcvt_x_tumu(vbool32_t vm, vint64m2_t vd, vfloat64m2_t vs2,
                                unsigned int frm, size_t vl);
vint64m4_t __riscv_vfcvt_x_tumu(vbool16_t vm, vint64m4_t vd, vfloat64m4_t vs2,
                                unsigned int frm, size_t vl);
vint64m8_t __riscv_vfcvt_x_tumu(vbool8_t vm, vint64m8_t vd, vfloat64m8_t vs2,
                                unsigned int frm, size_t vl);
vuint64m1_t __riscv_vfcvt_xu_tumu(vbool64_t vm, vuint64m1_t vd,
                                  vfloat64m1_t vs2, unsigned int frm,
                                  size_t vl);
vuint64m2_t __riscv_vfcvt_xu_tumu(vbool32_t vm, vuint64m2_t vd,
                                  vfloat64m2_t vs2, unsigned int frm,
                                  size_t vl);
vuint64m4_t __riscv_vfcvt_xu_tumu(vbool16_t vm, vuint64m4_t vd,
                                  vfloat64m4_t vs2, unsigned int frm,
                                  size_t vl);
vuint64m8_t __riscv_vfcvt_xu_tumu(vbool8_t vm, vuint64m8_t vd, vfloat64m8_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfcvt_f_tumu(vbool64_t vm, vfloat64m1_t vd, vint64m1_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfcvt_f_tumu(vbool32_t vm, vfloat64m2_t vd, vint64m2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfcvt_f_tumu(vbool16_t vm, vfloat64m4_t vd, vint64m4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfcvt_f_tumu(vbool8_t vm, vfloat64m8_t vd, vint64m8_t vs2,
                                  unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfcvt_f_tumu(vbool64_t vm, vfloat64m1_t vd,
                                  vuint64m1_t vs2, unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfcvt_f_tumu(vbool32_t vm, vfloat64m2_t vd,
                                  vuint64m2_t vs2, unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfcvt_f_tumu(vbool16_t vm, vfloat64m4_t vd,
                                  vuint64m4_t vs2, unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfcvt_f_tumu(vbool8_t vm, vfloat64m8_t vd, vuint64m8_t vs2,
                                  unsigned int frm, size_t vl);
// masked functions (_mu policy: tail agnostic, mask undisturbed)
vint16mf4_t __riscv_vfcvt_x_mu(vbool64_t vm, vint16mf4_t vd, vfloat16mf4_t vs2,
                               unsigned int frm, size_t vl);
vint16mf2_t __riscv_vfcvt_x_mu(vbool32_t vm, vint16mf2_t vd, vfloat16mf2_t vs2,
                               unsigned int frm, size_t vl);
vint16m1_t __riscv_vfcvt_x_mu(vbool16_t vm, vint16m1_t vd, vfloat16m1_t vs2,
                              unsigned int frm, size_t vl);
vint16m2_t __riscv_vfcvt_x_mu(vbool8_t vm, vint16m2_t vd, vfloat16m2_t vs2,
                              unsigned int frm, size_t vl);
vint16m4_t __riscv_vfcvt_x_mu(vbool4_t vm, vint16m4_t vd, vfloat16m4_t vs2,
                              unsigned int frm, size_t vl);
vint16m8_t __riscv_vfcvt_x_mu(vbool2_t vm, vint16m8_t vd, vfloat16m8_t vs2,
                              unsigned int frm, size_t vl);
vuint16mf4_t __riscv_vfcvt_xu_mu(vbool64_t vm, vuint16mf4_t vd,
                                 vfloat16mf4_t vs2, unsigned int frm,
                                 size_t vl);
vuint16mf2_t __riscv_vfcvt_xu_mu(vbool32_t vm, vuint16mf2_t vd,
                                 vfloat16mf2_t vs2, unsigned int frm,
                                 size_t vl);
vuint16m1_t __riscv_vfcvt_xu_mu(vbool16_t vm, vuint16m1_t vd, vfloat16m1_t vs2,
                                unsigned int frm, size_t vl);
vuint16m2_t __riscv_vfcvt_xu_mu(vbool8_t vm, vuint16m2_t vd, vfloat16m2_t vs2,
                                unsigned int frm, size_t vl);
vuint16m4_t __riscv_vfcvt_xu_mu(vbool4_t vm, vuint16m4_t vd, vfloat16m4_t vs2,
                                unsigned int frm, size_t vl);
vuint16m8_t __riscv_vfcvt_xu_mu(vbool2_t vm, vuint16m8_t vd, vfloat16m8_t vs2,
                                unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfcvt_f_mu(vbool64_t vm, vfloat16mf4_t vd,
                                 vint16mf4_t vs2, unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfcvt_f_mu(vbool32_t vm, vfloat16mf2_t vd,
                                 vint16mf2_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfcvt_f_mu(vbool16_t vm, vfloat16m1_t vd, vint16m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfcvt_f_mu(vbool8_t vm, vfloat16m2_t vd, vint16m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfcvt_f_mu(vbool4_t vm, vfloat16m4_t vd, vint16m4_t vs2,
                                unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfcvt_f_mu(vbool2_t vm, vfloat16m8_t vd, vint16m8_t vs2,
                                unsigned int frm, size_t vl);
vfloat16mf4_t __riscv_vfcvt_f_mu(vbool64_t vm, vfloat16mf4_t vd,
                                 vuint16mf4_t vs2, unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfcvt_f_mu(vbool32_t vm, vfloat16mf2_t vd,
                                 vuint16mf2_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfcvt_f_mu(vbool16_t vm, vfloat16m1_t vd, vuint16m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfcvt_f_mu(vbool8_t vm, vfloat16m2_t vd, vuint16m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfcvt_f_mu(vbool4_t vm, vfloat16m4_t vd, vuint16m4_t vs2,
                                unsigned int frm, size_t vl);
vfloat16m8_t __riscv_vfcvt_f_mu(vbool2_t vm, vfloat16m8_t vd, vuint16m8_t vs2,
                                unsigned int frm, size_t vl);
vint32mf2_t __riscv_vfcvt_x_mu(vbool64_t vm, vint32mf2_t vd, vfloat32mf2_t vs2,
                               unsigned int frm, size_t vl);
vint32m1_t __riscv_vfcvt_x_mu(vbool32_t vm, vint32m1_t vd, vfloat32m1_t vs2,
                              unsigned int frm, size_t vl);
vint32m2_t __riscv_vfcvt_x_mu(vbool16_t vm, vint32m2_t vd, vfloat32m2_t vs2,
                              unsigned int frm, size_t vl);
vint32m4_t __riscv_vfcvt_x_mu(vbool8_t vm, vint32m4_t vd, vfloat32m4_t vs2,
                              unsigned int frm, size_t vl);
vint32m8_t __riscv_vfcvt_x_mu(vbool4_t vm, vint32m8_t vd, vfloat32m8_t vs2,
                              unsigned int frm, size_t vl);
vuint32mf2_t __riscv_vfcvt_xu_mu(vbool64_t vm, vuint32mf2_t vd,
                                 vfloat32mf2_t vs2, unsigned int frm,
                                 size_t vl);
vuint32m1_t __riscv_vfcvt_xu_mu(vbool32_t vm, vuint32m1_t vd, vfloat32m1_t vs2,
                                unsigned int frm, size_t vl);
vuint32m2_t __riscv_vfcvt_xu_mu(vbool16_t vm, vuint32m2_t vd, vfloat32m2_t vs2,
                                unsigned int frm, size_t vl);
vuint32m4_t __riscv_vfcvt_xu_mu(vbool8_t vm, vuint32m4_t vd, vfloat32m4_t vs2,
                                unsigned int frm, size_t vl);
vuint32m8_t __riscv_vfcvt_xu_mu(vbool4_t vm, vuint32m8_t vd, vfloat32m8_t vs2,
                                unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfcvt_f_mu(vbool64_t vm, vfloat32mf2_t vd,
                                 vint32mf2_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfcvt_f_mu(vbool32_t vm, vfloat32m1_t vd, vint32m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfcvt_f_mu(vbool16_t vm, vfloat32m2_t vd, vint32m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfcvt_f_mu(vbool8_t vm, vfloat32m4_t vd, vint32m4_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfcvt_f_mu(vbool4_t vm, vfloat32m8_t vd, vint32m8_t vs2,
                                unsigned int frm, size_t vl);
vfloat32mf2_t __riscv_vfcvt_f_mu(vbool64_t vm, vfloat32mf2_t vd,
                                 vuint32mf2_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfcvt_f_mu(vbool32_t vm, vfloat32m1_t vd, vuint32m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfcvt_f_mu(vbool16_t vm, vfloat32m2_t vd, vuint32m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfcvt_f_mu(vbool8_t vm, vfloat32m4_t vd, vuint32m4_t vs2,
                                unsigned int frm, size_t vl);
vfloat32m8_t __riscv_vfcvt_f_mu(vbool4_t vm, vfloat32m8_t vd, vuint32m8_t vs2,
                                unsigned int frm, size_t vl);
vint64m1_t __riscv_vfcvt_x_mu(vbool64_t vm, vint64m1_t vd, vfloat64m1_t vs2,
                              unsigned int frm, size_t vl);
vint64m2_t __riscv_vfcvt_x_mu(vbool32_t vm, vint64m2_t vd, vfloat64m2_t vs2,
                              unsigned int frm, size_t vl);
vint64m4_t __riscv_vfcvt_x_mu(vbool16_t vm, vint64m4_t vd, vfloat64m4_t vs2,
                              unsigned int frm, size_t vl);
vint64m8_t __riscv_vfcvt_x_mu(vbool8_t vm, vint64m8_t vd, vfloat64m8_t vs2,
                              unsigned int frm, size_t vl);
vuint64m1_t __riscv_vfcvt_xu_mu(vbool64_t vm, vuint64m1_t vd, vfloat64m1_t vs2,
                                unsigned int frm, size_t vl);
vuint64m2_t __riscv_vfcvt_xu_mu(vbool32_t vm, vuint64m2_t vd, vfloat64m2_t vs2,
                                unsigned int frm, size_t vl);
vuint64m4_t __riscv_vfcvt_xu_mu(vbool16_t vm, vuint64m4_t vd, vfloat64m4_t vs2,
                                unsigned int frm, size_t vl);
vuint64m8_t __riscv_vfcvt_xu_mu(vbool8_t vm, vuint64m8_t vd, vfloat64m8_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfcvt_f_mu(vbool64_t vm, vfloat64m1_t vd, vint64m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfcvt_f_mu(vbool32_t vm, vfloat64m2_t vd, vint64m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfcvt_f_mu(vbool16_t vm, vfloat64m4_t vd, vint64m4_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfcvt_f_mu(vbool8_t vm, vfloat64m8_t vd, vint64m8_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfcvt_f_mu(vbool64_t vm, vfloat64m1_t vd, vuint64m1_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m2_t __riscv_vfcvt_f_mu(vbool32_t vm, vfloat64m2_t vd, vuint64m2_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m4_t __riscv_vfcvt_f_mu(vbool16_t vm, vfloat64m4_t vd, vuint64m4_t vs2,
                                unsigned int frm, size_t vl);
vfloat64m8_t __riscv_vfcvt_f_mu(vbool8_t vm, vfloat64m8_t vd, vuint64m8_t vs2,
                                unsigned int frm, size_t vl);

Widening Floating-Point/Integer Type-Convert Intrinsics

vfloat16mf4_t __riscv_vfwcvt_f_tu(vfloat16mf4_t vd, vint8mf8_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfwcvt_f_tu(vfloat16mf2_t vd, vint8mf4_t vs2, size_t vl);
vfloat16m1_t __riscv_vfwcvt_f_tu(vfloat16m1_t vd, vint8mf2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfwcvt_f_tu(vfloat16m2_t vd, vint8m1_t vs2, size_t vl);
vfloat16m4_t __riscv_vfwcvt_f_tu(vfloat16m4_t vd, vint8m2_t vs2, size_t vl);
vfloat16m8_t __riscv_vfwcvt_f_tu(vfloat16m8_t vd, vint8m4_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfwcvt_f_tu(vfloat16mf4_t vd, vuint8mf8_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfwcvt_f_tu(vfloat16mf2_t vd, vuint8mf4_t vs2, size_t vl);
vfloat16m1_t __riscv_vfwcvt_f_tu(vfloat16m1_t vd, vuint8mf2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfwcvt_f_tu(vfloat16m2_t vd, vuint8m1_t vs2, size_t vl);
vfloat16m4_t __riscv_vfwcvt_f_tu(vfloat16m4_t vd, vuint8m2_t vs2, size_t vl);
vfloat16m8_t __riscv_vfwcvt_f_tu(vfloat16m8_t vd, vuint8m4_t vs2, size_t vl);
vint32mf2_t __riscv_vfwcvt_x_tu(vint32mf2_t vd, vfloat16mf4_t vs2, size_t vl);
vint32mf2_t __riscv_vfwcvt_rtz_x_tu(vint32mf2_t vd, vfloat16mf4_t vs2,
                                    size_t vl);
vint32m1_t __riscv_vfwcvt_x_tu(vint32m1_t vd, vfloat16mf2_t vs2, size_t vl);
vint32m1_t __riscv_vfwcvt_rtz_x_tu(vint32m1_t vd, vfloat16mf2_t vs2, size_t vl);
vint32m2_t __riscv_vfwcvt_x_tu(vint32m2_t vd, vfloat16m1_t vs2, size_t vl);
vint32m2_t __riscv_vfwcvt_rtz_x_tu(vint32m2_t vd, vfloat16m1_t vs2, size_t vl);
vint32m4_t __riscv_vfwcvt_x_tu(vint32m4_t vd, vfloat16m2_t vs2, size_t vl);
vint32m4_t __riscv_vfwcvt_rtz_x_tu(vint32m4_t vd, vfloat16m2_t vs2, size_t vl);
vint32m8_t __riscv_vfwcvt_x_tu(vint32m8_t vd, vfloat16m4_t vs2, size_t vl);
vint32m8_t __riscv_vfwcvt_rtz_x_tu(vint32m8_t vd, vfloat16m4_t vs2, size_t vl);
vuint32mf2_t __riscv_vfwcvt_xu_tu(vuint32mf2_t vd, vfloat16mf4_t vs2,
                                  size_t vl);
vuint32mf2_t __riscv_vfwcvt_rtz_xu_tu(vuint32mf2_t vd, vfloat16mf4_t vs2,
                                      size_t vl);
vuint32m1_t __riscv_vfwcvt_xu_tu(vuint32m1_t vd, vfloat16mf2_t vs2, size_t vl);
vuint32m1_t __riscv_vfwcvt_rtz_xu_tu(vuint32m1_t vd, vfloat16mf2_t vs2,
                                     size_t vl);
vuint32m2_t __riscv_vfwcvt_xu_tu(vuint32m2_t vd, vfloat16m1_t vs2, size_t vl);
vuint32m2_t __riscv_vfwcvt_rtz_xu_tu(vuint32m2_t vd, vfloat16m1_t vs2,
                                     size_t vl);
vuint32m4_t __riscv_vfwcvt_xu_tu(vuint32m4_t vd, vfloat16m2_t vs2, size_t vl);
vuint32m4_t __riscv_vfwcvt_rtz_xu_tu(vuint32m4_t vd, vfloat16m2_t vs2,
                                     size_t vl);
vuint32m8_t __riscv_vfwcvt_xu_tu(vuint32m8_t vd, vfloat16m4_t vs2, size_t vl);
vuint32m8_t __riscv_vfwcvt_rtz_xu_tu(vuint32m8_t vd, vfloat16m4_t vs2,
                                     size_t vl);
vfloat32mf2_t __riscv_vfwcvt_f_tu(vfloat32mf2_t vd, vint16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwcvt_f_tu(vfloat32m1_t vd, vint16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwcvt_f_tu(vfloat32m2_t vd, vint16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwcvt_f_tu(vfloat32m4_t vd, vint16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwcvt_f_tu(vfloat32m8_t vd, vint16m4_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfwcvt_f_tu(vfloat32mf2_t vd, vuint16mf4_t vs2,
                                  size_t vl);
vfloat32m1_t __riscv_vfwcvt_f_tu(vfloat32m1_t vd, vuint16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwcvt_f_tu(vfloat32m2_t vd, vuint16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwcvt_f_tu(vfloat32m4_t vd, vuint16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwcvt_f_tu(vfloat32m8_t vd, vuint16m4_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfwcvt_f_tu(vfloat32mf2_t vd, vfloat16mf4_t vs2,
                                  size_t vl);
vfloat32m1_t __riscv_vfwcvt_f_tu(vfloat32m1_t vd, vfloat16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwcvt_f_tu(vfloat32m2_t vd, vfloat16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwcvt_f_tu(vfloat32m4_t vd, vfloat16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwcvt_f_tu(vfloat32m8_t vd, vfloat16m4_t vs2, size_t vl);
vint64m1_t __riscv_vfwcvt_x_tu(vint64m1_t vd, vfloat32mf2_t vs2, size_t vl);
vint64m1_t __riscv_vfwcvt_rtz_x_tu(vint64m1_t vd, vfloat32mf2_t vs2, size_t vl);
vint64m2_t __riscv_vfwcvt_x_tu(vint64m2_t vd, vfloat32m1_t vs2, size_t vl);
vint64m2_t __riscv_vfwcvt_rtz_x_tu(vint64m2_t vd, vfloat32m1_t vs2, size_t vl);
vint64m4_t __riscv_vfwcvt_x_tu(vint64m4_t vd, vfloat32m2_t vs2, size_t vl);
vint64m4_t __riscv_vfwcvt_rtz_x_tu(vint64m4_t vd, vfloat32m2_t vs2, size_t vl);
vint64m8_t __riscv_vfwcvt_x_tu(vint64m8_t vd, vfloat32m4_t vs2, size_t vl);
vint64m8_t __riscv_vfwcvt_rtz_x_tu(vint64m8_t vd, vfloat32m4_t vs2, size_t vl);
vuint64m1_t __riscv_vfwcvt_xu_tu(vuint64m1_t vd, vfloat32mf2_t vs2, size_t vl);
vuint64m1_t __riscv_vfwcvt_rtz_xu_tu(vuint64m1_t vd, vfloat32mf2_t vs2,
                                     size_t vl);
vuint64m2_t __riscv_vfwcvt_xu_tu(vuint64m2_t vd, vfloat32m1_t vs2, size_t vl);
vuint64m2_t __riscv_vfwcvt_rtz_xu_tu(vuint64m2_t vd, vfloat32m1_t vs2,
                                     size_t vl);
vuint64m4_t __riscv_vfwcvt_xu_tu(vuint64m4_t vd, vfloat32m2_t vs2, size_t vl);
vuint64m4_t __riscv_vfwcvt_rtz_xu_tu(vuint64m4_t vd, vfloat32m2_t vs2,
                                     size_t vl);
vuint64m8_t __riscv_vfwcvt_xu_tu(vuint64m8_t vd, vfloat32m4_t vs2, size_t vl);
vuint64m8_t __riscv_vfwcvt_rtz_xu_tu(vuint64m8_t vd, vfloat32m4_t vs2,
                                     size_t vl);
vfloat64m1_t __riscv_vfwcvt_f_tu(vfloat64m1_t vd, vint32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwcvt_f_tu(vfloat64m2_t vd, vint32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwcvt_f_tu(vfloat64m4_t vd, vint32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwcvt_f_tu(vfloat64m8_t vd, vint32m4_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwcvt_f_tu(vfloat64m1_t vd, vuint32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwcvt_f_tu(vfloat64m2_t vd, vuint32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwcvt_f_tu(vfloat64m4_t vd, vuint32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwcvt_f_tu(vfloat64m8_t vd, vuint32m4_t vs2, size_t vl);
vfloat64m1_t __riscv_vfwcvt_f_tu(vfloat64m1_t vd, vfloat32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwcvt_f_tu(vfloat64m2_t vd, vfloat32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwcvt_f_tu(vfloat64m4_t vd, vfloat32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwcvt_f_tu(vfloat64m8_t vd, vfloat32m4_t vs2, size_t vl);
// masked functions (`_tum` suffix): every overload takes the mask `vm` first,
// then the destination operand `vd`, the source `vs2` (element width half that
// of the destination), and `vl`.
// NOTE(review): `_tum` is presumably the tail-undisturbed / mask-agnostic
// policy and `_rtz` round-towards-zero -- confirm against the RVV intrinsics
// specification.
// vint8 source -> vfloat16 destination.
vfloat16mf4_t __riscv_vfwcvt_f_tum(vbool64_t vm, vfloat16mf4_t vd,
                                   vint8mf8_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfwcvt_f_tum(vbool32_t vm, vfloat16mf2_t vd,
                                   vint8mf4_t vs2, size_t vl);
vfloat16m1_t __riscv_vfwcvt_f_tum(vbool16_t vm, vfloat16m1_t vd, vint8mf2_t vs2,
                                  size_t vl);
vfloat16m2_t __riscv_vfwcvt_f_tum(vbool8_t vm, vfloat16m2_t vd, vint8m1_t vs2,
                                  size_t vl);
vfloat16m4_t __riscv_vfwcvt_f_tum(vbool4_t vm, vfloat16m4_t vd, vint8m2_t vs2,
                                  size_t vl);
vfloat16m8_t __riscv_vfwcvt_f_tum(vbool2_t vm, vfloat16m8_t vd, vint8m4_t vs2,
                                  size_t vl);
// vuint8 source -> vfloat16 destination.
vfloat16mf4_t __riscv_vfwcvt_f_tum(vbool64_t vm, vfloat16mf4_t vd,
                                   vuint8mf8_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfwcvt_f_tum(vbool32_t vm, vfloat16mf2_t vd,
                                   vuint8mf4_t vs2, size_t vl);
vfloat16m1_t __riscv_vfwcvt_f_tum(vbool16_t vm, vfloat16m1_t vd,
                                  vuint8mf2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfwcvt_f_tum(vbool8_t vm, vfloat16m2_t vd, vuint8m1_t vs2,
                                  size_t vl);
vfloat16m4_t __riscv_vfwcvt_f_tum(vbool4_t vm, vfloat16m4_t vd, vuint8m2_t vs2,
                                  size_t vl);
vfloat16m8_t __riscv_vfwcvt_f_tum(vbool2_t vm, vfloat16m8_t vd, vuint8m4_t vs2,
                                  size_t vl);
// vfloat16 source -> vint32 destination (`_x` / `_rtz_x` pairs per LMUL).
vint32mf2_t __riscv_vfwcvt_x_tum(vbool64_t vm, vint32mf2_t vd,
                                 vfloat16mf4_t vs2, size_t vl);
vint32mf2_t __riscv_vfwcvt_rtz_x_tum(vbool64_t vm, vint32mf2_t vd,
                                     vfloat16mf4_t vs2, size_t vl);
vint32m1_t __riscv_vfwcvt_x_tum(vbool32_t vm, vint32m1_t vd, vfloat16mf2_t vs2,
                                size_t vl);
vint32m1_t __riscv_vfwcvt_rtz_x_tum(vbool32_t vm, vint32m1_t vd,
                                    vfloat16mf2_t vs2, size_t vl);
vint32m2_t __riscv_vfwcvt_x_tum(vbool16_t vm, vint32m2_t vd, vfloat16m1_t vs2,
                                size_t vl);
vint32m2_t __riscv_vfwcvt_rtz_x_tum(vbool16_t vm, vint32m2_t vd,
                                    vfloat16m1_t vs2, size_t vl);
vint32m4_t __riscv_vfwcvt_x_tum(vbool8_t vm, vint32m4_t vd, vfloat16m2_t vs2,
                                size_t vl);
vint32m4_t __riscv_vfwcvt_rtz_x_tum(vbool8_t vm, vint32m4_t vd,
                                    vfloat16m2_t vs2, size_t vl);
vint32m8_t __riscv_vfwcvt_x_tum(vbool4_t vm, vint32m8_t vd, vfloat16m4_t vs2,
                                size_t vl);
vint32m8_t __riscv_vfwcvt_rtz_x_tum(vbool4_t vm, vint32m8_t vd,
                                    vfloat16m4_t vs2, size_t vl);
// vfloat16 source -> vuint32 destination (`_xu` / `_rtz_xu` pairs per LMUL).
vuint32mf2_t __riscv_vfwcvt_xu_tum(vbool64_t vm, vuint32mf2_t vd,
                                   vfloat16mf4_t vs2, size_t vl);
vuint32mf2_t __riscv_vfwcvt_rtz_xu_tum(vbool64_t vm, vuint32mf2_t vd,
                                       vfloat16mf4_t vs2, size_t vl);
vuint32m1_t __riscv_vfwcvt_xu_tum(vbool32_t vm, vuint32m1_t vd,
                                  vfloat16mf2_t vs2, size_t vl);
vuint32m1_t __riscv_vfwcvt_rtz_xu_tum(vbool32_t vm, vuint32m1_t vd,
                                      vfloat16mf2_t vs2, size_t vl);
vuint32m2_t __riscv_vfwcvt_xu_tum(vbool16_t vm, vuint32m2_t vd,
                                  vfloat16m1_t vs2, size_t vl);
vuint32m2_t __riscv_vfwcvt_rtz_xu_tum(vbool16_t vm, vuint32m2_t vd,
                                      vfloat16m1_t vs2, size_t vl);
vuint32m4_t __riscv_vfwcvt_xu_tum(vbool8_t vm, vuint32m4_t vd, vfloat16m2_t vs2,
                                  size_t vl);
vuint32m4_t __riscv_vfwcvt_rtz_xu_tum(vbool8_t vm, vuint32m4_t vd,
                                      vfloat16m2_t vs2, size_t vl);
vuint32m8_t __riscv_vfwcvt_xu_tum(vbool4_t vm, vuint32m8_t vd, vfloat16m4_t vs2,
                                  size_t vl);
vuint32m8_t __riscv_vfwcvt_rtz_xu_tum(vbool4_t vm, vuint32m8_t vd,
                                      vfloat16m4_t vs2, size_t vl);
// vint16 source -> vfloat32 destination.
vfloat32mf2_t __riscv_vfwcvt_f_tum(vbool64_t vm, vfloat32mf2_t vd,
                                   vint16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwcvt_f_tum(vbool32_t vm, vfloat32m1_t vd,
                                  vint16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwcvt_f_tum(vbool16_t vm, vfloat32m2_t vd, vint16m1_t vs2,
                                  size_t vl);
vfloat32m4_t __riscv_vfwcvt_f_tum(vbool8_t vm, vfloat32m4_t vd, vint16m2_t vs2,
                                  size_t vl);
vfloat32m8_t __riscv_vfwcvt_f_tum(vbool4_t vm, vfloat32m8_t vd, vint16m4_t vs2,
                                  size_t vl);
// vuint16 source -> vfloat32 destination.
vfloat32mf2_t __riscv_vfwcvt_f_tum(vbool64_t vm, vfloat32mf2_t vd,
                                   vuint16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwcvt_f_tum(vbool32_t vm, vfloat32m1_t vd,
                                  vuint16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwcvt_f_tum(vbool16_t vm, vfloat32m2_t vd,
                                  vuint16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwcvt_f_tum(vbool8_t vm, vfloat32m4_t vd, vuint16m2_t vs2,
                                  size_t vl);
vfloat32m8_t __riscv_vfwcvt_f_tum(vbool4_t vm, vfloat32m8_t vd, vuint16m4_t vs2,
                                  size_t vl);
// vfloat16 source -> vfloat32 destination.
vfloat32mf2_t __riscv_vfwcvt_f_tum(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwcvt_f_tum(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwcvt_f_tum(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwcvt_f_tum(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwcvt_f_tum(vbool4_t vm, vfloat32m8_t vd,
                                  vfloat16m4_t vs2, size_t vl);
// vfloat32 source -> vint64 destination (`_x` / `_rtz_x` pairs per LMUL).
vint64m1_t __riscv_vfwcvt_x_tum(vbool64_t vm, vint64m1_t vd, vfloat32mf2_t vs2,
                                size_t vl);
vint64m1_t __riscv_vfwcvt_rtz_x_tum(vbool64_t vm, vint64m1_t vd,
                                    vfloat32mf2_t vs2, size_t vl);
vint64m2_t __riscv_vfwcvt_x_tum(vbool32_t vm, vint64m2_t vd, vfloat32m1_t vs2,
                                size_t vl);
vint64m2_t __riscv_vfwcvt_rtz_x_tum(vbool32_t vm, vint64m2_t vd,
                                    vfloat32m1_t vs2, size_t vl);
vint64m4_t __riscv_vfwcvt_x_tum(vbool16_t vm, vint64m4_t vd, vfloat32m2_t vs2,
                                size_t vl);
vint64m4_t __riscv_vfwcvt_rtz_x_tum(vbool16_t vm, vint64m4_t vd,
                                    vfloat32m2_t vs2, size_t vl);
vint64m8_t __riscv_vfwcvt_x_tum(vbool8_t vm, vint64m8_t vd, vfloat32m4_t vs2,
                                size_t vl);
vint64m8_t __riscv_vfwcvt_rtz_x_tum(vbool8_t vm, vint64m8_t vd,
                                    vfloat32m4_t vs2, size_t vl);
// vfloat32 source -> vuint64 destination (`_xu` / `_rtz_xu` pairs per LMUL).
vuint64m1_t __riscv_vfwcvt_xu_tum(vbool64_t vm, vuint64m1_t vd,
                                  vfloat32mf2_t vs2, size_t vl);
vuint64m1_t __riscv_vfwcvt_rtz_xu_tum(vbool64_t vm, vuint64m1_t vd,
                                      vfloat32mf2_t vs2, size_t vl);
vuint64m2_t __riscv_vfwcvt_xu_tum(vbool32_t vm, vuint64m2_t vd,
                                  vfloat32m1_t vs2, size_t vl);
vuint64m2_t __riscv_vfwcvt_rtz_xu_tum(vbool32_t vm, vuint64m2_t vd,
                                      vfloat32m1_t vs2, size_t vl);
vuint64m4_t __riscv_vfwcvt_xu_tum(vbool16_t vm, vuint64m4_t vd,
                                  vfloat32m2_t vs2, size_t vl);
vuint64m4_t __riscv_vfwcvt_rtz_xu_tum(vbool16_t vm, vuint64m4_t vd,
                                      vfloat32m2_t vs2, size_t vl);
vuint64m8_t __riscv_vfwcvt_xu_tum(vbool8_t vm, vuint64m8_t vd, vfloat32m4_t vs2,
                                  size_t vl);
vuint64m8_t __riscv_vfwcvt_rtz_xu_tum(vbool8_t vm, vuint64m8_t vd,
                                      vfloat32m4_t vs2, size_t vl);
// vint32 source -> vfloat64 destination.
vfloat64m1_t __riscv_vfwcvt_f_tum(vbool64_t vm, vfloat64m1_t vd,
                                  vint32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwcvt_f_tum(vbool32_t vm, vfloat64m2_t vd, vint32m1_t vs2,
                                  size_t vl);
vfloat64m4_t __riscv_vfwcvt_f_tum(vbool16_t vm, vfloat64m4_t vd, vint32m2_t vs2,
                                  size_t vl);
vfloat64m8_t __riscv_vfwcvt_f_tum(vbool8_t vm, vfloat64m8_t vd, vint32m4_t vs2,
                                  size_t vl);
// vuint32 source -> vfloat64 destination.
vfloat64m1_t __riscv_vfwcvt_f_tum(vbool64_t vm, vfloat64m1_t vd,
                                  vuint32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwcvt_f_tum(vbool32_t vm, vfloat64m2_t vd,
                                  vuint32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwcvt_f_tum(vbool16_t vm, vfloat64m4_t vd,
                                  vuint32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwcvt_f_tum(vbool8_t vm, vfloat64m8_t vd, vuint32m4_t vs2,
                                  size_t vl);
// vfloat32 source -> vfloat64 destination.
vfloat64m1_t __riscv_vfwcvt_f_tum(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwcvt_f_tum(vbool32_t vm, vfloat64m2_t vd,
                                  vfloat32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwcvt_f_tum(vbool16_t vm, vfloat64m4_t vd,
                                  vfloat32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwcvt_f_tum(vbool8_t vm, vfloat64m8_t vd,
                                  vfloat32m4_t vs2, size_t vl);
// masked functions (`_tumu` suffix): every overload takes the mask `vm` first,
// then the destination operand `vd`, the source `vs2` (element width half that
// of the destination), and `vl`.
// NOTE(review): `_tumu` is presumably the tail-undisturbed / mask-undisturbed
// policy and `_rtz` round-towards-zero -- confirm against the RVV intrinsics
// specification.
// vint8 source -> vfloat16 destination.
vfloat16mf4_t __riscv_vfwcvt_f_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                    vint8mf8_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfwcvt_f_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                    vint8mf4_t vs2, size_t vl);
vfloat16m1_t __riscv_vfwcvt_f_tumu(vbool16_t vm, vfloat16m1_t vd,
                                   vint8mf2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfwcvt_f_tumu(vbool8_t vm, vfloat16m2_t vd, vint8m1_t vs2,
                                   size_t vl);
vfloat16m4_t __riscv_vfwcvt_f_tumu(vbool4_t vm, vfloat16m4_t vd, vint8m2_t vs2,
                                   size_t vl);
vfloat16m8_t __riscv_vfwcvt_f_tumu(vbool2_t vm, vfloat16m8_t vd, vint8m4_t vs2,
                                   size_t vl);
// vuint8 source -> vfloat16 destination.
vfloat16mf4_t __riscv_vfwcvt_f_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                    vuint8mf8_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfwcvt_f_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                    vuint8mf4_t vs2, size_t vl);
vfloat16m1_t __riscv_vfwcvt_f_tumu(vbool16_t vm, vfloat16m1_t vd,
                                   vuint8mf2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfwcvt_f_tumu(vbool8_t vm, vfloat16m2_t vd, vuint8m1_t vs2,
                                   size_t vl);
vfloat16m4_t __riscv_vfwcvt_f_tumu(vbool4_t vm, vfloat16m4_t vd, vuint8m2_t vs2,
                                   size_t vl);
vfloat16m8_t __riscv_vfwcvt_f_tumu(vbool2_t vm, vfloat16m8_t vd, vuint8m4_t vs2,
                                   size_t vl);
// vfloat16 source -> vint32 destination (`_x` / `_rtz_x` pairs per LMUL).
vint32mf2_t __riscv_vfwcvt_x_tumu(vbool64_t vm, vint32mf2_t vd,
                                  vfloat16mf4_t vs2, size_t vl);
vint32mf2_t __riscv_vfwcvt_rtz_x_tumu(vbool64_t vm, vint32mf2_t vd,
                                      vfloat16mf4_t vs2, size_t vl);
vint32m1_t __riscv_vfwcvt_x_tumu(vbool32_t vm, vint32m1_t vd, vfloat16mf2_t vs2,
                                 size_t vl);
vint32m1_t __riscv_vfwcvt_rtz_x_tumu(vbool32_t vm, vint32m1_t vd,
                                     vfloat16mf2_t vs2, size_t vl);
vint32m2_t __riscv_vfwcvt_x_tumu(vbool16_t vm, vint32m2_t vd, vfloat16m1_t vs2,
                                 size_t vl);
vint32m2_t __riscv_vfwcvt_rtz_x_tumu(vbool16_t vm, vint32m2_t vd,
                                     vfloat16m1_t vs2, size_t vl);
vint32m4_t __riscv_vfwcvt_x_tumu(vbool8_t vm, vint32m4_t vd, vfloat16m2_t vs2,
                                 size_t vl);
vint32m4_t __riscv_vfwcvt_rtz_x_tumu(vbool8_t vm, vint32m4_t vd,
                                     vfloat16m2_t vs2, size_t vl);
vint32m8_t __riscv_vfwcvt_x_tumu(vbool4_t vm, vint32m8_t vd, vfloat16m4_t vs2,
                                 size_t vl);
vint32m8_t __riscv_vfwcvt_rtz_x_tumu(vbool4_t vm, vint32m8_t vd,
                                     vfloat16m4_t vs2, size_t vl);
// vfloat16 source -> vuint32 destination (`_xu` / `_rtz_xu` pairs per LMUL).
vuint32mf2_t __riscv_vfwcvt_xu_tumu(vbool64_t vm, vuint32mf2_t vd,
                                    vfloat16mf4_t vs2, size_t vl);
vuint32mf2_t __riscv_vfwcvt_rtz_xu_tumu(vbool64_t vm, vuint32mf2_t vd,
                                        vfloat16mf4_t vs2, size_t vl);
vuint32m1_t __riscv_vfwcvt_xu_tumu(vbool32_t vm, vuint32m1_t vd,
                                   vfloat16mf2_t vs2, size_t vl);
vuint32m1_t __riscv_vfwcvt_rtz_xu_tumu(vbool32_t vm, vuint32m1_t vd,
                                       vfloat16mf2_t vs2, size_t vl);
vuint32m2_t __riscv_vfwcvt_xu_tumu(vbool16_t vm, vuint32m2_t vd,
                                   vfloat16m1_t vs2, size_t vl);
vuint32m2_t __riscv_vfwcvt_rtz_xu_tumu(vbool16_t vm, vuint32m2_t vd,
                                       vfloat16m1_t vs2, size_t vl);
vuint32m4_t __riscv_vfwcvt_xu_tumu(vbool8_t vm, vuint32m4_t vd,
                                   vfloat16m2_t vs2, size_t vl);
vuint32m4_t __riscv_vfwcvt_rtz_xu_tumu(vbool8_t vm, vuint32m4_t vd,
                                       vfloat16m2_t vs2, size_t vl);
vuint32m8_t __riscv_vfwcvt_xu_tumu(vbool4_t vm, vuint32m8_t vd,
                                   vfloat16m4_t vs2, size_t vl);
vuint32m8_t __riscv_vfwcvt_rtz_xu_tumu(vbool4_t vm, vuint32m8_t vd,
                                       vfloat16m4_t vs2, size_t vl);
// vint16 source -> vfloat32 destination.
vfloat32mf2_t __riscv_vfwcvt_f_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                    vint16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwcvt_f_tumu(vbool32_t vm, vfloat32m1_t vd,
                                   vint16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwcvt_f_tumu(vbool16_t vm, vfloat32m2_t vd,
                                   vint16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwcvt_f_tumu(vbool8_t vm, vfloat32m4_t vd, vint16m2_t vs2,
                                   size_t vl);
vfloat32m8_t __riscv_vfwcvt_f_tumu(vbool4_t vm, vfloat32m8_t vd, vint16m4_t vs2,
                                   size_t vl);
// vuint16 source -> vfloat32 destination.
vfloat32mf2_t __riscv_vfwcvt_f_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                    vuint16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwcvt_f_tumu(vbool32_t vm, vfloat32m1_t vd,
                                   vuint16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwcvt_f_tumu(vbool16_t vm, vfloat32m2_t vd,
                                   vuint16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwcvt_f_tumu(vbool8_t vm, vfloat32m4_t vd,
                                   vuint16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwcvt_f_tumu(vbool4_t vm, vfloat32m8_t vd,
                                   vuint16m4_t vs2, size_t vl);
// vfloat16 source -> vfloat32 destination.
vfloat32mf2_t __riscv_vfwcvt_f_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                    vfloat16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwcvt_f_tumu(vbool32_t vm, vfloat32m1_t vd,
                                   vfloat16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwcvt_f_tumu(vbool16_t vm, vfloat32m2_t vd,
                                   vfloat16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwcvt_f_tumu(vbool8_t vm, vfloat32m4_t vd,
                                   vfloat16m2_t vs2, size_t vl);
vfloat32m8_t __riscv_vfwcvt_f_tumu(vbool4_t vm, vfloat32m8_t vd,
                                   vfloat16m4_t vs2, size_t vl);
// vfloat32 source -> vint64 destination (`_x` / `_rtz_x` pairs per LMUL).
vint64m1_t __riscv_vfwcvt_x_tumu(vbool64_t vm, vint64m1_t vd, vfloat32mf2_t vs2,
                                 size_t vl);
vint64m1_t __riscv_vfwcvt_rtz_x_tumu(vbool64_t vm, vint64m1_t vd,
                                     vfloat32mf2_t vs2, size_t vl);
vint64m2_t __riscv_vfwcvt_x_tumu(vbool32_t vm, vint64m2_t vd, vfloat32m1_t vs2,
                                 size_t vl);
vint64m2_t __riscv_vfwcvt_rtz_x_tumu(vbool32_t vm, vint64m2_t vd,
                                     vfloat32m1_t vs2, size_t vl);
vint64m4_t __riscv_vfwcvt_x_tumu(vbool16_t vm, vint64m4_t vd, vfloat32m2_t vs2,
                                 size_t vl);
vint64m4_t __riscv_vfwcvt_rtz_x_tumu(vbool16_t vm, vint64m4_t vd,
                                     vfloat32m2_t vs2, size_t vl);
vint64m8_t __riscv_vfwcvt_x_tumu(vbool8_t vm, vint64m8_t vd, vfloat32m4_t vs2,
                                 size_t vl);
vint64m8_t __riscv_vfwcvt_rtz_x_tumu(vbool8_t vm, vint64m8_t vd,
                                     vfloat32m4_t vs2, size_t vl);
// vfloat32 source -> vuint64 destination (`_xu` / `_rtz_xu` pairs per LMUL).
vuint64m1_t __riscv_vfwcvt_xu_tumu(vbool64_t vm, vuint64m1_t vd,
                                   vfloat32mf2_t vs2, size_t vl);
vuint64m1_t __riscv_vfwcvt_rtz_xu_tumu(vbool64_t vm, vuint64m1_t vd,
                                       vfloat32mf2_t vs2, size_t vl);
vuint64m2_t __riscv_vfwcvt_xu_tumu(vbool32_t vm, vuint64m2_t vd,
                                   vfloat32m1_t vs2, size_t vl);
vuint64m2_t __riscv_vfwcvt_rtz_xu_tumu(vbool32_t vm, vuint64m2_t vd,
                                       vfloat32m1_t vs2, size_t vl);
vuint64m4_t __riscv_vfwcvt_xu_tumu(vbool16_t vm, vuint64m4_t vd,
                                   vfloat32m2_t vs2, size_t vl);
vuint64m4_t __riscv_vfwcvt_rtz_xu_tumu(vbool16_t vm, vuint64m4_t vd,
                                       vfloat32m2_t vs2, size_t vl);
vuint64m8_t __riscv_vfwcvt_xu_tumu(vbool8_t vm, vuint64m8_t vd,
                                   vfloat32m4_t vs2, size_t vl);
vuint64m8_t __riscv_vfwcvt_rtz_xu_tumu(vbool8_t vm, vuint64m8_t vd,
                                       vfloat32m4_t vs2, size_t vl);
// vint32 source -> vfloat64 destination.
vfloat64m1_t __riscv_vfwcvt_f_tumu(vbool64_t vm, vfloat64m1_t vd,
                                   vint32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwcvt_f_tumu(vbool32_t vm, vfloat64m2_t vd,
                                   vint32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwcvt_f_tumu(vbool16_t vm, vfloat64m4_t vd,
                                   vint32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwcvt_f_tumu(vbool8_t vm, vfloat64m8_t vd, vint32m4_t vs2,
                                   size_t vl);
// vuint32 source -> vfloat64 destination.
vfloat64m1_t __riscv_vfwcvt_f_tumu(vbool64_t vm, vfloat64m1_t vd,
                                   vuint32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwcvt_f_tumu(vbool32_t vm, vfloat64m2_t vd,
                                   vuint32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwcvt_f_tumu(vbool16_t vm, vfloat64m4_t vd,
                                   vuint32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwcvt_f_tumu(vbool8_t vm, vfloat64m8_t vd,
                                   vuint32m4_t vs2, size_t vl);
// vfloat32 source -> vfloat64 destination.
vfloat64m1_t __riscv_vfwcvt_f_tumu(vbool64_t vm, vfloat64m1_t vd,
                                   vfloat32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwcvt_f_tumu(vbool32_t vm, vfloat64m2_t vd,
                                   vfloat32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwcvt_f_tumu(vbool16_t vm, vfloat64m4_t vd,
                                   vfloat32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwcvt_f_tumu(vbool8_t vm, vfloat64m8_t vd,
                                   vfloat32m4_t vs2, size_t vl);
// masked functions (`_mu` suffix): every overload takes the mask `vm` first,
// then the destination operand `vd`, the source `vs2` (element width half that
// of the destination), and `vl`.
// NOTE(review): `_mu` is presumably the tail-agnostic / mask-undisturbed
// policy and `_rtz` round-towards-zero -- confirm against the RVV intrinsics
// specification.
// vint8 source -> vfloat16 destination.
vfloat16mf4_t __riscv_vfwcvt_f_mu(vbool64_t vm, vfloat16mf4_t vd,
                                  vint8mf8_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfwcvt_f_mu(vbool32_t vm, vfloat16mf2_t vd,
                                  vint8mf4_t vs2, size_t vl);
vfloat16m1_t __riscv_vfwcvt_f_mu(vbool16_t vm, vfloat16m1_t vd, vint8mf2_t vs2,
                                 size_t vl);
vfloat16m2_t __riscv_vfwcvt_f_mu(vbool8_t vm, vfloat16m2_t vd, vint8m1_t vs2,
                                 size_t vl);
vfloat16m4_t __riscv_vfwcvt_f_mu(vbool4_t vm, vfloat16m4_t vd, vint8m2_t vs2,
                                 size_t vl);
vfloat16m8_t __riscv_vfwcvt_f_mu(vbool2_t vm, vfloat16m8_t vd, vint8m4_t vs2,
                                 size_t vl);
// vuint8 source -> vfloat16 destination.
vfloat16mf4_t __riscv_vfwcvt_f_mu(vbool64_t vm, vfloat16mf4_t vd,
                                  vuint8mf8_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfwcvt_f_mu(vbool32_t vm, vfloat16mf2_t vd,
                                  vuint8mf4_t vs2, size_t vl);
vfloat16m1_t __riscv_vfwcvt_f_mu(vbool16_t vm, vfloat16m1_t vd, vuint8mf2_t vs2,
                                 size_t vl);
vfloat16m2_t __riscv_vfwcvt_f_mu(vbool8_t vm, vfloat16m2_t vd, vuint8m1_t vs2,
                                 size_t vl);
vfloat16m4_t __riscv_vfwcvt_f_mu(vbool4_t vm, vfloat16m4_t vd, vuint8m2_t vs2,
                                 size_t vl);
vfloat16m8_t __riscv_vfwcvt_f_mu(vbool2_t vm, vfloat16m8_t vd, vuint8m4_t vs2,
                                 size_t vl);
// vfloat16 source -> vint32 destination (`_x` / `_rtz_x` pairs per LMUL).
vint32mf2_t __riscv_vfwcvt_x_mu(vbool64_t vm, vint32mf2_t vd, vfloat16mf4_t vs2,
                                size_t vl);
vint32mf2_t __riscv_vfwcvt_rtz_x_mu(vbool64_t vm, vint32mf2_t vd,
                                    vfloat16mf4_t vs2, size_t vl);
vint32m1_t __riscv_vfwcvt_x_mu(vbool32_t vm, vint32m1_t vd, vfloat16mf2_t vs2,
                               size_t vl);
vint32m1_t __riscv_vfwcvt_rtz_x_mu(vbool32_t vm, vint32m1_t vd,
                                   vfloat16mf2_t vs2, size_t vl);
vint32m2_t __riscv_vfwcvt_x_mu(vbool16_t vm, vint32m2_t vd, vfloat16m1_t vs2,
                               size_t vl);
vint32m2_t __riscv_vfwcvt_rtz_x_mu(vbool16_t vm, vint32m2_t vd,
                                   vfloat16m1_t vs2, size_t vl);
vint32m4_t __riscv_vfwcvt_x_mu(vbool8_t vm, vint32m4_t vd, vfloat16m2_t vs2,
                               size_t vl);
vint32m4_t __riscv_vfwcvt_rtz_x_mu(vbool8_t vm, vint32m4_t vd, vfloat16m2_t vs2,
                                   size_t vl);
vint32m8_t __riscv_vfwcvt_x_mu(vbool4_t vm, vint32m8_t vd, vfloat16m4_t vs2,
                               size_t vl);
vint32m8_t __riscv_vfwcvt_rtz_x_mu(vbool4_t vm, vint32m8_t vd, vfloat16m4_t vs2,
                                   size_t vl);
// vfloat16 source -> vuint32 destination (`_xu` / `_rtz_xu` pairs per LMUL).
vuint32mf2_t __riscv_vfwcvt_xu_mu(vbool64_t vm, vuint32mf2_t vd,
                                  vfloat16mf4_t vs2, size_t vl);
vuint32mf2_t __riscv_vfwcvt_rtz_xu_mu(vbool64_t vm, vuint32mf2_t vd,
                                      vfloat16mf4_t vs2, size_t vl);
vuint32m1_t __riscv_vfwcvt_xu_mu(vbool32_t vm, vuint32m1_t vd,
                                 vfloat16mf2_t vs2, size_t vl);
vuint32m1_t __riscv_vfwcvt_rtz_xu_mu(vbool32_t vm, vuint32m1_t vd,
                                     vfloat16mf2_t vs2, size_t vl);
vuint32m2_t __riscv_vfwcvt_xu_mu(vbool16_t vm, vuint32m2_t vd, vfloat16m1_t vs2,
                                 size_t vl);
vuint32m2_t __riscv_vfwcvt_rtz_xu_mu(vbool16_t vm, vuint32m2_t vd,
                                     vfloat16m1_t vs2, size_t vl);
vuint32m4_t __riscv_vfwcvt_xu_mu(vbool8_t vm, vuint32m4_t vd, vfloat16m2_t vs2,
                                 size_t vl);
vuint32m4_t __riscv_vfwcvt_rtz_xu_mu(vbool8_t vm, vuint32m4_t vd,
                                     vfloat16m2_t vs2, size_t vl);
vuint32m8_t __riscv_vfwcvt_xu_mu(vbool4_t vm, vuint32m8_t vd, vfloat16m4_t vs2,
                                 size_t vl);
vuint32m8_t __riscv_vfwcvt_rtz_xu_mu(vbool4_t vm, vuint32m8_t vd,
                                     vfloat16m4_t vs2, size_t vl);
// vint16 source -> vfloat32 destination.
vfloat32mf2_t __riscv_vfwcvt_f_mu(vbool64_t vm, vfloat32mf2_t vd,
                                  vint16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwcvt_f_mu(vbool32_t vm, vfloat32m1_t vd, vint16mf2_t vs2,
                                 size_t vl);
vfloat32m2_t __riscv_vfwcvt_f_mu(vbool16_t vm, vfloat32m2_t vd, vint16m1_t vs2,
                                 size_t vl);
vfloat32m4_t __riscv_vfwcvt_f_mu(vbool8_t vm, vfloat32m4_t vd, vint16m2_t vs2,
                                 size_t vl);
vfloat32m8_t __riscv_vfwcvt_f_mu(vbool4_t vm, vfloat32m8_t vd, vint16m4_t vs2,
                                 size_t vl);
// vuint16 source -> vfloat32 destination.
vfloat32mf2_t __riscv_vfwcvt_f_mu(vbool64_t vm, vfloat32mf2_t vd,
                                  vuint16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwcvt_f_mu(vbool32_t vm, vfloat32m1_t vd,
                                 vuint16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwcvt_f_mu(vbool16_t vm, vfloat32m2_t vd, vuint16m1_t vs2,
                                 size_t vl);
vfloat32m4_t __riscv_vfwcvt_f_mu(vbool8_t vm, vfloat32m4_t vd, vuint16m2_t vs2,
                                 size_t vl);
vfloat32m8_t __riscv_vfwcvt_f_mu(vbool4_t vm, vfloat32m8_t vd, vuint16m4_t vs2,
                                 size_t vl);
// vfloat16 source -> vfloat32 destination.
vfloat32mf2_t __riscv_vfwcvt_f_mu(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat16mf4_t vs2, size_t vl);
vfloat32m1_t __riscv_vfwcvt_f_mu(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat16mf2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfwcvt_f_mu(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat16m1_t vs2, size_t vl);
vfloat32m4_t __riscv_vfwcvt_f_mu(vbool8_t vm, vfloat32m4_t vd, vfloat16m2_t vs2,
                                 size_t vl);
vfloat32m8_t __riscv_vfwcvt_f_mu(vbool4_t vm, vfloat32m8_t vd, vfloat16m4_t vs2,
                                 size_t vl);
// vfloat32 source -> vint64 destination (`_x` / `_rtz_x` pairs per LMUL).
vint64m1_t __riscv_vfwcvt_x_mu(vbool64_t vm, vint64m1_t vd, vfloat32mf2_t vs2,
                               size_t vl);
vint64m1_t __riscv_vfwcvt_rtz_x_mu(vbool64_t vm, vint64m1_t vd,
                                   vfloat32mf2_t vs2, size_t vl);
vint64m2_t __riscv_vfwcvt_x_mu(vbool32_t vm, vint64m2_t vd, vfloat32m1_t vs2,
                               size_t vl);
vint64m2_t __riscv_vfwcvt_rtz_x_mu(vbool32_t vm, vint64m2_t vd,
                                   vfloat32m1_t vs2, size_t vl);
vint64m4_t __riscv_vfwcvt_x_mu(vbool16_t vm, vint64m4_t vd, vfloat32m2_t vs2,
                               size_t vl);
vint64m4_t __riscv_vfwcvt_rtz_x_mu(vbool16_t vm, vint64m4_t vd,
                                   vfloat32m2_t vs2, size_t vl);
vint64m8_t __riscv_vfwcvt_x_mu(vbool8_t vm, vint64m8_t vd, vfloat32m4_t vs2,
                               size_t vl);
vint64m8_t __riscv_vfwcvt_rtz_x_mu(vbool8_t vm, vint64m8_t vd, vfloat32m4_t vs2,
                                   size_t vl);
// vfloat32 source -> vuint64 destination (`_xu` / `_rtz_xu` pairs per LMUL).
vuint64m1_t __riscv_vfwcvt_xu_mu(vbool64_t vm, vuint64m1_t vd,
                                 vfloat32mf2_t vs2, size_t vl);
vuint64m1_t __riscv_vfwcvt_rtz_xu_mu(vbool64_t vm, vuint64m1_t vd,
                                     vfloat32mf2_t vs2, size_t vl);
vuint64m2_t __riscv_vfwcvt_xu_mu(vbool32_t vm, vuint64m2_t vd, vfloat32m1_t vs2,
                                 size_t vl);
vuint64m2_t __riscv_vfwcvt_rtz_xu_mu(vbool32_t vm, vuint64m2_t vd,
                                     vfloat32m1_t vs2, size_t vl);
vuint64m4_t __riscv_vfwcvt_xu_mu(vbool16_t vm, vuint64m4_t vd, vfloat32m2_t vs2,
                                 size_t vl);
vuint64m4_t __riscv_vfwcvt_rtz_xu_mu(vbool16_t vm, vuint64m4_t vd,
                                     vfloat32m2_t vs2, size_t vl);
vuint64m8_t __riscv_vfwcvt_xu_mu(vbool8_t vm, vuint64m8_t vd, vfloat32m4_t vs2,
                                 size_t vl);
vuint64m8_t __riscv_vfwcvt_rtz_xu_mu(vbool8_t vm, vuint64m8_t vd,
                                     vfloat32m4_t vs2, size_t vl);
// vint32 source -> vfloat64 destination.
vfloat64m1_t __riscv_vfwcvt_f_mu(vbool64_t vm, vfloat64m1_t vd, vint32mf2_t vs2,
                                 size_t vl);
vfloat64m2_t __riscv_vfwcvt_f_mu(vbool32_t vm, vfloat64m2_t vd, vint32m1_t vs2,
                                 size_t vl);
vfloat64m4_t __riscv_vfwcvt_f_mu(vbool16_t vm, vfloat64m4_t vd, vint32m2_t vs2,
                                 size_t vl);
vfloat64m8_t __riscv_vfwcvt_f_mu(vbool8_t vm, vfloat64m8_t vd, vint32m4_t vs2,
                                 size_t vl);
// vuint32 source -> vfloat64 destination.
vfloat64m1_t __riscv_vfwcvt_f_mu(vbool64_t vm, vfloat64m1_t vd,
                                 vuint32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwcvt_f_mu(vbool32_t vm, vfloat64m2_t vd, vuint32m1_t vs2,
                                 size_t vl);
vfloat64m4_t __riscv_vfwcvt_f_mu(vbool16_t vm, vfloat64m4_t vd, vuint32m2_t vs2,
                                 size_t vl);
vfloat64m8_t __riscv_vfwcvt_f_mu(vbool8_t vm, vfloat64m8_t vd, vuint32m4_t vs2,
                                 size_t vl);
// vfloat32 source -> vfloat64 destination.
vfloat64m1_t __riscv_vfwcvt_f_mu(vbool64_t vm, vfloat64m1_t vd,
                                 vfloat32mf2_t vs2, size_t vl);
vfloat64m2_t __riscv_vfwcvt_f_mu(vbool32_t vm, vfloat64m2_t vd,
                                 vfloat32m1_t vs2, size_t vl);
vfloat64m4_t __riscv_vfwcvt_f_mu(vbool16_t vm, vfloat64m4_t vd,
                                 vfloat32m2_t vs2, size_t vl);
vfloat64m8_t __riscv_vfwcvt_f_mu(vbool8_t vm, vfloat64m8_t vd, vfloat32m4_t vs2,
                                 size_t vl);
// unmasked `_tu` overloads that take an extra `unsigned int frm` argument
// between the source `vs2` and `vl`. Only the float -> integer forms (`_x`,
// `_xu`) are listed here; there are no `_rtz` or `_f` overloads in this group.
// NOTE(review): `frm` is presumably the floating-point rounding-mode selector
// -- confirm accepted values against the RVV intrinsics specification.
// vfloat16 source -> vint32 destination.
vint32mf2_t __riscv_vfwcvt_x_tu(vint32mf2_t vd, vfloat16mf4_t vs2,
                                unsigned int frm, size_t vl);
vint32m1_t __riscv_vfwcvt_x_tu(vint32m1_t vd, vfloat16mf2_t vs2,
                               unsigned int frm, size_t vl);
vint32m2_t __riscv_vfwcvt_x_tu(vint32m2_t vd, vfloat16m1_t vs2,
                               unsigned int frm, size_t vl);
vint32m4_t __riscv_vfwcvt_x_tu(vint32m4_t vd, vfloat16m2_t vs2,
                               unsigned int frm, size_t vl);
vint32m8_t __riscv_vfwcvt_x_tu(vint32m8_t vd, vfloat16m4_t vs2,
                               unsigned int frm, size_t vl);
// vfloat16 source -> vuint32 destination.
vuint32mf2_t __riscv_vfwcvt_xu_tu(vuint32mf2_t vd, vfloat16mf4_t vs2,
                                  unsigned int frm, size_t vl);
vuint32m1_t __riscv_vfwcvt_xu_tu(vuint32m1_t vd, vfloat16mf2_t vs2,
                                 unsigned int frm, size_t vl);
vuint32m2_t __riscv_vfwcvt_xu_tu(vuint32m2_t vd, vfloat16m1_t vs2,
                                 unsigned int frm, size_t vl);
vuint32m4_t __riscv_vfwcvt_xu_tu(vuint32m4_t vd, vfloat16m2_t vs2,
                                 unsigned int frm, size_t vl);
vuint32m8_t __riscv_vfwcvt_xu_tu(vuint32m8_t vd, vfloat16m4_t vs2,
                                 unsigned int frm, size_t vl);
// vfloat32 source -> vint64 destination.
vint64m1_t __riscv_vfwcvt_x_tu(vint64m1_t vd, vfloat32mf2_t vs2,
                               unsigned int frm, size_t vl);
vint64m2_t __riscv_vfwcvt_x_tu(vint64m2_t vd, vfloat32m1_t vs2,
                               unsigned int frm, size_t vl);
vint64m4_t __riscv_vfwcvt_x_tu(vint64m4_t vd, vfloat32m2_t vs2,
                               unsigned int frm, size_t vl);
vint64m8_t __riscv_vfwcvt_x_tu(vint64m8_t vd, vfloat32m4_t vs2,
                               unsigned int frm, size_t vl);
// vfloat32 source -> vuint64 destination.
vuint64m1_t __riscv_vfwcvt_xu_tu(vuint64m1_t vd, vfloat32mf2_t vs2,
                                 unsigned int frm, size_t vl);
vuint64m2_t __riscv_vfwcvt_xu_tu(vuint64m2_t vd, vfloat32m1_t vs2,
                                 unsigned int frm, size_t vl);
vuint64m4_t __riscv_vfwcvt_xu_tu(vuint64m4_t vd, vfloat32m2_t vs2,
                                 unsigned int frm, size_t vl);
vuint64m8_t __riscv_vfwcvt_xu_tu(vuint64m8_t vd, vfloat32m4_t vs2,
                                 unsigned int frm, size_t vl);
// masked functions: _tum variants of vfwcvt_x / vfwcvt_xu.
// Parameters, in order: mask vm, operand vd (same type as the return value),
// source vs2, unsigned int frm, and size_t vl. The integer elements of the
// result are twice as wide as the floating-point elements of vs2
// (float16 -> 32-bit, float32 -> 64-bit).
vint32mf2_t __riscv_vfwcvt_x_tum(vbool64_t vm, vint32mf2_t vd,
                                 vfloat16mf4_t vs2, unsigned int frm,
                                 size_t vl);
vint32m1_t __riscv_vfwcvt_x_tum(vbool32_t vm, vint32m1_t vd, vfloat16mf2_t vs2,
                                unsigned int frm, size_t vl);
vint32m2_t __riscv_vfwcvt_x_tum(vbool16_t vm, vint32m2_t vd, vfloat16m1_t vs2,
                                unsigned int frm, size_t vl);
vint32m4_t __riscv_vfwcvt_x_tum(vbool8_t vm, vint32m4_t vd, vfloat16m2_t vs2,
                                unsigned int frm, size_t vl);
vint32m8_t __riscv_vfwcvt_x_tum(vbool4_t vm, vint32m8_t vd, vfloat16m4_t vs2,
                                unsigned int frm, size_t vl);
vuint32mf2_t __riscv_vfwcvt_xu_tum(vbool64_t vm, vuint32mf2_t vd,
                                   vfloat16mf4_t vs2, unsigned int frm,
                                   size_t vl);
vuint32m1_t __riscv_vfwcvt_xu_tum(vbool32_t vm, vuint32m1_t vd,
                                  vfloat16mf2_t vs2, unsigned int frm,
                                  size_t vl);
vuint32m2_t __riscv_vfwcvt_xu_tum(vbool16_t vm, vuint32m2_t vd,
                                  vfloat16m1_t vs2, unsigned int frm,
                                  size_t vl);
vuint32m4_t __riscv_vfwcvt_xu_tum(vbool8_t vm, vuint32m4_t vd, vfloat16m2_t vs2,
                                  unsigned int frm, size_t vl);
vuint32m8_t __riscv_vfwcvt_xu_tum(vbool4_t vm, vuint32m8_t vd, vfloat16m4_t vs2,
                                  unsigned int frm, size_t vl);
vint64m1_t __riscv_vfwcvt_x_tum(vbool64_t vm, vint64m1_t vd, vfloat32mf2_t vs2,
                                unsigned int frm, size_t vl);
vint64m2_t __riscv_vfwcvt_x_tum(vbool32_t vm, vint64m2_t vd, vfloat32m1_t vs2,
                                unsigned int frm, size_t vl);
vint64m4_t __riscv_vfwcvt_x_tum(vbool16_t vm, vint64m4_t vd, vfloat32m2_t vs2,
                                unsigned int frm, size_t vl);
vint64m8_t __riscv_vfwcvt_x_tum(vbool8_t vm, vint64m8_t vd, vfloat32m4_t vs2,
                                unsigned int frm, size_t vl);
vuint64m1_t __riscv_vfwcvt_xu_tum(vbool64_t vm, vuint64m1_t vd,
                                  vfloat32mf2_t vs2, unsigned int frm,
                                  size_t vl);
vuint64m2_t __riscv_vfwcvt_xu_tum(vbool32_t vm, vuint64m2_t vd,
                                  vfloat32m1_t vs2, unsigned int frm,
                                  size_t vl);
vuint64m4_t __riscv_vfwcvt_xu_tum(vbool16_t vm, vuint64m4_t vd,
                                  vfloat32m2_t vs2, unsigned int frm,
                                  size_t vl);
vuint64m8_t __riscv_vfwcvt_xu_tum(vbool8_t vm, vuint64m8_t vd, vfloat32m4_t vs2,
                                  unsigned int frm, size_t vl);
// masked functions: _tumu variants of vfwcvt_x / vfwcvt_xu.
// Parameters, in order: mask vm, operand vd (same type as the return value),
// source vs2, unsigned int frm, and size_t vl. The integer elements of the
// result are twice as wide as the floating-point elements of vs2
// (float16 -> 32-bit, float32 -> 64-bit).
vint32mf2_t __riscv_vfwcvt_x_tumu(vbool64_t vm, vint32mf2_t vd,
                                  vfloat16mf4_t vs2, unsigned int frm,
                                  size_t vl);
vint32m1_t __riscv_vfwcvt_x_tumu(vbool32_t vm, vint32m1_t vd, vfloat16mf2_t vs2,
                                 unsigned int frm, size_t vl);
vint32m2_t __riscv_vfwcvt_x_tumu(vbool16_t vm, vint32m2_t vd, vfloat16m1_t vs2,
                                 unsigned int frm, size_t vl);
vint32m4_t __riscv_vfwcvt_x_tumu(vbool8_t vm, vint32m4_t vd, vfloat16m2_t vs2,
                                 unsigned int frm, size_t vl);
vint32m8_t __riscv_vfwcvt_x_tumu(vbool4_t vm, vint32m8_t vd, vfloat16m4_t vs2,
                                 unsigned int frm, size_t vl);
vuint32mf2_t __riscv_vfwcvt_xu_tumu(vbool64_t vm, vuint32mf2_t vd,
                                    vfloat16mf4_t vs2, unsigned int frm,
                                    size_t vl);
vuint32m1_t __riscv_vfwcvt_xu_tumu(vbool32_t vm, vuint32m1_t vd,
                                   vfloat16mf2_t vs2, unsigned int frm,
                                   size_t vl);
vuint32m2_t __riscv_vfwcvt_xu_tumu(vbool16_t vm, vuint32m2_t vd,
                                   vfloat16m1_t vs2, unsigned int frm,
                                   size_t vl);
vuint32m4_t __riscv_vfwcvt_xu_tumu(vbool8_t vm, vuint32m4_t vd,
                                   vfloat16m2_t vs2, unsigned int frm,
                                   size_t vl);
vuint32m8_t __riscv_vfwcvt_xu_tumu(vbool4_t vm, vuint32m8_t vd,
                                   vfloat16m4_t vs2, unsigned int frm,
                                   size_t vl);
vint64m1_t __riscv_vfwcvt_x_tumu(vbool64_t vm, vint64m1_t vd, vfloat32mf2_t vs2,
                                 unsigned int frm, size_t vl);
vint64m2_t __riscv_vfwcvt_x_tumu(vbool32_t vm, vint64m2_t vd, vfloat32m1_t vs2,
                                 unsigned int frm, size_t vl);
vint64m4_t __riscv_vfwcvt_x_tumu(vbool16_t vm, vint64m4_t vd, vfloat32m2_t vs2,
                                 unsigned int frm, size_t vl);
vint64m8_t __riscv_vfwcvt_x_tumu(vbool8_t vm, vint64m8_t vd, vfloat32m4_t vs2,
                                 unsigned int frm, size_t vl);
vuint64m1_t __riscv_vfwcvt_xu_tumu(vbool64_t vm, vuint64m1_t vd,
                                   vfloat32mf2_t vs2, unsigned int frm,
                                   size_t vl);
vuint64m2_t __riscv_vfwcvt_xu_tumu(vbool32_t vm, vuint64m2_t vd,
                                   vfloat32m1_t vs2, unsigned int frm,
                                   size_t vl);
vuint64m4_t __riscv_vfwcvt_xu_tumu(vbool16_t vm, vuint64m4_t vd,
                                   vfloat32m2_t vs2, unsigned int frm,
                                   size_t vl);
vuint64m8_t __riscv_vfwcvt_xu_tumu(vbool8_t vm, vuint64m8_t vd,
                                   vfloat32m4_t vs2, unsigned int frm,
                                   size_t vl);
// masked functions: _mu variants of vfwcvt_x / vfwcvt_xu.
// Parameters, in order: mask vm, operand vd (same type as the return value),
// source vs2, unsigned int frm, and size_t vl. The integer elements of the
// result are twice as wide as the floating-point elements of vs2
// (float16 -> 32-bit, float32 -> 64-bit).
vint32mf2_t __riscv_vfwcvt_x_mu(vbool64_t vm, vint32mf2_t vd, vfloat16mf4_t vs2,
                                unsigned int frm, size_t vl);
vint32m1_t __riscv_vfwcvt_x_mu(vbool32_t vm, vint32m1_t vd, vfloat16mf2_t vs2,
                               unsigned int frm, size_t vl);
vint32m2_t __riscv_vfwcvt_x_mu(vbool16_t vm, vint32m2_t vd, vfloat16m1_t vs2,
                               unsigned int frm, size_t vl);
vint32m4_t __riscv_vfwcvt_x_mu(vbool8_t vm, vint32m4_t vd, vfloat16m2_t vs2,
                               unsigned int frm, size_t vl);
vint32m8_t __riscv_vfwcvt_x_mu(vbool4_t vm, vint32m8_t vd, vfloat16m4_t vs2,
                               unsigned int frm, size_t vl);
vuint32mf2_t __riscv_vfwcvt_xu_mu(vbool64_t vm, vuint32mf2_t vd,
                                  vfloat16mf4_t vs2, unsigned int frm,
                                  size_t vl);
vuint32m1_t __riscv_vfwcvt_xu_mu(vbool32_t vm, vuint32m1_t vd,
                                 vfloat16mf2_t vs2, unsigned int frm,
                                 size_t vl);
vuint32m2_t __riscv_vfwcvt_xu_mu(vbool16_t vm, vuint32m2_t vd, vfloat16m1_t vs2,
                                 unsigned int frm, size_t vl);
vuint32m4_t __riscv_vfwcvt_xu_mu(vbool8_t vm, vuint32m4_t vd, vfloat16m2_t vs2,
                                 unsigned int frm, size_t vl);
vuint32m8_t __riscv_vfwcvt_xu_mu(vbool4_t vm, vuint32m8_t vd, vfloat16m4_t vs2,
                                 unsigned int frm, size_t vl);
vint64m1_t __riscv_vfwcvt_x_mu(vbool64_t vm, vint64m1_t vd, vfloat32mf2_t vs2,
                               unsigned int frm, size_t vl);
vint64m2_t __riscv_vfwcvt_x_mu(vbool32_t vm, vint64m2_t vd, vfloat32m1_t vs2,
                               unsigned int frm, size_t vl);
vint64m4_t __riscv_vfwcvt_x_mu(vbool16_t vm, vint64m4_t vd, vfloat32m2_t vs2,
                               unsigned int frm, size_t vl);
vint64m8_t __riscv_vfwcvt_x_mu(vbool8_t vm, vint64m8_t vd, vfloat32m4_t vs2,
                               unsigned int frm, size_t vl);
vuint64m1_t __riscv_vfwcvt_xu_mu(vbool64_t vm, vuint64m1_t vd,
                                 vfloat32mf2_t vs2, unsigned int frm,
                                 size_t vl);
vuint64m2_t __riscv_vfwcvt_xu_mu(vbool32_t vm, vuint64m2_t vd, vfloat32m1_t vs2,
                                 unsigned int frm, size_t vl);
vuint64m4_t __riscv_vfwcvt_xu_mu(vbool16_t vm, vuint64m4_t vd, vfloat32m2_t vs2,
                                 unsigned int frm, size_t vl);
vuint64m8_t __riscv_vfwcvt_xu_mu(vbool8_t vm, vuint64m8_t vd, vfloat32m4_t vs2,
                                 unsigned int frm, size_t vl);

Narrowing Floating-Point/Integer Type-Convert Intrinsics

// unmasked functions: _tu variants of vfncvt (no mask parameter).
// Parameters, in order: operand vd (same type as the return value), source
// vs2, and size_t vl. The elements of vs2 are twice as wide as those of the
// result (e.g. float16 -> 8-bit integer, 64-bit integer -> float32).
// Where an _rtz_x, _rtz_xu or _rod_f overload exists, it directly follows the
// plain _x, _xu or _f overload that has the same parameter types.
vint8mf8_t __riscv_vfncvt_x_tu(vint8mf8_t vd, vfloat16mf4_t vs2, size_t vl);
vint8mf8_t __riscv_vfncvt_rtz_x_tu(vint8mf8_t vd, vfloat16mf4_t vs2, size_t vl);
vint8mf4_t __riscv_vfncvt_x_tu(vint8mf4_t vd, vfloat16mf2_t vs2, size_t vl);
vint8mf4_t __riscv_vfncvt_rtz_x_tu(vint8mf4_t vd, vfloat16mf2_t vs2, size_t vl);
vint8mf2_t __riscv_vfncvt_x_tu(vint8mf2_t vd, vfloat16m1_t vs2, size_t vl);
vint8mf2_t __riscv_vfncvt_rtz_x_tu(vint8mf2_t vd, vfloat16m1_t vs2, size_t vl);
vint8m1_t __riscv_vfncvt_x_tu(vint8m1_t vd, vfloat16m2_t vs2, size_t vl);
vint8m1_t __riscv_vfncvt_rtz_x_tu(vint8m1_t vd, vfloat16m2_t vs2, size_t vl);
vint8m2_t __riscv_vfncvt_x_tu(vint8m2_t vd, vfloat16m4_t vs2, size_t vl);
vint8m2_t __riscv_vfncvt_rtz_x_tu(vint8m2_t vd, vfloat16m4_t vs2, size_t vl);
vint8m4_t __riscv_vfncvt_x_tu(vint8m4_t vd, vfloat16m8_t vs2, size_t vl);
vint8m4_t __riscv_vfncvt_rtz_x_tu(vint8m4_t vd, vfloat16m8_t vs2, size_t vl);
vuint8mf8_t __riscv_vfncvt_xu_tu(vuint8mf8_t vd, vfloat16mf4_t vs2, size_t vl);
vuint8mf8_t __riscv_vfncvt_rtz_xu_tu(vuint8mf8_t vd, vfloat16mf4_t vs2,
                                     size_t vl);
vuint8mf4_t __riscv_vfncvt_xu_tu(vuint8mf4_t vd, vfloat16mf2_t vs2, size_t vl);
vuint8mf4_t __riscv_vfncvt_rtz_xu_tu(vuint8mf4_t vd, vfloat16mf2_t vs2,
                                     size_t vl);
vuint8mf2_t __riscv_vfncvt_xu_tu(vuint8mf2_t vd, vfloat16m1_t vs2, size_t vl);
vuint8mf2_t __riscv_vfncvt_rtz_xu_tu(vuint8mf2_t vd, vfloat16m1_t vs2,
                                     size_t vl);
vuint8m1_t __riscv_vfncvt_xu_tu(vuint8m1_t vd, vfloat16m2_t vs2, size_t vl);
vuint8m1_t __riscv_vfncvt_rtz_xu_tu(vuint8m1_t vd, vfloat16m2_t vs2, size_t vl);
vuint8m2_t __riscv_vfncvt_xu_tu(vuint8m2_t vd, vfloat16m4_t vs2, size_t vl);
vuint8m2_t __riscv_vfncvt_rtz_xu_tu(vuint8m2_t vd, vfloat16m4_t vs2, size_t vl);
vuint8m4_t __riscv_vfncvt_xu_tu(vuint8m4_t vd, vfloat16m8_t vs2, size_t vl);
vuint8m4_t __riscv_vfncvt_rtz_xu_tu(vuint8m4_t vd, vfloat16m8_t vs2, size_t vl);
vint16mf4_t __riscv_vfncvt_x_tu(vint16mf4_t vd, vfloat32mf2_t vs2, size_t vl);
vint16mf4_t __riscv_vfncvt_rtz_x_tu(vint16mf4_t vd, vfloat32mf2_t vs2,
                                    size_t vl);
vint16mf2_t __riscv_vfncvt_x_tu(vint16mf2_t vd, vfloat32m1_t vs2, size_t vl);
vint16mf2_t __riscv_vfncvt_rtz_x_tu(vint16mf2_t vd, vfloat32m1_t vs2,
                                    size_t vl);
vint16m1_t __riscv_vfncvt_x_tu(vint16m1_t vd, vfloat32m2_t vs2, size_t vl);
vint16m1_t __riscv_vfncvt_rtz_x_tu(vint16m1_t vd, vfloat32m2_t vs2, size_t vl);
vint16m2_t __riscv_vfncvt_x_tu(vint16m2_t vd, vfloat32m4_t vs2, size_t vl);
vint16m2_t __riscv_vfncvt_rtz_x_tu(vint16m2_t vd, vfloat32m4_t vs2, size_t vl);
vint16m4_t __riscv_vfncvt_x_tu(vint16m4_t vd, vfloat32m8_t vs2, size_t vl);
vint16m4_t __riscv_vfncvt_rtz_x_tu(vint16m4_t vd, vfloat32m8_t vs2, size_t vl);
vuint16mf4_t __riscv_vfncvt_xu_tu(vuint16mf4_t vd, vfloat32mf2_t vs2,
                                  size_t vl);
vuint16mf4_t __riscv_vfncvt_rtz_xu_tu(vuint16mf4_t vd, vfloat32mf2_t vs2,
                                      size_t vl);
vuint16mf2_t __riscv_vfncvt_xu_tu(vuint16mf2_t vd, vfloat32m1_t vs2, size_t vl);
vuint16mf2_t __riscv_vfncvt_rtz_xu_tu(vuint16mf2_t vd, vfloat32m1_t vs2,
                                      size_t vl);
vuint16m1_t __riscv_vfncvt_xu_tu(vuint16m1_t vd, vfloat32m2_t vs2, size_t vl);
vuint16m1_t __riscv_vfncvt_rtz_xu_tu(vuint16m1_t vd, vfloat32m2_t vs2,
                                     size_t vl);
vuint16m2_t __riscv_vfncvt_xu_tu(vuint16m2_t vd, vfloat32m4_t vs2, size_t vl);
vuint16m2_t __riscv_vfncvt_rtz_xu_tu(vuint16m2_t vd, vfloat32m4_t vs2,
                                     size_t vl);
vuint16m4_t __riscv_vfncvt_xu_tu(vuint16m4_t vd, vfloat32m8_t vs2, size_t vl);
vuint16m4_t __riscv_vfncvt_rtz_xu_tu(vuint16m4_t vd, vfloat32m8_t vs2,
                                     size_t vl);
vfloat16mf4_t __riscv_vfncvt_f_tu(vfloat16mf4_t vd, vint32mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_tu(vfloat16mf2_t vd, vint32m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_tu(vfloat16m1_t vd, vint32m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_tu(vfloat16m2_t vd, vint32m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_tu(vfloat16m4_t vd, vint32m8_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfncvt_f_tu(vfloat16mf4_t vd, vuint32mf2_t vs2,
                                  size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_tu(vfloat16mf2_t vd, vuint32m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_tu(vfloat16m1_t vd, vuint32m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_tu(vfloat16m2_t vd, vuint32m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_tu(vfloat16m4_t vd, vuint32m8_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfncvt_f_tu(vfloat16mf4_t vd, vfloat32mf2_t vs2,
                                  size_t vl);
vfloat16mf4_t __riscv_vfncvt_rod_f_tu(vfloat16mf4_t vd, vfloat32mf2_t vs2,
                                      size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_tu(vfloat16mf2_t vd, vfloat32m1_t vs2,
                                  size_t vl);
vfloat16mf2_t __riscv_vfncvt_rod_f_tu(vfloat16mf2_t vd, vfloat32m1_t vs2,
                                      size_t vl);
vfloat16m1_t __riscv_vfncvt_f_tu(vfloat16m1_t vd, vfloat32m2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfncvt_rod_f_tu(vfloat16m1_t vd, vfloat32m2_t vs2,
                                     size_t vl);
vfloat16m2_t __riscv_vfncvt_f_tu(vfloat16m2_t vd, vfloat32m4_t vs2, size_t vl);
vfloat16m2_t __riscv_vfncvt_rod_f_tu(vfloat16m2_t vd, vfloat32m4_t vs2,
                                     size_t vl);
vfloat16m4_t __riscv_vfncvt_f_tu(vfloat16m4_t vd, vfloat32m8_t vs2, size_t vl);
vfloat16m4_t __riscv_vfncvt_rod_f_tu(vfloat16m4_t vd, vfloat32m8_t vs2,
                                     size_t vl);
vint32mf2_t __riscv_vfncvt_x_tu(vint32mf2_t vd, vfloat64m1_t vs2, size_t vl);
vint32mf2_t __riscv_vfncvt_rtz_x_tu(vint32mf2_t vd, vfloat64m1_t vs2,
                                    size_t vl);
vint32m1_t __riscv_vfncvt_x_tu(vint32m1_t vd, vfloat64m2_t vs2, size_t vl);
vint32m1_t __riscv_vfncvt_rtz_x_tu(vint32m1_t vd, vfloat64m2_t vs2, size_t vl);
vint32m2_t __riscv_vfncvt_x_tu(vint32m2_t vd, vfloat64m4_t vs2, size_t vl);
vint32m2_t __riscv_vfncvt_rtz_x_tu(vint32m2_t vd, vfloat64m4_t vs2, size_t vl);
vint32m4_t __riscv_vfncvt_x_tu(vint32m4_t vd, vfloat64m8_t vs2, size_t vl);
vint32m4_t __riscv_vfncvt_rtz_x_tu(vint32m4_t vd, vfloat64m8_t vs2, size_t vl);
vuint32mf2_t __riscv_vfncvt_xu_tu(vuint32mf2_t vd, vfloat64m1_t vs2, size_t vl);
vuint32mf2_t __riscv_vfncvt_rtz_xu_tu(vuint32mf2_t vd, vfloat64m1_t vs2,
                                      size_t vl);
vuint32m1_t __riscv_vfncvt_xu_tu(vuint32m1_t vd, vfloat64m2_t vs2, size_t vl);
vuint32m1_t __riscv_vfncvt_rtz_xu_tu(vuint32m1_t vd, vfloat64m2_t vs2,
                                     size_t vl);
vuint32m2_t __riscv_vfncvt_xu_tu(vuint32m2_t vd, vfloat64m4_t vs2, size_t vl);
vuint32m2_t __riscv_vfncvt_rtz_xu_tu(vuint32m2_t vd, vfloat64m4_t vs2,
                                     size_t vl);
vuint32m4_t __riscv_vfncvt_xu_tu(vuint32m4_t vd, vfloat64m8_t vs2, size_t vl);
vuint32m4_t __riscv_vfncvt_rtz_xu_tu(vuint32m4_t vd, vfloat64m8_t vs2,
                                     size_t vl);
vfloat32mf2_t __riscv_vfncvt_f_tu(vfloat32mf2_t vd, vint64m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_tu(vfloat32m1_t vd, vint64m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_tu(vfloat32m2_t vd, vint64m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_tu(vfloat32m4_t vd, vint64m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfncvt_f_tu(vfloat32mf2_t vd, vuint64m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_tu(vfloat32m1_t vd, vuint64m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_tu(vfloat32m2_t vd, vuint64m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_tu(vfloat32m4_t vd, vuint64m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfncvt_f_tu(vfloat32mf2_t vd, vfloat64m1_t vs2,
                                  size_t vl);
vfloat32mf2_t __riscv_vfncvt_rod_f_tu(vfloat32mf2_t vd, vfloat64m1_t vs2,
                                      size_t vl);
vfloat32m1_t __riscv_vfncvt_f_tu(vfloat32m1_t vd, vfloat64m2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfncvt_rod_f_tu(vfloat32m1_t vd, vfloat64m2_t vs2,
                                     size_t vl);
vfloat32m2_t __riscv_vfncvt_f_tu(vfloat32m2_t vd, vfloat64m4_t vs2, size_t vl);
vfloat32m2_t __riscv_vfncvt_rod_f_tu(vfloat32m2_t vd, vfloat64m4_t vs2,
                                     size_t vl);
vfloat32m4_t __riscv_vfncvt_f_tu(vfloat32m4_t vd, vfloat64m8_t vs2, size_t vl);
vfloat32m4_t __riscv_vfncvt_rod_f_tu(vfloat32m4_t vd, vfloat64m8_t vs2,
                                     size_t vl);
// masked functions: _tum variants of vfncvt.
// Parameters, in order: mask vm, operand vd (same type as the return value),
// source vs2, and size_t vl. The elements of vs2 are twice as wide as those of
// the result (e.g. float16 -> 8-bit integer, 64-bit integer -> float32).
// Where an _rtz_x, _rtz_xu or _rod_f overload exists, it directly follows the
// plain _x, _xu or _f overload that has the same parameter types.
vint8mf8_t __riscv_vfncvt_x_tum(vbool64_t vm, vint8mf8_t vd, vfloat16mf4_t vs2,
                                size_t vl);
vint8mf8_t __riscv_vfncvt_rtz_x_tum(vbool64_t vm, vint8mf8_t vd,
                                    vfloat16mf4_t vs2, size_t vl);
vint8mf4_t __riscv_vfncvt_x_tum(vbool32_t vm, vint8mf4_t vd, vfloat16mf2_t vs2,
                                size_t vl);
vint8mf4_t __riscv_vfncvt_rtz_x_tum(vbool32_t vm, vint8mf4_t vd,
                                    vfloat16mf2_t vs2, size_t vl);
vint8mf2_t __riscv_vfncvt_x_tum(vbool16_t vm, vint8mf2_t vd, vfloat16m1_t vs2,
                                size_t vl);
vint8mf2_t __riscv_vfncvt_rtz_x_tum(vbool16_t vm, vint8mf2_t vd,
                                    vfloat16m1_t vs2, size_t vl);
vint8m1_t __riscv_vfncvt_x_tum(vbool8_t vm, vint8m1_t vd, vfloat16m2_t vs2,
                               size_t vl);
vint8m1_t __riscv_vfncvt_rtz_x_tum(vbool8_t vm, vint8m1_t vd, vfloat16m2_t vs2,
                                   size_t vl);
vint8m2_t __riscv_vfncvt_x_tum(vbool4_t vm, vint8m2_t vd, vfloat16m4_t vs2,
                               size_t vl);
vint8m2_t __riscv_vfncvt_rtz_x_tum(vbool4_t vm, vint8m2_t vd, vfloat16m4_t vs2,
                                   size_t vl);
vint8m4_t __riscv_vfncvt_x_tum(vbool2_t vm, vint8m4_t vd, vfloat16m8_t vs2,
                               size_t vl);
vint8m4_t __riscv_vfncvt_rtz_x_tum(vbool2_t vm, vint8m4_t vd, vfloat16m8_t vs2,
                                   size_t vl);
vuint8mf8_t __riscv_vfncvt_xu_tum(vbool64_t vm, vuint8mf8_t vd,
                                  vfloat16mf4_t vs2, size_t vl);
vuint8mf8_t __riscv_vfncvt_rtz_xu_tum(vbool64_t vm, vuint8mf8_t vd,
                                      vfloat16mf4_t vs2, size_t vl);
vuint8mf4_t __riscv_vfncvt_xu_tum(vbool32_t vm, vuint8mf4_t vd,
                                  vfloat16mf2_t vs2, size_t vl);
vuint8mf4_t __riscv_vfncvt_rtz_xu_tum(vbool32_t vm, vuint8mf4_t vd,
                                      vfloat16mf2_t vs2, size_t vl);
vuint8mf2_t __riscv_vfncvt_xu_tum(vbool16_t vm, vuint8mf2_t vd,
                                  vfloat16m1_t vs2, size_t vl);
vuint8mf2_t __riscv_vfncvt_rtz_xu_tum(vbool16_t vm, vuint8mf2_t vd,
                                      vfloat16m1_t vs2, size_t vl);
vuint8m1_t __riscv_vfncvt_xu_tum(vbool8_t vm, vuint8m1_t vd, vfloat16m2_t vs2,
                                 size_t vl);
vuint8m1_t __riscv_vfncvt_rtz_xu_tum(vbool8_t vm, vuint8m1_t vd,
                                     vfloat16m2_t vs2, size_t vl);
vuint8m2_t __riscv_vfncvt_xu_tum(vbool4_t vm, vuint8m2_t vd, vfloat16m4_t vs2,
                                 size_t vl);
vuint8m2_t __riscv_vfncvt_rtz_xu_tum(vbool4_t vm, vuint8m2_t vd,
                                     vfloat16m4_t vs2, size_t vl);
vuint8m4_t __riscv_vfncvt_xu_tum(vbool2_t vm, vuint8m4_t vd, vfloat16m8_t vs2,
                                 size_t vl);
vuint8m4_t __riscv_vfncvt_rtz_xu_tum(vbool2_t vm, vuint8m4_t vd,
                                     vfloat16m8_t vs2, size_t vl);
vint16mf4_t __riscv_vfncvt_x_tum(vbool64_t vm, vint16mf4_t vd,
                                 vfloat32mf2_t vs2, size_t vl);
vint16mf4_t __riscv_vfncvt_rtz_x_tum(vbool64_t vm, vint16mf4_t vd,
                                     vfloat32mf2_t vs2, size_t vl);
vint16mf2_t __riscv_vfncvt_x_tum(vbool32_t vm, vint16mf2_t vd, vfloat32m1_t vs2,
                                 size_t vl);
vint16mf2_t __riscv_vfncvt_rtz_x_tum(vbool32_t vm, vint16mf2_t vd,
                                     vfloat32m1_t vs2, size_t vl);
vint16m1_t __riscv_vfncvt_x_tum(vbool16_t vm, vint16m1_t vd, vfloat32m2_t vs2,
                                size_t vl);
vint16m1_t __riscv_vfncvt_rtz_x_tum(vbool16_t vm, vint16m1_t vd,
                                    vfloat32m2_t vs2, size_t vl);
vint16m2_t __riscv_vfncvt_x_tum(vbool8_t vm, vint16m2_t vd, vfloat32m4_t vs2,
                                size_t vl);
vint16m2_t __riscv_vfncvt_rtz_x_tum(vbool8_t vm, vint16m2_t vd,
                                    vfloat32m4_t vs2, size_t vl);
vint16m4_t __riscv_vfncvt_x_tum(vbool4_t vm, vint16m4_t vd, vfloat32m8_t vs2,
                                size_t vl);
vint16m4_t __riscv_vfncvt_rtz_x_tum(vbool4_t vm, vint16m4_t vd,
                                    vfloat32m8_t vs2, size_t vl);
vuint16mf4_t __riscv_vfncvt_xu_tum(vbool64_t vm, vuint16mf4_t vd,
                                   vfloat32mf2_t vs2, size_t vl);
vuint16mf4_t __riscv_vfncvt_rtz_xu_tum(vbool64_t vm, vuint16mf4_t vd,
                                       vfloat32mf2_t vs2, size_t vl);
vuint16mf2_t __riscv_vfncvt_xu_tum(vbool32_t vm, vuint16mf2_t vd,
                                   vfloat32m1_t vs2, size_t vl);
vuint16mf2_t __riscv_vfncvt_rtz_xu_tum(vbool32_t vm, vuint16mf2_t vd,
                                       vfloat32m1_t vs2, size_t vl);
vuint16m1_t __riscv_vfncvt_xu_tum(vbool16_t vm, vuint16m1_t vd,
                                  vfloat32m2_t vs2, size_t vl);
vuint16m1_t __riscv_vfncvt_rtz_xu_tum(vbool16_t vm, vuint16m1_t vd,
                                      vfloat32m2_t vs2, size_t vl);
vuint16m2_t __riscv_vfncvt_xu_tum(vbool8_t vm, vuint16m2_t vd, vfloat32m4_t vs2,
                                  size_t vl);
vuint16m2_t __riscv_vfncvt_rtz_xu_tum(vbool8_t vm, vuint16m2_t vd,
                                      vfloat32m4_t vs2, size_t vl);
vuint16m4_t __riscv_vfncvt_xu_tum(vbool4_t vm, vuint16m4_t vd, vfloat32m8_t vs2,
                                  size_t vl);
vuint16m4_t __riscv_vfncvt_rtz_xu_tum(vbool4_t vm, vuint16m4_t vd,
                                      vfloat32m8_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfncvt_f_tum(vbool64_t vm, vfloat16mf4_t vd,
                                   vint32mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_tum(vbool32_t vm, vfloat16mf2_t vd,
                                   vint32m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_tum(vbool16_t vm, vfloat16m1_t vd, vint32m2_t vs2,
                                  size_t vl);
vfloat16m2_t __riscv_vfncvt_f_tum(vbool8_t vm, vfloat16m2_t vd, vint32m4_t vs2,
                                  size_t vl);
vfloat16m4_t __riscv_vfncvt_f_tum(vbool4_t vm, vfloat16m4_t vd, vint32m8_t vs2,
                                  size_t vl);
vfloat16mf4_t __riscv_vfncvt_f_tum(vbool64_t vm, vfloat16mf4_t vd,
                                   vuint32mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_tum(vbool32_t vm, vfloat16mf2_t vd,
                                   vuint32m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_tum(vbool16_t vm, vfloat16m1_t vd,
                                  vuint32m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_tum(vbool8_t vm, vfloat16m2_t vd, vuint32m4_t vs2,
                                  size_t vl);
vfloat16m4_t __riscv_vfncvt_f_tum(vbool4_t vm, vfloat16m4_t vd, vuint32m8_t vs2,
                                  size_t vl);
vfloat16mf4_t __riscv_vfncvt_f_tum(vbool64_t vm, vfloat16mf4_t vd,
                                   vfloat32mf2_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfncvt_rod_f_tum(vbool64_t vm, vfloat16mf4_t vd,
                                       vfloat32mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_tum(vbool32_t vm, vfloat16mf2_t vd,
                                   vfloat32m1_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfncvt_rod_f_tum(vbool32_t vm, vfloat16mf2_t vd,
                                       vfloat32m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_tum(vbool16_t vm, vfloat16m1_t vd,
                                  vfloat32m2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfncvt_rod_f_tum(vbool16_t vm, vfloat16m1_t vd,
                                      vfloat32m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_tum(vbool8_t vm, vfloat16m2_t vd,
                                  vfloat32m4_t vs2, size_t vl);
vfloat16m2_t __riscv_vfncvt_rod_f_tum(vbool8_t vm, vfloat16m2_t vd,
                                      vfloat32m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_tum(vbool4_t vm, vfloat16m4_t vd,
                                  vfloat32m8_t vs2, size_t vl);
vfloat16m4_t __riscv_vfncvt_rod_f_tum(vbool4_t vm, vfloat16m4_t vd,
                                      vfloat32m8_t vs2, size_t vl);
vint32mf2_t __riscv_vfncvt_x_tum(vbool64_t vm, vint32mf2_t vd, vfloat64m1_t vs2,
                                 size_t vl);
vint32mf2_t __riscv_vfncvt_rtz_x_tum(vbool64_t vm, vint32mf2_t vd,
                                     vfloat64m1_t vs2, size_t vl);
vint32m1_t __riscv_vfncvt_x_tum(vbool32_t vm, vint32m1_t vd, vfloat64m2_t vs2,
                                size_t vl);
vint32m1_t __riscv_vfncvt_rtz_x_tum(vbool32_t vm, vint32m1_t vd,
                                    vfloat64m2_t vs2, size_t vl);
vint32m2_t __riscv_vfncvt_x_tum(vbool16_t vm, vint32m2_t vd, vfloat64m4_t vs2,
                                size_t vl);
vint32m2_t __riscv_vfncvt_rtz_x_tum(vbool16_t vm, vint32m2_t vd,
                                    vfloat64m4_t vs2, size_t vl);
vint32m4_t __riscv_vfncvt_x_tum(vbool8_t vm, vint32m4_t vd, vfloat64m8_t vs2,
                                size_t vl);
vint32m4_t __riscv_vfncvt_rtz_x_tum(vbool8_t vm, vint32m4_t vd,
                                    vfloat64m8_t vs2, size_t vl);
vuint32mf2_t __riscv_vfncvt_xu_tum(vbool64_t vm, vuint32mf2_t vd,
                                   vfloat64m1_t vs2, size_t vl);
vuint32mf2_t __riscv_vfncvt_rtz_xu_tum(vbool64_t vm, vuint32mf2_t vd,
                                       vfloat64m1_t vs2, size_t vl);
vuint32m1_t __riscv_vfncvt_xu_tum(vbool32_t vm, vuint32m1_t vd,
                                  vfloat64m2_t vs2, size_t vl);
vuint32m1_t __riscv_vfncvt_rtz_xu_tum(vbool32_t vm, vuint32m1_t vd,
                                      vfloat64m2_t vs2, size_t vl);
vuint32m2_t __riscv_vfncvt_xu_tum(vbool16_t vm, vuint32m2_t vd,
                                  vfloat64m4_t vs2, size_t vl);
vuint32m2_t __riscv_vfncvt_rtz_xu_tum(vbool16_t vm, vuint32m2_t vd,
                                      vfloat64m4_t vs2, size_t vl);
vuint32m4_t __riscv_vfncvt_xu_tum(vbool8_t vm, vuint32m4_t vd, vfloat64m8_t vs2,
                                  size_t vl);
vuint32m4_t __riscv_vfncvt_rtz_xu_tum(vbool8_t vm, vuint32m4_t vd,
                                      vfloat64m8_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfncvt_f_tum(vbool64_t vm, vfloat32mf2_t vd,
                                   vint64m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_tum(vbool32_t vm, vfloat32m1_t vd, vint64m2_t vs2,
                                  size_t vl);
vfloat32m2_t __riscv_vfncvt_f_tum(vbool16_t vm, vfloat32m2_t vd, vint64m4_t vs2,
                                  size_t vl);
vfloat32m4_t __riscv_vfncvt_f_tum(vbool8_t vm, vfloat32m4_t vd, vint64m8_t vs2,
                                  size_t vl);
vfloat32mf2_t __riscv_vfncvt_f_tum(vbool64_t vm, vfloat32mf2_t vd,
                                   vuint64m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_tum(vbool32_t vm, vfloat32m1_t vd,
                                  vuint64m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_tum(vbool16_t vm, vfloat32m2_t vd,
                                  vuint64m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_tum(vbool8_t vm, vfloat32m4_t vd, vuint64m8_t vs2,
                                  size_t vl);
vfloat32mf2_t __riscv_vfncvt_f_tum(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat64m1_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfncvt_rod_f_tum(vbool64_t vm, vfloat32mf2_t vd,
                                       vfloat64m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_tum(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat64m2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfncvt_rod_f_tum(vbool32_t vm, vfloat32m1_t vd,
                                      vfloat64m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_tum(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat64m4_t vs2, size_t vl);
vfloat32m2_t __riscv_vfncvt_rod_f_tum(vbool16_t vm, vfloat32m2_t vd,
                                      vfloat64m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_tum(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat64m8_t vs2, size_t vl);
vfloat32m4_t __riscv_vfncvt_rod_f_tum(vbool8_t vm, vfloat32m4_t vd,
                                      vfloat64m8_t vs2, size_t vl);
// masked functions (_tumu-suffixed overloads; each takes a mask `vm`)
// _tumu overloads: vfloat16 source -> 8-bit integer result.
// Parameters are (vm, vd, vs2, vl); vd has the same type as the return value.
// Each LMUL is listed as a plain / rtz_ pair.
// NOTE(review): rtz_ presumably selects the round-towards-zero form; confirm
// against the RVV specification.
// Signed results (vint8*):
vint8mf8_t __riscv_vfncvt_x_tumu(vbool64_t vm, vint8mf8_t vd, vfloat16mf4_t vs2,
                                 size_t vl);
vint8mf8_t __riscv_vfncvt_rtz_x_tumu(vbool64_t vm, vint8mf8_t vd,
                                     vfloat16mf4_t vs2, size_t vl);
vint8mf4_t __riscv_vfncvt_x_tumu(vbool32_t vm, vint8mf4_t vd, vfloat16mf2_t vs2,
                                 size_t vl);
vint8mf4_t __riscv_vfncvt_rtz_x_tumu(vbool32_t vm, vint8mf4_t vd,
                                     vfloat16mf2_t vs2, size_t vl);
vint8mf2_t __riscv_vfncvt_x_tumu(vbool16_t vm, vint8mf2_t vd, vfloat16m1_t vs2,
                                 size_t vl);
vint8mf2_t __riscv_vfncvt_rtz_x_tumu(vbool16_t vm, vint8mf2_t vd,
                                     vfloat16m1_t vs2, size_t vl);
vint8m1_t __riscv_vfncvt_x_tumu(vbool8_t vm, vint8m1_t vd, vfloat16m2_t vs2,
                                size_t vl);
vint8m1_t __riscv_vfncvt_rtz_x_tumu(vbool8_t vm, vint8m1_t vd, vfloat16m2_t vs2,
                                    size_t vl);
vint8m2_t __riscv_vfncvt_x_tumu(vbool4_t vm, vint8m2_t vd, vfloat16m4_t vs2,
                                size_t vl);
vint8m2_t __riscv_vfncvt_rtz_x_tumu(vbool4_t vm, vint8m2_t vd, vfloat16m4_t vs2,
                                    size_t vl);
vint8m4_t __riscv_vfncvt_x_tumu(vbool2_t vm, vint8m4_t vd, vfloat16m8_t vs2,
                                size_t vl);
vint8m4_t __riscv_vfncvt_rtz_x_tumu(vbool2_t vm, vint8m4_t vd, vfloat16m8_t vs2,
                                    size_t vl);
// Unsigned results (vuint8*):
vuint8mf8_t __riscv_vfncvt_xu_tumu(vbool64_t vm, vuint8mf8_t vd,
                                   vfloat16mf4_t vs2, size_t vl);
vuint8mf8_t __riscv_vfncvt_rtz_xu_tumu(vbool64_t vm, vuint8mf8_t vd,
                                       vfloat16mf4_t vs2, size_t vl);
vuint8mf4_t __riscv_vfncvt_xu_tumu(vbool32_t vm, vuint8mf4_t vd,
                                   vfloat16mf2_t vs2, size_t vl);
vuint8mf4_t __riscv_vfncvt_rtz_xu_tumu(vbool32_t vm, vuint8mf4_t vd,
                                       vfloat16mf2_t vs2, size_t vl);
vuint8mf2_t __riscv_vfncvt_xu_tumu(vbool16_t vm, vuint8mf2_t vd,
                                   vfloat16m1_t vs2, size_t vl);
vuint8mf2_t __riscv_vfncvt_rtz_xu_tumu(vbool16_t vm, vuint8mf2_t vd,
                                       vfloat16m1_t vs2, size_t vl);
vuint8m1_t __riscv_vfncvt_xu_tumu(vbool8_t vm, vuint8m1_t vd, vfloat16m2_t vs2,
                                  size_t vl);
vuint8m1_t __riscv_vfncvt_rtz_xu_tumu(vbool8_t vm, vuint8m1_t vd,
                                      vfloat16m2_t vs2, size_t vl);
vuint8m2_t __riscv_vfncvt_xu_tumu(vbool4_t vm, vuint8m2_t vd, vfloat16m4_t vs2,
                                  size_t vl);
vuint8m2_t __riscv_vfncvt_rtz_xu_tumu(vbool4_t vm, vuint8m2_t vd,
                                      vfloat16m4_t vs2, size_t vl);
vuint8m4_t __riscv_vfncvt_xu_tumu(vbool2_t vm, vuint8m4_t vd, vfloat16m8_t vs2,
                                  size_t vl);
vuint8m4_t __riscv_vfncvt_rtz_xu_tumu(vbool2_t vm, vuint8m4_t vd,
                                      vfloat16m8_t vs2, size_t vl);
// _tumu overloads: vfloat32 source -> 16-bit integer result.
// Parameters are (vm, vd, vs2, vl); vd has the same type as the return value.
// Each LMUL is listed as a plain / rtz_ pair.
// Signed results (vint16*):
vint16mf4_t __riscv_vfncvt_x_tumu(vbool64_t vm, vint16mf4_t vd,
                                  vfloat32mf2_t vs2, size_t vl);
vint16mf4_t __riscv_vfncvt_rtz_x_tumu(vbool64_t vm, vint16mf4_t vd,
                                      vfloat32mf2_t vs2, size_t vl);
vint16mf2_t __riscv_vfncvt_x_tumu(vbool32_t vm, vint16mf2_t vd,
                                  vfloat32m1_t vs2, size_t vl);
vint16mf2_t __riscv_vfncvt_rtz_x_tumu(vbool32_t vm, vint16mf2_t vd,
                                      vfloat32m1_t vs2, size_t vl);
vint16m1_t __riscv_vfncvt_x_tumu(vbool16_t vm, vint16m1_t vd, vfloat32m2_t vs2,
                                 size_t vl);
vint16m1_t __riscv_vfncvt_rtz_x_tumu(vbool16_t vm, vint16m1_t vd,
                                     vfloat32m2_t vs2, size_t vl);
vint16m2_t __riscv_vfncvt_x_tumu(vbool8_t vm, vint16m2_t vd, vfloat32m4_t vs2,
                                 size_t vl);
vint16m2_t __riscv_vfncvt_rtz_x_tumu(vbool8_t vm, vint16m2_t vd,
                                     vfloat32m4_t vs2, size_t vl);
vint16m4_t __riscv_vfncvt_x_tumu(vbool4_t vm, vint16m4_t vd, vfloat32m8_t vs2,
                                 size_t vl);
vint16m4_t __riscv_vfncvt_rtz_x_tumu(vbool4_t vm, vint16m4_t vd,
                                     vfloat32m8_t vs2, size_t vl);
// Unsigned results (vuint16*):
vuint16mf4_t __riscv_vfncvt_xu_tumu(vbool64_t vm, vuint16mf4_t vd,
                                    vfloat32mf2_t vs2, size_t vl);
vuint16mf4_t __riscv_vfncvt_rtz_xu_tumu(vbool64_t vm, vuint16mf4_t vd,
                                        vfloat32mf2_t vs2, size_t vl);
vuint16mf2_t __riscv_vfncvt_xu_tumu(vbool32_t vm, vuint16mf2_t vd,
                                    vfloat32m1_t vs2, size_t vl);
vuint16mf2_t __riscv_vfncvt_rtz_xu_tumu(vbool32_t vm, vuint16mf2_t vd,
                                        vfloat32m1_t vs2, size_t vl);
vuint16m1_t __riscv_vfncvt_xu_tumu(vbool16_t vm, vuint16m1_t vd,
                                   vfloat32m2_t vs2, size_t vl);
vuint16m1_t __riscv_vfncvt_rtz_xu_tumu(vbool16_t vm, vuint16m1_t vd,
                                       vfloat32m2_t vs2, size_t vl);
vuint16m2_t __riscv_vfncvt_xu_tumu(vbool8_t vm, vuint16m2_t vd,
                                   vfloat32m4_t vs2, size_t vl);
vuint16m2_t __riscv_vfncvt_rtz_xu_tumu(vbool8_t vm, vuint16m2_t vd,
                                       vfloat32m4_t vs2, size_t vl);
vuint16m4_t __riscv_vfncvt_xu_tumu(vbool4_t vm, vuint16m4_t vd,
                                   vfloat32m8_t vs2, size_t vl);
vuint16m4_t __riscv_vfncvt_rtz_xu_tumu(vbool4_t vm, vuint16m4_t vd,
                                       vfloat32m8_t vs2, size_t vl);
// _tumu overloads producing vfloat16 results from 32-bit sources.
// Parameters are (vm, vd, vs2, vl); vd has the same type as the return value.
// vint32 source:
vfloat16mf4_t __riscv_vfncvt_f_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                    vint32mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                    vint32m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_tumu(vbool16_t vm, vfloat16m1_t vd,
                                   vint32m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_tumu(vbool8_t vm, vfloat16m2_t vd, vint32m4_t vs2,
                                   size_t vl);
vfloat16m4_t __riscv_vfncvt_f_tumu(vbool4_t vm, vfloat16m4_t vd, vint32m8_t vs2,
                                   size_t vl);
// vuint32 source:
vfloat16mf4_t __riscv_vfncvt_f_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                    vuint32mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                    vuint32m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_tumu(vbool16_t vm, vfloat16m1_t vd,
                                   vuint32m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_tumu(vbool8_t vm, vfloat16m2_t vd,
                                   vuint32m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_tumu(vbool4_t vm, vfloat16m4_t vd,
                                   vuint32m8_t vs2, size_t vl);
// vfloat32 source, listed as a plain / rod_ pair per LMUL.
// NOTE(review): rod_ presumably selects the round-to-odd form; confirm against
// the RVV specification.
vfloat16mf4_t __riscv_vfncvt_f_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                    vfloat32mf2_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfncvt_rod_f_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                        vfloat32mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                    vfloat32m1_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfncvt_rod_f_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                        vfloat32m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_tumu(vbool16_t vm, vfloat16m1_t vd,
                                   vfloat32m2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfncvt_rod_f_tumu(vbool16_t vm, vfloat16m1_t vd,
                                       vfloat32m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_tumu(vbool8_t vm, vfloat16m2_t vd,
                                   vfloat32m4_t vs2, size_t vl);
vfloat16m2_t __riscv_vfncvt_rod_f_tumu(vbool8_t vm, vfloat16m2_t vd,
                                       vfloat32m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_tumu(vbool4_t vm, vfloat16m4_t vd,
                                   vfloat32m8_t vs2, size_t vl);
vfloat16m4_t __riscv_vfncvt_rod_f_tumu(vbool4_t vm, vfloat16m4_t vd,
                                       vfloat32m8_t vs2, size_t vl);
// _tumu overloads: vfloat64 source -> 32-bit integer result.
// Parameters are (vm, vd, vs2, vl); vd has the same type as the return value.
// Each LMUL is listed as a plain / rtz_ pair.
// Signed results (vint32*):
vint32mf2_t __riscv_vfncvt_x_tumu(vbool64_t vm, vint32mf2_t vd,
                                  vfloat64m1_t vs2, size_t vl);
vint32mf2_t __riscv_vfncvt_rtz_x_tumu(vbool64_t vm, vint32mf2_t vd,
                                      vfloat64m1_t vs2, size_t vl);
vint32m1_t __riscv_vfncvt_x_tumu(vbool32_t vm, vint32m1_t vd, vfloat64m2_t vs2,
                                 size_t vl);
vint32m1_t __riscv_vfncvt_rtz_x_tumu(vbool32_t vm, vint32m1_t vd,
                                     vfloat64m2_t vs2, size_t vl);
vint32m2_t __riscv_vfncvt_x_tumu(vbool16_t vm, vint32m2_t vd, vfloat64m4_t vs2,
                                 size_t vl);
vint32m2_t __riscv_vfncvt_rtz_x_tumu(vbool16_t vm, vint32m2_t vd,
                                     vfloat64m4_t vs2, size_t vl);
vint32m4_t __riscv_vfncvt_x_tumu(vbool8_t vm, vint32m4_t vd, vfloat64m8_t vs2,
                                 size_t vl);
vint32m4_t __riscv_vfncvt_rtz_x_tumu(vbool8_t vm, vint32m4_t vd,
                                     vfloat64m8_t vs2, size_t vl);
// Unsigned results (vuint32*):
vuint32mf2_t __riscv_vfncvt_xu_tumu(vbool64_t vm, vuint32mf2_t vd,
                                    vfloat64m1_t vs2, size_t vl);
vuint32mf2_t __riscv_vfncvt_rtz_xu_tumu(vbool64_t vm, vuint32mf2_t vd,
                                        vfloat64m1_t vs2, size_t vl);
vuint32m1_t __riscv_vfncvt_xu_tumu(vbool32_t vm, vuint32m1_t vd,
                                   vfloat64m2_t vs2, size_t vl);
vuint32m1_t __riscv_vfncvt_rtz_xu_tumu(vbool32_t vm, vuint32m1_t vd,
                                       vfloat64m2_t vs2, size_t vl);
vuint32m2_t __riscv_vfncvt_xu_tumu(vbool16_t vm, vuint32m2_t vd,
                                   vfloat64m4_t vs2, size_t vl);
vuint32m2_t __riscv_vfncvt_rtz_xu_tumu(vbool16_t vm, vuint32m2_t vd,
                                       vfloat64m4_t vs2, size_t vl);
vuint32m4_t __riscv_vfncvt_xu_tumu(vbool8_t vm, vuint32m4_t vd,
                                   vfloat64m8_t vs2, size_t vl);
vuint32m4_t __riscv_vfncvt_rtz_xu_tumu(vbool8_t vm, vuint32m4_t vd,
                                       vfloat64m8_t vs2, size_t vl);
// _tumu overloads producing vfloat32 results from 64-bit sources.
// Parameters are (vm, vd, vs2, vl); vd has the same type as the return value.
// vint64 source:
vfloat32mf2_t __riscv_vfncvt_f_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                    vint64m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_tumu(vbool32_t vm, vfloat32m1_t vd,
                                   vint64m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_tumu(vbool16_t vm, vfloat32m2_t vd,
                                   vint64m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_tumu(vbool8_t vm, vfloat32m4_t vd, vint64m8_t vs2,
                                   size_t vl);
// vuint64 source:
vfloat32mf2_t __riscv_vfncvt_f_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                    vuint64m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_tumu(vbool32_t vm, vfloat32m1_t vd,
                                   vuint64m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_tumu(vbool16_t vm, vfloat32m2_t vd,
                                   vuint64m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_tumu(vbool8_t vm, vfloat32m4_t vd,
                                   vuint64m8_t vs2, size_t vl);
// vfloat64 source, listed as a plain / rod_ pair per LMUL:
vfloat32mf2_t __riscv_vfncvt_f_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                    vfloat64m1_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfncvt_rod_f_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                        vfloat64m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_tumu(vbool32_t vm, vfloat32m1_t vd,
                                   vfloat64m2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfncvt_rod_f_tumu(vbool32_t vm, vfloat32m1_t vd,
                                       vfloat64m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_tumu(vbool16_t vm, vfloat32m2_t vd,
                                   vfloat64m4_t vs2, size_t vl);
vfloat32m2_t __riscv_vfncvt_rod_f_tumu(vbool16_t vm, vfloat32m2_t vd,
                                       vfloat64m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_tumu(vbool8_t vm, vfloat32m4_t vd,
                                   vfloat64m8_t vs2, size_t vl);
vfloat32m4_t __riscv_vfncvt_rod_f_tumu(vbool8_t vm, vfloat32m4_t vd,
                                       vfloat64m8_t vs2, size_t vl);
// masked functions (_mu-suffixed overloads; each takes a mask `vm`)
// _mu overloads: vfloat16 source -> 8-bit integer result.
// Parameters are (vm, vd, vs2, vl); vd has the same type as the return value.
// Each LMUL is listed as a plain / rtz_ pair.
// NOTE(review): rtz_ presumably selects the round-towards-zero form; confirm
// against the RVV specification.
// Signed results (vint8*):
vint8mf8_t __riscv_vfncvt_x_mu(vbool64_t vm, vint8mf8_t vd, vfloat16mf4_t vs2,
                               size_t vl);
vint8mf8_t __riscv_vfncvt_rtz_x_mu(vbool64_t vm, vint8mf8_t vd,
                                   vfloat16mf4_t vs2, size_t vl);
vint8mf4_t __riscv_vfncvt_x_mu(vbool32_t vm, vint8mf4_t vd, vfloat16mf2_t vs2,
                               size_t vl);
vint8mf4_t __riscv_vfncvt_rtz_x_mu(vbool32_t vm, vint8mf4_t vd,
                                   vfloat16mf2_t vs2, size_t vl);
vint8mf2_t __riscv_vfncvt_x_mu(vbool16_t vm, vint8mf2_t vd, vfloat16m1_t vs2,
                               size_t vl);
vint8mf2_t __riscv_vfncvt_rtz_x_mu(vbool16_t vm, vint8mf2_t vd,
                                   vfloat16m1_t vs2, size_t vl);
vint8m1_t __riscv_vfncvt_x_mu(vbool8_t vm, vint8m1_t vd, vfloat16m2_t vs2,
                              size_t vl);
vint8m1_t __riscv_vfncvt_rtz_x_mu(vbool8_t vm, vint8m1_t vd, vfloat16m2_t vs2,
                                  size_t vl);
vint8m2_t __riscv_vfncvt_x_mu(vbool4_t vm, vint8m2_t vd, vfloat16m4_t vs2,
                              size_t vl);
vint8m2_t __riscv_vfncvt_rtz_x_mu(vbool4_t vm, vint8m2_t vd, vfloat16m4_t vs2,
                                  size_t vl);
vint8m4_t __riscv_vfncvt_x_mu(vbool2_t vm, vint8m4_t vd, vfloat16m8_t vs2,
                              size_t vl);
vint8m4_t __riscv_vfncvt_rtz_x_mu(vbool2_t vm, vint8m4_t vd, vfloat16m8_t vs2,
                                  size_t vl);
// Unsigned results (vuint8*):
vuint8mf8_t __riscv_vfncvt_xu_mu(vbool64_t vm, vuint8mf8_t vd,
                                 vfloat16mf4_t vs2, size_t vl);
vuint8mf8_t __riscv_vfncvt_rtz_xu_mu(vbool64_t vm, vuint8mf8_t vd,
                                     vfloat16mf4_t vs2, size_t vl);
vuint8mf4_t __riscv_vfncvt_xu_mu(vbool32_t vm, vuint8mf4_t vd,
                                 vfloat16mf2_t vs2, size_t vl);
vuint8mf4_t __riscv_vfncvt_rtz_xu_mu(vbool32_t vm, vuint8mf4_t vd,
                                     vfloat16mf2_t vs2, size_t vl);
vuint8mf2_t __riscv_vfncvt_xu_mu(vbool16_t vm, vuint8mf2_t vd, vfloat16m1_t vs2,
                                 size_t vl);
vuint8mf2_t __riscv_vfncvt_rtz_xu_mu(vbool16_t vm, vuint8mf2_t vd,
                                     vfloat16m1_t vs2, size_t vl);
vuint8m1_t __riscv_vfncvt_xu_mu(vbool8_t vm, vuint8m1_t vd, vfloat16m2_t vs2,
                                size_t vl);
vuint8m1_t __riscv_vfncvt_rtz_xu_mu(vbool8_t vm, vuint8m1_t vd,
                                    vfloat16m2_t vs2, size_t vl);
vuint8m2_t __riscv_vfncvt_xu_mu(vbool4_t vm, vuint8m2_t vd, vfloat16m4_t vs2,
                                size_t vl);
vuint8m2_t __riscv_vfncvt_rtz_xu_mu(vbool4_t vm, vuint8m2_t vd,
                                    vfloat16m4_t vs2, size_t vl);
vuint8m4_t __riscv_vfncvt_xu_mu(vbool2_t vm, vuint8m4_t vd, vfloat16m8_t vs2,
                                size_t vl);
vuint8m4_t __riscv_vfncvt_rtz_xu_mu(vbool2_t vm, vuint8m4_t vd,
                                    vfloat16m8_t vs2, size_t vl);
// _mu overloads: vfloat32 source -> 16-bit integer result.
// Parameters are (vm, vd, vs2, vl); vd has the same type as the return value.
// Each LMUL is listed as a plain / rtz_ pair.
// Signed results (vint16*):
vint16mf4_t __riscv_vfncvt_x_mu(vbool64_t vm, vint16mf4_t vd, vfloat32mf2_t vs2,
                                size_t vl);
vint16mf4_t __riscv_vfncvt_rtz_x_mu(vbool64_t vm, vint16mf4_t vd,
                                    vfloat32mf2_t vs2, size_t vl);
vint16mf2_t __riscv_vfncvt_x_mu(vbool32_t vm, vint16mf2_t vd, vfloat32m1_t vs2,
                                size_t vl);
vint16mf2_t __riscv_vfncvt_rtz_x_mu(vbool32_t vm, vint16mf2_t vd,
                                    vfloat32m1_t vs2, size_t vl);
vint16m1_t __riscv_vfncvt_x_mu(vbool16_t vm, vint16m1_t vd, vfloat32m2_t vs2,
                               size_t vl);
vint16m1_t __riscv_vfncvt_rtz_x_mu(vbool16_t vm, vint16m1_t vd,
                                   vfloat32m2_t vs2, size_t vl);
vint16m2_t __riscv_vfncvt_x_mu(vbool8_t vm, vint16m2_t vd, vfloat32m4_t vs2,
                               size_t vl);
vint16m2_t __riscv_vfncvt_rtz_x_mu(vbool8_t vm, vint16m2_t vd, vfloat32m4_t vs2,
                                   size_t vl);
vint16m4_t __riscv_vfncvt_x_mu(vbool4_t vm, vint16m4_t vd, vfloat32m8_t vs2,
                               size_t vl);
vint16m4_t __riscv_vfncvt_rtz_x_mu(vbool4_t vm, vint16m4_t vd, vfloat32m8_t vs2,
                                   size_t vl);
// Unsigned results (vuint16*):
vuint16mf4_t __riscv_vfncvt_xu_mu(vbool64_t vm, vuint16mf4_t vd,
                                  vfloat32mf2_t vs2, size_t vl);
vuint16mf4_t __riscv_vfncvt_rtz_xu_mu(vbool64_t vm, vuint16mf4_t vd,
                                      vfloat32mf2_t vs2, size_t vl);
vuint16mf2_t __riscv_vfncvt_xu_mu(vbool32_t vm, vuint16mf2_t vd,
                                  vfloat32m1_t vs2, size_t vl);
vuint16mf2_t __riscv_vfncvt_rtz_xu_mu(vbool32_t vm, vuint16mf2_t vd,
                                      vfloat32m1_t vs2, size_t vl);
vuint16m1_t __riscv_vfncvt_xu_mu(vbool16_t vm, vuint16m1_t vd, vfloat32m2_t vs2,
                                 size_t vl);
vuint16m1_t __riscv_vfncvt_rtz_xu_mu(vbool16_t vm, vuint16m1_t vd,
                                     vfloat32m2_t vs2, size_t vl);
vuint16m2_t __riscv_vfncvt_xu_mu(vbool8_t vm, vuint16m2_t vd, vfloat32m4_t vs2,
                                 size_t vl);
vuint16m2_t __riscv_vfncvt_rtz_xu_mu(vbool8_t vm, vuint16m2_t vd,
                                     vfloat32m4_t vs2, size_t vl);
vuint16m4_t __riscv_vfncvt_xu_mu(vbool4_t vm, vuint16m4_t vd, vfloat32m8_t vs2,
                                 size_t vl);
vuint16m4_t __riscv_vfncvt_rtz_xu_mu(vbool4_t vm, vuint16m4_t vd,
                                     vfloat32m8_t vs2, size_t vl);
// _mu overloads producing vfloat16 results from 32-bit sources.
// Parameters are (vm, vd, vs2, vl); vd has the same type as the return value.
// vint32 source:
vfloat16mf4_t __riscv_vfncvt_f_mu(vbool64_t vm, vfloat16mf4_t vd,
                                  vint32mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_mu(vbool32_t vm, vfloat16mf2_t vd,
                                  vint32m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_mu(vbool16_t vm, vfloat16m1_t vd, vint32m2_t vs2,
                                 size_t vl);
vfloat16m2_t __riscv_vfncvt_f_mu(vbool8_t vm, vfloat16m2_t vd, vint32m4_t vs2,
                                 size_t vl);
vfloat16m4_t __riscv_vfncvt_f_mu(vbool4_t vm, vfloat16m4_t vd, vint32m8_t vs2,
                                 size_t vl);
// vuint32 source:
vfloat16mf4_t __riscv_vfncvt_f_mu(vbool64_t vm, vfloat16mf4_t vd,
                                  vuint32mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_mu(vbool32_t vm, vfloat16mf2_t vd,
                                  vuint32m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_mu(vbool16_t vm, vfloat16m1_t vd, vuint32m2_t vs2,
                                 size_t vl);
vfloat16m2_t __riscv_vfncvt_f_mu(vbool8_t vm, vfloat16m2_t vd, vuint32m4_t vs2,
                                 size_t vl);
vfloat16m4_t __riscv_vfncvt_f_mu(vbool4_t vm, vfloat16m4_t vd, vuint32m8_t vs2,
                                 size_t vl);
// vfloat32 source, listed as a plain / rod_ pair per LMUL.
// NOTE(review): rod_ presumably selects the round-to-odd form; confirm against
// the RVV specification.
vfloat16mf4_t __riscv_vfncvt_f_mu(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat32mf2_t vs2, size_t vl);
vfloat16mf4_t __riscv_vfncvt_rod_f_mu(vbool64_t vm, vfloat16mf4_t vd,
                                      vfloat32mf2_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_mu(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat32m1_t vs2, size_t vl);
vfloat16mf2_t __riscv_vfncvt_rod_f_mu(vbool32_t vm, vfloat16mf2_t vd,
                                      vfloat32m1_t vs2, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_mu(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat32m2_t vs2, size_t vl);
vfloat16m1_t __riscv_vfncvt_rod_f_mu(vbool16_t vm, vfloat16m1_t vd,
                                     vfloat32m2_t vs2, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_mu(vbool8_t vm, vfloat16m2_t vd, vfloat32m4_t vs2,
                                 size_t vl);
vfloat16m2_t __riscv_vfncvt_rod_f_mu(vbool8_t vm, vfloat16m2_t vd,
                                     vfloat32m4_t vs2, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_mu(vbool4_t vm, vfloat16m4_t vd, vfloat32m8_t vs2,
                                 size_t vl);
vfloat16m4_t __riscv_vfncvt_rod_f_mu(vbool4_t vm, vfloat16m4_t vd,
                                     vfloat32m8_t vs2, size_t vl);
// _mu overloads: vfloat64 source -> 32-bit integer result.
// Parameters are (vm, vd, vs2, vl); vd has the same type as the return value.
// Each LMUL is listed as a plain / rtz_ pair.
// Signed results (vint32*):
vint32mf2_t __riscv_vfncvt_x_mu(vbool64_t vm, vint32mf2_t vd, vfloat64m1_t vs2,
                                size_t vl);
vint32mf2_t __riscv_vfncvt_rtz_x_mu(vbool64_t vm, vint32mf2_t vd,
                                    vfloat64m1_t vs2, size_t vl);
vint32m1_t __riscv_vfncvt_x_mu(vbool32_t vm, vint32m1_t vd, vfloat64m2_t vs2,
                               size_t vl);
vint32m1_t __riscv_vfncvt_rtz_x_mu(vbool32_t vm, vint32m1_t vd,
                                   vfloat64m2_t vs2, size_t vl);
vint32m2_t __riscv_vfncvt_x_mu(vbool16_t vm, vint32m2_t vd, vfloat64m4_t vs2,
                               size_t vl);
vint32m2_t __riscv_vfncvt_rtz_x_mu(vbool16_t vm, vint32m2_t vd,
                                   vfloat64m4_t vs2, size_t vl);
vint32m4_t __riscv_vfncvt_x_mu(vbool8_t vm, vint32m4_t vd, vfloat64m8_t vs2,
                               size_t vl);
vint32m4_t __riscv_vfncvt_rtz_x_mu(vbool8_t vm, vint32m4_t vd, vfloat64m8_t vs2,
                                   size_t vl);
// Unsigned results (vuint32*):
vuint32mf2_t __riscv_vfncvt_xu_mu(vbool64_t vm, vuint32mf2_t vd,
                                  vfloat64m1_t vs2, size_t vl);
vuint32mf2_t __riscv_vfncvt_rtz_xu_mu(vbool64_t vm, vuint32mf2_t vd,
                                      vfloat64m1_t vs2, size_t vl);
vuint32m1_t __riscv_vfncvt_xu_mu(vbool32_t vm, vuint32m1_t vd, vfloat64m2_t vs2,
                                 size_t vl);
vuint32m1_t __riscv_vfncvt_rtz_xu_mu(vbool32_t vm, vuint32m1_t vd,
                                     vfloat64m2_t vs2, size_t vl);
vuint32m2_t __riscv_vfncvt_xu_mu(vbool16_t vm, vuint32m2_t vd, vfloat64m4_t vs2,
                                 size_t vl);
vuint32m2_t __riscv_vfncvt_rtz_xu_mu(vbool16_t vm, vuint32m2_t vd,
                                     vfloat64m4_t vs2, size_t vl);
vuint32m4_t __riscv_vfncvt_xu_mu(vbool8_t vm, vuint32m4_t vd, vfloat64m8_t vs2,
                                 size_t vl);
vuint32m4_t __riscv_vfncvt_rtz_xu_mu(vbool8_t vm, vuint32m4_t vd,
                                     vfloat64m8_t vs2, size_t vl);
// _mu overloads producing vfloat32 results from 64-bit sources.
// Parameters are (vm, vd, vs2, vl); vd has the same type as the return value.
// vint64 source:
vfloat32mf2_t __riscv_vfncvt_f_mu(vbool64_t vm, vfloat32mf2_t vd,
                                  vint64m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_mu(vbool32_t vm, vfloat32m1_t vd, vint64m2_t vs2,
                                 size_t vl);
vfloat32m2_t __riscv_vfncvt_f_mu(vbool16_t vm, vfloat32m2_t vd, vint64m4_t vs2,
                                 size_t vl);
vfloat32m4_t __riscv_vfncvt_f_mu(vbool8_t vm, vfloat32m4_t vd, vint64m8_t vs2,
                                 size_t vl);
// vuint64 source:
vfloat32mf2_t __riscv_vfncvt_f_mu(vbool64_t vm, vfloat32mf2_t vd,
                                  vuint64m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_mu(vbool32_t vm, vfloat32m1_t vd, vuint64m2_t vs2,
                                 size_t vl);
vfloat32m2_t __riscv_vfncvt_f_mu(vbool16_t vm, vfloat32m2_t vd, vuint64m4_t vs2,
                                 size_t vl);
vfloat32m4_t __riscv_vfncvt_f_mu(vbool8_t vm, vfloat32m4_t vd, vuint64m8_t vs2,
                                 size_t vl);
// vfloat64 source, listed as a plain / rod_ pair per LMUL:
vfloat32mf2_t __riscv_vfncvt_f_mu(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat64m1_t vs2, size_t vl);
vfloat32mf2_t __riscv_vfncvt_rod_f_mu(vbool64_t vm, vfloat32mf2_t vd,
                                      vfloat64m1_t vs2, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_mu(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat64m2_t vs2, size_t vl);
vfloat32m1_t __riscv_vfncvt_rod_f_mu(vbool32_t vm, vfloat32m1_t vd,
                                     vfloat64m2_t vs2, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_mu(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat64m4_t vs2, size_t vl);
vfloat32m2_t __riscv_vfncvt_rod_f_mu(vbool16_t vm, vfloat32m2_t vd,
                                     vfloat64m4_t vs2, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_mu(vbool8_t vm, vfloat32m4_t vd, vfloat64m8_t vs2,
                                 size_t vl);
vfloat32m4_t __riscv_vfncvt_rod_f_mu(vbool8_t vm, vfloat32m4_t vd,
                                     vfloat64m8_t vs2, size_t vl);
// Unmasked _tu overloads that take an explicit `frm` argument (no `vm`
// parameter): vfloat16 source -> 8-bit integer result.
// Parameters are (vd, vs2, frm, vl); vd has the same type as the return value.
// No rtz_ form is listed for these frm-taking overloads.
// NOTE(review): `frm` is presumably the floating-point rounding-mode selector;
// confirm against the RVV intrinsics specification.
// Signed results (vint8*):
vint8mf8_t __riscv_vfncvt_x_tu(vint8mf8_t vd, vfloat16mf4_t vs2,
                               unsigned int frm, size_t vl);
vint8mf4_t __riscv_vfncvt_x_tu(vint8mf4_t vd, vfloat16mf2_t vs2,
                               unsigned int frm, size_t vl);
vint8mf2_t __riscv_vfncvt_x_tu(vint8mf2_t vd, vfloat16m1_t vs2,
                               unsigned int frm, size_t vl);
vint8m1_t __riscv_vfncvt_x_tu(vint8m1_t vd, vfloat16m2_t vs2, unsigned int frm,
                              size_t vl);
vint8m2_t __riscv_vfncvt_x_tu(vint8m2_t vd, vfloat16m4_t vs2, unsigned int frm,
                              size_t vl);
vint8m4_t __riscv_vfncvt_x_tu(vint8m4_t vd, vfloat16m8_t vs2, unsigned int frm,
                              size_t vl);
// Unsigned results (vuint8*):
vuint8mf8_t __riscv_vfncvt_xu_tu(vuint8mf8_t vd, vfloat16mf4_t vs2,
                                 unsigned int frm, size_t vl);
vuint8mf4_t __riscv_vfncvt_xu_tu(vuint8mf4_t vd, vfloat16mf2_t vs2,
                                 unsigned int frm, size_t vl);
vuint8mf2_t __riscv_vfncvt_xu_tu(vuint8mf2_t vd, vfloat16m1_t vs2,
                                 unsigned int frm, size_t vl);
vuint8m1_t __riscv_vfncvt_xu_tu(vuint8m1_t vd, vfloat16m2_t vs2,
                                unsigned int frm, size_t vl);
vuint8m2_t __riscv_vfncvt_xu_tu(vuint8m2_t vd, vfloat16m4_t vs2,
                                unsigned int frm, size_t vl);
vuint8m4_t __riscv_vfncvt_xu_tu(vuint8m4_t vd, vfloat16m8_t vs2,
                                unsigned int frm, size_t vl);
// Unmasked _tu overloads with explicit `frm`: vfloat32 source -> 16-bit
// integer result. Parameters are (vd, vs2, frm, vl); vd has the same type as
// the return value.
// Signed results (vint16*):
vint16mf4_t __riscv_vfncvt_x_tu(vint16mf4_t vd, vfloat32mf2_t vs2,
                                unsigned int frm, size_t vl);
vint16mf2_t __riscv_vfncvt_x_tu(vint16mf2_t vd, vfloat32m1_t vs2,
                                unsigned int frm, size_t vl);
vint16m1_t __riscv_vfncvt_x_tu(vint16m1_t vd, vfloat32m2_t vs2,
                               unsigned int frm, size_t vl);
vint16m2_t __riscv_vfncvt_x_tu(vint16m2_t vd, vfloat32m4_t vs2,
                               unsigned int frm, size_t vl);
vint16m4_t __riscv_vfncvt_x_tu(vint16m4_t vd, vfloat32m8_t vs2,
                               unsigned int frm, size_t vl);
// Unsigned results (vuint16*):
vuint16mf4_t __riscv_vfncvt_xu_tu(vuint16mf4_t vd, vfloat32mf2_t vs2,
                                  unsigned int frm, size_t vl);
vuint16mf2_t __riscv_vfncvt_xu_tu(vuint16mf2_t vd, vfloat32m1_t vs2,
                                  unsigned int frm, size_t vl);
vuint16m1_t __riscv_vfncvt_xu_tu(vuint16m1_t vd, vfloat32m2_t vs2,
                                 unsigned int frm, size_t vl);
vuint16m2_t __riscv_vfncvt_xu_tu(vuint16m2_t vd, vfloat32m4_t vs2,
                                 unsigned int frm, size_t vl);
vuint16m4_t __riscv_vfncvt_xu_tu(vuint16m4_t vd, vfloat32m8_t vs2,
                                 unsigned int frm, size_t vl);
// Unmasked _tu overloads with explicit `frm`, producing vfloat16 results from
// 32-bit sources. Parameters are (vd, vs2, frm, vl); vd has the same type as
// the return value. No rod_ form is listed for these frm-taking overloads.
// vint32 source:
vfloat16mf4_t __riscv_vfncvt_f_tu(vfloat16mf4_t vd, vint32mf2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_tu(vfloat16mf2_t vd, vint32m1_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_tu(vfloat16m1_t vd, vint32m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_tu(vfloat16m2_t vd, vint32m4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_tu(vfloat16m4_t vd, vint32m8_t vs2,
                                 unsigned int frm, size_t vl);
// vuint32 source:
vfloat16mf4_t __riscv_vfncvt_f_tu(vfloat16mf4_t vd, vuint32mf2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_tu(vfloat16mf2_t vd, vuint32m1_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_tu(vfloat16m1_t vd, vuint32m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_tu(vfloat16m2_t vd, vuint32m4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_tu(vfloat16m4_t vd, vuint32m8_t vs2,
                                 unsigned int frm, size_t vl);
// vfloat32 source:
vfloat16mf4_t __riscv_vfncvt_f_tu(vfloat16mf4_t vd, vfloat32mf2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_tu(vfloat16mf2_t vd, vfloat32m1_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_tu(vfloat16m1_t vd, vfloat32m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_tu(vfloat16m2_t vd, vfloat32m4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_tu(vfloat16m4_t vd, vfloat32m8_t vs2,
                                 unsigned int frm, size_t vl);
// Unmasked _tu overloads with explicit `frm`: vfloat64 source -> 32-bit
// integer result. Parameters are (vd, vs2, frm, vl); vd has the same type as
// the return value.
// Signed results (vint32*):
vint32mf2_t __riscv_vfncvt_x_tu(vint32mf2_t vd, vfloat64m1_t vs2,
                                unsigned int frm, size_t vl);
vint32m1_t __riscv_vfncvt_x_tu(vint32m1_t vd, vfloat64m2_t vs2,
                               unsigned int frm, size_t vl);
vint32m2_t __riscv_vfncvt_x_tu(vint32m2_t vd, vfloat64m4_t vs2,
                               unsigned int frm, size_t vl);
vint32m4_t __riscv_vfncvt_x_tu(vint32m4_t vd, vfloat64m8_t vs2,
                               unsigned int frm, size_t vl);
// Unsigned results (vuint32*):
vuint32mf2_t __riscv_vfncvt_xu_tu(vuint32mf2_t vd, vfloat64m1_t vs2,
                                  unsigned int frm, size_t vl);
vuint32m1_t __riscv_vfncvt_xu_tu(vuint32m1_t vd, vfloat64m2_t vs2,
                                 unsigned int frm, size_t vl);
vuint32m2_t __riscv_vfncvt_xu_tu(vuint32m2_t vd, vfloat64m4_t vs2,
                                 unsigned int frm, size_t vl);
vuint32m4_t __riscv_vfncvt_xu_tu(vuint32m4_t vd, vfloat64m8_t vs2,
                                 unsigned int frm, size_t vl);
// Unmasked _tu overloads with explicit `frm`, producing vfloat32 results from
// 64-bit sources. Parameters are (vd, vs2, frm, vl); vd has the same type as
// the return value.
// vint64 source:
vfloat32mf2_t __riscv_vfncvt_f_tu(vfloat32mf2_t vd, vint64m1_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_tu(vfloat32m1_t vd, vint64m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_tu(vfloat32m2_t vd, vint64m4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_tu(vfloat32m4_t vd, vint64m8_t vs2,
                                 unsigned int frm, size_t vl);
// vuint64 source:
vfloat32mf2_t __riscv_vfncvt_f_tu(vfloat32mf2_t vd, vuint64m1_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_tu(vfloat32m1_t vd, vuint64m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_tu(vfloat32m2_t vd, vuint64m4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_tu(vfloat32m4_t vd, vuint64m8_t vs2,
                                 unsigned int frm, size_t vl);
// vfloat64 source:
vfloat32mf2_t __riscv_vfncvt_f_tu(vfloat32mf2_t vd, vfloat64m1_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_tu(vfloat32m1_t vd, vfloat64m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_tu(vfloat32m2_t vd, vfloat64m4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_tu(vfloat32m4_t vd, vfloat64m8_t vs2,
                                 unsigned int frm, size_t vl);
// masked functions (_tum policy: tail undisturbed, mask agnostic)
// _tum overloads narrowing float16 sources to 8-bit integer results.
// Each takes mask `vm`, operand `vd`, source `vs2`, `frm` and `vl`; the
// source element type is twice as wide as the result element type.
// float16 -> int8 (signed result)
vint8mf8_t __riscv_vfncvt_x_tum(vbool64_t vm, vint8mf8_t vd, vfloat16mf4_t vs2,
                                unsigned int frm, size_t vl);
vint8mf4_t __riscv_vfncvt_x_tum(vbool32_t vm, vint8mf4_t vd, vfloat16mf2_t vs2,
                                unsigned int frm, size_t vl);
vint8mf2_t __riscv_vfncvt_x_tum(vbool16_t vm, vint8mf2_t vd, vfloat16m1_t vs2,
                                unsigned int frm, size_t vl);
vint8m1_t __riscv_vfncvt_x_tum(vbool8_t vm, vint8m1_t vd, vfloat16m2_t vs2,
                               unsigned int frm, size_t vl);
vint8m2_t __riscv_vfncvt_x_tum(vbool4_t vm, vint8m2_t vd, vfloat16m4_t vs2,
                               unsigned int frm, size_t vl);
vint8m4_t __riscv_vfncvt_x_tum(vbool2_t vm, vint8m4_t vd, vfloat16m8_t vs2,
                               unsigned int frm, size_t vl);
// float16 -> uint8 (unsigned result)
vuint8mf8_t __riscv_vfncvt_xu_tum(vbool64_t vm, vuint8mf8_t vd,
                                  vfloat16mf4_t vs2, unsigned int frm,
                                  size_t vl);
vuint8mf4_t __riscv_vfncvt_xu_tum(vbool32_t vm, vuint8mf4_t vd,
                                  vfloat16mf2_t vs2, unsigned int frm,
                                  size_t vl);
vuint8mf2_t __riscv_vfncvt_xu_tum(vbool16_t vm, vuint8mf2_t vd,
                                  vfloat16m1_t vs2, unsigned int frm,
                                  size_t vl);
vuint8m1_t __riscv_vfncvt_xu_tum(vbool8_t vm, vuint8m1_t vd, vfloat16m2_t vs2,
                                 unsigned int frm, size_t vl);
vuint8m2_t __riscv_vfncvt_xu_tum(vbool4_t vm, vuint8m2_t vd, vfloat16m4_t vs2,
                                 unsigned int frm, size_t vl);
vuint8m4_t __riscv_vfncvt_xu_tum(vbool2_t vm, vuint8m4_t vd, vfloat16m8_t vs2,
                                 unsigned int frm, size_t vl);
// _tum overloads producing 16-bit results from 32-bit sources.
// Each takes mask `vm`, operand `vd`, source `vs2`, `frm` and `vl`.
// float32 -> int16 (signed result)
vint16mf4_t __riscv_vfncvt_x_tum(vbool64_t vm, vint16mf4_t vd,
                                 vfloat32mf2_t vs2, unsigned int frm,
                                 size_t vl);
vint16mf2_t __riscv_vfncvt_x_tum(vbool32_t vm, vint16mf2_t vd, vfloat32m1_t vs2,
                                 unsigned int frm, size_t vl);
vint16m1_t __riscv_vfncvt_x_tum(vbool16_t vm, vint16m1_t vd, vfloat32m2_t vs2,
                                unsigned int frm, size_t vl);
vint16m2_t __riscv_vfncvt_x_tum(vbool8_t vm, vint16m2_t vd, vfloat32m4_t vs2,
                                unsigned int frm, size_t vl);
vint16m4_t __riscv_vfncvt_x_tum(vbool4_t vm, vint16m4_t vd, vfloat32m8_t vs2,
                                unsigned int frm, size_t vl);
// float32 -> uint16 (unsigned result)
vuint16mf4_t __riscv_vfncvt_xu_tum(vbool64_t vm, vuint16mf4_t vd,
                                   vfloat32mf2_t vs2, unsigned int frm,
                                   size_t vl);
vuint16mf2_t __riscv_vfncvt_xu_tum(vbool32_t vm, vuint16mf2_t vd,
                                   vfloat32m1_t vs2, unsigned int frm,
                                   size_t vl);
vuint16m1_t __riscv_vfncvt_xu_tum(vbool16_t vm, vuint16m1_t vd,
                                  vfloat32m2_t vs2, unsigned int frm,
                                  size_t vl);
vuint16m2_t __riscv_vfncvt_xu_tum(vbool8_t vm, vuint16m2_t vd, vfloat32m4_t vs2,
                                  unsigned int frm, size_t vl);
vuint16m4_t __riscv_vfncvt_xu_tum(vbool4_t vm, vuint16m4_t vd, vfloat32m8_t vs2,
                                  unsigned int frm, size_t vl);
// int32 (signed source) -> float16
vfloat16mf4_t __riscv_vfncvt_f_tum(vbool64_t vm, vfloat16mf4_t vd,
                                   vint32mf2_t vs2, unsigned int frm,
                                   size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_tum(vbool32_t vm, vfloat16mf2_t vd,
                                   vint32m1_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_tum(vbool16_t vm, vfloat16m1_t vd, vint32m2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_tum(vbool8_t vm, vfloat16m2_t vd, vint32m4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_tum(vbool4_t vm, vfloat16m4_t vd, vint32m8_t vs2,
                                  unsigned int frm, size_t vl);
// uint32 (unsigned source) -> float16
vfloat16mf4_t __riscv_vfncvt_f_tum(vbool64_t vm, vfloat16mf4_t vd,
                                   vuint32mf2_t vs2, unsigned int frm,
                                   size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_tum(vbool32_t vm, vfloat16mf2_t vd,
                                   vuint32m1_t vs2, unsigned int frm,
                                   size_t vl);
vfloat16m1_t __riscv_vfncvt_f_tum(vbool16_t vm, vfloat16m1_t vd,
                                  vuint32m2_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_tum(vbool8_t vm, vfloat16m2_t vd, vuint32m4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_tum(vbool4_t vm, vfloat16m4_t vd, vuint32m8_t vs2,
                                  unsigned int frm, size_t vl);
// float32 -> float16
vfloat16mf4_t __riscv_vfncvt_f_tum(vbool64_t vm, vfloat16mf4_t vd,
                                   vfloat32mf2_t vs2, unsigned int frm,
                                   size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_tum(vbool32_t vm, vfloat16mf2_t vd,
                                   vfloat32m1_t vs2, unsigned int frm,
                                   size_t vl);
vfloat16m1_t __riscv_vfncvt_f_tum(vbool16_t vm, vfloat16m1_t vd,
                                  vfloat32m2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16m2_t __riscv_vfncvt_f_tum(vbool8_t vm, vfloat16m2_t vd,
                                  vfloat32m4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16m4_t __riscv_vfncvt_f_tum(vbool4_t vm, vfloat16m4_t vd,
                                  vfloat32m8_t vs2, unsigned int frm,
                                  size_t vl);
// _tum overloads producing 32-bit results from 64-bit sources.
// Each takes mask `vm`, operand `vd`, source `vs2`, `frm` and `vl`.
// float64 -> int32 (signed result)
vint32mf2_t __riscv_vfncvt_x_tum(vbool64_t vm, vint32mf2_t vd, vfloat64m1_t vs2,
                                 unsigned int frm, size_t vl);
vint32m1_t __riscv_vfncvt_x_tum(vbool32_t vm, vint32m1_t vd, vfloat64m2_t vs2,
                                unsigned int frm, size_t vl);
vint32m2_t __riscv_vfncvt_x_tum(vbool16_t vm, vint32m2_t vd, vfloat64m4_t vs2,
                                unsigned int frm, size_t vl);
vint32m4_t __riscv_vfncvt_x_tum(vbool8_t vm, vint32m4_t vd, vfloat64m8_t vs2,
                                unsigned int frm, size_t vl);
// float64 -> uint32 (unsigned result)
vuint32mf2_t __riscv_vfncvt_xu_tum(vbool64_t vm, vuint32mf2_t vd,
                                   vfloat64m1_t vs2, unsigned int frm,
                                   size_t vl);
vuint32m1_t __riscv_vfncvt_xu_tum(vbool32_t vm, vuint32m1_t vd,
                                  vfloat64m2_t vs2, unsigned int frm,
                                  size_t vl);
vuint32m2_t __riscv_vfncvt_xu_tum(vbool16_t vm, vuint32m2_t vd,
                                  vfloat64m4_t vs2, unsigned int frm,
                                  size_t vl);
vuint32m4_t __riscv_vfncvt_xu_tum(vbool8_t vm, vuint32m4_t vd, vfloat64m8_t vs2,
                                  unsigned int frm, size_t vl);
// int64 (signed source) -> float32
vfloat32mf2_t __riscv_vfncvt_f_tum(vbool64_t vm, vfloat32mf2_t vd,
                                   vint64m1_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_tum(vbool32_t vm, vfloat32m1_t vd, vint64m2_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_tum(vbool16_t vm, vfloat32m2_t vd, vint64m4_t vs2,
                                  unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_tum(vbool8_t vm, vfloat32m4_t vd, vint64m8_t vs2,
                                  unsigned int frm, size_t vl);
// uint64 (unsigned source) -> float32
vfloat32mf2_t __riscv_vfncvt_f_tum(vbool64_t vm, vfloat32mf2_t vd,
                                   vuint64m1_t vs2, unsigned int frm,
                                   size_t vl);
vfloat32m1_t __riscv_vfncvt_f_tum(vbool32_t vm, vfloat32m1_t vd,
                                  vuint64m2_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_tum(vbool16_t vm, vfloat32m2_t vd,
                                  vuint64m4_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_tum(vbool8_t vm, vfloat32m4_t vd, vuint64m8_t vs2,
                                  unsigned int frm, size_t vl);
// float64 -> float32
vfloat32mf2_t __riscv_vfncvt_f_tum(vbool64_t vm, vfloat32mf2_t vd,
                                   vfloat64m1_t vs2, unsigned int frm,
                                   size_t vl);
vfloat32m1_t __riscv_vfncvt_f_tum(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat64m2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m2_t __riscv_vfncvt_f_tum(vbool16_t vm, vfloat32m2_t vd,
                                  vfloat64m4_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m4_t __riscv_vfncvt_f_tum(vbool8_t vm, vfloat32m4_t vd,
                                  vfloat64m8_t vs2, unsigned int frm,
                                  size_t vl);
// masked functions (_tumu policy: tail undisturbed, mask undisturbed)
// _tumu overloads narrowing float16 sources to 8-bit integer results.
// Each takes mask `vm`, operand `vd`, source `vs2`, `frm` and `vl`; the
// source element type is twice as wide as the result element type.
// float16 -> int8 (signed result)
vint8mf8_t __riscv_vfncvt_x_tumu(vbool64_t vm, vint8mf8_t vd, vfloat16mf4_t vs2,
                                 unsigned int frm, size_t vl);
vint8mf4_t __riscv_vfncvt_x_tumu(vbool32_t vm, vint8mf4_t vd, vfloat16mf2_t vs2,
                                 unsigned int frm, size_t vl);
vint8mf2_t __riscv_vfncvt_x_tumu(vbool16_t vm, vint8mf2_t vd, vfloat16m1_t vs2,
                                 unsigned int frm, size_t vl);
vint8m1_t __riscv_vfncvt_x_tumu(vbool8_t vm, vint8m1_t vd, vfloat16m2_t vs2,
                                unsigned int frm, size_t vl);
vint8m2_t __riscv_vfncvt_x_tumu(vbool4_t vm, vint8m2_t vd, vfloat16m4_t vs2,
                                unsigned int frm, size_t vl);
vint8m4_t __riscv_vfncvt_x_tumu(vbool2_t vm, vint8m4_t vd, vfloat16m8_t vs2,
                                unsigned int frm, size_t vl);
// float16 -> uint8 (unsigned result)
vuint8mf8_t __riscv_vfncvt_xu_tumu(vbool64_t vm, vuint8mf8_t vd,
                                   vfloat16mf4_t vs2, unsigned int frm,
                                   size_t vl);
vuint8mf4_t __riscv_vfncvt_xu_tumu(vbool32_t vm, vuint8mf4_t vd,
                                   vfloat16mf2_t vs2, unsigned int frm,
                                   size_t vl);
vuint8mf2_t __riscv_vfncvt_xu_tumu(vbool16_t vm, vuint8mf2_t vd,
                                   vfloat16m1_t vs2, unsigned int frm,
                                   size_t vl);
vuint8m1_t __riscv_vfncvt_xu_tumu(vbool8_t vm, vuint8m1_t vd, vfloat16m2_t vs2,
                                  unsigned int frm, size_t vl);
vuint8m2_t __riscv_vfncvt_xu_tumu(vbool4_t vm, vuint8m2_t vd, vfloat16m4_t vs2,
                                  unsigned int frm, size_t vl);
vuint8m4_t __riscv_vfncvt_xu_tumu(vbool2_t vm, vuint8m4_t vd, vfloat16m8_t vs2,
                                  unsigned int frm, size_t vl);
// _tumu overloads producing 16-bit results from 32-bit sources.
// Each takes mask `vm`, operand `vd`, source `vs2`, `frm` and `vl`.
// float32 -> int16 (signed result)
vint16mf4_t __riscv_vfncvt_x_tumu(vbool64_t vm, vint16mf4_t vd,
                                  vfloat32mf2_t vs2, unsigned int frm,
                                  size_t vl);
vint16mf2_t __riscv_vfncvt_x_tumu(vbool32_t vm, vint16mf2_t vd,
                                  vfloat32m1_t vs2, unsigned int frm,
                                  size_t vl);
vint16m1_t __riscv_vfncvt_x_tumu(vbool16_t vm, vint16m1_t vd, vfloat32m2_t vs2,
                                 unsigned int frm, size_t vl);
vint16m2_t __riscv_vfncvt_x_tumu(vbool8_t vm, vint16m2_t vd, vfloat32m4_t vs2,
                                 unsigned int frm, size_t vl);
vint16m4_t __riscv_vfncvt_x_tumu(vbool4_t vm, vint16m4_t vd, vfloat32m8_t vs2,
                                 unsigned int frm, size_t vl);
// float32 -> uint16 (unsigned result)
vuint16mf4_t __riscv_vfncvt_xu_tumu(vbool64_t vm, vuint16mf4_t vd,
                                    vfloat32mf2_t vs2, unsigned int frm,
                                    size_t vl);
vuint16mf2_t __riscv_vfncvt_xu_tumu(vbool32_t vm, vuint16mf2_t vd,
                                    vfloat32m1_t vs2, unsigned int frm,
                                    size_t vl);
vuint16m1_t __riscv_vfncvt_xu_tumu(vbool16_t vm, vuint16m1_t vd,
                                   vfloat32m2_t vs2, unsigned int frm,
                                   size_t vl);
vuint16m2_t __riscv_vfncvt_xu_tumu(vbool8_t vm, vuint16m2_t vd,
                                   vfloat32m4_t vs2, unsigned int frm,
                                   size_t vl);
vuint16m4_t __riscv_vfncvt_xu_tumu(vbool4_t vm, vuint16m4_t vd,
                                   vfloat32m8_t vs2, unsigned int frm,
                                   size_t vl);
// int32 (signed source) -> float16
vfloat16mf4_t __riscv_vfncvt_f_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                    vint32mf2_t vs2, unsigned int frm,
                                    size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                    vint32m1_t vs2, unsigned int frm,
                                    size_t vl);
vfloat16m1_t __riscv_vfncvt_f_tumu(vbool16_t vm, vfloat16m1_t vd,
                                   vint32m2_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_tumu(vbool8_t vm, vfloat16m2_t vd, vint32m4_t vs2,
                                   unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_tumu(vbool4_t vm, vfloat16m4_t vd, vint32m8_t vs2,
                                   unsigned int frm, size_t vl);
// uint32 (unsigned source) -> float16
vfloat16mf4_t __riscv_vfncvt_f_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                    vuint32mf2_t vs2, unsigned int frm,
                                    size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                    vuint32m1_t vs2, unsigned int frm,
                                    size_t vl);
vfloat16m1_t __riscv_vfncvt_f_tumu(vbool16_t vm, vfloat16m1_t vd,
                                   vuint32m2_t vs2, unsigned int frm,
                                   size_t vl);
vfloat16m2_t __riscv_vfncvt_f_tumu(vbool8_t vm, vfloat16m2_t vd,
                                   vuint32m4_t vs2, unsigned int frm,
                                   size_t vl);
vfloat16m4_t __riscv_vfncvt_f_tumu(vbool4_t vm, vfloat16m4_t vd,
                                   vuint32m8_t vs2, unsigned int frm,
                                   size_t vl);
// float32 -> float16
vfloat16mf4_t __riscv_vfncvt_f_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                    vfloat32mf2_t vs2, unsigned int frm,
                                    size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                    vfloat32m1_t vs2, unsigned int frm,
                                    size_t vl);
vfloat16m1_t __riscv_vfncvt_f_tumu(vbool16_t vm, vfloat16m1_t vd,
                                   vfloat32m2_t vs2, unsigned int frm,
                                   size_t vl);
vfloat16m2_t __riscv_vfncvt_f_tumu(vbool8_t vm, vfloat16m2_t vd,
                                   vfloat32m4_t vs2, unsigned int frm,
                                   size_t vl);
vfloat16m4_t __riscv_vfncvt_f_tumu(vbool4_t vm, vfloat16m4_t vd,
                                   vfloat32m8_t vs2, unsigned int frm,
                                   size_t vl);
// _tumu overloads producing 32-bit results from 64-bit sources.
// Each takes mask `vm`, operand `vd`, source `vs2`, `frm` and `vl`.
// float64 -> int32 (signed result)
vint32mf2_t __riscv_vfncvt_x_tumu(vbool64_t vm, vint32mf2_t vd,
                                  vfloat64m1_t vs2, unsigned int frm,
                                  size_t vl);
vint32m1_t __riscv_vfncvt_x_tumu(vbool32_t vm, vint32m1_t vd, vfloat64m2_t vs2,
                                 unsigned int frm, size_t vl);
vint32m2_t __riscv_vfncvt_x_tumu(vbool16_t vm, vint32m2_t vd, vfloat64m4_t vs2,
                                 unsigned int frm, size_t vl);
vint32m4_t __riscv_vfncvt_x_tumu(vbool8_t vm, vint32m4_t vd, vfloat64m8_t vs2,
                                 unsigned int frm, size_t vl);
// float64 -> uint32 (unsigned result)
vuint32mf2_t __riscv_vfncvt_xu_tumu(vbool64_t vm, vuint32mf2_t vd,
                                    vfloat64m1_t vs2, unsigned int frm,
                                    size_t vl);
vuint32m1_t __riscv_vfncvt_xu_tumu(vbool32_t vm, vuint32m1_t vd,
                                   vfloat64m2_t vs2, unsigned int frm,
                                   size_t vl);
vuint32m2_t __riscv_vfncvt_xu_tumu(vbool16_t vm, vuint32m2_t vd,
                                   vfloat64m4_t vs2, unsigned int frm,
                                   size_t vl);
vuint32m4_t __riscv_vfncvt_xu_tumu(vbool8_t vm, vuint32m4_t vd,
                                   vfloat64m8_t vs2, unsigned int frm,
                                   size_t vl);
// int64 (signed source) -> float32
vfloat32mf2_t __riscv_vfncvt_f_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                    vint64m1_t vs2, unsigned int frm,
                                    size_t vl);
vfloat32m1_t __riscv_vfncvt_f_tumu(vbool32_t vm, vfloat32m1_t vd,
                                   vint64m2_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_tumu(vbool16_t vm, vfloat32m2_t vd,
                                   vint64m4_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_tumu(vbool8_t vm, vfloat32m4_t vd, vint64m8_t vs2,
                                   unsigned int frm, size_t vl);
// uint64 (unsigned source) -> float32
vfloat32mf2_t __riscv_vfncvt_f_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                    vuint64m1_t vs2, unsigned int frm,
                                    size_t vl);
vfloat32m1_t __riscv_vfncvt_f_tumu(vbool32_t vm, vfloat32m1_t vd,
                                   vuint64m2_t vs2, unsigned int frm,
                                   size_t vl);
vfloat32m2_t __riscv_vfncvt_f_tumu(vbool16_t vm, vfloat32m2_t vd,
                                   vuint64m4_t vs2, unsigned int frm,
                                   size_t vl);
vfloat32m4_t __riscv_vfncvt_f_tumu(vbool8_t vm, vfloat32m4_t vd,
                                   vuint64m8_t vs2, unsigned int frm,
                                   size_t vl);
// float64 -> float32
vfloat32mf2_t __riscv_vfncvt_f_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                    vfloat64m1_t vs2, unsigned int frm,
                                    size_t vl);
vfloat32m1_t __riscv_vfncvt_f_tumu(vbool32_t vm, vfloat32m1_t vd,
                                   vfloat64m2_t vs2, unsigned int frm,
                                   size_t vl);
vfloat32m2_t __riscv_vfncvt_f_tumu(vbool16_t vm, vfloat32m2_t vd,
                                   vfloat64m4_t vs2, unsigned int frm,
                                   size_t vl);
vfloat32m4_t __riscv_vfncvt_f_tumu(vbool8_t vm, vfloat32m4_t vd,
                                   vfloat64m8_t vs2, unsigned int frm,
                                   size_t vl);
// masked functions (_mu policy: tail agnostic, mask undisturbed)
// _mu overloads narrowing float16 sources to 8-bit integer results.
// Each takes mask `vm`, operand `vd`, source `vs2`, `frm` and `vl`; the
// source element type is twice as wide as the result element type.
// float16 -> int8 (signed result)
vint8mf8_t __riscv_vfncvt_x_mu(vbool64_t vm, vint8mf8_t vd, vfloat16mf4_t vs2,
                               unsigned int frm, size_t vl);
vint8mf4_t __riscv_vfncvt_x_mu(vbool32_t vm, vint8mf4_t vd, vfloat16mf2_t vs2,
                               unsigned int frm, size_t vl);
vint8mf2_t __riscv_vfncvt_x_mu(vbool16_t vm, vint8mf2_t vd, vfloat16m1_t vs2,
                               unsigned int frm, size_t vl);
vint8m1_t __riscv_vfncvt_x_mu(vbool8_t vm, vint8m1_t vd, vfloat16m2_t vs2,
                              unsigned int frm, size_t vl);
vint8m2_t __riscv_vfncvt_x_mu(vbool4_t vm, vint8m2_t vd, vfloat16m4_t vs2,
                              unsigned int frm, size_t vl);
vint8m4_t __riscv_vfncvt_x_mu(vbool2_t vm, vint8m4_t vd, vfloat16m8_t vs2,
                              unsigned int frm, size_t vl);
// float16 -> uint8 (unsigned result)
vuint8mf8_t __riscv_vfncvt_xu_mu(vbool64_t vm, vuint8mf8_t vd,
                                 vfloat16mf4_t vs2, unsigned int frm,
                                 size_t vl);
vuint8mf4_t __riscv_vfncvt_xu_mu(vbool32_t vm, vuint8mf4_t vd,
                                 vfloat16mf2_t vs2, unsigned int frm,
                                 size_t vl);
vuint8mf2_t __riscv_vfncvt_xu_mu(vbool16_t vm, vuint8mf2_t vd, vfloat16m1_t vs2,
                                 unsigned int frm, size_t vl);
vuint8m1_t __riscv_vfncvt_xu_mu(vbool8_t vm, vuint8m1_t vd, vfloat16m2_t vs2,
                                unsigned int frm, size_t vl);
vuint8m2_t __riscv_vfncvt_xu_mu(vbool4_t vm, vuint8m2_t vd, vfloat16m4_t vs2,
                                unsigned int frm, size_t vl);
vuint8m4_t __riscv_vfncvt_xu_mu(vbool2_t vm, vuint8m4_t vd, vfloat16m8_t vs2,
                                unsigned int frm, size_t vl);
// _mu overloads producing 16-bit results from 32-bit sources.
// Each takes mask `vm`, operand `vd`, source `vs2`, `frm` and `vl`.
// float32 -> int16 (signed result)
vint16mf4_t __riscv_vfncvt_x_mu(vbool64_t vm, vint16mf4_t vd, vfloat32mf2_t vs2,
                                unsigned int frm, size_t vl);
vint16mf2_t __riscv_vfncvt_x_mu(vbool32_t vm, vint16mf2_t vd, vfloat32m1_t vs2,
                                unsigned int frm, size_t vl);
vint16m1_t __riscv_vfncvt_x_mu(vbool16_t vm, vint16m1_t vd, vfloat32m2_t vs2,
                               unsigned int frm, size_t vl);
vint16m2_t __riscv_vfncvt_x_mu(vbool8_t vm, vint16m2_t vd, vfloat32m4_t vs2,
                               unsigned int frm, size_t vl);
vint16m4_t __riscv_vfncvt_x_mu(vbool4_t vm, vint16m4_t vd, vfloat32m8_t vs2,
                               unsigned int frm, size_t vl);
// float32 -> uint16 (unsigned result)
vuint16mf4_t __riscv_vfncvt_xu_mu(vbool64_t vm, vuint16mf4_t vd,
                                  vfloat32mf2_t vs2, unsigned int frm,
                                  size_t vl);
vuint16mf2_t __riscv_vfncvt_xu_mu(vbool32_t vm, vuint16mf2_t vd,
                                  vfloat32m1_t vs2, unsigned int frm,
                                  size_t vl);
vuint16m1_t __riscv_vfncvt_xu_mu(vbool16_t vm, vuint16m1_t vd, vfloat32m2_t vs2,
                                 unsigned int frm, size_t vl);
vuint16m2_t __riscv_vfncvt_xu_mu(vbool8_t vm, vuint16m2_t vd, vfloat32m4_t vs2,
                                 unsigned int frm, size_t vl);
vuint16m4_t __riscv_vfncvt_xu_mu(vbool4_t vm, vuint16m4_t vd, vfloat32m8_t vs2,
                                 unsigned int frm, size_t vl);
// int32 (signed source) -> float16
vfloat16mf4_t __riscv_vfncvt_f_mu(vbool64_t vm, vfloat16mf4_t vd,
                                  vint32mf2_t vs2, unsigned int frm, size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_mu(vbool32_t vm, vfloat16mf2_t vd,
                                  vint32m1_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_mu(vbool16_t vm, vfloat16m1_t vd, vint32m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_mu(vbool8_t vm, vfloat16m2_t vd, vint32m4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_mu(vbool4_t vm, vfloat16m4_t vd, vint32m8_t vs2,
                                 unsigned int frm, size_t vl);
// uint32 (unsigned source) -> float16
vfloat16mf4_t __riscv_vfncvt_f_mu(vbool64_t vm, vfloat16mf4_t vd,
                                  vuint32mf2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_mu(vbool32_t vm, vfloat16mf2_t vd,
                                  vuint32m1_t vs2, unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfncvt_f_mu(vbool16_t vm, vfloat16m1_t vd, vuint32m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_mu(vbool8_t vm, vfloat16m2_t vd, vuint32m4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_mu(vbool4_t vm, vfloat16m4_t vd, vuint32m8_t vs2,
                                 unsigned int frm, size_t vl);
// float32 -> float16
vfloat16mf4_t __riscv_vfncvt_f_mu(vbool64_t vm, vfloat16mf4_t vd,
                                  vfloat32mf2_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16mf2_t __riscv_vfncvt_f_mu(vbool32_t vm, vfloat16mf2_t vd,
                                  vfloat32m1_t vs2, unsigned int frm,
                                  size_t vl);
vfloat16m1_t __riscv_vfncvt_f_mu(vbool16_t vm, vfloat16m1_t vd,
                                 vfloat32m2_t vs2, unsigned int frm, size_t vl);
vfloat16m2_t __riscv_vfncvt_f_mu(vbool8_t vm, vfloat16m2_t vd, vfloat32m4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat16m4_t __riscv_vfncvt_f_mu(vbool4_t vm, vfloat16m4_t vd, vfloat32m8_t vs2,
                                 unsigned int frm, size_t vl);
// _mu overloads producing 32-bit results from 64-bit sources.
// Each takes mask `vm`, operand `vd`, source `vs2`, `frm` and `vl`.
// float64 -> int32 (signed result)
vint32mf2_t __riscv_vfncvt_x_mu(vbool64_t vm, vint32mf2_t vd, vfloat64m1_t vs2,
                                unsigned int frm, size_t vl);
vint32m1_t __riscv_vfncvt_x_mu(vbool32_t vm, vint32m1_t vd, vfloat64m2_t vs2,
                               unsigned int frm, size_t vl);
vint32m2_t __riscv_vfncvt_x_mu(vbool16_t vm, vint32m2_t vd, vfloat64m4_t vs2,
                               unsigned int frm, size_t vl);
vint32m4_t __riscv_vfncvt_x_mu(vbool8_t vm, vint32m4_t vd, vfloat64m8_t vs2,
                               unsigned int frm, size_t vl);
// float64 -> uint32 (unsigned result)
vuint32mf2_t __riscv_vfncvt_xu_mu(vbool64_t vm, vuint32mf2_t vd,
                                  vfloat64m1_t vs2, unsigned int frm,
                                  size_t vl);
vuint32m1_t __riscv_vfncvt_xu_mu(vbool32_t vm, vuint32m1_t vd, vfloat64m2_t vs2,
                                 unsigned int frm, size_t vl);
vuint32m2_t __riscv_vfncvt_xu_mu(vbool16_t vm, vuint32m2_t vd, vfloat64m4_t vs2,
                                 unsigned int frm, size_t vl);
vuint32m4_t __riscv_vfncvt_xu_mu(vbool8_t vm, vuint32m4_t vd, vfloat64m8_t vs2,
                                 unsigned int frm, size_t vl);
// int64 (signed source) -> float32
vfloat32mf2_t __riscv_vfncvt_f_mu(vbool64_t vm, vfloat32mf2_t vd,
                                  vint64m1_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_mu(vbool32_t vm, vfloat32m1_t vd, vint64m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_mu(vbool16_t vm, vfloat32m2_t vd, vint64m4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_mu(vbool8_t vm, vfloat32m4_t vd, vint64m8_t vs2,
                                 unsigned int frm, size_t vl);
// uint64 (unsigned source) -> float32
vfloat32mf2_t __riscv_vfncvt_f_mu(vbool64_t vm, vfloat32mf2_t vd,
                                  vuint64m1_t vs2, unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfncvt_f_mu(vbool32_t vm, vfloat32m1_t vd, vuint64m2_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_mu(vbool16_t vm, vfloat32m2_t vd, vuint64m4_t vs2,
                                 unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_mu(vbool8_t vm, vfloat32m4_t vd, vuint64m8_t vs2,
                                 unsigned int frm, size_t vl);
// float64 -> float32
vfloat32mf2_t __riscv_vfncvt_f_mu(vbool64_t vm, vfloat32mf2_t vd,
                                  vfloat64m1_t vs2, unsigned int frm,
                                  size_t vl);
vfloat32m1_t __riscv_vfncvt_f_mu(vbool32_t vm, vfloat32m1_t vd,
                                 vfloat64m2_t vs2, unsigned int frm, size_t vl);
vfloat32m2_t __riscv_vfncvt_f_mu(vbool16_t vm, vfloat32m2_t vd,
                                 vfloat64m4_t vs2, unsigned int frm, size_t vl);
vfloat32m4_t __riscv_vfncvt_f_mu(vbool8_t vm, vfloat32m4_t vd, vfloat64m8_t vs2,
                                 unsigned int frm, size_t vl);