Vector Permutation Intrinsics

Integer and Floating-Point Scalar Move Intrinsics
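
These intrinsics correspond to the vmv.s.x and vfmv.s.f instructions: they copy the scalar operand rs1 into element 0 of the result. Only element 0 is written; under the _tu (tail-undisturbed) policy every other element keeps its value from vd, and when vl is 0 no element is updated, so the result is vd unchanged.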

vfloat16mf4_t __riscv_vfmv_s_f_f16mf4_tu(vfloat16mf4_t vd, _Float16 rs1,
                                         size_t vl);
vfloat16mf2_t __riscv_vfmv_s_f_f16mf2_tu(vfloat16mf2_t vd, _Float16 rs1,
                                         size_t vl);
vfloat16m1_t __riscv_vfmv_s_f_f16m1_tu(vfloat16m1_t vd, _Float16 rs1,
                                       size_t vl);
vfloat16m2_t __riscv_vfmv_s_f_f16m2_tu(vfloat16m2_t vd, _Float16 rs1,
                                       size_t vl);
vfloat16m4_t __riscv_vfmv_s_f_f16m4_tu(vfloat16m4_t vd, _Float16 rs1,
                                       size_t vl);
vfloat16m8_t __riscv_vfmv_s_f_f16m8_tu(vfloat16m8_t vd, _Float16 rs1,
                                       size_t vl);
vfloat32mf2_t __riscv_vfmv_s_f_f32mf2_tu(vfloat32mf2_t vd, float rs1,
                                         size_t vl);
vfloat32m1_t __riscv_vfmv_s_f_f32m1_tu(vfloat32m1_t vd, float rs1, size_t vl);
vfloat32m2_t __riscv_vfmv_s_f_f32m2_tu(vfloat32m2_t vd, float rs1, size_t vl);
vfloat32m4_t __riscv_vfmv_s_f_f32m4_tu(vfloat32m4_t vd, float rs1, size_t vl);
vfloat32m8_t __riscv_vfmv_s_f_f32m8_tu(vfloat32m8_t vd, float rs1, size_t vl);
vfloat64m1_t __riscv_vfmv_s_f_f64m1_tu(vfloat64m1_t vd, double rs1, size_t vl);
vfloat64m2_t __riscv_vfmv_s_f_f64m2_tu(vfloat64m2_t vd, double rs1, size_t vl);
vfloat64m4_t __riscv_vfmv_s_f_f64m4_tu(vfloat64m4_t vd, double rs1, size_t vl);
vfloat64m8_t __riscv_vfmv_s_f_f64m8_tu(vfloat64m8_t vd, double rs1, size_t vl);
vint8mf8_t __riscv_vmv_s_x_i8mf8_tu(vint8mf8_t vd, int8_t rs1, size_t vl);
vint8mf4_t __riscv_vmv_s_x_i8mf4_tu(vint8mf4_t vd, int8_t rs1, size_t vl);
vint8mf2_t __riscv_vmv_s_x_i8mf2_tu(vint8mf2_t vd, int8_t rs1, size_t vl);
vint8m1_t __riscv_vmv_s_x_i8m1_tu(vint8m1_t vd, int8_t rs1, size_t vl);
vint8m2_t __riscv_vmv_s_x_i8m2_tu(vint8m2_t vd, int8_t rs1, size_t vl);
vint8m4_t __riscv_vmv_s_x_i8m4_tu(vint8m4_t vd, int8_t rs1, size_t vl);
vint8m8_t __riscv_vmv_s_x_i8m8_tu(vint8m8_t vd, int8_t rs1, size_t vl);
vint16mf4_t __riscv_vmv_s_x_i16mf4_tu(vint16mf4_t vd, int16_t rs1, size_t vl);
vint16mf2_t __riscv_vmv_s_x_i16mf2_tu(vint16mf2_t vd, int16_t rs1, size_t vl);
vint16m1_t __riscv_vmv_s_x_i16m1_tu(vint16m1_t vd, int16_t rs1, size_t vl);
vint16m2_t __riscv_vmv_s_x_i16m2_tu(vint16m2_t vd, int16_t rs1, size_t vl);
vint16m4_t __riscv_vmv_s_x_i16m4_tu(vint16m4_t vd, int16_t rs1, size_t vl);
vint16m8_t __riscv_vmv_s_x_i16m8_tu(vint16m8_t vd, int16_t rs1, size_t vl);
vint32mf2_t __riscv_vmv_s_x_i32mf2_tu(vint32mf2_t vd, int32_t rs1, size_t vl);
vint32m1_t __riscv_vmv_s_x_i32m1_tu(vint32m1_t vd, int32_t rs1, size_t vl);
vint32m2_t __riscv_vmv_s_x_i32m2_tu(vint32m2_t vd, int32_t rs1, size_t vl);
vint32m4_t __riscv_vmv_s_x_i32m4_tu(vint32m4_t vd, int32_t rs1, size_t vl);
vint32m8_t __riscv_vmv_s_x_i32m8_tu(vint32m8_t vd, int32_t rs1, size_t vl);
vint64m1_t __riscv_vmv_s_x_i64m1_tu(vint64m1_t vd, int64_t rs1, size_t vl);
vint64m2_t __riscv_vmv_s_x_i64m2_tu(vint64m2_t vd, int64_t rs1, size_t vl);
vint64m4_t __riscv_vmv_s_x_i64m4_tu(vint64m4_t vd, int64_t rs1, size_t vl);
vint64m8_t __riscv_vmv_s_x_i64m8_tu(vint64m8_t vd, int64_t rs1, size_t vl);
vuint8mf8_t __riscv_vmv_s_x_u8mf8_tu(vuint8mf8_t vd, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vmv_s_x_u8mf4_tu(vuint8mf4_t vd, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vmv_s_x_u8mf2_tu(vuint8mf2_t vd, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vmv_s_x_u8m1_tu(vuint8m1_t vd, uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vmv_s_x_u8m2_tu(vuint8m2_t vd, uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vmv_s_x_u8m4_tu(vuint8m4_t vd, uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vmv_s_x_u8m8_tu(vuint8m8_t vd, uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vmv_s_x_u16mf4_tu(vuint16mf4_t vd, uint16_t rs1,
                                       size_t vl);
vuint16mf2_t __riscv_vmv_s_x_u16mf2_tu(vuint16mf2_t vd, uint16_t rs1,
                                       size_t vl);
vuint16m1_t __riscv_vmv_s_x_u16m1_tu(vuint16m1_t vd, uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vmv_s_x_u16m2_tu(vuint16m2_t vd, uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vmv_s_x_u16m4_tu(vuint16m4_t vd, uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vmv_s_x_u16m8_tu(vuint16m8_t vd, uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vmv_s_x_u32mf2_tu(vuint32mf2_t vd, uint32_t rs1,
                                       size_t vl);
vuint32m1_t __riscv_vmv_s_x_u32m1_tu(vuint32m1_t vd, uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vmv_s_x_u32m2_tu(vuint32m2_t vd, uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vmv_s_x_u32m4_tu(vuint32m4_t vd, uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vmv_s_x_u32m8_tu(vuint32m8_t vd, uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vmv_s_x_u64m1_tu(vuint64m1_t vd, uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vmv_s_x_u64m2_tu(vuint64m2_t vd, uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vmv_s_x_u64m4_tu(vuint64m4_t vd, uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vmv_s_x_u64m8_tu(vuint64m8_t vd, uint64_t rs1, size_t vl);
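
For instance, seeding element 0 of an accumulator while keeping the rest of the register intact looks like the following minimal sketch (seed_accumulator is an illustrative name, not part of the API; it assumes a toolchain with the V extension enabled, e.g. -march=rv64gcv):

#include <riscv_vector.h>

// Write x into element 0 of acc; elements 1..VLMAX-1 keep their old
// values because of the _tu (tail-undisturbed) policy. With vl == 0
// the intrinsic performs no update and returns acc as-is.
vfloat32m1_t seed_accumulator(vfloat32m1_t acc, float x, size_t vl) {
    return __riscv_vfmv_s_f_f32m1_tu(acc, x, vl);
}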

Vector Slideup Intrinsics
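
These intrinsics correspond to the vslideup.vx instruction: element i of vs2 is written to element i + rs1 of the result for every i with i + rs1 < vl, while elements 0 through rs1 - 1 are taken unchanged from vd. The offset rs1 is an unsigned scalar.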

vfloat16mf4_t __riscv_vslideup_vx_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                            size_t rs1, size_t vl);
vfloat16mf2_t __riscv_vslideup_vx_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                            size_t rs1, size_t vl);
vfloat16m1_t __riscv_vslideup_vx_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                          size_t rs1, size_t vl);
vfloat16m2_t __riscv_vslideup_vx_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                          size_t rs1, size_t vl);
vfloat16m4_t __riscv_vslideup_vx_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                          size_t rs1, size_t vl);
vfloat16m8_t __riscv_vslideup_vx_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                          size_t rs1, size_t vl);
vfloat32mf2_t __riscv_vslideup_vx_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                            size_t rs1, size_t vl);
vfloat32m1_t __riscv_vslideup_vx_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                          size_t rs1, size_t vl);
vfloat32m2_t __riscv_vslideup_vx_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                          size_t rs1, size_t vl);
vfloat32m4_t __riscv_vslideup_vx_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                          size_t rs1, size_t vl);
vfloat32m8_t __riscv_vslideup_vx_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                          size_t rs1, size_t vl);
vfloat64m1_t __riscv_vslideup_vx_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                          size_t rs1, size_t vl);
vfloat64m2_t __riscv_vslideup_vx_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                          size_t rs1, size_t vl);
vfloat64m4_t __riscv_vslideup_vx_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                          size_t rs1, size_t vl);
vfloat64m8_t __riscv_vslideup_vx_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                          size_t rs1, size_t vl);
vint8mf8_t __riscv_vslideup_vx_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2,
                                        size_t rs1, size_t vl);
vint8mf4_t __riscv_vslideup_vx_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2,
                                        size_t rs1, size_t vl);
vint8mf2_t __riscv_vslideup_vx_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2,
                                        size_t rs1, size_t vl);
vint8m1_t __riscv_vslideup_vx_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, size_t rs1,
                                      size_t vl);
vint8m2_t __riscv_vslideup_vx_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, size_t rs1,
                                      size_t vl);
vint8m4_t __riscv_vslideup_vx_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, size_t rs1,
                                      size_t vl);
vint8m8_t __riscv_vslideup_vx_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, size_t rs1,
                                      size_t vl);
vint16mf4_t __riscv_vslideup_vx_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                          size_t rs1, size_t vl);
vint16mf2_t __riscv_vslideup_vx_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                          size_t rs1, size_t vl);
vint16m1_t __riscv_vslideup_vx_i16m1_tu(vint16m1_t vd, vint16m1_t vs2,
                                        size_t rs1, size_t vl);
vint16m2_t __riscv_vslideup_vx_i16m2_tu(vint16m2_t vd, vint16m2_t vs2,
                                        size_t rs1, size_t vl);
vint16m4_t __riscv_vslideup_vx_i16m4_tu(vint16m4_t vd, vint16m4_t vs2,
                                        size_t rs1, size_t vl);
vint16m8_t __riscv_vslideup_vx_i16m8_tu(vint16m8_t vd, vint16m8_t vs2,
                                        size_t rs1, size_t vl);
vint32mf2_t __riscv_vslideup_vx_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                          size_t rs1, size_t vl);
vint32m1_t __riscv_vslideup_vx_i32m1_tu(vint32m1_t vd, vint32m1_t vs2,
                                        size_t rs1, size_t vl);
vint32m2_t __riscv_vslideup_vx_i32m2_tu(vint32m2_t vd, vint32m2_t vs2,
                                        size_t rs1, size_t vl);
vint32m4_t __riscv_vslideup_vx_i32m4_tu(vint32m4_t vd, vint32m4_t vs2,
                                        size_t rs1, size_t vl);
vint32m8_t __riscv_vslideup_vx_i32m8_tu(vint32m8_t vd, vint32m8_t vs2,
                                        size_t rs1, size_t vl);
vint64m1_t __riscv_vslideup_vx_i64m1_tu(vint64m1_t vd, vint64m1_t vs2,
                                        size_t rs1, size_t vl);
vint64m2_t __riscv_vslideup_vx_i64m2_tu(vint64m2_t vd, vint64m2_t vs2,
                                        size_t rs1, size_t vl);
vint64m4_t __riscv_vslideup_vx_i64m4_tu(vint64m4_t vd, vint64m4_t vs2,
                                        size_t rs1, size_t vl);
vint64m8_t __riscv_vslideup_vx_i64m8_tu(vint64m8_t vd, vint64m8_t vs2,
                                        size_t rs1, size_t vl);
vuint8mf8_t __riscv_vslideup_vx_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                         size_t rs1, size_t vl);
vuint8mf4_t __riscv_vslideup_vx_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                         size_t rs1, size_t vl);
vuint8mf2_t __riscv_vslideup_vx_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                         size_t rs1, size_t vl);
vuint8m1_t __riscv_vslideup_vx_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2,
                                       size_t rs1, size_t vl);
vuint8m2_t __riscv_vslideup_vx_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2,
                                       size_t rs1, size_t vl);
vuint8m4_t __riscv_vslideup_vx_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2,
                                       size_t rs1, size_t vl);
vuint8m8_t __riscv_vslideup_vx_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2,
                                       size_t rs1, size_t vl);
vuint16mf4_t __riscv_vslideup_vx_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                           size_t rs1, size_t vl);
vuint16mf2_t __riscv_vslideup_vx_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                           size_t rs1, size_t vl);
vuint16m1_t __riscv_vslideup_vx_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                         size_t rs1, size_t vl);
vuint16m2_t __riscv_vslideup_vx_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                         size_t rs1, size_t vl);
vuint16m4_t __riscv_vslideup_vx_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                         size_t rs1, size_t vl);
vuint16m8_t __riscv_vslideup_vx_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                         size_t rs1, size_t vl);
vuint32mf2_t __riscv_vslideup_vx_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                           size_t rs1, size_t vl);
vuint32m1_t __riscv_vslideup_vx_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                         size_t rs1, size_t vl);
vuint32m2_t __riscv_vslideup_vx_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                         size_t rs1, size_t vl);
vuint32m4_t __riscv_vslideup_vx_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                         size_t rs1, size_t vl);
vuint32m8_t __riscv_vslideup_vx_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                         size_t rs1, size_t vl);
vuint64m1_t __riscv_vslideup_vx_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                         size_t rs1, size_t vl);
vuint64m2_t __riscv_vslideup_vx_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                         size_t rs1, size_t vl);
vuint64m4_t __riscv_vslideup_vx_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                         size_t rs1, size_t vl);
vuint64m8_t __riscv_vslideup_vx_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                         size_t rs1, size_t vl);
// masked functions: tail undisturbed, mask agnostic (_tum)
vfloat16mf4_t __riscv_vslideup_vx_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                             vfloat16mf4_t vs2, size_t rs1,
                                             size_t vl);
vfloat16mf2_t __riscv_vslideup_vx_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                             vfloat16mf2_t vs2, size_t rs1,
                                             size_t vl);
vfloat16m1_t __riscv_vslideup_vx_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                           vfloat16m1_t vs2, size_t rs1,
                                           size_t vl);
vfloat16m2_t __riscv_vslideup_vx_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                           vfloat16m2_t vs2, size_t rs1,
                                           size_t vl);
vfloat16m4_t __riscv_vslideup_vx_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                           vfloat16m4_t vs2, size_t rs1,
                                           size_t vl);
vfloat16m8_t __riscv_vslideup_vx_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                           vfloat16m8_t vs2, size_t rs1,
                                           size_t vl);
vfloat32mf2_t __riscv_vslideup_vx_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat32mf2_t vs2, size_t rs1,
                                             size_t vl);
vfloat32m1_t __riscv_vslideup_vx_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat32m1_t vs2, size_t rs1,
                                           size_t vl);
vfloat32m2_t __riscv_vslideup_vx_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat32m2_t vs2, size_t rs1,
                                           size_t vl);
vfloat32m4_t __riscv_vslideup_vx_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat32m4_t vs2, size_t rs1,
                                           size_t vl);
vfloat32m8_t __riscv_vslideup_vx_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat32m8_t vs2, size_t rs1,
                                           size_t vl);
vfloat64m1_t __riscv_vslideup_vx_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat64m1_t vs2, size_t rs1,
                                           size_t vl);
vfloat64m2_t __riscv_vslideup_vx_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat64m2_t vs2, size_t rs1,
                                           size_t vl);
vfloat64m4_t __riscv_vslideup_vx_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat64m4_t vs2, size_t rs1,
                                           size_t vl);
vfloat64m8_t __riscv_vslideup_vx_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat64m8_t vs2, size_t rs1,
                                           size_t vl);
vint8mf8_t __riscv_vslideup_vx_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                         vint8mf8_t vs2, size_t rs1, size_t vl);
vint8mf4_t __riscv_vslideup_vx_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                         vint8mf4_t vs2, size_t rs1, size_t vl);
vint8mf2_t __riscv_vslideup_vx_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                         vint8mf2_t vs2, size_t rs1, size_t vl);
vint8m1_t __riscv_vslideup_vx_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                       size_t rs1, size_t vl);
vint8m2_t __riscv_vslideup_vx_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                       size_t rs1, size_t vl);
vint8m4_t __riscv_vslideup_vx_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                       size_t rs1, size_t vl);
vint8m8_t __riscv_vslideup_vx_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                       size_t rs1, size_t vl);
vint16mf4_t __riscv_vslideup_vx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                           vint16mf4_t vs2, size_t rs1,
                                           size_t vl);
vint16mf2_t __riscv_vslideup_vx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                           vint16mf2_t vs2, size_t rs1,
                                           size_t vl);
vint16m1_t __riscv_vslideup_vx_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                         vint16m1_t vs2, size_t rs1, size_t vl);
vint16m2_t __riscv_vslideup_vx_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                         vint16m2_t vs2, size_t rs1, size_t vl);
vint16m4_t __riscv_vslideup_vx_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                         vint16m4_t vs2, size_t rs1, size_t vl);
vint16m8_t __riscv_vslideup_vx_i16m8_tum(vbool2_t vm, vint16m8_t vd,
                                         vint16m8_t vs2, size_t rs1, size_t vl);
vint32mf2_t __riscv_vslideup_vx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                           vint32mf2_t vs2, size_t rs1,
                                           size_t vl);
vint32m1_t __riscv_vslideup_vx_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                         vint32m1_t vs2, size_t rs1, size_t vl);
vint32m2_t __riscv_vslideup_vx_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                         vint32m2_t vs2, size_t rs1, size_t vl);
vint32m4_t __riscv_vslideup_vx_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                         vint32m4_t vs2, size_t rs1, size_t vl);
vint32m8_t __riscv_vslideup_vx_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                         vint32m8_t vs2, size_t rs1, size_t vl);
vint64m1_t __riscv_vslideup_vx_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                         vint64m1_t vs2, size_t rs1, size_t vl);
vint64m2_t __riscv_vslideup_vx_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                         vint64m2_t vs2, size_t rs1, size_t vl);
vint64m4_t __riscv_vslideup_vx_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                         vint64m4_t vs2, size_t rs1, size_t vl);
vint64m8_t __riscv_vslideup_vx_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                         vint64m8_t vs2, size_t rs1, size_t vl);
vuint8mf8_t __riscv_vslideup_vx_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                          vuint8mf8_t vs2, size_t rs1,
                                          size_t vl);
vuint8mf4_t __riscv_vslideup_vx_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                          vuint8mf4_t vs2, size_t rs1,
                                          size_t vl);
vuint8mf2_t __riscv_vslideup_vx_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                          vuint8mf2_t vs2, size_t rs1,
                                          size_t vl);
vuint8m1_t __riscv_vslideup_vx_u8m1_tum(vbool8_t vm, vuint8m1_t vd,
                                        vuint8m1_t vs2, size_t rs1, size_t vl);
vuint8m2_t __riscv_vslideup_vx_u8m2_tum(vbool4_t vm, vuint8m2_t vd,
                                        vuint8m2_t vs2, size_t rs1, size_t vl);
vuint8m4_t __riscv_vslideup_vx_u8m4_tum(vbool2_t vm, vuint8m4_t vd,
                                        vuint8m4_t vs2, size_t rs1, size_t vl);
vuint8m8_t __riscv_vslideup_vx_u8m8_tum(vbool1_t vm, vuint8m8_t vd,
                                        vuint8m8_t vs2, size_t rs1, size_t vl);
vuint16mf4_t __riscv_vslideup_vx_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                            vuint16mf4_t vs2, size_t rs1,
                                            size_t vl);
vuint16mf2_t __riscv_vslideup_vx_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                            vuint16mf2_t vs2, size_t rs1,
                                            size_t vl);
vuint16m1_t __riscv_vslideup_vx_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                          vuint16m1_t vs2, size_t rs1,
                                          size_t vl);
vuint16m2_t __riscv_vslideup_vx_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                          vuint16m2_t vs2, size_t rs1,
                                          size_t vl);
vuint16m4_t __riscv_vslideup_vx_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                          vuint16m4_t vs2, size_t rs1,
                                          size_t vl);
vuint16m8_t __riscv_vslideup_vx_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                          vuint16m8_t vs2, size_t rs1,
                                          size_t vl);
vuint32mf2_t __riscv_vslideup_vx_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                            vuint32mf2_t vs2, size_t rs1,
                                            size_t vl);
vuint32m1_t __riscv_vslideup_vx_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                          vuint32m1_t vs2, size_t rs1,
                                          size_t vl);
vuint32m2_t __riscv_vslideup_vx_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                          vuint32m2_t vs2, size_t rs1,
                                          size_t vl);
vuint32m4_t __riscv_vslideup_vx_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                          vuint32m4_t vs2, size_t rs1,
                                          size_t vl);
vuint32m8_t __riscv_vslideup_vx_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                          vuint32m8_t vs2, size_t rs1,
                                          size_t vl);
vuint64m1_t __riscv_vslideup_vx_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                          vuint64m1_t vs2, size_t rs1,
                                          size_t vl);
vuint64m2_t __riscv_vslideup_vx_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                          vuint64m2_t vs2, size_t rs1,
                                          size_t vl);
vuint64m4_t __riscv_vslideup_vx_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                          vuint64m4_t vs2, size_t rs1,
                                          size_t vl);
vuint64m8_t __riscv_vslideup_vx_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                          vuint64m8_t vs2, size_t rs1,
                                          size_t vl);
// masked functions: tail undisturbed, mask undisturbed (_tumu)
vfloat16mf4_t __riscv_vslideup_vx_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                              vfloat16mf4_t vs2, size_t rs1,
                                              size_t vl);
vfloat16mf2_t __riscv_vslideup_vx_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                              vfloat16mf2_t vs2, size_t rs1,
                                              size_t vl);
vfloat16m1_t __riscv_vslideup_vx_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                            vfloat16m1_t vs2, size_t rs1,
                                            size_t vl);
vfloat16m2_t __riscv_vslideup_vx_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                            vfloat16m2_t vs2, size_t rs1,
                                            size_t vl);
vfloat16m4_t __riscv_vslideup_vx_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                            vfloat16m4_t vs2, size_t rs1,
                                            size_t vl);
vfloat16m8_t __riscv_vslideup_vx_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                            vfloat16m8_t vs2, size_t rs1,
                                            size_t vl);
vfloat32mf2_t __riscv_vslideup_vx_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat32mf2_t vs2, size_t rs1,
                                              size_t vl);
vfloat32m1_t __riscv_vslideup_vx_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat32m1_t vs2, size_t rs1,
                                            size_t vl);
vfloat32m2_t __riscv_vslideup_vx_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat32m2_t vs2, size_t rs1,
                                            size_t vl);
vfloat32m4_t __riscv_vslideup_vx_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat32m4_t vs2, size_t rs1,
                                            size_t vl);
vfloat32m8_t __riscv_vslideup_vx_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat32m8_t vs2, size_t rs1,
                                            size_t vl);
vfloat64m1_t __riscv_vslideup_vx_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat64m1_t vs2, size_t rs1,
                                            size_t vl);
vfloat64m2_t __riscv_vslideup_vx_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat64m2_t vs2, size_t rs1,
                                            size_t vl);
vfloat64m4_t __riscv_vslideup_vx_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat64m4_t vs2, size_t rs1,
                                            size_t vl);
vfloat64m8_t __riscv_vslideup_vx_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat64m8_t vs2, size_t rs1,
                                            size_t vl);
vint8mf8_t __riscv_vslideup_vx_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                          vint8mf8_t vs2, size_t rs1,
                                          size_t vl);
vint8mf4_t __riscv_vslideup_vx_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                          vint8mf4_t vs2, size_t rs1,
                                          size_t vl);
vint8mf2_t __riscv_vslideup_vx_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                          vint8mf2_t vs2, size_t rs1,
                                          size_t vl);
vint8m1_t __riscv_vslideup_vx_i8m1_tumu(vbool8_t vm, vint8m1_t vd,
                                        vint8m1_t vs2, size_t rs1, size_t vl);
vint8m2_t __riscv_vslideup_vx_i8m2_tumu(vbool4_t vm, vint8m2_t vd,
                                        vint8m2_t vs2, size_t rs1, size_t vl);
vint8m4_t __riscv_vslideup_vx_i8m4_tumu(vbool2_t vm, vint8m4_t vd,
                                        vint8m4_t vs2, size_t rs1, size_t vl);
vint8m8_t __riscv_vslideup_vx_i8m8_tumu(vbool1_t vm, vint8m8_t vd,
                                        vint8m8_t vs2, size_t rs1, size_t vl);
vint16mf4_t __riscv_vslideup_vx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                            vint16mf4_t vs2, size_t rs1,
                                            size_t vl);
vint16mf2_t __riscv_vslideup_vx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                            vint16mf2_t vs2, size_t rs1,
                                            size_t vl);
vint16m1_t __riscv_vslideup_vx_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                          vint16m1_t vs2, size_t rs1,
                                          size_t vl);
vint16m2_t __riscv_vslideup_vx_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                          vint16m2_t vs2, size_t rs1,
                                          size_t vl);
vint16m4_t __riscv_vslideup_vx_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                          vint16m4_t vs2, size_t rs1,
                                          size_t vl);
vint16m8_t __riscv_vslideup_vx_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                          vint16m8_t vs2, size_t rs1,
                                          size_t vl);
vint32mf2_t __riscv_vslideup_vx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                            vint32mf2_t vs2, size_t rs1,
                                            size_t vl);
vint32m1_t __riscv_vslideup_vx_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                          vint32m1_t vs2, size_t rs1,
                                          size_t vl);
vint32m2_t __riscv_vslideup_vx_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                          vint32m2_t vs2, size_t rs1,
                                          size_t vl);
vint32m4_t __riscv_vslideup_vx_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                          vint32m4_t vs2, size_t rs1,
                                          size_t vl);
vint32m8_t __riscv_vslideup_vx_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                          vint32m8_t vs2, size_t rs1,
                                          size_t vl);
vint64m1_t __riscv_vslideup_vx_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                          vint64m1_t vs2, size_t rs1,
                                          size_t vl);
vint64m2_t __riscv_vslideup_vx_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                          vint64m2_t vs2, size_t rs1,
                                          size_t vl);
vint64m4_t __riscv_vslideup_vx_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                          vint64m4_t vs2, size_t rs1,
                                          size_t vl);
vint64m8_t __riscv_vslideup_vx_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                          vint64m8_t vs2, size_t rs1,
                                          size_t vl);
vuint8mf8_t __riscv_vslideup_vx_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                           vuint8mf8_t vs2, size_t rs1,
                                           size_t vl);
vuint8mf4_t __riscv_vslideup_vx_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                           vuint8mf4_t vs2, size_t rs1,
                                           size_t vl);
vuint8mf2_t __riscv_vslideup_vx_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                           vuint8mf2_t vs2, size_t rs1,
                                           size_t vl);
vuint8m1_t __riscv_vslideup_vx_u8m1_tumu(vbool8_t vm, vuint8m1_t vd,
                                         vuint8m1_t vs2, size_t rs1, size_t vl);
vuint8m2_t __riscv_vslideup_vx_u8m2_tumu(vbool4_t vm, vuint8m2_t vd,
                                         vuint8m2_t vs2, size_t rs1, size_t vl);
vuint8m4_t __riscv_vslideup_vx_u8m4_tumu(vbool2_t vm, vuint8m4_t vd,
                                         vuint8m4_t vs2, size_t rs1, size_t vl);
vuint8m8_t __riscv_vslideup_vx_u8m8_tumu(vbool1_t vm, vuint8m8_t vd,
                                         vuint8m8_t vs2, size_t rs1, size_t vl);
vuint16mf4_t __riscv_vslideup_vx_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                             vuint16mf4_t vs2, size_t rs1,
                                             size_t vl);
vuint16mf2_t __riscv_vslideup_vx_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                             vuint16mf2_t vs2, size_t rs1,
                                             size_t vl);
vuint16m1_t __riscv_vslideup_vx_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                           vuint16m1_t vs2, size_t rs1,
                                           size_t vl);
vuint16m2_t __riscv_vslideup_vx_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                           vuint16m2_t vs2, size_t rs1,
                                           size_t vl);
vuint16m4_t __riscv_vslideup_vx_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                           vuint16m4_t vs2, size_t rs1,
                                           size_t vl);
vuint16m8_t __riscv_vslideup_vx_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                           vuint16m8_t vs2, size_t rs1,
                                           size_t vl);
vuint32mf2_t __riscv_vslideup_vx_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                             vuint32mf2_t vs2, size_t rs1,
                                             size_t vl);
vuint32m1_t __riscv_vslideup_vx_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                           vuint32m1_t vs2, size_t rs1,
                                           size_t vl);
vuint32m2_t __riscv_vslideup_vx_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                           vuint32m2_t vs2, size_t rs1,
                                           size_t vl);
vuint32m4_t __riscv_vslideup_vx_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                           vuint32m4_t vs2, size_t rs1,
                                           size_t vl);
vuint32m8_t __riscv_vslideup_vx_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                           vuint32m8_t vs2, size_t rs1,
                                           size_t vl);
vuint64m1_t __riscv_vslideup_vx_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                           vuint64m1_t vs2, size_t rs1,
                                           size_t vl);
vuint64m2_t __riscv_vslideup_vx_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                           vuint64m2_t vs2, size_t rs1,
                                           size_t vl);
vuint64m4_t __riscv_vslideup_vx_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                           vuint64m4_t vs2, size_t rs1,
                                           size_t vl);
vuint64m8_t __riscv_vslideup_vx_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                           vuint64m8_t vs2, size_t rs1,
                                           size_t vl);
// masked functions: tail agnostic, mask undisturbed (_mu)
vfloat16mf4_t __riscv_vslideup_vx_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                            vfloat16mf4_t vs2, size_t rs1,
                                            size_t vl);
vfloat16mf2_t __riscv_vslideup_vx_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                            vfloat16mf2_t vs2, size_t rs1,
                                            size_t vl);
vfloat16m1_t __riscv_vslideup_vx_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                          vfloat16m1_t vs2, size_t rs1,
                                          size_t vl);
vfloat16m2_t __riscv_vslideup_vx_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                          vfloat16m2_t vs2, size_t rs1,
                                          size_t vl);
vfloat16m4_t __riscv_vslideup_vx_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                          vfloat16m4_t vs2, size_t rs1,
                                          size_t vl);
vfloat16m8_t __riscv_vslideup_vx_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                          vfloat16m8_t vs2, size_t rs1,
                                          size_t vl);
vfloat32mf2_t __riscv_vslideup_vx_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs2, size_t rs1,
                                            size_t vl);
vfloat32m1_t __riscv_vslideup_vx_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs2, size_t rs1,
                                          size_t vl);
vfloat32m2_t __riscv_vslideup_vx_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs2, size_t rs1,
                                          size_t vl);
vfloat32m4_t __riscv_vslideup_vx_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs2, size_t rs1,
                                          size_t vl);
vfloat32m8_t __riscv_vslideup_vx_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs2, size_t rs1,
                                          size_t vl);
vfloat64m1_t __riscv_vslideup_vx_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs2, size_t rs1,
                                          size_t vl);
vfloat64m2_t __riscv_vslideup_vx_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs2, size_t rs1,
                                          size_t vl);
vfloat64m4_t __riscv_vslideup_vx_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs2, size_t rs1,
                                          size_t vl);
vfloat64m8_t __riscv_vslideup_vx_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs2, size_t rs1,
                                          size_t vl);
vint8mf8_t __riscv_vslideup_vx_i8mf8_mu(vbool64_t vm, vint8mf8_t vd,
                                        vint8mf8_t vs2, size_t rs1, size_t vl);
vint8mf4_t __riscv_vslideup_vx_i8mf4_mu(vbool32_t vm, vint8mf4_t vd,
                                        vint8mf4_t vs2, size_t rs1, size_t vl);
vint8mf2_t __riscv_vslideup_vx_i8mf2_mu(vbool16_t vm, vint8mf2_t vd,
                                        vint8mf2_t vs2, size_t rs1, size_t vl);
vint8m1_t __riscv_vslideup_vx_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                      size_t rs1, size_t vl);
vint8m2_t __riscv_vslideup_vx_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                      size_t rs1, size_t vl);
vint8m4_t __riscv_vslideup_vx_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                      size_t rs1, size_t vl);
vint8m8_t __riscv_vslideup_vx_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                      size_t rs1, size_t vl);
vint16mf4_t __riscv_vslideup_vx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                          vint16mf4_t vs2, size_t rs1,
                                          size_t vl);
vint16mf2_t __riscv_vslideup_vx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                          vint16mf2_t vs2, size_t rs1,
                                          size_t vl);
vint16m1_t __riscv_vslideup_vx_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                        vint16m1_t vs2, size_t rs1, size_t vl);
vint16m2_t __riscv_vslideup_vx_i16m2_mu(vbool8_t vm, vint16m2_t vd,
                                        vint16m2_t vs2, size_t rs1, size_t vl);
vint16m4_t __riscv_vslideup_vx_i16m4_mu(vbool4_t vm, vint16m4_t vd,
                                        vint16m4_t vs2, size_t rs1, size_t vl);
vint16m8_t __riscv_vslideup_vx_i16m8_mu(vbool2_t vm, vint16m8_t vd,
                                        vint16m8_t vs2, size_t rs1, size_t vl);
vint32mf2_t __riscv_vslideup_vx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                          vint32mf2_t vs2, size_t rs1,
                                          size_t vl);
vint32m1_t __riscv_vslideup_vx_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                        vint32m1_t vs2, size_t rs1, size_t vl);
vint32m2_t __riscv_vslideup_vx_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                        vint32m2_t vs2, size_t rs1, size_t vl);
vint32m4_t __riscv_vslideup_vx_i32m4_mu(vbool8_t vm, vint32m4_t vd,
                                        vint32m4_t vs2, size_t rs1, size_t vl);
vint32m8_t __riscv_vslideup_vx_i32m8_mu(vbool4_t vm, vint32m8_t vd,
                                        vint32m8_t vs2, size_t rs1, size_t vl);
vint64m1_t __riscv_vslideup_vx_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                        vint64m1_t vs2, size_t rs1, size_t vl);
vint64m2_t __riscv_vslideup_vx_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                        vint64m2_t vs2, size_t rs1, size_t vl);
vint64m4_t __riscv_vslideup_vx_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                        vint64m4_t vs2, size_t rs1, size_t vl);
vint64m8_t __riscv_vslideup_vx_i64m8_mu(vbool8_t vm, vint64m8_t vd,
                                        vint64m8_t vs2, size_t rs1, size_t vl);
vuint8mf8_t __riscv_vslideup_vx_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                         vuint8mf8_t vs2, size_t rs1,
                                         size_t vl);
vuint8mf4_t __riscv_vslideup_vx_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                         vuint8mf4_t vs2, size_t rs1,
                                         size_t vl);
vuint8mf2_t __riscv_vslideup_vx_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                         vuint8mf2_t vs2, size_t rs1,
                                         size_t vl);
vuint8m1_t __riscv_vslideup_vx_u8m1_mu(vbool8_t vm, vuint8m1_t vd,
                                       vuint8m1_t vs2, size_t rs1, size_t vl);
vuint8m2_t __riscv_vslideup_vx_u8m2_mu(vbool4_t vm, vuint8m2_t vd,
                                       vuint8m2_t vs2, size_t rs1, size_t vl);
vuint8m4_t __riscv_vslideup_vx_u8m4_mu(vbool2_t vm, vuint8m4_t vd,
                                       vuint8m4_t vs2, size_t rs1, size_t vl);
vuint8m8_t __riscv_vslideup_vx_u8m8_mu(vbool1_t vm, vuint8m8_t vd,
                                       vuint8m8_t vs2, size_t rs1, size_t vl);
vuint16mf4_t __riscv_vslideup_vx_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                           vuint16mf4_t vs2, size_t rs1,
                                           size_t vl);
vuint16mf2_t __riscv_vslideup_vx_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                           vuint16mf2_t vs2, size_t rs1,
                                           size_t vl);
vuint16m1_t __riscv_vslideup_vx_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                         vuint16m1_t vs2, size_t rs1,
                                         size_t vl);
vuint16m2_t __riscv_vslideup_vx_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                         vuint16m2_t vs2, size_t rs1,
                                         size_t vl);
vuint16m4_t __riscv_vslideup_vx_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                         vuint16m4_t vs2, size_t rs1,
                                         size_t vl);
vuint16m8_t __riscv_vslideup_vx_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                         vuint16m8_t vs2, size_t rs1,
                                         size_t vl);
vuint32mf2_t __riscv_vslideup_vx_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                           vuint32mf2_t vs2, size_t rs1,
                                           size_t vl);
vuint32m1_t __riscv_vslideup_vx_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                         vuint32m1_t vs2, size_t rs1,
                                         size_t vl);
vuint32m2_t __riscv_vslideup_vx_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                         vuint32m2_t vs2, size_t rs1,
                                         size_t vl);
vuint32m4_t __riscv_vslideup_vx_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                         vuint32m4_t vs2, size_t rs1,
                                         size_t vl);
vuint32m8_t __riscv_vslideup_vx_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                         vuint32m8_t vs2, size_t rs1,
                                         size_t vl);
vuint64m1_t __riscv_vslideup_vx_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                         vuint64m1_t vs2, size_t rs1,
                                         size_t vl);
vuint64m2_t __riscv_vslideup_vx_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                         vuint64m2_t vs2, size_t rs1,
                                         size_t vl);
vuint64m4_t __riscv_vslideup_vx_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                         vuint64m4_t vs2, size_t rs1,
                                         size_t vl);
vuint64m8_t __riscv_vslideup_vx_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                         vuint64m8_t vs2, size_t rs1,
                                         size_t vl);
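
As a usage sketch (shift_up_one is an illustrative name, not part of the API), sliding a vector up by one lane while keeping lane 0 from a previous vector:

#include <riscv_vector.h>

// Result lane 0 comes from prev (vslideup leaves vd[0..rs1-1]
// untouched); lane i holds v[i - 1] for 1 <= i < vl. The _tu policy
// additionally preserves the tail of prev past vl.
vint32m1_t shift_up_one(vint32m1_t prev, vint32m1_t v, size_t vl) {
    return __riscv_vslideup_vx_i32m1_tu(prev, v, 1, vl);
}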

Vector Slidedown Intrinsics
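
These intrinsics correspond to the vslidedown.vx instruction: element i of the result is read from element i + rs1 of vs2, and source positions at or beyond VLMAX read as zero. Unlike vslideup, every destination element below vl is written, so vd supplies only the tail elements under the _tu policy.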

vfloat16mf4_t __riscv_vslidedown_vx_f16mf4_tu(vfloat16mf4_t vd,
                                              vfloat16mf4_t vs2, size_t rs1,
                                              size_t vl);
vfloat16mf2_t __riscv_vslidedown_vx_f16mf2_tu(vfloat16mf2_t vd,
                                              vfloat16mf2_t vs2, size_t rs1,
                                              size_t vl);
vfloat16m1_t __riscv_vslidedown_vx_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                            size_t rs1, size_t vl);
vfloat16m2_t __riscv_vslidedown_vx_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                            size_t rs1, size_t vl);
vfloat16m4_t __riscv_vslidedown_vx_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                            size_t rs1, size_t vl);
vfloat16m8_t __riscv_vslidedown_vx_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                            size_t rs1, size_t vl);
vfloat32mf2_t __riscv_vslidedown_vx_f32mf2_tu(vfloat32mf2_t vd,
                                              vfloat32mf2_t vs2, size_t rs1,
                                              size_t vl);
vfloat32m1_t __riscv_vslidedown_vx_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                            size_t rs1, size_t vl);
vfloat32m2_t __riscv_vslidedown_vx_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                            size_t rs1, size_t vl);
vfloat32m4_t __riscv_vslidedown_vx_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                            size_t rs1, size_t vl);
vfloat32m8_t __riscv_vslidedown_vx_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                            size_t rs1, size_t vl);
vfloat64m1_t __riscv_vslidedown_vx_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                            size_t rs1, size_t vl);
vfloat64m2_t __riscv_vslidedown_vx_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                            size_t rs1, size_t vl);
vfloat64m4_t __riscv_vslidedown_vx_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                            size_t rs1, size_t vl);
vfloat64m8_t __riscv_vslidedown_vx_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                            size_t rs1, size_t vl);
vint8mf8_t __riscv_vslidedown_vx_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2,
                                          size_t rs1, size_t vl);
vint8mf4_t __riscv_vslidedown_vx_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2,
                                          size_t rs1, size_t vl);
vint8mf2_t __riscv_vslidedown_vx_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2,
                                          size_t rs1, size_t vl);
vint8m1_t __riscv_vslidedown_vx_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, size_t rs1,
                                        size_t vl);
vint8m2_t __riscv_vslidedown_vx_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, size_t rs1,
                                        size_t vl);
vint8m4_t __riscv_vslidedown_vx_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, size_t rs1,
                                        size_t vl);
vint8m8_t __riscv_vslidedown_vx_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, size_t rs1,
                                        size_t vl);
vint16mf4_t __riscv_vslidedown_vx_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                            size_t rs1, size_t vl);
vint16mf2_t __riscv_vslidedown_vx_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                            size_t rs1, size_t vl);
vint16m1_t __riscv_vslidedown_vx_i16m1_tu(vint16m1_t vd, vint16m1_t vs2,
                                          size_t rs1, size_t vl);
vint16m2_t __riscv_vslidedown_vx_i16m2_tu(vint16m2_t vd, vint16m2_t vs2,
                                          size_t rs1, size_t vl);
vint16m4_t __riscv_vslidedown_vx_i16m4_tu(vint16m4_t vd, vint16m4_t vs2,
                                          size_t rs1, size_t vl);
vint16m8_t __riscv_vslidedown_vx_i16m8_tu(vint16m8_t vd, vint16m8_t vs2,
                                          size_t rs1, size_t vl);
vint32mf2_t __riscv_vslidedown_vx_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                            size_t rs1, size_t vl);
vint32m1_t __riscv_vslidedown_vx_i32m1_tu(vint32m1_t vd, vint32m1_t vs2,
                                          size_t rs1, size_t vl);
vint32m2_t __riscv_vslidedown_vx_i32m2_tu(vint32m2_t vd, vint32m2_t vs2,
                                          size_t rs1, size_t vl);
vint32m4_t __riscv_vslidedown_vx_i32m4_tu(vint32m4_t vd, vint32m4_t vs2,
                                          size_t rs1, size_t vl);
vint32m8_t __riscv_vslidedown_vx_i32m8_tu(vint32m8_t vd, vint32m8_t vs2,
                                          size_t rs1, size_t vl);
vint64m1_t __riscv_vslidedown_vx_i64m1_tu(vint64m1_t vd, vint64m1_t vs2,
                                          size_t rs1, size_t vl);
vint64m2_t __riscv_vslidedown_vx_i64m2_tu(vint64m2_t vd, vint64m2_t vs2,
                                          size_t rs1, size_t vl);
vint64m4_t __riscv_vslidedown_vx_i64m4_tu(vint64m4_t vd, vint64m4_t vs2,
                                          size_t rs1, size_t vl);
vint64m8_t __riscv_vslidedown_vx_i64m8_tu(vint64m8_t vd, vint64m8_t vs2,
                                          size_t rs1, size_t vl);
vuint8mf8_t __riscv_vslidedown_vx_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                           size_t rs1, size_t vl);
vuint8mf4_t __riscv_vslidedown_vx_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                           size_t rs1, size_t vl);
vuint8mf2_t __riscv_vslidedown_vx_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                           size_t rs1, size_t vl);
vuint8m1_t __riscv_vslidedown_vx_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2,
                                         size_t rs1, size_t vl);
vuint8m2_t __riscv_vslidedown_vx_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2,
                                         size_t rs1, size_t vl);
vuint8m4_t __riscv_vslidedown_vx_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2,
                                         size_t rs1, size_t vl);
vuint8m8_t __riscv_vslidedown_vx_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2,
                                         size_t rs1, size_t vl);
vuint16mf4_t __riscv_vslidedown_vx_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                             size_t rs1, size_t vl);
vuint16mf2_t __riscv_vslidedown_vx_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                             size_t rs1, size_t vl);
vuint16m1_t __riscv_vslidedown_vx_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                           size_t rs1, size_t vl);
vuint16m2_t __riscv_vslidedown_vx_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                           size_t rs1, size_t vl);
vuint16m4_t __riscv_vslidedown_vx_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                           size_t rs1, size_t vl);
vuint16m8_t __riscv_vslidedown_vx_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                           size_t rs1, size_t vl);
vuint32mf2_t __riscv_vslidedown_vx_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                             size_t rs1, size_t vl);
vuint32m1_t __riscv_vslidedown_vx_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                           size_t rs1, size_t vl);
vuint32m2_t __riscv_vslidedown_vx_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                           size_t rs1, size_t vl);
vuint32m4_t __riscv_vslidedown_vx_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                           size_t rs1, size_t vl);
vuint32m8_t __riscv_vslidedown_vx_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                           size_t rs1, size_t vl);
vuint64m1_t __riscv_vslidedown_vx_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                           size_t rs1, size_t vl);
vuint64m2_t __riscv_vslidedown_vx_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                           size_t rs1, size_t vl);
vuint64m4_t __riscv_vslidedown_vx_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                           size_t rs1, size_t vl);
vuint64m8_t __riscv_vslidedown_vx_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                           size_t rs1, size_t vl);
// masked functions: tail undisturbed, mask agnostic (_tum)
vfloat16mf4_t __riscv_vslidedown_vx_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                               vfloat16mf4_t vs2, size_t rs1,
                                               size_t vl);
vfloat16mf2_t __riscv_vslidedown_vx_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                               vfloat16mf2_t vs2, size_t rs1,
                                               size_t vl);
vfloat16m1_t __riscv_vslidedown_vx_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                             vfloat16m1_t vs2, size_t rs1,
                                             size_t vl);
vfloat16m2_t __riscv_vslidedown_vx_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                             vfloat16m2_t vs2, size_t rs1,
                                             size_t vl);
vfloat16m4_t __riscv_vslidedown_vx_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                             vfloat16m4_t vs2, size_t rs1,
                                             size_t vl);
vfloat16m8_t __riscv_vslidedown_vx_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                             vfloat16m8_t vs2, size_t rs1,
                                             size_t vl);
vfloat32mf2_t __riscv_vslidedown_vx_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                               vfloat32mf2_t vs2, size_t rs1,
                                               size_t vl);
vfloat32m1_t __riscv_vslidedown_vx_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                             vfloat32m1_t vs2, size_t rs1,
                                             size_t vl);
vfloat32m2_t __riscv_vslidedown_vx_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                             vfloat32m2_t vs2, size_t rs1,
                                             size_t vl);
vfloat32m4_t __riscv_vslidedown_vx_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                             vfloat32m4_t vs2, size_t rs1,
                                             size_t vl);
vfloat32m8_t __riscv_vslidedown_vx_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                             vfloat32m8_t vs2, size_t rs1,
                                             size_t vl);
vfloat64m1_t __riscv_vslidedown_vx_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                             vfloat64m1_t vs2, size_t rs1,
                                             size_t vl);
vfloat64m2_t __riscv_vslidedown_vx_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                             vfloat64m2_t vs2, size_t rs1,
                                             size_t vl);
vfloat64m4_t __riscv_vslidedown_vx_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                             vfloat64m4_t vs2, size_t rs1,
                                             size_t vl);
vfloat64m8_t __riscv_vslidedown_vx_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                             vfloat64m8_t vs2, size_t rs1,
                                             size_t vl);
vint8mf8_t __riscv_vslidedown_vx_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                           vint8mf8_t vs2, size_t rs1,
                                           size_t vl);
vint8mf4_t __riscv_vslidedown_vx_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                           vint8mf4_t vs2, size_t rs1,
                                           size_t vl);
vint8mf2_t __riscv_vslidedown_vx_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                           vint8mf2_t vs2, size_t rs1,
                                           size_t vl);
vint8m1_t __riscv_vslidedown_vx_i8m1_tum(vbool8_t vm, vint8m1_t vd,
                                         vint8m1_t vs2, size_t rs1, size_t vl);
vint8m2_t __riscv_vslidedown_vx_i8m2_tum(vbool4_t vm, vint8m2_t vd,
                                         vint8m2_t vs2, size_t rs1, size_t vl);
vint8m4_t __riscv_vslidedown_vx_i8m4_tum(vbool2_t vm, vint8m4_t vd,
                                         vint8m4_t vs2, size_t rs1, size_t vl);
vint8m8_t __riscv_vslidedown_vx_i8m8_tum(vbool1_t vm, vint8m8_t vd,
                                         vint8m8_t vs2, size_t rs1, size_t vl);
vint16mf4_t __riscv_vslidedown_vx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                             vint16mf4_t vs2, size_t rs1,
                                             size_t vl);
vint16mf2_t __riscv_vslidedown_vx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                             vint16mf2_t vs2, size_t rs1,
                                             size_t vl);
vint16m1_t __riscv_vslidedown_vx_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                           vint16m1_t vs2, size_t rs1,
                                           size_t vl);
vint16m2_t __riscv_vslidedown_vx_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                           vint16m2_t vs2, size_t rs1,
                                           size_t vl);
vint16m4_t __riscv_vslidedown_vx_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                           vint16m4_t vs2, size_t rs1,
                                           size_t vl);
vint16m8_t __riscv_vslidedown_vx_i16m8_tum(vbool2_t vm, vint16m8_t vd,
                                           vint16m8_t vs2, size_t rs1,
                                           size_t vl);
vint32mf2_t __riscv_vslidedown_vx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                             vint32mf2_t vs2, size_t rs1,
                                             size_t vl);
vint32m1_t __riscv_vslidedown_vx_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                           vint32m1_t vs2, size_t rs1,
                                           size_t vl);
vint32m2_t __riscv_vslidedown_vx_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                           vint32m2_t vs2, size_t rs1,
                                           size_t vl);
vint32m4_t __riscv_vslidedown_vx_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                           vint32m4_t vs2, size_t rs1,
                                           size_t vl);
vint32m8_t __riscv_vslidedown_vx_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                           vint32m8_t vs2, size_t rs1,
                                           size_t vl);
vint64m1_t __riscv_vslidedown_vx_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                           vint64m1_t vs2, size_t rs1,
                                           size_t vl);
vint64m2_t __riscv_vslidedown_vx_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                           vint64m2_t vs2, size_t rs1,
                                           size_t vl);
vint64m4_t __riscv_vslidedown_vx_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                           vint64m4_t vs2, size_t rs1,
                                           size_t vl);
vint64m8_t __riscv_vslidedown_vx_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                           vint64m8_t vs2, size_t rs1,
                                           size_t vl);
vuint8mf8_t __riscv_vslidedown_vx_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                            vuint8mf8_t vs2, size_t rs1,
                                            size_t vl);
vuint8mf4_t __riscv_vslidedown_vx_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                            vuint8mf4_t vs2, size_t rs1,
                                            size_t vl);
vuint8mf2_t __riscv_vslidedown_vx_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                            vuint8mf2_t vs2, size_t rs1,
                                            size_t vl);
vuint8m1_t __riscv_vslidedown_vx_u8m1_tum(vbool8_t vm, vuint8m1_t vd,
                                          vuint8m1_t vs2, size_t rs1,
                                          size_t vl);
vuint8m2_t __riscv_vslidedown_vx_u8m2_tum(vbool4_t vm, vuint8m2_t vd,
                                          vuint8m2_t vs2, size_t rs1,
                                          size_t vl);
vuint8m4_t __riscv_vslidedown_vx_u8m4_tum(vbool2_t vm, vuint8m4_t vd,
                                          vuint8m4_t vs2, size_t rs1,
                                          size_t vl);
vuint8m8_t __riscv_vslidedown_vx_u8m8_tum(vbool1_t vm, vuint8m8_t vd,
                                          vuint8m8_t vs2, size_t rs1,
                                          size_t vl);
vuint16mf4_t __riscv_vslidedown_vx_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                              vuint16mf4_t vs2, size_t rs1,
                                              size_t vl);
vuint16mf2_t __riscv_vslidedown_vx_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                              vuint16mf2_t vs2, size_t rs1,
                                              size_t vl);
vuint16m1_t __riscv_vslidedown_vx_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                            vuint16m1_t vs2, size_t rs1,
                                            size_t vl);
vuint16m2_t __riscv_vslidedown_vx_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                            vuint16m2_t vs2, size_t rs1,
                                            size_t vl);
vuint16m4_t __riscv_vslidedown_vx_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                            vuint16m4_t vs2, size_t rs1,
                                            size_t vl);
vuint16m8_t __riscv_vslidedown_vx_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                            vuint16m8_t vs2, size_t rs1,
                                            size_t vl);
vuint32mf2_t __riscv_vslidedown_vx_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                              vuint32mf2_t vs2, size_t rs1,
                                              size_t vl);
vuint32m1_t __riscv_vslidedown_vx_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                            vuint32m1_t vs2, size_t rs1,
                                            size_t vl);
vuint32m2_t __riscv_vslidedown_vx_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                            vuint32m2_t vs2, size_t rs1,
                                            size_t vl);
vuint32m4_t __riscv_vslidedown_vx_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                            vuint32m4_t vs2, size_t rs1,
                                            size_t vl);
vuint32m8_t __riscv_vslidedown_vx_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                            vuint32m8_t vs2, size_t rs1,
                                            size_t vl);
vuint64m1_t __riscv_vslidedown_vx_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                            vuint64m1_t vs2, size_t rs1,
                                            size_t vl);
vuint64m2_t __riscv_vslidedown_vx_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                            vuint64m2_t vs2, size_t rs1,
                                            size_t vl);
vuint64m4_t __riscv_vslidedown_vx_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                            vuint64m4_t vs2, size_t rs1,
                                            size_t vl);
vuint64m8_t __riscv_vslidedown_vx_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                            vuint64m8_t vs2, size_t rs1,
                                            size_t vl);
// masked functions (tumu policy: tail undisturbed, masked-off undisturbed)
vfloat16mf4_t __riscv_vslidedown_vx_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                                vfloat16mf4_t vs2, size_t rs1,
                                                size_t vl);
vfloat16mf2_t __riscv_vslidedown_vx_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                                vfloat16mf2_t vs2, size_t rs1,
                                                size_t vl);
vfloat16m1_t __riscv_vslidedown_vx_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                              vfloat16m1_t vs2, size_t rs1,
                                              size_t vl);
vfloat16m2_t __riscv_vslidedown_vx_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                              vfloat16m2_t vs2, size_t rs1,
                                              size_t vl);
vfloat16m4_t __riscv_vslidedown_vx_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                              vfloat16m4_t vs2, size_t rs1,
                                              size_t vl);
vfloat16m8_t __riscv_vslidedown_vx_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                              vfloat16m8_t vs2, size_t rs1,
                                              size_t vl);
vfloat32mf2_t __riscv_vslidedown_vx_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                                vfloat32mf2_t vs2, size_t rs1,
                                                size_t vl);
vfloat32m1_t __riscv_vslidedown_vx_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                              vfloat32m1_t vs2, size_t rs1,
                                              size_t vl);
vfloat32m2_t __riscv_vslidedown_vx_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                              vfloat32m2_t vs2, size_t rs1,
                                              size_t vl);
vfloat32m4_t __riscv_vslidedown_vx_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                              vfloat32m4_t vs2, size_t rs1,
                                              size_t vl);
vfloat32m8_t __riscv_vslidedown_vx_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                              vfloat32m8_t vs2, size_t rs1,
                                              size_t vl);
vfloat64m1_t __riscv_vslidedown_vx_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                              vfloat64m1_t vs2, size_t rs1,
                                              size_t vl);
vfloat64m2_t __riscv_vslidedown_vx_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                              vfloat64m2_t vs2, size_t rs1,
                                              size_t vl);
vfloat64m4_t __riscv_vslidedown_vx_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                              vfloat64m4_t vs2, size_t rs1,
                                              size_t vl);
vfloat64m8_t __riscv_vslidedown_vx_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                              vfloat64m8_t vs2, size_t rs1,
                                              size_t vl);
vint8mf8_t __riscv_vslidedown_vx_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                            vint8mf8_t vs2, size_t rs1,
                                            size_t vl);
vint8mf4_t __riscv_vslidedown_vx_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                            vint8mf4_t vs2, size_t rs1,
                                            size_t vl);
vint8mf2_t __riscv_vslidedown_vx_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                            vint8mf2_t vs2, size_t rs1,
                                            size_t vl);
vint8m1_t __riscv_vslidedown_vx_i8m1_tumu(vbool8_t vm, vint8m1_t vd,
                                          vint8m1_t vs2, size_t rs1, size_t vl);
vint8m2_t __riscv_vslidedown_vx_i8m2_tumu(vbool4_t vm, vint8m2_t vd,
                                          vint8m2_t vs2, size_t rs1, size_t vl);
vint8m4_t __riscv_vslidedown_vx_i8m4_tumu(vbool2_t vm, vint8m4_t vd,
                                          vint8m4_t vs2, size_t rs1, size_t vl);
vint8m8_t __riscv_vslidedown_vx_i8m8_tumu(vbool1_t vm, vint8m8_t vd,
                                          vint8m8_t vs2, size_t rs1, size_t vl);
vint16mf4_t __riscv_vslidedown_vx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                              vint16mf4_t vs2, size_t rs1,
                                              size_t vl);
vint16mf2_t __riscv_vslidedown_vx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                              vint16mf2_t vs2, size_t rs1,
                                              size_t vl);
vint16m1_t __riscv_vslidedown_vx_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                            vint16m1_t vs2, size_t rs1,
                                            size_t vl);
vint16m2_t __riscv_vslidedown_vx_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                            vint16m2_t vs2, size_t rs1,
                                            size_t vl);
vint16m4_t __riscv_vslidedown_vx_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                            vint16m4_t vs2, size_t rs1,
                                            size_t vl);
vint16m8_t __riscv_vslidedown_vx_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                            vint16m8_t vs2, size_t rs1,
                                            size_t vl);
vint32mf2_t __riscv_vslidedown_vx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                              vint32mf2_t vs2, size_t rs1,
                                              size_t vl);
vint32m1_t __riscv_vslidedown_vx_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                            vint32m1_t vs2, size_t rs1,
                                            size_t vl);
vint32m2_t __riscv_vslidedown_vx_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                            vint32m2_t vs2, size_t rs1,
                                            size_t vl);
vint32m4_t __riscv_vslidedown_vx_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                            vint32m4_t vs2, size_t rs1,
                                            size_t vl);
vint32m8_t __riscv_vslidedown_vx_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                            vint32m8_t vs2, size_t rs1,
                                            size_t vl);
vint64m1_t __riscv_vslidedown_vx_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                            vint64m1_t vs2, size_t rs1,
                                            size_t vl);
vint64m2_t __riscv_vslidedown_vx_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                            vint64m2_t vs2, size_t rs1,
                                            size_t vl);
vint64m4_t __riscv_vslidedown_vx_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                            vint64m4_t vs2, size_t rs1,
                                            size_t vl);
vint64m8_t __riscv_vslidedown_vx_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                            vint64m8_t vs2, size_t rs1,
                                            size_t vl);
vuint8mf8_t __riscv_vslidedown_vx_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                             vuint8mf8_t vs2, size_t rs1,
                                             size_t vl);
vuint8mf4_t __riscv_vslidedown_vx_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                             vuint8mf4_t vs2, size_t rs1,
                                             size_t vl);
vuint8mf2_t __riscv_vslidedown_vx_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                             vuint8mf2_t vs2, size_t rs1,
                                             size_t vl);
vuint8m1_t __riscv_vslidedown_vx_u8m1_tumu(vbool8_t vm, vuint8m1_t vd,
                                           vuint8m1_t vs2, size_t rs1,
                                           size_t vl);
vuint8m2_t __riscv_vslidedown_vx_u8m2_tumu(vbool4_t vm, vuint8m2_t vd,
                                           vuint8m2_t vs2, size_t rs1,
                                           size_t vl);
vuint8m4_t __riscv_vslidedown_vx_u8m4_tumu(vbool2_t vm, vuint8m4_t vd,
                                           vuint8m4_t vs2, size_t rs1,
                                           size_t vl);
vuint8m8_t __riscv_vslidedown_vx_u8m8_tumu(vbool1_t vm, vuint8m8_t vd,
                                           vuint8m8_t vs2, size_t rs1,
                                           size_t vl);
vuint16mf4_t __riscv_vslidedown_vx_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                               vuint16mf4_t vs2, size_t rs1,
                                               size_t vl);
vuint16mf2_t __riscv_vslidedown_vx_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                               vuint16mf2_t vs2, size_t rs1,
                                               size_t vl);
vuint16m1_t __riscv_vslidedown_vx_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                             vuint16m1_t vs2, size_t rs1,
                                             size_t vl);
vuint16m2_t __riscv_vslidedown_vx_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                             vuint16m2_t vs2, size_t rs1,
                                             size_t vl);
vuint16m4_t __riscv_vslidedown_vx_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                             vuint16m4_t vs2, size_t rs1,
                                             size_t vl);
vuint16m8_t __riscv_vslidedown_vx_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                             vuint16m8_t vs2, size_t rs1,
                                             size_t vl);
vuint32mf2_t __riscv_vslidedown_vx_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                               vuint32mf2_t vs2, size_t rs1,
                                               size_t vl);
vuint32m1_t __riscv_vslidedown_vx_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                             vuint32m1_t vs2, size_t rs1,
                                             size_t vl);
vuint32m2_t __riscv_vslidedown_vx_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                             vuint32m2_t vs2, size_t rs1,
                                             size_t vl);
vuint32m4_t __riscv_vslidedown_vx_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                             vuint32m4_t vs2, size_t rs1,
                                             size_t vl);
vuint32m8_t __riscv_vslidedown_vx_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                             vuint32m8_t vs2, size_t rs1,
                                             size_t vl);
vuint64m1_t __riscv_vslidedown_vx_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                             vuint64m1_t vs2, size_t rs1,
                                             size_t vl);
vuint64m2_t __riscv_vslidedown_vx_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                             vuint64m2_t vs2, size_t rs1,
                                             size_t vl);
vuint64m4_t __riscv_vslidedown_vx_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                             vuint64m4_t vs2, size_t rs1,
                                             size_t vl);
vuint64m8_t __riscv_vslidedown_vx_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                             vuint64m8_t vs2, size_t rs1,
                                             size_t vl);
// masked functions (mu policy: tail agnostic, masked-off undisturbed)
vfloat16mf4_t __riscv_vslidedown_vx_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                              vfloat16mf4_t vs2, size_t rs1,
                                              size_t vl);
vfloat16mf2_t __riscv_vslidedown_vx_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                              vfloat16mf2_t vs2, size_t rs1,
                                              size_t vl);
vfloat16m1_t __riscv_vslidedown_vx_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                            vfloat16m1_t vs2, size_t rs1,
                                            size_t vl);
vfloat16m2_t __riscv_vslidedown_vx_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                            vfloat16m2_t vs2, size_t rs1,
                                            size_t vl);
vfloat16m4_t __riscv_vslidedown_vx_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                            vfloat16m4_t vs2, size_t rs1,
                                            size_t vl);
vfloat16m8_t __riscv_vslidedown_vx_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                            vfloat16m8_t vs2, size_t rs1,
                                            size_t vl);
vfloat32mf2_t __riscv_vslidedown_vx_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat32mf2_t vs2, size_t rs1,
                                              size_t vl);
vfloat32m1_t __riscv_vslidedown_vx_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat32m1_t vs2, size_t rs1,
                                            size_t vl);
vfloat32m2_t __riscv_vslidedown_vx_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat32m2_t vs2, size_t rs1,
                                            size_t vl);
vfloat32m4_t __riscv_vslidedown_vx_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat32m4_t vs2, size_t rs1,
                                            size_t vl);
vfloat32m8_t __riscv_vslidedown_vx_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat32m8_t vs2, size_t rs1,
                                            size_t vl);
vfloat64m1_t __riscv_vslidedown_vx_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat64m1_t vs2, size_t rs1,
                                            size_t vl);
vfloat64m2_t __riscv_vslidedown_vx_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat64m2_t vs2, size_t rs1,
                                            size_t vl);
vfloat64m4_t __riscv_vslidedown_vx_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat64m4_t vs2, size_t rs1,
                                            size_t vl);
vfloat64m8_t __riscv_vslidedown_vx_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat64m8_t vs2, size_t rs1,
                                            size_t vl);
vint8mf8_t __riscv_vslidedown_vx_i8mf8_mu(vbool64_t vm, vint8mf8_t vd,
                                          vint8mf8_t vs2, size_t rs1,
                                          size_t vl);
vint8mf4_t __riscv_vslidedown_vx_i8mf4_mu(vbool32_t vm, vint8mf4_t vd,
                                          vint8mf4_t vs2, size_t rs1,
                                          size_t vl);
vint8mf2_t __riscv_vslidedown_vx_i8mf2_mu(vbool16_t vm, vint8mf2_t vd,
                                          vint8mf2_t vs2, size_t rs1,
                                          size_t vl);
vint8m1_t __riscv_vslidedown_vx_i8m1_mu(vbool8_t vm, vint8m1_t vd,
                                        vint8m1_t vs2, size_t rs1, size_t vl);
vint8m2_t __riscv_vslidedown_vx_i8m2_mu(vbool4_t vm, vint8m2_t vd,
                                        vint8m2_t vs2, size_t rs1, size_t vl);
vint8m4_t __riscv_vslidedown_vx_i8m4_mu(vbool2_t vm, vint8m4_t vd,
                                        vint8m4_t vs2, size_t rs1, size_t vl);
vint8m8_t __riscv_vslidedown_vx_i8m8_mu(vbool1_t vm, vint8m8_t vd,
                                        vint8m8_t vs2, size_t rs1, size_t vl);
vint16mf4_t __riscv_vslidedown_vx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                            vint16mf4_t vs2, size_t rs1,
                                            size_t vl);
vint16mf2_t __riscv_vslidedown_vx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                            vint16mf2_t vs2, size_t rs1,
                                            size_t vl);
vint16m1_t __riscv_vslidedown_vx_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                          vint16m1_t vs2, size_t rs1,
                                          size_t vl);
vint16m2_t __riscv_vslidedown_vx_i16m2_mu(vbool8_t vm, vint16m2_t vd,
                                          vint16m2_t vs2, size_t rs1,
                                          size_t vl);
vint16m4_t __riscv_vslidedown_vx_i16m4_mu(vbool4_t vm, vint16m4_t vd,
                                          vint16m4_t vs2, size_t rs1,
                                          size_t vl);
vint16m8_t __riscv_vslidedown_vx_i16m8_mu(vbool2_t vm, vint16m8_t vd,
                                          vint16m8_t vs2, size_t rs1,
                                          size_t vl);
vint32mf2_t __riscv_vslidedown_vx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                            vint32mf2_t vs2, size_t rs1,
                                            size_t vl);
vint32m1_t __riscv_vslidedown_vx_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                          vint32m1_t vs2, size_t rs1,
                                          size_t vl);
vint32m2_t __riscv_vslidedown_vx_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                          vint32m2_t vs2, size_t rs1,
                                          size_t vl);
vint32m4_t __riscv_vslidedown_vx_i32m4_mu(vbool8_t vm, vint32m4_t vd,
                                          vint32m4_t vs2, size_t rs1,
                                          size_t vl);
vint32m8_t __riscv_vslidedown_vx_i32m8_mu(vbool4_t vm, vint32m8_t vd,
                                          vint32m8_t vs2, size_t rs1,
                                          size_t vl);
vint64m1_t __riscv_vslidedown_vx_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                          vint64m1_t vs2, size_t rs1,
                                          size_t vl);
vint64m2_t __riscv_vslidedown_vx_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                          vint64m2_t vs2, size_t rs1,
                                          size_t vl);
vint64m4_t __riscv_vslidedown_vx_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                          vint64m4_t vs2, size_t rs1,
                                          size_t vl);
vint64m8_t __riscv_vslidedown_vx_i64m8_mu(vbool8_t vm, vint64m8_t vd,
                                          vint64m8_t vs2, size_t rs1,
                                          size_t vl);
vuint8mf8_t __riscv_vslidedown_vx_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                           vuint8mf8_t vs2, size_t rs1,
                                           size_t vl);
vuint8mf4_t __riscv_vslidedown_vx_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                           vuint8mf4_t vs2, size_t rs1,
                                           size_t vl);
vuint8mf2_t __riscv_vslidedown_vx_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                           vuint8mf2_t vs2, size_t rs1,
                                           size_t vl);
vuint8m1_t __riscv_vslidedown_vx_u8m1_mu(vbool8_t vm, vuint8m1_t vd,
                                         vuint8m1_t vs2, size_t rs1, size_t vl);
vuint8m2_t __riscv_vslidedown_vx_u8m2_mu(vbool4_t vm, vuint8m2_t vd,
                                         vuint8m2_t vs2, size_t rs1, size_t vl);
vuint8m4_t __riscv_vslidedown_vx_u8m4_mu(vbool2_t vm, vuint8m4_t vd,
                                         vuint8m4_t vs2, size_t rs1, size_t vl);
vuint8m8_t __riscv_vslidedown_vx_u8m8_mu(vbool1_t vm, vuint8m8_t vd,
                                         vuint8m8_t vs2, size_t rs1, size_t vl);
vuint16mf4_t __riscv_vslidedown_vx_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                             vuint16mf4_t vs2, size_t rs1,
                                             size_t vl);
vuint16mf2_t __riscv_vslidedown_vx_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                             vuint16mf2_t vs2, size_t rs1,
                                             size_t vl);
vuint16m1_t __riscv_vslidedown_vx_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                           vuint16m1_t vs2, size_t rs1,
                                           size_t vl);
vuint16m2_t __riscv_vslidedown_vx_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                           vuint16m2_t vs2, size_t rs1,
                                           size_t vl);
vuint16m4_t __riscv_vslidedown_vx_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                           vuint16m4_t vs2, size_t rs1,
                                           size_t vl);
vuint16m8_t __riscv_vslidedown_vx_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                           vuint16m8_t vs2, size_t rs1,
                                           size_t vl);
vuint32mf2_t __riscv_vslidedown_vx_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                             vuint32mf2_t vs2, size_t rs1,
                                             size_t vl);
vuint32m1_t __riscv_vslidedown_vx_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                           vuint32m1_t vs2, size_t rs1,
                                           size_t vl);
vuint32m2_t __riscv_vslidedown_vx_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                           vuint32m2_t vs2, size_t rs1,
                                           size_t vl);
vuint32m4_t __riscv_vslidedown_vx_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                           vuint32m4_t vs2, size_t rs1,
                                           size_t vl);
vuint32m8_t __riscv_vslidedown_vx_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                           vuint32m8_t vs2, size_t rs1,
                                           size_t vl);
vuint64m1_t __riscv_vslidedown_vx_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                           vuint64m1_t vs2, size_t rs1,
                                           size_t vl);
vuint64m2_t __riscv_vslidedown_vx_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                           vuint64m2_t vs2, size_t rs1,
                                           size_t vl);
vuint64m4_t __riscv_vslidedown_vx_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                           vuint64m4_t vs2, size_t rs1,
                                           size_t vl);
vuint64m8_t __riscv_vslidedown_vx_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                           vuint64m8_t vs2, size_t rs1,
                                           size_t vl);
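
The three masked policy groups above differ only in how inactive and tail lanes are handled; a sketch contrasting them on identical operands (the function name is illustrative, the signatures come from the listing):

#include <riscv_vector.h>
#include <stddef.h>

// Active body lanes i (vm[i] = 1, i < vl) receive vs2[i + rs1] in every
// variant. The policies diverge elsewhere:
//   _tum  : tail lanes (i >= vl) keep vd; masked-off lanes are agnostic
//   _tumu : tail lanes keep vd; masked-off lanes also keep vd
//   _mu   : tail lanes are agnostic; masked-off lanes keep vd
vint32m1_t slidedown_policies(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                              size_t rs1, size_t vl) {
  vint32m1_t tum  = __riscv_vslidedown_vx_i32m1_tum(vm, vd, vs2, rs1, vl);
  vint32m1_t tumu = __riscv_vslidedown_vx_i32m1_tumu(vm, vd, vs2, rs1, vl);
  (void)tum;
  (void)tumu; // retained only to show the signatures side by side
  return __riscv_vslidedown_vx_i32m1_mu(vm, vd, vs2, rs1, vl);
}
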

Vector Slide1up and Slide1down Intrinsics

vfloat16mf4_t __riscv_vfslide1up_vf_f16mf4_tu(vfloat16mf4_t vd,
                                              vfloat16mf4_t vs2, _Float16 rs1,
                                              size_t vl);
vfloat16mf2_t __riscv_vfslide1up_vf_f16mf2_tu(vfloat16mf2_t vd,
                                              vfloat16mf2_t vs2, _Float16 rs1,
                                              size_t vl);
vfloat16m1_t __riscv_vfslide1up_vf_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                            _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfslide1up_vf_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                            _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfslide1up_vf_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                            _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfslide1up_vf_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                            _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfslide1up_vf_f32mf2_tu(vfloat32mf2_t vd,
                                              vfloat32mf2_t vs2, float rs1,
                                              size_t vl);
vfloat32m1_t __riscv_vfslide1up_vf_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                            float rs1, size_t vl);
vfloat32m2_t __riscv_vfslide1up_vf_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                            float rs1, size_t vl);
vfloat32m4_t __riscv_vfslide1up_vf_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                            float rs1, size_t vl);
vfloat32m8_t __riscv_vfslide1up_vf_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                            float rs1, size_t vl);
vfloat64m1_t __riscv_vfslide1up_vf_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                            double rs1, size_t vl);
vfloat64m2_t __riscv_vfslide1up_vf_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                            double rs1, size_t vl);
vfloat64m4_t __riscv_vfslide1up_vf_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                            double rs1, size_t vl);
vfloat64m8_t __riscv_vfslide1up_vf_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                            double rs1, size_t vl);
vfloat16mf4_t __riscv_vfslide1down_vf_f16mf4_tu(vfloat16mf4_t vd,
                                                vfloat16mf4_t vs2, _Float16 rs1,
                                                size_t vl);
vfloat16mf2_t __riscv_vfslide1down_vf_f16mf2_tu(vfloat16mf2_t vd,
                                                vfloat16mf2_t vs2, _Float16 rs1,
                                                size_t vl);
vfloat16m1_t __riscv_vfslide1down_vf_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                              _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfslide1down_vf_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                              _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfslide1down_vf_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                              _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfslide1down_vf_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                              _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfslide1down_vf_f32mf2_tu(vfloat32mf2_t vd,
                                                vfloat32mf2_t vs2, float rs1,
                                                size_t vl);
vfloat32m1_t __riscv_vfslide1down_vf_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                              float rs1, size_t vl);
vfloat32m2_t __riscv_vfslide1down_vf_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                              float rs1, size_t vl);
vfloat32m4_t __riscv_vfslide1down_vf_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                              float rs1, size_t vl);
vfloat32m8_t __riscv_vfslide1down_vf_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                              float rs1, size_t vl);
vfloat64m1_t __riscv_vfslide1down_vf_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                              double rs1, size_t vl);
vfloat64m2_t __riscv_vfslide1down_vf_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                              double rs1, size_t vl);
vfloat64m4_t __riscv_vfslide1down_vf_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                              double rs1, size_t vl);
vfloat64m8_t __riscv_vfslide1down_vf_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                              double rs1, size_t vl);
vint8mf8_t __riscv_vslide1up_vx_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2,
                                         int8_t rs1, size_t vl);
vint8mf4_t __riscv_vslide1up_vx_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2,
                                         int8_t rs1, size_t vl);
vint8mf2_t __riscv_vslide1up_vx_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2,
                                         int8_t rs1, size_t vl);
vint8m1_t __riscv_vslide1up_vx_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, int8_t rs1,
                                       size_t vl);
vint8m2_t __riscv_vslide1up_vx_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, int8_t rs1,
                                       size_t vl);
vint8m4_t __riscv_vslide1up_vx_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, int8_t rs1,
                                       size_t vl);
vint8m8_t __riscv_vslide1up_vx_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, int8_t rs1,
                                       size_t vl);
vint16mf4_t __riscv_vslide1up_vx_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                           int16_t rs1, size_t vl);
vint16mf2_t __riscv_vslide1up_vx_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                           int16_t rs1, size_t vl);
vint16m1_t __riscv_vslide1up_vx_i16m1_tu(vint16m1_t vd, vint16m1_t vs2,
                                         int16_t rs1, size_t vl);
vint16m2_t __riscv_vslide1up_vx_i16m2_tu(vint16m2_t vd, vint16m2_t vs2,
                                         int16_t rs1, size_t vl);
vint16m4_t __riscv_vslide1up_vx_i16m4_tu(vint16m4_t vd, vint16m4_t vs2,
                                         int16_t rs1, size_t vl);
vint16m8_t __riscv_vslide1up_vx_i16m8_tu(vint16m8_t vd, vint16m8_t vs2,
                                         int16_t rs1, size_t vl);
vint32mf2_t __riscv_vslide1up_vx_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                           int32_t rs1, size_t vl);
vint32m1_t __riscv_vslide1up_vx_i32m1_tu(vint32m1_t vd, vint32m1_t vs2,
                                         int32_t rs1, size_t vl);
vint32m2_t __riscv_vslide1up_vx_i32m2_tu(vint32m2_t vd, vint32m2_t vs2,
                                         int32_t rs1, size_t vl);
vint32m4_t __riscv_vslide1up_vx_i32m4_tu(vint32m4_t vd, vint32m4_t vs2,
                                         int32_t rs1, size_t vl);
vint32m8_t __riscv_vslide1up_vx_i32m8_tu(vint32m8_t vd, vint32m8_t vs2,
                                         int32_t rs1, size_t vl);
vint64m1_t __riscv_vslide1up_vx_i64m1_tu(vint64m1_t vd, vint64m1_t vs2,
                                         int64_t rs1, size_t vl);
vint64m2_t __riscv_vslide1up_vx_i64m2_tu(vint64m2_t vd, vint64m2_t vs2,
                                         int64_t rs1, size_t vl);
vint64m4_t __riscv_vslide1up_vx_i64m4_tu(vint64m4_t vd, vint64m4_t vs2,
                                         int64_t rs1, size_t vl);
vint64m8_t __riscv_vslide1up_vx_i64m8_tu(vint64m8_t vd, vint64m8_t vs2,
                                         int64_t rs1, size_t vl);
vint8mf8_t __riscv_vslide1down_vx_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2,
                                           int8_t rs1, size_t vl);
vint8mf4_t __riscv_vslide1down_vx_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2,
                                           int8_t rs1, size_t vl);
vint8mf2_t __riscv_vslide1down_vx_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2,
                                           int8_t rs1, size_t vl);
vint8m1_t __riscv_vslide1down_vx_i8m1_tu(vint8m1_t vd, vint8m1_t vs2,
                                         int8_t rs1, size_t vl);
vint8m2_t __riscv_vslide1down_vx_i8m2_tu(vint8m2_t vd, vint8m2_t vs2,
                                         int8_t rs1, size_t vl);
vint8m4_t __riscv_vslide1down_vx_i8m4_tu(vint8m4_t vd, vint8m4_t vs2,
                                         int8_t rs1, size_t vl);
vint8m8_t __riscv_vslide1down_vx_i8m8_tu(vint8m8_t vd, vint8m8_t vs2,
                                         int8_t rs1, size_t vl);
vint16mf4_t __riscv_vslide1down_vx_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                             int16_t rs1, size_t vl);
vint16mf2_t __riscv_vslide1down_vx_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                             int16_t rs1, size_t vl);
vint16m1_t __riscv_vslide1down_vx_i16m1_tu(vint16m1_t vd, vint16m1_t vs2,
                                           int16_t rs1, size_t vl);
vint16m2_t __riscv_vslide1down_vx_i16m2_tu(vint16m2_t vd, vint16m2_t vs2,
                                           int16_t rs1, size_t vl);
vint16m4_t __riscv_vslide1down_vx_i16m4_tu(vint16m4_t vd, vint16m4_t vs2,
                                           int16_t rs1, size_t vl);
vint16m8_t __riscv_vslide1down_vx_i16m8_tu(vint16m8_t vd, vint16m8_t vs2,
                                           int16_t rs1, size_t vl);
vint32mf2_t __riscv_vslide1down_vx_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                             int32_t rs1, size_t vl);
vint32m1_t __riscv_vslide1down_vx_i32m1_tu(vint32m1_t vd, vint32m1_t vs2,
                                           int32_t rs1, size_t vl);
vint32m2_t __riscv_vslide1down_vx_i32m2_tu(vint32m2_t vd, vint32m2_t vs2,
                                           int32_t rs1, size_t vl);
vint32m4_t __riscv_vslide1down_vx_i32m4_tu(vint32m4_t vd, vint32m4_t vs2,
                                           int32_t rs1, size_t vl);
vint32m8_t __riscv_vslide1down_vx_i32m8_tu(vint32m8_t vd, vint32m8_t vs2,
                                           int32_t rs1, size_t vl);
vint64m1_t __riscv_vslide1down_vx_i64m1_tu(vint64m1_t vd, vint64m1_t vs2,
                                           int64_t rs1, size_t vl);
vint64m2_t __riscv_vslide1down_vx_i64m2_tu(vint64m2_t vd, vint64m2_t vs2,
                                           int64_t rs1, size_t vl);
vint64m4_t __riscv_vslide1down_vx_i64m4_tu(vint64m4_t vd, vint64m4_t vs2,
                                           int64_t rs1, size_t vl);
vint64m8_t __riscv_vslide1down_vx_i64m8_tu(vint64m8_t vd, vint64m8_t vs2,
                                           int64_t rs1, size_t vl);
vuint8mf8_t __riscv_vslide1up_vx_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                          uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vslide1up_vx_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                          uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vslide1up_vx_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                          uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vslide1up_vx_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2,
                                        uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vslide1up_vx_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2,
                                        uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vslide1up_vx_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2,
                                        uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vslide1up_vx_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2,
                                        uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vslide1up_vx_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                            uint16_t rs1, size_t vl);
vuint16mf2_t __riscv_vslide1up_vx_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                            uint16_t rs1, size_t vl);
vuint16m1_t __riscv_vslide1up_vx_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                          uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vslide1up_vx_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                          uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vslide1up_vx_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                          uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vslide1up_vx_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                          uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vslide1up_vx_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                            uint32_t rs1, size_t vl);
vuint32m1_t __riscv_vslide1up_vx_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                          uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vslide1up_vx_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                          uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vslide1up_vx_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                          uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vslide1up_vx_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                          uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vslide1up_vx_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                          uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vslide1up_vx_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                          uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vslide1up_vx_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                          uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vslide1up_vx_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                          uint64_t rs1, size_t vl);
vuint8mf8_t __riscv_vslide1down_vx_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                            uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vslide1down_vx_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                            uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vslide1down_vx_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                            uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vslide1down_vx_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2,
                                          uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vslide1down_vx_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2,
                                          uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vslide1down_vx_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2,
                                          uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vslide1down_vx_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2,
                                          uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vslide1down_vx_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                              uint16_t rs1, size_t vl);
vuint16mf2_t __riscv_vslide1down_vx_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                              uint16_t rs1, size_t vl);
vuint16m1_t __riscv_vslide1down_vx_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                            uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vslide1down_vx_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                            uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vslide1down_vx_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                            uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vslide1down_vx_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                            uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vslide1down_vx_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                              uint32_t rs1, size_t vl);
vuint32m1_t __riscv_vslide1down_vx_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                            uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vslide1down_vx_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                            uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vslide1down_vx_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                            uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vslide1down_vx_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                            uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vslide1down_vx_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                            uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vslide1down_vx_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                            uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vslide1down_vx_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                            uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vslide1down_vx_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                            uint64_t rs1, size_t vl);
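
A minimal strip-mined sketch of the slide1 idiom (buffer and helper names are illustrative): vslide1up shifts each element up one lane and injects the scalar rs1 into lane 0, which lets a value carry across loop iterations, here to compute first differences out[i] = in[i] - in[i-1] with in[-1] taken as 0:

#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

void diff1_i32(const int32_t *in, int32_t *out, size_t n) {
  int32_t carry = 0; // value slid into lane 0 of the next strip
  for (size_t i = 0; i < n;) {
    size_t vl = __riscv_vsetvl_e32m1(n - i);
    vint32m1_t v = __riscv_vle32_v_i32m1(in + i, vl);
    // prev[0] = carry, prev[j] = v[j-1] for 0 < j < vl; the _tu form
    // keeps tail lanes of vd (here v itself) defined.
    vint32m1_t prev = __riscv_vslide1up_vx_i32m1_tu(v, v, carry, vl);
    __riscv_vse32_v_i32m1(out + i, __riscv_vsub_vv_i32m1(v, prev, vl), vl);
    carry = in[i + vl - 1]; // last element of this strip feeds the next
    i += vl;
  }
}
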
// masked functions (tum policy: tail undisturbed, masked-off agnostic)
vfloat16mf4_t __riscv_vfslide1up_vf_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                               vfloat16mf4_t vs2, _Float16 rs1,
                                               size_t vl);
vfloat16mf2_t __riscv_vfslide1up_vf_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                               vfloat16mf2_t vs2, _Float16 rs1,
                                               size_t vl);
vfloat16m1_t __riscv_vfslide1up_vf_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                             vfloat16m1_t vs2, _Float16 rs1,
                                             size_t vl);
vfloat16m2_t __riscv_vfslide1up_vf_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                             vfloat16m2_t vs2, _Float16 rs1,
                                             size_t vl);
vfloat16m4_t __riscv_vfslide1up_vf_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                             vfloat16m4_t vs2, _Float16 rs1,
                                             size_t vl);
vfloat16m8_t __riscv_vfslide1up_vf_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                             vfloat16m8_t vs2, _Float16 rs1,
                                             size_t vl);
vfloat32mf2_t __riscv_vfslide1up_vf_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                               vfloat32mf2_t vs2, float rs1,
                                               size_t vl);
vfloat32m1_t __riscv_vfslide1up_vf_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                             vfloat32m1_t vs2, float rs1,
                                             size_t vl);
vfloat32m2_t __riscv_vfslide1up_vf_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                             vfloat32m2_t vs2, float rs1,
                                             size_t vl);
vfloat32m4_t __riscv_vfslide1up_vf_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                             vfloat32m4_t vs2, float rs1,
                                             size_t vl);
vfloat32m8_t __riscv_vfslide1up_vf_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                             vfloat32m8_t vs2, float rs1,
                                             size_t vl);
vfloat64m1_t __riscv_vfslide1up_vf_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                             vfloat64m1_t vs2, double rs1,
                                             size_t vl);
vfloat64m2_t __riscv_vfslide1up_vf_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                             vfloat64m2_t vs2, double rs1,
                                             size_t vl);
vfloat64m4_t __riscv_vfslide1up_vf_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                             vfloat64m4_t vs2, double rs1,
                                             size_t vl);
vfloat64m8_t __riscv_vfslide1up_vf_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                             vfloat64m8_t vs2, double rs1,
                                             size_t vl);
vfloat16mf4_t __riscv_vfslide1down_vf_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                                 vfloat16mf4_t vs2,
                                                 _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfslide1down_vf_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                                 vfloat16mf2_t vs2,
                                                 _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfslide1down_vf_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                               vfloat16m1_t vs2, _Float16 rs1,
                                               size_t vl);
vfloat16m2_t __riscv_vfslide1down_vf_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                               vfloat16m2_t vs2, _Float16 rs1,
                                               size_t vl);
vfloat16m4_t __riscv_vfslide1down_vf_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                               vfloat16m4_t vs2, _Float16 rs1,
                                               size_t vl);
vfloat16m8_t __riscv_vfslide1down_vf_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                               vfloat16m8_t vs2, _Float16 rs1,
                                               size_t vl);
vfloat32mf2_t __riscv_vfslide1down_vf_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                                 vfloat32mf2_t vs2, float rs1,
                                                 size_t vl);
vfloat32m1_t __riscv_vfslide1down_vf_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                               vfloat32m1_t vs2, float rs1,
                                               size_t vl);
vfloat32m2_t __riscv_vfslide1down_vf_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                               vfloat32m2_t vs2, float rs1,
                                               size_t vl);
vfloat32m4_t __riscv_vfslide1down_vf_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                               vfloat32m4_t vs2, float rs1,
                                               size_t vl);
vfloat32m8_t __riscv_vfslide1down_vf_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                               vfloat32m8_t vs2, float rs1,
                                               size_t vl);
vfloat64m1_t __riscv_vfslide1down_vf_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                               vfloat64m1_t vs2, double rs1,
                                               size_t vl);
vfloat64m2_t __riscv_vfslide1down_vf_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                               vfloat64m2_t vs2, double rs1,
                                               size_t vl);
vfloat64m4_t __riscv_vfslide1down_vf_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                               vfloat64m4_t vs2, double rs1,
                                               size_t vl);
vfloat64m8_t __riscv_vfslide1down_vf_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                               vfloat64m8_t vs2, double rs1,
                                               size_t vl);
vint8mf8_t __riscv_vslide1up_vx_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                          vint8mf8_t vs2, int8_t rs1,
                                          size_t vl);
vint8mf4_t __riscv_vslide1up_vx_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                          vint8mf4_t vs2, int8_t rs1,
                                          size_t vl);
vint8mf2_t __riscv_vslide1up_vx_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                          vint8mf2_t vs2, int8_t rs1,
                                          size_t vl);
vint8m1_t __riscv_vslide1up_vx_i8m1_tum(vbool8_t vm, vint8m1_t vd,
                                        vint8m1_t vs2, int8_t rs1, size_t vl);
vint8m2_t __riscv_vslide1up_vx_i8m2_tum(vbool4_t vm, vint8m2_t vd,
                                        vint8m2_t vs2, int8_t rs1, size_t vl);
vint8m4_t __riscv_vslide1up_vx_i8m4_tum(vbool2_t vm, vint8m4_t vd,
                                        vint8m4_t vs2, int8_t rs1, size_t vl);
vint8m8_t __riscv_vslide1up_vx_i8m8_tum(vbool1_t vm, vint8m8_t vd,
                                        vint8m8_t vs2, int8_t rs1, size_t vl);
vint16mf4_t __riscv_vslide1up_vx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                            vint16mf4_t vs2, int16_t rs1,
                                            size_t vl);
vint16mf2_t __riscv_vslide1up_vx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                            vint16mf2_t vs2, int16_t rs1,
                                            size_t vl);
vint16m1_t __riscv_vslide1up_vx_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                          vint16m1_t vs2, int16_t rs1,
                                          size_t vl);
vint16m2_t __riscv_vslide1up_vx_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                          vint16m2_t vs2, int16_t rs1,
                                          size_t vl);
vint16m4_t __riscv_vslide1up_vx_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                          vint16m4_t vs2, int16_t rs1,
                                          size_t vl);
vint16m8_t __riscv_vslide1up_vx_i16m8_tum(vbool2_t vm, vint16m8_t vd,
                                          vint16m8_t vs2, int16_t rs1,
                                          size_t vl);
vint32mf2_t __riscv_vslide1up_vx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                            vint32mf2_t vs2, int32_t rs1,
                                            size_t vl);
vint32m1_t __riscv_vslide1up_vx_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                          vint32m1_t vs2, int32_t rs1,
                                          size_t vl);
vint32m2_t __riscv_vslide1up_vx_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                          vint32m2_t vs2, int32_t rs1,
                                          size_t vl);
vint32m4_t __riscv_vslide1up_vx_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                          vint32m4_t vs2, int32_t rs1,
                                          size_t vl);
vint32m8_t __riscv_vslide1up_vx_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                          vint32m8_t vs2, int32_t rs1,
                                          size_t vl);
vint64m1_t __riscv_vslide1up_vx_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                          vint64m1_t vs2, int64_t rs1,
                                          size_t vl);
vint64m2_t __riscv_vslide1up_vx_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                          vint64m2_t vs2, int64_t rs1,
                                          size_t vl);
vint64m4_t __riscv_vslide1up_vx_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                          vint64m4_t vs2, int64_t rs1,
                                          size_t vl);
vint64m8_t __riscv_vslide1up_vx_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                          vint64m8_t vs2, int64_t rs1,
                                          size_t vl);
vint8mf8_t __riscv_vslide1down_vx_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                            vint8mf8_t vs2, int8_t rs1,
                                            size_t vl);
vint8mf4_t __riscv_vslide1down_vx_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                            vint8mf4_t vs2, int8_t rs1,
                                            size_t vl);
vint8mf2_t __riscv_vslide1down_vx_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                            vint8mf2_t vs2, int8_t rs1,
                                            size_t vl);
vint8m1_t __riscv_vslide1down_vx_i8m1_tum(vbool8_t vm, vint8m1_t vd,
                                          vint8m1_t vs2, int8_t rs1, size_t vl);
vint8m2_t __riscv_vslide1down_vx_i8m2_tum(vbool4_t vm, vint8m2_t vd,
                                          vint8m2_t vs2, int8_t rs1, size_t vl);
vint8m4_t __riscv_vslide1down_vx_i8m4_tum(vbool2_t vm, vint8m4_t vd,
                                          vint8m4_t vs2, int8_t rs1, size_t vl);
vint8m8_t __riscv_vslide1down_vx_i8m8_tum(vbool1_t vm, vint8m8_t vd,
                                          vint8m8_t vs2, int8_t rs1, size_t vl);
vint16mf4_t __riscv_vslide1down_vx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                              vint16mf4_t vs2, int16_t rs1,
                                              size_t vl);
vint16mf2_t __riscv_vslide1down_vx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                              vint16mf2_t vs2, int16_t rs1,
                                              size_t vl);
vint16m1_t __riscv_vslide1down_vx_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                            vint16m1_t vs2, int16_t rs1,
                                            size_t vl);
vint16m2_t __riscv_vslide1down_vx_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                            vint16m2_t vs2, int16_t rs1,
                                            size_t vl);
vint16m4_t __riscv_vslide1down_vx_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                            vint16m4_t vs2, int16_t rs1,
                                            size_t vl);
vint16m8_t __riscv_vslide1down_vx_i16m8_tum(vbool2_t vm, vint16m8_t vd,
                                            vint16m8_t vs2, int16_t rs1,
                                            size_t vl);
vint32mf2_t __riscv_vslide1down_vx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                              vint32mf2_t vs2, int32_t rs1,
                                              size_t vl);
vint32m1_t __riscv_vslide1down_vx_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                            vint32m1_t vs2, int32_t rs1,
                                            size_t vl);
vint32m2_t __riscv_vslide1down_vx_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                            vint32m2_t vs2, int32_t rs1,
                                            size_t vl);
vint32m4_t __riscv_vslide1down_vx_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                            vint32m4_t vs2, int32_t rs1,
                                            size_t vl);
vint32m8_t __riscv_vslide1down_vx_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                            vint32m8_t vs2, int32_t rs1,
                                            size_t vl);
vint64m1_t __riscv_vslide1down_vx_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                            vint64m1_t vs2, int64_t rs1,
                                            size_t vl);
vint64m2_t __riscv_vslide1down_vx_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                            vint64m2_t vs2, int64_t rs1,
                                            size_t vl);
vint64m4_t __riscv_vslide1down_vx_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                            vint64m4_t vs2, int64_t rs1,
                                            size_t vl);
vint64m8_t __riscv_vslide1down_vx_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                            vint64m8_t vs2, int64_t rs1,
                                            size_t vl);
vuint8mf8_t __riscv_vslide1up_vx_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                           vuint8mf8_t vs2, uint8_t rs1,
                                           size_t vl);
vuint8mf4_t __riscv_vslide1up_vx_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                           vuint8mf4_t vs2, uint8_t rs1,
                                           size_t vl);
vuint8mf2_t __riscv_vslide1up_vx_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                           vuint8mf2_t vs2, uint8_t rs1,
                                           size_t vl);
vuint8m1_t __riscv_vslide1up_vx_u8m1_tum(vbool8_t vm, vuint8m1_t vd,
                                         vuint8m1_t vs2, uint8_t rs1,
                                         size_t vl);
vuint8m2_t __riscv_vslide1up_vx_u8m2_tum(vbool4_t vm, vuint8m2_t vd,
                                         vuint8m2_t vs2, uint8_t rs1,
                                         size_t vl);
vuint8m4_t __riscv_vslide1up_vx_u8m4_tum(vbool2_t vm, vuint8m4_t vd,
                                         vuint8m4_t vs2, uint8_t rs1,
                                         size_t vl);
vuint8m8_t __riscv_vslide1up_vx_u8m8_tum(vbool1_t vm, vuint8m8_t vd,
                                         vuint8m8_t vs2, uint8_t rs1,
                                         size_t vl);
vuint16mf4_t __riscv_vslide1up_vx_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                             vuint16mf4_t vs2, uint16_t rs1,
                                             size_t vl);
vuint16mf2_t __riscv_vslide1up_vx_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                             vuint16mf2_t vs2, uint16_t rs1,
                                             size_t vl);
vuint16m1_t __riscv_vslide1up_vx_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                           vuint16m1_t vs2, uint16_t rs1,
                                           size_t vl);
vuint16m2_t __riscv_vslide1up_vx_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                           vuint16m2_t vs2, uint16_t rs1,
                                           size_t vl);
vuint16m4_t __riscv_vslide1up_vx_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                           vuint16m4_t vs2, uint16_t rs1,
                                           size_t vl);
vuint16m8_t __riscv_vslide1up_vx_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                           vuint16m8_t vs2, uint16_t rs1,
                                           size_t vl);
vuint32mf2_t __riscv_vslide1up_vx_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                             vuint32mf2_t vs2, uint32_t rs1,
                                             size_t vl);
vuint32m1_t __riscv_vslide1up_vx_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                           vuint32m1_t vs2, uint32_t rs1,
                                           size_t vl);
vuint32m2_t __riscv_vslide1up_vx_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                           vuint32m2_t vs2, uint32_t rs1,
                                           size_t vl);
vuint32m4_t __riscv_vslide1up_vx_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                           vuint32m4_t vs2, uint32_t rs1,
                                           size_t vl);
vuint32m8_t __riscv_vslide1up_vx_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                           vuint32m8_t vs2, uint32_t rs1,
                                           size_t vl);
vuint64m1_t __riscv_vslide1up_vx_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                           vuint64m1_t vs2, uint64_t rs1,
                                           size_t vl);
vuint64m2_t __riscv_vslide1up_vx_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                           vuint64m2_t vs2, uint64_t rs1,
                                           size_t vl);
vuint64m4_t __riscv_vslide1up_vx_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                           vuint64m4_t vs2, uint64_t rs1,
                                           size_t vl);
vuint64m8_t __riscv_vslide1up_vx_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                           vuint64m8_t vs2, uint64_t rs1,
                                           size_t vl);
vuint8mf8_t __riscv_vslide1down_vx_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                             vuint8mf8_t vs2, uint8_t rs1,
                                             size_t vl);
vuint8mf4_t __riscv_vslide1down_vx_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                             vuint8mf4_t vs2, uint8_t rs1,
                                             size_t vl);
vuint8mf2_t __riscv_vslide1down_vx_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                             vuint8mf2_t vs2, uint8_t rs1,
                                             size_t vl);
vuint8m1_t __riscv_vslide1down_vx_u8m1_tum(vbool8_t vm, vuint8m1_t vd,
                                           vuint8m1_t vs2, uint8_t rs1,
                                           size_t vl);
vuint8m2_t __riscv_vslide1down_vx_u8m2_tum(vbool4_t vm, vuint8m2_t vd,
                                           vuint8m2_t vs2, uint8_t rs1,
                                           size_t vl);
vuint8m4_t __riscv_vslide1down_vx_u8m4_tum(vbool2_t vm, vuint8m4_t vd,
                                           vuint8m4_t vs2, uint8_t rs1,
                                           size_t vl);
vuint8m8_t __riscv_vslide1down_vx_u8m8_tum(vbool1_t vm, vuint8m8_t vd,
                                           vuint8m8_t vs2, uint8_t rs1,
                                           size_t vl);
vuint16mf4_t __riscv_vslide1down_vx_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                               vuint16mf4_t vs2, uint16_t rs1,
                                               size_t vl);
vuint16mf2_t __riscv_vslide1down_vx_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                               vuint16mf2_t vs2, uint16_t rs1,
                                               size_t vl);
vuint16m1_t __riscv_vslide1down_vx_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                             vuint16m1_t vs2, uint16_t rs1,
                                             size_t vl);
vuint16m2_t __riscv_vslide1down_vx_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                             vuint16m2_t vs2, uint16_t rs1,
                                             size_t vl);
vuint16m4_t __riscv_vslide1down_vx_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                             vuint16m4_t vs2, uint16_t rs1,
                                             size_t vl);
vuint16m8_t __riscv_vslide1down_vx_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                             vuint16m8_t vs2, uint16_t rs1,
                                             size_t vl);
vuint32mf2_t __riscv_vslide1down_vx_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                               vuint32mf2_t vs2, uint32_t rs1,
                                               size_t vl);
vuint32m1_t __riscv_vslide1down_vx_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                             vuint32m1_t vs2, uint32_t rs1,
                                             size_t vl);
vuint32m2_t __riscv_vslide1down_vx_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                             vuint32m2_t vs2, uint32_t rs1,
                                             size_t vl);
vuint32m4_t __riscv_vslide1down_vx_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                             vuint32m4_t vs2, uint32_t rs1,
                                             size_t vl);
vuint32m8_t __riscv_vslide1down_vx_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                             vuint32m8_t vs2, uint32_t rs1,
                                             size_t vl);
vuint64m1_t __riscv_vslide1down_vx_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                             vuint64m1_t vs2, uint64_t rs1,
                                             size_t vl);
vuint64m2_t __riscv_vslide1down_vx_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                             vuint64m2_t vs2, uint64_t rs1,
                                             size_t vl);
vuint64m4_t __riscv_vslide1down_vx_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                             vuint64m4_t vs2, uint64_t rs1,
                                             size_t vl);
vuint64m8_t __riscv_vslide1down_vx_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                             vuint64m8_t vs2, uint64_t rs1,
                                             size_t vl);
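
A common use of the paired slides above is neighbour access: one slide1up and one slide1down yield each element's left and right neighbours, with scalars carried in at the vector boundaries. A minimal sketch under the _tum policy, assuming <riscv_vector.h> (the function name neighbours_i32m1 and its parameters are illustrative, not part of the API):

#include <riscv_vector.h>
#include <stdint.h>

// Illustrative sketch: gather each active element's neighbours.
// up[i]   = vs2[i-1] for active 0 < i < vl; up[0] = left_in if active.
// down[i] = vs2[i+1] for active i < vl-1; down[vl-1] = right_in if active.
// Under _tum, tail elements of both results keep the contents of vd,
// and masked-off elements are mask-agnostic.
void neighbours_i32m1(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                      int32_t left_in, int32_t right_in, size_t vl,
                      vint32m1_t *up, vint32m1_t *down) {
  *up   = __riscv_vslide1up_vx_i32m1_tum(vm, vd, vs2, left_in, vl);
  *down = __riscv_vslide1down_vx_i32m1_tum(vm, vd, vs2, right_in, vl);
}
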
// masked functions (tail undisturbed, mask undisturbed: _tumu)
vfloat16mf4_t __riscv_vfslide1up_vf_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                                vfloat16mf4_t vs2, _Float16 rs1,
                                                size_t vl);
vfloat16mf2_t __riscv_vfslide1up_vf_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                                vfloat16mf2_t vs2, _Float16 rs1,
                                                size_t vl);
vfloat16m1_t __riscv_vfslide1up_vf_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                              vfloat16m1_t vs2, _Float16 rs1,
                                              size_t vl);
vfloat16m2_t __riscv_vfslide1up_vf_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                              vfloat16m2_t vs2, _Float16 rs1,
                                              size_t vl);
vfloat16m4_t __riscv_vfslide1up_vf_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                              vfloat16m4_t vs2, _Float16 rs1,
                                              size_t vl);
vfloat16m8_t __riscv_vfslide1up_vf_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                              vfloat16m8_t vs2, _Float16 rs1,
                                              size_t vl);
vfloat32mf2_t __riscv_vfslide1up_vf_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                                vfloat32mf2_t vs2, float rs1,
                                                size_t vl);
vfloat32m1_t __riscv_vfslide1up_vf_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                              vfloat32m1_t vs2, float rs1,
                                              size_t vl);
vfloat32m2_t __riscv_vfslide1up_vf_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                              vfloat32m2_t vs2, float rs1,
                                              size_t vl);
vfloat32m4_t __riscv_vfslide1up_vf_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                              vfloat32m4_t vs2, float rs1,
                                              size_t vl);
vfloat32m8_t __riscv_vfslide1up_vf_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                              vfloat32m8_t vs2, float rs1,
                                              size_t vl);
vfloat64m1_t __riscv_vfslide1up_vf_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                              vfloat64m1_t vs2, double rs1,
                                              size_t vl);
vfloat64m2_t __riscv_vfslide1up_vf_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                              vfloat64m2_t vs2, double rs1,
                                              size_t vl);
vfloat64m4_t __riscv_vfslide1up_vf_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                              vfloat64m4_t vs2, double rs1,
                                              size_t vl);
vfloat64m8_t __riscv_vfslide1up_vf_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                              vfloat64m8_t vs2, double rs1,
                                              size_t vl);
vfloat16mf4_t __riscv_vfslide1down_vf_f16mf4_tumu(vbool64_t vm,
                                                  vfloat16mf4_t vd,
                                                  vfloat16mf4_t vs2,
                                                  _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfslide1down_vf_f16mf2_tumu(vbool32_t vm,
                                                  vfloat16mf2_t vd,
                                                  vfloat16mf2_t vs2,
                                                  _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfslide1down_vf_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                                vfloat16m1_t vs2, _Float16 rs1,
                                                size_t vl);
vfloat16m2_t __riscv_vfslide1down_vf_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                                vfloat16m2_t vs2, _Float16 rs1,
                                                size_t vl);
vfloat16m4_t __riscv_vfslide1down_vf_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                                vfloat16m4_t vs2, _Float16 rs1,
                                                size_t vl);
vfloat16m8_t __riscv_vfslide1down_vf_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                                vfloat16m8_t vs2, _Float16 rs1,
                                                size_t vl);
vfloat32mf2_t __riscv_vfslide1down_vf_f32mf2_tumu(vbool64_t vm,
                                                  vfloat32mf2_t vd,
                                                  vfloat32mf2_t vs2, float rs1,
                                                  size_t vl);
vfloat32m1_t __riscv_vfslide1down_vf_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                                vfloat32m1_t vs2, float rs1,
                                                size_t vl);
vfloat32m2_t __riscv_vfslide1down_vf_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                                vfloat32m2_t vs2, float rs1,
                                                size_t vl);
vfloat32m4_t __riscv_vfslide1down_vf_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                                vfloat32m4_t vs2, float rs1,
                                                size_t vl);
vfloat32m8_t __riscv_vfslide1down_vf_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                                vfloat32m8_t vs2, float rs1,
                                                size_t vl);
vfloat64m1_t __riscv_vfslide1down_vf_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                                vfloat64m1_t vs2, double rs1,
                                                size_t vl);
vfloat64m2_t __riscv_vfslide1down_vf_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                                vfloat64m2_t vs2, double rs1,
                                                size_t vl);
vfloat64m4_t __riscv_vfslide1down_vf_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                                vfloat64m4_t vs2, double rs1,
                                                size_t vl);
vfloat64m8_t __riscv_vfslide1down_vf_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                                vfloat64m8_t vs2, double rs1,
                                                size_t vl);
vint8mf8_t __riscv_vslide1up_vx_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                           vint8mf8_t vs2, int8_t rs1,
                                           size_t vl);
vint8mf4_t __riscv_vslide1up_vx_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                           vint8mf4_t vs2, int8_t rs1,
                                           size_t vl);
vint8mf2_t __riscv_vslide1up_vx_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                           vint8mf2_t vs2, int8_t rs1,
                                           size_t vl);
vint8m1_t __riscv_vslide1up_vx_i8m1_tumu(vbool8_t vm, vint8m1_t vd,
                                         vint8m1_t vs2, int8_t rs1, size_t vl);
vint8m2_t __riscv_vslide1up_vx_i8m2_tumu(vbool4_t vm, vint8m2_t vd,
                                         vint8m2_t vs2, int8_t rs1, size_t vl);
vint8m4_t __riscv_vslide1up_vx_i8m4_tumu(vbool2_t vm, vint8m4_t vd,
                                         vint8m4_t vs2, int8_t rs1, size_t vl);
vint8m8_t __riscv_vslide1up_vx_i8m8_tumu(vbool1_t vm, vint8m8_t vd,
                                         vint8m8_t vs2, int8_t rs1, size_t vl);
vint16mf4_t __riscv_vslide1up_vx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                             vint16mf4_t vs2, int16_t rs1,
                                             size_t vl);
vint16mf2_t __riscv_vslide1up_vx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                             vint16mf2_t vs2, int16_t rs1,
                                             size_t vl);
vint16m1_t __riscv_vslide1up_vx_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                           vint16m1_t vs2, int16_t rs1,
                                           size_t vl);
vint16m2_t __riscv_vslide1up_vx_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                           vint16m2_t vs2, int16_t rs1,
                                           size_t vl);
vint16m4_t __riscv_vslide1up_vx_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                           vint16m4_t vs2, int16_t rs1,
                                           size_t vl);
vint16m8_t __riscv_vslide1up_vx_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                           vint16m8_t vs2, int16_t rs1,
                                           size_t vl);
vint32mf2_t __riscv_vslide1up_vx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                             vint32mf2_t vs2, int32_t rs1,
                                             size_t vl);
vint32m1_t __riscv_vslide1up_vx_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                           vint32m1_t vs2, int32_t rs1,
                                           size_t vl);
vint32m2_t __riscv_vslide1up_vx_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                           vint32m2_t vs2, int32_t rs1,
                                           size_t vl);
vint32m4_t __riscv_vslide1up_vx_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                           vint32m4_t vs2, int32_t rs1,
                                           size_t vl);
vint32m8_t __riscv_vslide1up_vx_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                           vint32m8_t vs2, int32_t rs1,
                                           size_t vl);
vint64m1_t __riscv_vslide1up_vx_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                           vint64m1_t vs2, int64_t rs1,
                                           size_t vl);
vint64m2_t __riscv_vslide1up_vx_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                           vint64m2_t vs2, int64_t rs1,
                                           size_t vl);
vint64m4_t __riscv_vslide1up_vx_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                           vint64m4_t vs2, int64_t rs1,
                                           size_t vl);
vint64m8_t __riscv_vslide1up_vx_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                           vint64m8_t vs2, int64_t rs1,
                                           size_t vl);
vint8mf8_t __riscv_vslide1down_vx_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                             vint8mf8_t vs2, int8_t rs1,
                                             size_t vl);
vint8mf4_t __riscv_vslide1down_vx_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                             vint8mf4_t vs2, int8_t rs1,
                                             size_t vl);
vint8mf2_t __riscv_vslide1down_vx_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                             vint8mf2_t vs2, int8_t rs1,
                                             size_t vl);
vint8m1_t __riscv_vslide1down_vx_i8m1_tumu(vbool8_t vm, vint8m1_t vd,
                                           vint8m1_t vs2, int8_t rs1,
                                           size_t vl);
vint8m2_t __riscv_vslide1down_vx_i8m2_tumu(vbool4_t vm, vint8m2_t vd,
                                           vint8m2_t vs2, int8_t rs1,
                                           size_t vl);
vint8m4_t __riscv_vslide1down_vx_i8m4_tumu(vbool2_t vm, vint8m4_t vd,
                                           vint8m4_t vs2, int8_t rs1,
                                           size_t vl);
vint8m8_t __riscv_vslide1down_vx_i8m8_tumu(vbool1_t vm, vint8m8_t vd,
                                           vint8m8_t vs2, int8_t rs1,
                                           size_t vl);
vint16mf4_t __riscv_vslide1down_vx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                               vint16mf4_t vs2, int16_t rs1,
                                               size_t vl);
vint16mf2_t __riscv_vslide1down_vx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                               vint16mf2_t vs2, int16_t rs1,
                                               size_t vl);
vint16m1_t __riscv_vslide1down_vx_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                             vint16m1_t vs2, int16_t rs1,
                                             size_t vl);
vint16m2_t __riscv_vslide1down_vx_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                             vint16m2_t vs2, int16_t rs1,
                                             size_t vl);
vint16m4_t __riscv_vslide1down_vx_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                             vint16m4_t vs2, int16_t rs1,
                                             size_t vl);
vint16m8_t __riscv_vslide1down_vx_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                             vint16m8_t vs2, int16_t rs1,
                                             size_t vl);
vint32mf2_t __riscv_vslide1down_vx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                               vint32mf2_t vs2, int32_t rs1,
                                               size_t vl);
vint32m1_t __riscv_vslide1down_vx_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                             vint32m1_t vs2, int32_t rs1,
                                             size_t vl);
vint32m2_t __riscv_vslide1down_vx_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                             vint32m2_t vs2, int32_t rs1,
                                             size_t vl);
vint32m4_t __riscv_vslide1down_vx_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                             vint32m4_t vs2, int32_t rs1,
                                             size_t vl);
vint32m8_t __riscv_vslide1down_vx_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                             vint32m8_t vs2, int32_t rs1,
                                             size_t vl);
vint64m1_t __riscv_vslide1down_vx_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                             vint64m1_t vs2, int64_t rs1,
                                             size_t vl);
vint64m2_t __riscv_vslide1down_vx_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                             vint64m2_t vs2, int64_t rs1,
                                             size_t vl);
vint64m4_t __riscv_vslide1down_vx_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                             vint64m4_t vs2, int64_t rs1,
                                             size_t vl);
vint64m8_t __riscv_vslide1down_vx_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                             vint64m8_t vs2, int64_t rs1,
                                             size_t vl);
vuint8mf8_t __riscv_vslide1up_vx_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                            vuint8mf8_t vs2, uint8_t rs1,
                                            size_t vl);
vuint8mf4_t __riscv_vslide1up_vx_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                            vuint8mf4_t vs2, uint8_t rs1,
                                            size_t vl);
vuint8mf2_t __riscv_vslide1up_vx_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                            vuint8mf2_t vs2, uint8_t rs1,
                                            size_t vl);
vuint8m1_t __riscv_vslide1up_vx_u8m1_tumu(vbool8_t vm, vuint8m1_t vd,
                                          vuint8m1_t vs2, uint8_t rs1,
                                          size_t vl);
vuint8m2_t __riscv_vslide1up_vx_u8m2_tumu(vbool4_t vm, vuint8m2_t vd,
                                          vuint8m2_t vs2, uint8_t rs1,
                                          size_t vl);
vuint8m4_t __riscv_vslide1up_vx_u8m4_tumu(vbool2_t vm, vuint8m4_t vd,
                                          vuint8m4_t vs2, uint8_t rs1,
                                          size_t vl);
vuint8m8_t __riscv_vslide1up_vx_u8m8_tumu(vbool1_t vm, vuint8m8_t vd,
                                          vuint8m8_t vs2, uint8_t rs1,
                                          size_t vl);
vuint16mf4_t __riscv_vslide1up_vx_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                              vuint16mf4_t vs2, uint16_t rs1,
                                              size_t vl);
vuint16mf2_t __riscv_vslide1up_vx_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                              vuint16mf2_t vs2, uint16_t rs1,
                                              size_t vl);
vuint16m1_t __riscv_vslide1up_vx_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                            vuint16m1_t vs2, uint16_t rs1,
                                            size_t vl);
vuint16m2_t __riscv_vslide1up_vx_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                            vuint16m2_t vs2, uint16_t rs1,
                                            size_t vl);
vuint16m4_t __riscv_vslide1up_vx_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                            vuint16m4_t vs2, uint16_t rs1,
                                            size_t vl);
vuint16m8_t __riscv_vslide1up_vx_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                            vuint16m8_t vs2, uint16_t rs1,
                                            size_t vl);
vuint32mf2_t __riscv_vslide1up_vx_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                              vuint32mf2_t vs2, uint32_t rs1,
                                              size_t vl);
vuint32m1_t __riscv_vslide1up_vx_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                            vuint32m1_t vs2, uint32_t rs1,
                                            size_t vl);
vuint32m2_t __riscv_vslide1up_vx_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                            vuint32m2_t vs2, uint32_t rs1,
                                            size_t vl);
vuint32m4_t __riscv_vslide1up_vx_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                            vuint32m4_t vs2, uint32_t rs1,
                                            size_t vl);
vuint32m8_t __riscv_vslide1up_vx_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                            vuint32m8_t vs2, uint32_t rs1,
                                            size_t vl);
vuint64m1_t __riscv_vslide1up_vx_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                            vuint64m1_t vs2, uint64_t rs1,
                                            size_t vl);
vuint64m2_t __riscv_vslide1up_vx_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                            vuint64m2_t vs2, uint64_t rs1,
                                            size_t vl);
vuint64m4_t __riscv_vslide1up_vx_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                            vuint64m4_t vs2, uint64_t rs1,
                                            size_t vl);
vuint64m8_t __riscv_vslide1up_vx_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                            vuint64m8_t vs2, uint64_t rs1,
                                            size_t vl);
vuint8mf8_t __riscv_vslide1down_vx_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                              vuint8mf8_t vs2, uint8_t rs1,
                                              size_t vl);
vuint8mf4_t __riscv_vslide1down_vx_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                              vuint8mf4_t vs2, uint8_t rs1,
                                              size_t vl);
vuint8mf2_t __riscv_vslide1down_vx_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                              vuint8mf2_t vs2, uint8_t rs1,
                                              size_t vl);
vuint8m1_t __riscv_vslide1down_vx_u8m1_tumu(vbool8_t vm, vuint8m1_t vd,
                                            vuint8m1_t vs2, uint8_t rs1,
                                            size_t vl);
vuint8m2_t __riscv_vslide1down_vx_u8m2_tumu(vbool4_t vm, vuint8m2_t vd,
                                            vuint8m2_t vs2, uint8_t rs1,
                                            size_t vl);
vuint8m4_t __riscv_vslide1down_vx_u8m4_tumu(vbool2_t vm, vuint8m4_t vd,
                                            vuint8m4_t vs2, uint8_t rs1,
                                            size_t vl);
vuint8m8_t __riscv_vslide1down_vx_u8m8_tumu(vbool1_t vm, vuint8m8_t vd,
                                            vuint8m8_t vs2, uint8_t rs1,
                                            size_t vl);
vuint16mf4_t __riscv_vslide1down_vx_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                                vuint16mf4_t vs2, uint16_t rs1,
                                                size_t vl);
vuint16mf2_t __riscv_vslide1down_vx_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                                vuint16mf2_t vs2, uint16_t rs1,
                                                size_t vl);
vuint16m1_t __riscv_vslide1down_vx_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                              vuint16m1_t vs2, uint16_t rs1,
                                              size_t vl);
vuint16m2_t __riscv_vslide1down_vx_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                              vuint16m2_t vs2, uint16_t rs1,
                                              size_t vl);
vuint16m4_t __riscv_vslide1down_vx_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                              vuint16m4_t vs2, uint16_t rs1,
                                              size_t vl);
vuint16m8_t __riscv_vslide1down_vx_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                              vuint16m8_t vs2, uint16_t rs1,
                                              size_t vl);
vuint32mf2_t __riscv_vslide1down_vx_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                                vuint32mf2_t vs2, uint32_t rs1,
                                                size_t vl);
vuint32m1_t __riscv_vslide1down_vx_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                              vuint32m1_t vs2, uint32_t rs1,
                                              size_t vl);
vuint32m2_t __riscv_vslide1down_vx_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                              vuint32m2_t vs2, uint32_t rs1,
                                              size_t vl);
vuint32m4_t __riscv_vslide1down_vx_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                              vuint32m4_t vs2, uint32_t rs1,
                                              size_t vl);
vuint32m8_t __riscv_vslide1down_vx_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                              vuint32m8_t vs2, uint32_t rs1,
                                              size_t vl);
vuint64m1_t __riscv_vslide1down_vx_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                              vuint64m1_t vs2, uint64_t rs1,
                                              size_t vl);
vuint64m2_t __riscv_vslide1down_vx_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                              vuint64m2_t vs2, uint64_t rs1,
                                              size_t vl);
vuint64m4_t __riscv_vslide1down_vx_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                              vuint64m4_t vs2, uint64_t rs1,
                                              size_t vl);
vuint64m8_t __riscv_vslide1down_vx_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                              vuint64m8_t vs2, uint64_t rs1,
                                              size_t vl);
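
Unlike _tum, the _tumu variants above also keep masked-off elements from vd, so a slide rewrites only the active body of the register. A minimal sketch, assuming <riscv_vector.h> (the name merge_shift is illustrative, not part of the API):

#include <riscv_vector.h>
#include <stdint.h>

// Illustrative sketch: slide the active elements of vs2 up by one,
// feeding `carry_in` at index 0 if active.  Under the _tumu policy,
// both tail elements and masked-off elements keep their values from
// vd, so inactive lanes of the destination are preserved exactly.
vuint16m1_t merge_shift(vbool16_t vm, vuint16m1_t vd, vuint16m1_t vs2,
                        uint16_t carry_in, size_t vl) {
  return __riscv_vslide1up_vx_u16m1_tumu(vm, vd, vs2, carry_in, vl);
}
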
// masked functions (tail agnostic, mask undisturbed: _mu)
vfloat16mf4_t __riscv_vfslide1up_vf_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                              vfloat16mf4_t vs2, _Float16 rs1,
                                              size_t vl);
vfloat16mf2_t __riscv_vfslide1up_vf_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                              vfloat16mf2_t vs2, _Float16 rs1,
                                              size_t vl);
vfloat16m1_t __riscv_vfslide1up_vf_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                            vfloat16m1_t vs2, _Float16 rs1,
                                            size_t vl);
vfloat16m2_t __riscv_vfslide1up_vf_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                            vfloat16m2_t vs2, _Float16 rs1,
                                            size_t vl);
vfloat16m4_t __riscv_vfslide1up_vf_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                            vfloat16m4_t vs2, _Float16 rs1,
                                            size_t vl);
vfloat16m8_t __riscv_vfslide1up_vf_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                            vfloat16m8_t vs2, _Float16 rs1,
                                            size_t vl);
vfloat32mf2_t __riscv_vfslide1up_vf_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat32mf2_t vs2, float rs1,
                                              size_t vl);
vfloat32m1_t __riscv_vfslide1up_vf_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat32m1_t vs2, float rs1,
                                            size_t vl);
vfloat32m2_t __riscv_vfslide1up_vf_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat32m2_t vs2, float rs1,
                                            size_t vl);
vfloat32m4_t __riscv_vfslide1up_vf_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat32m4_t vs2, float rs1,
                                            size_t vl);
vfloat32m8_t __riscv_vfslide1up_vf_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat32m8_t vs2, float rs1,
                                            size_t vl);
vfloat64m1_t __riscv_vfslide1up_vf_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat64m1_t vs2, double rs1,
                                            size_t vl);
vfloat64m2_t __riscv_vfslide1up_vf_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat64m2_t vs2, double rs1,
                                            size_t vl);
vfloat64m4_t __riscv_vfslide1up_vf_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat64m4_t vs2, double rs1,
                                            size_t vl);
vfloat64m8_t __riscv_vfslide1up_vf_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat64m8_t vs2, double rs1,
                                            size_t vl);
vfloat16mf4_t __riscv_vfslide1down_vf_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                                vfloat16mf4_t vs2, _Float16 rs1,
                                                size_t vl);
vfloat16mf2_t __riscv_vfslide1down_vf_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                                vfloat16mf2_t vs2, _Float16 rs1,
                                                size_t vl);
vfloat16m1_t __riscv_vfslide1down_vf_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                              vfloat16m1_t vs2, _Float16 rs1,
                                              size_t vl);
vfloat16m2_t __riscv_vfslide1down_vf_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                              vfloat16m2_t vs2, _Float16 rs1,
                                              size_t vl);
vfloat16m4_t __riscv_vfslide1down_vf_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                              vfloat16m4_t vs2, _Float16 rs1,
                                              size_t vl);
vfloat16m8_t __riscv_vfslide1down_vf_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                              vfloat16m8_t vs2, _Float16 rs1,
                                              size_t vl);
vfloat32mf2_t __riscv_vfslide1down_vf_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                                vfloat32mf2_t vs2, float rs1,
                                                size_t vl);
vfloat32m1_t __riscv_vfslide1down_vf_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                              vfloat32m1_t vs2, float rs1,
                                              size_t vl);
vfloat32m2_t __riscv_vfslide1down_vf_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                              vfloat32m2_t vs2, float rs1,
                                              size_t vl);
vfloat32m4_t __riscv_vfslide1down_vf_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                              vfloat32m4_t vs2, float rs1,
                                              size_t vl);
vfloat32m8_t __riscv_vfslide1down_vf_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                              vfloat32m8_t vs2, float rs1,
                                              size_t vl);
vfloat64m1_t __riscv_vfslide1down_vf_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                              vfloat64m1_t vs2, double rs1,
                                              size_t vl);
vfloat64m2_t __riscv_vfslide1down_vf_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                              vfloat64m2_t vs2, double rs1,
                                              size_t vl);
vfloat64m4_t __riscv_vfslide1down_vf_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                              vfloat64m4_t vs2, double rs1,
                                              size_t vl);
vfloat64m8_t __riscv_vfslide1down_vf_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                              vfloat64m8_t vs2, double rs1,
                                              size_t vl);
vint8mf8_t __riscv_vslide1up_vx_i8mf8_mu(vbool64_t vm, vint8mf8_t vd,
                                         vint8mf8_t vs2, int8_t rs1, size_t vl);
vint8mf4_t __riscv_vslide1up_vx_i8mf4_mu(vbool32_t vm, vint8mf4_t vd,
                                         vint8mf4_t vs2, int8_t rs1, size_t vl);
vint8mf2_t __riscv_vslide1up_vx_i8mf2_mu(vbool16_t vm, vint8mf2_t vd,
                                         vint8mf2_t vs2, int8_t rs1, size_t vl);
vint8m1_t __riscv_vslide1up_vx_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                       int8_t rs1, size_t vl);
vint8m2_t __riscv_vslide1up_vx_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                       int8_t rs1, size_t vl);
vint8m4_t __riscv_vslide1up_vx_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                       int8_t rs1, size_t vl);
vint8m8_t __riscv_vslide1up_vx_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                       int8_t rs1, size_t vl);
vint16mf4_t __riscv_vslide1up_vx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                           vint16mf4_t vs2, int16_t rs1,
                                           size_t vl);
vint16mf2_t __riscv_vslide1up_vx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                           vint16mf2_t vs2, int16_t rs1,
                                           size_t vl);
vint16m1_t __riscv_vslide1up_vx_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                         vint16m1_t vs2, int16_t rs1,
                                         size_t vl);
vint16m2_t __riscv_vslide1up_vx_i16m2_mu(vbool8_t vm, vint16m2_t vd,
                                         vint16m2_t vs2, int16_t rs1,
                                         size_t vl);
vint16m4_t __riscv_vslide1up_vx_i16m4_mu(vbool4_t vm, vint16m4_t vd,
                                         vint16m4_t vs2, int16_t rs1,
                                         size_t vl);
vint16m8_t __riscv_vslide1up_vx_i16m8_mu(vbool2_t vm, vint16m8_t vd,
                                         vint16m8_t vs2, int16_t rs1,
                                         size_t vl);
vint32mf2_t __riscv_vslide1up_vx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                           vint32mf2_t vs2, int32_t rs1,
                                           size_t vl);
vint32m1_t __riscv_vslide1up_vx_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                         vint32m1_t vs2, int32_t rs1,
                                         size_t vl);
vint32m2_t __riscv_vslide1up_vx_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                         vint32m2_t vs2, int32_t rs1,
                                         size_t vl);
vint32m4_t __riscv_vslide1up_vx_i32m4_mu(vbool8_t vm, vint32m4_t vd,
                                         vint32m4_t vs2, int32_t rs1,
                                         size_t vl);
vint32m8_t __riscv_vslide1up_vx_i32m8_mu(vbool4_t vm, vint32m8_t vd,
                                         vint32m8_t vs2, int32_t rs1,
                                         size_t vl);
vint64m1_t __riscv_vslide1up_vx_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                         vint64m1_t vs2, int64_t rs1,
                                         size_t vl);
vint64m2_t __riscv_vslide1up_vx_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                         vint64m2_t vs2, int64_t rs1,
                                         size_t vl);
vint64m4_t __riscv_vslide1up_vx_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                         vint64m4_t vs2, int64_t rs1,
                                         size_t vl);
vint64m8_t __riscv_vslide1up_vx_i64m8_mu(vbool8_t vm, vint64m8_t vd,
                                         vint64m8_t vs2, int64_t rs1,
                                         size_t vl);
vint8mf8_t __riscv_vslide1down_vx_i8mf8_mu(vbool64_t vm, vint8mf8_t vd,
                                           vint8mf8_t vs2, int8_t rs1,
                                           size_t vl);
vint8mf4_t __riscv_vslide1down_vx_i8mf4_mu(vbool32_t vm, vint8mf4_t vd,
                                           vint8mf4_t vs2, int8_t rs1,
                                           size_t vl);
vint8mf2_t __riscv_vslide1down_vx_i8mf2_mu(vbool16_t vm, vint8mf2_t vd,
                                           vint8mf2_t vs2, int8_t rs1,
                                           size_t vl);
vint8m1_t __riscv_vslide1down_vx_i8m1_mu(vbool8_t vm, vint8m1_t vd,
                                         vint8m1_t vs2, int8_t rs1, size_t vl);
vint8m2_t __riscv_vslide1down_vx_i8m2_mu(vbool4_t vm, vint8m2_t vd,
                                         vint8m2_t vs2, int8_t rs1, size_t vl);
vint8m4_t __riscv_vslide1down_vx_i8m4_mu(vbool2_t vm, vint8m4_t vd,
                                         vint8m4_t vs2, int8_t rs1, size_t vl);
vint8m8_t __riscv_vslide1down_vx_i8m8_mu(vbool1_t vm, vint8m8_t vd,
                                         vint8m8_t vs2, int8_t rs1, size_t vl);
vint16mf4_t __riscv_vslide1down_vx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                             vint16mf4_t vs2, int16_t rs1,
                                             size_t vl);
vint16mf2_t __riscv_vslide1down_vx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                             vint16mf2_t vs2, int16_t rs1,
                                             size_t vl);
vint16m1_t __riscv_vslide1down_vx_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                           vint16m1_t vs2, int16_t rs1,
                                           size_t vl);
vint16m2_t __riscv_vslide1down_vx_i16m2_mu(vbool8_t vm, vint16m2_t vd,
                                           vint16m2_t vs2, int16_t rs1,
                                           size_t vl);
vint16m4_t __riscv_vslide1down_vx_i16m4_mu(vbool4_t vm, vint16m4_t vd,
                                           vint16m4_t vs2, int16_t rs1,
                                           size_t vl);
vint16m8_t __riscv_vslide1down_vx_i16m8_mu(vbool2_t vm, vint16m8_t vd,
                                           vint16m8_t vs2, int16_t rs1,
                                           size_t vl);
vint32mf2_t __riscv_vslide1down_vx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                             vint32mf2_t vs2, int32_t rs1,
                                             size_t vl);
vint32m1_t __riscv_vslide1down_vx_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                           vint32m1_t vs2, int32_t rs1,
                                           size_t vl);
vint32m2_t __riscv_vslide1down_vx_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                           vint32m2_t vs2, int32_t rs1,
                                           size_t vl);
vint32m4_t __riscv_vslide1down_vx_i32m4_mu(vbool8_t vm, vint32m4_t vd,
                                           vint32m4_t vs2, int32_t rs1,
                                           size_t vl);
vint32m8_t __riscv_vslide1down_vx_i32m8_mu(vbool4_t vm, vint32m8_t vd,
                                           vint32m8_t vs2, int32_t rs1,
                                           size_t vl);
vint64m1_t __riscv_vslide1down_vx_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                           vint64m1_t vs2, int64_t rs1,
                                           size_t vl);
vint64m2_t __riscv_vslide1down_vx_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                           vint64m2_t vs2, int64_t rs1,
                                           size_t vl);
vint64m4_t __riscv_vslide1down_vx_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                           vint64m4_t vs2, int64_t rs1,
                                           size_t vl);
vint64m8_t __riscv_vslide1down_vx_i64m8_mu(vbool8_t vm, vint64m8_t vd,
                                           vint64m8_t vs2, int64_t rs1,
                                           size_t vl);
vuint8mf8_t __riscv_vslide1up_vx_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                          vuint8mf8_t vs2, uint8_t rs1,
                                          size_t vl);
vuint8mf4_t __riscv_vslide1up_vx_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                          vuint8mf4_t vs2, uint8_t rs1,
                                          size_t vl);
vuint8mf2_t __riscv_vslide1up_vx_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                          vuint8mf2_t vs2, uint8_t rs1,
                                          size_t vl);
vuint8m1_t __riscv_vslide1up_vx_u8m1_mu(vbool8_t vm, vuint8m1_t vd,
                                        vuint8m1_t vs2, uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vslide1up_vx_u8m2_mu(vbool4_t vm, vuint8m2_t vd,
                                        vuint8m2_t vs2, uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vslide1up_vx_u8m4_mu(vbool2_t vm, vuint8m4_t vd,
                                        vuint8m4_t vs2, uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vslide1up_vx_u8m8_mu(vbool1_t vm, vuint8m8_t vd,
                                        vuint8m8_t vs2, uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vslide1up_vx_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                            vuint16mf4_t vs2, uint16_t rs1,
                                            size_t vl);
vuint16mf2_t __riscv_vslide1up_vx_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                            vuint16mf2_t vs2, uint16_t rs1,
                                            size_t vl);
vuint16m1_t __riscv_vslide1up_vx_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                          vuint16m1_t vs2, uint16_t rs1,
                                          size_t vl);
vuint16m2_t __riscv_vslide1up_vx_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                          vuint16m2_t vs2, uint16_t rs1,
                                          size_t vl);
vuint16m4_t __riscv_vslide1up_vx_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                          vuint16m4_t vs2, uint16_t rs1,
                                          size_t vl);
vuint16m8_t __riscv_vslide1up_vx_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                          vuint16m8_t vs2, uint16_t rs1,
                                          size_t vl);
vuint32mf2_t __riscv_vslide1up_vx_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                            vuint32mf2_t vs2, uint32_t rs1,
                                            size_t vl);
vuint32m1_t __riscv_vslide1up_vx_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                          vuint32m1_t vs2, uint32_t rs1,
                                          size_t vl);
vuint32m2_t __riscv_vslide1up_vx_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                          vuint32m2_t vs2, uint32_t rs1,
                                          size_t vl);
vuint32m4_t __riscv_vslide1up_vx_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                          vuint32m4_t vs2, uint32_t rs1,
                                          size_t vl);
vuint32m8_t __riscv_vslide1up_vx_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                          vuint32m8_t vs2, uint32_t rs1,
                                          size_t vl);
vuint64m1_t __riscv_vslide1up_vx_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                          vuint64m1_t vs2, uint64_t rs1,
                                          size_t vl);
vuint64m2_t __riscv_vslide1up_vx_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                          vuint64m2_t vs2, uint64_t rs1,
                                          size_t vl);
vuint64m4_t __riscv_vslide1up_vx_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                          vuint64m4_t vs2, uint64_t rs1,
                                          size_t vl);
vuint64m8_t __riscv_vslide1up_vx_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                          vuint64m8_t vs2, uint64_t rs1,
                                          size_t vl);
vuint8mf8_t __riscv_vslide1down_vx_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                            vuint8mf8_t vs2, uint8_t rs1,
                                            size_t vl);
vuint8mf4_t __riscv_vslide1down_vx_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                            vuint8mf4_t vs2, uint8_t rs1,
                                            size_t vl);
vuint8mf2_t __riscv_vslide1down_vx_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                            vuint8mf2_t vs2, uint8_t rs1,
                                            size_t vl);
vuint8m1_t __riscv_vslide1down_vx_u8m1_mu(vbool8_t vm, vuint8m1_t vd,
                                          vuint8m1_t vs2, uint8_t rs1,
                                          size_t vl);
vuint8m2_t __riscv_vslide1down_vx_u8m2_mu(vbool4_t vm, vuint8m2_t vd,
                                          vuint8m2_t vs2, uint8_t rs1,
                                          size_t vl);
vuint8m4_t __riscv_vslide1down_vx_u8m4_mu(vbool2_t vm, vuint8m4_t vd,
                                          vuint8m4_t vs2, uint8_t rs1,
                                          size_t vl);
vuint8m8_t __riscv_vslide1down_vx_u8m8_mu(vbool1_t vm, vuint8m8_t vd,
                                          vuint8m8_t vs2, uint8_t rs1,
                                          size_t vl);
vuint16mf4_t __riscv_vslide1down_vx_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                              vuint16mf4_t vs2, uint16_t rs1,
                                              size_t vl);
vuint16mf2_t __riscv_vslide1down_vx_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                              vuint16mf2_t vs2, uint16_t rs1,
                                              size_t vl);
vuint16m1_t __riscv_vslide1down_vx_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                            vuint16m1_t vs2, uint16_t rs1,
                                            size_t vl);
vuint16m2_t __riscv_vslide1down_vx_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                            vuint16m2_t vs2, uint16_t rs1,
                                            size_t vl);
vuint16m4_t __riscv_vslide1down_vx_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                            vuint16m4_t vs2, uint16_t rs1,
                                            size_t vl);
vuint16m8_t __riscv_vslide1down_vx_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                            vuint16m8_t vs2, uint16_t rs1,
                                            size_t vl);
vuint32mf2_t __riscv_vslide1down_vx_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                              vuint32mf2_t vs2, uint32_t rs1,
                                              size_t vl);
vuint32m1_t __riscv_vslide1down_vx_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                            vuint32m1_t vs2, uint32_t rs1,
                                            size_t vl);
vuint32m2_t __riscv_vslide1down_vx_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                            vuint32m2_t vs2, uint32_t rs1,
                                            size_t vl);
vuint32m4_t __riscv_vslide1down_vx_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                            vuint32m4_t vs2, uint32_t rs1,
                                            size_t vl);
vuint32m8_t __riscv_vslide1down_vx_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                            vuint32m8_t vs2, uint32_t rs1,
                                            size_t vl);
vuint64m1_t __riscv_vslide1down_vx_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                            vuint64m1_t vs2, uint64_t rs1,
                                            size_t vl);
vuint64m2_t __riscv_vslide1down_vx_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                            vuint64m2_t vs2, uint64_t rs1,
                                            size_t vl);
vuint64m4_t __riscv_vslide1down_vx_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                            vuint64m4_t vs2, uint64_t rs1,
                                            size_t vl);
vuint64m8_t __riscv_vslide1down_vx_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                            vuint64m8_t vs2, uint64_t rs1,
                                            size_t vl);

Vector Register Gather Intrinsics
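
The gather operations index one vector with another: the _vv forms compute vd[i] = vs2[vs1[i]], while the _vx forms broadcast the single element vs2[vs1] selected by a scalar index. An index at or beyond VLMAX yields zero for that element. The vrgatherei16 variants fix the index element width at 16 bits regardless of the data SEW, which permits 8-bit gathers across more than 256 elements and reduces index register pressure for 32- and 64-bit data. As a small illustration (the helper name and the vid/vrsub idiom are assumptions, built from intrinsics defined elsewhere in this document), the first vl elements of a vector can be reversed with a _tu gather:

#include <riscv_vector.h>

// Reverse the first vl elements of `v`: idx[i] = (vl - 1) - i, so the
// gather reads element vl - 1 - i of `v` into element i. All indices
// stay below VLMAX, so no element reads as zero; tail elements keep
// their values from `vd` under the _tu policy.
vfloat32m1_t reverse_f32(vfloat32m1_t vd, vfloat32m1_t v, size_t vl) {
  vuint32m1_t idx = __riscv_vid_v_u32m1(vl);                 // 0, 1, 2, ...
  idx = __riscv_vrsub_vx_u32m1(idx, (uint32_t)(vl - 1), vl); // (vl-1) - i
  return __riscv_vrgather_vv_f32m1_tu(vd, v, idx, vl);
}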

vfloat16mf4_t __riscv_vrgather_vv_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                            vuint16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vrgather_vx_f16mf4_tu(vfloat16mf4_t vd, vfloat16mf4_t vs2,
                                            size_t vs1, size_t vl);
vfloat16mf2_t __riscv_vrgather_vv_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                            vuint16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vrgather_vx_f16mf2_tu(vfloat16mf2_t vd, vfloat16mf2_t vs2,
                                            size_t vs1, size_t vl);
vfloat16m1_t __riscv_vrgather_vv_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                          vuint16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vrgather_vx_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                          size_t vs1, size_t vl);
vfloat16m2_t __riscv_vrgather_vv_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                          vuint16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vrgather_vx_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                          size_t vs1, size_t vl);
vfloat16m4_t __riscv_vrgather_vv_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                          vuint16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vrgather_vx_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                          size_t vs1, size_t vl);
vfloat16m8_t __riscv_vrgather_vv_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                          vuint16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vrgather_vx_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                          size_t vs1, size_t vl);
vfloat32mf2_t __riscv_vrgather_vv_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                            vuint32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vrgather_vx_f32mf2_tu(vfloat32mf2_t vd, vfloat32mf2_t vs2,
                                            size_t vs1, size_t vl);
vfloat32m1_t __riscv_vrgather_vv_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                          vuint32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vrgather_vx_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                          size_t vs1, size_t vl);
vfloat32m2_t __riscv_vrgather_vv_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                          vuint32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vrgather_vx_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                          size_t vs1, size_t vl);
vfloat32m4_t __riscv_vrgather_vv_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                          vuint32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vrgather_vx_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                          size_t vs1, size_t vl);
vfloat32m8_t __riscv_vrgather_vv_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                          vuint32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vrgather_vx_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                          size_t vs1, size_t vl);
vfloat64m1_t __riscv_vrgather_vv_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                          vuint64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vrgather_vx_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                          size_t vs1, size_t vl);
vfloat64m2_t __riscv_vrgather_vv_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                          vuint64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vrgather_vx_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                          size_t vs1, size_t vl);
vfloat64m4_t __riscv_vrgather_vv_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                          vuint64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vrgather_vx_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                          size_t vs1, size_t vl);
vfloat64m8_t __riscv_vrgather_vv_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                          vuint64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vrgather_vx_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                          size_t vs1, size_t vl);
vfloat16mf4_t __riscv_vrgatherei16_vv_f16mf4_tu(vfloat16mf4_t vd,
                                                vfloat16mf4_t vs2,
                                                vuint16mf4_t vs1, size_t vl);
vfloat16mf2_t __riscv_vrgatherei16_vv_f16mf2_tu(vfloat16mf2_t vd,
                                                vfloat16mf2_t vs2,
                                                vuint16mf2_t vs1, size_t vl);
vfloat16m1_t __riscv_vrgatherei16_vv_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                              vuint16m1_t vs1, size_t vl);
vfloat16m2_t __riscv_vrgatherei16_vv_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                              vuint16m2_t vs1, size_t vl);
vfloat16m4_t __riscv_vrgatherei16_vv_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                              vuint16m4_t vs1, size_t vl);
vfloat16m8_t __riscv_vrgatherei16_vv_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                              vuint16m8_t vs1, size_t vl);
vfloat32mf2_t __riscv_vrgatherei16_vv_f32mf2_tu(vfloat32mf2_t vd,
                                                vfloat32mf2_t vs2,
                                                vuint16mf4_t vs1, size_t vl);
vfloat32m1_t __riscv_vrgatherei16_vv_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                              vuint16mf2_t vs1, size_t vl);
vfloat32m2_t __riscv_vrgatherei16_vv_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                              vuint16m1_t vs1, size_t vl);
vfloat32m4_t __riscv_vrgatherei16_vv_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                              vuint16m2_t vs1, size_t vl);
vfloat32m8_t __riscv_vrgatherei16_vv_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                              vuint16m4_t vs1, size_t vl);
vfloat64m1_t __riscv_vrgatherei16_vv_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                              vuint16mf4_t vs1, size_t vl);
vfloat64m2_t __riscv_vrgatherei16_vv_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                              vuint16mf2_t vs1, size_t vl);
vfloat64m4_t __riscv_vrgatherei16_vv_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                              vuint16m1_t vs1, size_t vl);
vfloat64m8_t __riscv_vrgatherei16_vv_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                              vuint16m2_t vs1, size_t vl);
vint8mf8_t __riscv_vrgather_vv_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2,
                                        vuint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vrgather_vx_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2,
                                        size_t vs1, size_t vl);
vint8mf4_t __riscv_vrgather_vv_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2,
                                        vuint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vrgather_vx_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2,
                                        size_t vs1, size_t vl);
vint8mf2_t __riscv_vrgather_vv_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2,
                                        vuint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vrgather_vx_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2,
                                        size_t vs1, size_t vl);
vint8m1_t __riscv_vrgather_vv_i8m1_tu(vint8m1_t vd, vint8m1_t vs2,
                                      vuint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vrgather_vx_i8m1_tu(vint8m1_t vd, vint8m1_t vs2, size_t vs1,
                                      size_t vl);
vint8m2_t __riscv_vrgather_vv_i8m2_tu(vint8m2_t vd, vint8m2_t vs2,
                                      vuint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vrgather_vx_i8m2_tu(vint8m2_t vd, vint8m2_t vs2, size_t vs1,
                                      size_t vl);
vint8m4_t __riscv_vrgather_vv_i8m4_tu(vint8m4_t vd, vint8m4_t vs2,
                                      vuint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vrgather_vx_i8m4_tu(vint8m4_t vd, vint8m4_t vs2, size_t vs1,
                                      size_t vl);
vint8m8_t __riscv_vrgather_vv_i8m8_tu(vint8m8_t vd, vint8m8_t vs2,
                                      vuint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vrgather_vx_i8m8_tu(vint8m8_t vd, vint8m8_t vs2, size_t vs1,
                                      size_t vl);
vint16mf4_t __riscv_vrgather_vv_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                          vuint16mf4_t vs1, size_t vl);
vint16mf4_t __riscv_vrgather_vx_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                          size_t vs1, size_t vl);
vint16mf2_t __riscv_vrgather_vv_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                          vuint16mf2_t vs1, size_t vl);
vint16mf2_t __riscv_vrgather_vx_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                          size_t vs1, size_t vl);
vint16m1_t __riscv_vrgather_vv_i16m1_tu(vint16m1_t vd, vint16m1_t vs2,
                                        vuint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vrgather_vx_i16m1_tu(vint16m1_t vd, vint16m1_t vs2,
                                        size_t vs1, size_t vl);
vint16m2_t __riscv_vrgather_vv_i16m2_tu(vint16m2_t vd, vint16m2_t vs2,
                                        vuint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vrgather_vx_i16m2_tu(vint16m2_t vd, vint16m2_t vs2,
                                        size_t vs1, size_t vl);
vint16m4_t __riscv_vrgather_vv_i16m4_tu(vint16m4_t vd, vint16m4_t vs2,
                                        vuint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vrgather_vx_i16m4_tu(vint16m4_t vd, vint16m4_t vs2,
                                        size_t vs1, size_t vl);
vint16m8_t __riscv_vrgather_vv_i16m8_tu(vint16m8_t vd, vint16m8_t vs2,
                                        vuint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vrgather_vx_i16m8_tu(vint16m8_t vd, vint16m8_t vs2,
                                        size_t vs1, size_t vl);
vint32mf2_t __riscv_vrgather_vv_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                          vuint32mf2_t vs1, size_t vl);
vint32mf2_t __riscv_vrgather_vx_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                          size_t vs1, size_t vl);
vint32m1_t __riscv_vrgather_vv_i32m1_tu(vint32m1_t vd, vint32m1_t vs2,
                                        vuint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vrgather_vx_i32m1_tu(vint32m1_t vd, vint32m1_t vs2,
                                        size_t vs1, size_t vl);
vint32m2_t __riscv_vrgather_vv_i32m2_tu(vint32m2_t vd, vint32m2_t vs2,
                                        vuint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vrgather_vx_i32m2_tu(vint32m2_t vd, vint32m2_t vs2,
                                        size_t vs1, size_t vl);
vint32m4_t __riscv_vrgather_vv_i32m4_tu(vint32m4_t vd, vint32m4_t vs2,
                                        vuint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vrgather_vx_i32m4_tu(vint32m4_t vd, vint32m4_t vs2,
                                        size_t vs1, size_t vl);
vint32m8_t __riscv_vrgather_vv_i32m8_tu(vint32m8_t vd, vint32m8_t vs2,
                                        vuint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vrgather_vx_i32m8_tu(vint32m8_t vd, vint32m8_t vs2,
                                        size_t vs1, size_t vl);
vint64m1_t __riscv_vrgather_vv_i64m1_tu(vint64m1_t vd, vint64m1_t vs2,
                                        vuint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vrgather_vx_i64m1_tu(vint64m1_t vd, vint64m1_t vs2,
                                        size_t vs1, size_t vl);
vint64m2_t __riscv_vrgather_vv_i64m2_tu(vint64m2_t vd, vint64m2_t vs2,
                                        vuint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vrgather_vx_i64m2_tu(vint64m2_t vd, vint64m2_t vs2,
                                        size_t vs1, size_t vl);
vint64m4_t __riscv_vrgather_vv_i64m4_tu(vint64m4_t vd, vint64m4_t vs2,
                                        vuint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vrgather_vx_i64m4_tu(vint64m4_t vd, vint64m4_t vs2,
                                        size_t vs1, size_t vl);
vint64m8_t __riscv_vrgather_vv_i64m8_tu(vint64m8_t vd, vint64m8_t vs2,
                                        vuint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vrgather_vx_i64m8_tu(vint64m8_t vd, vint64m8_t vs2,
                                        size_t vs1, size_t vl);
vint8mf8_t __riscv_vrgatherei16_vv_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2,
                                            vuint16mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vrgatherei16_vv_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2,
                                            vuint16mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vrgatherei16_vv_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2,
                                            vuint16m1_t vs1, size_t vl);
vint8m1_t __riscv_vrgatherei16_vv_i8m1_tu(vint8m1_t vd, vint8m1_t vs2,
                                          vuint16m2_t vs1, size_t vl);
vint8m2_t __riscv_vrgatherei16_vv_i8m2_tu(vint8m2_t vd, vint8m2_t vs2,
                                          vuint16m4_t vs1, size_t vl);
vint8m4_t __riscv_vrgatherei16_vv_i8m4_tu(vint8m4_t vd, vint8m4_t vs2,
                                          vuint16m8_t vs1, size_t vl);
vint16mf4_t __riscv_vrgatherei16_vv_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                              vuint16mf4_t vs1, size_t vl);
vint16mf2_t __riscv_vrgatherei16_vv_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                              vuint16mf2_t vs1, size_t vl);
vint16m1_t __riscv_vrgatherei16_vv_i16m1_tu(vint16m1_t vd, vint16m1_t vs2,
                                            vuint16m1_t vs1, size_t vl);
vint16m2_t __riscv_vrgatherei16_vv_i16m2_tu(vint16m2_t vd, vint16m2_t vs2,
                                            vuint16m2_t vs1, size_t vl);
vint16m4_t __riscv_vrgatherei16_vv_i16m4_tu(vint16m4_t vd, vint16m4_t vs2,
                                            vuint16m4_t vs1, size_t vl);
vint16m8_t __riscv_vrgatherei16_vv_i16m8_tu(vint16m8_t vd, vint16m8_t vs2,
                                            vuint16m8_t vs1, size_t vl);
vint32mf2_t __riscv_vrgatherei16_vv_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                              vuint16mf4_t vs1, size_t vl);
vint32m1_t __riscv_vrgatherei16_vv_i32m1_tu(vint32m1_t vd, vint32m1_t vs2,
                                            vuint16mf2_t vs1, size_t vl);
vint32m2_t __riscv_vrgatherei16_vv_i32m2_tu(vint32m2_t vd, vint32m2_t vs2,
                                            vuint16m1_t vs1, size_t vl);
vint32m4_t __riscv_vrgatherei16_vv_i32m4_tu(vint32m4_t vd, vint32m4_t vs2,
                                            vuint16m2_t vs1, size_t vl);
vint32m8_t __riscv_vrgatherei16_vv_i32m8_tu(vint32m8_t vd, vint32m8_t vs2,
                                            vuint16m4_t vs1, size_t vl);
vint64m1_t __riscv_vrgatherei16_vv_i64m1_tu(vint64m1_t vd, vint64m1_t vs2,
                                            vuint16mf4_t vs1, size_t vl);
vint64m2_t __riscv_vrgatherei16_vv_i64m2_tu(vint64m2_t vd, vint64m2_t vs2,
                                            vuint16mf2_t vs1, size_t vl);
vint64m4_t __riscv_vrgatherei16_vv_i64m4_tu(vint64m4_t vd, vint64m4_t vs2,
                                            vuint16m1_t vs1, size_t vl);
vint64m8_t __riscv_vrgatherei16_vv_i64m8_tu(vint64m8_t vd, vint64m8_t vs2,
                                            vuint16m2_t vs1, size_t vl);
vuint8mf8_t __riscv_vrgather_vv_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                         vuint8mf8_t vs1, size_t vl);
vuint8mf8_t __riscv_vrgather_vx_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                         size_t vs1, size_t vl);
vuint8mf4_t __riscv_vrgather_vv_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                         vuint8mf4_t vs1, size_t vl);
vuint8mf4_t __riscv_vrgather_vx_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                         size_t vs1, size_t vl);
vuint8mf2_t __riscv_vrgather_vv_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                         vuint8mf2_t vs1, size_t vl);
vuint8mf2_t __riscv_vrgather_vx_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                         size_t vs1, size_t vl);
vuint8m1_t __riscv_vrgather_vv_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2,
                                       vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vrgather_vx_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2,
                                       size_t vs1, size_t vl);
vuint8m2_t __riscv_vrgather_vv_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2,
                                       vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vrgather_vx_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2,
                                       size_t vs1, size_t vl);
vuint8m4_t __riscv_vrgather_vv_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2,
                                       vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vrgather_vx_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2,
                                       size_t vs1, size_t vl);
vuint8m8_t __riscv_vrgather_vv_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2,
                                       vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vrgather_vx_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2,
                                       size_t vs1, size_t vl);
vuint16mf4_t __riscv_vrgather_vv_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                           vuint16mf4_t vs1, size_t vl);
vuint16mf4_t __riscv_vrgather_vx_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                           size_t vs1, size_t vl);
vuint16mf2_t __riscv_vrgather_vv_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                           vuint16mf2_t vs1, size_t vl);
vuint16mf2_t __riscv_vrgather_vx_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                           size_t vs1, size_t vl);
vuint16m1_t __riscv_vrgather_vv_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                         vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vrgather_vx_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                         size_t vs1, size_t vl);
vuint16m2_t __riscv_vrgather_vv_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                         vuint16m2_t vs1, size_t vl);
vuint16m2_t __riscv_vrgather_vx_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                         size_t vs1, size_t vl);
vuint16m4_t __riscv_vrgather_vv_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                         vuint16m4_t vs1, size_t vl);
vuint16m4_t __riscv_vrgather_vx_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                         size_t vs1, size_t vl);
vuint16m8_t __riscv_vrgather_vv_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                         vuint16m8_t vs1, size_t vl);
vuint16m8_t __riscv_vrgather_vx_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                         size_t vs1, size_t vl);
vuint32mf2_t __riscv_vrgather_vv_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                           vuint32mf2_t vs1, size_t vl);
vuint32mf2_t __riscv_vrgather_vx_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                           size_t vs1, size_t vl);
vuint32m1_t __riscv_vrgather_vv_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                         vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vrgather_vx_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                         size_t vs1, size_t vl);
vuint32m2_t __riscv_vrgather_vv_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                         vuint32m2_t vs1, size_t vl);
vuint32m2_t __riscv_vrgather_vx_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                         size_t vs1, size_t vl);
vuint32m4_t __riscv_vrgather_vv_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                         vuint32m4_t vs1, size_t vl);
vuint32m4_t __riscv_vrgather_vx_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                         size_t vs1, size_t vl);
vuint32m8_t __riscv_vrgather_vv_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                         vuint32m8_t vs1, size_t vl);
vuint32m8_t __riscv_vrgather_vx_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                         size_t vs1, size_t vl);
vuint64m1_t __riscv_vrgather_vv_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                         vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vrgather_vx_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                         size_t vs1, size_t vl);
vuint64m2_t __riscv_vrgather_vv_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                         vuint64m2_t vs1, size_t vl);
vuint64m2_t __riscv_vrgather_vx_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                         size_t vs1, size_t vl);
vuint64m4_t __riscv_vrgather_vv_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                         vuint64m4_t vs1, size_t vl);
vuint64m4_t __riscv_vrgather_vx_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                         size_t vs1, size_t vl);
vuint64m8_t __riscv_vrgather_vv_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                         vuint64m8_t vs1, size_t vl);
vuint64m8_t __riscv_vrgather_vx_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                         size_t vs1, size_t vl);
vuint8mf8_t __riscv_vrgatherei16_vv_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                             vuint16mf4_t vs1, size_t vl);
vuint8mf4_t __riscv_vrgatherei16_vv_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                             vuint16mf2_t vs1, size_t vl);
vuint8mf2_t __riscv_vrgatherei16_vv_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                             vuint16m1_t vs1, size_t vl);
vuint8m1_t __riscv_vrgatherei16_vv_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2,
                                           vuint16m2_t vs1, size_t vl);
vuint8m2_t __riscv_vrgatherei16_vv_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2,
                                           vuint16m4_t vs1, size_t vl);
vuint8m4_t __riscv_vrgatherei16_vv_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2,
                                           vuint16m8_t vs1, size_t vl);
vuint16mf4_t __riscv_vrgatherei16_vv_u16mf4_tu(vuint16mf4_t vd,
                                               vuint16mf4_t vs2,
                                               vuint16mf4_t vs1, size_t vl);
vuint16mf2_t __riscv_vrgatherei16_vv_u16mf2_tu(vuint16mf2_t vd,
                                               vuint16mf2_t vs2,
                                               vuint16mf2_t vs1, size_t vl);
vuint16m1_t __riscv_vrgatherei16_vv_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                             vuint16m1_t vs1, size_t vl);
vuint16m2_t __riscv_vrgatherei16_vv_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                             vuint16m2_t vs1, size_t vl);
vuint16m4_t __riscv_vrgatherei16_vv_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                             vuint16m4_t vs1, size_t vl);
vuint16m8_t __riscv_vrgatherei16_vv_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                             vuint16m8_t vs1, size_t vl);
vuint32mf2_t __riscv_vrgatherei16_vv_u32mf2_tu(vuint32mf2_t vd,
                                               vuint32mf2_t vs2,
                                               vuint16mf4_t vs1, size_t vl);
vuint32m1_t __riscv_vrgatherei16_vv_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                             vuint16mf2_t vs1, size_t vl);
vuint32m2_t __riscv_vrgatherei16_vv_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                             vuint16m1_t vs1, size_t vl);
vuint32m4_t __riscv_vrgatherei16_vv_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                             vuint16m2_t vs1, size_t vl);
vuint32m8_t __riscv_vrgatherei16_vv_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                             vuint16m4_t vs1, size_t vl);
vuint64m1_t __riscv_vrgatherei16_vv_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                             vuint16mf4_t vs1, size_t vl);
vuint64m2_t __riscv_vrgatherei16_vv_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                             vuint16mf2_t vs1, size_t vl);
vuint64m4_t __riscv_vrgatherei16_vv_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                             vuint16m1_t vs1, size_t vl);
vuint64m8_t __riscv_vrgatherei16_vv_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                             vuint16m2_t vs1, size_t vl);
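
Before the masked forms below, a sketch of an ei16 gather (the function name is illustrative): because the index element width is fixed at 16 bits, gathering f64m1 data needs only a vuint16mf4_t index operand rather than a full vuint64m1_t register:

#include <riscv_vector.h>

// Gather doubles from `table` through 16-bit indices. EEW=16 indices
// for SEW=64, LMUL=1 data give the index operand EMUL=1/4, hence
// vuint16mf4_t. Tail elements past vl keep their values from `vd`
// under the _tu policy.
vfloat64m1_t gather_f64(vfloat64m1_t vd, vfloat64m1_t table,
                       vuint16mf4_t idx, size_t vl) {
  return __riscv_vrgatherei16_vv_f64m1_tu(vd, table, idx, vl);
}
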
// masked functions
vfloat16mf4_t __riscv_vrgather_vv_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                             vfloat16mf4_t vs2,
                                             vuint16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vrgather_vx_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                             vfloat16mf4_t vs2, size_t vs1,
                                             size_t vl);
vfloat16mf2_t __riscv_vrgather_vv_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                             vfloat16mf2_t vs2,
                                             vuint16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vrgather_vx_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                             vfloat16mf2_t vs2, size_t vs1,
                                             size_t vl);
vfloat16m1_t __riscv_vrgather_vv_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                           vfloat16m1_t vs2, vuint16m1_t vs1,
                                           size_t vl);
vfloat16m1_t __riscv_vrgather_vx_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                           vfloat16m1_t vs2, size_t vs1,
                                           size_t vl);
vfloat16m2_t __riscv_vrgather_vv_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                           vfloat16m2_t vs2, vuint16m2_t vs1,
                                           size_t vl);
vfloat16m2_t __riscv_vrgather_vx_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                           vfloat16m2_t vs2, size_t vs1,
                                           size_t vl);
vfloat16m4_t __riscv_vrgather_vv_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                           vfloat16m4_t vs2, vuint16m4_t vs1,
                                           size_t vl);
vfloat16m4_t __riscv_vrgather_vx_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                           vfloat16m4_t vs2, size_t vs1,
                                           size_t vl);
vfloat16m8_t __riscv_vrgather_vv_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                           vfloat16m8_t vs2, vuint16m8_t vs1,
                                           size_t vl);
vfloat16m8_t __riscv_vrgather_vx_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                           vfloat16m8_t vs2, size_t vs1,
                                           size_t vl);
vfloat32mf2_t __riscv_vrgather_vv_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat32mf2_t vs2,
                                             vuint32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vrgather_vx_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                             vfloat32mf2_t vs2, size_t vs1,
                                             size_t vl);
vfloat32m1_t __riscv_vrgather_vv_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat32m1_t vs2, vuint32m1_t vs1,
                                           size_t vl);
vfloat32m1_t __riscv_vrgather_vx_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                           vfloat32m1_t vs2, size_t vs1,
                                           size_t vl);
vfloat32m2_t __riscv_vrgather_vv_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat32m2_t vs2, vuint32m2_t vs1,
                                           size_t vl);
vfloat32m2_t __riscv_vrgather_vx_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                           vfloat32m2_t vs2, size_t vs1,
                                           size_t vl);
vfloat32m4_t __riscv_vrgather_vv_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat32m4_t vs2, vuint32m4_t vs1,
                                           size_t vl);
vfloat32m4_t __riscv_vrgather_vx_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                           vfloat32m4_t vs2, size_t vs1,
                                           size_t vl);
vfloat32m8_t __riscv_vrgather_vv_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat32m8_t vs2, vuint32m8_t vs1,
                                           size_t vl);
vfloat32m8_t __riscv_vrgather_vx_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                           vfloat32m8_t vs2, size_t vs1,
                                           size_t vl);
vfloat64m1_t __riscv_vrgather_vv_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat64m1_t vs2, vuint64m1_t vs1,
                                           size_t vl);
vfloat64m1_t __riscv_vrgather_vx_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                           vfloat64m1_t vs2, size_t vs1,
                                           size_t vl);
vfloat64m2_t __riscv_vrgather_vv_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat64m2_t vs2, vuint64m2_t vs1,
                                           size_t vl);
vfloat64m2_t __riscv_vrgather_vx_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                           vfloat64m2_t vs2, size_t vs1,
                                           size_t vl);
vfloat64m4_t __riscv_vrgather_vv_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat64m4_t vs2, vuint64m4_t vs1,
                                           size_t vl);
vfloat64m4_t __riscv_vrgather_vx_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                           vfloat64m4_t vs2, size_t vs1,
                                           size_t vl);
vfloat64m8_t __riscv_vrgather_vv_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat64m8_t vs2, vuint64m8_t vs1,
                                           size_t vl);
vfloat64m8_t __riscv_vrgather_vx_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                           vfloat64m8_t vs2, size_t vs1,
                                           size_t vl);
vfloat16mf4_t __riscv_vrgatherei16_vv_f16mf4_tum(vbool64_t vm, vfloat16mf4_t vd,
                                                 vfloat16mf4_t vs2,
                                                 vuint16mf4_t vs1, size_t vl);
vfloat16mf2_t __riscv_vrgatherei16_vv_f16mf2_tum(vbool32_t vm, vfloat16mf2_t vd,
                                                 vfloat16mf2_t vs2,
                                                 vuint16mf2_t vs1, size_t vl);
vfloat16m1_t __riscv_vrgatherei16_vv_f16m1_tum(vbool16_t vm, vfloat16m1_t vd,
                                               vfloat16m1_t vs2,
                                               vuint16m1_t vs1, size_t vl);
vfloat16m2_t __riscv_vrgatherei16_vv_f16m2_tum(vbool8_t vm, vfloat16m2_t vd,
                                               vfloat16m2_t vs2,
                                               vuint16m2_t vs1, size_t vl);
vfloat16m4_t __riscv_vrgatherei16_vv_f16m4_tum(vbool4_t vm, vfloat16m4_t vd,
                                               vfloat16m4_t vs2,
                                               vuint16m4_t vs1, size_t vl);
vfloat16m8_t __riscv_vrgatherei16_vv_f16m8_tum(vbool2_t vm, vfloat16m8_t vd,
                                               vfloat16m8_t vs2,
                                               vuint16m8_t vs1, size_t vl);
vfloat32mf2_t __riscv_vrgatherei16_vv_f32mf2_tum(vbool64_t vm, vfloat32mf2_t vd,
                                                 vfloat32mf2_t vs2,
                                                 vuint16mf4_t vs1, size_t vl);
vfloat32m1_t __riscv_vrgatherei16_vv_f32m1_tum(vbool32_t vm, vfloat32m1_t vd,
                                               vfloat32m1_t vs2,
                                               vuint16mf2_t vs1, size_t vl);
vfloat32m2_t __riscv_vrgatherei16_vv_f32m2_tum(vbool16_t vm, vfloat32m2_t vd,
                                               vfloat32m2_t vs2,
                                               vuint16m1_t vs1, size_t vl);
vfloat32m4_t __riscv_vrgatherei16_vv_f32m4_tum(vbool8_t vm, vfloat32m4_t vd,
                                               vfloat32m4_t vs2,
                                               vuint16m2_t vs1, size_t vl);
vfloat32m8_t __riscv_vrgatherei16_vv_f32m8_tum(vbool4_t vm, vfloat32m8_t vd,
                                               vfloat32m8_t vs2,
                                               vuint16m4_t vs1, size_t vl);
vfloat64m1_t __riscv_vrgatherei16_vv_f64m1_tum(vbool64_t vm, vfloat64m1_t vd,
                                               vfloat64m1_t vs2,
                                               vuint16mf4_t vs1, size_t vl);
vfloat64m2_t __riscv_vrgatherei16_vv_f64m2_tum(vbool32_t vm, vfloat64m2_t vd,
                                               vfloat64m2_t vs2,
                                               vuint16mf2_t vs1, size_t vl);
vfloat64m4_t __riscv_vrgatherei16_vv_f64m4_tum(vbool16_t vm, vfloat64m4_t vd,
                                               vfloat64m4_t vs2,
                                               vuint16m1_t vs1, size_t vl);
vfloat64m8_t __riscv_vrgatherei16_vv_f64m8_tum(vbool8_t vm, vfloat64m8_t vd,
                                               vfloat64m8_t vs2,
                                               vuint16m2_t vs1, size_t vl);
vint8mf8_t __riscv_vrgather_vv_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                         vint8mf8_t vs2, vuint8mf8_t vs1,
                                         size_t vl);
vint8mf8_t __riscv_vrgather_vx_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                         vint8mf8_t vs2, size_t vs1, size_t vl);
vint8mf4_t __riscv_vrgather_vv_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                         vint8mf4_t vs2, vuint8mf4_t vs1,
                                         size_t vl);
vint8mf4_t __riscv_vrgather_vx_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                         vint8mf4_t vs2, size_t vs1, size_t vl);
vint8mf2_t __riscv_vrgather_vv_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                         vint8mf2_t vs2, vuint8mf2_t vs1,
                                         size_t vl);
vint8mf2_t __riscv_vrgather_vx_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                         vint8mf2_t vs2, size_t vs1, size_t vl);
vint8m1_t __riscv_vrgather_vv_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                       vuint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vrgather_vx_i8m1_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                       size_t vs1, size_t vl);
vint8m2_t __riscv_vrgather_vv_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                       vuint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vrgather_vx_i8m2_tum(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                       size_t vs1, size_t vl);
vint8m4_t __riscv_vrgather_vv_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                       vuint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vrgather_vx_i8m4_tum(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                       size_t vs1, size_t vl);
vint8m8_t __riscv_vrgather_vv_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                       vuint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vrgather_vx_i8m8_tum(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                       size_t vs1, size_t vl);
vint16mf4_t __riscv_vrgather_vv_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                           vint16mf4_t vs2, vuint16mf4_t vs1,
                                           size_t vl);
vint16mf4_t __riscv_vrgather_vx_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                           vint16mf4_t vs2, size_t vs1,
                                           size_t vl);
vint16mf2_t __riscv_vrgather_vv_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                           vint16mf2_t vs2, vuint16mf2_t vs1,
                                           size_t vl);
vint16mf2_t __riscv_vrgather_vx_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                           vint16mf2_t vs2, size_t vs1,
                                           size_t vl);
vint16m1_t __riscv_vrgather_vv_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                         vint16m1_t vs2, vuint16m1_t vs1,
                                         size_t vl);
vint16m1_t __riscv_vrgather_vx_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                         vint16m1_t vs2, size_t vs1, size_t vl);
vint16m2_t __riscv_vrgather_vv_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                         vint16m2_t vs2, vuint16m2_t vs1,
                                         size_t vl);
vint16m2_t __riscv_vrgather_vx_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                         vint16m2_t vs2, size_t vs1, size_t vl);
vint16m4_t __riscv_vrgather_vv_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                         vint16m4_t vs2, vuint16m4_t vs1,
                                         size_t vl);
vint16m4_t __riscv_vrgather_vx_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                         vint16m4_t vs2, size_t vs1, size_t vl);
vint16m8_t __riscv_vrgather_vv_i16m8_tum(vbool2_t vm, vint16m8_t vd,
                                         vint16m8_t vs2, vuint16m8_t vs1,
                                         size_t vl);
vint16m8_t __riscv_vrgather_vx_i16m8_tum(vbool2_t vm, vint16m8_t vd,
                                         vint16m8_t vs2, size_t vs1, size_t vl);
vint32mf2_t __riscv_vrgather_vv_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                           vint32mf2_t vs2, vuint32mf2_t vs1,
                                           size_t vl);
vint32mf2_t __riscv_vrgather_vx_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                           vint32mf2_t vs2, size_t vs1,
                                           size_t vl);
vint32m1_t __riscv_vrgather_vv_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                         vint32m1_t vs2, vuint32m1_t vs1,
                                         size_t vl);
vint32m1_t __riscv_vrgather_vx_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                         vint32m1_t vs2, size_t vs1, size_t vl);
vint32m2_t __riscv_vrgather_vv_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                         vint32m2_t vs2, vuint32m2_t vs1,
                                         size_t vl);
vint32m2_t __riscv_vrgather_vx_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                         vint32m2_t vs2, size_t vs1, size_t vl);
vint32m4_t __riscv_vrgather_vv_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                         vint32m4_t vs2, vuint32m4_t vs1,
                                         size_t vl);
vint32m4_t __riscv_vrgather_vx_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                         vint32m4_t vs2, size_t vs1, size_t vl);
vint32m8_t __riscv_vrgather_vv_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                         vint32m8_t vs2, vuint32m8_t vs1,
                                         size_t vl);
vint32m8_t __riscv_vrgather_vx_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                         vint32m8_t vs2, size_t vs1, size_t vl);
vint64m1_t __riscv_vrgather_vv_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                         vint64m1_t vs2, vuint64m1_t vs1,
                                         size_t vl);
vint64m1_t __riscv_vrgather_vx_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                         vint64m1_t vs2, size_t vs1, size_t vl);
vint64m2_t __riscv_vrgather_vv_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                         vint64m2_t vs2, vuint64m2_t vs1,
                                         size_t vl);
vint64m2_t __riscv_vrgather_vx_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                         vint64m2_t vs2, size_t vs1, size_t vl);
vint64m4_t __riscv_vrgather_vv_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                         vint64m4_t vs2, vuint64m4_t vs1,
                                         size_t vl);
vint64m4_t __riscv_vrgather_vx_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                         vint64m4_t vs2, size_t vs1, size_t vl);
vint64m8_t __riscv_vrgather_vv_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                         vint64m8_t vs2, vuint64m8_t vs1,
                                         size_t vl);
vint64m8_t __riscv_vrgather_vx_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                         vint64m8_t vs2, size_t vs1, size_t vl);
vint8mf8_t __riscv_vrgatherei16_vv_i8mf8_tum(vbool64_t vm, vint8mf8_t vd,
                                             vint8mf8_t vs2, vuint16mf4_t vs1,
                                             size_t vl);
vint8mf4_t __riscv_vrgatherei16_vv_i8mf4_tum(vbool32_t vm, vint8mf4_t vd,
                                             vint8mf4_t vs2, vuint16mf2_t vs1,
                                             size_t vl);
vint8mf2_t __riscv_vrgatherei16_vv_i8mf2_tum(vbool16_t vm, vint8mf2_t vd,
                                             vint8mf2_t vs2, vuint16m1_t vs1,
                                             size_t vl);
vint8m1_t __riscv_vrgatherei16_vv_i8m1_tum(vbool8_t vm, vint8m1_t vd,
                                           vint8m1_t vs2, vuint16m2_t vs1,
                                           size_t vl);
vint8m2_t __riscv_vrgatherei16_vv_i8m2_tum(vbool4_t vm, vint8m2_t vd,
                                           vint8m2_t vs2, vuint16m4_t vs1,
                                           size_t vl);
vint8m4_t __riscv_vrgatherei16_vv_i8m4_tum(vbool2_t vm, vint8m4_t vd,
                                           vint8m4_t vs2, vuint16m8_t vs1,
                                           size_t vl);
vint16mf4_t __riscv_vrgatherei16_vv_i16mf4_tum(vbool64_t vm, vint16mf4_t vd,
                                               vint16mf4_t vs2,
                                               vuint16mf4_t vs1, size_t vl);
vint16mf2_t __riscv_vrgatherei16_vv_i16mf2_tum(vbool32_t vm, vint16mf2_t vd,
                                               vint16mf2_t vs2,
                                               vuint16mf2_t vs1, size_t vl);
vint16m1_t __riscv_vrgatherei16_vv_i16m1_tum(vbool16_t vm, vint16m1_t vd,
                                             vint16m1_t vs2, vuint16m1_t vs1,
                                             size_t vl);
vint16m2_t __riscv_vrgatherei16_vv_i16m2_tum(vbool8_t vm, vint16m2_t vd,
                                             vint16m2_t vs2, vuint16m2_t vs1,
                                             size_t vl);
vint16m4_t __riscv_vrgatherei16_vv_i16m4_tum(vbool4_t vm, vint16m4_t vd,
                                             vint16m4_t vs2, vuint16m4_t vs1,
                                             size_t vl);
vint16m8_t __riscv_vrgatherei16_vv_i16m8_tum(vbool2_t vm, vint16m8_t vd,
                                             vint16m8_t vs2, vuint16m8_t vs1,
                                             size_t vl);
vint32mf2_t __riscv_vrgatherei16_vv_i32mf2_tum(vbool64_t vm, vint32mf2_t vd,
                                               vint32mf2_t vs2,
                                               vuint16mf4_t vs1, size_t vl);
vint32m1_t __riscv_vrgatherei16_vv_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                             vint32m1_t vs2, vuint16mf2_t vs1,
                                             size_t vl);
vint32m2_t __riscv_vrgatherei16_vv_i32m2_tum(vbool16_t vm, vint32m2_t vd,
                                             vint32m2_t vs2, vuint16m1_t vs1,
                                             size_t vl);
vint32m4_t __riscv_vrgatherei16_vv_i32m4_tum(vbool8_t vm, vint32m4_t vd,
                                             vint32m4_t vs2, vuint16m2_t vs1,
                                             size_t vl);
vint32m8_t __riscv_vrgatherei16_vv_i32m8_tum(vbool4_t vm, vint32m8_t vd,
                                             vint32m8_t vs2, vuint16m4_t vs1,
                                             size_t vl);
vint64m1_t __riscv_vrgatherei16_vv_i64m1_tum(vbool64_t vm, vint64m1_t vd,
                                             vint64m1_t vs2, vuint16mf4_t vs1,
                                             size_t vl);
vint64m2_t __riscv_vrgatherei16_vv_i64m2_tum(vbool32_t vm, vint64m2_t vd,
                                             vint64m2_t vs2, vuint16mf2_t vs1,
                                             size_t vl);
vint64m4_t __riscv_vrgatherei16_vv_i64m4_tum(vbool16_t vm, vint64m4_t vd,
                                             vint64m4_t vs2, vuint16m1_t vs1,
                                             size_t vl);
vint64m8_t __riscv_vrgatherei16_vv_i64m8_tum(vbool8_t vm, vint64m8_t vd,
                                             vint64m8_t vs2, vuint16m2_t vs1,
                                             size_t vl);
vuint8mf8_t __riscv_vrgather_vv_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                          vuint8mf8_t vs2, vuint8mf8_t vs1,
                                          size_t vl);
vuint8mf8_t __riscv_vrgather_vx_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                          vuint8mf8_t vs2, size_t vs1,
                                          size_t vl);
vuint8mf4_t __riscv_vrgather_vv_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                          vuint8mf4_t vs2, vuint8mf4_t vs1,
                                          size_t vl);
vuint8mf4_t __riscv_vrgather_vx_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                          vuint8mf4_t vs2, size_t vs1,
                                          size_t vl);
vuint8mf2_t __riscv_vrgather_vv_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                          vuint8mf2_t vs2, vuint8mf2_t vs1,
                                          size_t vl);
vuint8mf2_t __riscv_vrgather_vx_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                          vuint8mf2_t vs2, size_t vs1,
                                          size_t vl);
vuint8m1_t __riscv_vrgather_vv_u8m1_tum(vbool8_t vm, vuint8m1_t vd,
                                        vuint8m1_t vs2, vuint8m1_t vs1,
                                        size_t vl);
vuint8m1_t __riscv_vrgather_vx_u8m1_tum(vbool8_t vm, vuint8m1_t vd,
                                        vuint8m1_t vs2, size_t vs1, size_t vl);
vuint8m2_t __riscv_vrgather_vv_u8m2_tum(vbool4_t vm, vuint8m2_t vd,
                                        vuint8m2_t vs2, vuint8m2_t vs1,
                                        size_t vl);
vuint8m2_t __riscv_vrgather_vx_u8m2_tum(vbool4_t vm, vuint8m2_t vd,
                                        vuint8m2_t vs2, size_t vs1, size_t vl);
vuint8m4_t __riscv_vrgather_vv_u8m4_tum(vbool2_t vm, vuint8m4_t vd,
                                        vuint8m4_t vs2, vuint8m4_t vs1,
                                        size_t vl);
vuint8m4_t __riscv_vrgather_vx_u8m4_tum(vbool2_t vm, vuint8m4_t vd,
                                        vuint8m4_t vs2, size_t vs1, size_t vl);
vuint8m8_t __riscv_vrgather_vv_u8m8_tum(vbool1_t vm, vuint8m8_t vd,
                                        vuint8m8_t vs2, vuint8m8_t vs1,
                                        size_t vl);
vuint8m8_t __riscv_vrgather_vx_u8m8_tum(vbool1_t vm, vuint8m8_t vd,
                                        vuint8m8_t vs2, size_t vs1, size_t vl);
vuint16mf4_t __riscv_vrgather_vv_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                            vuint16mf4_t vs2, vuint16mf4_t vs1,
                                            size_t vl);
vuint16mf4_t __riscv_vrgather_vx_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                            vuint16mf4_t vs2, size_t vs1,
                                            size_t vl);
vuint16mf2_t __riscv_vrgather_vv_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                            vuint16mf2_t vs2, vuint16mf2_t vs1,
                                            size_t vl);
vuint16mf2_t __riscv_vrgather_vx_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                            vuint16mf2_t vs2, size_t vs1,
                                            size_t vl);
vuint16m1_t __riscv_vrgather_vv_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                          vuint16m1_t vs2, vuint16m1_t vs1,
                                          size_t vl);
vuint16m1_t __riscv_vrgather_vx_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                          vuint16m1_t vs2, size_t vs1,
                                          size_t vl);
vuint16m2_t __riscv_vrgather_vv_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                          vuint16m2_t vs2, vuint16m2_t vs1,
                                          size_t vl);
vuint16m2_t __riscv_vrgather_vx_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                          vuint16m2_t vs2, size_t vs1,
                                          size_t vl);
vuint16m4_t __riscv_vrgather_vv_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                          vuint16m4_t vs2, vuint16m4_t vs1,
                                          size_t vl);
vuint16m4_t __riscv_vrgather_vx_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                          vuint16m4_t vs2, size_t vs1,
                                          size_t vl);
vuint16m8_t __riscv_vrgather_vv_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                          vuint16m8_t vs2, vuint16m8_t vs1,
                                          size_t vl);
vuint16m8_t __riscv_vrgather_vx_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                          vuint16m8_t vs2, size_t vs1,
                                          size_t vl);
vuint32mf2_t __riscv_vrgather_vv_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                            vuint32mf2_t vs2, vuint32mf2_t vs1,
                                            size_t vl);
vuint32mf2_t __riscv_vrgather_vx_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                            vuint32mf2_t vs2, size_t vs1,
                                            size_t vl);
vuint32m1_t __riscv_vrgather_vv_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                          vuint32m1_t vs2, vuint32m1_t vs1,
                                          size_t vl);
vuint32m1_t __riscv_vrgather_vx_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                          vuint32m1_t vs2, size_t vs1,
                                          size_t vl);
vuint32m2_t __riscv_vrgather_vv_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                          vuint32m2_t vs2, vuint32m2_t vs1,
                                          size_t vl);
vuint32m2_t __riscv_vrgather_vx_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                          vuint32m2_t vs2, size_t vs1,
                                          size_t vl);
vuint32m4_t __riscv_vrgather_vv_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                          vuint32m4_t vs2, vuint32m4_t vs1,
                                          size_t vl);
vuint32m4_t __riscv_vrgather_vx_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                          vuint32m4_t vs2, size_t vs1,
                                          size_t vl);
vuint32m8_t __riscv_vrgather_vv_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                          vuint32m8_t vs2, vuint32m8_t vs1,
                                          size_t vl);
vuint32m8_t __riscv_vrgather_vx_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                          vuint32m8_t vs2, size_t vs1,
                                          size_t vl);
vuint64m1_t __riscv_vrgather_vv_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                          vuint64m1_t vs2, vuint64m1_t vs1,
                                          size_t vl);
vuint64m1_t __riscv_vrgather_vx_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                          vuint64m1_t vs2, size_t vs1,
                                          size_t vl);
vuint64m2_t __riscv_vrgather_vv_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                          vuint64m2_t vs2, vuint64m2_t vs1,
                                          size_t vl);
vuint64m2_t __riscv_vrgather_vx_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                          vuint64m2_t vs2, size_t vs1,
                                          size_t vl);
vuint64m4_t __riscv_vrgather_vv_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                          vuint64m4_t vs2, vuint64m4_t vs1,
                                          size_t vl);
vuint64m4_t __riscv_vrgather_vx_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                          vuint64m4_t vs2, size_t vs1,
                                          size_t vl);
vuint64m8_t __riscv_vrgather_vv_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                          vuint64m8_t vs2, vuint64m8_t vs1,
                                          size_t vl);
vuint64m8_t __riscv_vrgather_vx_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                          vuint64m8_t vs2, size_t vs1,
                                          size_t vl);
vuint8mf8_t __riscv_vrgatherei16_vv_u8mf8_tum(vbool64_t vm, vuint8mf8_t vd,
                                              vuint8mf8_t vs2, vuint16mf4_t vs1,
                                              size_t vl);
vuint8mf4_t __riscv_vrgatherei16_vv_u8mf4_tum(vbool32_t vm, vuint8mf4_t vd,
                                              vuint8mf4_t vs2, vuint16mf2_t vs1,
                                              size_t vl);
vuint8mf2_t __riscv_vrgatherei16_vv_u8mf2_tum(vbool16_t vm, vuint8mf2_t vd,
                                              vuint8mf2_t vs2, vuint16m1_t vs1,
                                              size_t vl);
vuint8m1_t __riscv_vrgatherei16_vv_u8m1_tum(vbool8_t vm, vuint8m1_t vd,
                                            vuint8m1_t vs2, vuint16m2_t vs1,
                                            size_t vl);
vuint8m2_t __riscv_vrgatherei16_vv_u8m2_tum(vbool4_t vm, vuint8m2_t vd,
                                            vuint8m2_t vs2, vuint16m4_t vs1,
                                            size_t vl);
vuint8m4_t __riscv_vrgatherei16_vv_u8m4_tum(vbool2_t vm, vuint8m4_t vd,
                                            vuint8m4_t vs2, vuint16m8_t vs1,
                                            size_t vl);
vuint16mf4_t __riscv_vrgatherei16_vv_u16mf4_tum(vbool64_t vm, vuint16mf4_t vd,
                                                vuint16mf4_t vs2,
                                                vuint16mf4_t vs1, size_t vl);
vuint16mf2_t __riscv_vrgatherei16_vv_u16mf2_tum(vbool32_t vm, vuint16mf2_t vd,
                                                vuint16mf2_t vs2,
                                                vuint16mf2_t vs1, size_t vl);
vuint16m1_t __riscv_vrgatherei16_vv_u16m1_tum(vbool16_t vm, vuint16m1_t vd,
                                              vuint16m1_t vs2, vuint16m1_t vs1,
                                              size_t vl);
vuint16m2_t __riscv_vrgatherei16_vv_u16m2_tum(vbool8_t vm, vuint16m2_t vd,
                                              vuint16m2_t vs2, vuint16m2_t vs1,
                                              size_t vl);
vuint16m4_t __riscv_vrgatherei16_vv_u16m4_tum(vbool4_t vm, vuint16m4_t vd,
                                              vuint16m4_t vs2, vuint16m4_t vs1,
                                              size_t vl);
vuint16m8_t __riscv_vrgatherei16_vv_u16m8_tum(vbool2_t vm, vuint16m8_t vd,
                                              vuint16m8_t vs2, vuint16m8_t vs1,
                                              size_t vl);
vuint32mf2_t __riscv_vrgatherei16_vv_u32mf2_tum(vbool64_t vm, vuint32mf2_t vd,
                                                vuint32mf2_t vs2,
                                                vuint16mf4_t vs1, size_t vl);
vuint32m1_t __riscv_vrgatherei16_vv_u32m1_tum(vbool32_t vm, vuint32m1_t vd,
                                              vuint32m1_t vs2, vuint16mf2_t vs1,
                                              size_t vl);
vuint32m2_t __riscv_vrgatherei16_vv_u32m2_tum(vbool16_t vm, vuint32m2_t vd,
                                              vuint32m2_t vs2, vuint16m1_t vs1,
                                              size_t vl);
vuint32m4_t __riscv_vrgatherei16_vv_u32m4_tum(vbool8_t vm, vuint32m4_t vd,
                                              vuint32m4_t vs2, vuint16m2_t vs1,
                                              size_t vl);
vuint32m8_t __riscv_vrgatherei16_vv_u32m8_tum(vbool4_t vm, vuint32m8_t vd,
                                              vuint32m8_t vs2, vuint16m4_t vs1,
                                              size_t vl);
vuint64m1_t __riscv_vrgatherei16_vv_u64m1_tum(vbool64_t vm, vuint64m1_t vd,
                                              vuint64m1_t vs2, vuint16mf4_t vs1,
                                              size_t vl);
vuint64m2_t __riscv_vrgatherei16_vv_u64m2_tum(vbool32_t vm, vuint64m2_t vd,
                                              vuint64m2_t vs2, vuint16mf2_t vs1,
                                              size_t vl);
vuint64m4_t __riscv_vrgatherei16_vv_u64m4_tum(vbool16_t vm, vuint64m4_t vd,
                                              vuint64m4_t vs2, vuint16m1_t vs1,
                                              size_t vl);
vuint64m8_t __riscv_vrgatherei16_vv_u64m8_tum(vbool8_t vm, vuint64m8_t vd,
                                              vuint64m8_t vs2, vuint16m2_t vs1,
                                              size_t vl);
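
A minimal usage sketch for the tail-undisturbed masked (_tum) gathers above (illustrative only; the wrapper name reverse_i32m1_tum is hypothetical, not part of the API):

#include <riscv_vector.h>

// Reverse the first vl elements of src under mask vm with the
// tail-undisturbed, mask-agnostic (_tum) policy. Tail elements (i >= vl)
// keep vd's previous value; inactive elements (vm[i] == 0) are
// mask-agnostic and may either keep vd or be overwritten with all ones.
static vint32m1_t reverse_i32m1_tum(vbool32_t vm, vint32m1_t vd,
                                    vint32m1_t src, size_t vl) {
  vuint32m1_t idx = __riscv_vid_v_u32m1(vl);      // idx[i] = i
  idx = __riscv_vrsub_vx_u32m1(idx, vl - 1, vl);  // idx[i] = vl - 1 - i
  return __riscv_vrgather_vv_i32m1_tum(vm, vd, src, idx, vl);
}

Because every index stays in [0, vl), no element reads past the valid prefix of src (vrgather returns zero for indices >= VLMAX).
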
// masked functions, tail-undisturbed/mask-undisturbed policy (_tumu suffix)
vfloat16mf4_t __riscv_vrgather_vv_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                              vfloat16mf4_t vs2,
                                              vuint16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vrgather_vx_f16mf4_tumu(vbool64_t vm, vfloat16mf4_t vd,
                                              vfloat16mf4_t vs2, size_t vs1,
                                              size_t vl);
vfloat16mf2_t __riscv_vrgather_vv_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                              vfloat16mf2_t vs2,
                                              vuint16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vrgather_vx_f16mf2_tumu(vbool32_t vm, vfloat16mf2_t vd,
                                              vfloat16mf2_t vs2, size_t vs1,
                                              size_t vl);
vfloat16m1_t __riscv_vrgather_vv_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                            vfloat16m1_t vs2, vuint16m1_t vs1,
                                            size_t vl);
vfloat16m1_t __riscv_vrgather_vx_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                            vfloat16m1_t vs2, size_t vs1,
                                            size_t vl);
vfloat16m2_t __riscv_vrgather_vv_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                            vfloat16m2_t vs2, vuint16m2_t vs1,
                                            size_t vl);
vfloat16m2_t __riscv_vrgather_vx_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                            vfloat16m2_t vs2, size_t vs1,
                                            size_t vl);
vfloat16m4_t __riscv_vrgather_vv_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                            vfloat16m4_t vs2, vuint16m4_t vs1,
                                            size_t vl);
vfloat16m4_t __riscv_vrgather_vx_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                            vfloat16m4_t vs2, size_t vs1,
                                            size_t vl);
vfloat16m8_t __riscv_vrgather_vv_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                            vfloat16m8_t vs2, vuint16m8_t vs1,
                                            size_t vl);
vfloat16m8_t __riscv_vrgather_vx_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                            vfloat16m8_t vs2, size_t vs1,
                                            size_t vl);
vfloat32mf2_t __riscv_vrgather_vv_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat32mf2_t vs2,
                                              vuint32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vrgather_vx_f32mf2_tumu(vbool64_t vm, vfloat32mf2_t vd,
                                              vfloat32mf2_t vs2, size_t vs1,
                                              size_t vl);
vfloat32m1_t __riscv_vrgather_vv_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat32m1_t vs2, vuint32m1_t vs1,
                                            size_t vl);
vfloat32m1_t __riscv_vrgather_vx_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                            vfloat32m1_t vs2, size_t vs1,
                                            size_t vl);
vfloat32m2_t __riscv_vrgather_vv_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat32m2_t vs2, vuint32m2_t vs1,
                                            size_t vl);
vfloat32m2_t __riscv_vrgather_vx_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                            vfloat32m2_t vs2, size_t vs1,
                                            size_t vl);
vfloat32m4_t __riscv_vrgather_vv_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat32m4_t vs2, vuint32m4_t vs1,
                                            size_t vl);
vfloat32m4_t __riscv_vrgather_vx_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                            vfloat32m4_t vs2, size_t vs1,
                                            size_t vl);
vfloat32m8_t __riscv_vrgather_vv_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat32m8_t vs2, vuint32m8_t vs1,
                                            size_t vl);
vfloat32m8_t __riscv_vrgather_vx_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                            vfloat32m8_t vs2, size_t vs1,
                                            size_t vl);
vfloat64m1_t __riscv_vrgather_vv_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat64m1_t vs2, vuint64m1_t vs1,
                                            size_t vl);
vfloat64m1_t __riscv_vrgather_vx_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                            vfloat64m1_t vs2, size_t vs1,
                                            size_t vl);
vfloat64m2_t __riscv_vrgather_vv_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat64m2_t vs2, vuint64m2_t vs1,
                                            size_t vl);
vfloat64m2_t __riscv_vrgather_vx_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                            vfloat64m2_t vs2, size_t vs1,
                                            size_t vl);
vfloat64m4_t __riscv_vrgather_vv_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat64m4_t vs2, vuint64m4_t vs1,
                                            size_t vl);
vfloat64m4_t __riscv_vrgather_vx_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                            vfloat64m4_t vs2, size_t vs1,
                                            size_t vl);
vfloat64m8_t __riscv_vrgather_vv_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat64m8_t vs2, vuint64m8_t vs1,
                                            size_t vl);
vfloat64m8_t __riscv_vrgather_vx_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                            vfloat64m8_t vs2, size_t vs1,
                                            size_t vl);
vfloat16mf4_t __riscv_vrgatherei16_vv_f16mf4_tumu(vbool64_t vm,
                                                  vfloat16mf4_t vd,
                                                  vfloat16mf4_t vs2,
                                                  vuint16mf4_t vs1, size_t vl);
vfloat16mf2_t __riscv_vrgatherei16_vv_f16mf2_tumu(vbool32_t vm,
                                                  vfloat16mf2_t vd,
                                                  vfloat16mf2_t vs2,
                                                  vuint16mf2_t vs1, size_t vl);
vfloat16m1_t __riscv_vrgatherei16_vv_f16m1_tumu(vbool16_t vm, vfloat16m1_t vd,
                                                vfloat16m1_t vs2,
                                                vuint16m1_t vs1, size_t vl);
vfloat16m2_t __riscv_vrgatherei16_vv_f16m2_tumu(vbool8_t vm, vfloat16m2_t vd,
                                                vfloat16m2_t vs2,
                                                vuint16m2_t vs1, size_t vl);
vfloat16m4_t __riscv_vrgatherei16_vv_f16m4_tumu(vbool4_t vm, vfloat16m4_t vd,
                                                vfloat16m4_t vs2,
                                                vuint16m4_t vs1, size_t vl);
vfloat16m8_t __riscv_vrgatherei16_vv_f16m8_tumu(vbool2_t vm, vfloat16m8_t vd,
                                                vfloat16m8_t vs2,
                                                vuint16m8_t vs1, size_t vl);
vfloat32mf2_t __riscv_vrgatherei16_vv_f32mf2_tumu(vbool64_t vm,
                                                  vfloat32mf2_t vd,
                                                  vfloat32mf2_t vs2,
                                                  vuint16mf4_t vs1, size_t vl);
vfloat32m1_t __riscv_vrgatherei16_vv_f32m1_tumu(vbool32_t vm, vfloat32m1_t vd,
                                                vfloat32m1_t vs2,
                                                vuint16mf2_t vs1, size_t vl);
vfloat32m2_t __riscv_vrgatherei16_vv_f32m2_tumu(vbool16_t vm, vfloat32m2_t vd,
                                                vfloat32m2_t vs2,
                                                vuint16m1_t vs1, size_t vl);
vfloat32m4_t __riscv_vrgatherei16_vv_f32m4_tumu(vbool8_t vm, vfloat32m4_t vd,
                                                vfloat32m4_t vs2,
                                                vuint16m2_t vs1, size_t vl);
vfloat32m8_t __riscv_vrgatherei16_vv_f32m8_tumu(vbool4_t vm, vfloat32m8_t vd,
                                                vfloat32m8_t vs2,
                                                vuint16m4_t vs1, size_t vl);
vfloat64m1_t __riscv_vrgatherei16_vv_f64m1_tumu(vbool64_t vm, vfloat64m1_t vd,
                                                vfloat64m1_t vs2,
                                                vuint16mf4_t vs1, size_t vl);
vfloat64m2_t __riscv_vrgatherei16_vv_f64m2_tumu(vbool32_t vm, vfloat64m2_t vd,
                                                vfloat64m2_t vs2,
                                                vuint16mf2_t vs1, size_t vl);
vfloat64m4_t __riscv_vrgatherei16_vv_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                                vfloat64m4_t vs2,
                                                vuint16m1_t vs1, size_t vl);
vfloat64m8_t __riscv_vrgatherei16_vv_f64m8_tumu(vbool8_t vm, vfloat64m8_t vd,
                                                vfloat64m8_t vs2,
                                                vuint16m2_t vs1, size_t vl);
vint8mf8_t __riscv_vrgather_vv_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                          vint8mf8_t vs2, vuint8mf8_t vs1,
                                          size_t vl);
vint8mf8_t __riscv_vrgather_vx_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                          vint8mf8_t vs2, size_t vs1,
                                          size_t vl);
vint8mf4_t __riscv_vrgather_vv_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                          vint8mf4_t vs2, vuint8mf4_t vs1,
                                          size_t vl);
vint8mf4_t __riscv_vrgather_vx_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                          vint8mf4_t vs2, size_t vs1,
                                          size_t vl);
vint8mf2_t __riscv_vrgather_vv_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                          vint8mf2_t vs2, vuint8mf2_t vs1,
                                          size_t vl);
vint8mf2_t __riscv_vrgather_vx_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                          vint8mf2_t vs2, size_t vs1,
                                          size_t vl);
vint8m1_t __riscv_vrgather_vv_i8m1_tumu(vbool8_t vm, vint8m1_t vd,
                                        vint8m1_t vs2, vuint8m1_t vs1,
                                        size_t vl);
vint8m1_t __riscv_vrgather_vx_i8m1_tumu(vbool8_t vm, vint8m1_t vd,
                                        vint8m1_t vs2, size_t vs1, size_t vl);
vint8m2_t __riscv_vrgather_vv_i8m2_tumu(vbool4_t vm, vint8m2_t vd,
                                        vint8m2_t vs2, vuint8m2_t vs1,
                                        size_t vl);
vint8m2_t __riscv_vrgather_vx_i8m2_tumu(vbool4_t vm, vint8m2_t vd,
                                        vint8m2_t vs2, size_t vs1, size_t vl);
vint8m4_t __riscv_vrgather_vv_i8m4_tumu(vbool2_t vm, vint8m4_t vd,
                                        vint8m4_t vs2, vuint8m4_t vs1,
                                        size_t vl);
vint8m4_t __riscv_vrgather_vx_i8m4_tumu(vbool2_t vm, vint8m4_t vd,
                                        vint8m4_t vs2, size_t vs1, size_t vl);
vint8m8_t __riscv_vrgather_vv_i8m8_tumu(vbool1_t vm, vint8m8_t vd,
                                        vint8m8_t vs2, vuint8m8_t vs1,
                                        size_t vl);
vint8m8_t __riscv_vrgather_vx_i8m8_tumu(vbool1_t vm, vint8m8_t vd,
                                        vint8m8_t vs2, size_t vs1, size_t vl);
vint16mf4_t __riscv_vrgather_vv_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                            vint16mf4_t vs2, vuint16mf4_t vs1,
                                            size_t vl);
vint16mf4_t __riscv_vrgather_vx_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                            vint16mf4_t vs2, size_t vs1,
                                            size_t vl);
vint16mf2_t __riscv_vrgather_vv_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                            vint16mf2_t vs2, vuint16mf2_t vs1,
                                            size_t vl);
vint16mf2_t __riscv_vrgather_vx_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                            vint16mf2_t vs2, size_t vs1,
                                            size_t vl);
vint16m1_t __riscv_vrgather_vv_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                          vint16m1_t vs2, vuint16m1_t vs1,
                                          size_t vl);
vint16m1_t __riscv_vrgather_vx_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                          vint16m1_t vs2, size_t vs1,
                                          size_t vl);
vint16m2_t __riscv_vrgather_vv_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                          vint16m2_t vs2, vuint16m2_t vs1,
                                          size_t vl);
vint16m2_t __riscv_vrgather_vx_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                          vint16m2_t vs2, size_t vs1,
                                          size_t vl);
vint16m4_t __riscv_vrgather_vv_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                          vint16m4_t vs2, vuint16m4_t vs1,
                                          size_t vl);
vint16m4_t __riscv_vrgather_vx_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                          vint16m4_t vs2, size_t vs1,
                                          size_t vl);
vint16m8_t __riscv_vrgather_vv_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                          vint16m8_t vs2, vuint16m8_t vs1,
                                          size_t vl);
vint16m8_t __riscv_vrgather_vx_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                          vint16m8_t vs2, size_t vs1,
                                          size_t vl);
vint32mf2_t __riscv_vrgather_vv_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                            vint32mf2_t vs2, vuint32mf2_t vs1,
                                            size_t vl);
vint32mf2_t __riscv_vrgather_vx_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                            vint32mf2_t vs2, size_t vs1,
                                            size_t vl);
vint32m1_t __riscv_vrgather_vv_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                          vint32m1_t vs2, vuint32m1_t vs1,
                                          size_t vl);
vint32m1_t __riscv_vrgather_vx_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                          vint32m1_t vs2, size_t vs1,
                                          size_t vl);
vint32m2_t __riscv_vrgather_vv_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                          vint32m2_t vs2, vuint32m2_t vs1,
                                          size_t vl);
vint32m2_t __riscv_vrgather_vx_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                          vint32m2_t vs2, size_t vs1,
                                          size_t vl);
vint32m4_t __riscv_vrgather_vv_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                          vint32m4_t vs2, vuint32m4_t vs1,
                                          size_t vl);
vint32m4_t __riscv_vrgather_vx_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                          vint32m4_t vs2, size_t vs1,
                                          size_t vl);
vint32m8_t __riscv_vrgather_vv_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                          vint32m8_t vs2, vuint32m8_t vs1,
                                          size_t vl);
vint32m8_t __riscv_vrgather_vx_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                          vint32m8_t vs2, size_t vs1,
                                          size_t vl);
vint64m1_t __riscv_vrgather_vv_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                          vint64m1_t vs2, vuint64m1_t vs1,
                                          size_t vl);
vint64m1_t __riscv_vrgather_vx_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                          vint64m1_t vs2, size_t vs1,
                                          size_t vl);
vint64m2_t __riscv_vrgather_vv_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                          vint64m2_t vs2, vuint64m2_t vs1,
                                          size_t vl);
vint64m2_t __riscv_vrgather_vx_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                          vint64m2_t vs2, size_t vs1,
                                          size_t vl);
vint64m4_t __riscv_vrgather_vv_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                          vint64m4_t vs2, vuint64m4_t vs1,
                                          size_t vl);
vint64m4_t __riscv_vrgather_vx_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                          vint64m4_t vs2, size_t vs1,
                                          size_t vl);
vint64m8_t __riscv_vrgather_vv_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                          vint64m8_t vs2, vuint64m8_t vs1,
                                          size_t vl);
vint64m8_t __riscv_vrgather_vx_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                          vint64m8_t vs2, size_t vs1,
                                          size_t vl);
vint8mf8_t __riscv_vrgatherei16_vv_i8mf8_tumu(vbool64_t vm, vint8mf8_t vd,
                                              vint8mf8_t vs2, vuint16mf4_t vs1,
                                              size_t vl);
vint8mf4_t __riscv_vrgatherei16_vv_i8mf4_tumu(vbool32_t vm, vint8mf4_t vd,
                                              vint8mf4_t vs2, vuint16mf2_t vs1,
                                              size_t vl);
vint8mf2_t __riscv_vrgatherei16_vv_i8mf2_tumu(vbool16_t vm, vint8mf2_t vd,
                                              vint8mf2_t vs2, vuint16m1_t vs1,
                                              size_t vl);
vint8m1_t __riscv_vrgatherei16_vv_i8m1_tumu(vbool8_t vm, vint8m1_t vd,
                                            vint8m1_t vs2, vuint16m2_t vs1,
                                            size_t vl);
vint8m2_t __riscv_vrgatherei16_vv_i8m2_tumu(vbool4_t vm, vint8m2_t vd,
                                            vint8m2_t vs2, vuint16m4_t vs1,
                                            size_t vl);
vint8m4_t __riscv_vrgatherei16_vv_i8m4_tumu(vbool2_t vm, vint8m4_t vd,
                                            vint8m4_t vs2, vuint16m8_t vs1,
                                            size_t vl);
vint16mf4_t __riscv_vrgatherei16_vv_i16mf4_tumu(vbool64_t vm, vint16mf4_t vd,
                                                vint16mf4_t vs2,
                                                vuint16mf4_t vs1, size_t vl);
vint16mf2_t __riscv_vrgatherei16_vv_i16mf2_tumu(vbool32_t vm, vint16mf2_t vd,
                                                vint16mf2_t vs2,
                                                vuint16mf2_t vs1, size_t vl);
vint16m1_t __riscv_vrgatherei16_vv_i16m1_tumu(vbool16_t vm, vint16m1_t vd,
                                              vint16m1_t vs2, vuint16m1_t vs1,
                                              size_t vl);
vint16m2_t __riscv_vrgatherei16_vv_i16m2_tumu(vbool8_t vm, vint16m2_t vd,
                                              vint16m2_t vs2, vuint16m2_t vs1,
                                              size_t vl);
vint16m4_t __riscv_vrgatherei16_vv_i16m4_tumu(vbool4_t vm, vint16m4_t vd,
                                              vint16m4_t vs2, vuint16m4_t vs1,
                                              size_t vl);
vint16m8_t __riscv_vrgatherei16_vv_i16m8_tumu(vbool2_t vm, vint16m8_t vd,
                                              vint16m8_t vs2, vuint16m8_t vs1,
                                              size_t vl);
vint32mf2_t __riscv_vrgatherei16_vv_i32mf2_tumu(vbool64_t vm, vint32mf2_t vd,
                                                vint32mf2_t vs2,
                                                vuint16mf4_t vs1, size_t vl);
vint32m1_t __riscv_vrgatherei16_vv_i32m1_tumu(vbool32_t vm, vint32m1_t vd,
                                              vint32m1_t vs2, vuint16mf2_t vs1,
                                              size_t vl);
vint32m2_t __riscv_vrgatherei16_vv_i32m2_tumu(vbool16_t vm, vint32m2_t vd,
                                              vint32m2_t vs2, vuint16m1_t vs1,
                                              size_t vl);
vint32m4_t __riscv_vrgatherei16_vv_i32m4_tumu(vbool8_t vm, vint32m4_t vd,
                                              vint32m4_t vs2, vuint16m2_t vs1,
                                              size_t vl);
vint32m8_t __riscv_vrgatherei16_vv_i32m8_tumu(vbool4_t vm, vint32m8_t vd,
                                              vint32m8_t vs2, vuint16m4_t vs1,
                                              size_t vl);
vint64m1_t __riscv_vrgatherei16_vv_i64m1_tumu(vbool64_t vm, vint64m1_t vd,
                                              vint64m1_t vs2, vuint16mf4_t vs1,
                                              size_t vl);
vint64m2_t __riscv_vrgatherei16_vv_i64m2_tumu(vbool32_t vm, vint64m2_t vd,
                                              vint64m2_t vs2, vuint16mf2_t vs1,
                                              size_t vl);
vint64m4_t __riscv_vrgatherei16_vv_i64m4_tumu(vbool16_t vm, vint64m4_t vd,
                                              vint64m4_t vs2, vuint16m1_t vs1,
                                              size_t vl);
vint64m8_t __riscv_vrgatherei16_vv_i64m8_tumu(vbool8_t vm, vint64m8_t vd,
                                              vint64m8_t vs2, vuint16m2_t vs1,
                                              size_t vl);
vuint8mf8_t __riscv_vrgather_vv_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                           vuint8mf8_t vs2, vuint8mf8_t vs1,
                                           size_t vl);
vuint8mf8_t __riscv_vrgather_vx_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                           vuint8mf8_t vs2, size_t vs1,
                                           size_t vl);
vuint8mf4_t __riscv_vrgather_vv_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                           vuint8mf4_t vs2, vuint8mf4_t vs1,
                                           size_t vl);
vuint8mf4_t __riscv_vrgather_vx_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                           vuint8mf4_t vs2, size_t vs1,
                                           size_t vl);
vuint8mf2_t __riscv_vrgather_vv_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                           vuint8mf2_t vs2, vuint8mf2_t vs1,
                                           size_t vl);
vuint8mf2_t __riscv_vrgather_vx_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                           vuint8mf2_t vs2, size_t vs1,
                                           size_t vl);
vuint8m1_t __riscv_vrgather_vv_u8m1_tumu(vbool8_t vm, vuint8m1_t vd,
                                         vuint8m1_t vs2, vuint8m1_t vs1,
                                         size_t vl);
vuint8m1_t __riscv_vrgather_vx_u8m1_tumu(vbool8_t vm, vuint8m1_t vd,
                                         vuint8m1_t vs2, size_t vs1, size_t vl);
vuint8m2_t __riscv_vrgather_vv_u8m2_tumu(vbool4_t vm, vuint8m2_t vd,
                                         vuint8m2_t vs2, vuint8m2_t vs1,
                                         size_t vl);
vuint8m2_t __riscv_vrgather_vx_u8m2_tumu(vbool4_t vm, vuint8m2_t vd,
                                         vuint8m2_t vs2, size_t vs1, size_t vl);
vuint8m4_t __riscv_vrgather_vv_u8m4_tumu(vbool2_t vm, vuint8m4_t vd,
                                         vuint8m4_t vs2, vuint8m4_t vs1,
                                         size_t vl);
vuint8m4_t __riscv_vrgather_vx_u8m4_tumu(vbool2_t vm, vuint8m4_t vd,
                                         vuint8m4_t vs2, size_t vs1, size_t vl);
vuint8m8_t __riscv_vrgather_vv_u8m8_tumu(vbool1_t vm, vuint8m8_t vd,
                                         vuint8m8_t vs2, vuint8m8_t vs1,
                                         size_t vl);
vuint8m8_t __riscv_vrgather_vx_u8m8_tumu(vbool1_t vm, vuint8m8_t vd,
                                         vuint8m8_t vs2, size_t vs1, size_t vl);
vuint16mf4_t __riscv_vrgather_vv_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                             vuint16mf4_t vs2, vuint16mf4_t vs1,
                                             size_t vl);
vuint16mf4_t __riscv_vrgather_vx_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                             vuint16mf4_t vs2, size_t vs1,
                                             size_t vl);
vuint16mf2_t __riscv_vrgather_vv_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                             vuint16mf2_t vs2, vuint16mf2_t vs1,
                                             size_t vl);
vuint16mf2_t __riscv_vrgather_vx_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                             vuint16mf2_t vs2, size_t vs1,
                                             size_t vl);
vuint16m1_t __riscv_vrgather_vv_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                           vuint16m1_t vs2, vuint16m1_t vs1,
                                           size_t vl);
vuint16m1_t __riscv_vrgather_vx_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                           vuint16m1_t vs2, size_t vs1,
                                           size_t vl);
vuint16m2_t __riscv_vrgather_vv_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                           vuint16m2_t vs2, vuint16m2_t vs1,
                                           size_t vl);
vuint16m2_t __riscv_vrgather_vx_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                           vuint16m2_t vs2, size_t vs1,
                                           size_t vl);
vuint16m4_t __riscv_vrgather_vv_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                           vuint16m4_t vs2, vuint16m4_t vs1,
                                           size_t vl);
vuint16m4_t __riscv_vrgather_vx_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                           vuint16m4_t vs2, size_t vs1,
                                           size_t vl);
vuint16m8_t __riscv_vrgather_vv_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                           vuint16m8_t vs2, vuint16m8_t vs1,
                                           size_t vl);
vuint16m8_t __riscv_vrgather_vx_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                           vuint16m8_t vs2, size_t vs1,
                                           size_t vl);
vuint32mf2_t __riscv_vrgather_vv_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                             vuint32mf2_t vs2, vuint32mf2_t vs1,
                                             size_t vl);
vuint32mf2_t __riscv_vrgather_vx_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                             vuint32mf2_t vs2, size_t vs1,
                                             size_t vl);
vuint32m1_t __riscv_vrgather_vv_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                           vuint32m1_t vs2, vuint32m1_t vs1,
                                           size_t vl);
vuint32m1_t __riscv_vrgather_vx_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                           vuint32m1_t vs2, size_t vs1,
                                           size_t vl);
vuint32m2_t __riscv_vrgather_vv_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                           vuint32m2_t vs2, vuint32m2_t vs1,
                                           size_t vl);
vuint32m2_t __riscv_vrgather_vx_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                           vuint32m2_t vs2, size_t vs1,
                                           size_t vl);
vuint32m4_t __riscv_vrgather_vv_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                           vuint32m4_t vs2, vuint32m4_t vs1,
                                           size_t vl);
vuint32m4_t __riscv_vrgather_vx_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                           vuint32m4_t vs2, size_t vs1,
                                           size_t vl);
vuint32m8_t __riscv_vrgather_vv_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                           vuint32m8_t vs2, vuint32m8_t vs1,
                                           size_t vl);
vuint32m8_t __riscv_vrgather_vx_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                           vuint32m8_t vs2, size_t vs1,
                                           size_t vl);
vuint64m1_t __riscv_vrgather_vv_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                           vuint64m1_t vs2, vuint64m1_t vs1,
                                           size_t vl);
vuint64m1_t __riscv_vrgather_vx_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                           vuint64m1_t vs2, size_t vs1,
                                           size_t vl);
vuint64m2_t __riscv_vrgather_vv_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                           vuint64m2_t vs2, vuint64m2_t vs1,
                                           size_t vl);
vuint64m2_t __riscv_vrgather_vx_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                           vuint64m2_t vs2, size_t vs1,
                                           size_t vl);
vuint64m4_t __riscv_vrgather_vv_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                           vuint64m4_t vs2, vuint64m4_t vs1,
                                           size_t vl);
vuint64m4_t __riscv_vrgather_vx_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                           vuint64m4_t vs2, size_t vs1,
                                           size_t vl);
vuint64m8_t __riscv_vrgather_vv_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                           vuint64m8_t vs2, vuint64m8_t vs1,
                                           size_t vl);
vuint64m8_t __riscv_vrgather_vx_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                           vuint64m8_t vs2, size_t vs1,
                                           size_t vl);
vuint8mf8_t __riscv_vrgatherei16_vv_u8mf8_tumu(vbool64_t vm, vuint8mf8_t vd,
                                               vuint8mf8_t vs2,
                                               vuint16mf4_t vs1, size_t vl);
vuint8mf4_t __riscv_vrgatherei16_vv_u8mf4_tumu(vbool32_t vm, vuint8mf4_t vd,
                                               vuint8mf4_t vs2,
                                               vuint16mf2_t vs1, size_t vl);
vuint8mf2_t __riscv_vrgatherei16_vv_u8mf2_tumu(vbool16_t vm, vuint8mf2_t vd,
                                               vuint8mf2_t vs2, vuint16m1_t vs1,
                                               size_t vl);
vuint8m1_t __riscv_vrgatherei16_vv_u8m1_tumu(vbool8_t vm, vuint8m1_t vd,
                                             vuint8m1_t vs2, vuint16m2_t vs1,
                                             size_t vl);
vuint8m2_t __riscv_vrgatherei16_vv_u8m2_tumu(vbool4_t vm, vuint8m2_t vd,
                                             vuint8m2_t vs2, vuint16m4_t vs1,
                                             size_t vl);
vuint8m4_t __riscv_vrgatherei16_vv_u8m4_tumu(vbool2_t vm, vuint8m4_t vd,
                                             vuint8m4_t vs2, vuint16m8_t vs1,
                                             size_t vl);
vuint16mf4_t __riscv_vrgatherei16_vv_u16mf4_tumu(vbool64_t vm, vuint16mf4_t vd,
                                                 vuint16mf4_t vs2,
                                                 vuint16mf4_t vs1, size_t vl);
vuint16mf2_t __riscv_vrgatherei16_vv_u16mf2_tumu(vbool32_t vm, vuint16mf2_t vd,
                                                 vuint16mf2_t vs2,
                                                 vuint16mf2_t vs1, size_t vl);
vuint16m1_t __riscv_vrgatherei16_vv_u16m1_tumu(vbool16_t vm, vuint16m1_t vd,
                                               vuint16m1_t vs2, vuint16m1_t vs1,
                                               size_t vl);
vuint16m2_t __riscv_vrgatherei16_vv_u16m2_tumu(vbool8_t vm, vuint16m2_t vd,
                                               vuint16m2_t vs2, vuint16m2_t vs1,
                                               size_t vl);
vuint16m4_t __riscv_vrgatherei16_vv_u16m4_tumu(vbool4_t vm, vuint16m4_t vd,
                                               vuint16m4_t vs2, vuint16m4_t vs1,
                                               size_t vl);
vuint16m8_t __riscv_vrgatherei16_vv_u16m8_tumu(vbool2_t vm, vuint16m8_t vd,
                                               vuint16m8_t vs2, vuint16m8_t vs1,
                                               size_t vl);
vuint32mf2_t __riscv_vrgatherei16_vv_u32mf2_tumu(vbool64_t vm, vuint32mf2_t vd,
                                                 vuint32mf2_t vs2,
                                                 vuint16mf4_t vs1, size_t vl);
vuint32m1_t __riscv_vrgatherei16_vv_u32m1_tumu(vbool32_t vm, vuint32m1_t vd,
                                               vuint32m1_t vs2,
                                               vuint16mf2_t vs1, size_t vl);
vuint32m2_t __riscv_vrgatherei16_vv_u32m2_tumu(vbool16_t vm, vuint32m2_t vd,
                                               vuint32m2_t vs2, vuint16m1_t vs1,
                                               size_t vl);
vuint32m4_t __riscv_vrgatherei16_vv_u32m4_tumu(vbool8_t vm, vuint32m4_t vd,
                                               vuint32m4_t vs2, vuint16m2_t vs1,
                                               size_t vl);
vuint32m8_t __riscv_vrgatherei16_vv_u32m8_tumu(vbool4_t vm, vuint32m8_t vd,
                                               vuint32m8_t vs2, vuint16m4_t vs1,
                                               size_t vl);
vuint64m1_t __riscv_vrgatherei16_vv_u64m1_tumu(vbool64_t vm, vuint64m1_t vd,
                                               vuint64m1_t vs2,
                                               vuint16mf4_t vs1, size_t vl);
vuint64m2_t __riscv_vrgatherei16_vv_u64m2_tumu(vbool32_t vm, vuint64m2_t vd,
                                               vuint64m2_t vs2,
                                               vuint16mf2_t vs1, size_t vl);
vuint64m4_t __riscv_vrgatherei16_vv_u64m4_tumu(vbool16_t vm, vuint64m4_t vd,
                                               vuint64m4_t vs2, vuint16m1_t vs1,
                                               size_t vl);
vuint64m8_t __riscv_vrgatherei16_vv_u64m8_tumu(vbool8_t vm, vuint64m8_t vd,
                                               vuint64m8_t vs2, vuint16m2_t vs1,
                                               size_t vl);
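
A sketch of why the vrgatherei16 (_tumu) forms above are useful at wide SEW (illustrative only; the wrapper name permute_f64m4_tumu is hypothetical):

#include <riscv_vector.h>

// Masked 64-bit table permute with 16-bit indices under the
// tail-undisturbed, mask-undisturbed (_tumu) policy: both inactive
// elements (vm[i] == 0) and tail elements (i >= vl) keep vd's old value.
// A plain vrgather.vv on f64m4 would need vuint64m4_t indices (four
// registers); vrgatherei16 needs only vuint16m1_t (EMUL = 4 * 16/64 = 1).
static vfloat64m4_t permute_f64m4_tumu(vbool16_t vm, vfloat64m4_t vd,
                                       vfloat64m4_t table, vuint16m1_t idx,
                                       size_t vl) {
  return __riscv_vrgatherei16_vv_f64m4_tumu(vm, vd, table, idx, vl);
}
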
// masked functions, tail-agnostic/mask-undisturbed policy (_mu suffix)
vfloat16mf4_t __riscv_vrgather_vv_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                            vfloat16mf4_t vs2, vuint16mf4_t vs1,
                                            size_t vl);
vfloat16mf4_t __riscv_vrgather_vx_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                            vfloat16mf4_t vs2, size_t vs1,
                                            size_t vl);
vfloat16mf2_t __riscv_vrgather_vv_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                            vfloat16mf2_t vs2, vuint16mf2_t vs1,
                                            size_t vl);
vfloat16mf2_t __riscv_vrgather_vx_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                            vfloat16mf2_t vs2, size_t vs1,
                                            size_t vl);
vfloat16m1_t __riscv_vrgather_vv_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                          vfloat16m1_t vs2, vuint16m1_t vs1,
                                          size_t vl);
vfloat16m1_t __riscv_vrgather_vx_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                          vfloat16m1_t vs2, size_t vs1,
                                          size_t vl);
vfloat16m2_t __riscv_vrgather_vv_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                          vfloat16m2_t vs2, vuint16m2_t vs1,
                                          size_t vl);
vfloat16m2_t __riscv_vrgather_vx_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                          vfloat16m2_t vs2, size_t vs1,
                                          size_t vl);
vfloat16m4_t __riscv_vrgather_vv_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                          vfloat16m4_t vs2, vuint16m4_t vs1,
                                          size_t vl);
vfloat16m4_t __riscv_vrgather_vx_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                          vfloat16m4_t vs2, size_t vs1,
                                          size_t vl);
vfloat16m8_t __riscv_vrgather_vv_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                          vfloat16m8_t vs2, vuint16m8_t vs1,
                                          size_t vl);
vfloat16m8_t __riscv_vrgather_vx_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                          vfloat16m8_t vs2, size_t vs1,
                                          size_t vl);
vfloat32mf2_t __riscv_vrgather_vv_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs2, vuint32mf2_t vs1,
                                            size_t vl);
vfloat32mf2_t __riscv_vrgather_vx_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                            vfloat32mf2_t vs2, size_t vs1,
                                            size_t vl);
vfloat32m1_t __riscv_vrgather_vv_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs2, vuint32m1_t vs1,
                                          size_t vl);
vfloat32m1_t __riscv_vrgather_vx_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                          vfloat32m1_t vs2, size_t vs1,
                                          size_t vl);
vfloat32m2_t __riscv_vrgather_vv_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs2, vuint32m2_t vs1,
                                          size_t vl);
vfloat32m2_t __riscv_vrgather_vx_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                          vfloat32m2_t vs2, size_t vs1,
                                          size_t vl);
vfloat32m4_t __riscv_vrgather_vv_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs2, vuint32m4_t vs1,
                                          size_t vl);
vfloat32m4_t __riscv_vrgather_vx_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                          vfloat32m4_t vs2, size_t vs1,
                                          size_t vl);
vfloat32m8_t __riscv_vrgather_vv_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs2, vuint32m8_t vs1,
                                          size_t vl);
vfloat32m8_t __riscv_vrgather_vx_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                          vfloat32m8_t vs2, size_t vs1,
                                          size_t vl);
vfloat64m1_t __riscv_vrgather_vv_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs2, vuint64m1_t vs1,
                                          size_t vl);
vfloat64m1_t __riscv_vrgather_vx_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                          vfloat64m1_t vs2, size_t vs1,
                                          size_t vl);
vfloat64m2_t __riscv_vrgather_vv_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs2, vuint64m2_t vs1,
                                          size_t vl);
vfloat64m2_t __riscv_vrgather_vx_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                          vfloat64m2_t vs2, size_t vs1,
                                          size_t vl);
vfloat64m4_t __riscv_vrgather_vv_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs2, vuint64m4_t vs1,
                                          size_t vl);
vfloat64m4_t __riscv_vrgather_vx_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                          vfloat64m4_t vs2, size_t vs1,
                                          size_t vl);
vfloat64m8_t __riscv_vrgather_vv_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs2, vuint64m8_t vs1,
                                          size_t vl);
vfloat64m8_t __riscv_vrgather_vx_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                          vfloat64m8_t vs2, size_t vs1,
                                          size_t vl);
vfloat16mf4_t __riscv_vrgatherei16_vv_f16mf4_mu(vbool64_t vm, vfloat16mf4_t vd,
                                                vfloat16mf4_t vs2,
                                                vuint16mf4_t vs1, size_t vl);
vfloat16mf2_t __riscv_vrgatherei16_vv_f16mf2_mu(vbool32_t vm, vfloat16mf2_t vd,
                                                vfloat16mf2_t vs2,
                                                vuint16mf2_t vs1, size_t vl);
vfloat16m1_t __riscv_vrgatherei16_vv_f16m1_mu(vbool16_t vm, vfloat16m1_t vd,
                                              vfloat16m1_t vs2, vuint16m1_t vs1,
                                              size_t vl);
vfloat16m2_t __riscv_vrgatherei16_vv_f16m2_mu(vbool8_t vm, vfloat16m2_t vd,
                                              vfloat16m2_t vs2, vuint16m2_t vs1,
                                              size_t vl);
vfloat16m4_t __riscv_vrgatherei16_vv_f16m4_mu(vbool4_t vm, vfloat16m4_t vd,
                                              vfloat16m4_t vs2, vuint16m4_t vs1,
                                              size_t vl);
vfloat16m8_t __riscv_vrgatherei16_vv_f16m8_mu(vbool2_t vm, vfloat16m8_t vd,
                                              vfloat16m8_t vs2, vuint16m8_t vs1,
                                              size_t vl);
vfloat32mf2_t __riscv_vrgatherei16_vv_f32mf2_mu(vbool64_t vm, vfloat32mf2_t vd,
                                                vfloat32mf2_t vs2,
                                                vuint16mf4_t vs1, size_t vl);
vfloat32m1_t __riscv_vrgatherei16_vv_f32m1_mu(vbool32_t vm, vfloat32m1_t vd,
                                              vfloat32m1_t vs2,
                                              vuint16mf2_t vs1, size_t vl);
vfloat32m2_t __riscv_vrgatherei16_vv_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                              vfloat32m2_t vs2, vuint16m1_t vs1,
                                              size_t vl);
vfloat32m4_t __riscv_vrgatherei16_vv_f32m4_mu(vbool8_t vm, vfloat32m4_t vd,
                                              vfloat32m4_t vs2, vuint16m2_t vs1,
                                              size_t vl);
vfloat32m8_t __riscv_vrgatherei16_vv_f32m8_mu(vbool4_t vm, vfloat32m8_t vd,
                                              vfloat32m8_t vs2, vuint16m4_t vs1,
                                              size_t vl);
vfloat64m1_t __riscv_vrgatherei16_vv_f64m1_mu(vbool64_t vm, vfloat64m1_t vd,
                                              vfloat64m1_t vs2,
                                              vuint16mf4_t vs1, size_t vl);
vfloat64m2_t __riscv_vrgatherei16_vv_f64m2_mu(vbool32_t vm, vfloat64m2_t vd,
                                              vfloat64m2_t vs2,
                                              vuint16mf2_t vs1, size_t vl);
vfloat64m4_t __riscv_vrgatherei16_vv_f64m4_mu(vbool16_t vm, vfloat64m4_t vd,
                                              vfloat64m4_t vs2, vuint16m1_t vs1,
                                              size_t vl);
vfloat64m8_t __riscv_vrgatherei16_vv_f64m8_mu(vbool8_t vm, vfloat64m8_t vd,
                                              vfloat64m8_t vs2, vuint16m2_t vs1,
                                              size_t vl);
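
A sketch of the scalar-index (vrgather.vx) _mu form (illustrative only; the wrapper name splat_lane_f32m2_mu is hypothetical):

#include <riscv_vector.h>

// Splat src[lane] into the active elements of vd under the
// mask-undisturbed (_mu) policy. Inactive elements (vm[i] == 0) keep
// vd's previous value; tail elements (i >= vl) are tail-agnostic. An
// out-of-range lane (lane >= VLMAX) gathers the value zero.
static vfloat32m2_t splat_lane_f32m2_mu(vbool16_t vm, vfloat32m2_t vd,
                                        vfloat32m2_t src, size_t lane,
                                        size_t vl) {
  return __riscv_vrgather_vx_f32m2_mu(vm, vd, src, lane, vl);
}
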
vint8mf8_t __riscv_vrgather_vv_i8mf8_mu(vbool64_t vm, vint8mf8_t vd,
                                        vint8mf8_t vs2, vuint8mf8_t vs1,
                                        size_t vl);
vint8mf8_t __riscv_vrgather_vx_i8mf8_mu(vbool64_t vm, vint8mf8_t vd,
                                        vint8mf8_t vs2, size_t vs1, size_t vl);
vint8mf4_t __riscv_vrgather_vv_i8mf4_mu(vbool32_t vm, vint8mf4_t vd,
                                        vint8mf4_t vs2, vuint8mf4_t vs1,
                                        size_t vl);
vint8mf4_t __riscv_vrgather_vx_i8mf4_mu(vbool32_t vm, vint8mf4_t vd,
                                        vint8mf4_t vs2, size_t vs1, size_t vl);
vint8mf2_t __riscv_vrgather_vv_i8mf2_mu(vbool16_t vm, vint8mf2_t vd,
                                        vint8mf2_t vs2, vuint8mf2_t vs1,
                                        size_t vl);
vint8mf2_t __riscv_vrgather_vx_i8mf2_mu(vbool16_t vm, vint8mf2_t vd,
                                        vint8mf2_t vs2, size_t vs1, size_t vl);
vint8m1_t __riscv_vrgather_vv_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                      vuint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vrgather_vx_i8m1_mu(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                                      size_t vs1, size_t vl);
vint8m2_t __riscv_vrgather_vv_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                      vuint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vrgather_vx_i8m2_mu(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2,
                                      size_t vs1, size_t vl);
vint8m4_t __riscv_vrgather_vv_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                      vuint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vrgather_vx_i8m4_mu(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2,
                                      size_t vs1, size_t vl);
vint8m8_t __riscv_vrgather_vv_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                      vuint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vrgather_vx_i8m8_mu(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2,
                                      size_t vs1, size_t vl);
vint16mf4_t __riscv_vrgather_vv_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                          vint16mf4_t vs2, vuint16mf4_t vs1,
                                          size_t vl);
vint16mf4_t __riscv_vrgather_vx_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                          vint16mf4_t vs2, size_t vs1,
                                          size_t vl);
vint16mf2_t __riscv_vrgather_vv_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                          vint16mf2_t vs2, vuint16mf2_t vs1,
                                          size_t vl);
vint16mf2_t __riscv_vrgather_vx_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                          vint16mf2_t vs2, size_t vs1,
                                          size_t vl);
vint16m1_t __riscv_vrgather_vv_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                        vint16m1_t vs2, vuint16m1_t vs1,
                                        size_t vl);
vint16m1_t __riscv_vrgather_vx_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                        vint16m1_t vs2, size_t vs1, size_t vl);
vint16m2_t __riscv_vrgather_vv_i16m2_mu(vbool8_t vm, vint16m2_t vd,
                                        vint16m2_t vs2, vuint16m2_t vs1,
                                        size_t vl);
vint16m2_t __riscv_vrgather_vx_i16m2_mu(vbool8_t vm, vint16m2_t vd,
                                        vint16m2_t vs2, size_t vs1, size_t vl);
vint16m4_t __riscv_vrgather_vv_i16m4_mu(vbool4_t vm, vint16m4_t vd,
                                        vint16m4_t vs2, vuint16m4_t vs1,
                                        size_t vl);
vint16m4_t __riscv_vrgather_vx_i16m4_mu(vbool4_t vm, vint16m4_t vd,
                                        vint16m4_t vs2, size_t vs1, size_t vl);
vint16m8_t __riscv_vrgather_vv_i16m8_mu(vbool2_t vm, vint16m8_t vd,
                                        vint16m8_t vs2, vuint16m8_t vs1,
                                        size_t vl);
vint16m8_t __riscv_vrgather_vx_i16m8_mu(vbool2_t vm, vint16m8_t vd,
                                        vint16m8_t vs2, size_t vs1, size_t vl);
vint32mf2_t __riscv_vrgather_vv_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                          vint32mf2_t vs2, vuint32mf2_t vs1,
                                          size_t vl);
vint32mf2_t __riscv_vrgather_vx_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                          vint32mf2_t vs2, size_t vs1,
                                          size_t vl);
vint32m1_t __riscv_vrgather_vv_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                        vint32m1_t vs2, vuint32m1_t vs1,
                                        size_t vl);
vint32m1_t __riscv_vrgather_vx_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                        vint32m1_t vs2, size_t vs1, size_t vl);
vint32m2_t __riscv_vrgather_vv_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                        vint32m2_t vs2, vuint32m2_t vs1,
                                        size_t vl);
vint32m2_t __riscv_vrgather_vx_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                        vint32m2_t vs2, size_t vs1, size_t vl);
vint32m4_t __riscv_vrgather_vv_i32m4_mu(vbool8_t vm, vint32m4_t vd,
                                        vint32m4_t vs2, vuint32m4_t vs1,
                                        size_t vl);
vint32m4_t __riscv_vrgather_vx_i32m4_mu(vbool8_t vm, vint32m4_t vd,
                                        vint32m4_t vs2, size_t vs1, size_t vl);
vint32m8_t __riscv_vrgather_vv_i32m8_mu(vbool4_t vm, vint32m8_t vd,
                                        vint32m8_t vs2, vuint32m8_t vs1,
                                        size_t vl);
vint32m8_t __riscv_vrgather_vx_i32m8_mu(vbool4_t vm, vint32m8_t vd,
                                        vint32m8_t vs2, size_t vs1, size_t vl);
vint64m1_t __riscv_vrgather_vv_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                        vint64m1_t vs2, vuint64m1_t vs1,
                                        size_t vl);
vint64m1_t __riscv_vrgather_vx_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                        vint64m1_t vs2, size_t vs1, size_t vl);
vint64m2_t __riscv_vrgather_vv_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                        vint64m2_t vs2, vuint64m2_t vs1,
                                        size_t vl);
vint64m2_t __riscv_vrgather_vx_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                        vint64m2_t vs2, size_t vs1, size_t vl);
vint64m4_t __riscv_vrgather_vv_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                        vint64m4_t vs2, vuint64m4_t vs1,
                                        size_t vl);
vint64m4_t __riscv_vrgather_vx_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                        vint64m4_t vs2, size_t vs1, size_t vl);
vint64m8_t __riscv_vrgather_vv_i64m8_mu(vbool8_t vm, vint64m8_t vd,
                                        vint64m8_t vs2, vuint64m8_t vs1,
                                        size_t vl);
vint64m8_t __riscv_vrgather_vx_i64m8_mu(vbool8_t vm, vint64m8_t vd,
                                        vint64m8_t vs2, size_t vs1, size_t vl);
vint8mf8_t __riscv_vrgatherei16_vv_i8mf8_mu(vbool64_t vm, vint8mf8_t vd,
                                            vint8mf8_t vs2, vuint16mf4_t vs1,
                                            size_t vl);
vint8mf4_t __riscv_vrgatherei16_vv_i8mf4_mu(vbool32_t vm, vint8mf4_t vd,
                                            vint8mf4_t vs2, vuint16mf2_t vs1,
                                            size_t vl);
vint8mf2_t __riscv_vrgatherei16_vv_i8mf2_mu(vbool16_t vm, vint8mf2_t vd,
                                            vint8mf2_t vs2, vuint16m1_t vs1,
                                            size_t vl);
vint8m1_t __riscv_vrgatherei16_vv_i8m1_mu(vbool8_t vm, vint8m1_t vd,
                                          vint8m1_t vs2, vuint16m2_t vs1,
                                          size_t vl);
vint8m2_t __riscv_vrgatherei16_vv_i8m2_mu(vbool4_t vm, vint8m2_t vd,
                                          vint8m2_t vs2, vuint16m4_t vs1,
                                          size_t vl);
vint8m4_t __riscv_vrgatherei16_vv_i8m4_mu(vbool2_t vm, vint8m4_t vd,
                                          vint8m4_t vs2, vuint16m8_t vs1,
                                          size_t vl);
vint16mf4_t __riscv_vrgatherei16_vv_i16mf4_mu(vbool64_t vm, vint16mf4_t vd,
                                              vint16mf4_t vs2, vuint16mf4_t vs1,
                                              size_t vl);
vint16mf2_t __riscv_vrgatherei16_vv_i16mf2_mu(vbool32_t vm, vint16mf2_t vd,
                                              vint16mf2_t vs2, vuint16mf2_t vs1,
                                              size_t vl);
vint16m1_t __riscv_vrgatherei16_vv_i16m1_mu(vbool16_t vm, vint16m1_t vd,
                                            vint16m1_t vs2, vuint16m1_t vs1,
                                            size_t vl);
vint16m2_t __riscv_vrgatherei16_vv_i16m2_mu(vbool8_t vm, vint16m2_t vd,
                                            vint16m2_t vs2, vuint16m2_t vs1,
                                            size_t vl);
vint16m4_t __riscv_vrgatherei16_vv_i16m4_mu(vbool4_t vm, vint16m4_t vd,
                                            vint16m4_t vs2, vuint16m4_t vs1,
                                            size_t vl);
vint16m8_t __riscv_vrgatherei16_vv_i16m8_mu(vbool2_t vm, vint16m8_t vd,
                                            vint16m8_t vs2, vuint16m8_t vs1,
                                            size_t vl);
vint32mf2_t __riscv_vrgatherei16_vv_i32mf2_mu(vbool64_t vm, vint32mf2_t vd,
                                              vint32mf2_t vs2, vuint16mf4_t vs1,
                                              size_t vl);
vint32m1_t __riscv_vrgatherei16_vv_i32m1_mu(vbool32_t vm, vint32m1_t vd,
                                            vint32m1_t vs2, vuint16mf2_t vs1,
                                            size_t vl);
vint32m2_t __riscv_vrgatherei16_vv_i32m2_mu(vbool16_t vm, vint32m2_t vd,
                                            vint32m2_t vs2, vuint16m1_t vs1,
                                            size_t vl);
vint32m4_t __riscv_vrgatherei16_vv_i32m4_mu(vbool8_t vm, vint32m4_t vd,
                                            vint32m4_t vs2, vuint16m2_t vs1,
                                            size_t vl);
vint32m8_t __riscv_vrgatherei16_vv_i32m8_mu(vbool4_t vm, vint32m8_t vd,
                                            vint32m8_t vs2, vuint16m4_t vs1,
                                            size_t vl);
vint64m1_t __riscv_vrgatherei16_vv_i64m1_mu(vbool64_t vm, vint64m1_t vd,
                                            vint64m1_t vs2, vuint16mf4_t vs1,
                                            size_t vl);
vint64m2_t __riscv_vrgatherei16_vv_i64m2_mu(vbool32_t vm, vint64m2_t vd,
                                            vint64m2_t vs2, vuint16mf2_t vs1,
                                            size_t vl);
vint64m4_t __riscv_vrgatherei16_vv_i64m4_mu(vbool16_t vm, vint64m4_t vd,
                                            vint64m4_t vs2, vuint16m1_t vs1,
                                            size_t vl);
vint64m8_t __riscv_vrgatherei16_vv_i64m8_mu(vbool8_t vm, vint64m8_t vd,
                                            vint64m8_t vs2, vuint16m2_t vs1,
                                            size_t vl);
vuint8mf8_t __riscv_vrgather_vv_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                         vuint8mf8_t vs2, vuint8mf8_t vs1,
                                         size_t vl);
vuint8mf8_t __riscv_vrgather_vx_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                         vuint8mf8_t vs2, size_t vs1,
                                         size_t vl);
vuint8mf4_t __riscv_vrgather_vv_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                         vuint8mf4_t vs2, vuint8mf4_t vs1,
                                         size_t vl);
vuint8mf4_t __riscv_vrgather_vx_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                         vuint8mf4_t vs2, size_t vs1,
                                         size_t vl);
vuint8mf2_t __riscv_vrgather_vv_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                         vuint8mf2_t vs2, vuint8mf2_t vs1,
                                         size_t vl);
vuint8mf2_t __riscv_vrgather_vx_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                         vuint8mf2_t vs2, size_t vs1,
                                         size_t vl);
vuint8m1_t __riscv_vrgather_vv_u8m1_mu(vbool8_t vm, vuint8m1_t vd,
                                       vuint8m1_t vs2, vuint8m1_t vs1,
                                       size_t vl);
vuint8m1_t __riscv_vrgather_vx_u8m1_mu(vbool8_t vm, vuint8m1_t vd,
                                       vuint8m1_t vs2, size_t vs1, size_t vl);
vuint8m2_t __riscv_vrgather_vv_u8m2_mu(vbool4_t vm, vuint8m2_t vd,
                                       vuint8m2_t vs2, vuint8m2_t vs1,
                                       size_t vl);
vuint8m2_t __riscv_vrgather_vx_u8m2_mu(vbool4_t vm, vuint8m2_t vd,
                                       vuint8m2_t vs2, size_t vs1, size_t vl);
vuint8m4_t __riscv_vrgather_vv_u8m4_mu(vbool2_t vm, vuint8m4_t vd,
                                       vuint8m4_t vs2, vuint8m4_t vs1,
                                       size_t vl);
vuint8m4_t __riscv_vrgather_vx_u8m4_mu(vbool2_t vm, vuint8m4_t vd,
                                       vuint8m4_t vs2, size_t vs1, size_t vl);
vuint8m8_t __riscv_vrgather_vv_u8m8_mu(vbool1_t vm, vuint8m8_t vd,
                                       vuint8m8_t vs2, vuint8m8_t vs1,
                                       size_t vl);
vuint8m8_t __riscv_vrgather_vx_u8m8_mu(vbool1_t vm, vuint8m8_t vd,
                                       vuint8m8_t vs2, size_t vs1, size_t vl);
vuint16mf4_t __riscv_vrgather_vv_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                           vuint16mf4_t vs2, vuint16mf4_t vs1,
                                           size_t vl);
vuint16mf4_t __riscv_vrgather_vx_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                           vuint16mf4_t vs2, size_t vs1,
                                           size_t vl);
vuint16mf2_t __riscv_vrgather_vv_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                           vuint16mf2_t vs2, vuint16mf2_t vs1,
                                           size_t vl);
vuint16mf2_t __riscv_vrgather_vx_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                           vuint16mf2_t vs2, size_t vs1,
                                           size_t vl);
vuint16m1_t __riscv_vrgather_vv_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                         vuint16m1_t vs2, vuint16m1_t vs1,
                                         size_t vl);
vuint16m1_t __riscv_vrgather_vx_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                         vuint16m1_t vs2, size_t vs1,
                                         size_t vl);
vuint16m2_t __riscv_vrgather_vv_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                         vuint16m2_t vs2, vuint16m2_t vs1,
                                         size_t vl);
vuint16m2_t __riscv_vrgather_vx_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                         vuint16m2_t vs2, size_t vs1,
                                         size_t vl);
vuint16m4_t __riscv_vrgather_vv_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                         vuint16m4_t vs2, vuint16m4_t vs1,
                                         size_t vl);
vuint16m4_t __riscv_vrgather_vx_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                         vuint16m4_t vs2, size_t vs1,
                                         size_t vl);
vuint16m8_t __riscv_vrgather_vv_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                         vuint16m8_t vs2, vuint16m8_t vs1,
                                         size_t vl);
vuint16m8_t __riscv_vrgather_vx_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                         vuint16m8_t vs2, size_t vs1,
                                         size_t vl);
vuint32mf2_t __riscv_vrgather_vv_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                           vuint32mf2_t vs2, vuint32mf2_t vs1,
                                           size_t vl);
vuint32mf2_t __riscv_vrgather_vx_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                           vuint32mf2_t vs2, size_t vs1,
                                           size_t vl);
vuint32m1_t __riscv_vrgather_vv_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                         vuint32m1_t vs2, vuint32m1_t vs1,
                                         size_t vl);
vuint32m1_t __riscv_vrgather_vx_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                         vuint32m1_t vs2, size_t vs1,
                                         size_t vl);
vuint32m2_t __riscv_vrgather_vv_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                         vuint32m2_t vs2, vuint32m2_t vs1,
                                         size_t vl);
vuint32m2_t __riscv_vrgather_vx_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                         vuint32m2_t vs2, size_t vs1,
                                         size_t vl);
vuint32m4_t __riscv_vrgather_vv_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                         vuint32m4_t vs2, vuint32m4_t vs1,
                                         size_t vl);
vuint32m4_t __riscv_vrgather_vx_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                         vuint32m4_t vs2, size_t vs1,
                                         size_t vl);
vuint32m8_t __riscv_vrgather_vv_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                         vuint32m8_t vs2, vuint32m8_t vs1,
                                         size_t vl);
vuint32m8_t __riscv_vrgather_vx_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                         vuint32m8_t vs2, size_t vs1,
                                         size_t vl);
vuint64m1_t __riscv_vrgather_vv_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                         vuint64m1_t vs2, vuint64m1_t vs1,
                                         size_t vl);
vuint64m1_t __riscv_vrgather_vx_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                         vuint64m1_t vs2, size_t vs1,
                                         size_t vl);
vuint64m2_t __riscv_vrgather_vv_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                         vuint64m2_t vs2, vuint64m2_t vs1,
                                         size_t vl);
vuint64m2_t __riscv_vrgather_vx_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                         vuint64m2_t vs2, size_t vs1,
                                         size_t vl);
vuint64m4_t __riscv_vrgather_vv_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                         vuint64m4_t vs2, vuint64m4_t vs1,
                                         size_t vl);
vuint64m4_t __riscv_vrgather_vx_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                         vuint64m4_t vs2, size_t vs1,
                                         size_t vl);
vuint64m8_t __riscv_vrgather_vv_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                         vuint64m8_t vs2, vuint64m8_t vs1,
                                         size_t vl);
vuint64m8_t __riscv_vrgather_vx_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                         vuint64m8_t vs2, size_t vs1,
                                         size_t vl);
vuint8mf8_t __riscv_vrgatherei16_vv_u8mf8_mu(vbool64_t vm, vuint8mf8_t vd,
                                             vuint8mf8_t vs2, vuint16mf4_t vs1,
                                             size_t vl);
vuint8mf4_t __riscv_vrgatherei16_vv_u8mf4_mu(vbool32_t vm, vuint8mf4_t vd,
                                             vuint8mf4_t vs2, vuint16mf2_t vs1,
                                             size_t vl);
vuint8mf2_t __riscv_vrgatherei16_vv_u8mf2_mu(vbool16_t vm, vuint8mf2_t vd,
                                             vuint8mf2_t vs2, vuint16m1_t vs1,
                                             size_t vl);
vuint8m1_t __riscv_vrgatherei16_vv_u8m1_mu(vbool8_t vm, vuint8m1_t vd,
                                           vuint8m1_t vs2, vuint16m2_t vs1,
                                           size_t vl);
vuint8m2_t __riscv_vrgatherei16_vv_u8m2_mu(vbool4_t vm, vuint8m2_t vd,
                                           vuint8m2_t vs2, vuint16m4_t vs1,
                                           size_t vl);
vuint8m4_t __riscv_vrgatherei16_vv_u8m4_mu(vbool2_t vm, vuint8m4_t vd,
                                           vuint8m4_t vs2, vuint16m8_t vs1,
                                           size_t vl);
vuint16mf4_t __riscv_vrgatherei16_vv_u16mf4_mu(vbool64_t vm, vuint16mf4_t vd,
                                               vuint16mf4_t vs2,
                                               vuint16mf4_t vs1, size_t vl);
vuint16mf2_t __riscv_vrgatherei16_vv_u16mf2_mu(vbool32_t vm, vuint16mf2_t vd,
                                               vuint16mf2_t vs2,
                                               vuint16mf2_t vs1, size_t vl);
vuint16m1_t __riscv_vrgatherei16_vv_u16m1_mu(vbool16_t vm, vuint16m1_t vd,
                                             vuint16m1_t vs2, vuint16m1_t vs1,
                                             size_t vl);
vuint16m2_t __riscv_vrgatherei16_vv_u16m2_mu(vbool8_t vm, vuint16m2_t vd,
                                             vuint16m2_t vs2, vuint16m2_t vs1,
                                             size_t vl);
vuint16m4_t __riscv_vrgatherei16_vv_u16m4_mu(vbool4_t vm, vuint16m4_t vd,
                                             vuint16m4_t vs2, vuint16m4_t vs1,
                                             size_t vl);
vuint16m8_t __riscv_vrgatherei16_vv_u16m8_mu(vbool2_t vm, vuint16m8_t vd,
                                             vuint16m8_t vs2, vuint16m8_t vs1,
                                             size_t vl);
vuint32mf2_t __riscv_vrgatherei16_vv_u32mf2_mu(vbool64_t vm, vuint32mf2_t vd,
                                               vuint32mf2_t vs2,
                                               vuint16mf4_t vs1, size_t vl);
vuint32m1_t __riscv_vrgatherei16_vv_u32m1_mu(vbool32_t vm, vuint32m1_t vd,
                                             vuint32m1_t vs2, vuint16mf2_t vs1,
                                             size_t vl);
vuint32m2_t __riscv_vrgatherei16_vv_u32m2_mu(vbool16_t vm, vuint32m2_t vd,
                                             vuint32m2_t vs2, vuint16m1_t vs1,
                                             size_t vl);
vuint32m4_t __riscv_vrgatherei16_vv_u32m4_mu(vbool8_t vm, vuint32m4_t vd,
                                             vuint32m4_t vs2, vuint16m2_t vs1,
                                             size_t vl);
vuint32m8_t __riscv_vrgatherei16_vv_u32m8_mu(vbool4_t vm, vuint32m8_t vd,
                                             vuint32m8_t vs2, vuint16m4_t vs1,
                                             size_t vl);
vuint64m1_t __riscv_vrgatherei16_vv_u64m1_mu(vbool64_t vm, vuint64m1_t vd,
                                             vuint64m1_t vs2, vuint16mf4_t vs1,
                                             size_t vl);
vuint64m2_t __riscv_vrgatherei16_vv_u64m2_mu(vbool32_t vm, vuint64m2_t vd,
                                             vuint64m2_t vs2, vuint16mf2_t vs1,
                                             size_t vl);
vuint64m4_t __riscv_vrgatherei16_vv_u64m4_mu(vbool16_t vm, vuint64m4_t vd,
                                             vuint64m4_t vs2, vuint16m1_t vs1,
                                             size_t vl);
vuint64m8_t __riscv_vrgatherei16_vv_u64m8_mu(vbool8_t vm, vuint64m8_t vd,
                                             vuint64m8_t vs2, vuint16m2_t vs1,
                                             size_t vl);
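
In the _mu (mask-undisturbed) forms above, lanes whose bit in vm is clear
keep the value already present in vd, while active lanes receive
vs2[vs1[i]] (an out-of-range index produces 0). A minimal sketch of one
such form in use follows; the helper name and the index-construction
intrinsics around the gather are illustrative assumptions, not part of
this listing:

#include <riscv_vector.h>
#include <stdint.h>

// Illustrative sketch: rotate the active lanes of one strip left by one
// element, leaving masked-off lanes untouched (SEW=32, LMUL=1 assumed).
vint32m1_t rotate_active_by_one(vbool32_t vm, vint32m1_t vd,
                                vint32m1_t vs2, size_t vl) {
  // idx[i] = (i + 1) mod vl. vrgather_vv requires the index vector to
  // share the data's SEW/LMUL; vrgatherei16_vv relaxes this to 16-bit
  // indices so wider element types keep the full index range.
  vuint32m1_t idx = __riscv_vadd_vx_u32m1(__riscv_vid_v_u32m1(vl), 1, vl);
  idx = __riscv_vremu_vx_u32m1(idx, (uint32_t)vl, vl);
  // Active lanes: vd[i] = vs2[idx[i]]; inactive lanes: vd unchanged.
  return __riscv_vrgather_vv_i32m1_mu(vm, vd, vs2, idx, vl);
}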

Vector Compress Intrinsics

vfloat16mf4_t __riscv_vcompress_vm_f16mf4_tu(vfloat16mf4_t vd,
                                             vfloat16mf4_t vs2, vbool64_t vs1,
                                             size_t vl);
vfloat16mf2_t __riscv_vcompress_vm_f16mf2_tu(vfloat16mf2_t vd,
                                             vfloat16mf2_t vs2, vbool32_t vs1,
                                             size_t vl);
vfloat16m1_t __riscv_vcompress_vm_f16m1_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                           vbool16_t vs1, size_t vl);
vfloat16m2_t __riscv_vcompress_vm_f16m2_tu(vfloat16m2_t vd, vfloat16m2_t vs2,
                                           vbool8_t vs1, size_t vl);
vfloat16m4_t __riscv_vcompress_vm_f16m4_tu(vfloat16m4_t vd, vfloat16m4_t vs2,
                                           vbool4_t vs1, size_t vl);
vfloat16m8_t __riscv_vcompress_vm_f16m8_tu(vfloat16m8_t vd, vfloat16m8_t vs2,
                                           vbool2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vcompress_vm_f32mf2_tu(vfloat32mf2_t vd,
                                             vfloat32mf2_t vs2, vbool64_t vs1,
                                             size_t vl);
vfloat32m1_t __riscv_vcompress_vm_f32m1_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                           vbool32_t vs1, size_t vl);
vfloat32m2_t __riscv_vcompress_vm_f32m2_tu(vfloat32m2_t vd, vfloat32m2_t vs2,
                                           vbool16_t vs1, size_t vl);
vfloat32m4_t __riscv_vcompress_vm_f32m4_tu(vfloat32m4_t vd, vfloat32m4_t vs2,
                                           vbool8_t vs1, size_t vl);
vfloat32m8_t __riscv_vcompress_vm_f32m8_tu(vfloat32m8_t vd, vfloat32m8_t vs2,
                                           vbool4_t vs1, size_t vl);
vfloat64m1_t __riscv_vcompress_vm_f64m1_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                           vbool64_t vs1, size_t vl);
vfloat64m2_t __riscv_vcompress_vm_f64m2_tu(vfloat64m2_t vd, vfloat64m2_t vs2,
                                           vbool32_t vs1, size_t vl);
vfloat64m4_t __riscv_vcompress_vm_f64m4_tu(vfloat64m4_t vd, vfloat64m4_t vs2,
                                           vbool16_t vs1, size_t vl);
vfloat64m8_t __riscv_vcompress_vm_f64m8_tu(vfloat64m8_t vd, vfloat64m8_t vs2,
                                           vbool8_t vs1, size_t vl);
vint8mf8_t __riscv_vcompress_vm_i8mf8_tu(vint8mf8_t vd, vint8mf8_t vs2,
                                         vbool64_t vs1, size_t vl);
vint8mf4_t __riscv_vcompress_vm_i8mf4_tu(vint8mf4_t vd, vint8mf4_t vs2,
                                         vbool32_t vs1, size_t vl);
vint8mf2_t __riscv_vcompress_vm_i8mf2_tu(vint8mf2_t vd, vint8mf2_t vs2,
                                         vbool16_t vs1, size_t vl);
vint8m1_t __riscv_vcompress_vm_i8m1_tu(vint8m1_t vd, vint8m1_t vs2,
                                       vbool8_t vs1, size_t vl);
vint8m2_t __riscv_vcompress_vm_i8m2_tu(vint8m2_t vd, vint8m2_t vs2,
                                       vbool4_t vs1, size_t vl);
vint8m4_t __riscv_vcompress_vm_i8m4_tu(vint8m4_t vd, vint8m4_t vs2,
                                       vbool2_t vs1, size_t vl);
vint8m8_t __riscv_vcompress_vm_i8m8_tu(vint8m8_t vd, vint8m8_t vs2,
                                       vbool1_t vs1, size_t vl);
vint16mf4_t __riscv_vcompress_vm_i16mf4_tu(vint16mf4_t vd, vint16mf4_t vs2,
                                           vbool64_t vs1, size_t vl);
vint16mf2_t __riscv_vcompress_vm_i16mf2_tu(vint16mf2_t vd, vint16mf2_t vs2,
                                           vbool32_t vs1, size_t vl);
vint16m1_t __riscv_vcompress_vm_i16m1_tu(vint16m1_t vd, vint16m1_t vs2,
                                         vbool16_t vs1, size_t vl);
vint16m2_t __riscv_vcompress_vm_i16m2_tu(vint16m2_t vd, vint16m2_t vs2,
                                         vbool8_t vs1, size_t vl);
vint16m4_t __riscv_vcompress_vm_i16m4_tu(vint16m4_t vd, vint16m4_t vs2,
                                         vbool4_t vs1, size_t vl);
vint16m8_t __riscv_vcompress_vm_i16m8_tu(vint16m8_t vd, vint16m8_t vs2,
                                         vbool2_t vs1, size_t vl);
vint32mf2_t __riscv_vcompress_vm_i32mf2_tu(vint32mf2_t vd, vint32mf2_t vs2,
                                           vbool64_t vs1, size_t vl);
vint32m1_t __riscv_vcompress_vm_i32m1_tu(vint32m1_t vd, vint32m1_t vs2,
                                         vbool32_t vs1, size_t vl);
vint32m2_t __riscv_vcompress_vm_i32m2_tu(vint32m2_t vd, vint32m2_t vs2,
                                         vbool16_t vs1, size_t vl);
vint32m4_t __riscv_vcompress_vm_i32m4_tu(vint32m4_t vd, vint32m4_t vs2,
                                         vbool8_t vs1, size_t vl);
vint32m8_t __riscv_vcompress_vm_i32m8_tu(vint32m8_t vd, vint32m8_t vs2,
                                         vbool4_t vs1, size_t vl);
vint64m1_t __riscv_vcompress_vm_i64m1_tu(vint64m1_t vd, vint64m1_t vs2,
                                         vbool64_t vs1, size_t vl);
vint64m2_t __riscv_vcompress_vm_i64m2_tu(vint64m2_t vd, vint64m2_t vs2,
                                         vbool32_t vs1, size_t vl);
vint64m4_t __riscv_vcompress_vm_i64m4_tu(vint64m4_t vd, vint64m4_t vs2,
                                         vbool16_t vs1, size_t vl);
vint64m8_t __riscv_vcompress_vm_i64m8_tu(vint64m8_t vd, vint64m8_t vs2,
                                         vbool8_t vs1, size_t vl);
vuint8mf8_t __riscv_vcompress_vm_u8mf8_tu(vuint8mf8_t vd, vuint8mf8_t vs2,
                                          vbool64_t vs1, size_t vl);
vuint8mf4_t __riscv_vcompress_vm_u8mf4_tu(vuint8mf4_t vd, vuint8mf4_t vs2,
                                          vbool32_t vs1, size_t vl);
vuint8mf2_t __riscv_vcompress_vm_u8mf2_tu(vuint8mf2_t vd, vuint8mf2_t vs2,
                                          vbool16_t vs1, size_t vl);
vuint8m1_t __riscv_vcompress_vm_u8m1_tu(vuint8m1_t vd, vuint8m1_t vs2,
                                        vbool8_t vs1, size_t vl);
vuint8m2_t __riscv_vcompress_vm_u8m2_tu(vuint8m2_t vd, vuint8m2_t vs2,
                                        vbool4_t vs1, size_t vl);
vuint8m4_t __riscv_vcompress_vm_u8m4_tu(vuint8m4_t vd, vuint8m4_t vs2,
                                        vbool2_t vs1, size_t vl);
vuint8m8_t __riscv_vcompress_vm_u8m8_tu(vuint8m8_t vd, vuint8m8_t vs2,
                                        vbool1_t vs1, size_t vl);
vuint16mf4_t __riscv_vcompress_vm_u16mf4_tu(vuint16mf4_t vd, vuint16mf4_t vs2,
                                            vbool64_t vs1, size_t vl);
vuint16mf2_t __riscv_vcompress_vm_u16mf2_tu(vuint16mf2_t vd, vuint16mf2_t vs2,
                                            vbool32_t vs1, size_t vl);
vuint16m1_t __riscv_vcompress_vm_u16m1_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                          vbool16_t vs1, size_t vl);
vuint16m2_t __riscv_vcompress_vm_u16m2_tu(vuint16m2_t vd, vuint16m2_t vs2,
                                          vbool8_t vs1, size_t vl);
vuint16m4_t __riscv_vcompress_vm_u16m4_tu(vuint16m4_t vd, vuint16m4_t vs2,
                                          vbool4_t vs1, size_t vl);
vuint16m8_t __riscv_vcompress_vm_u16m8_tu(vuint16m8_t vd, vuint16m8_t vs2,
                                          vbool2_t vs1, size_t vl);
vuint32mf2_t __riscv_vcompress_vm_u32mf2_tu(vuint32mf2_t vd, vuint32mf2_t vs2,
                                            vbool64_t vs1, size_t vl);
vuint32m1_t __riscv_vcompress_vm_u32m1_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                          vbool32_t vs1, size_t vl);
vuint32m2_t __riscv_vcompress_vm_u32m2_tu(vuint32m2_t vd, vuint32m2_t vs2,
                                          vbool16_t vs1, size_t vl);
vuint32m4_t __riscv_vcompress_vm_u32m4_tu(vuint32m4_t vd, vuint32m4_t vs2,
                                          vbool8_t vs1, size_t vl);
vuint32m8_t __riscv_vcompress_vm_u32m8_tu(vuint32m8_t vd, vuint32m8_t vs2,
                                          vbool4_t vs1, size_t vl);
vuint64m1_t __riscv_vcompress_vm_u64m1_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                          vbool64_t vs1, size_t vl);
vuint64m2_t __riscv_vcompress_vm_u64m2_tu(vuint64m2_t vd, vuint64m2_t vs2,
                                          vbool32_t vs1, size_t vl);
vuint64m4_t __riscv_vcompress_vm_u64m4_tu(vuint64m4_t vd, vuint64m4_t vs2,
                                          vbool16_t vs1, size_t vl);
vuint64m8_t __riscv_vcompress_vm_u64m8_tu(vuint64m8_t vd, vuint64m8_t vs2,
                                          vbool8_t vs1, size_t vl);
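
The vcompress forms pack the elements of vs2 whose bit in the mask vs1 is
set into the lowest-numbered lanes of the result; destination lanes past
the last packed element are tail lanes, and the _tu (tail-undisturbed)
policy keeps vd's previous values there. A minimal sketch of the common
left-packing idiom follows; the function name is an illustrative
assumption, not part of this listing:

#include <riscv_vector.h>
#include <stdint.h>

// Illustrative sketch: copy the positive elements of src, in order, to
// dst and return how many were copied.
size_t pack_positives_i32(int32_t *dst, const int32_t *src, size_t n) {
  size_t total = 0;
  for (size_t vl; n > 0; n -= vl, src += vl) {
    vl = __riscv_vsetvl_e32m1(n);
    vint32m1_t v = __riscv_vle32_v_i32m1(src, vl);
    vbool32_t keep = __riscv_vmsgt_vx_i32m1_b32(v, 0, vl); // v[i] > 0
    size_t kept = __riscv_vcpop_m_b32(keep, vl);           // count set bits
    // Selected elements move to the front; vd = v just supplies the
    // tail values, which are never stored since only `kept` lanes go
    // to memory.
    vint32m1_t packed = __riscv_vcompress_vm_i32m1_tu(v, v, keep, vl);
    __riscv_vse32_v_i32m1(dst + total, packed, kept);
    total += kept;
  }
  return total;
}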