Vector Permutation Intrinsics

Integer and Floating-Point Scalar Move Intrinsics

_Float16 __riscv_vfmv_f(vfloat16mf4_t vs1);
_Float16 __riscv_vfmv_f(vfloat16mf2_t vs1);
_Float16 __riscv_vfmv_f(vfloat16m1_t vs1);
_Float16 __riscv_vfmv_f(vfloat16m2_t vs1);
_Float16 __riscv_vfmv_f(vfloat16m4_t vs1);
_Float16 __riscv_vfmv_f(vfloat16m8_t vs1);
float __riscv_vfmv_f(vfloat32mf2_t vs1);
float __riscv_vfmv_f(vfloat32m1_t vs1);
float __riscv_vfmv_f(vfloat32m2_t vs1);
float __riscv_vfmv_f(vfloat32m4_t vs1);
float __riscv_vfmv_f(vfloat32m8_t vs1);
double __riscv_vfmv_f(vfloat64m1_t vs1);
double __riscv_vfmv_f(vfloat64m2_t vs1);
double __riscv_vfmv_f(vfloat64m4_t vs1);
double __riscv_vfmv_f(vfloat64m8_t vs1);
int8_t __riscv_vmv_x(vint8mf8_t vs1);
int8_t __riscv_vmv_x(vint8mf4_t vs1);
int8_t __riscv_vmv_x(vint8mf2_t vs1);
int8_t __riscv_vmv_x(vint8m1_t vs1);
int8_t __riscv_vmv_x(vint8m2_t vs1);
int8_t __riscv_vmv_x(vint8m4_t vs1);
int8_t __riscv_vmv_x(vint8m8_t vs1);
int16_t __riscv_vmv_x(vint16mf4_t vs1);
int16_t __riscv_vmv_x(vint16mf2_t vs1);
int16_t __riscv_vmv_x(vint16m1_t vs1);
int16_t __riscv_vmv_x(vint16m2_t vs1);
int16_t __riscv_vmv_x(vint16m4_t vs1);
int16_t __riscv_vmv_x(vint16m8_t vs1);
int32_t __riscv_vmv_x(vint32mf2_t vs1);
int32_t __riscv_vmv_x(vint32m1_t vs1);
int32_t __riscv_vmv_x(vint32m2_t vs1);
int32_t __riscv_vmv_x(vint32m4_t vs1);
int32_t __riscv_vmv_x(vint32m8_t vs1);
int64_t __riscv_vmv_x(vint64m1_t vs1);
int64_t __riscv_vmv_x(vint64m2_t vs1);
int64_t __riscv_vmv_x(vint64m4_t vs1);
int64_t __riscv_vmv_x(vint64m8_t vs1);
uint8_t __riscv_vmv_x(vuint8mf8_t vs1);
uint8_t __riscv_vmv_x(vuint8mf4_t vs1);
uint8_t __riscv_vmv_x(vuint8mf2_t vs1);
uint8_t __riscv_vmv_x(vuint8m1_t vs1);
uint8_t __riscv_vmv_x(vuint8m2_t vs1);
uint8_t __riscv_vmv_x(vuint8m4_t vs1);
uint8_t __riscv_vmv_x(vuint8m8_t vs1);
uint16_t __riscv_vmv_x(vuint16mf4_t vs1);
uint16_t __riscv_vmv_x(vuint16mf2_t vs1);
uint16_t __riscv_vmv_x(vuint16m1_t vs1);
uint16_t __riscv_vmv_x(vuint16m2_t vs1);
uint16_t __riscv_vmv_x(vuint16m4_t vs1);
uint16_t __riscv_vmv_x(vuint16m8_t vs1);
uint32_t __riscv_vmv_x(vuint32mf2_t vs1);
uint32_t __riscv_vmv_x(vuint32m1_t vs1);
uint32_t __riscv_vmv_x(vuint32m2_t vs1);
uint32_t __riscv_vmv_x(vuint32m4_t vs1);
uint32_t __riscv_vmv_x(vuint32m8_t vs1);
uint64_t __riscv_vmv_x(vuint64m1_t vs1);
uint64_t __riscv_vmv_x(vuint64m2_t vs1);
uint64_t __riscv_vmv_x(vuint64m4_t vs1);
uint64_t __riscv_vmv_x(vuint64m8_t vs1);
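
A minimal usage sketch (the helper name and the reduction step are illustrative, not part of this listing; assumes a compiler with RVV intrinsic support and <riscv_vector.h>): reduce the first chunk of an int32_t array, then read the scalar result out of element 0 with __riscv_vmv_x.

#include <riscv_vector.h>

int32_t first_chunk_sum(const int32_t *a, size_t n) {
  size_t vl = __riscv_vsetvl_e32m1(n);             // elements handled in this pass
  vint32m1_t v = __riscv_vle32_v_i32m1(a, vl);     // unit-stride load
  vint32m1_t zero = __riscv_vmv_v_x_i32m1(0, vl);  // initial accumulator for the reduction
  vint32m1_t red = __riscv_vredsum(v, zero, vl);   // element 0 of red holds the sum
  return __riscv_vmv_x(red);                       // vmv.x.s: element 0 -> scalar
}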

Vector Slideup Intrinsics

vfloat16mf4_t __riscv_vslideup(vfloat16mf4_t vd, vfloat16mf4_t vs2, size_t rs1,
                               size_t vl);
vfloat16mf2_t __riscv_vslideup(vfloat16mf2_t vd, vfloat16mf2_t vs2, size_t rs1,
                               size_t vl);
vfloat16m1_t __riscv_vslideup(vfloat16m1_t vd, vfloat16m1_t vs2, size_t rs1,
                              size_t vl);
vfloat16m2_t __riscv_vslideup(vfloat16m2_t vd, vfloat16m2_t vs2, size_t rs1,
                              size_t vl);
vfloat16m4_t __riscv_vslideup(vfloat16m4_t vd, vfloat16m4_t vs2, size_t rs1,
                              size_t vl);
vfloat16m8_t __riscv_vslideup(vfloat16m8_t vd, vfloat16m8_t vs2, size_t rs1,
                              size_t vl);
vfloat32mf2_t __riscv_vslideup(vfloat32mf2_t vd, vfloat32mf2_t vs2, size_t rs1,
                               size_t vl);
vfloat32m1_t __riscv_vslideup(vfloat32m1_t vd, vfloat32m1_t vs2, size_t rs1,
                              size_t vl);
vfloat32m2_t __riscv_vslideup(vfloat32m2_t vd, vfloat32m2_t vs2, size_t rs1,
                              size_t vl);
vfloat32m4_t __riscv_vslideup(vfloat32m4_t vd, vfloat32m4_t vs2, size_t rs1,
                              size_t vl);
vfloat32m8_t __riscv_vslideup(vfloat32m8_t vd, vfloat32m8_t vs2, size_t rs1,
                              size_t vl);
vfloat64m1_t __riscv_vslideup(vfloat64m1_t vd, vfloat64m1_t vs2, size_t rs1,
                              size_t vl);
vfloat64m2_t __riscv_vslideup(vfloat64m2_t vd, vfloat64m2_t vs2, size_t rs1,
                              size_t vl);
vfloat64m4_t __riscv_vslideup(vfloat64m4_t vd, vfloat64m4_t vs2, size_t rs1,
                              size_t vl);
vfloat64m8_t __riscv_vslideup(vfloat64m8_t vd, vfloat64m8_t vs2, size_t rs1,
                              size_t vl);
vint8mf8_t __riscv_vslideup(vint8mf8_t vd, vint8mf8_t vs2, size_t rs1,
                            size_t vl);
vint8mf4_t __riscv_vslideup(vint8mf4_t vd, vint8mf4_t vs2, size_t rs1,
                            size_t vl);
vint8mf2_t __riscv_vslideup(vint8mf2_t vd, vint8mf2_t vs2, size_t rs1,
                            size_t vl);
vint8m1_t __riscv_vslideup(vint8m1_t vd, vint8m1_t vs2, size_t rs1, size_t vl);
vint8m2_t __riscv_vslideup(vint8m2_t vd, vint8m2_t vs2, size_t rs1, size_t vl);
vint8m4_t __riscv_vslideup(vint8m4_t vd, vint8m4_t vs2, size_t rs1, size_t vl);
vint8m8_t __riscv_vslideup(vint8m8_t vd, vint8m8_t vs2, size_t rs1, size_t vl);
vint16mf4_t __riscv_vslideup(vint16mf4_t vd, vint16mf4_t vs2, size_t rs1,
                             size_t vl);
vint16mf2_t __riscv_vslideup(vint16mf2_t vd, vint16mf2_t vs2, size_t rs1,
                             size_t vl);
vint16m1_t __riscv_vslideup(vint16m1_t vd, vint16m1_t vs2, size_t rs1,
                            size_t vl);
vint16m2_t __riscv_vslideup(vint16m2_t vd, vint16m2_t vs2, size_t rs1,
                            size_t vl);
vint16m4_t __riscv_vslideup(vint16m4_t vd, vint16m4_t vs2, size_t rs1,
                            size_t vl);
vint16m8_t __riscv_vslideup(vint16m8_t vd, vint16m8_t vs2, size_t rs1,
                            size_t vl);
vint32mf2_t __riscv_vslideup(vint32mf2_t vd, vint32mf2_t vs2, size_t rs1,
                             size_t vl);
vint32m1_t __riscv_vslideup(vint32m1_t vd, vint32m1_t vs2, size_t rs1,
                            size_t vl);
vint32m2_t __riscv_vslideup(vint32m2_t vd, vint32m2_t vs2, size_t rs1,
                            size_t vl);
vint32m4_t __riscv_vslideup(vint32m4_t vd, vint32m4_t vs2, size_t rs1,
                            size_t vl);
vint32m8_t __riscv_vslideup(vint32m8_t vd, vint32m8_t vs2, size_t rs1,
                            size_t vl);
vint64m1_t __riscv_vslideup(vint64m1_t vd, vint64m1_t vs2, size_t rs1,
                            size_t vl);
vint64m2_t __riscv_vslideup(vint64m2_t vd, vint64m2_t vs2, size_t rs1,
                            size_t vl);
vint64m4_t __riscv_vslideup(vint64m4_t vd, vint64m4_t vs2, size_t rs1,
                            size_t vl);
vint64m8_t __riscv_vslideup(vint64m8_t vd, vint64m8_t vs2, size_t rs1,
                            size_t vl);
vuint8mf8_t __riscv_vslideup(vuint8mf8_t vd, vuint8mf8_t vs2, size_t rs1,
                             size_t vl);
vuint8mf4_t __riscv_vslideup(vuint8mf4_t vd, vuint8mf4_t vs2, size_t rs1,
                             size_t vl);
vuint8mf2_t __riscv_vslideup(vuint8mf2_t vd, vuint8mf2_t vs2, size_t rs1,
                             size_t vl);
vuint8m1_t __riscv_vslideup(vuint8m1_t vd, vuint8m1_t vs2, size_t rs1,
                            size_t vl);
vuint8m2_t __riscv_vslideup(vuint8m2_t vd, vuint8m2_t vs2, size_t rs1,
                            size_t vl);
vuint8m4_t __riscv_vslideup(vuint8m4_t vd, vuint8m4_t vs2, size_t rs1,
                            size_t vl);
vuint8m8_t __riscv_vslideup(vuint8m8_t vd, vuint8m8_t vs2, size_t rs1,
                            size_t vl);
vuint16mf4_t __riscv_vslideup(vuint16mf4_t vd, vuint16mf4_t vs2, size_t rs1,
                              size_t vl);
vuint16mf2_t __riscv_vslideup(vuint16mf2_t vd, vuint16mf2_t vs2, size_t rs1,
                              size_t vl);
vuint16m1_t __riscv_vslideup(vuint16m1_t vd, vuint16m1_t vs2, size_t rs1,
                             size_t vl);
vuint16m2_t __riscv_vslideup(vuint16m2_t vd, vuint16m2_t vs2, size_t rs1,
                             size_t vl);
vuint16m4_t __riscv_vslideup(vuint16m4_t vd, vuint16m4_t vs2, size_t rs1,
                             size_t vl);
vuint16m8_t __riscv_vslideup(vuint16m8_t vd, vuint16m8_t vs2, size_t rs1,
                             size_t vl);
vuint32mf2_t __riscv_vslideup(vuint32mf2_t vd, vuint32mf2_t vs2, size_t rs1,
                              size_t vl);
vuint32m1_t __riscv_vslideup(vuint32m1_t vd, vuint32m1_t vs2, size_t rs1,
                             size_t vl);
vuint32m2_t __riscv_vslideup(vuint32m2_t vd, vuint32m2_t vs2, size_t rs1,
                             size_t vl);
vuint32m4_t __riscv_vslideup(vuint32m4_t vd, vuint32m4_t vs2, size_t rs1,
                             size_t vl);
vuint32m8_t __riscv_vslideup(vuint32m8_t vd, vuint32m8_t vs2, size_t rs1,
                             size_t vl);
vuint64m1_t __riscv_vslideup(vuint64m1_t vd, vuint64m1_t vs2, size_t rs1,
                             size_t vl);
vuint64m2_t __riscv_vslideup(vuint64m2_t vd, vuint64m2_t vs2, size_t rs1,
                             size_t vl);
vuint64m4_t __riscv_vslideup(vuint64m4_t vd, vuint64m4_t vs2, size_t rs1,
                             size_t vl);
vuint64m8_t __riscv_vslideup(vuint64m8_t vd, vuint64m8_t vs2, size_t rs1,
                             size_t vl);
// masked functions
vfloat16mf4_t __riscv_vslideup(vbool64_t vm, vfloat16mf4_t vd,
                               vfloat16mf4_t vs2, size_t rs1, size_t vl);
vfloat16mf2_t __riscv_vslideup(vbool32_t vm, vfloat16mf2_t vd,
                               vfloat16mf2_t vs2, size_t rs1, size_t vl);
vfloat16m1_t __riscv_vslideup(vbool16_t vm, vfloat16m1_t vd, vfloat16m1_t vs2,
                              size_t rs1, size_t vl);
vfloat16m2_t __riscv_vslideup(vbool8_t vm, vfloat16m2_t vd, vfloat16m2_t vs2,
                              size_t rs1, size_t vl);
vfloat16m4_t __riscv_vslideup(vbool4_t vm, vfloat16m4_t vd, vfloat16m4_t vs2,
                              size_t rs1, size_t vl);
vfloat16m8_t __riscv_vslideup(vbool2_t vm, vfloat16m8_t vd, vfloat16m8_t vs2,
                              size_t rs1, size_t vl);
vfloat32mf2_t __riscv_vslideup(vbool64_t vm, vfloat32mf2_t vd,
                               vfloat32mf2_t vs2, size_t rs1, size_t vl);
vfloat32m1_t __riscv_vslideup(vbool32_t vm, vfloat32m1_t vd, vfloat32m1_t vs2,
                              size_t rs1, size_t vl);
vfloat32m2_t __riscv_vslideup(vbool16_t vm, vfloat32m2_t vd, vfloat32m2_t vs2,
                              size_t rs1, size_t vl);
vfloat32m4_t __riscv_vslideup(vbool8_t vm, vfloat32m4_t vd, vfloat32m4_t vs2,
                              size_t rs1, size_t vl);
vfloat32m8_t __riscv_vslideup(vbool4_t vm, vfloat32m8_t vd, vfloat32m8_t vs2,
                              size_t rs1, size_t vl);
vfloat64m1_t __riscv_vslideup(vbool64_t vm, vfloat64m1_t vd, vfloat64m1_t vs2,
                              size_t rs1, size_t vl);
vfloat64m2_t __riscv_vslideup(vbool32_t vm, vfloat64m2_t vd, vfloat64m2_t vs2,
                              size_t rs1, size_t vl);
vfloat64m4_t __riscv_vslideup(vbool16_t vm, vfloat64m4_t vd, vfloat64m4_t vs2,
                              size_t rs1, size_t vl);
vfloat64m8_t __riscv_vslideup(vbool8_t vm, vfloat64m8_t vd, vfloat64m8_t vs2,
                              size_t rs1, size_t vl);
vint8mf8_t __riscv_vslideup(vbool64_t vm, vint8mf8_t vd, vint8mf8_t vs2,
                            size_t rs1, size_t vl);
vint8mf4_t __riscv_vslideup(vbool32_t vm, vint8mf4_t vd, vint8mf4_t vs2,
                            size_t rs1, size_t vl);
vint8mf2_t __riscv_vslideup(vbool16_t vm, vint8mf2_t vd, vint8mf2_t vs2,
                            size_t rs1, size_t vl);
vint8m1_t __riscv_vslideup(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2, size_t rs1,
                           size_t vl);
vint8m2_t __riscv_vslideup(vbool4_t vm, vint8m2_t vd, vint8m2_t vs2, size_t rs1,
                           size_t vl);
vint8m4_t __riscv_vslideup(vbool2_t vm, vint8m4_t vd, vint8m4_t vs2, size_t rs1,
                           size_t vl);
vint8m8_t __riscv_vslideup(vbool1_t vm, vint8m8_t vd, vint8m8_t vs2, size_t rs1,
                           size_t vl);
vint16mf4_t __riscv_vslideup(vbool64_t vm, vint16mf4_t vd, vint16mf4_t vs2,
                             size_t rs1, size_t vl);
vint16mf2_t __riscv_vslideup(vbool32_t vm, vint16mf2_t vd, vint16mf2_t vs2,
                             size_t rs1, size_t vl);
vint16m1_t __riscv_vslideup(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                            size_t rs1, size_t vl);
vint16m2_t __riscv_vslideup(vbool8_t vm, vint16m2_t vd, vint16m2_t vs2,
                            size_t rs1, size_t vl);
vint16m4_t __riscv_vslideup(vbool4_t vm, vint16m4_t vd, vint16m4_t vs2,
                            size_t rs1, size_t vl);
vint16m8_t __riscv_vslideup(vbool2_t vm, vint16m8_t vd, vint16m8_t vs2,
                            size_t rs1, size_t vl);
vint32mf2_t __riscv_vslideup(vbool64_t vm, vint32mf2_t vd, vint32mf2_t vs2,
                             size_t rs1, size_t vl);
vint32m1_t __riscv_vslideup(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                            size_t rs1, size_t vl);
vint32m2_t __riscv_vslideup(vbool16_t vm, vint32m2_t vd, vint32m2_t vs2,
                            size_t rs1, size_t vl);
vint32m4_t __riscv_vslideup(vbool8_t vm, vint32m4_t vd, vint32m4_t vs2,
                            size_t rs1, size_t vl);
vint32m8_t __riscv_vslideup(vbool4_t vm, vint32m8_t vd, vint32m8_t vs2,
                            size_t rs1, size_t vl);
vint64m1_t __riscv_vslideup(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                            size_t rs1, size_t vl);
vint64m2_t __riscv_vslideup(vbool32_t vm, vint64m2_t vd, vint64m2_t vs2,
                            size_t rs1, size_t vl);
vint64m4_t __riscv_vslideup(vbool16_t vm, vint64m4_t vd, vint64m4_t vs2,
                            size_t rs1, size_t vl);
vint64m8_t __riscv_vslideup(vbool8_t vm, vint64m8_t vd, vint64m8_t vs2,
                            size_t rs1, size_t vl);
vuint8mf8_t __riscv_vslideup(vbool64_t vm, vuint8mf8_t vd, vuint8mf8_t vs2,
                             size_t rs1, size_t vl);
vuint8mf4_t __riscv_vslideup(vbool32_t vm, vuint8mf4_t vd, vuint8mf4_t vs2,
                             size_t rs1, size_t vl);
vuint8mf2_t __riscv_vslideup(vbool16_t vm, vuint8mf2_t vd, vuint8mf2_t vs2,
                             size_t rs1, size_t vl);
vuint8m1_t __riscv_vslideup(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                            size_t rs1, size_t vl);
vuint8m2_t __riscv_vslideup(vbool4_t vm, vuint8m2_t vd, vuint8m2_t vs2,
                            size_t rs1, size_t vl);
vuint8m4_t __riscv_vslideup(vbool2_t vm, vuint8m4_t vd, vuint8m4_t vs2,
                            size_t rs1, size_t vl);
vuint8m8_t __riscv_vslideup(vbool1_t vm, vuint8m8_t vd, vuint8m8_t vs2,
                            size_t rs1, size_t vl);
vuint16mf4_t __riscv_vslideup(vbool64_t vm, vuint16mf4_t vd, vuint16mf4_t vs2,
                              size_t rs1, size_t vl);
vuint16mf2_t __riscv_vslideup(vbool32_t vm, vuint16mf2_t vd, vuint16mf2_t vs2,
                              size_t rs1, size_t vl);
vuint16m1_t __riscv_vslideup(vbool16_t vm, vuint16m1_t vd, vuint16m1_t vs2,
                             size_t rs1, size_t vl);
vuint16m2_t __riscv_vslideup(vbool8_t vm, vuint16m2_t vd, vuint16m2_t vs2,
                             size_t rs1, size_t vl);
vuint16m4_t __riscv_vslideup(vbool4_t vm, vuint16m4_t vd, vuint16m4_t vs2,
                             size_t rs1, size_t vl);
vuint16m8_t __riscv_vslideup(vbool2_t vm, vuint16m8_t vd, vuint16m8_t vs2,
                             size_t rs1, size_t vl);
vuint32mf2_t __riscv_vslideup(vbool64_t vm, vuint32mf2_t vd, vuint32mf2_t vs2,
                              size_t rs1, size_t vl);
vuint32m1_t __riscv_vslideup(vbool32_t vm, vuint32m1_t vd, vuint32m1_t vs2,
                             size_t rs1, size_t vl);
vuint32m2_t __riscv_vslideup(vbool16_t vm, vuint32m2_t vd, vuint32m2_t vs2,
                             size_t rs1, size_t vl);
vuint32m4_t __riscv_vslideup(vbool8_t vm, vuint32m4_t vd, vuint32m4_t vs2,
                             size_t rs1, size_t vl);
vuint32m8_t __riscv_vslideup(vbool4_t vm, vuint32m8_t vd, vuint32m8_t vs2,
                             size_t rs1, size_t vl);
vuint64m1_t __riscv_vslideup(vbool64_t vm, vuint64m1_t vd, vuint64m1_t vs2,
                             size_t rs1, size_t vl);
vuint64m2_t __riscv_vslideup(vbool32_t vm, vuint64m2_t vd, vuint64m2_t vs2,
                             size_t rs1, size_t vl);
vuint64m4_t __riscv_vslideup(vbool16_t vm, vuint64m4_t vd, vuint64m4_t vs2,
                             size_t rs1, size_t vl);
vuint64m8_t __riscv_vslideup(vbool8_t vm, vuint64m8_t vd, vuint64m8_t vs2,
                             size_t rs1, size_t vl);

Vector Slidedown Intrinsics

vfloat16mf4_t __riscv_vslidedown(vfloat16mf4_t vs2, size_t rs1, size_t vl);
vfloat16mf2_t __riscv_vslidedown(vfloat16mf2_t vs2, size_t rs1, size_t vl);
vfloat16m1_t __riscv_vslidedown(vfloat16m1_t vs2, size_t rs1, size_t vl);
vfloat16m2_t __riscv_vslidedown(vfloat16m2_t vs2, size_t rs1, size_t vl);
vfloat16m4_t __riscv_vslidedown(vfloat16m4_t vs2, size_t rs1, size_t vl);
vfloat16m8_t __riscv_vslidedown(vfloat16m8_t vs2, size_t rs1, size_t vl);
vfloat32mf2_t __riscv_vslidedown(vfloat32mf2_t vs2, size_t rs1, size_t vl);
vfloat32m1_t __riscv_vslidedown(vfloat32m1_t vs2, size_t rs1, size_t vl);
vfloat32m2_t __riscv_vslidedown(vfloat32m2_t vs2, size_t rs1, size_t vl);
vfloat32m4_t __riscv_vslidedown(vfloat32m4_t vs2, size_t rs1, size_t vl);
vfloat32m8_t __riscv_vslidedown(vfloat32m8_t vs2, size_t rs1, size_t vl);
vfloat64m1_t __riscv_vslidedown(vfloat64m1_t vs2, size_t rs1, size_t vl);
vfloat64m2_t __riscv_vslidedown(vfloat64m2_t vs2, size_t rs1, size_t vl);
vfloat64m4_t __riscv_vslidedown(vfloat64m4_t vs2, size_t rs1, size_t vl);
vfloat64m8_t __riscv_vslidedown(vfloat64m8_t vs2, size_t rs1, size_t vl);
vint8mf8_t __riscv_vslidedown(vint8mf8_t vs2, size_t rs1, size_t vl);
vint8mf4_t __riscv_vslidedown(vint8mf4_t vs2, size_t rs1, size_t vl);
vint8mf2_t __riscv_vslidedown(vint8mf2_t vs2, size_t rs1, size_t vl);
vint8m1_t __riscv_vslidedown(vint8m1_t vs2, size_t rs1, size_t vl);
vint8m2_t __riscv_vslidedown(vint8m2_t vs2, size_t rs1, size_t vl);
vint8m4_t __riscv_vslidedown(vint8m4_t vs2, size_t rs1, size_t vl);
vint8m8_t __riscv_vslidedown(vint8m8_t vs2, size_t rs1, size_t vl);
vint16mf4_t __riscv_vslidedown(vint16mf4_t vs2, size_t rs1, size_t vl);
vint16mf2_t __riscv_vslidedown(vint16mf2_t vs2, size_t rs1, size_t vl);
vint16m1_t __riscv_vslidedown(vint16m1_t vs2, size_t rs1, size_t vl);
vint16m2_t __riscv_vslidedown(vint16m2_t vs2, size_t rs1, size_t vl);
vint16m4_t __riscv_vslidedown(vint16m4_t vs2, size_t rs1, size_t vl);
vint16m8_t __riscv_vslidedown(vint16m8_t vs2, size_t rs1, size_t vl);
vint32mf2_t __riscv_vslidedown(vint32mf2_t vs2, size_t rs1, size_t vl);
vint32m1_t __riscv_vslidedown(vint32m1_t vs2, size_t rs1, size_t vl);
vint32m2_t __riscv_vslidedown(vint32m2_t vs2, size_t rs1, size_t vl);
vint32m4_t __riscv_vslidedown(vint32m4_t vs2, size_t rs1, size_t vl);
vint32m8_t __riscv_vslidedown(vint32m8_t vs2, size_t rs1, size_t vl);
vint64m1_t __riscv_vslidedown(vint64m1_t vs2, size_t rs1, size_t vl);
vint64m2_t __riscv_vslidedown(vint64m2_t vs2, size_t rs1, size_t vl);
vint64m4_t __riscv_vslidedown(vint64m4_t vs2, size_t rs1, size_t vl);
vint64m8_t __riscv_vslidedown(vint64m8_t vs2, size_t rs1, size_t vl);
vuint8mf8_t __riscv_vslidedown(vuint8mf8_t vs2, size_t rs1, size_t vl);
vuint8mf4_t __riscv_vslidedown(vuint8mf4_t vs2, size_t rs1, size_t vl);
vuint8mf2_t __riscv_vslidedown(vuint8mf2_t vs2, size_t rs1, size_t vl);
vuint8m1_t __riscv_vslidedown(vuint8m1_t vs2, size_t rs1, size_t vl);
vuint8m2_t __riscv_vslidedown(vuint8m2_t vs2, size_t rs1, size_t vl);
vuint8m4_t __riscv_vslidedown(vuint8m4_t vs2, size_t rs1, size_t vl);
vuint8m8_t __riscv_vslidedown(vuint8m8_t vs2, size_t rs1, size_t vl);
vuint16mf4_t __riscv_vslidedown(vuint16mf4_t vs2, size_t rs1, size_t vl);
vuint16mf2_t __riscv_vslidedown(vuint16mf2_t vs2, size_t rs1, size_t vl);
vuint16m1_t __riscv_vslidedown(vuint16m1_t vs2, size_t rs1, size_t vl);
vuint16m2_t __riscv_vslidedown(vuint16m2_t vs2, size_t rs1, size_t vl);
vuint16m4_t __riscv_vslidedown(vuint16m4_t vs2, size_t rs1, size_t vl);
vuint16m8_t __riscv_vslidedown(vuint16m8_t vs2, size_t rs1, size_t vl);
vuint32mf2_t __riscv_vslidedown(vuint32mf2_t vs2, size_t rs1, size_t vl);
vuint32m1_t __riscv_vslidedown(vuint32m1_t vs2, size_t rs1, size_t vl);
vuint32m2_t __riscv_vslidedown(vuint32m2_t vs2, size_t rs1, size_t vl);
vuint32m4_t __riscv_vslidedown(vuint32m4_t vs2, size_t rs1, size_t vl);
vuint32m8_t __riscv_vslidedown(vuint32m8_t vs2, size_t rs1, size_t vl);
vuint64m1_t __riscv_vslidedown(vuint64m1_t vs2, size_t rs1, size_t vl);
vuint64m2_t __riscv_vslidedown(vuint64m2_t vs2, size_t rs1, size_t vl);
vuint64m4_t __riscv_vslidedown(vuint64m4_t vs2, size_t rs1, size_t vl);
vuint64m8_t __riscv_vslidedown(vuint64m8_t vs2, size_t rs1, size_t vl);
// masked functions
vfloat16mf4_t __riscv_vslidedown(vbool64_t vm, vfloat16mf4_t vs2, size_t rs1,
                                 size_t vl);
vfloat16mf2_t __riscv_vslidedown(vbool32_t vm, vfloat16mf2_t vs2, size_t rs1,
                                 size_t vl);
vfloat16m1_t __riscv_vslidedown(vbool16_t vm, vfloat16m1_t vs2, size_t rs1,
                                size_t vl);
vfloat16m2_t __riscv_vslidedown(vbool8_t vm, vfloat16m2_t vs2, size_t rs1,
                                size_t vl);
vfloat16m4_t __riscv_vslidedown(vbool4_t vm, vfloat16m4_t vs2, size_t rs1,
                                size_t vl);
vfloat16m8_t __riscv_vslidedown(vbool2_t vm, vfloat16m8_t vs2, size_t rs1,
                                size_t vl);
vfloat32mf2_t __riscv_vslidedown(vbool64_t vm, vfloat32mf2_t vs2, size_t rs1,
                                 size_t vl);
vfloat32m1_t __riscv_vslidedown(vbool32_t vm, vfloat32m1_t vs2, size_t rs1,
                                size_t vl);
vfloat32m2_t __riscv_vslidedown(vbool16_t vm, vfloat32m2_t vs2, size_t rs1,
                                size_t vl);
vfloat32m4_t __riscv_vslidedown(vbool8_t vm, vfloat32m4_t vs2, size_t rs1,
                                size_t vl);
vfloat32m8_t __riscv_vslidedown(vbool4_t vm, vfloat32m8_t vs2, size_t rs1,
                                size_t vl);
vfloat64m1_t __riscv_vslidedown(vbool64_t vm, vfloat64m1_t vs2, size_t rs1,
                                size_t vl);
vfloat64m2_t __riscv_vslidedown(vbool32_t vm, vfloat64m2_t vs2, size_t rs1,
                                size_t vl);
vfloat64m4_t __riscv_vslidedown(vbool16_t vm, vfloat64m4_t vs2, size_t rs1,
                                size_t vl);
vfloat64m8_t __riscv_vslidedown(vbool8_t vm, vfloat64m8_t vs2, size_t rs1,
                                size_t vl);
vint8mf8_t __riscv_vslidedown(vbool64_t vm, vint8mf8_t vs2, size_t rs1,
                              size_t vl);
vint8mf4_t __riscv_vslidedown(vbool32_t vm, vint8mf4_t vs2, size_t rs1,
                              size_t vl);
vint8mf2_t __riscv_vslidedown(vbool16_t vm, vint8mf2_t vs2, size_t rs1,
                              size_t vl);
vint8m1_t __riscv_vslidedown(vbool8_t vm, vint8m1_t vs2, size_t rs1, size_t vl);
vint8m2_t __riscv_vslidedown(vbool4_t vm, vint8m2_t vs2, size_t rs1, size_t vl);
vint8m4_t __riscv_vslidedown(vbool2_t vm, vint8m4_t vs2, size_t rs1, size_t vl);
vint8m8_t __riscv_vslidedown(vbool1_t vm, vint8m8_t vs2, size_t rs1, size_t vl);
vint16mf4_t __riscv_vslidedown(vbool64_t vm, vint16mf4_t vs2, size_t rs1,
                               size_t vl);
vint16mf2_t __riscv_vslidedown(vbool32_t vm, vint16mf2_t vs2, size_t rs1,
                               size_t vl);
vint16m1_t __riscv_vslidedown(vbool16_t vm, vint16m1_t vs2, size_t rs1,
                              size_t vl);
vint16m2_t __riscv_vslidedown(vbool8_t vm, vint16m2_t vs2, size_t rs1,
                              size_t vl);
vint16m4_t __riscv_vslidedown(vbool4_t vm, vint16m4_t vs2, size_t rs1,
                              size_t vl);
vint16m8_t __riscv_vslidedown(vbool2_t vm, vint16m8_t vs2, size_t rs1,
                              size_t vl);
vint32mf2_t __riscv_vslidedown(vbool64_t vm, vint32mf2_t vs2, size_t rs1,
                               size_t vl);
vint32m1_t __riscv_vslidedown(vbool32_t vm, vint32m1_t vs2, size_t rs1,
                              size_t vl);
vint32m2_t __riscv_vslidedown(vbool16_t vm, vint32m2_t vs2, size_t rs1,
                              size_t vl);
vint32m4_t __riscv_vslidedown(vbool8_t vm, vint32m4_t vs2, size_t rs1,
                              size_t vl);
vint32m8_t __riscv_vslidedown(vbool4_t vm, vint32m8_t vs2, size_t rs1,
                              size_t vl);
vint64m1_t __riscv_vslidedown(vbool64_t vm, vint64m1_t vs2, size_t rs1,
                              size_t vl);
vint64m2_t __riscv_vslidedown(vbool32_t vm, vint64m2_t vs2, size_t rs1,
                              size_t vl);
vint64m4_t __riscv_vslidedown(vbool16_t vm, vint64m4_t vs2, size_t rs1,
                              size_t vl);
vint64m8_t __riscv_vslidedown(vbool8_t vm, vint64m8_t vs2, size_t rs1,
                              size_t vl);
vuint8mf8_t __riscv_vslidedown(vbool64_t vm, vuint8mf8_t vs2, size_t rs1,
                               size_t vl);
vuint8mf4_t __riscv_vslidedown(vbool32_t vm, vuint8mf4_t vs2, size_t rs1,
                               size_t vl);
vuint8mf2_t __riscv_vslidedown(vbool16_t vm, vuint8mf2_t vs2, size_t rs1,
                               size_t vl);
vuint8m1_t __riscv_vslidedown(vbool8_t vm, vuint8m1_t vs2, size_t rs1,
                              size_t vl);
vuint8m2_t __riscv_vslidedown(vbool4_t vm, vuint8m2_t vs2, size_t rs1,
                              size_t vl);
vuint8m4_t __riscv_vslidedown(vbool2_t vm, vuint8m4_t vs2, size_t rs1,
                              size_t vl);
vuint8m8_t __riscv_vslidedown(vbool1_t vm, vuint8m8_t vs2, size_t rs1,
                              size_t vl);
vuint16mf4_t __riscv_vslidedown(vbool64_t vm, vuint16mf4_t vs2, size_t rs1,
                                size_t vl);
vuint16mf2_t __riscv_vslidedown(vbool32_t vm, vuint16mf2_t vs2, size_t rs1,
                                size_t vl);
vuint16m1_t __riscv_vslidedown(vbool16_t vm, vuint16m1_t vs2, size_t rs1,
                               size_t vl);
vuint16m2_t __riscv_vslidedown(vbool8_t vm, vuint16m2_t vs2, size_t rs1,
                               size_t vl);
vuint16m4_t __riscv_vslidedown(vbool4_t vm, vuint16m4_t vs2, size_t rs1,
                               size_t vl);
vuint16m8_t __riscv_vslidedown(vbool2_t vm, vuint16m8_t vs2, size_t rs1,
                               size_t vl);
vuint32mf2_t __riscv_vslidedown(vbool64_t vm, vuint32mf2_t vs2, size_t rs1,
                                size_t vl);
vuint32m1_t __riscv_vslidedown(vbool32_t vm, vuint32m1_t vs2, size_t rs1,
                               size_t vl);
vuint32m2_t __riscv_vslidedown(vbool16_t vm, vuint32m2_t vs2, size_t rs1,
                               size_t vl);
vuint32m4_t __riscv_vslidedown(vbool8_t vm, vuint32m4_t vs2, size_t rs1,
                               size_t vl);
vuint32m8_t __riscv_vslidedown(vbool4_t vm, vuint32m8_t vs2, size_t rs1,
                               size_t vl);
vuint64m1_t __riscv_vslidedown(vbool64_t vm, vuint64m1_t vs2, size_t rs1,
                               size_t vl);
vuint64m2_t __riscv_vslidedown(vbool32_t vm, vuint64m2_t vs2, size_t rs1,
                               size_t vl);
vuint64m4_t __riscv_vslidedown(vbool16_t vm, vuint64m4_t vs2, size_t rs1,
                               size_t vl);
vuint64m8_t __riscv_vslidedown(vbool8_t vm, vuint64m8_t vs2, size_t rs1,
                               size_t vl);
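
A minimal usage sketch (the helper name is illustrative): vslidedown reads vs2[i + rs1] into element i, for example to pair each element with its successor.

#include <riscv_vector.h>

// Drop the first element: result[i] = v[i + 1] for the active elements.
// The element slid in at the top is read from the source register group
// past vl (zero once the read position passes VLMAX).
vfloat32m1_t drop_first(vfloat32m1_t v, size_t vl) {
  return __riscv_vslidedown(v, 1, vl);
}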

Vector Slide1up and Slide1down Intrinsics

vfloat16mf4_t __riscv_vfslide1up(vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfslide1up(vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfslide1up(vfloat16m1_t vs2, _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfslide1up(vfloat16m2_t vs2, _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfslide1up(vfloat16m4_t vs2, _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfslide1up(vfloat16m8_t vs2, _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfslide1up(vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfslide1up(vfloat32m1_t vs2, float rs1, size_t vl);
vfloat32m2_t __riscv_vfslide1up(vfloat32m2_t vs2, float rs1, size_t vl);
vfloat32m4_t __riscv_vfslide1up(vfloat32m4_t vs2, float rs1, size_t vl);
vfloat32m8_t __riscv_vfslide1up(vfloat32m8_t vs2, float rs1, size_t vl);
vfloat64m1_t __riscv_vfslide1up(vfloat64m1_t vs2, double rs1, size_t vl);
vfloat64m2_t __riscv_vfslide1up(vfloat64m2_t vs2, double rs1, size_t vl);
vfloat64m4_t __riscv_vfslide1up(vfloat64m4_t vs2, double rs1, size_t vl);
vfloat64m8_t __riscv_vfslide1up(vfloat64m8_t vs2, double rs1, size_t vl);
vfloat16mf4_t __riscv_vfslide1down(vfloat16mf4_t vs2, _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfslide1down(vfloat16mf2_t vs2, _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfslide1down(vfloat16m1_t vs2, _Float16 rs1, size_t vl);
vfloat16m2_t __riscv_vfslide1down(vfloat16m2_t vs2, _Float16 rs1, size_t vl);
vfloat16m4_t __riscv_vfslide1down(vfloat16m4_t vs2, _Float16 rs1, size_t vl);
vfloat16m8_t __riscv_vfslide1down(vfloat16m8_t vs2, _Float16 rs1, size_t vl);
vfloat32mf2_t __riscv_vfslide1down(vfloat32mf2_t vs2, float rs1, size_t vl);
vfloat32m1_t __riscv_vfslide1down(vfloat32m1_t vs2, float rs1, size_t vl);
vfloat32m2_t __riscv_vfslide1down(vfloat32m2_t vs2, float rs1, size_t vl);
vfloat32m4_t __riscv_vfslide1down(vfloat32m4_t vs2, float rs1, size_t vl);
vfloat32m8_t __riscv_vfslide1down(vfloat32m8_t vs2, float rs1, size_t vl);
vfloat64m1_t __riscv_vfslide1down(vfloat64m1_t vs2, double rs1, size_t vl);
vfloat64m2_t __riscv_vfslide1down(vfloat64m2_t vs2, double rs1, size_t vl);
vfloat64m4_t __riscv_vfslide1down(vfloat64m4_t vs2, double rs1, size_t vl);
vfloat64m8_t __riscv_vfslide1down(vfloat64m8_t vs2, double rs1, size_t vl);
vint8mf8_t __riscv_vslide1up(vint8mf8_t vs2, int8_t rs1, size_t vl);
vint8mf4_t __riscv_vslide1up(vint8mf4_t vs2, int8_t rs1, size_t vl);
vint8mf2_t __riscv_vslide1up(vint8mf2_t vs2, int8_t rs1, size_t vl);
vint8m1_t __riscv_vslide1up(vint8m1_t vs2, int8_t rs1, size_t vl);
vint8m2_t __riscv_vslide1up(vint8m2_t vs2, int8_t rs1, size_t vl);
vint8m4_t __riscv_vslide1up(vint8m4_t vs2, int8_t rs1, size_t vl);
vint8m8_t __riscv_vslide1up(vint8m8_t vs2, int8_t rs1, size_t vl);
vint16mf4_t __riscv_vslide1up(vint16mf4_t vs2, int16_t rs1, size_t vl);
vint16mf2_t __riscv_vslide1up(vint16mf2_t vs2, int16_t rs1, size_t vl);
vint16m1_t __riscv_vslide1up(vint16m1_t vs2, int16_t rs1, size_t vl);
vint16m2_t __riscv_vslide1up(vint16m2_t vs2, int16_t rs1, size_t vl);
vint16m4_t __riscv_vslide1up(vint16m4_t vs2, int16_t rs1, size_t vl);
vint16m8_t __riscv_vslide1up(vint16m8_t vs2, int16_t rs1, size_t vl);
vint32mf2_t __riscv_vslide1up(vint32mf2_t vs2, int32_t rs1, size_t vl);
vint32m1_t __riscv_vslide1up(vint32m1_t vs2, int32_t rs1, size_t vl);
vint32m2_t __riscv_vslide1up(vint32m2_t vs2, int32_t rs1, size_t vl);
vint32m4_t __riscv_vslide1up(vint32m4_t vs2, int32_t rs1, size_t vl);
vint32m8_t __riscv_vslide1up(vint32m8_t vs2, int32_t rs1, size_t vl);
vint64m1_t __riscv_vslide1up(vint64m1_t vs2, int64_t rs1, size_t vl);
vint64m2_t __riscv_vslide1up(vint64m2_t vs2, int64_t rs1, size_t vl);
vint64m4_t __riscv_vslide1up(vint64m4_t vs2, int64_t rs1, size_t vl);
vint64m8_t __riscv_vslide1up(vint64m8_t vs2, int64_t rs1, size_t vl);
vint8mf8_t __riscv_vslide1down(vint8mf8_t vs2, int8_t rs1, size_t vl);
vint8mf4_t __riscv_vslide1down(vint8mf4_t vs2, int8_t rs1, size_t vl);
vint8mf2_t __riscv_vslide1down(vint8mf2_t vs2, int8_t rs1, size_t vl);
vint8m1_t __riscv_vslide1down(vint8m1_t vs2, int8_t rs1, size_t vl);
vint8m2_t __riscv_vslide1down(vint8m2_t vs2, int8_t rs1, size_t vl);
vint8m4_t __riscv_vslide1down(vint8m4_t vs2, int8_t rs1, size_t vl);
vint8m8_t __riscv_vslide1down(vint8m8_t vs2, int8_t rs1, size_t vl);
vint16mf4_t __riscv_vslide1down(vint16mf4_t vs2, int16_t rs1, size_t vl);
vint16mf2_t __riscv_vslide1down(vint16mf2_t vs2, int16_t rs1, size_t vl);
vint16m1_t __riscv_vslide1down(vint16m1_t vs2, int16_t rs1, size_t vl);
vint16m2_t __riscv_vslide1down(vint16m2_t vs2, int16_t rs1, size_t vl);
vint16m4_t __riscv_vslide1down(vint16m4_t vs2, int16_t rs1, size_t vl);
vint16m8_t __riscv_vslide1down(vint16m8_t vs2, int16_t rs1, size_t vl);
vint32mf2_t __riscv_vslide1down(vint32mf2_t vs2, int32_t rs1, size_t vl);
vint32m1_t __riscv_vslide1down(vint32m1_t vs2, int32_t rs1, size_t vl);
vint32m2_t __riscv_vslide1down(vint32m2_t vs2, int32_t rs1, size_t vl);
vint32m4_t __riscv_vslide1down(vint32m4_t vs2, int32_t rs1, size_t vl);
vint32m8_t __riscv_vslide1down(vint32m8_t vs2, int32_t rs1, size_t vl);
vint64m1_t __riscv_vslide1down(vint64m1_t vs2, int64_t rs1, size_t vl);
vint64m2_t __riscv_vslide1down(vint64m2_t vs2, int64_t rs1, size_t vl);
vint64m4_t __riscv_vslide1down(vint64m4_t vs2, int64_t rs1, size_t vl);
vint64m8_t __riscv_vslide1down(vint64m8_t vs2, int64_t rs1, size_t vl);
vuint8mf8_t __riscv_vslide1up(vuint8mf8_t vs2, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vslide1up(vuint8mf4_t vs2, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vslide1up(vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vslide1up(vuint8m1_t vs2, uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vslide1up(vuint8m2_t vs2, uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vslide1up(vuint8m4_t vs2, uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vslide1up(vuint8m8_t vs2, uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vslide1up(vuint16mf4_t vs2, uint16_t rs1, size_t vl);
vuint16mf2_t __riscv_vslide1up(vuint16mf2_t vs2, uint16_t rs1, size_t vl);
vuint16m1_t __riscv_vslide1up(vuint16m1_t vs2, uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vslide1up(vuint16m2_t vs2, uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vslide1up(vuint16m4_t vs2, uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vslide1up(vuint16m8_t vs2, uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vslide1up(vuint32mf2_t vs2, uint32_t rs1, size_t vl);
vuint32m1_t __riscv_vslide1up(vuint32m1_t vs2, uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vslide1up(vuint32m2_t vs2, uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vslide1up(vuint32m4_t vs2, uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vslide1up(vuint32m8_t vs2, uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vslide1up(vuint64m1_t vs2, uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vslide1up(vuint64m2_t vs2, uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vslide1up(vuint64m4_t vs2, uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vslide1up(vuint64m8_t vs2, uint64_t rs1, size_t vl);
vuint8mf8_t __riscv_vslide1down(vuint8mf8_t vs2, uint8_t rs1, size_t vl);
vuint8mf4_t __riscv_vslide1down(vuint8mf4_t vs2, uint8_t rs1, size_t vl);
vuint8mf2_t __riscv_vslide1down(vuint8mf2_t vs2, uint8_t rs1, size_t vl);
vuint8m1_t __riscv_vslide1down(vuint8m1_t vs2, uint8_t rs1, size_t vl);
vuint8m2_t __riscv_vslide1down(vuint8m2_t vs2, uint8_t rs1, size_t vl);
vuint8m4_t __riscv_vslide1down(vuint8m4_t vs2, uint8_t rs1, size_t vl);
vuint8m8_t __riscv_vslide1down(vuint8m8_t vs2, uint8_t rs1, size_t vl);
vuint16mf4_t __riscv_vslide1down(vuint16mf4_t vs2, uint16_t rs1, size_t vl);
vuint16mf2_t __riscv_vslide1down(vuint16mf2_t vs2, uint16_t rs1, size_t vl);
vuint16m1_t __riscv_vslide1down(vuint16m1_t vs2, uint16_t rs1, size_t vl);
vuint16m2_t __riscv_vslide1down(vuint16m2_t vs2, uint16_t rs1, size_t vl);
vuint16m4_t __riscv_vslide1down(vuint16m4_t vs2, uint16_t rs1, size_t vl);
vuint16m8_t __riscv_vslide1down(vuint16m8_t vs2, uint16_t rs1, size_t vl);
vuint32mf2_t __riscv_vslide1down(vuint32mf2_t vs2, uint32_t rs1, size_t vl);
vuint32m1_t __riscv_vslide1down(vuint32m1_t vs2, uint32_t rs1, size_t vl);
vuint32m2_t __riscv_vslide1down(vuint32m2_t vs2, uint32_t rs1, size_t vl);
vuint32m4_t __riscv_vslide1down(vuint32m4_t vs2, uint32_t rs1, size_t vl);
vuint32m8_t __riscv_vslide1down(vuint32m8_t vs2, uint32_t rs1, size_t vl);
vuint64m1_t __riscv_vslide1down(vuint64m1_t vs2, uint64_t rs1, size_t vl);
vuint64m2_t __riscv_vslide1down(vuint64m2_t vs2, uint64_t rs1, size_t vl);
vuint64m4_t __riscv_vslide1down(vuint64m4_t vs2, uint64_t rs1, size_t vl);
vuint64m8_t __riscv_vslide1down(vuint64m8_t vs2, uint64_t rs1, size_t vl);
// masked functions
vfloat16mf4_t __riscv_vfslide1up(vbool64_t vm, vfloat16mf4_t vs2, _Float16 rs1,
                                 size_t vl);
vfloat16mf2_t __riscv_vfslide1up(vbool32_t vm, vfloat16mf2_t vs2, _Float16 rs1,
                                 size_t vl);
vfloat16m1_t __riscv_vfslide1up(vbool16_t vm, vfloat16m1_t vs2, _Float16 rs1,
                                size_t vl);
vfloat16m2_t __riscv_vfslide1up(vbool8_t vm, vfloat16m2_t vs2, _Float16 rs1,
                                size_t vl);
vfloat16m4_t __riscv_vfslide1up(vbool4_t vm, vfloat16m4_t vs2, _Float16 rs1,
                                size_t vl);
vfloat16m8_t __riscv_vfslide1up(vbool2_t vm, vfloat16m8_t vs2, _Float16 rs1,
                                size_t vl);
vfloat32mf2_t __riscv_vfslide1up(vbool64_t vm, vfloat32mf2_t vs2, float rs1,
                                 size_t vl);
vfloat32m1_t __riscv_vfslide1up(vbool32_t vm, vfloat32m1_t vs2, float rs1,
                                size_t vl);
vfloat32m2_t __riscv_vfslide1up(vbool16_t vm, vfloat32m2_t vs2, float rs1,
                                size_t vl);
vfloat32m4_t __riscv_vfslide1up(vbool8_t vm, vfloat32m4_t vs2, float rs1,
                                size_t vl);
vfloat32m8_t __riscv_vfslide1up(vbool4_t vm, vfloat32m8_t vs2, float rs1,
                                size_t vl);
vfloat64m1_t __riscv_vfslide1up(vbool64_t vm, vfloat64m1_t vs2, double rs1,
                                size_t vl);
vfloat64m2_t __riscv_vfslide1up(vbool32_t vm, vfloat64m2_t vs2, double rs1,
                                size_t vl);
vfloat64m4_t __riscv_vfslide1up(vbool16_t vm, vfloat64m4_t vs2, double rs1,
                                size_t vl);
vfloat64m8_t __riscv_vfslide1up(vbool8_t vm, vfloat64m8_t vs2, double rs1,
                                size_t vl);
vfloat16mf4_t __riscv_vfslide1down(vbool64_t vm, vfloat16mf4_t vs2,
                                   _Float16 rs1, size_t vl);
vfloat16mf2_t __riscv_vfslide1down(vbool32_t vm, vfloat16mf2_t vs2,
                                   _Float16 rs1, size_t vl);
vfloat16m1_t __riscv_vfslide1down(vbool16_t vm, vfloat16m1_t vs2, _Float16 rs1,
                                  size_t vl);
vfloat16m2_t __riscv_vfslide1down(vbool8_t vm, vfloat16m2_t vs2, _Float16 rs1,
                                  size_t vl);
vfloat16m4_t __riscv_vfslide1down(vbool4_t vm, vfloat16m4_t vs2, _Float16 rs1,
                                  size_t vl);
vfloat16m8_t __riscv_vfslide1down(vbool2_t vm, vfloat16m8_t vs2, _Float16 rs1,
                                  size_t vl);
vfloat32mf2_t __riscv_vfslide1down(vbool64_t vm, vfloat32mf2_t vs2, float rs1,
                                   size_t vl);
vfloat32m1_t __riscv_vfslide1down(vbool32_t vm, vfloat32m1_t vs2, float rs1,
                                  size_t vl);
vfloat32m2_t __riscv_vfslide1down(vbool16_t vm, vfloat32m2_t vs2, float rs1,
                                  size_t vl);
vfloat32m4_t __riscv_vfslide1down(vbool8_t vm, vfloat32m4_t vs2, float rs1,
                                  size_t vl);
vfloat32m8_t __riscv_vfslide1down(vbool4_t vm, vfloat32m8_t vs2, float rs1,
                                  size_t vl);
vfloat64m1_t __riscv_vfslide1down(vbool64_t vm, vfloat64m1_t vs2, double rs1,
                                  size_t vl);
vfloat64m2_t __riscv_vfslide1down(vbool32_t vm, vfloat64m2_t vs2, double rs1,
                                  size_t vl);
vfloat64m4_t __riscv_vfslide1down(vbool16_t vm, vfloat64m4_t vs2, double rs1,
                                  size_t vl);
vfloat64m8_t __riscv_vfslide1down(vbool8_t vm, vfloat64m8_t vs2, double rs1,
                                  size_t vl);
vint8mf8_t __riscv_vslide1up(vbool64_t vm, vint8mf8_t vs2, int8_t rs1,
                             size_t vl);
vint8mf4_t __riscv_vslide1up(vbool32_t vm, vint8mf4_t vs2, int8_t rs1,
                             size_t vl);
vint8mf2_t __riscv_vslide1up(vbool16_t vm, vint8mf2_t vs2, int8_t rs1,
                             size_t vl);
vint8m1_t __riscv_vslide1up(vbool8_t vm, vint8m1_t vs2, int8_t rs1, size_t vl);
vint8m2_t __riscv_vslide1up(vbool4_t vm, vint8m2_t vs2, int8_t rs1, size_t vl);
vint8m4_t __riscv_vslide1up(vbool2_t vm, vint8m4_t vs2, int8_t rs1, size_t vl);
vint8m8_t __riscv_vslide1up(vbool1_t vm, vint8m8_t vs2, int8_t rs1, size_t vl);
vint16mf4_t __riscv_vslide1up(vbool64_t vm, vint16mf4_t vs2, int16_t rs1,
                              size_t vl);
vint16mf2_t __riscv_vslide1up(vbool32_t vm, vint16mf2_t vs2, int16_t rs1,
                              size_t vl);
vint16m1_t __riscv_vslide1up(vbool16_t vm, vint16m1_t vs2, int16_t rs1,
                             size_t vl);
vint16m2_t __riscv_vslide1up(vbool8_t vm, vint16m2_t vs2, int16_t rs1,
                             size_t vl);
vint16m4_t __riscv_vslide1up(vbool4_t vm, vint16m4_t vs2, int16_t rs1,
                             size_t vl);
vint16m8_t __riscv_vslide1up(vbool2_t vm, vint16m8_t vs2, int16_t rs1,
                             size_t vl);
vint32mf2_t __riscv_vslide1up(vbool64_t vm, vint32mf2_t vs2, int32_t rs1,
                              size_t vl);
vint32m1_t __riscv_vslide1up(vbool32_t vm, vint32m1_t vs2, int32_t rs1,
                             size_t vl);
vint32m2_t __riscv_vslide1up(vbool16_t vm, vint32m2_t vs2, int32_t rs1,
                             size_t vl);
vint32m4_t __riscv_vslide1up(vbool8_t vm, vint32m4_t vs2, int32_t rs1,
                             size_t vl);
vint32m8_t __riscv_vslide1up(vbool4_t vm, vint32m8_t vs2, int32_t rs1,
                             size_t vl);
vint64m1_t __riscv_vslide1up(vbool64_t vm, vint64m1_t vs2, int64_t rs1,
                             size_t vl);
vint64m2_t __riscv_vslide1up(vbool32_t vm, vint64m2_t vs2, int64_t rs1,
                             size_t vl);
vint64m4_t __riscv_vslide1up(vbool16_t vm, vint64m4_t vs2, int64_t rs1,
                             size_t vl);
vint64m8_t __riscv_vslide1up(vbool8_t vm, vint64m8_t vs2, int64_t rs1,
                             size_t vl);
vint8mf8_t __riscv_vslide1down(vbool64_t vm, vint8mf8_t vs2, int8_t rs1,
                               size_t vl);
vint8mf4_t __riscv_vslide1down(vbool32_t vm, vint8mf4_t vs2, int8_t rs1,
                               size_t vl);
vint8mf2_t __riscv_vslide1down(vbool16_t vm, vint8mf2_t vs2, int8_t rs1,
                               size_t vl);
vint8m1_t __riscv_vslide1down(vbool8_t vm, vint8m1_t vs2, int8_t rs1,
                              size_t vl);
vint8m2_t __riscv_vslide1down(vbool4_t vm, vint8m2_t vs2, int8_t rs1,
                              size_t vl);
vint8m4_t __riscv_vslide1down(vbool2_t vm, vint8m4_t vs2, int8_t rs1,
                              size_t vl);
vint8m8_t __riscv_vslide1down(vbool1_t vm, vint8m8_t vs2, int8_t rs1,
                              size_t vl);
vint16mf4_t __riscv_vslide1down(vbool64_t vm, vint16mf4_t vs2, int16_t rs1,
                                size_t vl);
vint16mf2_t __riscv_vslide1down(vbool32_t vm, vint16mf2_t vs2, int16_t rs1,
                                size_t vl);
vint16m1_t __riscv_vslide1down(vbool16_t vm, vint16m1_t vs2, int16_t rs1,
                               size_t vl);
vint16m2_t __riscv_vslide1down(vbool8_t vm, vint16m2_t vs2, int16_t rs1,
                               size_t vl);
vint16m4_t __riscv_vslide1down(vbool4_t vm, vint16m4_t vs2, int16_t rs1,
                               size_t vl);
vint16m8_t __riscv_vslide1down(vbool2_t vm, vint16m8_t vs2, int16_t rs1,
                               size_t vl);
vint32mf2_t __riscv_vslide1down(vbool64_t vm, vint32mf2_t vs2, int32_t rs1,
                                size_t vl);
vint32m1_t __riscv_vslide1down(vbool32_t vm, vint32m1_t vs2, int32_t rs1,
                               size_t vl);
vint32m2_t __riscv_vslide1down(vbool16_t vm, vint32m2_t vs2, int32_t rs1,
                               size_t vl);
vint32m4_t __riscv_vslide1down(vbool8_t vm, vint32m4_t vs2, int32_t rs1,
                               size_t vl);
vint32m8_t __riscv_vslide1down(vbool4_t vm, vint32m8_t vs2, int32_t rs1,
                               size_t vl);
vint64m1_t __riscv_vslide1down(vbool64_t vm, vint64m1_t vs2, int64_t rs1,
                               size_t vl);
vint64m2_t __riscv_vslide1down(vbool32_t vm, vint64m2_t vs2, int64_t rs1,
                               size_t vl);
vint64m4_t __riscv_vslide1down(vbool16_t vm, vint64m4_t vs2, int64_t rs1,
                               size_t vl);
vint64m8_t __riscv_vslide1down(vbool8_t vm, vint64m8_t vs2, int64_t rs1,
                               size_t vl);
vuint8mf8_t __riscv_vslide1up(vbool64_t vm, vuint8mf8_t vs2, uint8_t rs1,
                              size_t vl);
vuint8mf4_t __riscv_vslide1up(vbool32_t vm, vuint8mf4_t vs2, uint8_t rs1,
                              size_t vl);
vuint8mf2_t __riscv_vslide1up(vbool16_t vm, vuint8mf2_t vs2, uint8_t rs1,
                              size_t vl);
vuint8m1_t __riscv_vslide1up(vbool8_t vm, vuint8m1_t vs2, uint8_t rs1,
                             size_t vl);
vuint8m2_t __riscv_vslide1up(vbool4_t vm, vuint8m2_t vs2, uint8_t rs1,
                             size_t vl);
vuint8m4_t __riscv_vslide1up(vbool2_t vm, vuint8m4_t vs2, uint8_t rs1,
                             size_t vl);
vuint8m8_t __riscv_vslide1up(vbool1_t vm, vuint8m8_t vs2, uint8_t rs1,
                             size_t vl);
vuint16mf4_t __riscv_vslide1up(vbool64_t vm, vuint16mf4_t vs2, uint16_t rs1,
                               size_t vl);
vuint16mf2_t __riscv_vslide1up(vbool32_t vm, vuint16mf2_t vs2, uint16_t rs1,
                               size_t vl);
vuint16m1_t __riscv_vslide1up(vbool16_t vm, vuint16m1_t vs2, uint16_t rs1,
                              size_t vl);
vuint16m2_t __riscv_vslide1up(vbool8_t vm, vuint16m2_t vs2, uint16_t rs1,
                              size_t vl);
vuint16m4_t __riscv_vslide1up(vbool4_t vm, vuint16m4_t vs2, uint16_t rs1,
                              size_t vl);
vuint16m8_t __riscv_vslide1up(vbool2_t vm, vuint16m8_t vs2, uint16_t rs1,
                              size_t vl);
vuint32mf2_t __riscv_vslide1up(vbool64_t vm, vuint32mf2_t vs2, uint32_t rs1,
                               size_t vl);
vuint32m1_t __riscv_vslide1up(vbool32_t vm, vuint32m1_t vs2, uint32_t rs1,
                              size_t vl);
vuint32m2_t __riscv_vslide1up(vbool16_t vm, vuint32m2_t vs2, uint32_t rs1,
                              size_t vl);
vuint32m4_t __riscv_vslide1up(vbool8_t vm, vuint32m4_t vs2, uint32_t rs1,
                              size_t vl);
vuint32m8_t __riscv_vslide1up(vbool4_t vm, vuint32m8_t vs2, uint32_t rs1,
                              size_t vl);
vuint64m1_t __riscv_vslide1up(vbool64_t vm, vuint64m1_t vs2, uint64_t rs1,
                              size_t vl);
vuint64m2_t __riscv_vslide1up(vbool32_t vm, vuint64m2_t vs2, uint64_t rs1,
                              size_t vl);
vuint64m4_t __riscv_vslide1up(vbool16_t vm, vuint64m4_t vs2, uint64_t rs1,
                              size_t vl);
vuint64m8_t __riscv_vslide1up(vbool8_t vm, vuint64m8_t vs2, uint64_t rs1,
                              size_t vl);
vuint8mf8_t __riscv_vslide1down(vbool64_t vm, vuint8mf8_t vs2, uint8_t rs1,
                                size_t vl);
vuint8mf4_t __riscv_vslide1down(vbool32_t vm, vuint8mf4_t vs2, uint8_t rs1,
                                size_t vl);
vuint8mf2_t __riscv_vslide1down(vbool16_t vm, vuint8mf2_t vs2, uint8_t rs1,
                                size_t vl);
vuint8m1_t __riscv_vslide1down(vbool8_t vm, vuint8m1_t vs2, uint8_t rs1,
                               size_t vl);
vuint8m2_t __riscv_vslide1down(vbool4_t vm, vuint8m2_t vs2, uint8_t rs1,
                               size_t vl);
vuint8m4_t __riscv_vslide1down(vbool2_t vm, vuint8m4_t vs2, uint8_t rs1,
                               size_t vl);
vuint8m8_t __riscv_vslide1down(vbool1_t vm, vuint8m8_t vs2, uint8_t rs1,
                               size_t vl);
vuint16mf4_t __riscv_vslide1down(vbool64_t vm, vuint16mf4_t vs2, uint16_t rs1,
                                 size_t vl);
vuint16mf2_t __riscv_vslide1down(vbool32_t vm, vuint16mf2_t vs2, uint16_t rs1,
                                 size_t vl);
vuint16m1_t __riscv_vslide1down(vbool16_t vm, vuint16m1_t vs2, uint16_t rs1,
                                size_t vl);
vuint16m2_t __riscv_vslide1down(vbool8_t vm, vuint16m2_t vs2, uint16_t rs1,
                                size_t vl);
vuint16m4_t __riscv_vslide1down(vbool4_t vm, vuint16m4_t vs2, uint16_t rs1,
                                size_t vl);
vuint16m8_t __riscv_vslide1down(vbool2_t vm, vuint16m8_t vs2, uint16_t rs1,
                                size_t vl);
vuint32mf2_t __riscv_vslide1down(vbool64_t vm, vuint32mf2_t vs2, uint32_t rs1,
                                 size_t vl);
vuint32m1_t __riscv_vslide1down(vbool32_t vm, vuint32m1_t vs2, uint32_t rs1,
                                size_t vl);
vuint32m2_t __riscv_vslide1down(vbool16_t vm, vuint32m2_t vs2, uint32_t rs1,
                                size_t vl);
vuint32m4_t __riscv_vslide1down(vbool8_t vm, vuint32m4_t vs2, uint32_t rs1,
                                size_t vl);
vuint32m8_t __riscv_vslide1down(vbool4_t vm, vuint32m8_t vs2, uint32_t rs1,
                                size_t vl);
vuint64m1_t __riscv_vslide1down(vbool64_t vm, vuint64m1_t vs2, uint64_t rs1,
                                size_t vl);
vuint64m2_t __riscv_vslide1down(vbool32_t vm, vuint64m2_t vs2, uint64_t rs1,
                                size_t vl);
vuint64m4_t __riscv_vslide1down(vbool16_t vm, vuint64m4_t vs2, uint64_t rs1,
                                size_t vl);
vuint64m8_t __riscv_vslide1down(vbool8_t vm, vuint64m8_t vs2, uint64_t rs1,
                                size_t vl);
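
A minimal usage sketch (function names are illustrative): vslide1up and vslide1down shift by exactly one element and fill the vacated position from the scalar operand, which is convenient for carrying a neighbouring element across loop iterations.

#include <riscv_vector.h>

// Prepend a carried-in scalar: result[0] = prev, result[i] = chunk[i - 1].
vint32m1_t with_prev(vint32m1_t chunk, int32_t prev, size_t vl) {
  return __riscv_vslide1up(chunk, prev, vl);
}

// Append the next scalar: result[i] = chunk[i + 1], result[vl - 1] = next.
vint32m1_t with_next(vint32m1_t chunk, int32_t next, size_t vl) {
  return __riscv_vslide1down(chunk, next, vl);
}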

Vector Register Gather Intrinsics

vfloat16mf4_t __riscv_vrgather(vfloat16mf4_t vs2, vuint16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vrgather(vfloat16mf4_t vs2, size_t vs1, size_t vl);
vfloat16mf2_t __riscv_vrgather(vfloat16mf2_t vs2, vuint16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vrgather(vfloat16mf2_t vs2, size_t vs1, size_t vl);
vfloat16m1_t __riscv_vrgather(vfloat16m1_t vs2, vuint16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vrgather(vfloat16m1_t vs2, size_t vs1, size_t vl);
vfloat16m2_t __riscv_vrgather(vfloat16m2_t vs2, vuint16m2_t vs1, size_t vl);
vfloat16m2_t __riscv_vrgather(vfloat16m2_t vs2, size_t vs1, size_t vl);
vfloat16m4_t __riscv_vrgather(vfloat16m4_t vs2, vuint16m4_t vs1, size_t vl);
vfloat16m4_t __riscv_vrgather(vfloat16m4_t vs2, size_t vs1, size_t vl);
vfloat16m8_t __riscv_vrgather(vfloat16m8_t vs2, vuint16m8_t vs1, size_t vl);
vfloat16m8_t __riscv_vrgather(vfloat16m8_t vs2, size_t vs1, size_t vl);
vfloat32mf2_t __riscv_vrgather(vfloat32mf2_t vs2, vuint32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vrgather(vfloat32mf2_t vs2, size_t vs1, size_t vl);
vfloat32m1_t __riscv_vrgather(vfloat32m1_t vs2, vuint32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vrgather(vfloat32m1_t vs2, size_t vs1, size_t vl);
vfloat32m2_t __riscv_vrgather(vfloat32m2_t vs2, vuint32m2_t vs1, size_t vl);
vfloat32m2_t __riscv_vrgather(vfloat32m2_t vs2, size_t vs1, size_t vl);
vfloat32m4_t __riscv_vrgather(vfloat32m4_t vs2, vuint32m4_t vs1, size_t vl);
vfloat32m4_t __riscv_vrgather(vfloat32m4_t vs2, size_t vs1, size_t vl);
vfloat32m8_t __riscv_vrgather(vfloat32m8_t vs2, vuint32m8_t vs1, size_t vl);
vfloat32m8_t __riscv_vrgather(vfloat32m8_t vs2, size_t vs1, size_t vl);
vfloat64m1_t __riscv_vrgather(vfloat64m1_t vs2, vuint64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vrgather(vfloat64m1_t vs2, size_t vs1, size_t vl);
vfloat64m2_t __riscv_vrgather(vfloat64m2_t vs2, vuint64m2_t vs1, size_t vl);
vfloat64m2_t __riscv_vrgather(vfloat64m2_t vs2, size_t vs1, size_t vl);
vfloat64m4_t __riscv_vrgather(vfloat64m4_t vs2, vuint64m4_t vs1, size_t vl);
vfloat64m4_t __riscv_vrgather(vfloat64m4_t vs2, size_t vs1, size_t vl);
vfloat64m8_t __riscv_vrgather(vfloat64m8_t vs2, vuint64m8_t vs1, size_t vl);
vfloat64m8_t __riscv_vrgather(vfloat64m8_t vs2, size_t vs1, size_t vl);
vfloat16mf4_t __riscv_vrgatherei16(vfloat16mf4_t vs2, vuint16mf4_t vs1,
                                   size_t vl);
vfloat16mf2_t __riscv_vrgatherei16(vfloat16mf2_t vs2, vuint16mf2_t vs1,
                                   size_t vl);
vfloat16m1_t __riscv_vrgatherei16(vfloat16m1_t vs2, vuint16m1_t vs1, size_t vl);
vfloat16m2_t __riscv_vrgatherei16(vfloat16m2_t vs2, vuint16m2_t vs1, size_t vl);
vfloat16m4_t __riscv_vrgatherei16(vfloat16m4_t vs2, vuint16m4_t vs1, size_t vl);
vfloat16m8_t __riscv_vrgatherei16(vfloat16m8_t vs2, vuint16m8_t vs1, size_t vl);
vfloat32mf2_t __riscv_vrgatherei16(vfloat32mf2_t vs2, vuint16mf4_t vs1,
                                   size_t vl);
vfloat32m1_t __riscv_vrgatherei16(vfloat32m1_t vs2, vuint16mf2_t vs1,
                                  size_t vl);
vfloat32m2_t __riscv_vrgatherei16(vfloat32m2_t vs2, vuint16m1_t vs1, size_t vl);
vfloat32m4_t __riscv_vrgatherei16(vfloat32m4_t vs2, vuint16m2_t vs1, size_t vl);
vfloat32m8_t __riscv_vrgatherei16(vfloat32m8_t vs2, vuint16m4_t vs1, size_t vl);
vfloat64m1_t __riscv_vrgatherei16(vfloat64m1_t vs2, vuint16mf4_t vs1,
                                  size_t vl);
vfloat64m2_t __riscv_vrgatherei16(vfloat64m2_t vs2, vuint16mf2_t vs1,
                                  size_t vl);
vfloat64m4_t __riscv_vrgatherei16(vfloat64m4_t vs2, vuint16m1_t vs1, size_t vl);
vfloat64m8_t __riscv_vrgatherei16(vfloat64m8_t vs2, vuint16m2_t vs1, size_t vl);
vint8mf8_t __riscv_vrgather(vint8mf8_t vs2, vuint8mf8_t vs1, size_t vl);
vint8mf8_t __riscv_vrgather(vint8mf8_t vs2, size_t vs1, size_t vl);
vint8mf4_t __riscv_vrgather(vint8mf4_t vs2, vuint8mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vrgather(vint8mf4_t vs2, size_t vs1, size_t vl);
vint8mf2_t __riscv_vrgather(vint8mf2_t vs2, vuint8mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vrgather(vint8mf2_t vs2, size_t vs1, size_t vl);
vint8m1_t __riscv_vrgather(vint8m1_t vs2, vuint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vrgather(vint8m1_t vs2, size_t vs1, size_t vl);
vint8m2_t __riscv_vrgather(vint8m2_t vs2, vuint8m2_t vs1, size_t vl);
vint8m2_t __riscv_vrgather(vint8m2_t vs2, size_t vs1, size_t vl);
vint8m4_t __riscv_vrgather(vint8m4_t vs2, vuint8m4_t vs1, size_t vl);
vint8m4_t __riscv_vrgather(vint8m4_t vs2, size_t vs1, size_t vl);
vint8m8_t __riscv_vrgather(vint8m8_t vs2, vuint8m8_t vs1, size_t vl);
vint8m8_t __riscv_vrgather(vint8m8_t vs2, size_t vs1, size_t vl);
vint16mf4_t __riscv_vrgather(vint16mf4_t vs2, vuint16mf4_t vs1, size_t vl);
vint16mf4_t __riscv_vrgather(vint16mf4_t vs2, size_t vs1, size_t vl);
vint16mf2_t __riscv_vrgather(vint16mf2_t vs2, vuint16mf2_t vs1, size_t vl);
vint16mf2_t __riscv_vrgather(vint16mf2_t vs2, size_t vs1, size_t vl);
vint16m1_t __riscv_vrgather(vint16m1_t vs2, vuint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vrgather(vint16m1_t vs2, size_t vs1, size_t vl);
vint16m2_t __riscv_vrgather(vint16m2_t vs2, vuint16m2_t vs1, size_t vl);
vint16m2_t __riscv_vrgather(vint16m2_t vs2, size_t vs1, size_t vl);
vint16m4_t __riscv_vrgather(vint16m4_t vs2, vuint16m4_t vs1, size_t vl);
vint16m4_t __riscv_vrgather(vint16m4_t vs2, size_t vs1, size_t vl);
vint16m8_t __riscv_vrgather(vint16m8_t vs2, vuint16m8_t vs1, size_t vl);
vint16m8_t __riscv_vrgather(vint16m8_t vs2, size_t vs1, size_t vl);
vint32mf2_t __riscv_vrgather(vint32mf2_t vs2, vuint32mf2_t vs1, size_t vl);
vint32mf2_t __riscv_vrgather(vint32mf2_t vs2, size_t vs1, size_t vl);
vint32m1_t __riscv_vrgather(vint32m1_t vs2, vuint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vrgather(vint32m1_t vs2, size_t vs1, size_t vl);
vint32m2_t __riscv_vrgather(vint32m2_t vs2, vuint32m2_t vs1, size_t vl);
vint32m2_t __riscv_vrgather(vint32m2_t vs2, size_t vs1, size_t vl);
vint32m4_t __riscv_vrgather(vint32m4_t vs2, vuint32m4_t vs1, size_t vl);
vint32m4_t __riscv_vrgather(vint32m4_t vs2, size_t vs1, size_t vl);
vint32m8_t __riscv_vrgather(vint32m8_t vs2, vuint32m8_t vs1, size_t vl);
vint32m8_t __riscv_vrgather(vint32m8_t vs2, size_t vs1, size_t vl);
vint64m1_t __riscv_vrgather(vint64m1_t vs2, vuint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vrgather(vint64m1_t vs2, size_t vs1, size_t vl);
vint64m2_t __riscv_vrgather(vint64m2_t vs2, vuint64m2_t vs1, size_t vl);
vint64m2_t __riscv_vrgather(vint64m2_t vs2, size_t vs1, size_t vl);
vint64m4_t __riscv_vrgather(vint64m4_t vs2, vuint64m4_t vs1, size_t vl);
vint64m4_t __riscv_vrgather(vint64m4_t vs2, size_t vs1, size_t vl);
vint64m8_t __riscv_vrgather(vint64m8_t vs2, vuint64m8_t vs1, size_t vl);
vint64m8_t __riscv_vrgather(vint64m8_t vs2, size_t vs1, size_t vl);
vint8mf8_t __riscv_vrgatherei16(vint8mf8_t vs2, vuint16mf4_t vs1, size_t vl);
vint8mf4_t __riscv_vrgatherei16(vint8mf4_t vs2, vuint16mf2_t vs1, size_t vl);
vint8mf2_t __riscv_vrgatherei16(vint8mf2_t vs2, vuint16m1_t vs1, size_t vl);
vint8m1_t __riscv_vrgatherei16(vint8m1_t vs2, vuint16m2_t vs1, size_t vl);
vint8m2_t __riscv_vrgatherei16(vint8m2_t vs2, vuint16m4_t vs1, size_t vl);
vint8m4_t __riscv_vrgatherei16(vint8m4_t vs2, vuint16m8_t vs1, size_t vl);
vint16mf4_t __riscv_vrgatherei16(vint16mf4_t vs2, vuint16mf4_t vs1, size_t vl);
vint16mf2_t __riscv_vrgatherei16(vint16mf2_t vs2, vuint16mf2_t vs1, size_t vl);
vint16m1_t __riscv_vrgatherei16(vint16m1_t vs2, vuint16m1_t vs1, size_t vl);
vint16m2_t __riscv_vrgatherei16(vint16m2_t vs2, vuint16m2_t vs1, size_t vl);
vint16m4_t __riscv_vrgatherei16(vint16m4_t vs2, vuint16m4_t vs1, size_t vl);
vint16m8_t __riscv_vrgatherei16(vint16m8_t vs2, vuint16m8_t vs1, size_t vl);
vint32mf2_t __riscv_vrgatherei16(vint32mf2_t vs2, vuint16mf4_t vs1, size_t vl);
vint32m1_t __riscv_vrgatherei16(vint32m1_t vs2, vuint16mf2_t vs1, size_t vl);
vint32m2_t __riscv_vrgatherei16(vint32m2_t vs2, vuint16m1_t vs1, size_t vl);
vint32m4_t __riscv_vrgatherei16(vint32m4_t vs2, vuint16m2_t vs1, size_t vl);
vint32m8_t __riscv_vrgatherei16(vint32m8_t vs2, vuint16m4_t vs1, size_t vl);
vint64m1_t __riscv_vrgatherei16(vint64m1_t vs2, vuint16mf4_t vs1, size_t vl);
vint64m2_t __riscv_vrgatherei16(vint64m2_t vs2, vuint16mf2_t vs1, size_t vl);
vint64m4_t __riscv_vrgatherei16(vint64m4_t vs2, vuint16m1_t vs1, size_t vl);
vint64m8_t __riscv_vrgatherei16(vint64m8_t vs2, vuint16m2_t vs1, size_t vl);
vuint8mf8_t __riscv_vrgather(vuint8mf8_t vs2, vuint8mf8_t vs1, size_t vl);
vuint8mf8_t __riscv_vrgather(vuint8mf8_t vs2, size_t vs1, size_t vl);
vuint8mf4_t __riscv_vrgather(vuint8mf4_t vs2, vuint8mf4_t vs1, size_t vl);
vuint8mf4_t __riscv_vrgather(vuint8mf4_t vs2, size_t vs1, size_t vl);
vuint8mf2_t __riscv_vrgather(vuint8mf2_t vs2, vuint8mf2_t vs1, size_t vl);
vuint8mf2_t __riscv_vrgather(vuint8mf2_t vs2, size_t vs1, size_t vl);
vuint8m1_t __riscv_vrgather(vuint8m1_t vs2, vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vrgather(vuint8m1_t vs2, size_t vs1, size_t vl);
vuint8m2_t __riscv_vrgather(vuint8m2_t vs2, vuint8m2_t vs1, size_t vl);
vuint8m2_t __riscv_vrgather(vuint8m2_t vs2, size_t vs1, size_t vl);
vuint8m4_t __riscv_vrgather(vuint8m4_t vs2, vuint8m4_t vs1, size_t vl);
vuint8m4_t __riscv_vrgather(vuint8m4_t vs2, size_t vs1, size_t vl);
vuint8m8_t __riscv_vrgather(vuint8m8_t vs2, vuint8m8_t vs1, size_t vl);
vuint8m8_t __riscv_vrgather(vuint8m8_t vs2, size_t vs1, size_t vl);
vuint16mf4_t __riscv_vrgather(vuint16mf4_t vs2, vuint16mf4_t vs1, size_t vl);
vuint16mf4_t __riscv_vrgather(vuint16mf4_t vs2, size_t vs1, size_t vl);
vuint16mf2_t __riscv_vrgather(vuint16mf2_t vs2, vuint16mf2_t vs1, size_t vl);
vuint16mf2_t __riscv_vrgather(vuint16mf2_t vs2, size_t vs1, size_t vl);
vuint16m1_t __riscv_vrgather(vuint16m1_t vs2, vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vrgather(vuint16m1_t vs2, size_t vs1, size_t vl);
vuint16m2_t __riscv_vrgather(vuint16m2_t vs2, vuint16m2_t vs1, size_t vl);
vuint16m2_t __riscv_vrgather(vuint16m2_t vs2, size_t vs1, size_t vl);
vuint16m4_t __riscv_vrgather(vuint16m4_t vs2, vuint16m4_t vs1, size_t vl);
vuint16m4_t __riscv_vrgather(vuint16m4_t vs2, size_t vs1, size_t vl);
vuint16m8_t __riscv_vrgather(vuint16m8_t vs2, vuint16m8_t vs1, size_t vl);
vuint16m8_t __riscv_vrgather(vuint16m8_t vs2, size_t vs1, size_t vl);
vuint32mf2_t __riscv_vrgather(vuint32mf2_t vs2, vuint32mf2_t vs1, size_t vl);
vuint32mf2_t __riscv_vrgather(vuint32mf2_t vs2, size_t vs1, size_t vl);
vuint32m1_t __riscv_vrgather(vuint32m1_t vs2, vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vrgather(vuint32m1_t vs2, size_t vs1, size_t vl);
vuint32m2_t __riscv_vrgather(vuint32m2_t vs2, vuint32m2_t vs1, size_t vl);
vuint32m2_t __riscv_vrgather(vuint32m2_t vs2, size_t vs1, size_t vl);
vuint32m4_t __riscv_vrgather(vuint32m4_t vs2, vuint32m4_t vs1, size_t vl);
vuint32m4_t __riscv_vrgather(vuint32m4_t vs2, size_t vs1, size_t vl);
vuint32m8_t __riscv_vrgather(vuint32m8_t vs2, vuint32m8_t vs1, size_t vl);
vuint32m8_t __riscv_vrgather(vuint32m8_t vs2, size_t vs1, size_t vl);
vuint64m1_t __riscv_vrgather(vuint64m1_t vs2, vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vrgather(vuint64m1_t vs2, size_t vs1, size_t vl);
vuint64m2_t __riscv_vrgather(vuint64m2_t vs2, vuint64m2_t vs1, size_t vl);
vuint64m2_t __riscv_vrgather(vuint64m2_t vs2, size_t vs1, size_t vl);
vuint64m4_t __riscv_vrgather(vuint64m4_t vs2, vuint64m4_t vs1, size_t vl);
vuint64m4_t __riscv_vrgather(vuint64m4_t vs2, size_t vs1, size_t vl);
vuint64m8_t __riscv_vrgather(vuint64m8_t vs2, vuint64m8_t vs1, size_t vl);
vuint64m8_t __riscv_vrgather(vuint64m8_t vs2, size_t vs1, size_t vl);
vuint8mf8_t __riscv_vrgatherei16(vuint8mf8_t vs2, vuint16mf4_t vs1, size_t vl);
vuint8mf4_t __riscv_vrgatherei16(vuint8mf4_t vs2, vuint16mf2_t vs1, size_t vl);
vuint8mf2_t __riscv_vrgatherei16(vuint8mf2_t vs2, vuint16m1_t vs1, size_t vl);
vuint8m1_t __riscv_vrgatherei16(vuint8m1_t vs2, vuint16m2_t vs1, size_t vl);
vuint8m2_t __riscv_vrgatherei16(vuint8m2_t vs2, vuint16m4_t vs1, size_t vl);
vuint8m4_t __riscv_vrgatherei16(vuint8m4_t vs2, vuint16m8_t vs1, size_t vl);
vuint16mf4_t __riscv_vrgatherei16(vuint16mf4_t vs2, vuint16mf4_t vs1,
                                  size_t vl);
vuint16mf2_t __riscv_vrgatherei16(vuint16mf2_t vs2, vuint16mf2_t vs1,
                                  size_t vl);
vuint16m1_t __riscv_vrgatherei16(vuint16m1_t vs2, vuint16m1_t vs1, size_t vl);
vuint16m2_t __riscv_vrgatherei16(vuint16m2_t vs2, vuint16m2_t vs1, size_t vl);
vuint16m4_t __riscv_vrgatherei16(vuint16m4_t vs2, vuint16m4_t vs1, size_t vl);
vuint16m8_t __riscv_vrgatherei16(vuint16m8_t vs2, vuint16m8_t vs1, size_t vl);
vuint32mf2_t __riscv_vrgatherei16(vuint32mf2_t vs2, vuint16mf4_t vs1,
                                  size_t vl);
vuint32m1_t __riscv_vrgatherei16(vuint32m1_t vs2, vuint16mf2_t vs1, size_t vl);
vuint32m2_t __riscv_vrgatherei16(vuint32m2_t vs2, vuint16m1_t vs1, size_t vl);
vuint32m4_t __riscv_vrgatherei16(vuint32m4_t vs2, vuint16m2_t vs1, size_t vl);
vuint32m8_t __riscv_vrgatherei16(vuint32m8_t vs2, vuint16m4_t vs1, size_t vl);
vuint64m1_t __riscv_vrgatherei16(vuint64m1_t vs2, vuint16mf4_t vs1, size_t vl);
vuint64m2_t __riscv_vrgatherei16(vuint64m2_t vs2, vuint16mf2_t vs1, size_t vl);
vuint64m4_t __riscv_vrgatherei16(vuint64m4_t vs2, vuint16m1_t vs1, size_t vl);
vuint64m8_t __riscv_vrgatherei16(vuint64m8_t vs2, vuint16m2_t vs1, size_t vl);
// masked functions
vfloat16mf4_t __riscv_vrgather(vbool64_t vm, vfloat16mf4_t vs2,
                               vuint16mf4_t vs1, size_t vl);
vfloat16mf4_t __riscv_vrgather(vbool64_t vm, vfloat16mf4_t vs2, size_t vs1,
                               size_t vl);
vfloat16mf2_t __riscv_vrgather(vbool32_t vm, vfloat16mf2_t vs2,
                               vuint16mf2_t vs1, size_t vl);
vfloat16mf2_t __riscv_vrgather(vbool32_t vm, vfloat16mf2_t vs2, size_t vs1,
                               size_t vl);
vfloat16m1_t __riscv_vrgather(vbool16_t vm, vfloat16m1_t vs2, vuint16m1_t vs1,
                              size_t vl);
vfloat16m1_t __riscv_vrgather(vbool16_t vm, vfloat16m1_t vs2, size_t vs1,
                              size_t vl);
vfloat16m2_t __riscv_vrgather(vbool8_t vm, vfloat16m2_t vs2, vuint16m2_t vs1,
                              size_t vl);
vfloat16m2_t __riscv_vrgather(vbool8_t vm, vfloat16m2_t vs2, size_t vs1,
                              size_t vl);
vfloat16m4_t __riscv_vrgather(vbool4_t vm, vfloat16m4_t vs2, vuint16m4_t vs1,
                              size_t vl);
vfloat16m4_t __riscv_vrgather(vbool4_t vm, vfloat16m4_t vs2, size_t vs1,
                              size_t vl);
vfloat16m8_t __riscv_vrgather(vbool2_t vm, vfloat16m8_t vs2, vuint16m8_t vs1,
                              size_t vl);
vfloat16m8_t __riscv_vrgather(vbool2_t vm, vfloat16m8_t vs2, size_t vs1,
                              size_t vl);
vfloat32mf2_t __riscv_vrgather(vbool64_t vm, vfloat32mf2_t vs2,
                               vuint32mf2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vrgather(vbool64_t vm, vfloat32mf2_t vs2, size_t vs1,
                               size_t vl);
vfloat32m1_t __riscv_vrgather(vbool32_t vm, vfloat32m1_t vs2, vuint32m1_t vs1,
                              size_t vl);
vfloat32m1_t __riscv_vrgather(vbool32_t vm, vfloat32m1_t vs2, size_t vs1,
                              size_t vl);
vfloat32m2_t __riscv_vrgather(vbool16_t vm, vfloat32m2_t vs2, vuint32m2_t vs1,
                              size_t vl);
vfloat32m2_t __riscv_vrgather(vbool16_t vm, vfloat32m2_t vs2, size_t vs1,
                              size_t vl);
vfloat32m4_t __riscv_vrgather(vbool8_t vm, vfloat32m4_t vs2, vuint32m4_t vs1,
                              size_t vl);
vfloat32m4_t __riscv_vrgather(vbool8_t vm, vfloat32m4_t vs2, size_t vs1,
                              size_t vl);
vfloat32m8_t __riscv_vrgather(vbool4_t vm, vfloat32m8_t vs2, vuint32m8_t vs1,
                              size_t vl);
vfloat32m8_t __riscv_vrgather(vbool4_t vm, vfloat32m8_t vs2, size_t vs1,
                              size_t vl);
vfloat64m1_t __riscv_vrgather(vbool64_t vm, vfloat64m1_t vs2, vuint64m1_t vs1,
                              size_t vl);
vfloat64m1_t __riscv_vrgather(vbool64_t vm, vfloat64m1_t vs2, size_t vs1,
                              size_t vl);
vfloat64m2_t __riscv_vrgather(vbool32_t vm, vfloat64m2_t vs2, vuint64m2_t vs1,
                              size_t vl);
vfloat64m2_t __riscv_vrgather(vbool32_t vm, vfloat64m2_t vs2, size_t vs1,
                              size_t vl);
vfloat64m4_t __riscv_vrgather(vbool16_t vm, vfloat64m4_t vs2, vuint64m4_t vs1,
                              size_t vl);
vfloat64m4_t __riscv_vrgather(vbool16_t vm, vfloat64m4_t vs2, size_t vs1,
                              size_t vl);
vfloat64m8_t __riscv_vrgather(vbool8_t vm, vfloat64m8_t vs2, vuint64m8_t vs1,
                              size_t vl);
vfloat64m8_t __riscv_vrgather(vbool8_t vm, vfloat64m8_t vs2, size_t vs1,
                              size_t vl);
vfloat16mf4_t __riscv_vrgatherei16(vbool64_t vm, vfloat16mf4_t vs2,
                                   vuint16mf4_t vs1, size_t vl);
vfloat16mf2_t __riscv_vrgatherei16(vbool32_t vm, vfloat16mf2_t vs2,
                                   vuint16mf2_t vs1, size_t vl);
vfloat16m1_t __riscv_vrgatherei16(vbool16_t vm, vfloat16m1_t vs2,
                                  vuint16m1_t vs1, size_t vl);
vfloat16m2_t __riscv_vrgatherei16(vbool8_t vm, vfloat16m2_t vs2,
                                  vuint16m2_t vs1, size_t vl);
vfloat16m4_t __riscv_vrgatherei16(vbool4_t vm, vfloat16m4_t vs2,
                                  vuint16m4_t vs1, size_t vl);
vfloat16m8_t __riscv_vrgatherei16(vbool2_t vm, vfloat16m8_t vs2,
                                  vuint16m8_t vs1, size_t vl);
vfloat32mf2_t __riscv_vrgatherei16(vbool64_t vm, vfloat32mf2_t vs2,
                                   vuint16mf4_t vs1, size_t vl);
vfloat32m1_t __riscv_vrgatherei16(vbool32_t vm, vfloat32m1_t vs2,
                                  vuint16mf2_t vs1, size_t vl);
vfloat32m2_t __riscv_vrgatherei16(vbool16_t vm, vfloat32m2_t vs2,
                                  vuint16m1_t vs1, size_t vl);
vfloat32m4_t __riscv_vrgatherei16(vbool8_t vm, vfloat32m4_t vs2,
                                  vuint16m2_t vs1, size_t vl);
vfloat32m8_t __riscv_vrgatherei16(vbool4_t vm, vfloat32m8_t vs2,
                                  vuint16m4_t vs1, size_t vl);
vfloat64m1_t __riscv_vrgatherei16(vbool64_t vm, vfloat64m1_t vs2,
                                  vuint16mf4_t vs1, size_t vl);
vfloat64m2_t __riscv_vrgatherei16(vbool32_t vm, vfloat64m2_t vs2,
                                  vuint16mf2_t vs1, size_t vl);
vfloat64m4_t __riscv_vrgatherei16(vbool16_t vm, vfloat64m4_t vs2,
                                  vuint16m1_t vs1, size_t vl);
vfloat64m8_t __riscv_vrgatherei16(vbool8_t vm, vfloat64m8_t vs2,
                                  vuint16m2_t vs1, size_t vl);
vint8mf8_t __riscv_vrgather(vbool64_t vm, vint8mf8_t vs2, vuint8mf8_t vs1,
                            size_t vl);
vint8mf8_t __riscv_vrgather(vbool64_t vm, vint8mf8_t vs2, size_t vs1,
                            size_t vl);
vint8mf4_t __riscv_vrgather(vbool32_t vm, vint8mf4_t vs2, vuint8mf4_t vs1,
                            size_t vl);
vint8mf4_t __riscv_vrgather(vbool32_t vm, vint8mf4_t vs2, size_t vs1,
                            size_t vl);
vint8mf2_t __riscv_vrgather(vbool16_t vm, vint8mf2_t vs2, vuint8mf2_t vs1,
                            size_t vl);
vint8mf2_t __riscv_vrgather(vbool16_t vm, vint8mf2_t vs2, size_t vs1,
                            size_t vl);
vint8m1_t __riscv_vrgather(vbool8_t vm, vint8m1_t vs2, vuint8m1_t vs1,
                           size_t vl);
vint8m1_t __riscv_vrgather(vbool8_t vm, vint8m1_t vs2, size_t vs1, size_t vl);
vint8m2_t __riscv_vrgather(vbool4_t vm, vint8m2_t vs2, vuint8m2_t vs1,
                           size_t vl);
vint8m2_t __riscv_vrgather(vbool4_t vm, vint8m2_t vs2, size_t vs1, size_t vl);
vint8m4_t __riscv_vrgather(vbool2_t vm, vint8m4_t vs2, vuint8m4_t vs1,
                           size_t vl);
vint8m4_t __riscv_vrgather(vbool2_t vm, vint8m4_t vs2, size_t vs1, size_t vl);
vint8m8_t __riscv_vrgather(vbool1_t vm, vint8m8_t vs2, vuint8m8_t vs1,
                           size_t vl);
vint8m8_t __riscv_vrgather(vbool1_t vm, vint8m8_t vs2, size_t vs1, size_t vl);
vint16mf4_t __riscv_vrgather(vbool64_t vm, vint16mf4_t vs2, vuint16mf4_t vs1,
                             size_t vl);
vint16mf4_t __riscv_vrgather(vbool64_t vm, vint16mf4_t vs2, size_t vs1,
                             size_t vl);
vint16mf2_t __riscv_vrgather(vbool32_t vm, vint16mf2_t vs2, vuint16mf2_t vs1,
                             size_t vl);
vint16mf2_t __riscv_vrgather(vbool32_t vm, vint16mf2_t vs2, size_t vs1,
                             size_t vl);
vint16m1_t __riscv_vrgather(vbool16_t vm, vint16m1_t vs2, vuint16m1_t vs1,
                            size_t vl);
vint16m1_t __riscv_vrgather(vbool16_t vm, vint16m1_t vs2, size_t vs1,
                            size_t vl);
vint16m2_t __riscv_vrgather(vbool8_t vm, vint16m2_t vs2, vuint16m2_t vs1,
                            size_t vl);
vint16m2_t __riscv_vrgather(vbool8_t vm, vint16m2_t vs2, size_t vs1, size_t vl);
vint16m4_t __riscv_vrgather(vbool4_t vm, vint16m4_t vs2, vuint16m4_t vs1,
                            size_t vl);
vint16m4_t __riscv_vrgather(vbool4_t vm, vint16m4_t vs2, size_t vs1, size_t vl);
vint16m8_t __riscv_vrgather(vbool2_t vm, vint16m8_t vs2, vuint16m8_t vs1,
                            size_t vl);
vint16m8_t __riscv_vrgather(vbool2_t vm, vint16m8_t vs2, size_t vs1, size_t vl);
vint32mf2_t __riscv_vrgather(vbool64_t vm, vint32mf2_t vs2, vuint32mf2_t vs1,
                             size_t vl);
vint32mf2_t __riscv_vrgather(vbool64_t vm, vint32mf2_t vs2, size_t vs1,
                             size_t vl);
vint32m1_t __riscv_vrgather(vbool32_t vm, vint32m1_t vs2, vuint32m1_t vs1,
                            size_t vl);
vint32m1_t __riscv_vrgather(vbool32_t vm, vint32m1_t vs2, size_t vs1,
                            size_t vl);
vint32m2_t __riscv_vrgather(vbool16_t vm, vint32m2_t vs2, vuint32m2_t vs1,
                            size_t vl);
vint32m2_t __riscv_vrgather(vbool16_t vm, vint32m2_t vs2, size_t vs1,
                            size_t vl);
vint32m4_t __riscv_vrgather(vbool8_t vm, vint32m4_t vs2, vuint32m4_t vs1,
                            size_t vl);
vint32m4_t __riscv_vrgather(vbool8_t vm, vint32m4_t vs2, size_t vs1, size_t vl);
vint32m8_t __riscv_vrgather(vbool4_t vm, vint32m8_t vs2, vuint32m8_t vs1,
                            size_t vl);
vint32m8_t __riscv_vrgather(vbool4_t vm, vint32m8_t vs2, size_t vs1, size_t vl);
vint64m1_t __riscv_vrgather(vbool64_t vm, vint64m1_t vs2, vuint64m1_t vs1,
                            size_t vl);
vint64m1_t __riscv_vrgather(vbool64_t vm, vint64m1_t vs2, size_t vs1,
                            size_t vl);
vint64m2_t __riscv_vrgather(vbool32_t vm, vint64m2_t vs2, vuint64m2_t vs1,
                            size_t vl);
vint64m2_t __riscv_vrgather(vbool32_t vm, vint64m2_t vs2, size_t vs1,
                            size_t vl);
vint64m4_t __riscv_vrgather(vbool16_t vm, vint64m4_t vs2, vuint64m4_t vs1,
                            size_t vl);
vint64m4_t __riscv_vrgather(vbool16_t vm, vint64m4_t vs2, size_t vs1,
                            size_t vl);
vint64m8_t __riscv_vrgather(vbool8_t vm, vint64m8_t vs2, vuint64m8_t vs1,
                            size_t vl);
vint64m8_t __riscv_vrgather(vbool8_t vm, vint64m8_t vs2, size_t vs1, size_t vl);
vint8mf8_t __riscv_vrgatherei16(vbool64_t vm, vint8mf8_t vs2, vuint16mf4_t vs1,
                                size_t vl);
vint8mf4_t __riscv_vrgatherei16(vbool32_t vm, vint8mf4_t vs2, vuint16mf2_t vs1,
                                size_t vl);
vint8mf2_t __riscv_vrgatherei16(vbool16_t vm, vint8mf2_t vs2, vuint16m1_t vs1,
                                size_t vl);
vint8m1_t __riscv_vrgatherei16(vbool8_t vm, vint8m1_t vs2, vuint16m2_t vs1,
                               size_t vl);
vint8m2_t __riscv_vrgatherei16(vbool4_t vm, vint8m2_t vs2, vuint16m4_t vs1,
                               size_t vl);
vint8m4_t __riscv_vrgatherei16(vbool2_t vm, vint8m4_t vs2, vuint16m8_t vs1,
                               size_t vl);
vint16mf4_t __riscv_vrgatherei16(vbool64_t vm, vint16mf4_t vs2,
                                 vuint16mf4_t vs1, size_t vl);
vint16mf2_t __riscv_vrgatherei16(vbool32_t vm, vint16mf2_t vs2,
                                 vuint16mf2_t vs1, size_t vl);
vint16m1_t __riscv_vrgatherei16(vbool16_t vm, vint16m1_t vs2, vuint16m1_t vs1,
                                size_t vl);
vint16m2_t __riscv_vrgatherei16(vbool8_t vm, vint16m2_t vs2, vuint16m2_t vs1,
                                size_t vl);
vint16m4_t __riscv_vrgatherei16(vbool4_t vm, vint16m4_t vs2, vuint16m4_t vs1,
                                size_t vl);
vint16m8_t __riscv_vrgatherei16(vbool2_t vm, vint16m8_t vs2, vuint16m8_t vs1,
                                size_t vl);
vint32mf2_t __riscv_vrgatherei16(vbool64_t vm, vint32mf2_t vs2,
                                 vuint16mf4_t vs1, size_t vl);
vint32m1_t __riscv_vrgatherei16(vbool32_t vm, vint32m1_t vs2, vuint16mf2_t vs1,
                                size_t vl);
vint32m2_t __riscv_vrgatherei16(vbool16_t vm, vint32m2_t vs2, vuint16m1_t vs1,
                                size_t vl);
vint32m4_t __riscv_vrgatherei16(vbool8_t vm, vint32m4_t vs2, vuint16m2_t vs1,
                                size_t vl);
vint32m8_t __riscv_vrgatherei16(vbool4_t vm, vint32m8_t vs2, vuint16m4_t vs1,
                                size_t vl);
vint64m1_t __riscv_vrgatherei16(vbool64_t vm, vint64m1_t vs2, vuint16mf4_t vs1,
                                size_t vl);
vint64m2_t __riscv_vrgatherei16(vbool32_t vm, vint64m2_t vs2, vuint16mf2_t vs1,
                                size_t vl);
vint64m4_t __riscv_vrgatherei16(vbool16_t vm, vint64m4_t vs2, vuint16m1_t vs1,
                                size_t vl);
vint64m8_t __riscv_vrgatherei16(vbool8_t vm, vint64m8_t vs2, vuint16m2_t vs1,
                                size_t vl);
vuint8mf8_t __riscv_vrgather(vbool64_t vm, vuint8mf8_t vs2, vuint8mf8_t vs1,
                             size_t vl);
vuint8mf8_t __riscv_vrgather(vbool64_t vm, vuint8mf8_t vs2, size_t vs1,
                             size_t vl);
vuint8mf4_t __riscv_vrgather(vbool32_t vm, vuint8mf4_t vs2, vuint8mf4_t vs1,
                             size_t vl);
vuint8mf4_t __riscv_vrgather(vbool32_t vm, vuint8mf4_t vs2, size_t vs1,
                             size_t vl);
vuint8mf2_t __riscv_vrgather(vbool16_t vm, vuint8mf2_t vs2, vuint8mf2_t vs1,
                             size_t vl);
vuint8mf2_t __riscv_vrgather(vbool16_t vm, vuint8mf2_t vs2, size_t vs1,
                             size_t vl);
vuint8m1_t __riscv_vrgather(vbool8_t vm, vuint8m1_t vs2, vuint8m1_t vs1,
                            size_t vl);
vuint8m1_t __riscv_vrgather(vbool8_t vm, vuint8m1_t vs2, size_t vs1, size_t vl);
vuint8m2_t __riscv_vrgather(vbool4_t vm, vuint8m2_t vs2, vuint8m2_t vs1,
                            size_t vl);
vuint8m2_t __riscv_vrgather(vbool4_t vm, vuint8m2_t vs2, size_t vs1, size_t vl);
vuint8m4_t __riscv_vrgather(vbool2_t vm, vuint8m4_t vs2, vuint8m4_t vs1,
                            size_t vl);
vuint8m4_t __riscv_vrgather(vbool2_t vm, vuint8m4_t vs2, size_t vs1, size_t vl);
vuint8m8_t __riscv_vrgather(vbool1_t vm, vuint8m8_t vs2, vuint8m8_t vs1,
                            size_t vl);
vuint8m8_t __riscv_vrgather(vbool1_t vm, vuint8m8_t vs2, size_t vs1, size_t vl);
vuint16mf4_t __riscv_vrgather(vbool64_t vm, vuint16mf4_t vs2, vuint16mf4_t vs1,
                              size_t vl);
vuint16mf4_t __riscv_vrgather(vbool64_t vm, vuint16mf4_t vs2, size_t vs1,
                              size_t vl);
vuint16mf2_t __riscv_vrgather(vbool32_t vm, vuint16mf2_t vs2, vuint16mf2_t vs1,
                              size_t vl);
vuint16mf2_t __riscv_vrgather(vbool32_t vm, vuint16mf2_t vs2, size_t vs1,
                              size_t vl);
vuint16m1_t __riscv_vrgather(vbool16_t vm, vuint16m1_t vs2, vuint16m1_t vs1,
                             size_t vl);
vuint16m1_t __riscv_vrgather(vbool16_t vm, vuint16m1_t vs2, size_t vs1,
                             size_t vl);
vuint16m2_t __riscv_vrgather(vbool8_t vm, vuint16m2_t vs2, vuint16m2_t vs1,
                             size_t vl);
vuint16m2_t __riscv_vrgather(vbool8_t vm, vuint16m2_t vs2, size_t vs1,
                             size_t vl);
vuint16m4_t __riscv_vrgather(vbool4_t vm, vuint16m4_t vs2, vuint16m4_t vs1,
                             size_t vl);
vuint16m4_t __riscv_vrgather(vbool4_t vm, vuint16m4_t vs2, size_t vs1,
                             size_t vl);
vuint16m8_t __riscv_vrgather(vbool2_t vm, vuint16m8_t vs2, vuint16m8_t vs1,
                             size_t vl);
vuint16m8_t __riscv_vrgather(vbool2_t vm, vuint16m8_t vs2, size_t vs1,
                             size_t vl);
vuint32mf2_t __riscv_vrgather(vbool64_t vm, vuint32mf2_t vs2, vuint32mf2_t vs1,
                              size_t vl);
vuint32mf2_t __riscv_vrgather(vbool64_t vm, vuint32mf2_t vs2, size_t vs1,
                              size_t vl);
vuint32m1_t __riscv_vrgather(vbool32_t vm, vuint32m1_t vs2, vuint32m1_t vs1,
                             size_t vl);
vuint32m1_t __riscv_vrgather(vbool32_t vm, vuint32m1_t vs2, size_t vs1,
                             size_t vl);
vuint32m2_t __riscv_vrgather(vbool16_t vm, vuint32m2_t vs2, vuint32m2_t vs1,
                             size_t vl);
vuint32m2_t __riscv_vrgather(vbool16_t vm, vuint32m2_t vs2, size_t vs1,
                             size_t vl);
vuint32m4_t __riscv_vrgather(vbool8_t vm, vuint32m4_t vs2, vuint32m4_t vs1,
                             size_t vl);
vuint32m4_t __riscv_vrgather(vbool8_t vm, vuint32m4_t vs2, size_t vs1,
                             size_t vl);
vuint32m8_t __riscv_vrgather(vbool4_t vm, vuint32m8_t vs2, vuint32m8_t vs1,
                             size_t vl);
vuint32m8_t __riscv_vrgather(vbool4_t vm, vuint32m8_t vs2, size_t vs1,
                             size_t vl);
vuint64m1_t __riscv_vrgather(vbool64_t vm, vuint64m1_t vs2, vuint64m1_t vs1,
                             size_t vl);
vuint64m1_t __riscv_vrgather(vbool64_t vm, vuint64m1_t vs2, size_t vs1,
                             size_t vl);
vuint64m2_t __riscv_vrgather(vbool32_t vm, vuint64m2_t vs2, vuint64m2_t vs1,
                             size_t vl);
vuint64m2_t __riscv_vrgather(vbool32_t vm, vuint64m2_t vs2, size_t vs1,
                             size_t vl);
vuint64m4_t __riscv_vrgather(vbool16_t vm, vuint64m4_t vs2, vuint64m4_t vs1,
                             size_t vl);
vuint64m4_t __riscv_vrgather(vbool16_t vm, vuint64m4_t vs2, size_t vs1,
                             size_t vl);
vuint64m8_t __riscv_vrgather(vbool8_t vm, vuint64m8_t vs2, vuint64m8_t vs1,
                             size_t vl);
vuint64m8_t __riscv_vrgather(vbool8_t vm, vuint64m8_t vs2, size_t vs1,
                             size_t vl);
vuint8mf8_t __riscv_vrgatherei16(vbool64_t vm, vuint8mf8_t vs2,
                                 vuint16mf4_t vs1, size_t vl);
vuint8mf4_t __riscv_vrgatherei16(vbool32_t vm, vuint8mf4_t vs2,
                                 vuint16mf2_t vs1, size_t vl);
vuint8mf2_t __riscv_vrgatherei16(vbool16_t vm, vuint8mf2_t vs2, vuint16m1_t vs1,
                                 size_t vl);
vuint8m1_t __riscv_vrgatherei16(vbool8_t vm, vuint8m1_t vs2, vuint16m2_t vs1,
                                size_t vl);
vuint8m2_t __riscv_vrgatherei16(vbool4_t vm, vuint8m2_t vs2, vuint16m4_t vs1,
                                size_t vl);
vuint8m4_t __riscv_vrgatherei16(vbool2_t vm, vuint8m4_t vs2, vuint16m8_t vs1,
                                size_t vl);
vuint16mf4_t __riscv_vrgatherei16(vbool64_t vm, vuint16mf4_t vs2,
                                  vuint16mf4_t vs1, size_t vl);
vuint16mf2_t __riscv_vrgatherei16(vbool32_t vm, vuint16mf2_t vs2,
                                  vuint16mf2_t vs1, size_t vl);
vuint16m1_t __riscv_vrgatherei16(vbool16_t vm, vuint16m1_t vs2, vuint16m1_t vs1,
                                 size_t vl);
vuint16m2_t __riscv_vrgatherei16(vbool8_t vm, vuint16m2_t vs2, vuint16m2_t vs1,
                                 size_t vl);
vuint16m4_t __riscv_vrgatherei16(vbool4_t vm, vuint16m4_t vs2, vuint16m4_t vs1,
                                 size_t vl);
vuint16m8_t __riscv_vrgatherei16(vbool2_t vm, vuint16m8_t vs2, vuint16m8_t vs1,
                                 size_t vl);
vuint32mf2_t __riscv_vrgatherei16(vbool64_t vm, vuint32mf2_t vs2,
                                  vuint16mf4_t vs1, size_t vl);
vuint32m1_t __riscv_vrgatherei16(vbool32_t vm, vuint32m1_t vs2,
                                 vuint16mf2_t vs1, size_t vl);
vuint32m2_t __riscv_vrgatherei16(vbool16_t vm, vuint32m2_t vs2, vuint16m1_t vs1,
                                 size_t vl);
vuint32m4_t __riscv_vrgatherei16(vbool8_t vm, vuint32m4_t vs2, vuint16m2_t vs1,
                                 size_t vl);
vuint32m8_t __riscv_vrgatherei16(vbool4_t vm, vuint32m8_t vs2, vuint16m4_t vs1,
                                 size_t vl);
vuint64m1_t __riscv_vrgatherei16(vbool64_t vm, vuint64m1_t vs2,
                                 vuint16mf4_t vs1, size_t vl);
vuint64m2_t __riscv_vrgatherei16(vbool32_t vm, vuint64m2_t vs2,
                                 vuint16mf2_t vs1, size_t vl);
vuint64m4_t __riscv_vrgatherei16(vbool16_t vm, vuint64m4_t vs2, vuint16m1_t vs1,
                                 size_t vl);
vuint64m8_t __riscv_vrgatherei16(vbool8_t vm, vuint64m8_t vs2, vuint16m2_t vs1,
                                 size_t vl);

Vector Compress Intrinsics

vfloat16mf4_t __riscv_vcompress(vfloat16mf4_t vs2, vbool64_t vs1, size_t vl);
vfloat16mf2_t __riscv_vcompress(vfloat16mf2_t vs2, vbool32_t vs1, size_t vl);
vfloat16m1_t __riscv_vcompress(vfloat16m1_t vs2, vbool16_t vs1, size_t vl);
vfloat16m2_t __riscv_vcompress(vfloat16m2_t vs2, vbool8_t vs1, size_t vl);
vfloat16m4_t __riscv_vcompress(vfloat16m4_t vs2, vbool4_t vs1, size_t vl);
vfloat16m8_t __riscv_vcompress(vfloat16m8_t vs2, vbool2_t vs1, size_t vl);
vfloat32mf2_t __riscv_vcompress(vfloat32mf2_t vs2, vbool64_t vs1, size_t vl);
vfloat32m1_t __riscv_vcompress(vfloat32m1_t vs2, vbool32_t vs1, size_t vl);
vfloat32m2_t __riscv_vcompress(vfloat32m2_t vs2, vbool16_t vs1, size_t vl);
vfloat32m4_t __riscv_vcompress(vfloat32m4_t vs2, vbool8_t vs1, size_t vl);
vfloat32m8_t __riscv_vcompress(vfloat32m8_t vs2, vbool4_t vs1, size_t vl);
vfloat64m1_t __riscv_vcompress(vfloat64m1_t vs2, vbool64_t vs1, size_t vl);
vfloat64m2_t __riscv_vcompress(vfloat64m2_t vs2, vbool32_t vs1, size_t vl);
vfloat64m4_t __riscv_vcompress(vfloat64m4_t vs2, vbool16_t vs1, size_t vl);
vfloat64m8_t __riscv_vcompress(vfloat64m8_t vs2, vbool8_t vs1, size_t vl);
vint8mf8_t __riscv_vcompress(vint8mf8_t vs2, vbool64_t vs1, size_t vl);
vint8mf4_t __riscv_vcompress(vint8mf4_t vs2, vbool32_t vs1, size_t vl);
vint8mf2_t __riscv_vcompress(vint8mf2_t vs2, vbool16_t vs1, size_t vl);
vint8m1_t __riscv_vcompress(vint8m1_t vs2, vbool8_t vs1, size_t vl);
vint8m2_t __riscv_vcompress(vint8m2_t vs2, vbool4_t vs1, size_t vl);
vint8m4_t __riscv_vcompress(vint8m4_t vs2, vbool2_t vs1, size_t vl);
vint8m8_t __riscv_vcompress(vint8m8_t vs2, vbool1_t vs1, size_t vl);
vint16mf4_t __riscv_vcompress(vint16mf4_t vs2, vbool64_t vs1, size_t vl);
vint16mf2_t __riscv_vcompress(vint16mf2_t vs2, vbool32_t vs1, size_t vl);
vint16m1_t __riscv_vcompress(vint16m1_t vs2, vbool16_t vs1, size_t vl);
vint16m2_t __riscv_vcompress(vint16m2_t vs2, vbool8_t vs1, size_t vl);
vint16m4_t __riscv_vcompress(vint16m4_t vs2, vbool4_t vs1, size_t vl);
vint16m8_t __riscv_vcompress(vint16m8_t vs2, vbool2_t vs1, size_t vl);
vint32mf2_t __riscv_vcompress(vint32mf2_t vs2, vbool64_t vs1, size_t vl);
vint32m1_t __riscv_vcompress(vint32m1_t vs2, vbool32_t vs1, size_t vl);
vint32m2_t __riscv_vcompress(vint32m2_t vs2, vbool16_t vs1, size_t vl);
vint32m4_t __riscv_vcompress(vint32m4_t vs2, vbool8_t vs1, size_t vl);
vint32m8_t __riscv_vcompress(vint32m8_t vs2, vbool4_t vs1, size_t vl);
vint64m1_t __riscv_vcompress(vint64m1_t vs2, vbool64_t vs1, size_t vl);
vint64m2_t __riscv_vcompress(vint64m2_t vs2, vbool32_t vs1, size_t vl);
vint64m4_t __riscv_vcompress(vint64m4_t vs2, vbool16_t vs1, size_t vl);
vint64m8_t __riscv_vcompress(vint64m8_t vs2, vbool8_t vs1, size_t vl);
vuint8mf8_t __riscv_vcompress(vuint8mf8_t vs2, vbool64_t vs1, size_t vl);
vuint8mf4_t __riscv_vcompress(vuint8mf4_t vs2, vbool32_t vs1, size_t vl);
vuint8mf2_t __riscv_vcompress(vuint8mf2_t vs2, vbool16_t vs1, size_t vl);
vuint8m1_t __riscv_vcompress(vuint8m1_t vs2, vbool8_t vs1, size_t vl);
vuint8m2_t __riscv_vcompress(vuint8m2_t vs2, vbool4_t vs1, size_t vl);
vuint8m4_t __riscv_vcompress(vuint8m4_t vs2, vbool2_t vs1, size_t vl);
vuint8m8_t __riscv_vcompress(vuint8m8_t vs2, vbool1_t vs1, size_t vl);
vuint16mf4_t __riscv_vcompress(vuint16mf4_t vs2, vbool64_t vs1, size_t vl);
vuint16mf2_t __riscv_vcompress(vuint16mf2_t vs2, vbool32_t vs1, size_t vl);
vuint16m1_t __riscv_vcompress(vuint16m1_t vs2, vbool16_t vs1, size_t vl);
vuint16m2_t __riscv_vcompress(vuint16m2_t vs2, vbool8_t vs1, size_t vl);
vuint16m4_t __riscv_vcompress(vuint16m4_t vs2, vbool4_t vs1, size_t vl);
vuint16m8_t __riscv_vcompress(vuint16m8_t vs2, vbool2_t vs1, size_t vl);
vuint32mf2_t __riscv_vcompress(vuint32mf2_t vs2, vbool64_t vs1, size_t vl);
vuint32m1_t __riscv_vcompress(vuint32m1_t vs2, vbool32_t vs1, size_t vl);
vuint32m2_t __riscv_vcompress(vuint32m2_t vs2, vbool16_t vs1, size_t vl);
vuint32m4_t __riscv_vcompress(vuint32m4_t vs2, vbool8_t vs1, size_t vl);
vuint32m8_t __riscv_vcompress(vuint32m8_t vs2, vbool4_t vs1, size_t vl);
vuint64m1_t __riscv_vcompress(vuint64m1_t vs2, vbool64_t vs1, size_t vl);
vuint64m2_t __riscv_vcompress(vuint64m2_t vs2, vbool32_t vs1, size_t vl);
vuint64m4_t __riscv_vcompress(vuint64m4_t vs2, vbool16_t vs1, size_t vl);
vuint64m8_t __riscv_vcompress(vuint64m8_t vs2, vbool8_t vs1, size_t vl);
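
__riscv_vcompress packs the elements of vs2 whose corresponding mask bit in vs1
is set into the lowest-numbered elements of the result, in order. A minimal
sketch of stream compaction follows; it assumes __riscv_vmfge, __riscv_vcpop,
and the load/store/vsetvl intrinsics from other sections of this API.

#include <riscv_vector.h>

/* Sketch: copy only the non-negative elements of src to dst, packed
 * contiguously, and return how many elements were kept. */
size_t keep_nonnegative_f32(float *dst, const float *src, size_t n) {
  size_t kept = 0;
  for (size_t i = 0; i < n;) {
    size_t vl = __riscv_vsetvl_e32m1(n - i);
    vfloat32m1_t v = __riscv_vle32_v_f32m1(src + i, vl);
    vbool32_t keep = __riscv_vmfge(v, 0.0f, vl);          /* mask: v[k] >= 0 */
    vfloat32m1_t packed = __riscv_vcompress(v, keep, vl); /* pack to front */
    size_t cnt = __riscv_vcpop(keep, vl);                 /* kept-element count */
    __riscv_vse32(dst + kept, packed, cnt);               /* store prefix only */
    kept += cnt;
    i += vl;
  }
  return kept;
}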