Vector Loads and Stores Intrinsics

Vector Unit-Stride Load Intrinsics

// Unmasked unit-stride loads (vle8 / vle16 / vle32 / vle64): one prototype per
// element type (f16/f32/f64, i8..i64, u8..u64) and LMUL (mf8..m8).
//   rs1     - pointer to const elements of the same element type as the result
//   vl      - size_t vector-length argument (presumably the number of elements
//             to process; confirm against the RVV intrinsic specification)
//   returns - the vector type named by the intrinsic's type suffix
// The width in the mnemonic (e.g. vle16) always equals the element width of
// the type suffix (f16, i16, u16).
vfloat16mf4_t __riscv_vle16_v_f16mf4(const _Float16 *rs1, size_t vl);
vfloat16mf2_t __riscv_vle16_v_f16mf2(const _Float16 *rs1, size_t vl);
vfloat16m1_t __riscv_vle16_v_f16m1(const _Float16 *rs1, size_t vl);
vfloat16m2_t __riscv_vle16_v_f16m2(const _Float16 *rs1, size_t vl);
vfloat16m4_t __riscv_vle16_v_f16m4(const _Float16 *rs1, size_t vl);
vfloat16m8_t __riscv_vle16_v_f16m8(const _Float16 *rs1, size_t vl);
vfloat32mf2_t __riscv_vle32_v_f32mf2(const float *rs1, size_t vl);
vfloat32m1_t __riscv_vle32_v_f32m1(const float *rs1, size_t vl);
vfloat32m2_t __riscv_vle32_v_f32m2(const float *rs1, size_t vl);
vfloat32m4_t __riscv_vle32_v_f32m4(const float *rs1, size_t vl);
vfloat32m8_t __riscv_vle32_v_f32m8(const float *rs1, size_t vl);
vfloat64m1_t __riscv_vle64_v_f64m1(const double *rs1, size_t vl);
vfloat64m2_t __riscv_vle64_v_f64m2(const double *rs1, size_t vl);
vfloat64m4_t __riscv_vle64_v_f64m4(const double *rs1, size_t vl);
vfloat64m8_t __riscv_vle64_v_f64m8(const double *rs1, size_t vl);
vint8mf8_t __riscv_vle8_v_i8mf8(const int8_t *rs1, size_t vl);
vint8mf4_t __riscv_vle8_v_i8mf4(const int8_t *rs1, size_t vl);
vint8mf2_t __riscv_vle8_v_i8mf2(const int8_t *rs1, size_t vl);
vint8m1_t __riscv_vle8_v_i8m1(const int8_t *rs1, size_t vl);
vint8m2_t __riscv_vle8_v_i8m2(const int8_t *rs1, size_t vl);
vint8m4_t __riscv_vle8_v_i8m4(const int8_t *rs1, size_t vl);
vint8m8_t __riscv_vle8_v_i8m8(const int8_t *rs1, size_t vl);
vint16mf4_t __riscv_vle16_v_i16mf4(const int16_t *rs1, size_t vl);
vint16mf2_t __riscv_vle16_v_i16mf2(const int16_t *rs1, size_t vl);
vint16m1_t __riscv_vle16_v_i16m1(const int16_t *rs1, size_t vl);
vint16m2_t __riscv_vle16_v_i16m2(const int16_t *rs1, size_t vl);
vint16m4_t __riscv_vle16_v_i16m4(const int16_t *rs1, size_t vl);
vint16m8_t __riscv_vle16_v_i16m8(const int16_t *rs1, size_t vl);
vint32mf2_t __riscv_vle32_v_i32mf2(const int32_t *rs1, size_t vl);
vint32m1_t __riscv_vle32_v_i32m1(const int32_t *rs1, size_t vl);
vint32m2_t __riscv_vle32_v_i32m2(const int32_t *rs1, size_t vl);
vint32m4_t __riscv_vle32_v_i32m4(const int32_t *rs1, size_t vl);
vint32m8_t __riscv_vle32_v_i32m8(const int32_t *rs1, size_t vl);
vint64m1_t __riscv_vle64_v_i64m1(const int64_t *rs1, size_t vl);
vint64m2_t __riscv_vle64_v_i64m2(const int64_t *rs1, size_t vl);
vint64m4_t __riscv_vle64_v_i64m4(const int64_t *rs1, size_t vl);
vint64m8_t __riscv_vle64_v_i64m8(const int64_t *rs1, size_t vl);
vuint8mf8_t __riscv_vle8_v_u8mf8(const uint8_t *rs1, size_t vl);
vuint8mf4_t __riscv_vle8_v_u8mf4(const uint8_t *rs1, size_t vl);
vuint8mf2_t __riscv_vle8_v_u8mf2(const uint8_t *rs1, size_t vl);
vuint8m1_t __riscv_vle8_v_u8m1(const uint8_t *rs1, size_t vl);
vuint8m2_t __riscv_vle8_v_u8m2(const uint8_t *rs1, size_t vl);
vuint8m4_t __riscv_vle8_v_u8m4(const uint8_t *rs1, size_t vl);
vuint8m8_t __riscv_vle8_v_u8m8(const uint8_t *rs1, size_t vl);
vuint16mf4_t __riscv_vle16_v_u16mf4(const uint16_t *rs1, size_t vl);
vuint16mf2_t __riscv_vle16_v_u16mf2(const uint16_t *rs1, size_t vl);
vuint16m1_t __riscv_vle16_v_u16m1(const uint16_t *rs1, size_t vl);
vuint16m2_t __riscv_vle16_v_u16m2(const uint16_t *rs1, size_t vl);
vuint16m4_t __riscv_vle16_v_u16m4(const uint16_t *rs1, size_t vl);
vuint16m8_t __riscv_vle16_v_u16m8(const uint16_t *rs1, size_t vl);
vuint32mf2_t __riscv_vle32_v_u32mf2(const uint32_t *rs1, size_t vl);
vuint32m1_t __riscv_vle32_v_u32m1(const uint32_t *rs1, size_t vl);
vuint32m2_t __riscv_vle32_v_u32m2(const uint32_t *rs1, size_t vl);
vuint32m4_t __riscv_vle32_v_u32m4(const uint32_t *rs1, size_t vl);
vuint32m8_t __riscv_vle32_v_u32m8(const uint32_t *rs1, size_t vl);
vuint64m1_t __riscv_vle64_v_u64m1(const uint64_t *rs1, size_t vl);
vuint64m2_t __riscv_vle64_v_u64m2(const uint64_t *rs1, size_t vl);
vuint64m4_t __riscv_vle64_v_u64m4(const uint64_t *rs1, size_t vl);
vuint64m8_t __riscv_vle64_v_u64m8(const uint64_t *rs1, size_t vl);
// masked functions
// Masked unit-stride loads: the `_m` suffix marks a variant that takes a
// leading mask argument `vm` before the `rs1` pointer and `vl`.
// In every prototype below the mask type is vboolN_t with
// N = element width / LMUL (e.g. f16mf4 -> vbool64_t, i32m1 -> vbool32_t,
// i8m8 -> vbool1_t).
// NOTE(review): what the result holds for masked-off elements is not visible
// from these prototypes; consult the RVV intrinsic specification.
vfloat16mf4_t __riscv_vle16_v_f16mf4_m(vbool64_t vm, const _Float16 *rs1,
                                       size_t vl);
vfloat16mf2_t __riscv_vle16_v_f16mf2_m(vbool32_t vm, const _Float16 *rs1,
                                       size_t vl);
vfloat16m1_t __riscv_vle16_v_f16m1_m(vbool16_t vm, const _Float16 *rs1,
                                     size_t vl);
vfloat16m2_t __riscv_vle16_v_f16m2_m(vbool8_t vm, const _Float16 *rs1,
                                     size_t vl);
vfloat16m4_t __riscv_vle16_v_f16m4_m(vbool4_t vm, const _Float16 *rs1,
                                     size_t vl);
vfloat16m8_t __riscv_vle16_v_f16m8_m(vbool2_t vm, const _Float16 *rs1,
                                     size_t vl);
vfloat32mf2_t __riscv_vle32_v_f32mf2_m(vbool64_t vm, const float *rs1,
                                       size_t vl);
vfloat32m1_t __riscv_vle32_v_f32m1_m(vbool32_t vm, const float *rs1, size_t vl);
vfloat32m2_t __riscv_vle32_v_f32m2_m(vbool16_t vm, const float *rs1, size_t vl);
vfloat32m4_t __riscv_vle32_v_f32m4_m(vbool8_t vm, const float *rs1, size_t vl);
vfloat32m8_t __riscv_vle32_v_f32m8_m(vbool4_t vm, const float *rs1, size_t vl);
vfloat64m1_t __riscv_vle64_v_f64m1_m(vbool64_t vm, const double *rs1,
                                     size_t vl);
vfloat64m2_t __riscv_vle64_v_f64m2_m(vbool32_t vm, const double *rs1,
                                     size_t vl);
vfloat64m4_t __riscv_vle64_v_f64m4_m(vbool16_t vm, const double *rs1,
                                     size_t vl);
vfloat64m8_t __riscv_vle64_v_f64m8_m(vbool8_t vm, const double *rs1, size_t vl);
vint8mf8_t __riscv_vle8_v_i8mf8_m(vbool64_t vm, const int8_t *rs1, size_t vl);
vint8mf4_t __riscv_vle8_v_i8mf4_m(vbool32_t vm, const int8_t *rs1, size_t vl);
vint8mf2_t __riscv_vle8_v_i8mf2_m(vbool16_t vm, const int8_t *rs1, size_t vl);
vint8m1_t __riscv_vle8_v_i8m1_m(vbool8_t vm, const int8_t *rs1, size_t vl);
vint8m2_t __riscv_vle8_v_i8m2_m(vbool4_t vm, const int8_t *rs1, size_t vl);
vint8m4_t __riscv_vle8_v_i8m4_m(vbool2_t vm, const int8_t *rs1, size_t vl);
vint8m8_t __riscv_vle8_v_i8m8_m(vbool1_t vm, const int8_t *rs1, size_t vl);
vint16mf4_t __riscv_vle16_v_i16mf4_m(vbool64_t vm, const int16_t *rs1,
                                     size_t vl);
vint16mf2_t __riscv_vle16_v_i16mf2_m(vbool32_t vm, const int16_t *rs1,
                                     size_t vl);
vint16m1_t __riscv_vle16_v_i16m1_m(vbool16_t vm, const int16_t *rs1, size_t vl);
vint16m2_t __riscv_vle16_v_i16m2_m(vbool8_t vm, const int16_t *rs1, size_t vl);
vint16m4_t __riscv_vle16_v_i16m4_m(vbool4_t vm, const int16_t *rs1, size_t vl);
vint16m8_t __riscv_vle16_v_i16m8_m(vbool2_t vm, const int16_t *rs1, size_t vl);
vint32mf2_t __riscv_vle32_v_i32mf2_m(vbool64_t vm, const int32_t *rs1,
                                     size_t vl);
vint32m1_t __riscv_vle32_v_i32m1_m(vbool32_t vm, const int32_t *rs1, size_t vl);
vint32m2_t __riscv_vle32_v_i32m2_m(vbool16_t vm, const int32_t *rs1, size_t vl);
vint32m4_t __riscv_vle32_v_i32m4_m(vbool8_t vm, const int32_t *rs1, size_t vl);
vint32m8_t __riscv_vle32_v_i32m8_m(vbool4_t vm, const int32_t *rs1, size_t vl);
vint64m1_t __riscv_vle64_v_i64m1_m(vbool64_t vm, const int64_t *rs1, size_t vl);
vint64m2_t __riscv_vle64_v_i64m2_m(vbool32_t vm, const int64_t *rs1, size_t vl);
vint64m4_t __riscv_vle64_v_i64m4_m(vbool16_t vm, const int64_t *rs1, size_t vl);
vint64m8_t __riscv_vle64_v_i64m8_m(vbool8_t vm, const int64_t *rs1, size_t vl);
vuint8mf8_t __riscv_vle8_v_u8mf8_m(vbool64_t vm, const uint8_t *rs1, size_t vl);
vuint8mf4_t __riscv_vle8_v_u8mf4_m(vbool32_t vm, const uint8_t *rs1, size_t vl);
vuint8mf2_t __riscv_vle8_v_u8mf2_m(vbool16_t vm, const uint8_t *rs1, size_t vl);
vuint8m1_t __riscv_vle8_v_u8m1_m(vbool8_t vm, const uint8_t *rs1, size_t vl);
vuint8m2_t __riscv_vle8_v_u8m2_m(vbool4_t vm, const uint8_t *rs1, size_t vl);
vuint8m4_t __riscv_vle8_v_u8m4_m(vbool2_t vm, const uint8_t *rs1, size_t vl);
vuint8m8_t __riscv_vle8_v_u8m8_m(vbool1_t vm, const uint8_t *rs1, size_t vl);
vuint16mf4_t __riscv_vle16_v_u16mf4_m(vbool64_t vm, const uint16_t *rs1,
                                      size_t vl);
vuint16mf2_t __riscv_vle16_v_u16mf2_m(vbool32_t vm, const uint16_t *rs1,
                                      size_t vl);
vuint16m1_t __riscv_vle16_v_u16m1_m(vbool16_t vm, const uint16_t *rs1,
                                    size_t vl);
vuint16m2_t __riscv_vle16_v_u16m2_m(vbool8_t vm, const uint16_t *rs1,
                                    size_t vl);
vuint16m4_t __riscv_vle16_v_u16m4_m(vbool4_t vm, const uint16_t *rs1,
                                    size_t vl);
vuint16m8_t __riscv_vle16_v_u16m8_m(vbool2_t vm, const uint16_t *rs1,
                                    size_t vl);
vuint32mf2_t __riscv_vle32_v_u32mf2_m(vbool64_t vm, const uint32_t *rs1,
                                      size_t vl);
vuint32m1_t __riscv_vle32_v_u32m1_m(vbool32_t vm, const uint32_t *rs1,
                                    size_t vl);
vuint32m2_t __riscv_vle32_v_u32m2_m(vbool16_t vm, const uint32_t *rs1,
                                    size_t vl);
vuint32m4_t __riscv_vle32_v_u32m4_m(vbool8_t vm, const uint32_t *rs1,
                                    size_t vl);
vuint32m8_t __riscv_vle32_v_u32m8_m(vbool4_t vm, const uint32_t *rs1,
                                    size_t vl);
vuint64m1_t __riscv_vle64_v_u64m1_m(vbool64_t vm, const uint64_t *rs1,
                                    size_t vl);
vuint64m2_t __riscv_vle64_v_u64m2_m(vbool32_t vm, const uint64_t *rs1,
                                    size_t vl);
vuint64m4_t __riscv_vle64_v_u64m4_m(vbool16_t vm, const uint64_t *rs1,
                                    size_t vl);
vuint64m8_t __riscv_vle64_v_u64m8_m(vbool8_t vm, const uint64_t *rs1,
                                    size_t vl);

Vector Unit-Stride Store Intrinsics

// Unmasked unit-stride stores (vse8 / vse16 / vse32 / vse64): one prototype
// per element type and LMUL. All return void.
//   rs1 - non-const destination pointer to the vector's element type
//   vs3 - the vector value to store; its type matches the name's type suffix
//   vl  - size_t vector-length argument (presumably the number of elements
//         to process; confirm against the RVV intrinsic specification)
void __riscv_vse16_v_f16mf4(_Float16 *rs1, vfloat16mf4_t vs3, size_t vl);
void __riscv_vse16_v_f16mf2(_Float16 *rs1, vfloat16mf2_t vs3, size_t vl);
void __riscv_vse16_v_f16m1(_Float16 *rs1, vfloat16m1_t vs3, size_t vl);
void __riscv_vse16_v_f16m2(_Float16 *rs1, vfloat16m2_t vs3, size_t vl);
void __riscv_vse16_v_f16m4(_Float16 *rs1, vfloat16m4_t vs3, size_t vl);
void __riscv_vse16_v_f16m8(_Float16 *rs1, vfloat16m8_t vs3, size_t vl);
void __riscv_vse32_v_f32mf2(float *rs1, vfloat32mf2_t vs3, size_t vl);
void __riscv_vse32_v_f32m1(float *rs1, vfloat32m1_t vs3, size_t vl);
void __riscv_vse32_v_f32m2(float *rs1, vfloat32m2_t vs3, size_t vl);
void __riscv_vse32_v_f32m4(float *rs1, vfloat32m4_t vs3, size_t vl);
void __riscv_vse32_v_f32m8(float *rs1, vfloat32m8_t vs3, size_t vl);
void __riscv_vse64_v_f64m1(double *rs1, vfloat64m1_t vs3, size_t vl);
void __riscv_vse64_v_f64m2(double *rs1, vfloat64m2_t vs3, size_t vl);
void __riscv_vse64_v_f64m4(double *rs1, vfloat64m4_t vs3, size_t vl);
void __riscv_vse64_v_f64m8(double *rs1, vfloat64m8_t vs3, size_t vl);
void __riscv_vse8_v_i8mf8(int8_t *rs1, vint8mf8_t vs3, size_t vl);
void __riscv_vse8_v_i8mf4(int8_t *rs1, vint8mf4_t vs3, size_t vl);
void __riscv_vse8_v_i8mf2(int8_t *rs1, vint8mf2_t vs3, size_t vl);
void __riscv_vse8_v_i8m1(int8_t *rs1, vint8m1_t vs3, size_t vl);
void __riscv_vse8_v_i8m2(int8_t *rs1, vint8m2_t vs3, size_t vl);
void __riscv_vse8_v_i8m4(int8_t *rs1, vint8m4_t vs3, size_t vl);
void __riscv_vse8_v_i8m8(int8_t *rs1, vint8m8_t vs3, size_t vl);
void __riscv_vse16_v_i16mf4(int16_t *rs1, vint16mf4_t vs3, size_t vl);
void __riscv_vse16_v_i16mf2(int16_t *rs1, vint16mf2_t vs3, size_t vl);
void __riscv_vse16_v_i16m1(int16_t *rs1, vint16m1_t vs3, size_t vl);
void __riscv_vse16_v_i16m2(int16_t *rs1, vint16m2_t vs3, size_t vl);
void __riscv_vse16_v_i16m4(int16_t *rs1, vint16m4_t vs3, size_t vl);
void __riscv_vse16_v_i16m8(int16_t *rs1, vint16m8_t vs3, size_t vl);
void __riscv_vse32_v_i32mf2(int32_t *rs1, vint32mf2_t vs3, size_t vl);
void __riscv_vse32_v_i32m1(int32_t *rs1, vint32m1_t vs3, size_t vl);
void __riscv_vse32_v_i32m2(int32_t *rs1, vint32m2_t vs3, size_t vl);
void __riscv_vse32_v_i32m4(int32_t *rs1, vint32m4_t vs3, size_t vl);
void __riscv_vse32_v_i32m8(int32_t *rs1, vint32m8_t vs3, size_t vl);
void __riscv_vse64_v_i64m1(int64_t *rs1, vint64m1_t vs3, size_t vl);
void __riscv_vse64_v_i64m2(int64_t *rs1, vint64m2_t vs3, size_t vl);
void __riscv_vse64_v_i64m4(int64_t *rs1, vint64m4_t vs3, size_t vl);
void __riscv_vse64_v_i64m8(int64_t *rs1, vint64m8_t vs3, size_t vl);
void __riscv_vse8_v_u8mf8(uint8_t *rs1, vuint8mf8_t vs3, size_t vl);
void __riscv_vse8_v_u8mf4(uint8_t *rs1, vuint8mf4_t vs3, size_t vl);
void __riscv_vse8_v_u8mf2(uint8_t *rs1, vuint8mf2_t vs3, size_t vl);
void __riscv_vse8_v_u8m1(uint8_t *rs1, vuint8m1_t vs3, size_t vl);
void __riscv_vse8_v_u8m2(uint8_t *rs1, vuint8m2_t vs3, size_t vl);
void __riscv_vse8_v_u8m4(uint8_t *rs1, vuint8m4_t vs3, size_t vl);
void __riscv_vse8_v_u8m8(uint8_t *rs1, vuint8m8_t vs3, size_t vl);
void __riscv_vse16_v_u16mf4(uint16_t *rs1, vuint16mf4_t vs3, size_t vl);
void __riscv_vse16_v_u16mf2(uint16_t *rs1, vuint16mf2_t vs3, size_t vl);
void __riscv_vse16_v_u16m1(uint16_t *rs1, vuint16m1_t vs3, size_t vl);
void __riscv_vse16_v_u16m2(uint16_t *rs1, vuint16m2_t vs3, size_t vl);
void __riscv_vse16_v_u16m4(uint16_t *rs1, vuint16m4_t vs3, size_t vl);
void __riscv_vse16_v_u16m8(uint16_t *rs1, vuint16m8_t vs3, size_t vl);
void __riscv_vse32_v_u32mf2(uint32_t *rs1, vuint32mf2_t vs3, size_t vl);
void __riscv_vse32_v_u32m1(uint32_t *rs1, vuint32m1_t vs3, size_t vl);
void __riscv_vse32_v_u32m2(uint32_t *rs1, vuint32m2_t vs3, size_t vl);
void __riscv_vse32_v_u32m4(uint32_t *rs1, vuint32m4_t vs3, size_t vl);
void __riscv_vse32_v_u32m8(uint32_t *rs1, vuint32m8_t vs3, size_t vl);
void __riscv_vse64_v_u64m1(uint64_t *rs1, vuint64m1_t vs3, size_t vl);
void __riscv_vse64_v_u64m2(uint64_t *rs1, vuint64m2_t vs3, size_t vl);
void __riscv_vse64_v_u64m4(uint64_t *rs1, vuint64m4_t vs3, size_t vl);
void __riscv_vse64_v_u64m8(uint64_t *rs1, vuint64m8_t vs3, size_t vl);
// masked functions
// Masked unit-stride stores: the `_m` suffix marks a variant that takes a
// leading mask argument `vm` before the destination pointer `rs1`, the
// source vector `vs3`, and `vl`. All return void.
// In every prototype below the mask type is vboolN_t with
// N = element width / LMUL (e.g. f16mf4 -> vbool64_t, u8m8 -> vbool1_t).
void __riscv_vse16_v_f16mf4_m(vbool64_t vm, _Float16 *rs1, vfloat16mf4_t vs3,
                              size_t vl);
void __riscv_vse16_v_f16mf2_m(vbool32_t vm, _Float16 *rs1, vfloat16mf2_t vs3,
                              size_t vl);
void __riscv_vse16_v_f16m1_m(vbool16_t vm, _Float16 *rs1, vfloat16m1_t vs3,
                             size_t vl);
void __riscv_vse16_v_f16m2_m(vbool8_t vm, _Float16 *rs1, vfloat16m2_t vs3,
                             size_t vl);
void __riscv_vse16_v_f16m4_m(vbool4_t vm, _Float16 *rs1, vfloat16m4_t vs3,
                             size_t vl);
void __riscv_vse16_v_f16m8_m(vbool2_t vm, _Float16 *rs1, vfloat16m8_t vs3,
                             size_t vl);
void __riscv_vse32_v_f32mf2_m(vbool64_t vm, float *rs1, vfloat32mf2_t vs3,
                              size_t vl);
void __riscv_vse32_v_f32m1_m(vbool32_t vm, float *rs1, vfloat32m1_t vs3,
                             size_t vl);
void __riscv_vse32_v_f32m2_m(vbool16_t vm, float *rs1, vfloat32m2_t vs3,
                             size_t vl);
void __riscv_vse32_v_f32m4_m(vbool8_t vm, float *rs1, vfloat32m4_t vs3,
                             size_t vl);
void __riscv_vse32_v_f32m8_m(vbool4_t vm, float *rs1, vfloat32m8_t vs3,
                             size_t vl);
void __riscv_vse64_v_f64m1_m(vbool64_t vm, double *rs1, vfloat64m1_t vs3,
                             size_t vl);
void __riscv_vse64_v_f64m2_m(vbool32_t vm, double *rs1, vfloat64m2_t vs3,
                             size_t vl);
void __riscv_vse64_v_f64m4_m(vbool16_t vm, double *rs1, vfloat64m4_t vs3,
                             size_t vl);
void __riscv_vse64_v_f64m8_m(vbool8_t vm, double *rs1, vfloat64m8_t vs3,
                             size_t vl);
void __riscv_vse8_v_i8mf8_m(vbool64_t vm, int8_t *rs1, vint8mf8_t vs3,
                            size_t vl);
void __riscv_vse8_v_i8mf4_m(vbool32_t vm, int8_t *rs1, vint8mf4_t vs3,
                            size_t vl);
void __riscv_vse8_v_i8mf2_m(vbool16_t vm, int8_t *rs1, vint8mf2_t vs3,
                            size_t vl);
void __riscv_vse8_v_i8m1_m(vbool8_t vm, int8_t *rs1, vint8m1_t vs3, size_t vl);
void __riscv_vse8_v_i8m2_m(vbool4_t vm, int8_t *rs1, vint8m2_t vs3, size_t vl);
void __riscv_vse8_v_i8m4_m(vbool2_t vm, int8_t *rs1, vint8m4_t vs3, size_t vl);
void __riscv_vse8_v_i8m8_m(vbool1_t vm, int8_t *rs1, vint8m8_t vs3, size_t vl);
void __riscv_vse16_v_i16mf4_m(vbool64_t vm, int16_t *rs1, vint16mf4_t vs3,
                              size_t vl);
void __riscv_vse16_v_i16mf2_m(vbool32_t vm, int16_t *rs1, vint16mf2_t vs3,
                              size_t vl);
void __riscv_vse16_v_i16m1_m(vbool16_t vm, int16_t *rs1, vint16m1_t vs3,
                             size_t vl);
void __riscv_vse16_v_i16m2_m(vbool8_t vm, int16_t *rs1, vint16m2_t vs3,
                             size_t vl);
void __riscv_vse16_v_i16m4_m(vbool4_t vm, int16_t *rs1, vint16m4_t vs3,
                             size_t vl);
void __riscv_vse16_v_i16m8_m(vbool2_t vm, int16_t *rs1, vint16m8_t vs3,
                             size_t vl);
void __riscv_vse32_v_i32mf2_m(vbool64_t vm, int32_t *rs1, vint32mf2_t vs3,
                              size_t vl);
void __riscv_vse32_v_i32m1_m(vbool32_t vm, int32_t *rs1, vint32m1_t vs3,
                             size_t vl);
void __riscv_vse32_v_i32m2_m(vbool16_t vm, int32_t *rs1, vint32m2_t vs3,
                             size_t vl);
void __riscv_vse32_v_i32m4_m(vbool8_t vm, int32_t *rs1, vint32m4_t vs3,
                             size_t vl);
void __riscv_vse32_v_i32m8_m(vbool4_t vm, int32_t *rs1, vint32m8_t vs3,
                             size_t vl);
void __riscv_vse64_v_i64m1_m(vbool64_t vm, int64_t *rs1, vint64m1_t vs3,
                             size_t vl);
void __riscv_vse64_v_i64m2_m(vbool32_t vm, int64_t *rs1, vint64m2_t vs3,
                             size_t vl);
void __riscv_vse64_v_i64m4_m(vbool16_t vm, int64_t *rs1, vint64m4_t vs3,
                             size_t vl);
void __riscv_vse64_v_i64m8_m(vbool8_t vm, int64_t *rs1, vint64m8_t vs3,
                             size_t vl);
void __riscv_vse8_v_u8mf8_m(vbool64_t vm, uint8_t *rs1, vuint8mf8_t vs3,
                            size_t vl);
void __riscv_vse8_v_u8mf4_m(vbool32_t vm, uint8_t *rs1, vuint8mf4_t vs3,
                            size_t vl);
void __riscv_vse8_v_u8mf2_m(vbool16_t vm, uint8_t *rs1, vuint8mf2_t vs3,
                            size_t vl);
void __riscv_vse8_v_u8m1_m(vbool8_t vm, uint8_t *rs1, vuint8m1_t vs3,
                           size_t vl);
void __riscv_vse8_v_u8m2_m(vbool4_t vm, uint8_t *rs1, vuint8m2_t vs3,
                           size_t vl);
void __riscv_vse8_v_u8m4_m(vbool2_t vm, uint8_t *rs1, vuint8m4_t vs3,
                           size_t vl);
void __riscv_vse8_v_u8m8_m(vbool1_t vm, uint8_t *rs1, vuint8m8_t vs3,
                           size_t vl);
void __riscv_vse16_v_u16mf4_m(vbool64_t vm, uint16_t *rs1, vuint16mf4_t vs3,
                              size_t vl);
void __riscv_vse16_v_u16mf2_m(vbool32_t vm, uint16_t *rs1, vuint16mf2_t vs3,
                              size_t vl);
void __riscv_vse16_v_u16m1_m(vbool16_t vm, uint16_t *rs1, vuint16m1_t vs3,
                             size_t vl);
void __riscv_vse16_v_u16m2_m(vbool8_t vm, uint16_t *rs1, vuint16m2_t vs3,
                             size_t vl);
void __riscv_vse16_v_u16m4_m(vbool4_t vm, uint16_t *rs1, vuint16m4_t vs3,
                             size_t vl);
void __riscv_vse16_v_u16m8_m(vbool2_t vm, uint16_t *rs1, vuint16m8_t vs3,
                             size_t vl);
void __riscv_vse32_v_u32mf2_m(vbool64_t vm, uint32_t *rs1, vuint32mf2_t vs3,
                              size_t vl);
void __riscv_vse32_v_u32m1_m(vbool32_t vm, uint32_t *rs1, vuint32m1_t vs3,
                             size_t vl);
void __riscv_vse32_v_u32m2_m(vbool16_t vm, uint32_t *rs1, vuint32m2_t vs3,
                             size_t vl);
void __riscv_vse32_v_u32m4_m(vbool8_t vm, uint32_t *rs1, vuint32m4_t vs3,
                             size_t vl);
void __riscv_vse32_v_u32m8_m(vbool4_t vm, uint32_t *rs1, vuint32m8_t vs3,
                             size_t vl);
void __riscv_vse64_v_u64m1_m(vbool64_t vm, uint64_t *rs1, vuint64m1_t vs3,
                             size_t vl);
void __riscv_vse64_v_u64m2_m(vbool32_t vm, uint64_t *rs1, vuint64m2_t vs3,
                             size_t vl);
void __riscv_vse64_v_u64m4_m(vbool16_t vm, uint64_t *rs1, vuint64m4_t vs3,
                             size_t vl);
void __riscv_vse64_v_u64m8_m(vbool8_t vm, uint64_t *rs1, vuint64m8_t vs3,
                             size_t vl);

Vector Mask Load/Store Intrinsics

// Mask loads (vlm) and mask stores (vsm), one pair per mask type
// vbool1_t .. vbool64_t; the `bN` name suffix matches the vboolN_t type.
//   vlm: takes a `const uint8_t *rs1` and `vl`, returns the mask value.
//   vsm: takes a `uint8_t *rs1`, the mask value `vs3`, and `vl`; returns void.
// The memory operand is always typed as uint8_t regardless of the mask type.
// No masked (`_m`) variants are listed in this section.
// NOTE(review): the unit in which `vl` is counted for mask accesses is not
// visible from these prototypes; confirm against the RVV specification.
vbool1_t __riscv_vlm_v_b1(const uint8_t *rs1, size_t vl);
vbool2_t __riscv_vlm_v_b2(const uint8_t *rs1, size_t vl);
vbool4_t __riscv_vlm_v_b4(const uint8_t *rs1, size_t vl);
vbool8_t __riscv_vlm_v_b8(const uint8_t *rs1, size_t vl);
vbool16_t __riscv_vlm_v_b16(const uint8_t *rs1, size_t vl);
vbool32_t __riscv_vlm_v_b32(const uint8_t *rs1, size_t vl);
vbool64_t __riscv_vlm_v_b64(const uint8_t *rs1, size_t vl);
void __riscv_vsm_v_b1(uint8_t *rs1, vbool1_t vs3, size_t vl);
void __riscv_vsm_v_b2(uint8_t *rs1, vbool2_t vs3, size_t vl);
void __riscv_vsm_v_b4(uint8_t *rs1, vbool4_t vs3, size_t vl);
void __riscv_vsm_v_b8(uint8_t *rs1, vbool8_t vs3, size_t vl);
void __riscv_vsm_v_b16(uint8_t *rs1, vbool16_t vs3, size_t vl);
void __riscv_vsm_v_b32(uint8_t *rs1, vbool32_t vs3, size_t vl);
void __riscv_vsm_v_b64(uint8_t *rs1, vbool64_t vs3, size_t vl);

Vector Strided Load Intrinsics

// Unmasked strided loads (vlse8 / vlse16 / vlse32 / vlse64): one prototype
// per element type and LMUL.
//   rs1     - pointer to const elements of the result's element type
//   rs2     - stride, passed as a signed ptrdiff_t
//             NOTE(review): presumably a byte stride, as for the underlying
//             vlse instruction; confirm against the RVV specification.
//   vl      - size_t vector-length argument
//   returns - the vector type named by the intrinsic's type suffix
vfloat16mf4_t __riscv_vlse16_v_f16mf4(const _Float16 *rs1, ptrdiff_t rs2,
                                      size_t vl);
vfloat16mf2_t __riscv_vlse16_v_f16mf2(const _Float16 *rs1, ptrdiff_t rs2,
                                      size_t vl);
vfloat16m1_t __riscv_vlse16_v_f16m1(const _Float16 *rs1, ptrdiff_t rs2,
                                    size_t vl);
vfloat16m2_t __riscv_vlse16_v_f16m2(const _Float16 *rs1, ptrdiff_t rs2,
                                    size_t vl);
vfloat16m4_t __riscv_vlse16_v_f16m4(const _Float16 *rs1, ptrdiff_t rs2,
                                    size_t vl);
vfloat16m8_t __riscv_vlse16_v_f16m8(const _Float16 *rs1, ptrdiff_t rs2,
                                    size_t vl);
vfloat32mf2_t __riscv_vlse32_v_f32mf2(const float *rs1, ptrdiff_t rs2,
                                      size_t vl);
vfloat32m1_t __riscv_vlse32_v_f32m1(const float *rs1, ptrdiff_t rs2, size_t vl);
vfloat32m2_t __riscv_vlse32_v_f32m2(const float *rs1, ptrdiff_t rs2, size_t vl);
vfloat32m4_t __riscv_vlse32_v_f32m4(const float *rs1, ptrdiff_t rs2, size_t vl);
vfloat32m8_t __riscv_vlse32_v_f32m8(const float *rs1, ptrdiff_t rs2, size_t vl);
vfloat64m1_t __riscv_vlse64_v_f64m1(const double *rs1, ptrdiff_t rs2,
                                    size_t vl);
vfloat64m2_t __riscv_vlse64_v_f64m2(const double *rs1, ptrdiff_t rs2,
                                    size_t vl);
vfloat64m4_t __riscv_vlse64_v_f64m4(const double *rs1, ptrdiff_t rs2,
                                    size_t vl);
vfloat64m8_t __riscv_vlse64_v_f64m8(const double *rs1, ptrdiff_t rs2,
                                    size_t vl);
vint8mf8_t __riscv_vlse8_v_i8mf8(const int8_t *rs1, ptrdiff_t rs2, size_t vl);
vint8mf4_t __riscv_vlse8_v_i8mf4(const int8_t *rs1, ptrdiff_t rs2, size_t vl);
vint8mf2_t __riscv_vlse8_v_i8mf2(const int8_t *rs1, ptrdiff_t rs2, size_t vl);
vint8m1_t __riscv_vlse8_v_i8m1(const int8_t *rs1, ptrdiff_t rs2, size_t vl);
vint8m2_t __riscv_vlse8_v_i8m2(const int8_t *rs1, ptrdiff_t rs2, size_t vl);
vint8m4_t __riscv_vlse8_v_i8m4(const int8_t *rs1, ptrdiff_t rs2, size_t vl);
vint8m8_t __riscv_vlse8_v_i8m8(const int8_t *rs1, ptrdiff_t rs2, size_t vl);
vint16mf4_t __riscv_vlse16_v_i16mf4(const int16_t *rs1, ptrdiff_t rs2,
                                    size_t vl);
vint16mf2_t __riscv_vlse16_v_i16mf2(const int16_t *rs1, ptrdiff_t rs2,
                                    size_t vl);
vint16m1_t __riscv_vlse16_v_i16m1(const int16_t *rs1, ptrdiff_t rs2, size_t vl);
vint16m2_t __riscv_vlse16_v_i16m2(const int16_t *rs1, ptrdiff_t rs2, size_t vl);
vint16m4_t __riscv_vlse16_v_i16m4(const int16_t *rs1, ptrdiff_t rs2, size_t vl);
vint16m8_t __riscv_vlse16_v_i16m8(const int16_t *rs1, ptrdiff_t rs2, size_t vl);
vint32mf2_t __riscv_vlse32_v_i32mf2(const int32_t *rs1, ptrdiff_t rs2,
                                    size_t vl);
vint32m1_t __riscv_vlse32_v_i32m1(const int32_t *rs1, ptrdiff_t rs2, size_t vl);
vint32m2_t __riscv_vlse32_v_i32m2(const int32_t *rs1, ptrdiff_t rs2, size_t vl);
vint32m4_t __riscv_vlse32_v_i32m4(const int32_t *rs1, ptrdiff_t rs2, size_t vl);
vint32m8_t __riscv_vlse32_v_i32m8(const int32_t *rs1, ptrdiff_t rs2, size_t vl);
vint64m1_t __riscv_vlse64_v_i64m1(const int64_t *rs1, ptrdiff_t rs2, size_t vl);
vint64m2_t __riscv_vlse64_v_i64m2(const int64_t *rs1, ptrdiff_t rs2, size_t vl);
vint64m4_t __riscv_vlse64_v_i64m4(const int64_t *rs1, ptrdiff_t rs2, size_t vl);
vint64m8_t __riscv_vlse64_v_i64m8(const int64_t *rs1, ptrdiff_t rs2, size_t vl);
vuint8mf8_t __riscv_vlse8_v_u8mf8(const uint8_t *rs1, ptrdiff_t rs2, size_t vl);
vuint8mf4_t __riscv_vlse8_v_u8mf4(const uint8_t *rs1, ptrdiff_t rs2, size_t vl);
vuint8mf2_t __riscv_vlse8_v_u8mf2(const uint8_t *rs1, ptrdiff_t rs2, size_t vl);
vuint8m1_t __riscv_vlse8_v_u8m1(const uint8_t *rs1, ptrdiff_t rs2, size_t vl);
vuint8m2_t __riscv_vlse8_v_u8m2(const uint8_t *rs1, ptrdiff_t rs2, size_t vl);
vuint8m4_t __riscv_vlse8_v_u8m4(const uint8_t *rs1, ptrdiff_t rs2, size_t vl);
vuint8m8_t __riscv_vlse8_v_u8m8(const uint8_t *rs1, ptrdiff_t rs2, size_t vl);
vuint16mf4_t __riscv_vlse16_v_u16mf4(const uint16_t *rs1, ptrdiff_t rs2,
                                     size_t vl);
vuint16mf2_t __riscv_vlse16_v_u16mf2(const uint16_t *rs1, ptrdiff_t rs2,
                                     size_t vl);
vuint16m1_t __riscv_vlse16_v_u16m1(const uint16_t *rs1, ptrdiff_t rs2,
                                   size_t vl);
vuint16m2_t __riscv_vlse16_v_u16m2(const uint16_t *rs1, ptrdiff_t rs2,
                                   size_t vl);
vuint16m4_t __riscv_vlse16_v_u16m4(const uint16_t *rs1, ptrdiff_t rs2,
                                   size_t vl);
vuint16m8_t __riscv_vlse16_v_u16m8(const uint16_t *rs1, ptrdiff_t rs2,
                                   size_t vl);
vuint32mf2_t __riscv_vlse32_v_u32mf2(const uint32_t *rs1, ptrdiff_t rs2,
                                     size_t vl);
vuint32m1_t __riscv_vlse32_v_u32m1(const uint32_t *rs1, ptrdiff_t rs2,
                                   size_t vl);
vuint32m2_t __riscv_vlse32_v_u32m2(const uint32_t *rs1, ptrdiff_t rs2,
                                   size_t vl);
vuint32m4_t __riscv_vlse32_v_u32m4(const uint32_t *rs1, ptrdiff_t rs2,
                                   size_t vl);
vuint32m8_t __riscv_vlse32_v_u32m8(const uint32_t *rs1, ptrdiff_t rs2,
                                   size_t vl);
vuint64m1_t __riscv_vlse64_v_u64m1(const uint64_t *rs1, ptrdiff_t rs2,
                                   size_t vl);
vuint64m2_t __riscv_vlse64_v_u64m2(const uint64_t *rs1, ptrdiff_t rs2,
                                   size_t vl);
vuint64m4_t __riscv_vlse64_v_u64m4(const uint64_t *rs1, ptrdiff_t rs2,
                                   size_t vl);
vuint64m8_t __riscv_vlse64_v_u64m8(const uint64_t *rs1, ptrdiff_t rs2,
                                   size_t vl);
// masked functions
// Masked strided loads: the `_m` suffix marks a variant that takes a leading
// mask argument `vm` before the base pointer `rs1`, the ptrdiff_t stride
// `rs2`, and `vl`.
// In every prototype below the mask type is vboolN_t with
// N = element width / LMUL (e.g. f16mf4 -> vbool64_t, i64m8 -> vbool8_t,
// u8m8 -> vbool1_t).
// NOTE(review): what the result holds for masked-off elements is not visible
// from these prototypes; consult the RVV intrinsic specification.
vfloat16mf4_t __riscv_vlse16_v_f16mf4_m(vbool64_t vm, const _Float16 *rs1,
                                        ptrdiff_t rs2, size_t vl);
vfloat16mf2_t __riscv_vlse16_v_f16mf2_m(vbool32_t vm, const _Float16 *rs1,
                                        ptrdiff_t rs2, size_t vl);
vfloat16m1_t __riscv_vlse16_v_f16m1_m(vbool16_t vm, const _Float16 *rs1,
                                      ptrdiff_t rs2, size_t vl);
vfloat16m2_t __riscv_vlse16_v_f16m2_m(vbool8_t vm, const _Float16 *rs1,
                                      ptrdiff_t rs2, size_t vl);
vfloat16m4_t __riscv_vlse16_v_f16m4_m(vbool4_t vm, const _Float16 *rs1,
                                      ptrdiff_t rs2, size_t vl);
vfloat16m8_t __riscv_vlse16_v_f16m8_m(vbool2_t vm, const _Float16 *rs1,
                                      ptrdiff_t rs2, size_t vl);
vfloat32mf2_t __riscv_vlse32_v_f32mf2_m(vbool64_t vm, const float *rs1,
                                        ptrdiff_t rs2, size_t vl);
vfloat32m1_t __riscv_vlse32_v_f32m1_m(vbool32_t vm, const float *rs1,
                                      ptrdiff_t rs2, size_t vl);
vfloat32m2_t __riscv_vlse32_v_f32m2_m(vbool16_t vm, const float *rs1,
                                      ptrdiff_t rs2, size_t vl);
vfloat32m4_t __riscv_vlse32_v_f32m4_m(vbool8_t vm, const float *rs1,
                                      ptrdiff_t rs2, size_t vl);
vfloat32m8_t __riscv_vlse32_v_f32m8_m(vbool4_t vm, const float *rs1,
                                      ptrdiff_t rs2, size_t vl);
vfloat64m1_t __riscv_vlse64_v_f64m1_m(vbool64_t vm, const double *rs1,
                                      ptrdiff_t rs2, size_t vl);
vfloat64m2_t __riscv_vlse64_v_f64m2_m(vbool32_t vm, const double *rs1,
                                      ptrdiff_t rs2, size_t vl);
vfloat64m4_t __riscv_vlse64_v_f64m4_m(vbool16_t vm, const double *rs1,
                                      ptrdiff_t rs2, size_t vl);
vfloat64m8_t __riscv_vlse64_v_f64m8_m(vbool8_t vm, const double *rs1,
                                      ptrdiff_t rs2, size_t vl);
vint8mf8_t __riscv_vlse8_v_i8mf8_m(vbool64_t vm, const int8_t *rs1,
                                   ptrdiff_t rs2, size_t vl);
vint8mf4_t __riscv_vlse8_v_i8mf4_m(vbool32_t vm, const int8_t *rs1,
                                   ptrdiff_t rs2, size_t vl);
vint8mf2_t __riscv_vlse8_v_i8mf2_m(vbool16_t vm, const int8_t *rs1,
                                   ptrdiff_t rs2, size_t vl);
vint8m1_t __riscv_vlse8_v_i8m1_m(vbool8_t vm, const int8_t *rs1, ptrdiff_t rs2,
                                 size_t vl);
vint8m2_t __riscv_vlse8_v_i8m2_m(vbool4_t vm, const int8_t *rs1, ptrdiff_t rs2,
                                 size_t vl);
vint8m4_t __riscv_vlse8_v_i8m4_m(vbool2_t vm, const int8_t *rs1, ptrdiff_t rs2,
                                 size_t vl);
vint8m8_t __riscv_vlse8_v_i8m8_m(vbool1_t vm, const int8_t *rs1, ptrdiff_t rs2,
                                 size_t vl);
vint16mf4_t __riscv_vlse16_v_i16mf4_m(vbool64_t vm, const int16_t *rs1,
                                      ptrdiff_t rs2, size_t vl);
vint16mf2_t __riscv_vlse16_v_i16mf2_m(vbool32_t vm, const int16_t *rs1,
                                      ptrdiff_t rs2, size_t vl);
vint16m1_t __riscv_vlse16_v_i16m1_m(vbool16_t vm, const int16_t *rs1,
                                    ptrdiff_t rs2, size_t vl);
vint16m2_t __riscv_vlse16_v_i16m2_m(vbool8_t vm, const int16_t *rs1,
                                    ptrdiff_t rs2, size_t vl);
vint16m4_t __riscv_vlse16_v_i16m4_m(vbool4_t vm, const int16_t *rs1,
                                    ptrdiff_t rs2, size_t vl);
vint16m8_t __riscv_vlse16_v_i16m8_m(vbool2_t vm, const int16_t *rs1,
                                    ptrdiff_t rs2, size_t vl);
vint32mf2_t __riscv_vlse32_v_i32mf2_m(vbool64_t vm, const int32_t *rs1,
                                      ptrdiff_t rs2, size_t vl);
vint32m1_t __riscv_vlse32_v_i32m1_m(vbool32_t vm, const int32_t *rs1,
                                    ptrdiff_t rs2, size_t vl);
vint32m2_t __riscv_vlse32_v_i32m2_m(vbool16_t vm, const int32_t *rs1,
                                    ptrdiff_t rs2, size_t vl);
vint32m4_t __riscv_vlse32_v_i32m4_m(vbool8_t vm, const int32_t *rs1,
                                    ptrdiff_t rs2, size_t vl);
vint32m8_t __riscv_vlse32_v_i32m8_m(vbool4_t vm, const int32_t *rs1,
                                    ptrdiff_t rs2, size_t vl);
vint64m1_t __riscv_vlse64_v_i64m1_m(vbool64_t vm, const int64_t *rs1,
                                    ptrdiff_t rs2, size_t vl);
vint64m2_t __riscv_vlse64_v_i64m2_m(vbool32_t vm, const int64_t *rs1,
                                    ptrdiff_t rs2, size_t vl);
vint64m4_t __riscv_vlse64_v_i64m4_m(vbool16_t vm, const int64_t *rs1,
                                    ptrdiff_t rs2, size_t vl);
vint64m8_t __riscv_vlse64_v_i64m8_m(vbool8_t vm, const int64_t *rs1,
                                    ptrdiff_t rs2, size_t vl);
vuint8mf8_t __riscv_vlse8_v_u8mf8_m(vbool64_t vm, const uint8_t *rs1,
                                    ptrdiff_t rs2, size_t vl);
vuint8mf4_t __riscv_vlse8_v_u8mf4_m(vbool32_t vm, const uint8_t *rs1,
                                    ptrdiff_t rs2, size_t vl);
vuint8mf2_t __riscv_vlse8_v_u8mf2_m(vbool16_t vm, const uint8_t *rs1,
                                    ptrdiff_t rs2, size_t vl);
vuint8m1_t __riscv_vlse8_v_u8m1_m(vbool8_t vm, const uint8_t *rs1,
                                  ptrdiff_t rs2, size_t vl);
vuint8m2_t __riscv_vlse8_v_u8m2_m(vbool4_t vm, const uint8_t *rs1,
                                  ptrdiff_t rs2, size_t vl);
vuint8m4_t __riscv_vlse8_v_u8m4_m(vbool2_t vm, const uint8_t *rs1,
                                  ptrdiff_t rs2, size_t vl);
vuint8m8_t __riscv_vlse8_v_u8m8_m(vbool1_t vm, const uint8_t *rs1,
                                  ptrdiff_t rs2, size_t vl);
vuint16mf4_t __riscv_vlse16_v_u16mf4_m(vbool64_t vm, const uint16_t *rs1,
                                       ptrdiff_t rs2, size_t vl);
vuint16mf2_t __riscv_vlse16_v_u16mf2_m(vbool32_t vm, const uint16_t *rs1,
                                       ptrdiff_t rs2, size_t vl);
vuint16m1_t __riscv_vlse16_v_u16m1_m(vbool16_t vm, const uint16_t *rs1,
                                     ptrdiff_t rs2, size_t vl);
vuint16m2_t __riscv_vlse16_v_u16m2_m(vbool8_t vm, const uint16_t *rs1,
                                     ptrdiff_t rs2, size_t vl);
vuint16m4_t __riscv_vlse16_v_u16m4_m(vbool4_t vm, const uint16_t *rs1,
                                     ptrdiff_t rs2, size_t vl);
vuint16m8_t __riscv_vlse16_v_u16m8_m(vbool2_t vm, const uint16_t *rs1,
                                     ptrdiff_t rs2, size_t vl);
vuint32mf2_t __riscv_vlse32_v_u32mf2_m(vbool64_t vm, const uint32_t *rs1,
                                       ptrdiff_t rs2, size_t vl);
vuint32m1_t __riscv_vlse32_v_u32m1_m(vbool32_t vm, const uint32_t *rs1,
                                     ptrdiff_t rs2, size_t vl);
vuint32m2_t __riscv_vlse32_v_u32m2_m(vbool16_t vm, const uint32_t *rs1,
                                     ptrdiff_t rs2, size_t vl);
vuint32m4_t __riscv_vlse32_v_u32m4_m(vbool8_t vm, const uint32_t *rs1,
                                     ptrdiff_t rs2, size_t vl);
vuint32m8_t __riscv_vlse32_v_u32m8_m(vbool4_t vm, const uint32_t *rs1,
                                     ptrdiff_t rs2, size_t vl);
vuint64m1_t __riscv_vlse64_v_u64m1_m(vbool64_t vm, const uint64_t *rs1,
                                     ptrdiff_t rs2, size_t vl);
vuint64m2_t __riscv_vlse64_v_u64m2_m(vbool32_t vm, const uint64_t *rs1,
                                     ptrdiff_t rs2, size_t vl);
vuint64m4_t __riscv_vlse64_v_u64m4_m(vbool16_t vm, const uint64_t *rs1,
                                     ptrdiff_t rs2, size_t vl);
vuint64m8_t __riscv_vlse64_v_u64m8_m(vbool8_t vm, const uint64_t *rs1,
                                     ptrdiff_t rs2, size_t vl);

Vector Strided Store Intrinsics

// Unmasked strided-store prototypes (vsse8 / vsse16 / vsse32 / vsse64).
// Every prototype has the same shape and returns void:
//   rs1 - pointer to the destination memory (non-const, element-typed)
//   rs2 - a ptrdiff_t value
//   vs3 - the vector value to store; its element type matches *rs1
//   vl  - the vector length, as size_t
// The number in the intrinsic name (vsse<N>) equals the element width of vs3.
// NOTE(review): rs2 is presumably the byte stride between consecutive
// elements, as for the RVV vsse instruction -- confirm against the ISA spec.

// floating-point element types (_Float16, float, double)
void __riscv_vsse16_v_f16mf4(_Float16 *rs1, ptrdiff_t rs2, vfloat16mf4_t vs3,
                             size_t vl);
void __riscv_vsse16_v_f16mf2(_Float16 *rs1, ptrdiff_t rs2, vfloat16mf2_t vs3,
                             size_t vl);
void __riscv_vsse16_v_f16m1(_Float16 *rs1, ptrdiff_t rs2, vfloat16m1_t vs3,
                            size_t vl);
void __riscv_vsse16_v_f16m2(_Float16 *rs1, ptrdiff_t rs2, vfloat16m2_t vs3,
                            size_t vl);
void __riscv_vsse16_v_f16m4(_Float16 *rs1, ptrdiff_t rs2, vfloat16m4_t vs3,
                            size_t vl);
void __riscv_vsse16_v_f16m8(_Float16 *rs1, ptrdiff_t rs2, vfloat16m8_t vs3,
                            size_t vl);
void __riscv_vsse32_v_f32mf2(float *rs1, ptrdiff_t rs2, vfloat32mf2_t vs3,
                             size_t vl);
void __riscv_vsse32_v_f32m1(float *rs1, ptrdiff_t rs2, vfloat32m1_t vs3,
                            size_t vl);
void __riscv_vsse32_v_f32m2(float *rs1, ptrdiff_t rs2, vfloat32m2_t vs3,
                            size_t vl);
void __riscv_vsse32_v_f32m4(float *rs1, ptrdiff_t rs2, vfloat32m4_t vs3,
                            size_t vl);
void __riscv_vsse32_v_f32m8(float *rs1, ptrdiff_t rs2, vfloat32m8_t vs3,
                            size_t vl);
void __riscv_vsse64_v_f64m1(double *rs1, ptrdiff_t rs2, vfloat64m1_t vs3,
                            size_t vl);
void __riscv_vsse64_v_f64m2(double *rs1, ptrdiff_t rs2, vfloat64m2_t vs3,
                            size_t vl);
void __riscv_vsse64_v_f64m4(double *rs1, ptrdiff_t rs2, vfloat64m4_t vs3,
                            size_t vl);
void __riscv_vsse64_v_f64m8(double *rs1, ptrdiff_t rs2, vfloat64m8_t vs3,
                            size_t vl);
// signed integer element types (int8_t .. int64_t)
void __riscv_vsse8_v_i8mf8(int8_t *rs1, ptrdiff_t rs2, vint8mf8_t vs3,
                           size_t vl);
void __riscv_vsse8_v_i8mf4(int8_t *rs1, ptrdiff_t rs2, vint8mf4_t vs3,
                           size_t vl);
void __riscv_vsse8_v_i8mf2(int8_t *rs1, ptrdiff_t rs2, vint8mf2_t vs3,
                           size_t vl);
void __riscv_vsse8_v_i8m1(int8_t *rs1, ptrdiff_t rs2, vint8m1_t vs3, size_t vl);
void __riscv_vsse8_v_i8m2(int8_t *rs1, ptrdiff_t rs2, vint8m2_t vs3, size_t vl);
void __riscv_vsse8_v_i8m4(int8_t *rs1, ptrdiff_t rs2, vint8m4_t vs3, size_t vl);
void __riscv_vsse8_v_i8m8(int8_t *rs1, ptrdiff_t rs2, vint8m8_t vs3, size_t vl);
void __riscv_vsse16_v_i16mf4(int16_t *rs1, ptrdiff_t rs2, vint16mf4_t vs3,
                             size_t vl);
void __riscv_vsse16_v_i16mf2(int16_t *rs1, ptrdiff_t rs2, vint16mf2_t vs3,
                             size_t vl);
void __riscv_vsse16_v_i16m1(int16_t *rs1, ptrdiff_t rs2, vint16m1_t vs3,
                            size_t vl);
void __riscv_vsse16_v_i16m2(int16_t *rs1, ptrdiff_t rs2, vint16m2_t vs3,
                            size_t vl);
void __riscv_vsse16_v_i16m4(int16_t *rs1, ptrdiff_t rs2, vint16m4_t vs3,
                            size_t vl);
void __riscv_vsse16_v_i16m8(int16_t *rs1, ptrdiff_t rs2, vint16m8_t vs3,
                            size_t vl);
void __riscv_vsse32_v_i32mf2(int32_t *rs1, ptrdiff_t rs2, vint32mf2_t vs3,
                             size_t vl);
void __riscv_vsse32_v_i32m1(int32_t *rs1, ptrdiff_t rs2, vint32m1_t vs3,
                            size_t vl);
void __riscv_vsse32_v_i32m2(int32_t *rs1, ptrdiff_t rs2, vint32m2_t vs3,
                            size_t vl);
void __riscv_vsse32_v_i32m4(int32_t *rs1, ptrdiff_t rs2, vint32m4_t vs3,
                            size_t vl);
void __riscv_vsse32_v_i32m8(int32_t *rs1, ptrdiff_t rs2, vint32m8_t vs3,
                            size_t vl);
void __riscv_vsse64_v_i64m1(int64_t *rs1, ptrdiff_t rs2, vint64m1_t vs3,
                            size_t vl);
void __riscv_vsse64_v_i64m2(int64_t *rs1, ptrdiff_t rs2, vint64m2_t vs3,
                            size_t vl);
void __riscv_vsse64_v_i64m4(int64_t *rs1, ptrdiff_t rs2, vint64m4_t vs3,
                            size_t vl);
void __riscv_vsse64_v_i64m8(int64_t *rs1, ptrdiff_t rs2, vint64m8_t vs3,
                            size_t vl);
// unsigned integer element types (uint8_t .. uint64_t)
void __riscv_vsse8_v_u8mf8(uint8_t *rs1, ptrdiff_t rs2, vuint8mf8_t vs3,
                           size_t vl);
void __riscv_vsse8_v_u8mf4(uint8_t *rs1, ptrdiff_t rs2, vuint8mf4_t vs3,
                           size_t vl);
void __riscv_vsse8_v_u8mf2(uint8_t *rs1, ptrdiff_t rs2, vuint8mf2_t vs3,
                           size_t vl);
void __riscv_vsse8_v_u8m1(uint8_t *rs1, ptrdiff_t rs2, vuint8m1_t vs3,
                          size_t vl);
void __riscv_vsse8_v_u8m2(uint8_t *rs1, ptrdiff_t rs2, vuint8m2_t vs3,
                          size_t vl);
void __riscv_vsse8_v_u8m4(uint8_t *rs1, ptrdiff_t rs2, vuint8m4_t vs3,
                          size_t vl);
void __riscv_vsse8_v_u8m8(uint8_t *rs1, ptrdiff_t rs2, vuint8m8_t vs3,
                          size_t vl);
void __riscv_vsse16_v_u16mf4(uint16_t *rs1, ptrdiff_t rs2, vuint16mf4_t vs3,
                             size_t vl);
void __riscv_vsse16_v_u16mf2(uint16_t *rs1, ptrdiff_t rs2, vuint16mf2_t vs3,
                             size_t vl);
void __riscv_vsse16_v_u16m1(uint16_t *rs1, ptrdiff_t rs2, vuint16m1_t vs3,
                            size_t vl);
void __riscv_vsse16_v_u16m2(uint16_t *rs1, ptrdiff_t rs2, vuint16m2_t vs3,
                            size_t vl);
void __riscv_vsse16_v_u16m4(uint16_t *rs1, ptrdiff_t rs2, vuint16m4_t vs3,
                            size_t vl);
void __riscv_vsse16_v_u16m8(uint16_t *rs1, ptrdiff_t rs2, vuint16m8_t vs3,
                            size_t vl);
void __riscv_vsse32_v_u32mf2(uint32_t *rs1, ptrdiff_t rs2, vuint32mf2_t vs3,
                             size_t vl);
void __riscv_vsse32_v_u32m1(uint32_t *rs1, ptrdiff_t rs2, vuint32m1_t vs3,
                            size_t vl);
void __riscv_vsse32_v_u32m2(uint32_t *rs1, ptrdiff_t rs2, vuint32m2_t vs3,
                            size_t vl);
void __riscv_vsse32_v_u32m4(uint32_t *rs1, ptrdiff_t rs2, vuint32m4_t vs3,
                            size_t vl);
void __riscv_vsse32_v_u32m8(uint32_t *rs1, ptrdiff_t rs2, vuint32m8_t vs3,
                            size_t vl);
void __riscv_vsse64_v_u64m1(uint64_t *rs1, ptrdiff_t rs2, vuint64m1_t vs3,
                            size_t vl);
void __riscv_vsse64_v_u64m2(uint64_t *rs1, ptrdiff_t rs2, vuint64m2_t vs3,
                            size_t vl);
void __riscv_vsse64_v_u64m4(uint64_t *rs1, ptrdiff_t rs2, vuint64m4_t vs3,
                            size_t vl);
void __riscv_vsse64_v_u64m8(uint64_t *rs1, ptrdiff_t rs2, vuint64m8_t vs3,
                            size_t vl);
// masked functions
// Masked (_m suffix) strided-store prototypes. Each takes a mask vm as an
// extra first argument; the remaining arguments (rs1, rs2, vs3, vl) have the
// same types and order as the unmasked prototype of the same base name.
// The mask type is vboolN_t, where N = (element width of vs3) / LMUL of vs3,
// e.g. f16mf4 -> vbool64_t, i8m8 -> vbool1_t, u64m8 -> vbool8_t.
void __riscv_vsse16_v_f16mf4_m(vbool64_t vm, _Float16 *rs1, ptrdiff_t rs2,
                               vfloat16mf4_t vs3, size_t vl);
void __riscv_vsse16_v_f16mf2_m(vbool32_t vm, _Float16 *rs1, ptrdiff_t rs2,
                               vfloat16mf2_t vs3, size_t vl);
void __riscv_vsse16_v_f16m1_m(vbool16_t vm, _Float16 *rs1, ptrdiff_t rs2,
                              vfloat16m1_t vs3, size_t vl);
void __riscv_vsse16_v_f16m2_m(vbool8_t vm, _Float16 *rs1, ptrdiff_t rs2,
                              vfloat16m2_t vs3, size_t vl);
void __riscv_vsse16_v_f16m4_m(vbool4_t vm, _Float16 *rs1, ptrdiff_t rs2,
                              vfloat16m4_t vs3, size_t vl);
void __riscv_vsse16_v_f16m8_m(vbool2_t vm, _Float16 *rs1, ptrdiff_t rs2,
                              vfloat16m8_t vs3, size_t vl);
void __riscv_vsse32_v_f32mf2_m(vbool64_t vm, float *rs1, ptrdiff_t rs2,
                               vfloat32mf2_t vs3, size_t vl);
void __riscv_vsse32_v_f32m1_m(vbool32_t vm, float *rs1, ptrdiff_t rs2,
                              vfloat32m1_t vs3, size_t vl);
void __riscv_vsse32_v_f32m2_m(vbool16_t vm, float *rs1, ptrdiff_t rs2,
                              vfloat32m2_t vs3, size_t vl);
void __riscv_vsse32_v_f32m4_m(vbool8_t vm, float *rs1, ptrdiff_t rs2,
                              vfloat32m4_t vs3, size_t vl);
void __riscv_vsse32_v_f32m8_m(vbool4_t vm, float *rs1, ptrdiff_t rs2,
                              vfloat32m8_t vs3, size_t vl);
void __riscv_vsse64_v_f64m1_m(vbool64_t vm, double *rs1, ptrdiff_t rs2,
                              vfloat64m1_t vs3, size_t vl);
void __riscv_vsse64_v_f64m2_m(vbool32_t vm, double *rs1, ptrdiff_t rs2,
                              vfloat64m2_t vs3, size_t vl);
void __riscv_vsse64_v_f64m4_m(vbool16_t vm, double *rs1, ptrdiff_t rs2,
                              vfloat64m4_t vs3, size_t vl);
void __riscv_vsse64_v_f64m8_m(vbool8_t vm, double *rs1, ptrdiff_t rs2,
                              vfloat64m8_t vs3, size_t vl);
void __riscv_vsse8_v_i8mf8_m(vbool64_t vm, int8_t *rs1, ptrdiff_t rs2,
                             vint8mf8_t vs3, size_t vl);
void __riscv_vsse8_v_i8mf4_m(vbool32_t vm, int8_t *rs1, ptrdiff_t rs2,
                             vint8mf4_t vs3, size_t vl);
void __riscv_vsse8_v_i8mf2_m(vbool16_t vm, int8_t *rs1, ptrdiff_t rs2,
                             vint8mf2_t vs3, size_t vl);
void __riscv_vsse8_v_i8m1_m(vbool8_t vm, int8_t *rs1, ptrdiff_t rs2,
                            vint8m1_t vs3, size_t vl);
void __riscv_vsse8_v_i8m2_m(vbool4_t vm, int8_t *rs1, ptrdiff_t rs2,
                            vint8m2_t vs3, size_t vl);
void __riscv_vsse8_v_i8m4_m(vbool2_t vm, int8_t *rs1, ptrdiff_t rs2,
                            vint8m4_t vs3, size_t vl);
void __riscv_vsse8_v_i8m8_m(vbool1_t vm, int8_t *rs1, ptrdiff_t rs2,
                            vint8m8_t vs3, size_t vl);
void __riscv_vsse16_v_i16mf4_m(vbool64_t vm, int16_t *rs1, ptrdiff_t rs2,
                               vint16mf4_t vs3, size_t vl);
void __riscv_vsse16_v_i16mf2_m(vbool32_t vm, int16_t *rs1, ptrdiff_t rs2,
                               vint16mf2_t vs3, size_t vl);
void __riscv_vsse16_v_i16m1_m(vbool16_t vm, int16_t *rs1, ptrdiff_t rs2,
                              vint16m1_t vs3, size_t vl);
void __riscv_vsse16_v_i16m2_m(vbool8_t vm, int16_t *rs1, ptrdiff_t rs2,
                              vint16m2_t vs3, size_t vl);
void __riscv_vsse16_v_i16m4_m(vbool4_t vm, int16_t *rs1, ptrdiff_t rs2,
                              vint16m4_t vs3, size_t vl);
void __riscv_vsse16_v_i16m8_m(vbool2_t vm, int16_t *rs1, ptrdiff_t rs2,
                              vint16m8_t vs3, size_t vl);
void __riscv_vsse32_v_i32mf2_m(vbool64_t vm, int32_t *rs1, ptrdiff_t rs2,
                               vint32mf2_t vs3, size_t vl);
void __riscv_vsse32_v_i32m1_m(vbool32_t vm, int32_t *rs1, ptrdiff_t rs2,
                              vint32m1_t vs3, size_t vl);
void __riscv_vsse32_v_i32m2_m(vbool16_t vm, int32_t *rs1, ptrdiff_t rs2,
                              vint32m2_t vs3, size_t vl);
void __riscv_vsse32_v_i32m4_m(vbool8_t vm, int32_t *rs1, ptrdiff_t rs2,
                              vint32m4_t vs3, size_t vl);
void __riscv_vsse32_v_i32m8_m(vbool4_t vm, int32_t *rs1, ptrdiff_t rs2,
                              vint32m8_t vs3, size_t vl);
void __riscv_vsse64_v_i64m1_m(vbool64_t vm, int64_t *rs1, ptrdiff_t rs2,
                              vint64m1_t vs3, size_t vl);
void __riscv_vsse64_v_i64m2_m(vbool32_t vm, int64_t *rs1, ptrdiff_t rs2,
                              vint64m2_t vs3, size_t vl);
void __riscv_vsse64_v_i64m4_m(vbool16_t vm, int64_t *rs1, ptrdiff_t rs2,
                              vint64m4_t vs3, size_t vl);
void __riscv_vsse64_v_i64m8_m(vbool8_t vm, int64_t *rs1, ptrdiff_t rs2,
                              vint64m8_t vs3, size_t vl);
void __riscv_vsse8_v_u8mf8_m(vbool64_t vm, uint8_t *rs1, ptrdiff_t rs2,
                             vuint8mf8_t vs3, size_t vl);
void __riscv_vsse8_v_u8mf4_m(vbool32_t vm, uint8_t *rs1, ptrdiff_t rs2,
                             vuint8mf4_t vs3, size_t vl);
void __riscv_vsse8_v_u8mf2_m(vbool16_t vm, uint8_t *rs1, ptrdiff_t rs2,
                             vuint8mf2_t vs3, size_t vl);
void __riscv_vsse8_v_u8m1_m(vbool8_t vm, uint8_t *rs1, ptrdiff_t rs2,
                            vuint8m1_t vs3, size_t vl);
void __riscv_vsse8_v_u8m2_m(vbool4_t vm, uint8_t *rs1, ptrdiff_t rs2,
                            vuint8m2_t vs3, size_t vl);
void __riscv_vsse8_v_u8m4_m(vbool2_t vm, uint8_t *rs1, ptrdiff_t rs2,
                            vuint8m4_t vs3, size_t vl);
void __riscv_vsse8_v_u8m8_m(vbool1_t vm, uint8_t *rs1, ptrdiff_t rs2,
                            vuint8m8_t vs3, size_t vl);
void __riscv_vsse16_v_u16mf4_m(vbool64_t vm, uint16_t *rs1, ptrdiff_t rs2,
                               vuint16mf4_t vs3, size_t vl);
void __riscv_vsse16_v_u16mf2_m(vbool32_t vm, uint16_t *rs1, ptrdiff_t rs2,
                               vuint16mf2_t vs3, size_t vl);
void __riscv_vsse16_v_u16m1_m(vbool16_t vm, uint16_t *rs1, ptrdiff_t rs2,
                              vuint16m1_t vs3, size_t vl);
void __riscv_vsse16_v_u16m2_m(vbool8_t vm, uint16_t *rs1, ptrdiff_t rs2,
                              vuint16m2_t vs3, size_t vl);
void __riscv_vsse16_v_u16m4_m(vbool4_t vm, uint16_t *rs1, ptrdiff_t rs2,
                              vuint16m4_t vs3, size_t vl);
void __riscv_vsse16_v_u16m8_m(vbool2_t vm, uint16_t *rs1, ptrdiff_t rs2,
                              vuint16m8_t vs3, size_t vl);
void __riscv_vsse32_v_u32mf2_m(vbool64_t vm, uint32_t *rs1, ptrdiff_t rs2,
                               vuint32mf2_t vs3, size_t vl);
void __riscv_vsse32_v_u32m1_m(vbool32_t vm, uint32_t *rs1, ptrdiff_t rs2,
                              vuint32m1_t vs3, size_t vl);
void __riscv_vsse32_v_u32m2_m(vbool16_t vm, uint32_t *rs1, ptrdiff_t rs2,
                              vuint32m2_t vs3, size_t vl);
void __riscv_vsse32_v_u32m4_m(vbool8_t vm, uint32_t *rs1, ptrdiff_t rs2,
                              vuint32m4_t vs3, size_t vl);
void __riscv_vsse32_v_u32m8_m(vbool4_t vm, uint32_t *rs1, ptrdiff_t rs2,
                              vuint32m8_t vs3, size_t vl);
void __riscv_vsse64_v_u64m1_m(vbool64_t vm, uint64_t *rs1, ptrdiff_t rs2,
                              vuint64m1_t vs3, size_t vl);
void __riscv_vsse64_v_u64m2_m(vbool32_t vm, uint64_t *rs1, ptrdiff_t rs2,
                              vuint64m2_t vs3, size_t vl);
void __riscv_vsse64_v_u64m4_m(vbool16_t vm, uint64_t *rs1, ptrdiff_t rs2,
                              vuint64m4_t vs3, size_t vl);
void __riscv_vsse64_v_u64m8_m(vbool8_t vm, uint64_t *rs1, ptrdiff_t rs2,
                              vuint64m8_t vs3, size_t vl);

Vector Indexed Load Intrinsics

// vloxei<EEW> prototypes that return floating-point vectors (f16, f32, f64).
//   rs1 - const pointer to the base of the source memory (element-typed)
//   rs2 - index vector; always an unsigned-integer vector whose element width
//         is the <EEW> in the intrinsic name (ei8 -> vuint8*, ei16 ->
//         vuint16*, ei32 -> vuint32*, ei64 -> vuint64*)
//   vl  - the vector length, as size_t
// The index LMUL is the result LMUL scaled by EEW / (result element width),
// e.g. f16mf4 pairs with vuint8mf8_t for ei8 and vuint64m1_t for ei64.
// Combinations whose index type would need an LMUL above m8 are not listed
// (e.g. there is no vloxei32 for f16m8 and no vloxei64 for f16m4 or f32m8).
// NOTE(review): per the RVV ISA, vloxei is presumably the indexed-ordered
// load and rs2 holds byte offsets from rs1 -- confirm against the spec.
vfloat16mf4_t __riscv_vloxei8_v_f16mf4(const _Float16 *rs1, vuint8mf8_t rs2,
                                       size_t vl);
vfloat16mf2_t __riscv_vloxei8_v_f16mf2(const _Float16 *rs1, vuint8mf4_t rs2,
                                       size_t vl);
vfloat16m1_t __riscv_vloxei8_v_f16m1(const _Float16 *rs1, vuint8mf2_t rs2,
                                     size_t vl);
vfloat16m2_t __riscv_vloxei8_v_f16m2(const _Float16 *rs1, vuint8m1_t rs2,
                                     size_t vl);
vfloat16m4_t __riscv_vloxei8_v_f16m4(const _Float16 *rs1, vuint8m2_t rs2,
                                     size_t vl);
vfloat16m8_t __riscv_vloxei8_v_f16m8(const _Float16 *rs1, vuint8m4_t rs2,
                                     size_t vl);
vfloat16mf4_t __riscv_vloxei16_v_f16mf4(const _Float16 *rs1, vuint16mf4_t rs2,
                                        size_t vl);
vfloat16mf2_t __riscv_vloxei16_v_f16mf2(const _Float16 *rs1, vuint16mf2_t rs2,
                                        size_t vl);
vfloat16m1_t __riscv_vloxei16_v_f16m1(const _Float16 *rs1, vuint16m1_t rs2,
                                      size_t vl);
vfloat16m2_t __riscv_vloxei16_v_f16m2(const _Float16 *rs1, vuint16m2_t rs2,
                                      size_t vl);
vfloat16m4_t __riscv_vloxei16_v_f16m4(const _Float16 *rs1, vuint16m4_t rs2,
                                      size_t vl);
vfloat16m8_t __riscv_vloxei16_v_f16m8(const _Float16 *rs1, vuint16m8_t rs2,
                                      size_t vl);
vfloat16mf4_t __riscv_vloxei32_v_f16mf4(const _Float16 *rs1, vuint32mf2_t rs2,
                                        size_t vl);
vfloat16mf2_t __riscv_vloxei32_v_f16mf2(const _Float16 *rs1, vuint32m1_t rs2,
                                        size_t vl);
vfloat16m1_t __riscv_vloxei32_v_f16m1(const _Float16 *rs1, vuint32m2_t rs2,
                                      size_t vl);
vfloat16m2_t __riscv_vloxei32_v_f16m2(const _Float16 *rs1, vuint32m4_t rs2,
                                      size_t vl);
vfloat16m4_t __riscv_vloxei32_v_f16m4(const _Float16 *rs1, vuint32m8_t rs2,
                                      size_t vl);
vfloat16mf4_t __riscv_vloxei64_v_f16mf4(const _Float16 *rs1, vuint64m1_t rs2,
                                        size_t vl);
vfloat16mf2_t __riscv_vloxei64_v_f16mf2(const _Float16 *rs1, vuint64m2_t rs2,
                                        size_t vl);
vfloat16m1_t __riscv_vloxei64_v_f16m1(const _Float16 *rs1, vuint64m4_t rs2,
                                      size_t vl);
vfloat16m2_t __riscv_vloxei64_v_f16m2(const _Float16 *rs1, vuint64m8_t rs2,
                                      size_t vl);
vfloat32mf2_t __riscv_vloxei8_v_f32mf2(const float *rs1, vuint8mf8_t rs2,
                                       size_t vl);
vfloat32m1_t __riscv_vloxei8_v_f32m1(const float *rs1, vuint8mf4_t rs2,
                                     size_t vl);
vfloat32m2_t __riscv_vloxei8_v_f32m2(const float *rs1, vuint8mf2_t rs2,
                                     size_t vl);
vfloat32m4_t __riscv_vloxei8_v_f32m4(const float *rs1, vuint8m1_t rs2,
                                     size_t vl);
vfloat32m8_t __riscv_vloxei8_v_f32m8(const float *rs1, vuint8m2_t rs2,
                                     size_t vl);
vfloat32mf2_t __riscv_vloxei16_v_f32mf2(const float *rs1, vuint16mf4_t rs2,
                                        size_t vl);
vfloat32m1_t __riscv_vloxei16_v_f32m1(const float *rs1, vuint16mf2_t rs2,
                                      size_t vl);
vfloat32m2_t __riscv_vloxei16_v_f32m2(const float *rs1, vuint16m1_t rs2,
                                      size_t vl);
vfloat32m4_t __riscv_vloxei16_v_f32m4(const float *rs1, vuint16m2_t rs2,
                                      size_t vl);
vfloat32m8_t __riscv_vloxei16_v_f32m8(const float *rs1, vuint16m4_t rs2,
                                      size_t vl);
vfloat32mf2_t __riscv_vloxei32_v_f32mf2(const float *rs1, vuint32mf2_t rs2,
                                        size_t vl);
vfloat32m1_t __riscv_vloxei32_v_f32m1(const float *rs1, vuint32m1_t rs2,
                                      size_t vl);
vfloat32m2_t __riscv_vloxei32_v_f32m2(const float *rs1, vuint32m2_t rs2,
                                      size_t vl);
vfloat32m4_t __riscv_vloxei32_v_f32m4(const float *rs1, vuint32m4_t rs2,
                                      size_t vl);
vfloat32m8_t __riscv_vloxei32_v_f32m8(const float *rs1, vuint32m8_t rs2,
                                      size_t vl);
vfloat32mf2_t __riscv_vloxei64_v_f32mf2(const float *rs1, vuint64m1_t rs2,
                                        size_t vl);
vfloat32m1_t __riscv_vloxei64_v_f32m1(const float *rs1, vuint64m2_t rs2,
                                      size_t vl);
vfloat32m2_t __riscv_vloxei64_v_f32m2(const float *rs1, vuint64m4_t rs2,
                                      size_t vl);
vfloat32m4_t __riscv_vloxei64_v_f32m4(const float *rs1, vuint64m8_t rs2,
                                      size_t vl);
vfloat64m1_t __riscv_vloxei8_v_f64m1(const double *rs1, vuint8mf8_t rs2,
                                     size_t vl);
vfloat64m2_t __riscv_vloxei8_v_f64m2(const double *rs1, vuint8mf4_t rs2,
                                     size_t vl);
vfloat64m4_t __riscv_vloxei8_v_f64m4(const double *rs1, vuint8mf2_t rs2,
                                     size_t vl);
vfloat64m8_t __riscv_vloxei8_v_f64m8(const double *rs1, vuint8m1_t rs2,
                                     size_t vl);
vfloat64m1_t __riscv_vloxei16_v_f64m1(const double *rs1, vuint16mf4_t rs2,
                                      size_t vl);
vfloat64m2_t __riscv_vloxei16_v_f64m2(const double *rs1, vuint16mf2_t rs2,
                                      size_t vl);
vfloat64m4_t __riscv_vloxei16_v_f64m4(const double *rs1, vuint16m1_t rs2,
                                      size_t vl);
vfloat64m8_t __riscv_vloxei16_v_f64m8(const double *rs1, vuint16m2_t rs2,
                                      size_t vl);
vfloat64m1_t __riscv_vloxei32_v_f64m1(const double *rs1, vuint32mf2_t rs2,
                                      size_t vl);
vfloat64m2_t __riscv_vloxei32_v_f64m2(const double *rs1, vuint32m1_t rs2,
                                      size_t vl);
vfloat64m4_t __riscv_vloxei32_v_f64m4(const double *rs1, vuint32m2_t rs2,
                                      size_t vl);
vfloat64m8_t __riscv_vloxei32_v_f64m8(const double *rs1, vuint32m4_t rs2,
                                      size_t vl);
vfloat64m1_t __riscv_vloxei64_v_f64m1(const double *rs1, vuint64m1_t rs2,
                                      size_t vl);
vfloat64m2_t __riscv_vloxei64_v_f64m2(const double *rs1, vuint64m2_t rs2,
                                      size_t vl);
vfloat64m4_t __riscv_vloxei64_v_f64m4(const double *rs1, vuint64m4_t rs2,
                                      size_t vl);
vfloat64m8_t __riscv_vloxei64_v_f64m8(const double *rs1, vuint64m8_t rs2,
                                      size_t vl);
// vluxei<EEW> prototypes that return floating-point vectors (f16, f32, f64).
//   rs1 - const pointer to the base of the source memory (element-typed)
//   rs2 - index vector; always an unsigned-integer vector whose element width
//         is the <EEW> in the intrinsic name (ei8 -> vuint8*, ei16 ->
//         vuint16*, ei32 -> vuint32*, ei64 -> vuint64*)
//   vl  - the vector length, as size_t
// The index LMUL is the result LMUL scaled by EEW / (result element width),
// e.g. f32mf2 pairs with vuint8mf8_t for ei8 and f64m8 with vuint8m1_t.
// Combinations whose index type would need an LMUL above m8 are not listed
// (e.g. there is no vluxei32 for f16m8 and no vluxei64 for f32m8).
// NOTE(review): per the RVV ISA, vluxei is presumably the indexed-unordered
// load and rs2 holds byte offsets from rs1 -- confirm against the spec.
vfloat16mf4_t __riscv_vluxei8_v_f16mf4(const _Float16 *rs1, vuint8mf8_t rs2,
                                       size_t vl);
vfloat16mf2_t __riscv_vluxei8_v_f16mf2(const _Float16 *rs1, vuint8mf4_t rs2,
                                       size_t vl);
vfloat16m1_t __riscv_vluxei8_v_f16m1(const _Float16 *rs1, vuint8mf2_t rs2,
                                     size_t vl);
vfloat16m2_t __riscv_vluxei8_v_f16m2(const _Float16 *rs1, vuint8m1_t rs2,
                                     size_t vl);
vfloat16m4_t __riscv_vluxei8_v_f16m4(const _Float16 *rs1, vuint8m2_t rs2,
                                     size_t vl);
vfloat16m8_t __riscv_vluxei8_v_f16m8(const _Float16 *rs1, vuint8m4_t rs2,
                                     size_t vl);
vfloat16mf4_t __riscv_vluxei16_v_f16mf4(const _Float16 *rs1, vuint16mf4_t rs2,
                                        size_t vl);
vfloat16mf2_t __riscv_vluxei16_v_f16mf2(const _Float16 *rs1, vuint16mf2_t rs2,
                                        size_t vl);
vfloat16m1_t __riscv_vluxei16_v_f16m1(const _Float16 *rs1, vuint16m1_t rs2,
                                      size_t vl);
vfloat16m2_t __riscv_vluxei16_v_f16m2(const _Float16 *rs1, vuint16m2_t rs2,
                                      size_t vl);
vfloat16m4_t __riscv_vluxei16_v_f16m4(const _Float16 *rs1, vuint16m4_t rs2,
                                      size_t vl);
vfloat16m8_t __riscv_vluxei16_v_f16m8(const _Float16 *rs1, vuint16m8_t rs2,
                                      size_t vl);
vfloat16mf4_t __riscv_vluxei32_v_f16mf4(const _Float16 *rs1, vuint32mf2_t rs2,
                                        size_t vl);
vfloat16mf2_t __riscv_vluxei32_v_f16mf2(const _Float16 *rs1, vuint32m1_t rs2,
                                        size_t vl);
vfloat16m1_t __riscv_vluxei32_v_f16m1(const _Float16 *rs1, vuint32m2_t rs2,
                                      size_t vl);
vfloat16m2_t __riscv_vluxei32_v_f16m2(const _Float16 *rs1, vuint32m4_t rs2,
                                      size_t vl);
vfloat16m4_t __riscv_vluxei32_v_f16m4(const _Float16 *rs1, vuint32m8_t rs2,
                                      size_t vl);
vfloat16mf4_t __riscv_vluxei64_v_f16mf4(const _Float16 *rs1, vuint64m1_t rs2,
                                        size_t vl);
vfloat16mf2_t __riscv_vluxei64_v_f16mf2(const _Float16 *rs1, vuint64m2_t rs2,
                                        size_t vl);
vfloat16m1_t __riscv_vluxei64_v_f16m1(const _Float16 *rs1, vuint64m4_t rs2,
                                      size_t vl);
vfloat16m2_t __riscv_vluxei64_v_f16m2(const _Float16 *rs1, vuint64m8_t rs2,
                                      size_t vl);
vfloat32mf2_t __riscv_vluxei8_v_f32mf2(const float *rs1, vuint8mf8_t rs2,
                                       size_t vl);
vfloat32m1_t __riscv_vluxei8_v_f32m1(const float *rs1, vuint8mf4_t rs2,
                                     size_t vl);
vfloat32m2_t __riscv_vluxei8_v_f32m2(const float *rs1, vuint8mf2_t rs2,
                                     size_t vl);
vfloat32m4_t __riscv_vluxei8_v_f32m4(const float *rs1, vuint8m1_t rs2,
                                     size_t vl);
vfloat32m8_t __riscv_vluxei8_v_f32m8(const float *rs1, vuint8m2_t rs2,
                                     size_t vl);
vfloat32mf2_t __riscv_vluxei16_v_f32mf2(const float *rs1, vuint16mf4_t rs2,
                                        size_t vl);
vfloat32m1_t __riscv_vluxei16_v_f32m1(const float *rs1, vuint16mf2_t rs2,
                                      size_t vl);
vfloat32m2_t __riscv_vluxei16_v_f32m2(const float *rs1, vuint16m1_t rs2,
                                      size_t vl);
vfloat32m4_t __riscv_vluxei16_v_f32m4(const float *rs1, vuint16m2_t rs2,
                                      size_t vl);
vfloat32m8_t __riscv_vluxei16_v_f32m8(const float *rs1, vuint16m4_t rs2,
                                      size_t vl);
vfloat32mf2_t __riscv_vluxei32_v_f32mf2(const float *rs1, vuint32mf2_t rs2,
                                        size_t vl);
vfloat32m1_t __riscv_vluxei32_v_f32m1(const float *rs1, vuint32m1_t rs2,
                                      size_t vl);
vfloat32m2_t __riscv_vluxei32_v_f32m2(const float *rs1, vuint32m2_t rs2,
                                      size_t vl);
vfloat32m4_t __riscv_vluxei32_v_f32m4(const float *rs1, vuint32m4_t rs2,
                                      size_t vl);
vfloat32m8_t __riscv_vluxei32_v_f32m8(const float *rs1, vuint32m8_t rs2,
                                      size_t vl);
vfloat32mf2_t __riscv_vluxei64_v_f32mf2(const float *rs1, vuint64m1_t rs2,
                                        size_t vl);
vfloat32m1_t __riscv_vluxei64_v_f32m1(const float *rs1, vuint64m2_t rs2,
                                      size_t vl);
vfloat32m2_t __riscv_vluxei64_v_f32m2(const float *rs1, vuint64m4_t rs2,
                                      size_t vl);
vfloat32m4_t __riscv_vluxei64_v_f32m4(const float *rs1, vuint64m8_t rs2,
                                      size_t vl);
vfloat64m1_t __riscv_vluxei8_v_f64m1(const double *rs1, vuint8mf8_t rs2,
                                     size_t vl);
vfloat64m2_t __riscv_vluxei8_v_f64m2(const double *rs1, vuint8mf4_t rs2,
                                     size_t vl);
vfloat64m4_t __riscv_vluxei8_v_f64m4(const double *rs1, vuint8mf2_t rs2,
                                     size_t vl);
vfloat64m8_t __riscv_vluxei8_v_f64m8(const double *rs1, vuint8m1_t rs2,
                                     size_t vl);
vfloat64m1_t __riscv_vluxei16_v_f64m1(const double *rs1, vuint16mf4_t rs2,
                                      size_t vl);
vfloat64m2_t __riscv_vluxei16_v_f64m2(const double *rs1, vuint16mf2_t rs2,
                                      size_t vl);
vfloat64m4_t __riscv_vluxei16_v_f64m4(const double *rs1, vuint16m1_t rs2,
                                      size_t vl);
vfloat64m8_t __riscv_vluxei16_v_f64m8(const double *rs1, vuint16m2_t rs2,
                                      size_t vl);
vfloat64m1_t __riscv_vluxei32_v_f64m1(const double *rs1, vuint32mf2_t rs2,
                                      size_t vl);
vfloat64m2_t __riscv_vluxei32_v_f64m2(const double *rs1, vuint32m1_t rs2,
                                      size_t vl);
vfloat64m4_t __riscv_vluxei32_v_f64m4(const double *rs1, vuint32m2_t rs2,
                                      size_t vl);
vfloat64m8_t __riscv_vluxei32_v_f64m8(const double *rs1, vuint32m4_t rs2,
                                      size_t vl);
vfloat64m1_t __riscv_vluxei64_v_f64m1(const double *rs1, vuint64m1_t rs2,
                                      size_t vl);
vfloat64m2_t __riscv_vluxei64_v_f64m2(const double *rs1, vuint64m2_t rs2,
                                      size_t vl);
vfloat64m4_t __riscv_vluxei64_v_f64m4(const double *rs1, vuint64m4_t rs2,
                                      size_t vl);
vfloat64m8_t __riscv_vluxei64_v_f64m8(const double *rs1, vuint64m8_t rs2,
                                      size_t vl);
vint8mf8_t __riscv_vloxei8_v_i8mf8(const int8_t *rs1, vuint8mf8_t rs2,
                                   size_t vl);
vint8mf4_t __riscv_vloxei8_v_i8mf4(const int8_t *rs1, vuint8mf4_t rs2,
                                   size_t vl);
vint8mf2_t __riscv_vloxei8_v_i8mf2(const int8_t *rs1, vuint8mf2_t rs2,
                                   size_t vl);
vint8m1_t __riscv_vloxei8_v_i8m1(const int8_t *rs1, vuint8m1_t rs2, size_t vl);
vint8m2_t __riscv_vloxei8_v_i8m2(const int8_t *rs1, vuint8m2_t rs2, size_t vl);
vint8m4_t __riscv_vloxei8_v_i8m4(const int8_t *rs1, vuint8m4_t rs2, size_t vl);
vint8m8_t __riscv_vloxei8_v_i8m8(const int8_t *rs1, vuint8m8_t rs2, size_t vl);
vint8mf8_t __riscv_vloxei16_v_i8mf8(const int8_t *rs1, vuint16mf4_t rs2,
                                    size_t vl);
vint8mf4_t __riscv_vloxei16_v_i8mf4(const int8_t *rs1, vuint16mf2_t rs2,
                                    size_t vl);
vint8mf2_t __riscv_vloxei16_v_i8mf2(const int8_t *rs1, vuint16m1_t rs2,
                                    size_t vl);
vint8m1_t __riscv_vloxei16_v_i8m1(const int8_t *rs1, vuint16m2_t rs2,
                                  size_t vl);
vint8m2_t __riscv_vloxei16_v_i8m2(const int8_t *rs1, vuint16m4_t rs2,
                                  size_t vl);
vint8m4_t __riscv_vloxei16_v_i8m4(const int8_t *rs1, vuint16m8_t rs2,
                                  size_t vl);
vint8mf8_t __riscv_vloxei32_v_i8mf8(const int8_t *rs1, vuint32mf2_t rs2,
                                    size_t vl);
vint8mf4_t __riscv_vloxei32_v_i8mf4(const int8_t *rs1, vuint32m1_t rs2,
                                    size_t vl);
vint8mf2_t __riscv_vloxei32_v_i8mf2(const int8_t *rs1, vuint32m2_t rs2,
                                    size_t vl);
vint8m1_t __riscv_vloxei32_v_i8m1(const int8_t *rs1, vuint32m4_t rs2,
                                  size_t vl);
vint8m2_t __riscv_vloxei32_v_i8m2(const int8_t *rs1, vuint32m8_t rs2,
                                  size_t vl);
vint8mf8_t __riscv_vloxei64_v_i8mf8(const int8_t *rs1, vuint64m1_t rs2,
                                    size_t vl);
vint8mf4_t __riscv_vloxei64_v_i8mf4(const int8_t *rs1, vuint64m2_t rs2,
                                    size_t vl);
vint8mf2_t __riscv_vloxei64_v_i8mf2(const int8_t *rs1, vuint64m4_t rs2,
                                    size_t vl);
vint8m1_t __riscv_vloxei64_v_i8m1(const int8_t *rs1, vuint64m8_t rs2,
                                  size_t vl);
// vloxei{8,16,32,64} prototypes returning int16_t element vectors
// (vint16*_t); no mask operand.
// rs1: const int16_t * base; rs2: unsigned index vector whose element width
// matches the eiNN suffix; vl: size_t.
// Index LMUL = result LMUL * (index width / 16), e.g. i16m1 pairs with
// vuint8mf2_t / vuint16m1_t / vuint32m2_t / vuint64m4_t. Each eiNN list ends
// once either the result type or the index type reaches m8.
// NOTE(review): vloxei is the indexed-ordered load mnemonic in the RISC-V V
// spec; confirm exact semantics (e.g. index units) against the ISA manual.
vint16mf4_t __riscv_vloxei8_v_i16mf4(const int16_t *rs1, vuint8mf8_t rs2,
                                     size_t vl);
vint16mf2_t __riscv_vloxei8_v_i16mf2(const int16_t *rs1, vuint8mf4_t rs2,
                                     size_t vl);
vint16m1_t __riscv_vloxei8_v_i16m1(const int16_t *rs1, vuint8mf2_t rs2,
                                   size_t vl);
vint16m2_t __riscv_vloxei8_v_i16m2(const int16_t *rs1, vuint8m1_t rs2,
                                   size_t vl);
vint16m4_t __riscv_vloxei8_v_i16m4(const int16_t *rs1, vuint8m2_t rs2,
                                   size_t vl);
vint16m8_t __riscv_vloxei8_v_i16m8(const int16_t *rs1, vuint8m4_t rs2,
                                   size_t vl);
vint16mf4_t __riscv_vloxei16_v_i16mf4(const int16_t *rs1, vuint16mf4_t rs2,
                                      size_t vl);
vint16mf2_t __riscv_vloxei16_v_i16mf2(const int16_t *rs1, vuint16mf2_t rs2,
                                      size_t vl);
vint16m1_t __riscv_vloxei16_v_i16m1(const int16_t *rs1, vuint16m1_t rs2,
                                    size_t vl);
vint16m2_t __riscv_vloxei16_v_i16m2(const int16_t *rs1, vuint16m2_t rs2,
                                    size_t vl);
vint16m4_t __riscv_vloxei16_v_i16m4(const int16_t *rs1, vuint16m4_t rs2,
                                    size_t vl);
vint16m8_t __riscv_vloxei16_v_i16m8(const int16_t *rs1, vuint16m8_t rs2,
                                    size_t vl);
vint16mf4_t __riscv_vloxei32_v_i16mf4(const int16_t *rs1, vuint32mf2_t rs2,
                                      size_t vl);
vint16mf2_t __riscv_vloxei32_v_i16mf2(const int16_t *rs1, vuint32m1_t rs2,
                                      size_t vl);
vint16m1_t __riscv_vloxei32_v_i16m1(const int16_t *rs1, vuint32m2_t rs2,
                                    size_t vl);
vint16m2_t __riscv_vloxei32_v_i16m2(const int16_t *rs1, vuint32m4_t rs2,
                                    size_t vl);
vint16m4_t __riscv_vloxei32_v_i16m4(const int16_t *rs1, vuint32m8_t rs2,
                                    size_t vl);
vint16mf4_t __riscv_vloxei64_v_i16mf4(const int16_t *rs1, vuint64m1_t rs2,
                                      size_t vl);
vint16mf2_t __riscv_vloxei64_v_i16mf2(const int16_t *rs1, vuint64m2_t rs2,
                                      size_t vl);
vint16m1_t __riscv_vloxei64_v_i16m1(const int16_t *rs1, vuint64m4_t rs2,
                                    size_t vl);
vint16m2_t __riscv_vloxei64_v_i16m2(const int16_t *rs1, vuint64m8_t rs2,
                                    size_t vl);
// vloxei{8,16,32,64} prototypes returning int32_t element vectors
// (vint32*_t); no mask operand.
// rs1: const int32_t * base; rs2: unsigned index vector whose element width
// matches the eiNN suffix; vl: size_t.
// Index LMUL = result LMUL * (index width / 32), e.g. i32m1 pairs with
// vuint8mf4_t / vuint16mf2_t / vuint32m1_t / vuint64m2_t. Each eiNN list ends
// once either the result type or the index type reaches m8.
// NOTE(review): vloxei is the indexed-ordered load mnemonic in the RISC-V V
// spec; confirm exact semantics (e.g. index units) against the ISA manual.
vint32mf2_t __riscv_vloxei8_v_i32mf2(const int32_t *rs1, vuint8mf8_t rs2,
                                     size_t vl);
vint32m1_t __riscv_vloxei8_v_i32m1(const int32_t *rs1, vuint8mf4_t rs2,
                                   size_t vl);
vint32m2_t __riscv_vloxei8_v_i32m2(const int32_t *rs1, vuint8mf2_t rs2,
                                   size_t vl);
vint32m4_t __riscv_vloxei8_v_i32m4(const int32_t *rs1, vuint8m1_t rs2,
                                   size_t vl);
vint32m8_t __riscv_vloxei8_v_i32m8(const int32_t *rs1, vuint8m2_t rs2,
                                   size_t vl);
vint32mf2_t __riscv_vloxei16_v_i32mf2(const int32_t *rs1, vuint16mf4_t rs2,
                                      size_t vl);
vint32m1_t __riscv_vloxei16_v_i32m1(const int32_t *rs1, vuint16mf2_t rs2,
                                    size_t vl);
vint32m2_t __riscv_vloxei16_v_i32m2(const int32_t *rs1, vuint16m1_t rs2,
                                    size_t vl);
vint32m4_t __riscv_vloxei16_v_i32m4(const int32_t *rs1, vuint16m2_t rs2,
                                    size_t vl);
vint32m8_t __riscv_vloxei16_v_i32m8(const int32_t *rs1, vuint16m4_t rs2,
                                    size_t vl);
vint32mf2_t __riscv_vloxei32_v_i32mf2(const int32_t *rs1, vuint32mf2_t rs2,
                                      size_t vl);
vint32m1_t __riscv_vloxei32_v_i32m1(const int32_t *rs1, vuint32m1_t rs2,
                                    size_t vl);
vint32m2_t __riscv_vloxei32_v_i32m2(const int32_t *rs1, vuint32m2_t rs2,
                                    size_t vl);
vint32m4_t __riscv_vloxei32_v_i32m4(const int32_t *rs1, vuint32m4_t rs2,
                                    size_t vl);
vint32m8_t __riscv_vloxei32_v_i32m8(const int32_t *rs1, vuint32m8_t rs2,
                                    size_t vl);
vint32mf2_t __riscv_vloxei64_v_i32mf2(const int32_t *rs1, vuint64m1_t rs2,
                                      size_t vl);
vint32m1_t __riscv_vloxei64_v_i32m1(const int32_t *rs1, vuint64m2_t rs2,
                                    size_t vl);
vint32m2_t __riscv_vloxei64_v_i32m2(const int32_t *rs1, vuint64m4_t rs2,
                                    size_t vl);
vint32m4_t __riscv_vloxei64_v_i32m4(const int32_t *rs1, vuint64m8_t rs2,
                                    size_t vl);
// vloxei{8,16,32,64} prototypes returning int64_t element vectors
// (vint64*_t); no mask operand.
// rs1: const int64_t * base; rs2: unsigned index vector whose element width
// matches the eiNN suffix; vl: size_t.
// Index LMUL = result LMUL * (index width / 64), e.g. i64m1 pairs with
// vuint8mf8_t / vuint16mf4_t / vuint32mf2_t / vuint64m1_t. All four eiNN
// lists cover result types m1 through m8.
// NOTE(review): vloxei is the indexed-ordered load mnemonic in the RISC-V V
// spec; confirm exact semantics (e.g. index units) against the ISA manual.
vint64m1_t __riscv_vloxei8_v_i64m1(const int64_t *rs1, vuint8mf8_t rs2,
                                   size_t vl);
vint64m2_t __riscv_vloxei8_v_i64m2(const int64_t *rs1, vuint8mf4_t rs2,
                                   size_t vl);
vint64m4_t __riscv_vloxei8_v_i64m4(const int64_t *rs1, vuint8mf2_t rs2,
                                   size_t vl);
vint64m8_t __riscv_vloxei8_v_i64m8(const int64_t *rs1, vuint8m1_t rs2,
                                   size_t vl);
vint64m1_t __riscv_vloxei16_v_i64m1(const int64_t *rs1, vuint16mf4_t rs2,
                                    size_t vl);
vint64m2_t __riscv_vloxei16_v_i64m2(const int64_t *rs1, vuint16mf2_t rs2,
                                    size_t vl);
vint64m4_t __riscv_vloxei16_v_i64m4(const int64_t *rs1, vuint16m1_t rs2,
                                    size_t vl);
vint64m8_t __riscv_vloxei16_v_i64m8(const int64_t *rs1, vuint16m2_t rs2,
                                    size_t vl);
vint64m1_t __riscv_vloxei32_v_i64m1(const int64_t *rs1, vuint32mf2_t rs2,
                                    size_t vl);
vint64m2_t __riscv_vloxei32_v_i64m2(const int64_t *rs1, vuint32m1_t rs2,
                                    size_t vl);
vint64m4_t __riscv_vloxei32_v_i64m4(const int64_t *rs1, vuint32m2_t rs2,
                                    size_t vl);
vint64m8_t __riscv_vloxei32_v_i64m8(const int64_t *rs1, vuint32m4_t rs2,
                                    size_t vl);
vint64m1_t __riscv_vloxei64_v_i64m1(const int64_t *rs1, vuint64m1_t rs2,
                                    size_t vl);
vint64m2_t __riscv_vloxei64_v_i64m2(const int64_t *rs1, vuint64m2_t rs2,
                                    size_t vl);
vint64m4_t __riscv_vloxei64_v_i64m4(const int64_t *rs1, vuint64m4_t rs2,
                                    size_t vl);
vint64m8_t __riscv_vloxei64_v_i64m8(const int64_t *rs1, vuint64m8_t rs2,
                                    size_t vl);
// vluxei{8,16,32,64} prototypes returning int8_t element vectors (vint8*_t);
// no mask operand.
// rs1: const int8_t * base; rs2: unsigned index vector whose element width
// matches the eiNN suffix; vl: size_t.
// Index LMUL = result LMUL * (index width / 8), e.g. i8m1 pairs with
// vuint8m1_t / vuint16m2_t / vuint32m4_t / vuint64m8_t. Each eiNN list ends
// once either the result type or the index type reaches m8.
// NOTE(review): vluxei is the indexed-unordered load mnemonic in the RISC-V V
// spec; confirm exact semantics (e.g. index units) against the ISA manual.
vint8mf8_t __riscv_vluxei8_v_i8mf8(const int8_t *rs1, vuint8mf8_t rs2,
                                   size_t vl);
vint8mf4_t __riscv_vluxei8_v_i8mf4(const int8_t *rs1, vuint8mf4_t rs2,
                                   size_t vl);
vint8mf2_t __riscv_vluxei8_v_i8mf2(const int8_t *rs1, vuint8mf2_t rs2,
                                   size_t vl);
vint8m1_t __riscv_vluxei8_v_i8m1(const int8_t *rs1, vuint8m1_t rs2, size_t vl);
vint8m2_t __riscv_vluxei8_v_i8m2(const int8_t *rs1, vuint8m2_t rs2, size_t vl);
vint8m4_t __riscv_vluxei8_v_i8m4(const int8_t *rs1, vuint8m4_t rs2, size_t vl);
vint8m8_t __riscv_vluxei8_v_i8m8(const int8_t *rs1, vuint8m8_t rs2, size_t vl);
vint8mf8_t __riscv_vluxei16_v_i8mf8(const int8_t *rs1, vuint16mf4_t rs2,
                                    size_t vl);
vint8mf4_t __riscv_vluxei16_v_i8mf4(const int8_t *rs1, vuint16mf2_t rs2,
                                    size_t vl);
vint8mf2_t __riscv_vluxei16_v_i8mf2(const int8_t *rs1, vuint16m1_t rs2,
                                    size_t vl);
vint8m1_t __riscv_vluxei16_v_i8m1(const int8_t *rs1, vuint16m2_t rs2,
                                  size_t vl);
vint8m2_t __riscv_vluxei16_v_i8m2(const int8_t *rs1, vuint16m4_t rs2,
                                  size_t vl);
vint8m4_t __riscv_vluxei16_v_i8m4(const int8_t *rs1, vuint16m8_t rs2,
                                  size_t vl);
vint8mf8_t __riscv_vluxei32_v_i8mf8(const int8_t *rs1, vuint32mf2_t rs2,
                                    size_t vl);
vint8mf4_t __riscv_vluxei32_v_i8mf4(const int8_t *rs1, vuint32m1_t rs2,
                                    size_t vl);
vint8mf2_t __riscv_vluxei32_v_i8mf2(const int8_t *rs1, vuint32m2_t rs2,
                                    size_t vl);
vint8m1_t __riscv_vluxei32_v_i8m1(const int8_t *rs1, vuint32m4_t rs2,
                                  size_t vl);
vint8m2_t __riscv_vluxei32_v_i8m2(const int8_t *rs1, vuint32m8_t rs2,
                                  size_t vl);
vint8mf8_t __riscv_vluxei64_v_i8mf8(const int8_t *rs1, vuint64m1_t rs2,
                                    size_t vl);
vint8mf4_t __riscv_vluxei64_v_i8mf4(const int8_t *rs1, vuint64m2_t rs2,
                                    size_t vl);
vint8mf2_t __riscv_vluxei64_v_i8mf2(const int8_t *rs1, vuint64m4_t rs2,
                                    size_t vl);
vint8m1_t __riscv_vluxei64_v_i8m1(const int8_t *rs1, vuint64m8_t rs2,
                                  size_t vl);
// vluxei{8,16,32,64} prototypes returning int16_t element vectors
// (vint16*_t); no mask operand.
// rs1: const int16_t * base; rs2: unsigned index vector whose element width
// matches the eiNN suffix; vl: size_t.
// Index LMUL = result LMUL * (index width / 16), e.g. i16m1 pairs with
// vuint8mf2_t / vuint16m1_t / vuint32m2_t / vuint64m4_t. Each eiNN list ends
// once either the result type or the index type reaches m8.
// NOTE(review): vluxei is the indexed-unordered load mnemonic in the RISC-V V
// spec; confirm exact semantics (e.g. index units) against the ISA manual.
vint16mf4_t __riscv_vluxei8_v_i16mf4(const int16_t *rs1, vuint8mf8_t rs2,
                                     size_t vl);
vint16mf2_t __riscv_vluxei8_v_i16mf2(const int16_t *rs1, vuint8mf4_t rs2,
                                     size_t vl);
vint16m1_t __riscv_vluxei8_v_i16m1(const int16_t *rs1, vuint8mf2_t rs2,
                                   size_t vl);
vint16m2_t __riscv_vluxei8_v_i16m2(const int16_t *rs1, vuint8m1_t rs2,
                                   size_t vl);
vint16m4_t __riscv_vluxei8_v_i16m4(const int16_t *rs1, vuint8m2_t rs2,
                                   size_t vl);
vint16m8_t __riscv_vluxei8_v_i16m8(const int16_t *rs1, vuint8m4_t rs2,
                                   size_t vl);
vint16mf4_t __riscv_vluxei16_v_i16mf4(const int16_t *rs1, vuint16mf4_t rs2,
                                      size_t vl);
vint16mf2_t __riscv_vluxei16_v_i16mf2(const int16_t *rs1, vuint16mf2_t rs2,
                                      size_t vl);
vint16m1_t __riscv_vluxei16_v_i16m1(const int16_t *rs1, vuint16m1_t rs2,
                                    size_t vl);
vint16m2_t __riscv_vluxei16_v_i16m2(const int16_t *rs1, vuint16m2_t rs2,
                                    size_t vl);
vint16m4_t __riscv_vluxei16_v_i16m4(const int16_t *rs1, vuint16m4_t rs2,
                                    size_t vl);
vint16m8_t __riscv_vluxei16_v_i16m8(const int16_t *rs1, vuint16m8_t rs2,
                                    size_t vl);
vint16mf4_t __riscv_vluxei32_v_i16mf4(const int16_t *rs1, vuint32mf2_t rs2,
                                      size_t vl);
vint16mf2_t __riscv_vluxei32_v_i16mf2(const int16_t *rs1, vuint32m1_t rs2,
                                      size_t vl);
vint16m1_t __riscv_vluxei32_v_i16m1(const int16_t *rs1, vuint32m2_t rs2,
                                    size_t vl);
vint16m2_t __riscv_vluxei32_v_i16m2(const int16_t *rs1, vuint32m4_t rs2,
                                    size_t vl);
vint16m4_t __riscv_vluxei32_v_i16m4(const int16_t *rs1, vuint32m8_t rs2,
                                    size_t vl);
vint16mf4_t __riscv_vluxei64_v_i16mf4(const int16_t *rs1, vuint64m1_t rs2,
                                      size_t vl);
vint16mf2_t __riscv_vluxei64_v_i16mf2(const int16_t *rs1, vuint64m2_t rs2,
                                      size_t vl);
vint16m1_t __riscv_vluxei64_v_i16m1(const int16_t *rs1, vuint64m4_t rs2,
                                    size_t vl);
vint16m2_t __riscv_vluxei64_v_i16m2(const int16_t *rs1, vuint64m8_t rs2,
                                    size_t vl);
// vluxei{8,16,32,64} prototypes returning int32_t element vectors
// (vint32*_t); no mask operand.
// rs1: const int32_t * base; rs2: unsigned index vector whose element width
// matches the eiNN suffix; vl: size_t.
// Index LMUL = result LMUL * (index width / 32), e.g. i32m1 pairs with
// vuint8mf4_t / vuint16mf2_t / vuint32m1_t / vuint64m2_t. Each eiNN list ends
// once either the result type or the index type reaches m8.
// NOTE(review): vluxei is the indexed-unordered load mnemonic in the RISC-V V
// spec; confirm exact semantics (e.g. index units) against the ISA manual.
vint32mf2_t __riscv_vluxei8_v_i32mf2(const int32_t *rs1, vuint8mf8_t rs2,
                                     size_t vl);
vint32m1_t __riscv_vluxei8_v_i32m1(const int32_t *rs1, vuint8mf4_t rs2,
                                   size_t vl);
vint32m2_t __riscv_vluxei8_v_i32m2(const int32_t *rs1, vuint8mf2_t rs2,
                                   size_t vl);
vint32m4_t __riscv_vluxei8_v_i32m4(const int32_t *rs1, vuint8m1_t rs2,
                                   size_t vl);
vint32m8_t __riscv_vluxei8_v_i32m8(const int32_t *rs1, vuint8m2_t rs2,
                                   size_t vl);
vint32mf2_t __riscv_vluxei16_v_i32mf2(const int32_t *rs1, vuint16mf4_t rs2,
                                      size_t vl);
vint32m1_t __riscv_vluxei16_v_i32m1(const int32_t *rs1, vuint16mf2_t rs2,
                                    size_t vl);
vint32m2_t __riscv_vluxei16_v_i32m2(const int32_t *rs1, vuint16m1_t rs2,
                                    size_t vl);
vint32m4_t __riscv_vluxei16_v_i32m4(const int32_t *rs1, vuint16m2_t rs2,
                                    size_t vl);
vint32m8_t __riscv_vluxei16_v_i32m8(const int32_t *rs1, vuint16m4_t rs2,
                                    size_t vl);
vint32mf2_t __riscv_vluxei32_v_i32mf2(const int32_t *rs1, vuint32mf2_t rs2,
                                      size_t vl);
vint32m1_t __riscv_vluxei32_v_i32m1(const int32_t *rs1, vuint32m1_t rs2,
                                    size_t vl);
vint32m2_t __riscv_vluxei32_v_i32m2(const int32_t *rs1, vuint32m2_t rs2,
                                    size_t vl);
vint32m4_t __riscv_vluxei32_v_i32m4(const int32_t *rs1, vuint32m4_t rs2,
                                    size_t vl);
vint32m8_t __riscv_vluxei32_v_i32m8(const int32_t *rs1, vuint32m8_t rs2,
                                    size_t vl);
vint32mf2_t __riscv_vluxei64_v_i32mf2(const int32_t *rs1, vuint64m1_t rs2,
                                      size_t vl);
vint32m1_t __riscv_vluxei64_v_i32m1(const int32_t *rs1, vuint64m2_t rs2,
                                    size_t vl);
vint32m2_t __riscv_vluxei64_v_i32m2(const int32_t *rs1, vuint64m4_t rs2,
                                    size_t vl);
vint32m4_t __riscv_vluxei64_v_i32m4(const int32_t *rs1, vuint64m8_t rs2,
                                    size_t vl);
// vluxei{8,16,32,64} prototypes returning int64_t element vectors
// (vint64*_t); no mask operand.
// rs1: const int64_t * base; rs2: unsigned index vector whose element width
// matches the eiNN suffix; vl: size_t.
// Index LMUL = result LMUL * (index width / 64), e.g. i64m1 pairs with
// vuint8mf8_t / vuint16mf4_t / vuint32mf2_t / vuint64m1_t. All four eiNN
// lists cover result types m1 through m8.
// NOTE(review): vluxei is the indexed-unordered load mnemonic in the RISC-V V
// spec; confirm exact semantics (e.g. index units) against the ISA manual.
vint64m1_t __riscv_vluxei8_v_i64m1(const int64_t *rs1, vuint8mf8_t rs2,
                                   size_t vl);
vint64m2_t __riscv_vluxei8_v_i64m2(const int64_t *rs1, vuint8mf4_t rs2,
                                   size_t vl);
vint64m4_t __riscv_vluxei8_v_i64m4(const int64_t *rs1, vuint8mf2_t rs2,
                                   size_t vl);
vint64m8_t __riscv_vluxei8_v_i64m8(const int64_t *rs1, vuint8m1_t rs2,
                                   size_t vl);
vint64m1_t __riscv_vluxei16_v_i64m1(const int64_t *rs1, vuint16mf4_t rs2,
                                    size_t vl);
vint64m2_t __riscv_vluxei16_v_i64m2(const int64_t *rs1, vuint16mf2_t rs2,
                                    size_t vl);
vint64m4_t __riscv_vluxei16_v_i64m4(const int64_t *rs1, vuint16m1_t rs2,
                                    size_t vl);
vint64m8_t __riscv_vluxei16_v_i64m8(const int64_t *rs1, vuint16m2_t rs2,
                                    size_t vl);
vint64m1_t __riscv_vluxei32_v_i64m1(const int64_t *rs1, vuint32mf2_t rs2,
                                    size_t vl);
vint64m2_t __riscv_vluxei32_v_i64m2(const int64_t *rs1, vuint32m1_t rs2,
                                    size_t vl);
vint64m4_t __riscv_vluxei32_v_i64m4(const int64_t *rs1, vuint32m2_t rs2,
                                    size_t vl);
vint64m8_t __riscv_vluxei32_v_i64m8(const int64_t *rs1, vuint32m4_t rs2,
                                    size_t vl);
vint64m1_t __riscv_vluxei64_v_i64m1(const int64_t *rs1, vuint64m1_t rs2,
                                    size_t vl);
vint64m2_t __riscv_vluxei64_v_i64m2(const int64_t *rs1, vuint64m2_t rs2,
                                    size_t vl);
vint64m4_t __riscv_vluxei64_v_i64m4(const int64_t *rs1, vuint64m4_t rs2,
                                    size_t vl);
vint64m8_t __riscv_vluxei64_v_i64m8(const int64_t *rs1, vuint64m8_t rs2,
                                    size_t vl);
// vloxei{8,16,32,64} prototypes returning uint8_t element vectors
// (vuint8*_t); no mask operand.
// rs1: const uint8_t * base; rs2: unsigned index vector whose element width
// matches the eiNN suffix; vl: size_t.
// Index LMUL = result LMUL * (index width / 8), e.g. u8m1 pairs with
// vuint8m1_t / vuint16m2_t / vuint32m4_t / vuint64m8_t. Each eiNN list ends
// once either the result type or the index type reaches m8.
// NOTE(review): vloxei is the indexed-ordered load mnemonic in the RISC-V V
// spec; confirm exact semantics (e.g. index units) against the ISA manual.
vuint8mf8_t __riscv_vloxei8_v_u8mf8(const uint8_t *rs1, vuint8mf8_t rs2,
                                    size_t vl);
vuint8mf4_t __riscv_vloxei8_v_u8mf4(const uint8_t *rs1, vuint8mf4_t rs2,
                                    size_t vl);
vuint8mf2_t __riscv_vloxei8_v_u8mf2(const uint8_t *rs1, vuint8mf2_t rs2,
                                    size_t vl);
vuint8m1_t __riscv_vloxei8_v_u8m1(const uint8_t *rs1, vuint8m1_t rs2,
                                  size_t vl);
vuint8m2_t __riscv_vloxei8_v_u8m2(const uint8_t *rs1, vuint8m2_t rs2,
                                  size_t vl);
vuint8m4_t __riscv_vloxei8_v_u8m4(const uint8_t *rs1, vuint8m4_t rs2,
                                  size_t vl);
vuint8m8_t __riscv_vloxei8_v_u8m8(const uint8_t *rs1, vuint8m8_t rs2,
                                  size_t vl);
vuint8mf8_t __riscv_vloxei16_v_u8mf8(const uint8_t *rs1, vuint16mf4_t rs2,
                                     size_t vl);
vuint8mf4_t __riscv_vloxei16_v_u8mf4(const uint8_t *rs1, vuint16mf2_t rs2,
                                     size_t vl);
vuint8mf2_t __riscv_vloxei16_v_u8mf2(const uint8_t *rs1, vuint16m1_t rs2,
                                     size_t vl);
vuint8m1_t __riscv_vloxei16_v_u8m1(const uint8_t *rs1, vuint16m2_t rs2,
                                   size_t vl);
vuint8m2_t __riscv_vloxei16_v_u8m2(const uint8_t *rs1, vuint16m4_t rs2,
                                   size_t vl);
vuint8m4_t __riscv_vloxei16_v_u8m4(const uint8_t *rs1, vuint16m8_t rs2,
                                   size_t vl);
vuint8mf8_t __riscv_vloxei32_v_u8mf8(const uint8_t *rs1, vuint32mf2_t rs2,
                                     size_t vl);
vuint8mf4_t __riscv_vloxei32_v_u8mf4(const uint8_t *rs1, vuint32m1_t rs2,
                                     size_t vl);
vuint8mf2_t __riscv_vloxei32_v_u8mf2(const uint8_t *rs1, vuint32m2_t rs2,
                                     size_t vl);
vuint8m1_t __riscv_vloxei32_v_u8m1(const uint8_t *rs1, vuint32m4_t rs2,
                                   size_t vl);
vuint8m2_t __riscv_vloxei32_v_u8m2(const uint8_t *rs1, vuint32m8_t rs2,
                                   size_t vl);
vuint8mf8_t __riscv_vloxei64_v_u8mf8(const uint8_t *rs1, vuint64m1_t rs2,
                                     size_t vl);
vuint8mf4_t __riscv_vloxei64_v_u8mf4(const uint8_t *rs1, vuint64m2_t rs2,
                                     size_t vl);
vuint8mf2_t __riscv_vloxei64_v_u8mf2(const uint8_t *rs1, vuint64m4_t rs2,
                                     size_t vl);
vuint8m1_t __riscv_vloxei64_v_u8m1(const uint8_t *rs1, vuint64m8_t rs2,
                                   size_t vl);
// vloxei{8,16,32,64} prototypes returning uint16_t element vectors
// (vuint16*_t); no mask operand.
// rs1: const uint16_t * base; rs2: unsigned index vector whose element width
// matches the eiNN suffix; vl: size_t.
// Index LMUL = result LMUL * (index width / 16), e.g. u16m1 pairs with
// vuint8mf2_t / vuint16m1_t / vuint32m2_t / vuint64m4_t. Each eiNN list ends
// once either the result type or the index type reaches m8.
// NOTE(review): vloxei is the indexed-ordered load mnemonic in the RISC-V V
// spec; confirm exact semantics (e.g. index units) against the ISA manual.
vuint16mf4_t __riscv_vloxei8_v_u16mf4(const uint16_t *rs1, vuint8mf8_t rs2,
                                      size_t vl);
vuint16mf2_t __riscv_vloxei8_v_u16mf2(const uint16_t *rs1, vuint8mf4_t rs2,
                                      size_t vl);
vuint16m1_t __riscv_vloxei8_v_u16m1(const uint16_t *rs1, vuint8mf2_t rs2,
                                    size_t vl);
vuint16m2_t __riscv_vloxei8_v_u16m2(const uint16_t *rs1, vuint8m1_t rs2,
                                    size_t vl);
vuint16m4_t __riscv_vloxei8_v_u16m4(const uint16_t *rs1, vuint8m2_t rs2,
                                    size_t vl);
vuint16m8_t __riscv_vloxei8_v_u16m8(const uint16_t *rs1, vuint8m4_t rs2,
                                    size_t vl);
vuint16mf4_t __riscv_vloxei16_v_u16mf4(const uint16_t *rs1, vuint16mf4_t rs2,
                                       size_t vl);
vuint16mf2_t __riscv_vloxei16_v_u16mf2(const uint16_t *rs1, vuint16mf2_t rs2,
                                       size_t vl);
vuint16m1_t __riscv_vloxei16_v_u16m1(const uint16_t *rs1, vuint16m1_t rs2,
                                     size_t vl);
vuint16m2_t __riscv_vloxei16_v_u16m2(const uint16_t *rs1, vuint16m2_t rs2,
                                     size_t vl);
vuint16m4_t __riscv_vloxei16_v_u16m4(const uint16_t *rs1, vuint16m4_t rs2,
                                     size_t vl);
vuint16m8_t __riscv_vloxei16_v_u16m8(const uint16_t *rs1, vuint16m8_t rs2,
                                     size_t vl);
vuint16mf4_t __riscv_vloxei32_v_u16mf4(const uint16_t *rs1, vuint32mf2_t rs2,
                                       size_t vl);
vuint16mf2_t __riscv_vloxei32_v_u16mf2(const uint16_t *rs1, vuint32m1_t rs2,
                                       size_t vl);
vuint16m1_t __riscv_vloxei32_v_u16m1(const uint16_t *rs1, vuint32m2_t rs2,
                                     size_t vl);
vuint16m2_t __riscv_vloxei32_v_u16m2(const uint16_t *rs1, vuint32m4_t rs2,
                                     size_t vl);
vuint16m4_t __riscv_vloxei32_v_u16m4(const uint16_t *rs1, vuint32m8_t rs2,
                                     size_t vl);
vuint16mf4_t __riscv_vloxei64_v_u16mf4(const uint16_t *rs1, vuint64m1_t rs2,
                                       size_t vl);
vuint16mf2_t __riscv_vloxei64_v_u16mf2(const uint16_t *rs1, vuint64m2_t rs2,
                                       size_t vl);
vuint16m1_t __riscv_vloxei64_v_u16m1(const uint16_t *rs1, vuint64m4_t rs2,
                                     size_t vl);
vuint16m2_t __riscv_vloxei64_v_u16m2(const uint16_t *rs1, vuint64m8_t rs2,
                                     size_t vl);
// vloxei{8,16,32,64} prototypes returning uint32_t element vectors
// (vuint32*_t); no mask operand.
// rs1: const uint32_t * base; rs2: unsigned index vector whose element width
// matches the eiNN suffix; vl: size_t.
// Index LMUL = result LMUL * (index width / 32), e.g. u32m1 pairs with
// vuint8mf4_t / vuint16mf2_t / vuint32m1_t / vuint64m2_t. Each eiNN list ends
// once either the result type or the index type reaches m8.
// NOTE(review): vloxei is the indexed-ordered load mnemonic in the RISC-V V
// spec; confirm exact semantics (e.g. index units) against the ISA manual.
vuint32mf2_t __riscv_vloxei8_v_u32mf2(const uint32_t *rs1, vuint8mf8_t rs2,
                                      size_t vl);
vuint32m1_t __riscv_vloxei8_v_u32m1(const uint32_t *rs1, vuint8mf4_t rs2,
                                    size_t vl);
vuint32m2_t __riscv_vloxei8_v_u32m2(const uint32_t *rs1, vuint8mf2_t rs2,
                                    size_t vl);
vuint32m4_t __riscv_vloxei8_v_u32m4(const uint32_t *rs1, vuint8m1_t rs2,
                                    size_t vl);
vuint32m8_t __riscv_vloxei8_v_u32m8(const uint32_t *rs1, vuint8m2_t rs2,
                                    size_t vl);
vuint32mf2_t __riscv_vloxei16_v_u32mf2(const uint32_t *rs1, vuint16mf4_t rs2,
                                       size_t vl);
vuint32m1_t __riscv_vloxei16_v_u32m1(const uint32_t *rs1, vuint16mf2_t rs2,
                                     size_t vl);
vuint32m2_t __riscv_vloxei16_v_u32m2(const uint32_t *rs1, vuint16m1_t rs2,
                                     size_t vl);
vuint32m4_t __riscv_vloxei16_v_u32m4(const uint32_t *rs1, vuint16m2_t rs2,
                                     size_t vl);
vuint32m8_t __riscv_vloxei16_v_u32m8(const uint32_t *rs1, vuint16m4_t rs2,
                                     size_t vl);
vuint32mf2_t __riscv_vloxei32_v_u32mf2(const uint32_t *rs1, vuint32mf2_t rs2,
                                       size_t vl);
vuint32m1_t __riscv_vloxei32_v_u32m1(const uint32_t *rs1, vuint32m1_t rs2,
                                     size_t vl);
vuint32m2_t __riscv_vloxei32_v_u32m2(const uint32_t *rs1, vuint32m2_t rs2,
                                     size_t vl);
vuint32m4_t __riscv_vloxei32_v_u32m4(const uint32_t *rs1, vuint32m4_t rs2,
                                     size_t vl);
vuint32m8_t __riscv_vloxei32_v_u32m8(const uint32_t *rs1, vuint32m8_t rs2,
                                     size_t vl);
vuint32mf2_t __riscv_vloxei64_v_u32mf2(const uint32_t *rs1, vuint64m1_t rs2,
                                       size_t vl);
vuint32m1_t __riscv_vloxei64_v_u32m1(const uint32_t *rs1, vuint64m2_t rs2,
                                     size_t vl);
vuint32m2_t __riscv_vloxei64_v_u32m2(const uint32_t *rs1, vuint64m4_t rs2,
                                     size_t vl);
vuint32m4_t __riscv_vloxei64_v_u32m4(const uint32_t *rs1, vuint64m8_t rs2,
                                     size_t vl);
// vloxei{8,16,32,64} prototypes returning uint64_t element vectors
// (vuint64*_t); no mask operand.
// rs1: const uint64_t * base; rs2: unsigned index vector whose element width
// matches the eiNN suffix; vl: size_t.
// Index LMUL = result LMUL * (index width / 64), e.g. u64m1 pairs with
// vuint8mf8_t / vuint16mf4_t / vuint32mf2_t / vuint64m1_t. All four eiNN
// lists cover result types m1 through m8.
// NOTE(review): vloxei is the indexed-ordered load mnemonic in the RISC-V V
// spec; confirm exact semantics (e.g. index units) against the ISA manual.
vuint64m1_t __riscv_vloxei8_v_u64m1(const uint64_t *rs1, vuint8mf8_t rs2,
                                    size_t vl);
vuint64m2_t __riscv_vloxei8_v_u64m2(const uint64_t *rs1, vuint8mf4_t rs2,
                                    size_t vl);
vuint64m4_t __riscv_vloxei8_v_u64m4(const uint64_t *rs1, vuint8mf2_t rs2,
                                    size_t vl);
vuint64m8_t __riscv_vloxei8_v_u64m8(const uint64_t *rs1, vuint8m1_t rs2,
                                    size_t vl);
vuint64m1_t __riscv_vloxei16_v_u64m1(const uint64_t *rs1, vuint16mf4_t rs2,
                                     size_t vl);
vuint64m2_t __riscv_vloxei16_v_u64m2(const uint64_t *rs1, vuint16mf2_t rs2,
                                     size_t vl);
vuint64m4_t __riscv_vloxei16_v_u64m4(const uint64_t *rs1, vuint16m1_t rs2,
                                     size_t vl);
vuint64m8_t __riscv_vloxei16_v_u64m8(const uint64_t *rs1, vuint16m2_t rs2,
                                     size_t vl);
vuint64m1_t __riscv_vloxei32_v_u64m1(const uint64_t *rs1, vuint32mf2_t rs2,
                                     size_t vl);
vuint64m2_t __riscv_vloxei32_v_u64m2(const uint64_t *rs1, vuint32m1_t rs2,
                                     size_t vl);
vuint64m4_t __riscv_vloxei32_v_u64m4(const uint64_t *rs1, vuint32m2_t rs2,
                                     size_t vl);
vuint64m8_t __riscv_vloxei32_v_u64m8(const uint64_t *rs1, vuint32m4_t rs2,
                                     size_t vl);
vuint64m1_t __riscv_vloxei64_v_u64m1(const uint64_t *rs1, vuint64m1_t rs2,
                                     size_t vl);
vuint64m2_t __riscv_vloxei64_v_u64m2(const uint64_t *rs1, vuint64m2_t rs2,
                                     size_t vl);
vuint64m4_t __riscv_vloxei64_v_u64m4(const uint64_t *rs1, vuint64m4_t rs2,
                                     size_t vl);
vuint64m8_t __riscv_vloxei64_v_u64m8(const uint64_t *rs1, vuint64m8_t rs2,
                                     size_t vl);
// vluxei{8,16,32,64} prototypes returning uint8_t element vectors
// (vuint8*_t); no mask operand.
// rs1: const uint8_t * base; rs2: unsigned index vector whose element width
// matches the eiNN suffix; vl: size_t.
// Index LMUL = result LMUL * (index width / 8), e.g. u8m1 pairs with
// vuint8m1_t / vuint16m2_t / vuint32m4_t / vuint64m8_t. Each eiNN list ends
// once either the result type or the index type reaches m8.
// NOTE(review): vluxei is the indexed-unordered load mnemonic in the RISC-V V
// spec; confirm exact semantics (e.g. index units) against the ISA manual.
vuint8mf8_t __riscv_vluxei8_v_u8mf8(const uint8_t *rs1, vuint8mf8_t rs2,
                                    size_t vl);
vuint8mf4_t __riscv_vluxei8_v_u8mf4(const uint8_t *rs1, vuint8mf4_t rs2,
                                    size_t vl);
vuint8mf2_t __riscv_vluxei8_v_u8mf2(const uint8_t *rs1, vuint8mf2_t rs2,
                                    size_t vl);
vuint8m1_t __riscv_vluxei8_v_u8m1(const uint8_t *rs1, vuint8m1_t rs2,
                                  size_t vl);
vuint8m2_t __riscv_vluxei8_v_u8m2(const uint8_t *rs1, vuint8m2_t rs2,
                                  size_t vl);
vuint8m4_t __riscv_vluxei8_v_u8m4(const uint8_t *rs1, vuint8m4_t rs2,
                                  size_t vl);
vuint8m8_t __riscv_vluxei8_v_u8m8(const uint8_t *rs1, vuint8m8_t rs2,
                                  size_t vl);
vuint8mf8_t __riscv_vluxei16_v_u8mf8(const uint8_t *rs1, vuint16mf4_t rs2,
                                     size_t vl);
vuint8mf4_t __riscv_vluxei16_v_u8mf4(const uint8_t *rs1, vuint16mf2_t rs2,
                                     size_t vl);
vuint8mf2_t __riscv_vluxei16_v_u8mf2(const uint8_t *rs1, vuint16m1_t rs2,
                                     size_t vl);
vuint8m1_t __riscv_vluxei16_v_u8m1(const uint8_t *rs1, vuint16m2_t rs2,
                                   size_t vl);
vuint8m2_t __riscv_vluxei16_v_u8m2(const uint8_t *rs1, vuint16m4_t rs2,
                                   size_t vl);
vuint8m4_t __riscv_vluxei16_v_u8m4(const uint8_t *rs1, vuint16m8_t rs2,
                                   size_t vl);
vuint8mf8_t __riscv_vluxei32_v_u8mf8(const uint8_t *rs1, vuint32mf2_t rs2,
                                     size_t vl);
vuint8mf4_t __riscv_vluxei32_v_u8mf4(const uint8_t *rs1, vuint32m1_t rs2,
                                     size_t vl);
vuint8mf2_t __riscv_vluxei32_v_u8mf2(const uint8_t *rs1, vuint32m2_t rs2,
                                     size_t vl);
vuint8m1_t __riscv_vluxei32_v_u8m1(const uint8_t *rs1, vuint32m4_t rs2,
                                   size_t vl);
vuint8m2_t __riscv_vluxei32_v_u8m2(const uint8_t *rs1, vuint32m8_t rs2,
                                   size_t vl);
vuint8mf8_t __riscv_vluxei64_v_u8mf8(const uint8_t *rs1, vuint64m1_t rs2,
                                     size_t vl);
vuint8mf4_t __riscv_vluxei64_v_u8mf4(const uint8_t *rs1, vuint64m2_t rs2,
                                     size_t vl);
vuint8mf2_t __riscv_vluxei64_v_u8mf2(const uint8_t *rs1, vuint64m4_t rs2,
                                     size_t vl);
vuint8m1_t __riscv_vluxei64_v_u8m1(const uint8_t *rs1, vuint64m8_t rs2,
                                   size_t vl);
// vluxei{8,16,32,64} prototypes returning uint16_t element vectors
// (vuint16*_t); no mask operand.
// rs1: const uint16_t * base; rs2: unsigned index vector whose element width
// matches the eiNN suffix; vl: size_t.
// Index LMUL = result LMUL * (index width / 16), e.g. u16m1 pairs with
// vuint8mf2_t / vuint16m1_t / vuint32m2_t / vuint64m4_t. Each eiNN list ends
// once either the result type or the index type reaches m8.
// NOTE(review): vluxei is the indexed-unordered load mnemonic in the RISC-V V
// spec; confirm exact semantics (e.g. index units) against the ISA manual.
vuint16mf4_t __riscv_vluxei8_v_u16mf4(const uint16_t *rs1, vuint8mf8_t rs2,
                                      size_t vl);
vuint16mf2_t __riscv_vluxei8_v_u16mf2(const uint16_t *rs1, vuint8mf4_t rs2,
                                      size_t vl);
vuint16m1_t __riscv_vluxei8_v_u16m1(const uint16_t *rs1, vuint8mf2_t rs2,
                                    size_t vl);
vuint16m2_t __riscv_vluxei8_v_u16m2(const uint16_t *rs1, vuint8m1_t rs2,
                                    size_t vl);
vuint16m4_t __riscv_vluxei8_v_u16m4(const uint16_t *rs1, vuint8m2_t rs2,
                                    size_t vl);
vuint16m8_t __riscv_vluxei8_v_u16m8(const uint16_t *rs1, vuint8m4_t rs2,
                                    size_t vl);
vuint16mf4_t __riscv_vluxei16_v_u16mf4(const uint16_t *rs1, vuint16mf4_t rs2,
                                       size_t vl);
vuint16mf2_t __riscv_vluxei16_v_u16mf2(const uint16_t *rs1, vuint16mf2_t rs2,
                                       size_t vl);
vuint16m1_t __riscv_vluxei16_v_u16m1(const uint16_t *rs1, vuint16m1_t rs2,
                                     size_t vl);
vuint16m2_t __riscv_vluxei16_v_u16m2(const uint16_t *rs1, vuint16m2_t rs2,
                                     size_t vl);
vuint16m4_t __riscv_vluxei16_v_u16m4(const uint16_t *rs1, vuint16m4_t rs2,
                                     size_t vl);
vuint16m8_t __riscv_vluxei16_v_u16m8(const uint16_t *rs1, vuint16m8_t rs2,
                                     size_t vl);
vuint16mf4_t __riscv_vluxei32_v_u16mf4(const uint16_t *rs1, vuint32mf2_t rs2,
                                       size_t vl);
vuint16mf2_t __riscv_vluxei32_v_u16mf2(const uint16_t *rs1, vuint32m1_t rs2,
                                       size_t vl);
vuint16m1_t __riscv_vluxei32_v_u16m1(const uint16_t *rs1, vuint32m2_t rs2,
                                     size_t vl);
vuint16m2_t __riscv_vluxei32_v_u16m2(const uint16_t *rs1, vuint32m4_t rs2,
                                     size_t vl);
vuint16m4_t __riscv_vluxei32_v_u16m4(const uint16_t *rs1, vuint32m8_t rs2,
                                     size_t vl);
vuint16mf4_t __riscv_vluxei64_v_u16mf4(const uint16_t *rs1, vuint64m1_t rs2,
                                       size_t vl);
vuint16mf2_t __riscv_vluxei64_v_u16mf2(const uint16_t *rs1, vuint64m2_t rs2,
                                       size_t vl);
vuint16m1_t __riscv_vluxei64_v_u16m1(const uint16_t *rs1, vuint64m4_t rs2,
                                     size_t vl);
vuint16m2_t __riscv_vluxei64_v_u16m2(const uint16_t *rs1, vuint64m8_t rs2,
                                     size_t vl);
// vluxei{8,16,32,64} prototypes returning uint32_t element vectors
// (vuint32*_t); no mask operand.
// rs1: const uint32_t * base; rs2: unsigned index vector whose element width
// matches the eiNN suffix; vl: size_t.
// Index LMUL = result LMUL * (index width / 32), e.g. u32m1 pairs with
// vuint8mf4_t / vuint16mf2_t / vuint32m1_t / vuint64m2_t. Each eiNN list ends
// once either the result type or the index type reaches m8.
// NOTE(review): vluxei is the indexed-unordered load mnemonic in the RISC-V V
// spec; confirm exact semantics (e.g. index units) against the ISA manual.
vuint32mf2_t __riscv_vluxei8_v_u32mf2(const uint32_t *rs1, vuint8mf8_t rs2,
                                      size_t vl);
vuint32m1_t __riscv_vluxei8_v_u32m1(const uint32_t *rs1, vuint8mf4_t rs2,
                                    size_t vl);
vuint32m2_t __riscv_vluxei8_v_u32m2(const uint32_t *rs1, vuint8mf2_t rs2,
                                    size_t vl);
vuint32m4_t __riscv_vluxei8_v_u32m4(const uint32_t *rs1, vuint8m1_t rs2,
                                    size_t vl);
vuint32m8_t __riscv_vluxei8_v_u32m8(const uint32_t *rs1, vuint8m2_t rs2,
                                    size_t vl);
vuint32mf2_t __riscv_vluxei16_v_u32mf2(const uint32_t *rs1, vuint16mf4_t rs2,
                                       size_t vl);
vuint32m1_t __riscv_vluxei16_v_u32m1(const uint32_t *rs1, vuint16mf2_t rs2,
                                     size_t vl);
vuint32m2_t __riscv_vluxei16_v_u32m2(const uint32_t *rs1, vuint16m1_t rs2,
                                     size_t vl);
vuint32m4_t __riscv_vluxei16_v_u32m4(const uint32_t *rs1, vuint16m2_t rs2,
                                     size_t vl);
vuint32m8_t __riscv_vluxei16_v_u32m8(const uint32_t *rs1, vuint16m4_t rs2,
                                     size_t vl);
vuint32mf2_t __riscv_vluxei32_v_u32mf2(const uint32_t *rs1, vuint32mf2_t rs2,
                                       size_t vl);
vuint32m1_t __riscv_vluxei32_v_u32m1(const uint32_t *rs1, vuint32m1_t rs2,
                                     size_t vl);
vuint32m2_t __riscv_vluxei32_v_u32m2(const uint32_t *rs1, vuint32m2_t rs2,
                                     size_t vl);
vuint32m4_t __riscv_vluxei32_v_u32m4(const uint32_t *rs1, vuint32m4_t rs2,
                                     size_t vl);
vuint32m8_t __riscv_vluxei32_v_u32m8(const uint32_t *rs1, vuint32m8_t rs2,
                                     size_t vl);
vuint32mf2_t __riscv_vluxei64_v_u32mf2(const uint32_t *rs1, vuint64m1_t rs2,
                                       size_t vl);
vuint32m1_t __riscv_vluxei64_v_u32m1(const uint32_t *rs1, vuint64m2_t rs2,
                                     size_t vl);
vuint32m2_t __riscv_vluxei64_v_u32m2(const uint32_t *rs1, vuint64m4_t rs2,
                                     size_t vl);
vuint32m4_t __riscv_vluxei64_v_u32m4(const uint32_t *rs1, vuint64m8_t rs2,
                                     size_t vl);
// vluxei{8,16,32,64} prototypes returning uint64_t element vectors
// (vuint64*_t); no mask operand.
// rs1: const uint64_t * base; rs2: unsigned index vector whose element width
// matches the eiNN suffix; vl: size_t.
// Index LMUL = result LMUL * (index width / 64), e.g. u64m1 pairs with
// vuint8mf8_t / vuint16mf4_t / vuint32mf2_t / vuint64m1_t. All four eiNN
// lists cover result types m1 through m8.
// NOTE(review): vluxei is the indexed-unordered load mnemonic in the RISC-V V
// spec; confirm exact semantics (e.g. index units) against the ISA manual.
vuint64m1_t __riscv_vluxei8_v_u64m1(const uint64_t *rs1, vuint8mf8_t rs2,
                                    size_t vl);
vuint64m2_t __riscv_vluxei8_v_u64m2(const uint64_t *rs1, vuint8mf4_t rs2,
                                    size_t vl);
vuint64m4_t __riscv_vluxei8_v_u64m4(const uint64_t *rs1, vuint8mf2_t rs2,
                                    size_t vl);
vuint64m8_t __riscv_vluxei8_v_u64m8(const uint64_t *rs1, vuint8m1_t rs2,
                                    size_t vl);
vuint64m1_t __riscv_vluxei16_v_u64m1(const uint64_t *rs1, vuint16mf4_t rs2,
                                     size_t vl);
vuint64m2_t __riscv_vluxei16_v_u64m2(const uint64_t *rs1, vuint16mf2_t rs2,
                                     size_t vl);
vuint64m4_t __riscv_vluxei16_v_u64m4(const uint64_t *rs1, vuint16m1_t rs2,
                                     size_t vl);
vuint64m8_t __riscv_vluxei16_v_u64m8(const uint64_t *rs1, vuint16m2_t rs2,
                                     size_t vl);
vuint64m1_t __riscv_vluxei32_v_u64m1(const uint64_t *rs1, vuint32mf2_t rs2,
                                     size_t vl);
vuint64m2_t __riscv_vluxei32_v_u64m2(const uint64_t *rs1, vuint32m1_t rs2,
                                     size_t vl);
vuint64m4_t __riscv_vluxei32_v_u64m4(const uint64_t *rs1, vuint32m2_t rs2,
                                     size_t vl);
vuint64m8_t __riscv_vluxei32_v_u64m8(const uint64_t *rs1, vuint32m4_t rs2,
                                     size_t vl);
vuint64m1_t __riscv_vluxei64_v_u64m1(const uint64_t *rs1, vuint64m1_t rs2,
                                     size_t vl);
vuint64m2_t __riscv_vluxei64_v_u64m2(const uint64_t *rs1, vuint64m2_t rs2,
                                     size_t vl);
vuint64m4_t __riscv_vluxei64_v_u64m4(const uint64_t *rs1, vuint64m4_t rs2,
                                     size_t vl);
vuint64m8_t __riscv_vluxei64_v_u64m8(const uint64_t *rs1, vuint64m8_t rs2,
                                     size_t vl);
// masked functions
// Masked __riscv_vloxei{8,16,32,64}_v_f16*_m prototypes (_Float16 elements).
// Parameters: vm is the vbool*_t mask, rs1 the const _Float16 base pointer,
// rs2 an unsigned index vector whose element width is the number after "ei",
// and vl a size_t. The return type is the vfloat16 type named in the suffix.
// Listed variants: ei8 and ei16 cover f16mf4..f16m8, ei32 stops at f16m4
// (vuint32m8_t index) and ei64 stops at f16m2 (vuint64m8_t index).
// NOTE(review): "vloxei" matches the RVV indexed-ordered load mnemonic, and
// no passthrough operand appears here; confirm ordering and inactive-element
// behaviour against the intrinsics spec.
vfloat16mf4_t __riscv_vloxei8_v_f16mf4_m(vbool64_t vm, const _Float16 *rs1,
                                         vuint8mf8_t rs2, size_t vl);
vfloat16mf2_t __riscv_vloxei8_v_f16mf2_m(vbool32_t vm, const _Float16 *rs1,
                                         vuint8mf4_t rs2, size_t vl);
vfloat16m1_t __riscv_vloxei8_v_f16m1_m(vbool16_t vm, const _Float16 *rs1,
                                       vuint8mf2_t rs2, size_t vl);
vfloat16m2_t __riscv_vloxei8_v_f16m2_m(vbool8_t vm, const _Float16 *rs1,
                                       vuint8m1_t rs2, size_t vl);
vfloat16m4_t __riscv_vloxei8_v_f16m4_m(vbool4_t vm, const _Float16 *rs1,
                                       vuint8m2_t rs2, size_t vl);
vfloat16m8_t __riscv_vloxei8_v_f16m8_m(vbool2_t vm, const _Float16 *rs1,
                                       vuint8m4_t rs2, size_t vl);
vfloat16mf4_t __riscv_vloxei16_v_f16mf4_m(vbool64_t vm, const _Float16 *rs1,
                                          vuint16mf4_t rs2, size_t vl);
vfloat16mf2_t __riscv_vloxei16_v_f16mf2_m(vbool32_t vm, const _Float16 *rs1,
                                          vuint16mf2_t rs2, size_t vl);
vfloat16m1_t __riscv_vloxei16_v_f16m1_m(vbool16_t vm, const _Float16 *rs1,
                                        vuint16m1_t rs2, size_t vl);
vfloat16m2_t __riscv_vloxei16_v_f16m2_m(vbool8_t vm, const _Float16 *rs1,
                                        vuint16m2_t rs2, size_t vl);
vfloat16m4_t __riscv_vloxei16_v_f16m4_m(vbool4_t vm, const _Float16 *rs1,
                                        vuint16m4_t rs2, size_t vl);
vfloat16m8_t __riscv_vloxei16_v_f16m8_m(vbool2_t vm, const _Float16 *rs1,
                                        vuint16m8_t rs2, size_t vl);
vfloat16mf4_t __riscv_vloxei32_v_f16mf4_m(vbool64_t vm, const _Float16 *rs1,
                                          vuint32mf2_t rs2, size_t vl);
vfloat16mf2_t __riscv_vloxei32_v_f16mf2_m(vbool32_t vm, const _Float16 *rs1,
                                          vuint32m1_t rs2, size_t vl);
vfloat16m1_t __riscv_vloxei32_v_f16m1_m(vbool16_t vm, const _Float16 *rs1,
                                        vuint32m2_t rs2, size_t vl);
vfloat16m2_t __riscv_vloxei32_v_f16m2_m(vbool8_t vm, const _Float16 *rs1,
                                        vuint32m4_t rs2, size_t vl);
vfloat16m4_t __riscv_vloxei32_v_f16m4_m(vbool4_t vm, const _Float16 *rs1,
                                        vuint32m8_t rs2, size_t vl);
vfloat16mf4_t __riscv_vloxei64_v_f16mf4_m(vbool64_t vm, const _Float16 *rs1,
                                          vuint64m1_t rs2, size_t vl);
vfloat16mf2_t __riscv_vloxei64_v_f16mf2_m(vbool32_t vm, const _Float16 *rs1,
                                          vuint64m2_t rs2, size_t vl);
vfloat16m1_t __riscv_vloxei64_v_f16m1_m(vbool16_t vm, const _Float16 *rs1,
                                        vuint64m4_t rs2, size_t vl);
vfloat16m2_t __riscv_vloxei64_v_f16m2_m(vbool8_t vm, const _Float16 *rs1,
                                        vuint64m8_t rs2, size_t vl);
// Masked __riscv_vloxei{8,16,32,64}_v_f32*_m prototypes (float elements).
// Parameters: vm is the vbool*_t mask, rs1 the const float base pointer,
// rs2 an unsigned index vector whose element width is the number after "ei",
// and vl a size_t. The return type is the vfloat32 type named in the suffix.
// Listed variants: ei8, ei16 and ei32 cover f32mf2..f32m8; ei64 stops at
// f32m4 (vuint64m8_t index).
// NOTE(review): "vloxei" matches the RVV indexed-ordered load mnemonic;
// confirm ordering and inactive-element behaviour against the spec.
vfloat32mf2_t __riscv_vloxei8_v_f32mf2_m(vbool64_t vm, const float *rs1,
                                         vuint8mf8_t rs2, size_t vl);
vfloat32m1_t __riscv_vloxei8_v_f32m1_m(vbool32_t vm, const float *rs1,
                                       vuint8mf4_t rs2, size_t vl);
vfloat32m2_t __riscv_vloxei8_v_f32m2_m(vbool16_t vm, const float *rs1,
                                       vuint8mf2_t rs2, size_t vl);
vfloat32m4_t __riscv_vloxei8_v_f32m4_m(vbool8_t vm, const float *rs1,
                                       vuint8m1_t rs2, size_t vl);
vfloat32m8_t __riscv_vloxei8_v_f32m8_m(vbool4_t vm, const float *rs1,
                                       vuint8m2_t rs2, size_t vl);
vfloat32mf2_t __riscv_vloxei16_v_f32mf2_m(vbool64_t vm, const float *rs1,
                                          vuint16mf4_t rs2, size_t vl);
vfloat32m1_t __riscv_vloxei16_v_f32m1_m(vbool32_t vm, const float *rs1,
                                        vuint16mf2_t rs2, size_t vl);
vfloat32m2_t __riscv_vloxei16_v_f32m2_m(vbool16_t vm, const float *rs1,
                                        vuint16m1_t rs2, size_t vl);
vfloat32m4_t __riscv_vloxei16_v_f32m4_m(vbool8_t vm, const float *rs1,
                                        vuint16m2_t rs2, size_t vl);
vfloat32m8_t __riscv_vloxei16_v_f32m8_m(vbool4_t vm, const float *rs1,
                                        vuint16m4_t rs2, size_t vl);
vfloat32mf2_t __riscv_vloxei32_v_f32mf2_m(vbool64_t vm, const float *rs1,
                                          vuint32mf2_t rs2, size_t vl);
vfloat32m1_t __riscv_vloxei32_v_f32m1_m(vbool32_t vm, const float *rs1,
                                        vuint32m1_t rs2, size_t vl);
vfloat32m2_t __riscv_vloxei32_v_f32m2_m(vbool16_t vm, const float *rs1,
                                        vuint32m2_t rs2, size_t vl);
vfloat32m4_t __riscv_vloxei32_v_f32m4_m(vbool8_t vm, const float *rs1,
                                        vuint32m4_t rs2, size_t vl);
vfloat32m8_t __riscv_vloxei32_v_f32m8_m(vbool4_t vm, const float *rs1,
                                        vuint32m8_t rs2, size_t vl);
vfloat32mf2_t __riscv_vloxei64_v_f32mf2_m(vbool64_t vm, const float *rs1,
                                          vuint64m1_t rs2, size_t vl);
vfloat32m1_t __riscv_vloxei64_v_f32m1_m(vbool32_t vm, const float *rs1,
                                        vuint64m2_t rs2, size_t vl);
vfloat32m2_t __riscv_vloxei64_v_f32m2_m(vbool16_t vm, const float *rs1,
                                        vuint64m4_t rs2, size_t vl);
vfloat32m4_t __riscv_vloxei64_v_f32m4_m(vbool8_t vm, const float *rs1,
                                        vuint64m8_t rs2, size_t vl);
// Masked __riscv_vloxei{8,16,32,64}_v_f64m{1,2,4,8}_m prototypes (double
// elements).
// Parameters: vm is the vbool*_t mask, rs1 the const double base pointer,
// rs2 an unsigned index vector whose element width is the number after "ei",
// and vl a size_t. The return type is the vfloat64 type named in the suffix.
// All four index widths are listed for every f64 variant from m1 to m8.
// NOTE(review): "vloxei" matches the RVV indexed-ordered load mnemonic;
// confirm ordering and inactive-element behaviour against the spec.
vfloat64m1_t __riscv_vloxei8_v_f64m1_m(vbool64_t vm, const double *rs1,
                                       vuint8mf8_t rs2, size_t vl);
vfloat64m2_t __riscv_vloxei8_v_f64m2_m(vbool32_t vm, const double *rs1,
                                       vuint8mf4_t rs2, size_t vl);
vfloat64m4_t __riscv_vloxei8_v_f64m4_m(vbool16_t vm, const double *rs1,
                                       vuint8mf2_t rs2, size_t vl);
vfloat64m8_t __riscv_vloxei8_v_f64m8_m(vbool8_t vm, const double *rs1,
                                       vuint8m1_t rs2, size_t vl);
vfloat64m1_t __riscv_vloxei16_v_f64m1_m(vbool64_t vm, const double *rs1,
                                        vuint16mf4_t rs2, size_t vl);
vfloat64m2_t __riscv_vloxei16_v_f64m2_m(vbool32_t vm, const double *rs1,
                                        vuint16mf2_t rs2, size_t vl);
vfloat64m4_t __riscv_vloxei16_v_f64m4_m(vbool16_t vm, const double *rs1,
                                        vuint16m1_t rs2, size_t vl);
vfloat64m8_t __riscv_vloxei16_v_f64m8_m(vbool8_t vm, const double *rs1,
                                        vuint16m2_t rs2, size_t vl);
vfloat64m1_t __riscv_vloxei32_v_f64m1_m(vbool64_t vm, const double *rs1,
                                        vuint32mf2_t rs2, size_t vl);
vfloat64m2_t __riscv_vloxei32_v_f64m2_m(vbool32_t vm, const double *rs1,
                                        vuint32m1_t rs2, size_t vl);
vfloat64m4_t __riscv_vloxei32_v_f64m4_m(vbool16_t vm, const double *rs1,
                                        vuint32m2_t rs2, size_t vl);
vfloat64m8_t __riscv_vloxei32_v_f64m8_m(vbool8_t vm, const double *rs1,
                                        vuint32m4_t rs2, size_t vl);
vfloat64m1_t __riscv_vloxei64_v_f64m1_m(vbool64_t vm, const double *rs1,
                                        vuint64m1_t rs2, size_t vl);
vfloat64m2_t __riscv_vloxei64_v_f64m2_m(vbool32_t vm, const double *rs1,
                                        vuint64m2_t rs2, size_t vl);
vfloat64m4_t __riscv_vloxei64_v_f64m4_m(vbool16_t vm, const double *rs1,
                                        vuint64m4_t rs2, size_t vl);
vfloat64m8_t __riscv_vloxei64_v_f64m8_m(vbool8_t vm, const double *rs1,
                                        vuint64m8_t rs2, size_t vl);
// Masked __riscv_vluxei{8,16,32,64}_v_f16*_m prototypes (_Float16 elements).
// Parameters: vm is the vbool*_t mask, rs1 the const _Float16 base pointer,
// rs2 an unsigned index vector whose element width is the number after "ei",
// and vl a size_t. The return type is the vfloat16 type named in the suffix.
// Listed variants: ei8 and ei16 cover f16mf4..f16m8, ei32 stops at f16m4
// (vuint32m8_t index) and ei64 stops at f16m2 (vuint64m8_t index).
// NOTE(review): "vluxei" matches the RVV indexed-unordered load mnemonic, and
// no passthrough operand appears here; confirm inactive-element behaviour
// against the intrinsics spec.
vfloat16mf4_t __riscv_vluxei8_v_f16mf4_m(vbool64_t vm, const _Float16 *rs1,
                                         vuint8mf8_t rs2, size_t vl);
vfloat16mf2_t __riscv_vluxei8_v_f16mf2_m(vbool32_t vm, const _Float16 *rs1,
                                         vuint8mf4_t rs2, size_t vl);
vfloat16m1_t __riscv_vluxei8_v_f16m1_m(vbool16_t vm, const _Float16 *rs1,
                                       vuint8mf2_t rs2, size_t vl);
vfloat16m2_t __riscv_vluxei8_v_f16m2_m(vbool8_t vm, const _Float16 *rs1,
                                       vuint8m1_t rs2, size_t vl);
vfloat16m4_t __riscv_vluxei8_v_f16m4_m(vbool4_t vm, const _Float16 *rs1,
                                       vuint8m2_t rs2, size_t vl);
vfloat16m8_t __riscv_vluxei8_v_f16m8_m(vbool2_t vm, const _Float16 *rs1,
                                       vuint8m4_t rs2, size_t vl);
vfloat16mf4_t __riscv_vluxei16_v_f16mf4_m(vbool64_t vm, const _Float16 *rs1,
                                          vuint16mf4_t rs2, size_t vl);
vfloat16mf2_t __riscv_vluxei16_v_f16mf2_m(vbool32_t vm, const _Float16 *rs1,
                                          vuint16mf2_t rs2, size_t vl);
vfloat16m1_t __riscv_vluxei16_v_f16m1_m(vbool16_t vm, const _Float16 *rs1,
                                        vuint16m1_t rs2, size_t vl);
vfloat16m2_t __riscv_vluxei16_v_f16m2_m(vbool8_t vm, const _Float16 *rs1,
                                        vuint16m2_t rs2, size_t vl);
vfloat16m4_t __riscv_vluxei16_v_f16m4_m(vbool4_t vm, const _Float16 *rs1,
                                        vuint16m4_t rs2, size_t vl);
vfloat16m8_t __riscv_vluxei16_v_f16m8_m(vbool2_t vm, const _Float16 *rs1,
                                        vuint16m8_t rs2, size_t vl);
vfloat16mf4_t __riscv_vluxei32_v_f16mf4_m(vbool64_t vm, const _Float16 *rs1,
                                          vuint32mf2_t rs2, size_t vl);
vfloat16mf2_t __riscv_vluxei32_v_f16mf2_m(vbool32_t vm, const _Float16 *rs1,
                                          vuint32m1_t rs2, size_t vl);
vfloat16m1_t __riscv_vluxei32_v_f16m1_m(vbool16_t vm, const _Float16 *rs1,
                                        vuint32m2_t rs2, size_t vl);
vfloat16m2_t __riscv_vluxei32_v_f16m2_m(vbool8_t vm, const _Float16 *rs1,
                                        vuint32m4_t rs2, size_t vl);
vfloat16m4_t __riscv_vluxei32_v_f16m4_m(vbool4_t vm, const _Float16 *rs1,
                                        vuint32m8_t rs2, size_t vl);
vfloat16mf4_t __riscv_vluxei64_v_f16mf4_m(vbool64_t vm, const _Float16 *rs1,
                                          vuint64m1_t rs2, size_t vl);
vfloat16mf2_t __riscv_vluxei64_v_f16mf2_m(vbool32_t vm, const _Float16 *rs1,
                                          vuint64m2_t rs2, size_t vl);
vfloat16m1_t __riscv_vluxei64_v_f16m1_m(vbool16_t vm, const _Float16 *rs1,
                                        vuint64m4_t rs2, size_t vl);
vfloat16m2_t __riscv_vluxei64_v_f16m2_m(vbool8_t vm, const _Float16 *rs1,
                                        vuint64m8_t rs2, size_t vl);
// Masked __riscv_vluxei{8,16,32,64}_v_f32*_m prototypes (float elements).
// Parameters: vm is the vbool*_t mask, rs1 the const float base pointer,
// rs2 an unsigned index vector whose element width is the number after "ei",
// and vl a size_t. The return type is the vfloat32 type named in the suffix.
// Listed variants: ei8, ei16 and ei32 cover f32mf2..f32m8; ei64 stops at
// f32m4 (vuint64m8_t index).
// NOTE(review): "vluxei" matches the RVV indexed-unordered load mnemonic;
// confirm inactive-element behaviour against the intrinsics spec.
vfloat32mf2_t __riscv_vluxei8_v_f32mf2_m(vbool64_t vm, const float *rs1,
                                         vuint8mf8_t rs2, size_t vl);
vfloat32m1_t __riscv_vluxei8_v_f32m1_m(vbool32_t vm, const float *rs1,
                                       vuint8mf4_t rs2, size_t vl);
vfloat32m2_t __riscv_vluxei8_v_f32m2_m(vbool16_t vm, const float *rs1,
                                       vuint8mf2_t rs2, size_t vl);
vfloat32m4_t __riscv_vluxei8_v_f32m4_m(vbool8_t vm, const float *rs1,
                                       vuint8m1_t rs2, size_t vl);
vfloat32m8_t __riscv_vluxei8_v_f32m8_m(vbool4_t vm, const float *rs1,
                                       vuint8m2_t rs2, size_t vl);
vfloat32mf2_t __riscv_vluxei16_v_f32mf2_m(vbool64_t vm, const float *rs1,
                                          vuint16mf4_t rs2, size_t vl);
vfloat32m1_t __riscv_vluxei16_v_f32m1_m(vbool32_t vm, const float *rs1,
                                        vuint16mf2_t rs2, size_t vl);
vfloat32m2_t __riscv_vluxei16_v_f32m2_m(vbool16_t vm, const float *rs1,
                                        vuint16m1_t rs2, size_t vl);
vfloat32m4_t __riscv_vluxei16_v_f32m4_m(vbool8_t vm, const float *rs1,
                                        vuint16m2_t rs2, size_t vl);
vfloat32m8_t __riscv_vluxei16_v_f32m8_m(vbool4_t vm, const float *rs1,
                                        vuint16m4_t rs2, size_t vl);
vfloat32mf2_t __riscv_vluxei32_v_f32mf2_m(vbool64_t vm, const float *rs1,
                                          vuint32mf2_t rs2, size_t vl);
vfloat32m1_t __riscv_vluxei32_v_f32m1_m(vbool32_t vm, const float *rs1,
                                        vuint32m1_t rs2, size_t vl);
vfloat32m2_t __riscv_vluxei32_v_f32m2_m(vbool16_t vm, const float *rs1,
                                        vuint32m2_t rs2, size_t vl);
vfloat32m4_t __riscv_vluxei32_v_f32m4_m(vbool8_t vm, const float *rs1,
                                        vuint32m4_t rs2, size_t vl);
vfloat32m8_t __riscv_vluxei32_v_f32m8_m(vbool4_t vm, const float *rs1,
                                        vuint32m8_t rs2, size_t vl);
vfloat32mf2_t __riscv_vluxei64_v_f32mf2_m(vbool64_t vm, const float *rs1,
                                          vuint64m1_t rs2, size_t vl);
vfloat32m1_t __riscv_vluxei64_v_f32m1_m(vbool32_t vm, const float *rs1,
                                        vuint64m2_t rs2, size_t vl);
vfloat32m2_t __riscv_vluxei64_v_f32m2_m(vbool16_t vm, const float *rs1,
                                        vuint64m4_t rs2, size_t vl);
vfloat32m4_t __riscv_vluxei64_v_f32m4_m(vbool8_t vm, const float *rs1,
                                        vuint64m8_t rs2, size_t vl);
// Masked __riscv_vluxei{8,16,32,64}_v_f64m{1,2,4,8}_m prototypes (double
// elements).
// Parameters: vm is the vbool*_t mask, rs1 the const double base pointer,
// rs2 an unsigned index vector whose element width is the number after "ei",
// and vl a size_t. The return type is the vfloat64 type named in the suffix.
// All four index widths are listed for every f64 variant from m1 to m8.
// NOTE(review): "vluxei" matches the RVV indexed-unordered load mnemonic;
// confirm inactive-element behaviour against the intrinsics spec.
vfloat64m1_t __riscv_vluxei8_v_f64m1_m(vbool64_t vm, const double *rs1,
                                       vuint8mf8_t rs2, size_t vl);
vfloat64m2_t __riscv_vluxei8_v_f64m2_m(vbool32_t vm, const double *rs1,
                                       vuint8mf4_t rs2, size_t vl);
vfloat64m4_t __riscv_vluxei8_v_f64m4_m(vbool16_t vm, const double *rs1,
                                       vuint8mf2_t rs2, size_t vl);
vfloat64m8_t __riscv_vluxei8_v_f64m8_m(vbool8_t vm, const double *rs1,
                                       vuint8m1_t rs2, size_t vl);
vfloat64m1_t __riscv_vluxei16_v_f64m1_m(vbool64_t vm, const double *rs1,
                                        vuint16mf4_t rs2, size_t vl);
vfloat64m2_t __riscv_vluxei16_v_f64m2_m(vbool32_t vm, const double *rs1,
                                        vuint16mf2_t rs2, size_t vl);
vfloat64m4_t __riscv_vluxei16_v_f64m4_m(vbool16_t vm, const double *rs1,
                                        vuint16m1_t rs2, size_t vl);
vfloat64m8_t __riscv_vluxei16_v_f64m8_m(vbool8_t vm, const double *rs1,
                                        vuint16m2_t rs2, size_t vl);
vfloat64m1_t __riscv_vluxei32_v_f64m1_m(vbool64_t vm, const double *rs1,
                                        vuint32mf2_t rs2, size_t vl);
vfloat64m2_t __riscv_vluxei32_v_f64m2_m(vbool32_t vm, const double *rs1,
                                        vuint32m1_t rs2, size_t vl);
vfloat64m4_t __riscv_vluxei32_v_f64m4_m(vbool16_t vm, const double *rs1,
                                        vuint32m2_t rs2, size_t vl);
vfloat64m8_t __riscv_vluxei32_v_f64m8_m(vbool8_t vm, const double *rs1,
                                        vuint32m4_t rs2, size_t vl);
vfloat64m1_t __riscv_vluxei64_v_f64m1_m(vbool64_t vm, const double *rs1,
                                        vuint64m1_t rs2, size_t vl);
vfloat64m2_t __riscv_vluxei64_v_f64m2_m(vbool32_t vm, const double *rs1,
                                        vuint64m2_t rs2, size_t vl);
vfloat64m4_t __riscv_vluxei64_v_f64m4_m(vbool16_t vm, const double *rs1,
                                        vuint64m4_t rs2, size_t vl);
vfloat64m8_t __riscv_vluxei64_v_f64m8_m(vbool8_t vm, const double *rs1,
                                        vuint64m8_t rs2, size_t vl);
// Masked __riscv_vloxei{8,16,32,64}_v_i8*_m prototypes (int8_t elements).
// Parameters: vm is the vbool*_t mask, rs1 the const int8_t base pointer,
// rs2 an unsigned index vector whose element width is the number after "ei",
// and vl a size_t. The return type is the vint8 type named in the suffix.
// Listed variants: ei8 covers i8mf8..i8m8, ei16 stops at i8m4 (vuint16m8_t
// index), ei32 at i8m2 (vuint32m8_t index) and ei64 at i8m1 (vuint64m8_t
// index).
// NOTE(review): "vloxei" matches the RVV indexed-ordered load mnemonic;
// confirm ordering and inactive-element behaviour against the spec.
vint8mf8_t __riscv_vloxei8_v_i8mf8_m(vbool64_t vm, const int8_t *rs1,
                                     vuint8mf8_t rs2, size_t vl);
vint8mf4_t __riscv_vloxei8_v_i8mf4_m(vbool32_t vm, const int8_t *rs1,
                                     vuint8mf4_t rs2, size_t vl);
vint8mf2_t __riscv_vloxei8_v_i8mf2_m(vbool16_t vm, const int8_t *rs1,
                                     vuint8mf2_t rs2, size_t vl);
vint8m1_t __riscv_vloxei8_v_i8m1_m(vbool8_t vm, const int8_t *rs1,
                                   vuint8m1_t rs2, size_t vl);
vint8m2_t __riscv_vloxei8_v_i8m2_m(vbool4_t vm, const int8_t *rs1,
                                   vuint8m2_t rs2, size_t vl);
vint8m4_t __riscv_vloxei8_v_i8m4_m(vbool2_t vm, const int8_t *rs1,
                                   vuint8m4_t rs2, size_t vl);
vint8m8_t __riscv_vloxei8_v_i8m8_m(vbool1_t vm, const int8_t *rs1,
                                   vuint8m8_t rs2, size_t vl);
vint8mf8_t __riscv_vloxei16_v_i8mf8_m(vbool64_t vm, const int8_t *rs1,
                                      vuint16mf4_t rs2, size_t vl);
vint8mf4_t __riscv_vloxei16_v_i8mf4_m(vbool32_t vm, const int8_t *rs1,
                                      vuint16mf2_t rs2, size_t vl);
vint8mf2_t __riscv_vloxei16_v_i8mf2_m(vbool16_t vm, const int8_t *rs1,
                                      vuint16m1_t rs2, size_t vl);
vint8m1_t __riscv_vloxei16_v_i8m1_m(vbool8_t vm, const int8_t *rs1,
                                    vuint16m2_t rs2, size_t vl);
vint8m2_t __riscv_vloxei16_v_i8m2_m(vbool4_t vm, const int8_t *rs1,
                                    vuint16m4_t rs2, size_t vl);
vint8m4_t __riscv_vloxei16_v_i8m4_m(vbool2_t vm, const int8_t *rs1,
                                    vuint16m8_t rs2, size_t vl);
vint8mf8_t __riscv_vloxei32_v_i8mf8_m(vbool64_t vm, const int8_t *rs1,
                                      vuint32mf2_t rs2, size_t vl);
vint8mf4_t __riscv_vloxei32_v_i8mf4_m(vbool32_t vm, const int8_t *rs1,
                                      vuint32m1_t rs2, size_t vl);
vint8mf2_t __riscv_vloxei32_v_i8mf2_m(vbool16_t vm, const int8_t *rs1,
                                      vuint32m2_t rs2, size_t vl);
vint8m1_t __riscv_vloxei32_v_i8m1_m(vbool8_t vm, const int8_t *rs1,
                                    vuint32m4_t rs2, size_t vl);
vint8m2_t __riscv_vloxei32_v_i8m2_m(vbool4_t vm, const int8_t *rs1,
                                    vuint32m8_t rs2, size_t vl);
vint8mf8_t __riscv_vloxei64_v_i8mf8_m(vbool64_t vm, const int8_t *rs1,
                                      vuint64m1_t rs2, size_t vl);
vint8mf4_t __riscv_vloxei64_v_i8mf4_m(vbool32_t vm, const int8_t *rs1,
                                      vuint64m2_t rs2, size_t vl);
vint8mf2_t __riscv_vloxei64_v_i8mf2_m(vbool16_t vm, const int8_t *rs1,
                                      vuint64m4_t rs2, size_t vl);
vint8m1_t __riscv_vloxei64_v_i8m1_m(vbool8_t vm, const int8_t *rs1,
                                    vuint64m8_t rs2, size_t vl);
// Masked __riscv_vloxei{8,16,32,64}_v_i16*_m prototypes (int16_t elements).
// Parameters: vm is the vbool*_t mask, rs1 the const int16_t base pointer,
// rs2 an unsigned index vector whose element width is the number after "ei",
// and vl a size_t. The return type is the vint16 type named in the suffix.
// Listed variants: ei8 and ei16 cover i16mf4..i16m8, ei32 stops at i16m4
// (vuint32m8_t index) and ei64 stops at i16m2 (vuint64m8_t index).
// NOTE(review): "vloxei" matches the RVV indexed-ordered load mnemonic;
// confirm ordering and inactive-element behaviour against the spec.
vint16mf4_t __riscv_vloxei8_v_i16mf4_m(vbool64_t vm, const int16_t *rs1,
                                       vuint8mf8_t rs2, size_t vl);
vint16mf2_t __riscv_vloxei8_v_i16mf2_m(vbool32_t vm, const int16_t *rs1,
                                       vuint8mf4_t rs2, size_t vl);
vint16m1_t __riscv_vloxei8_v_i16m1_m(vbool16_t vm, const int16_t *rs1,
                                     vuint8mf2_t rs2, size_t vl);
vint16m2_t __riscv_vloxei8_v_i16m2_m(vbool8_t vm, const int16_t *rs1,
                                     vuint8m1_t rs2, size_t vl);
vint16m4_t __riscv_vloxei8_v_i16m4_m(vbool4_t vm, const int16_t *rs1,
                                     vuint8m2_t rs2, size_t vl);
vint16m8_t __riscv_vloxei8_v_i16m8_m(vbool2_t vm, const int16_t *rs1,
                                     vuint8m4_t rs2, size_t vl);
vint16mf4_t __riscv_vloxei16_v_i16mf4_m(vbool64_t vm, const int16_t *rs1,
                                        vuint16mf4_t rs2, size_t vl);
vint16mf2_t __riscv_vloxei16_v_i16mf2_m(vbool32_t vm, const int16_t *rs1,
                                        vuint16mf2_t rs2, size_t vl);
vint16m1_t __riscv_vloxei16_v_i16m1_m(vbool16_t vm, const int16_t *rs1,
                                      vuint16m1_t rs2, size_t vl);
vint16m2_t __riscv_vloxei16_v_i16m2_m(vbool8_t vm, const int16_t *rs1,
                                      vuint16m2_t rs2, size_t vl);
vint16m4_t __riscv_vloxei16_v_i16m4_m(vbool4_t vm, const int16_t *rs1,
                                      vuint16m4_t rs2, size_t vl);
vint16m8_t __riscv_vloxei16_v_i16m8_m(vbool2_t vm, const int16_t *rs1,
                                      vuint16m8_t rs2, size_t vl);
vint16mf4_t __riscv_vloxei32_v_i16mf4_m(vbool64_t vm, const int16_t *rs1,
                                        vuint32mf2_t rs2, size_t vl);
vint16mf2_t __riscv_vloxei32_v_i16mf2_m(vbool32_t vm, const int16_t *rs1,
                                        vuint32m1_t rs2, size_t vl);
vint16m1_t __riscv_vloxei32_v_i16m1_m(vbool16_t vm, const int16_t *rs1,
                                      vuint32m2_t rs2, size_t vl);
vint16m2_t __riscv_vloxei32_v_i16m2_m(vbool8_t vm, const int16_t *rs1,
                                      vuint32m4_t rs2, size_t vl);
vint16m4_t __riscv_vloxei32_v_i16m4_m(vbool4_t vm, const int16_t *rs1,
                                      vuint32m8_t rs2, size_t vl);
vint16mf4_t __riscv_vloxei64_v_i16mf4_m(vbool64_t vm, const int16_t *rs1,
                                        vuint64m1_t rs2, size_t vl);
vint16mf2_t __riscv_vloxei64_v_i16mf2_m(vbool32_t vm, const int16_t *rs1,
                                        vuint64m2_t rs2, size_t vl);
vint16m1_t __riscv_vloxei64_v_i16m1_m(vbool16_t vm, const int16_t *rs1,
                                      vuint64m4_t rs2, size_t vl);
vint16m2_t __riscv_vloxei64_v_i16m2_m(vbool8_t vm, const int16_t *rs1,
                                      vuint64m8_t rs2, size_t vl);
// Masked __riscv_vloxei{8,16,32,64}_v_i32*_m prototypes (int32_t elements).
// Parameters: vm is the vbool*_t mask, rs1 the const int32_t base pointer,
// rs2 an unsigned index vector whose element width is the number after "ei",
// and vl a size_t. The return type is the vint32 type named in the suffix.
// Listed variants: ei8, ei16 and ei32 cover i32mf2..i32m8; ei64 stops at
// i32m4 (vuint64m8_t index).
// NOTE(review): "vloxei" matches the RVV indexed-ordered load mnemonic;
// confirm ordering and inactive-element behaviour against the spec.
vint32mf2_t __riscv_vloxei8_v_i32mf2_m(vbool64_t vm, const int32_t *rs1,
                                       vuint8mf8_t rs2, size_t vl);
vint32m1_t __riscv_vloxei8_v_i32m1_m(vbool32_t vm, const int32_t *rs1,
                                     vuint8mf4_t rs2, size_t vl);
vint32m2_t __riscv_vloxei8_v_i32m2_m(vbool16_t vm, const int32_t *rs1,
                                     vuint8mf2_t rs2, size_t vl);
vint32m4_t __riscv_vloxei8_v_i32m4_m(vbool8_t vm, const int32_t *rs1,
                                     vuint8m1_t rs2, size_t vl);
vint32m8_t __riscv_vloxei8_v_i32m8_m(vbool4_t vm, const int32_t *rs1,
                                     vuint8m2_t rs2, size_t vl);
vint32mf2_t __riscv_vloxei16_v_i32mf2_m(vbool64_t vm, const int32_t *rs1,
                                        vuint16mf4_t rs2, size_t vl);
vint32m1_t __riscv_vloxei16_v_i32m1_m(vbool32_t vm, const int32_t *rs1,
                                      vuint16mf2_t rs2, size_t vl);
vint32m2_t __riscv_vloxei16_v_i32m2_m(vbool16_t vm, const int32_t *rs1,
                                      vuint16m1_t rs2, size_t vl);
vint32m4_t __riscv_vloxei16_v_i32m4_m(vbool8_t vm, const int32_t *rs1,
                                      vuint16m2_t rs2, size_t vl);
vint32m8_t __riscv_vloxei16_v_i32m8_m(vbool4_t vm, const int32_t *rs1,
                                      vuint16m4_t rs2, size_t vl);
vint32mf2_t __riscv_vloxei32_v_i32mf2_m(vbool64_t vm, const int32_t *rs1,
                                        vuint32mf2_t rs2, size_t vl);
vint32m1_t __riscv_vloxei32_v_i32m1_m(vbool32_t vm, const int32_t *rs1,
                                      vuint32m1_t rs2, size_t vl);
vint32m2_t __riscv_vloxei32_v_i32m2_m(vbool16_t vm, const int32_t *rs1,
                                      vuint32m2_t rs2, size_t vl);
vint32m4_t __riscv_vloxei32_v_i32m4_m(vbool8_t vm, const int32_t *rs1,
                                      vuint32m4_t rs2, size_t vl);
vint32m8_t __riscv_vloxei32_v_i32m8_m(vbool4_t vm, const int32_t *rs1,
                                      vuint32m8_t rs2, size_t vl);
vint32mf2_t __riscv_vloxei64_v_i32mf2_m(vbool64_t vm, const int32_t *rs1,
                                        vuint64m1_t rs2, size_t vl);
vint32m1_t __riscv_vloxei64_v_i32m1_m(vbool32_t vm, const int32_t *rs1,
                                      vuint64m2_t rs2, size_t vl);
vint32m2_t __riscv_vloxei64_v_i32m2_m(vbool16_t vm, const int32_t *rs1,
                                      vuint64m4_t rs2, size_t vl);
vint32m4_t __riscv_vloxei64_v_i32m4_m(vbool8_t vm, const int32_t *rs1,
                                      vuint64m8_t rs2, size_t vl);
// Masked __riscv_vloxei{8,16,32,64}_v_i64m{1,2,4,8}_m prototypes (int64_t
// elements).
// Parameters: vm is the vbool*_t mask, rs1 the const int64_t base pointer,
// rs2 an unsigned index vector whose element width is the number after "ei",
// and vl a size_t. The return type is the vint64 type named in the suffix.
// All four index widths are listed for every i64 variant from m1 to m8.
// NOTE(review): "vloxei" matches the RVV indexed-ordered load mnemonic;
// confirm ordering and inactive-element behaviour against the spec.
vint64m1_t __riscv_vloxei8_v_i64m1_m(vbool64_t vm, const int64_t *rs1,
                                     vuint8mf8_t rs2, size_t vl);
vint64m2_t __riscv_vloxei8_v_i64m2_m(vbool32_t vm, const int64_t *rs1,
                                     vuint8mf4_t rs2, size_t vl);
vint64m4_t __riscv_vloxei8_v_i64m4_m(vbool16_t vm, const int64_t *rs1,
                                     vuint8mf2_t rs2, size_t vl);
vint64m8_t __riscv_vloxei8_v_i64m8_m(vbool8_t vm, const int64_t *rs1,
                                     vuint8m1_t rs2, size_t vl);
vint64m1_t __riscv_vloxei16_v_i64m1_m(vbool64_t vm, const int64_t *rs1,
                                      vuint16mf4_t rs2, size_t vl);
vint64m2_t __riscv_vloxei16_v_i64m2_m(vbool32_t vm, const int64_t *rs1,
                                      vuint16mf2_t rs2, size_t vl);
vint64m4_t __riscv_vloxei16_v_i64m4_m(vbool16_t vm, const int64_t *rs1,
                                      vuint16m1_t rs2, size_t vl);
vint64m8_t __riscv_vloxei16_v_i64m8_m(vbool8_t vm, const int64_t *rs1,
                                      vuint16m2_t rs2, size_t vl);
vint64m1_t __riscv_vloxei32_v_i64m1_m(vbool64_t vm, const int64_t *rs1,
                                      vuint32mf2_t rs2, size_t vl);
vint64m2_t __riscv_vloxei32_v_i64m2_m(vbool32_t vm, const int64_t *rs1,
                                      vuint32m1_t rs2, size_t vl);
vint64m4_t __riscv_vloxei32_v_i64m4_m(vbool16_t vm, const int64_t *rs1,
                                      vuint32m2_t rs2, size_t vl);
vint64m8_t __riscv_vloxei32_v_i64m8_m(vbool8_t vm, const int64_t *rs1,
                                      vuint32m4_t rs2, size_t vl);
vint64m1_t __riscv_vloxei64_v_i64m1_m(vbool64_t vm, const int64_t *rs1,
                                      vuint64m1_t rs2, size_t vl);
vint64m2_t __riscv_vloxei64_v_i64m2_m(vbool32_t vm, const int64_t *rs1,
                                      vuint64m2_t rs2, size_t vl);
vint64m4_t __riscv_vloxei64_v_i64m4_m(vbool16_t vm, const int64_t *rs1,
                                      vuint64m4_t rs2, size_t vl);
vint64m8_t __riscv_vloxei64_v_i64m8_m(vbool8_t vm, const int64_t *rs1,
                                      vuint64m8_t rs2, size_t vl);
// Masked __riscv_vluxei{8,16,32,64}_v_i8*_m prototypes (int8_t elements).
// Parameters: vm is the vbool*_t mask, rs1 the const int8_t base pointer,
// rs2 an unsigned index vector whose element width is the number after "ei",
// and vl a size_t. The return type is the vint8 type named in the suffix.
// Listed variants: ei8 covers i8mf8..i8m8, ei16 stops at i8m4 (vuint16m8_t
// index), ei32 at i8m2 (vuint32m8_t index) and ei64 at i8m1 (vuint64m8_t
// index).
// NOTE(review): "vluxei" matches the RVV indexed-unordered load mnemonic;
// confirm inactive-element behaviour against the intrinsics spec.
vint8mf8_t __riscv_vluxei8_v_i8mf8_m(vbool64_t vm, const int8_t *rs1,
                                     vuint8mf8_t rs2, size_t vl);
vint8mf4_t __riscv_vluxei8_v_i8mf4_m(vbool32_t vm, const int8_t *rs1,
                                     vuint8mf4_t rs2, size_t vl);
vint8mf2_t __riscv_vluxei8_v_i8mf2_m(vbool16_t vm, const int8_t *rs1,
                                     vuint8mf2_t rs2, size_t vl);
vint8m1_t __riscv_vluxei8_v_i8m1_m(vbool8_t vm, const int8_t *rs1,
                                   vuint8m1_t rs2, size_t vl);
vint8m2_t __riscv_vluxei8_v_i8m2_m(vbool4_t vm, const int8_t *rs1,
                                   vuint8m2_t rs2, size_t vl);
vint8m4_t __riscv_vluxei8_v_i8m4_m(vbool2_t vm, const int8_t *rs1,
                                   vuint8m4_t rs2, size_t vl);
vint8m8_t __riscv_vluxei8_v_i8m8_m(vbool1_t vm, const int8_t *rs1,
                                   vuint8m8_t rs2, size_t vl);
vint8mf8_t __riscv_vluxei16_v_i8mf8_m(vbool64_t vm, const int8_t *rs1,
                                      vuint16mf4_t rs2, size_t vl);
vint8mf4_t __riscv_vluxei16_v_i8mf4_m(vbool32_t vm, const int8_t *rs1,
                                      vuint16mf2_t rs2, size_t vl);
vint8mf2_t __riscv_vluxei16_v_i8mf2_m(vbool16_t vm, const int8_t *rs1,
                                      vuint16m1_t rs2, size_t vl);
vint8m1_t __riscv_vluxei16_v_i8m1_m(vbool8_t vm, const int8_t *rs1,
                                    vuint16m2_t rs2, size_t vl);
vint8m2_t __riscv_vluxei16_v_i8m2_m(vbool4_t vm, const int8_t *rs1,
                                    vuint16m4_t rs2, size_t vl);
vint8m4_t __riscv_vluxei16_v_i8m4_m(vbool2_t vm, const int8_t *rs1,
                                    vuint16m8_t rs2, size_t vl);
vint8mf8_t __riscv_vluxei32_v_i8mf8_m(vbool64_t vm, const int8_t *rs1,
                                      vuint32mf2_t rs2, size_t vl);
vint8mf4_t __riscv_vluxei32_v_i8mf4_m(vbool32_t vm, const int8_t *rs1,
                                      vuint32m1_t rs2, size_t vl);
vint8mf2_t __riscv_vluxei32_v_i8mf2_m(vbool16_t vm, const int8_t *rs1,
                                      vuint32m2_t rs2, size_t vl);
vint8m1_t __riscv_vluxei32_v_i8m1_m(vbool8_t vm, const int8_t *rs1,
                                    vuint32m4_t rs2, size_t vl);
vint8m2_t __riscv_vluxei32_v_i8m2_m(vbool4_t vm, const int8_t *rs1,
                                    vuint32m8_t rs2, size_t vl);
vint8mf8_t __riscv_vluxei64_v_i8mf8_m(vbool64_t vm, const int8_t *rs1,
                                      vuint64m1_t rs2, size_t vl);
vint8mf4_t __riscv_vluxei64_v_i8mf4_m(vbool32_t vm, const int8_t *rs1,
                                      vuint64m2_t rs2, size_t vl);
vint8mf2_t __riscv_vluxei64_v_i8mf2_m(vbool16_t vm, const int8_t *rs1,
                                      vuint64m4_t rs2, size_t vl);
vint8m1_t __riscv_vluxei64_v_i8m1_m(vbool8_t vm, const int8_t *rs1,
                                    vuint64m8_t rs2, size_t vl);
// Masked __riscv_vluxei{8,16,32,64}_v_i16*_m prototypes (int16_t elements).
// Parameters: vm is the vbool*_t mask, rs1 the const int16_t base pointer,
// rs2 an unsigned index vector whose element width is the number after "ei",
// and vl a size_t. The return type is the vint16 type named in the suffix.
// Listed variants: ei8 and ei16 cover i16mf4..i16m8, ei32 stops at i16m4
// (vuint32m8_t index) and ei64 stops at i16m2 (vuint64m8_t index).
// NOTE(review): "vluxei" matches the RVV indexed-unordered load mnemonic;
// confirm inactive-element behaviour against the intrinsics spec.
vint16mf4_t __riscv_vluxei8_v_i16mf4_m(vbool64_t vm, const int16_t *rs1,
                                       vuint8mf8_t rs2, size_t vl);
vint16mf2_t __riscv_vluxei8_v_i16mf2_m(vbool32_t vm, const int16_t *rs1,
                                       vuint8mf4_t rs2, size_t vl);
vint16m1_t __riscv_vluxei8_v_i16m1_m(vbool16_t vm, const int16_t *rs1,
                                     vuint8mf2_t rs2, size_t vl);
vint16m2_t __riscv_vluxei8_v_i16m2_m(vbool8_t vm, const int16_t *rs1,
                                     vuint8m1_t rs2, size_t vl);
vint16m4_t __riscv_vluxei8_v_i16m4_m(vbool4_t vm, const int16_t *rs1,
                                     vuint8m2_t rs2, size_t vl);
vint16m8_t __riscv_vluxei8_v_i16m8_m(vbool2_t vm, const int16_t *rs1,
                                     vuint8m4_t rs2, size_t vl);
vint16mf4_t __riscv_vluxei16_v_i16mf4_m(vbool64_t vm, const int16_t *rs1,
                                        vuint16mf4_t rs2, size_t vl);
vint16mf2_t __riscv_vluxei16_v_i16mf2_m(vbool32_t vm, const int16_t *rs1,
                                        vuint16mf2_t rs2, size_t vl);
vint16m1_t __riscv_vluxei16_v_i16m1_m(vbool16_t vm, const int16_t *rs1,
                                      vuint16m1_t rs2, size_t vl);
vint16m2_t __riscv_vluxei16_v_i16m2_m(vbool8_t vm, const int16_t *rs1,
                                      vuint16m2_t rs2, size_t vl);
vint16m4_t __riscv_vluxei16_v_i16m4_m(vbool4_t vm, const int16_t *rs1,
                                      vuint16m4_t rs2, size_t vl);
vint16m8_t __riscv_vluxei16_v_i16m8_m(vbool2_t vm, const int16_t *rs1,
                                      vuint16m8_t rs2, size_t vl);
vint16mf4_t __riscv_vluxei32_v_i16mf4_m(vbool64_t vm, const int16_t *rs1,
                                        vuint32mf2_t rs2, size_t vl);
vint16mf2_t __riscv_vluxei32_v_i16mf2_m(vbool32_t vm, const int16_t *rs1,
                                        vuint32m1_t rs2, size_t vl);
vint16m1_t __riscv_vluxei32_v_i16m1_m(vbool16_t vm, const int16_t *rs1,
                                      vuint32m2_t rs2, size_t vl);
vint16m2_t __riscv_vluxei32_v_i16m2_m(vbool8_t vm, const int16_t *rs1,
                                      vuint32m4_t rs2, size_t vl);
vint16m4_t __riscv_vluxei32_v_i16m4_m(vbool4_t vm, const int16_t *rs1,
                                      vuint32m8_t rs2, size_t vl);
vint16mf4_t __riscv_vluxei64_v_i16mf4_m(vbool64_t vm, const int16_t *rs1,
                                        vuint64m1_t rs2, size_t vl);
vint16mf2_t __riscv_vluxei64_v_i16mf2_m(vbool32_t vm, const int16_t *rs1,
                                        vuint64m2_t rs2, size_t vl);
vint16m1_t __riscv_vluxei64_v_i16m1_m(vbool16_t vm, const int16_t *rs1,
                                      vuint64m4_t rs2, size_t vl);
vint16m2_t __riscv_vluxei64_v_i16m2_m(vbool8_t vm, const int16_t *rs1,
                                      vuint64m8_t rs2, size_t vl);
/*
 * Masked (_m) __riscv_vluxei<N> prototypes that return int32_t element
 * vectors (vint32*_t).
 *
 * Operands shared by every declaration in this group:
 *   vm  - mask; its vboolK_t type has K = 32 / LMUL of the returned vector
 *         (e.g. i32mf2 -> vbool64_t, i32m8 -> vbool4_t)
 *   rs1 - const int32_t * base pointer
 *   rs2 - unsigned index vector whose element width is the <N> after "ei"
 *   vl  - size_t operand
 *
 * NOTE(review): memory semantics are not visible in these declarations.
 * Presumably they wrap the RVV indexed-unordered load vluxei<N>.v, with rs2
 * holding byte offsets from rs1 and vl the number of elements processed;
 * confirm against the RVV specification.
 */

/* 8-bit indices (index LMUL is a quarter of the data LMUL). */
vint32mf2_t __riscv_vluxei8_v_i32mf2_m(vbool64_t vm, const int32_t *rs1,
                                       vuint8mf8_t rs2, size_t vl);
vint32m1_t __riscv_vluxei8_v_i32m1_m(vbool32_t vm, const int32_t *rs1,
                                     vuint8mf4_t rs2, size_t vl);
vint32m2_t __riscv_vluxei8_v_i32m2_m(vbool16_t vm, const int32_t *rs1,
                                     vuint8mf2_t rs2, size_t vl);
vint32m4_t __riscv_vluxei8_v_i32m4_m(vbool8_t vm, const int32_t *rs1,
                                     vuint8m1_t rs2, size_t vl);
vint32m8_t __riscv_vluxei8_v_i32m8_m(vbool4_t vm, const int32_t *rs1,
                                     vuint8m2_t rs2, size_t vl);
/* 16-bit indices (index LMUL is half the data LMUL). */
vint32mf2_t __riscv_vluxei16_v_i32mf2_m(vbool64_t vm, const int32_t *rs1,
                                        vuint16mf4_t rs2, size_t vl);
vint32m1_t __riscv_vluxei16_v_i32m1_m(vbool32_t vm, const int32_t *rs1,
                                      vuint16mf2_t rs2, size_t vl);
vint32m2_t __riscv_vluxei16_v_i32m2_m(vbool16_t vm, const int32_t *rs1,
                                      vuint16m1_t rs2, size_t vl);
vint32m4_t __riscv_vluxei16_v_i32m4_m(vbool8_t vm, const int32_t *rs1,
                                      vuint16m2_t rs2, size_t vl);
vint32m8_t __riscv_vluxei16_v_i32m8_m(vbool4_t vm, const int32_t *rs1,
                                      vuint16m4_t rs2, size_t vl);
/* 32-bit indices (index LMUL equals the data LMUL). */
vint32mf2_t __riscv_vluxei32_v_i32mf2_m(vbool64_t vm, const int32_t *rs1,
                                        vuint32mf2_t rs2, size_t vl);
vint32m1_t __riscv_vluxei32_v_i32m1_m(vbool32_t vm, const int32_t *rs1,
                                      vuint32m1_t rs2, size_t vl);
vint32m2_t __riscv_vluxei32_v_i32m2_m(vbool16_t vm, const int32_t *rs1,
                                      vuint32m2_t rs2, size_t vl);
vint32m4_t __riscv_vluxei32_v_i32m4_m(vbool8_t vm, const int32_t *rs1,
                                      vuint32m4_t rs2, size_t vl);
vint32m8_t __riscv_vluxei32_v_i32m8_m(vbool4_t vm, const int32_t *rs1,
                                      vuint32m8_t rs2, size_t vl);
/*
 * 64-bit indices (index LMUL is twice the data LMUL). The list ends at
 * i32m4, whose index operand is already vuint64m8_t.
 */
vint32mf2_t __riscv_vluxei64_v_i32mf2_m(vbool64_t vm, const int32_t *rs1,
                                        vuint64m1_t rs2, size_t vl);
vint32m1_t __riscv_vluxei64_v_i32m1_m(vbool32_t vm, const int32_t *rs1,
                                      vuint64m2_t rs2, size_t vl);
vint32m2_t __riscv_vluxei64_v_i32m2_m(vbool16_t vm, const int32_t *rs1,
                                      vuint64m4_t rs2, size_t vl);
vint32m4_t __riscv_vluxei64_v_i32m4_m(vbool8_t vm, const int32_t *rs1,
                                      vuint64m8_t rs2, size_t vl);
/*
 * Masked (_m) __riscv_vluxei<N> prototypes that return int64_t element
 * vectors (vint64*_t). Every index width is declared for m1, m2, m4 and m8.
 *
 * Operands shared by every declaration in this group:
 *   vm  - mask; its vboolK_t type has K = 64 / LMUL of the returned vector
 *         (e.g. i64m1 -> vbool64_t, i64m8 -> vbool8_t)
 *   rs1 - const int64_t * base pointer
 *   rs2 - unsigned index vector whose element width is the <N> after "ei"
 *   vl  - size_t operand
 *
 * NOTE(review): memory semantics are not visible in these declarations.
 * Presumably they wrap the RVV indexed-unordered load vluxei<N>.v, with rs2
 * holding byte offsets from rs1 and vl the number of elements processed;
 * confirm against the RVV specification.
 */

/* 8-bit indices (index LMUL is one eighth of the data LMUL). */
vint64m1_t __riscv_vluxei8_v_i64m1_m(vbool64_t vm, const int64_t *rs1,
                                     vuint8mf8_t rs2, size_t vl);
vint64m2_t __riscv_vluxei8_v_i64m2_m(vbool32_t vm, const int64_t *rs1,
                                     vuint8mf4_t rs2, size_t vl);
vint64m4_t __riscv_vluxei8_v_i64m4_m(vbool16_t vm, const int64_t *rs1,
                                     vuint8mf2_t rs2, size_t vl);
vint64m8_t __riscv_vluxei8_v_i64m8_m(vbool8_t vm, const int64_t *rs1,
                                     vuint8m1_t rs2, size_t vl);
/* 16-bit indices (index LMUL is a quarter of the data LMUL). */
vint64m1_t __riscv_vluxei16_v_i64m1_m(vbool64_t vm, const int64_t *rs1,
                                      vuint16mf4_t rs2, size_t vl);
vint64m2_t __riscv_vluxei16_v_i64m2_m(vbool32_t vm, const int64_t *rs1,
                                      vuint16mf2_t rs2, size_t vl);
vint64m4_t __riscv_vluxei16_v_i64m4_m(vbool16_t vm, const int64_t *rs1,
                                      vuint16m1_t rs2, size_t vl);
vint64m8_t __riscv_vluxei16_v_i64m8_m(vbool8_t vm, const int64_t *rs1,
                                      vuint16m2_t rs2, size_t vl);
/* 32-bit indices (index LMUL is half the data LMUL). */
vint64m1_t __riscv_vluxei32_v_i64m1_m(vbool64_t vm, const int64_t *rs1,
                                      vuint32mf2_t rs2, size_t vl);
vint64m2_t __riscv_vluxei32_v_i64m2_m(vbool32_t vm, const int64_t *rs1,
                                      vuint32m1_t rs2, size_t vl);
vint64m4_t __riscv_vluxei32_v_i64m4_m(vbool16_t vm, const int64_t *rs1,
                                      vuint32m2_t rs2, size_t vl);
vint64m8_t __riscv_vluxei32_v_i64m8_m(vbool8_t vm, const int64_t *rs1,
                                      vuint32m4_t rs2, size_t vl);
/* 64-bit indices (index LMUL equals the data LMUL). */
vint64m1_t __riscv_vluxei64_v_i64m1_m(vbool64_t vm, const int64_t *rs1,
                                      vuint64m1_t rs2, size_t vl);
vint64m2_t __riscv_vluxei64_v_i64m2_m(vbool32_t vm, const int64_t *rs1,
                                      vuint64m2_t rs2, size_t vl);
vint64m4_t __riscv_vluxei64_v_i64m4_m(vbool16_t vm, const int64_t *rs1,
                                      vuint64m4_t rs2, size_t vl);
vint64m8_t __riscv_vluxei64_v_i64m8_m(vbool8_t vm, const int64_t *rs1,
                                      vuint64m8_t rs2, size_t vl);
/*
 * Masked (_m) __riscv_vloxei<N> prototypes that return uint8_t element
 * vectors (vuint8*_t).
 *
 * Operands shared by every declaration in this group:
 *   vm  - mask; its vboolK_t type has K = 8 / LMUL of the returned vector
 *         (e.g. u8mf8 -> vbool64_t, u8m8 -> vbool1_t)
 *   rs1 - const uint8_t * base pointer
 *   rs2 - unsigned index vector whose element width is the <N> after "ei"
 *   vl  - size_t operand
 *
 * NOTE(review): memory semantics are not visible in these declarations.
 * Presumably they wrap the RVV indexed-ordered load vloxei<N>.v, with rs2
 * holding byte offsets from rs1 and vl the number of elements processed;
 * confirm against the RVV specification.
 */

/* 8-bit indices (index type equals the data type): mf8 through m8. */
vuint8mf8_t __riscv_vloxei8_v_u8mf8_m(vbool64_t vm, const uint8_t *rs1,
                                      vuint8mf8_t rs2, size_t vl);
vuint8mf4_t __riscv_vloxei8_v_u8mf4_m(vbool32_t vm, const uint8_t *rs1,
                                      vuint8mf4_t rs2, size_t vl);
vuint8mf2_t __riscv_vloxei8_v_u8mf2_m(vbool16_t vm, const uint8_t *rs1,
                                      vuint8mf2_t rs2, size_t vl);
vuint8m1_t __riscv_vloxei8_v_u8m1_m(vbool8_t vm, const uint8_t *rs1,
                                    vuint8m1_t rs2, size_t vl);
vuint8m2_t __riscv_vloxei8_v_u8m2_m(vbool4_t vm, const uint8_t *rs1,
                                    vuint8m2_t rs2, size_t vl);
vuint8m4_t __riscv_vloxei8_v_u8m4_m(vbool2_t vm, const uint8_t *rs1,
                                    vuint8m4_t rs2, size_t vl);
vuint8m8_t __riscv_vloxei8_v_u8m8_m(vbool1_t vm, const uint8_t *rs1,
                                    vuint8m8_t rs2, size_t vl);
/*
 * 16-bit indices (index LMUL is twice the data LMUL). The list ends at
 * u8m4, whose index operand is already vuint16m8_t.
 */
vuint8mf8_t __riscv_vloxei16_v_u8mf8_m(vbool64_t vm, const uint8_t *rs1,
                                       vuint16mf4_t rs2, size_t vl);
vuint8mf4_t __riscv_vloxei16_v_u8mf4_m(vbool32_t vm, const uint8_t *rs1,
                                       vuint16mf2_t rs2, size_t vl);
vuint8mf2_t __riscv_vloxei16_v_u8mf2_m(vbool16_t vm, const uint8_t *rs1,
                                       vuint16m1_t rs2, size_t vl);
vuint8m1_t __riscv_vloxei16_v_u8m1_m(vbool8_t vm, const uint8_t *rs1,
                                     vuint16m2_t rs2, size_t vl);
vuint8m2_t __riscv_vloxei16_v_u8m2_m(vbool4_t vm, const uint8_t *rs1,
                                     vuint16m4_t rs2, size_t vl);
vuint8m4_t __riscv_vloxei16_v_u8m4_m(vbool2_t vm, const uint8_t *rs1,
                                     vuint16m8_t rs2, size_t vl);
/*
 * 32-bit indices (index LMUL is four times the data LMUL). The list ends at
 * u8m2, whose index operand is already vuint32m8_t.
 */
vuint8mf8_t __riscv_vloxei32_v_u8mf8_m(vbool64_t vm, const uint8_t *rs1,
                                       vuint32mf2_t rs2, size_t vl);
vuint8mf4_t __riscv_vloxei32_v_u8mf4_m(vbool32_t vm, const uint8_t *rs1,
                                       vuint32m1_t rs2, size_t vl);
vuint8mf2_t __riscv_vloxei32_v_u8mf2_m(vbool16_t vm, const uint8_t *rs1,
                                       vuint32m2_t rs2, size_t vl);
vuint8m1_t __riscv_vloxei32_v_u8m1_m(vbool8_t vm, const uint8_t *rs1,
                                     vuint32m4_t rs2, size_t vl);
vuint8m2_t __riscv_vloxei32_v_u8m2_m(vbool4_t vm, const uint8_t *rs1,
                                     vuint32m8_t rs2, size_t vl);
/*
 * 64-bit indices (index LMUL is eight times the data LMUL). The list ends
 * at u8m1, whose index operand is already vuint64m8_t.
 */
vuint8mf8_t __riscv_vloxei64_v_u8mf8_m(vbool64_t vm, const uint8_t *rs1,
                                       vuint64m1_t rs2, size_t vl);
vuint8mf4_t __riscv_vloxei64_v_u8mf4_m(vbool32_t vm, const uint8_t *rs1,
                                       vuint64m2_t rs2, size_t vl);
vuint8mf2_t __riscv_vloxei64_v_u8mf2_m(vbool16_t vm, const uint8_t *rs1,
                                       vuint64m4_t rs2, size_t vl);
vuint8m1_t __riscv_vloxei64_v_u8m1_m(vbool8_t vm, const uint8_t *rs1,
                                     vuint64m8_t rs2, size_t vl);
/*
 * Masked (_m) __riscv_vloxei<N> prototypes that return uint16_t element
 * vectors (vuint16*_t).
 *
 * Operands shared by every declaration in this group:
 *   vm  - mask; its vboolK_t type has K = 16 / LMUL of the returned vector
 *         (e.g. u16mf4 -> vbool64_t, u16m8 -> vbool2_t)
 *   rs1 - const uint16_t * base pointer
 *   rs2 - unsigned index vector whose element width is the <N> after "ei"
 *   vl  - size_t operand
 *
 * NOTE(review): memory semantics are not visible in these declarations.
 * Presumably they wrap the RVV indexed-ordered load vloxei<N>.v, with rs2
 * holding byte offsets from rs1 and vl the number of elements processed;
 * confirm against the RVV specification.
 */

/* 8-bit indices (index LMUL is half the data LMUL): mf4 through m8. */
vuint16mf4_t __riscv_vloxei8_v_u16mf4_m(vbool64_t vm, const uint16_t *rs1,
                                        vuint8mf8_t rs2, size_t vl);
vuint16mf2_t __riscv_vloxei8_v_u16mf2_m(vbool32_t vm, const uint16_t *rs1,
                                        vuint8mf4_t rs2, size_t vl);
vuint16m1_t __riscv_vloxei8_v_u16m1_m(vbool16_t vm, const uint16_t *rs1,
                                      vuint8mf2_t rs2, size_t vl);
vuint16m2_t __riscv_vloxei8_v_u16m2_m(vbool8_t vm, const uint16_t *rs1,
                                      vuint8m1_t rs2, size_t vl);
vuint16m4_t __riscv_vloxei8_v_u16m4_m(vbool4_t vm, const uint16_t *rs1,
                                      vuint8m2_t rs2, size_t vl);
vuint16m8_t __riscv_vloxei8_v_u16m8_m(vbool2_t vm, const uint16_t *rs1,
                                      vuint8m4_t rs2, size_t vl);
/* 16-bit indices (index type equals the data type): mf4 through m8. */
vuint16mf4_t __riscv_vloxei16_v_u16mf4_m(vbool64_t vm, const uint16_t *rs1,
                                         vuint16mf4_t rs2, size_t vl);
vuint16mf2_t __riscv_vloxei16_v_u16mf2_m(vbool32_t vm, const uint16_t *rs1,
                                         vuint16mf2_t rs2, size_t vl);
vuint16m1_t __riscv_vloxei16_v_u16m1_m(vbool16_t vm, const uint16_t *rs1,
                                       vuint16m1_t rs2, size_t vl);
vuint16m2_t __riscv_vloxei16_v_u16m2_m(vbool8_t vm, const uint16_t *rs1,
                                       vuint16m2_t rs2, size_t vl);
vuint16m4_t __riscv_vloxei16_v_u16m4_m(vbool4_t vm, const uint16_t *rs1,
                                       vuint16m4_t rs2, size_t vl);
vuint16m8_t __riscv_vloxei16_v_u16m8_m(vbool2_t vm, const uint16_t *rs1,
                                       vuint16m8_t rs2, size_t vl);
/*
 * 32-bit indices (index LMUL is twice the data LMUL). The list ends at
 * u16m4, whose index operand is already vuint32m8_t.
 */
vuint16mf4_t __riscv_vloxei32_v_u16mf4_m(vbool64_t vm, const uint16_t *rs1,
                                         vuint32mf2_t rs2, size_t vl);
vuint16mf2_t __riscv_vloxei32_v_u16mf2_m(vbool32_t vm, const uint16_t *rs1,
                                         vuint32m1_t rs2, size_t vl);
vuint16m1_t __riscv_vloxei32_v_u16m1_m(vbool16_t vm, const uint16_t *rs1,
                                       vuint32m2_t rs2, size_t vl);
vuint16m2_t __riscv_vloxei32_v_u16m2_m(vbool8_t vm, const uint16_t *rs1,
                                       vuint32m4_t rs2, size_t vl);
vuint16m4_t __riscv_vloxei32_v_u16m4_m(vbool4_t vm, const uint16_t *rs1,
                                       vuint32m8_t rs2, size_t vl);
/*
 * 64-bit indices (index LMUL is four times the data LMUL). The list ends at
 * u16m2, whose index operand is already vuint64m8_t.
 */
vuint16mf4_t __riscv_vloxei64_v_u16mf4_m(vbool64_t vm, const uint16_t *rs1,
                                         vuint64m1_t rs2, size_t vl);
vuint16mf2_t __riscv_vloxei64_v_u16mf2_m(vbool32_t vm, const uint16_t *rs1,
                                         vuint64m2_t rs2, size_t vl);
vuint16m1_t __riscv_vloxei64_v_u16m1_m(vbool16_t vm, const uint16_t *rs1,
                                       vuint64m4_t rs2, size_t vl);
vuint16m2_t __riscv_vloxei64_v_u16m2_m(vbool8_t vm, const uint16_t *rs1,
                                       vuint64m8_t rs2, size_t vl);
/*
 * Masked (_m) __riscv_vloxei<N> prototypes that return uint32_t element
 * vectors (vuint32*_t).
 *
 * Operands shared by every declaration in this group:
 *   vm  - mask; its vboolK_t type has K = 32 / LMUL of the returned vector
 *         (e.g. u32mf2 -> vbool64_t, u32m8 -> vbool4_t)
 *   rs1 - const uint32_t * base pointer
 *   rs2 - unsigned index vector whose element width is the <N> after "ei"
 *   vl  - size_t operand
 *
 * NOTE(review): memory semantics are not visible in these declarations.
 * Presumably they wrap the RVV indexed-ordered load vloxei<N>.v, with rs2
 * holding byte offsets from rs1 and vl the number of elements processed;
 * confirm against the RVV specification.
 */

/* 8-bit indices (index LMUL is a quarter of the data LMUL). */
vuint32mf2_t __riscv_vloxei8_v_u32mf2_m(vbool64_t vm, const uint32_t *rs1,
                                        vuint8mf8_t rs2, size_t vl);
vuint32m1_t __riscv_vloxei8_v_u32m1_m(vbool32_t vm, const uint32_t *rs1,
                                      vuint8mf4_t rs2, size_t vl);
vuint32m2_t __riscv_vloxei8_v_u32m2_m(vbool16_t vm, const uint32_t *rs1,
                                      vuint8mf2_t rs2, size_t vl);
vuint32m4_t __riscv_vloxei8_v_u32m4_m(vbool8_t vm, const uint32_t *rs1,
                                      vuint8m1_t rs2, size_t vl);
vuint32m8_t __riscv_vloxei8_v_u32m8_m(vbool4_t vm, const uint32_t *rs1,
                                      vuint8m2_t rs2, size_t vl);
/* 16-bit indices (index LMUL is half the data LMUL). */
vuint32mf2_t __riscv_vloxei16_v_u32mf2_m(vbool64_t vm, const uint32_t *rs1,
                                         vuint16mf4_t rs2, size_t vl);
vuint32m1_t __riscv_vloxei16_v_u32m1_m(vbool32_t vm, const uint32_t *rs1,
                                       vuint16mf2_t rs2, size_t vl);
vuint32m2_t __riscv_vloxei16_v_u32m2_m(vbool16_t vm, const uint32_t *rs1,
                                       vuint16m1_t rs2, size_t vl);
vuint32m4_t __riscv_vloxei16_v_u32m4_m(vbool8_t vm, const uint32_t *rs1,
                                       vuint16m2_t rs2, size_t vl);
vuint32m8_t __riscv_vloxei16_v_u32m8_m(vbool4_t vm, const uint32_t *rs1,
                                       vuint16m4_t rs2, size_t vl);
/* 32-bit indices (index type equals the data type). */
vuint32mf2_t __riscv_vloxei32_v_u32mf2_m(vbool64_t vm, const uint32_t *rs1,
                                         vuint32mf2_t rs2, size_t vl);
vuint32m1_t __riscv_vloxei32_v_u32m1_m(vbool32_t vm, const uint32_t *rs1,
                                       vuint32m1_t rs2, size_t vl);
vuint32m2_t __riscv_vloxei32_v_u32m2_m(vbool16_t vm, const uint32_t *rs1,
                                       vuint32m2_t rs2, size_t vl);
vuint32m4_t __riscv_vloxei32_v_u32m4_m(vbool8_t vm, const uint32_t *rs1,
                                       vuint32m4_t rs2, size_t vl);
vuint32m8_t __riscv_vloxei32_v_u32m8_m(vbool4_t vm, const uint32_t *rs1,
                                       vuint32m8_t rs2, size_t vl);
/*
 * 64-bit indices (index LMUL is twice the data LMUL). The list ends at
 * u32m4, whose index operand is already vuint64m8_t.
 */
vuint32mf2_t __riscv_vloxei64_v_u32mf2_m(vbool64_t vm, const uint32_t *rs1,
                                         vuint64m1_t rs2, size_t vl);
vuint32m1_t __riscv_vloxei64_v_u32m1_m(vbool32_t vm, const uint32_t *rs1,
                                       vuint64m2_t rs2, size_t vl);
vuint32m2_t __riscv_vloxei64_v_u32m2_m(vbool16_t vm, const uint32_t *rs1,
                                       vuint64m4_t rs2, size_t vl);
vuint32m4_t __riscv_vloxei64_v_u32m4_m(vbool8_t vm, const uint32_t *rs1,
                                       vuint64m8_t rs2, size_t vl);
/*
 * Masked (_m) __riscv_vloxei<N> prototypes that return uint64_t element
 * vectors (vuint64*_t). Every index width is declared for m1, m2, m4 and m8.
 *
 * Operands shared by every declaration in this group:
 *   vm  - mask; its vboolK_t type has K = 64 / LMUL of the returned vector
 *         (e.g. u64m1 -> vbool64_t, u64m8 -> vbool8_t)
 *   rs1 - const uint64_t * base pointer
 *   rs2 - unsigned index vector whose element width is the <N> after "ei"
 *   vl  - size_t operand
 *
 * NOTE(review): memory semantics are not visible in these declarations.
 * Presumably they wrap the RVV indexed-ordered load vloxei<N>.v, with rs2
 * holding byte offsets from rs1 and vl the number of elements processed;
 * confirm against the RVV specification.
 */

/* 8-bit indices (index LMUL is one eighth of the data LMUL). */
vuint64m1_t __riscv_vloxei8_v_u64m1_m(vbool64_t vm, const uint64_t *rs1,
                                      vuint8mf8_t rs2, size_t vl);
vuint64m2_t __riscv_vloxei8_v_u64m2_m(vbool32_t vm, const uint64_t *rs1,
                                      vuint8mf4_t rs2, size_t vl);
vuint64m4_t __riscv_vloxei8_v_u64m4_m(vbool16_t vm, const uint64_t *rs1,
                                      vuint8mf2_t rs2, size_t vl);
vuint64m8_t __riscv_vloxei8_v_u64m8_m(vbool8_t vm, const uint64_t *rs1,
                                      vuint8m1_t rs2, size_t vl);
/* 16-bit indices (index LMUL is a quarter of the data LMUL). */
vuint64m1_t __riscv_vloxei16_v_u64m1_m(vbool64_t vm, const uint64_t *rs1,
                                       vuint16mf4_t rs2, size_t vl);
vuint64m2_t __riscv_vloxei16_v_u64m2_m(vbool32_t vm, const uint64_t *rs1,
                                       vuint16mf2_t rs2, size_t vl);
vuint64m4_t __riscv_vloxei16_v_u64m4_m(vbool16_t vm, const uint64_t *rs1,
                                       vuint16m1_t rs2, size_t vl);
vuint64m8_t __riscv_vloxei16_v_u64m8_m(vbool8_t vm, const uint64_t *rs1,
                                       vuint16m2_t rs2, size_t vl);
/* 32-bit indices (index LMUL is half the data LMUL). */
vuint64m1_t __riscv_vloxei32_v_u64m1_m(vbool64_t vm, const uint64_t *rs1,
                                       vuint32mf2_t rs2, size_t vl);
vuint64m2_t __riscv_vloxei32_v_u64m2_m(vbool32_t vm, const uint64_t *rs1,
                                       vuint32m1_t rs2, size_t vl);
vuint64m4_t __riscv_vloxei32_v_u64m4_m(vbool16_t vm, const uint64_t *rs1,
                                       vuint32m2_t rs2, size_t vl);
vuint64m8_t __riscv_vloxei32_v_u64m8_m(vbool8_t vm, const uint64_t *rs1,
                                       vuint32m4_t rs2, size_t vl);
/* 64-bit indices (index type equals the data type). */
vuint64m1_t __riscv_vloxei64_v_u64m1_m(vbool64_t vm, const uint64_t *rs1,
                                       vuint64m1_t rs2, size_t vl);
vuint64m2_t __riscv_vloxei64_v_u64m2_m(vbool32_t vm, const uint64_t *rs1,
                                       vuint64m2_t rs2, size_t vl);
vuint64m4_t __riscv_vloxei64_v_u64m4_m(vbool16_t vm, const uint64_t *rs1,
                                       vuint64m4_t rs2, size_t vl);
vuint64m8_t __riscv_vloxei64_v_u64m8_m(vbool8_t vm, const uint64_t *rs1,
                                       vuint64m8_t rs2, size_t vl);
/*
 * Masked (_m) __riscv_vluxei<N> prototypes that return uint8_t element
 * vectors (vuint8*_t).
 *
 * Operands shared by every declaration in this group:
 *   vm  - mask; its vboolK_t type has K = 8 / LMUL of the returned vector
 *         (e.g. u8mf8 -> vbool64_t, u8m8 -> vbool1_t)
 *   rs1 - const uint8_t * base pointer
 *   rs2 - unsigned index vector whose element width is the <N> after "ei"
 *   vl  - size_t operand
 *
 * NOTE(review): memory semantics are not visible in these declarations.
 * Presumably they wrap the RVV indexed-unordered load vluxei<N>.v, with rs2
 * holding byte offsets from rs1 and vl the number of elements processed;
 * confirm against the RVV specification.
 */

/* 8-bit indices (index type equals the data type): mf8 through m8. */
vuint8mf8_t __riscv_vluxei8_v_u8mf8_m(vbool64_t vm, const uint8_t *rs1,
                                      vuint8mf8_t rs2, size_t vl);
vuint8mf4_t __riscv_vluxei8_v_u8mf4_m(vbool32_t vm, const uint8_t *rs1,
                                      vuint8mf4_t rs2, size_t vl);
vuint8mf2_t __riscv_vluxei8_v_u8mf2_m(vbool16_t vm, const uint8_t *rs1,
                                      vuint8mf2_t rs2, size_t vl);
vuint8m1_t __riscv_vluxei8_v_u8m1_m(vbool8_t vm, const uint8_t *rs1,
                                    vuint8m1_t rs2, size_t vl);
vuint8m2_t __riscv_vluxei8_v_u8m2_m(vbool4_t vm, const uint8_t *rs1,
                                    vuint8m2_t rs2, size_t vl);
vuint8m4_t __riscv_vluxei8_v_u8m4_m(vbool2_t vm, const uint8_t *rs1,
                                    vuint8m4_t rs2, size_t vl);
vuint8m8_t __riscv_vluxei8_v_u8m8_m(vbool1_t vm, const uint8_t *rs1,
                                    vuint8m8_t rs2, size_t vl);
/*
 * 16-bit indices (index LMUL is twice the data LMUL). The list ends at
 * u8m4, whose index operand is already vuint16m8_t.
 */
vuint8mf8_t __riscv_vluxei16_v_u8mf8_m(vbool64_t vm, const uint8_t *rs1,
                                       vuint16mf4_t rs2, size_t vl);
vuint8mf4_t __riscv_vluxei16_v_u8mf4_m(vbool32_t vm, const uint8_t *rs1,
                                       vuint16mf2_t rs2, size_t vl);
vuint8mf2_t __riscv_vluxei16_v_u8mf2_m(vbool16_t vm, const uint8_t *rs1,
                                       vuint16m1_t rs2, size_t vl);
vuint8m1_t __riscv_vluxei16_v_u8m1_m(vbool8_t vm, const uint8_t *rs1,
                                     vuint16m2_t rs2, size_t vl);
vuint8m2_t __riscv_vluxei16_v_u8m2_m(vbool4_t vm, const uint8_t *rs1,
                                     vuint16m4_t rs2, size_t vl);
vuint8m4_t __riscv_vluxei16_v_u8m4_m(vbool2_t vm, const uint8_t *rs1,
                                     vuint16m8_t rs2, size_t vl);
/*
 * 32-bit indices (index LMUL is four times the data LMUL). The list ends at
 * u8m2, whose index operand is already vuint32m8_t.
 */
vuint8mf8_t __riscv_vluxei32_v_u8mf8_m(vbool64_t vm, const uint8_t *rs1,
                                       vuint32mf2_t rs2, size_t vl);
vuint8mf4_t __riscv_vluxei32_v_u8mf4_m(vbool32_t vm, const uint8_t *rs1,
                                       vuint32m1_t rs2, size_t vl);
vuint8mf2_t __riscv_vluxei32_v_u8mf2_m(vbool16_t vm, const uint8_t *rs1,
                                       vuint32m2_t rs2, size_t vl);
vuint8m1_t __riscv_vluxei32_v_u8m1_m(vbool8_t vm, const uint8_t *rs1,
                                     vuint32m4_t rs2, size_t vl);
vuint8m2_t __riscv_vluxei32_v_u8m2_m(vbool4_t vm, const uint8_t *rs1,
                                     vuint32m8_t rs2, size_t vl);
/*
 * 64-bit indices (index LMUL is eight times the data LMUL). The list ends
 * at u8m1, whose index operand is already vuint64m8_t.
 */
vuint8mf8_t __riscv_vluxei64_v_u8mf8_m(vbool64_t vm, const uint8_t *rs1,
                                       vuint64m1_t rs2, size_t vl);
vuint8mf4_t __riscv_vluxei64_v_u8mf4_m(vbool32_t vm, const uint8_t *rs1,
                                       vuint64m2_t rs2, size_t vl);
vuint8mf2_t __riscv_vluxei64_v_u8mf2_m(vbool16_t vm, const uint8_t *rs1,
                                       vuint64m4_t rs2, size_t vl);
vuint8m1_t __riscv_vluxei64_v_u8m1_m(vbool8_t vm, const uint8_t *rs1,
                                     vuint64m8_t rs2, size_t vl);
/*
 * Masked (_m) __riscv_vluxei<N> prototypes that return uint16_t element
 * vectors (vuint16*_t).
 *
 * Operands shared by every declaration in this group:
 *   vm  - mask; its vboolK_t type has K = 16 / LMUL of the returned vector
 *         (e.g. u16mf4 -> vbool64_t, u16m8 -> vbool2_t)
 *   rs1 - const uint16_t * base pointer
 *   rs2 - unsigned index vector whose element width is the <N> after "ei"
 *   vl  - size_t operand
 *
 * NOTE(review): memory semantics are not visible in these declarations.
 * Presumably they wrap the RVV indexed-unordered load vluxei<N>.v, with rs2
 * holding byte offsets from rs1 and vl the number of elements processed;
 * confirm against the RVV specification.
 */

/* 8-bit indices (index LMUL is half the data LMUL): mf4 through m8. */
vuint16mf4_t __riscv_vluxei8_v_u16mf4_m(vbool64_t vm, const uint16_t *rs1,
                                        vuint8mf8_t rs2, size_t vl);
vuint16mf2_t __riscv_vluxei8_v_u16mf2_m(vbool32_t vm, const uint16_t *rs1,
                                        vuint8mf4_t rs2, size_t vl);
vuint16m1_t __riscv_vluxei8_v_u16m1_m(vbool16_t vm, const uint16_t *rs1,
                                      vuint8mf2_t rs2, size_t vl);
vuint16m2_t __riscv_vluxei8_v_u16m2_m(vbool8_t vm, const uint16_t *rs1,
                                      vuint8m1_t rs2, size_t vl);
vuint16m4_t __riscv_vluxei8_v_u16m4_m(vbool4_t vm, const uint16_t *rs1,
                                      vuint8m2_t rs2, size_t vl);
vuint16m8_t __riscv_vluxei8_v_u16m8_m(vbool2_t vm, const uint16_t *rs1,
                                      vuint8m4_t rs2, size_t vl);
/* 16-bit indices (index type equals the data type): mf4 through m8. */
vuint16mf4_t __riscv_vluxei16_v_u16mf4_m(vbool64_t vm, const uint16_t *rs1,
                                         vuint16mf4_t rs2, size_t vl);
vuint16mf2_t __riscv_vluxei16_v_u16mf2_m(vbool32_t vm, const uint16_t *rs1,
                                         vuint16mf2_t rs2, size_t vl);
vuint16m1_t __riscv_vluxei16_v_u16m1_m(vbool16_t vm, const uint16_t *rs1,
                                       vuint16m1_t rs2, size_t vl);
vuint16m2_t __riscv_vluxei16_v_u16m2_m(vbool8_t vm, const uint16_t *rs1,
                                       vuint16m2_t rs2, size_t vl);
vuint16m4_t __riscv_vluxei16_v_u16m4_m(vbool4_t vm, const uint16_t *rs1,
                                       vuint16m4_t rs2, size_t vl);
vuint16m8_t __riscv_vluxei16_v_u16m8_m(vbool2_t vm, const uint16_t *rs1,
                                       vuint16m8_t rs2, size_t vl);
/*
 * 32-bit indices (index LMUL is twice the data LMUL). The list ends at
 * u16m4, whose index operand is already vuint32m8_t.
 */
vuint16mf4_t __riscv_vluxei32_v_u16mf4_m(vbool64_t vm, const uint16_t *rs1,
                                         vuint32mf2_t rs2, size_t vl);
vuint16mf2_t __riscv_vluxei32_v_u16mf2_m(vbool32_t vm, const uint16_t *rs1,
                                         vuint32m1_t rs2, size_t vl);
vuint16m1_t __riscv_vluxei32_v_u16m1_m(vbool16_t vm, const uint16_t *rs1,
                                       vuint32m2_t rs2, size_t vl);
vuint16m2_t __riscv_vluxei32_v_u16m2_m(vbool8_t vm, const uint16_t *rs1,
                                       vuint32m4_t rs2, size_t vl);
vuint16m4_t __riscv_vluxei32_v_u16m4_m(vbool4_t vm, const uint16_t *rs1,
                                       vuint32m8_t rs2, size_t vl);
/*
 * 64-bit indices (index LMUL is four times the data LMUL). The list ends at
 * u16m2, whose index operand is already vuint64m8_t.
 */
vuint16mf4_t __riscv_vluxei64_v_u16mf4_m(vbool64_t vm, const uint16_t *rs1,
                                         vuint64m1_t rs2, size_t vl);
vuint16mf2_t __riscv_vluxei64_v_u16mf2_m(vbool32_t vm, const uint16_t *rs1,
                                         vuint64m2_t rs2, size_t vl);
vuint16m1_t __riscv_vluxei64_v_u16m1_m(vbool16_t vm, const uint16_t *rs1,
                                       vuint64m4_t rs2, size_t vl);
vuint16m2_t __riscv_vluxei64_v_u16m2_m(vbool8_t vm, const uint16_t *rs1,
                                       vuint64m8_t rs2, size_t vl);
/*
 * Masked (_m) __riscv_vluxei<N> prototypes that return uint32_t element
 * vectors (vuint32*_t).
 *
 * Operands shared by every declaration in this group:
 *   vm  - mask; its vboolK_t type has K = 32 / LMUL of the returned vector
 *         (e.g. u32mf2 -> vbool64_t, u32m8 -> vbool4_t)
 *   rs1 - const uint32_t * base pointer
 *   rs2 - unsigned index vector whose element width is the <N> after "ei"
 *   vl  - size_t operand
 *
 * NOTE(review): memory semantics are not visible in these declarations.
 * Presumably they wrap the RVV indexed-unordered load vluxei<N>.v, with rs2
 * holding byte offsets from rs1 and vl the number of elements processed;
 * confirm against the RVV specification.
 */

/* 8-bit indices (index LMUL is a quarter of the data LMUL). */
vuint32mf2_t __riscv_vluxei8_v_u32mf2_m(vbool64_t vm, const uint32_t *rs1,
                                        vuint8mf8_t rs2, size_t vl);
vuint32m1_t __riscv_vluxei8_v_u32m1_m(vbool32_t vm, const uint32_t *rs1,
                                      vuint8mf4_t rs2, size_t vl);
vuint32m2_t __riscv_vluxei8_v_u32m2_m(vbool16_t vm, const uint32_t *rs1,
                                      vuint8mf2_t rs2, size_t vl);
vuint32m4_t __riscv_vluxei8_v_u32m4_m(vbool8_t vm, const uint32_t *rs1,
                                      vuint8m1_t rs2, size_t vl);
vuint32m8_t __riscv_vluxei8_v_u32m8_m(vbool4_t vm, const uint32_t *rs1,
                                      vuint8m2_t rs2, size_t vl);
/* 16-bit indices (index LMUL is half the data LMUL). */
vuint32mf2_t __riscv_vluxei16_v_u32mf2_m(vbool64_t vm, const uint32_t *rs1,
                                         vuint16mf4_t rs2, size_t vl);
vuint32m1_t __riscv_vluxei16_v_u32m1_m(vbool32_t vm, const uint32_t *rs1,
                                       vuint16mf2_t rs2, size_t vl);
vuint32m2_t __riscv_vluxei16_v_u32m2_m(vbool16_t vm, const uint32_t *rs1,
                                       vuint16m1_t rs2, size_t vl);
vuint32m4_t __riscv_vluxei16_v_u32m4_m(vbool8_t vm, const uint32_t *rs1,
                                       vuint16m2_t rs2, size_t vl);
vuint32m8_t __riscv_vluxei16_v_u32m8_m(vbool4_t vm, const uint32_t *rs1,
                                       vuint16m4_t rs2, size_t vl);
/* 32-bit indices (index type equals the data type). */
vuint32mf2_t __riscv_vluxei32_v_u32mf2_m(vbool64_t vm, const uint32_t *rs1,
                                         vuint32mf2_t rs2, size_t vl);
vuint32m1_t __riscv_vluxei32_v_u32m1_m(vbool32_t vm, const uint32_t *rs1,
                                       vuint32m1_t rs2, size_t vl);
vuint32m2_t __riscv_vluxei32_v_u32m2_m(vbool16_t vm, const uint32_t *rs1,
                                       vuint32m2_t rs2, size_t vl);
vuint32m4_t __riscv_vluxei32_v_u32m4_m(vbool8_t vm, const uint32_t *rs1,
                                       vuint32m4_t rs2, size_t vl);
vuint32m8_t __riscv_vluxei32_v_u32m8_m(vbool4_t vm, const uint32_t *rs1,
                                       vuint32m8_t rs2, size_t vl);
/*
 * 64-bit indices (index LMUL is twice the data LMUL). The list ends at
 * u32m4, whose index operand is already vuint64m8_t.
 */
vuint32mf2_t __riscv_vluxei64_v_u32mf2_m(vbool64_t vm, const uint32_t *rs1,
                                         vuint64m1_t rs2, size_t vl);
vuint32m1_t __riscv_vluxei64_v_u32m1_m(vbool32_t vm, const uint32_t *rs1,
                                       vuint64m2_t rs2, size_t vl);
vuint32m2_t __riscv_vluxei64_v_u32m2_m(vbool16_t vm, const uint32_t *rs1,
                                       vuint64m4_t rs2, size_t vl);
vuint32m4_t __riscv_vluxei64_v_u32m4_m(vbool8_t vm, const uint32_t *rs1,
                                       vuint64m8_t rs2, size_t vl);
/*
 * Masked (_m) __riscv_vluxei<N> prototypes that return uint64_t element
 * vectors (vuint64*_t). Every index width is declared for m1, m2, m4 and m8.
 *
 * Operands shared by every declaration in this group:
 *   vm  - mask; its vboolK_t type has K = 64 / LMUL of the returned vector
 *         (e.g. u64m1 -> vbool64_t, u64m8 -> vbool8_t)
 *   rs1 - const uint64_t * base pointer
 *   rs2 - unsigned index vector whose element width is the <N> after "ei"
 *   vl  - size_t operand
 *
 * NOTE(review): memory semantics are not visible in these declarations.
 * Presumably they wrap the RVV indexed-unordered load vluxei<N>.v, with rs2
 * holding byte offsets from rs1 and vl the number of elements processed;
 * confirm against the RVV specification.
 */

/* 8-bit indices (index LMUL is one eighth of the data LMUL). */
vuint64m1_t __riscv_vluxei8_v_u64m1_m(vbool64_t vm, const uint64_t *rs1,
                                      vuint8mf8_t rs2, size_t vl);
vuint64m2_t __riscv_vluxei8_v_u64m2_m(vbool32_t vm, const uint64_t *rs1,
                                      vuint8mf4_t rs2, size_t vl);
vuint64m4_t __riscv_vluxei8_v_u64m4_m(vbool16_t vm, const uint64_t *rs1,
                                      vuint8mf2_t rs2, size_t vl);
vuint64m8_t __riscv_vluxei8_v_u64m8_m(vbool8_t vm, const uint64_t *rs1,
                                      vuint8m1_t rs2, size_t vl);
/* 16-bit indices (index LMUL is a quarter of the data LMUL). */
vuint64m1_t __riscv_vluxei16_v_u64m1_m(vbool64_t vm, const uint64_t *rs1,
                                       vuint16mf4_t rs2, size_t vl);
vuint64m2_t __riscv_vluxei16_v_u64m2_m(vbool32_t vm, const uint64_t *rs1,
                                       vuint16mf2_t rs2, size_t vl);
vuint64m4_t __riscv_vluxei16_v_u64m4_m(vbool16_t vm, const uint64_t *rs1,
                                       vuint16m1_t rs2, size_t vl);
vuint64m8_t __riscv_vluxei16_v_u64m8_m(vbool8_t vm, const uint64_t *rs1,
                                       vuint16m2_t rs2, size_t vl);
/* 32-bit indices (index LMUL is half the data LMUL). */
vuint64m1_t __riscv_vluxei32_v_u64m1_m(vbool64_t vm, const uint64_t *rs1,
                                       vuint32mf2_t rs2, size_t vl);
vuint64m2_t __riscv_vluxei32_v_u64m2_m(vbool32_t vm, const uint64_t *rs1,
                                       vuint32m1_t rs2, size_t vl);
vuint64m4_t __riscv_vluxei32_v_u64m4_m(vbool16_t vm, const uint64_t *rs1,
                                       vuint32m2_t rs2, size_t vl);
vuint64m8_t __riscv_vluxei32_v_u64m8_m(vbool8_t vm, const uint64_t *rs1,
                                       vuint32m4_t rs2, size_t vl);
/* 64-bit indices (index type equals the data type). */
vuint64m1_t __riscv_vluxei64_v_u64m1_m(vbool64_t vm, const uint64_t *rs1,
                                       vuint64m1_t rs2, size_t vl);
vuint64m2_t __riscv_vluxei64_v_u64m2_m(vbool32_t vm, const uint64_t *rs1,
                                       vuint64m2_t rs2, size_t vl);
vuint64m4_t __riscv_vluxei64_v_u64m4_m(vbool16_t vm, const uint64_t *rs1,
                                       vuint64m4_t rs2, size_t vl);
vuint64m8_t __riscv_vluxei64_v_u64m8_m(vbool8_t vm, const uint64_t *rs1,
                                       vuint64m8_t rs2, size_t vl);

Vector Indexed Store Intrinsics

/*
 * Unmasked __riscv_vsoxei<N> indexed-store prototypes for _Float16 data
 * (vfloat16*_t). All return void.
 *
 * Operands shared by every declaration in this group:
 *   rs1 - _Float16 * base pointer (non-const: the destination)
 *   rs2 - unsigned index vector whose element width is the <N> after "ei"
 *   vs3 - the vfloat16*_t data vector named in the intrinsic suffix
 *   vl  - size_t operand
 *
 * NOTE(review): memory semantics are not visible in these declarations.
 * Presumably they wrap the RVV indexed-ordered store vsoxei<N>.v, with rs2
 * holding byte offsets from rs1 and vl the number of elements processed;
 * confirm against the RVV specification.
 */

/* 8-bit indices (index LMUL is half the data LMUL): mf4 through m8. */
void __riscv_vsoxei8_v_f16mf4(_Float16 *rs1, vuint8mf8_t rs2, vfloat16mf4_t vs3,
                              size_t vl);
void __riscv_vsoxei8_v_f16mf2(_Float16 *rs1, vuint8mf4_t rs2, vfloat16mf2_t vs3,
                              size_t vl);
void __riscv_vsoxei8_v_f16m1(_Float16 *rs1, vuint8mf2_t rs2, vfloat16m1_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_f16m2(_Float16 *rs1, vuint8m1_t rs2, vfloat16m2_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_f16m4(_Float16 *rs1, vuint8m2_t rs2, vfloat16m4_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_f16m8(_Float16 *rs1, vuint8m4_t rs2, vfloat16m8_t vs3,
                             size_t vl);
/* 16-bit indices (index LMUL equals the data LMUL): mf4 through m8. */
void __riscv_vsoxei16_v_f16mf4(_Float16 *rs1, vuint16mf4_t rs2,
                               vfloat16mf4_t vs3, size_t vl);
void __riscv_vsoxei16_v_f16mf2(_Float16 *rs1, vuint16mf2_t rs2,
                               vfloat16mf2_t vs3, size_t vl);
void __riscv_vsoxei16_v_f16m1(_Float16 *rs1, vuint16m1_t rs2, vfloat16m1_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_f16m2(_Float16 *rs1, vuint16m2_t rs2, vfloat16m2_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_f16m4(_Float16 *rs1, vuint16m4_t rs2, vfloat16m4_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_f16m8(_Float16 *rs1, vuint16m8_t rs2, vfloat16m8_t vs3,
                              size_t vl);
/*
 * 32-bit indices (index LMUL is twice the data LMUL). The list ends at
 * f16m4, whose index operand is already vuint32m8_t.
 */
void __riscv_vsoxei32_v_f16mf4(_Float16 *rs1, vuint32mf2_t rs2,
                               vfloat16mf4_t vs3, size_t vl);
void __riscv_vsoxei32_v_f16mf2(_Float16 *rs1, vuint32m1_t rs2,
                               vfloat16mf2_t vs3, size_t vl);
void __riscv_vsoxei32_v_f16m1(_Float16 *rs1, vuint32m2_t rs2, vfloat16m1_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_f16m2(_Float16 *rs1, vuint32m4_t rs2, vfloat16m2_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_f16m4(_Float16 *rs1, vuint32m8_t rs2, vfloat16m4_t vs3,
                              size_t vl);
/*
 * 64-bit indices (index LMUL is four times the data LMUL). The list ends at
 * f16m2, whose index operand is already vuint64m8_t.
 */
void __riscv_vsoxei64_v_f16mf4(_Float16 *rs1, vuint64m1_t rs2,
                               vfloat16mf4_t vs3, size_t vl);
void __riscv_vsoxei64_v_f16mf2(_Float16 *rs1, vuint64m2_t rs2,
                               vfloat16mf2_t vs3, size_t vl);
void __riscv_vsoxei64_v_f16m1(_Float16 *rs1, vuint64m4_t rs2, vfloat16m1_t vs3,
                              size_t vl);
void __riscv_vsoxei64_v_f16m2(_Float16 *rs1, vuint64m8_t rs2, vfloat16m2_t vs3,
                              size_t vl);
/*
 * Unmasked __riscv_vsoxei<N> indexed-store prototypes for float data
 * (vfloat32*_t). All return void.
 *
 * Operands shared by every declaration in this group:
 *   rs1 - float * base pointer (non-const: the destination)
 *   rs2 - unsigned index vector whose element width is the <N> after "ei"
 *   vs3 - the vfloat32*_t data vector named in the intrinsic suffix
 *   vl  - size_t operand
 *
 * NOTE(review): memory semantics are not visible in these declarations.
 * Presumably they wrap the RVV indexed-ordered store vsoxei<N>.v, with rs2
 * holding byte offsets from rs1 and vl the number of elements processed;
 * confirm against the RVV specification.
 */

/* 8-bit indices (index LMUL is a quarter of the data LMUL). */
void __riscv_vsoxei8_v_f32mf2(float *rs1, vuint8mf8_t rs2, vfloat32mf2_t vs3,
                              size_t vl);
void __riscv_vsoxei8_v_f32m1(float *rs1, vuint8mf4_t rs2, vfloat32m1_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_f32m2(float *rs1, vuint8mf2_t rs2, vfloat32m2_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_f32m4(float *rs1, vuint8m1_t rs2, vfloat32m4_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_f32m8(float *rs1, vuint8m2_t rs2, vfloat32m8_t vs3,
                             size_t vl);
/* 16-bit indices (index LMUL is half the data LMUL). */
void __riscv_vsoxei16_v_f32mf2(float *rs1, vuint16mf4_t rs2, vfloat32mf2_t vs3,
                               size_t vl);
void __riscv_vsoxei16_v_f32m1(float *rs1, vuint16mf2_t rs2, vfloat32m1_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_f32m2(float *rs1, vuint16m1_t rs2, vfloat32m2_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_f32m4(float *rs1, vuint16m2_t rs2, vfloat32m4_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_f32m8(float *rs1, vuint16m4_t rs2, vfloat32m8_t vs3,
                              size_t vl);
/* 32-bit indices (index LMUL equals the data LMUL). */
void __riscv_vsoxei32_v_f32mf2(float *rs1, vuint32mf2_t rs2, vfloat32mf2_t vs3,
                               size_t vl);
void __riscv_vsoxei32_v_f32m1(float *rs1, vuint32m1_t rs2, vfloat32m1_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_f32m2(float *rs1, vuint32m2_t rs2, vfloat32m2_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_f32m4(float *rs1, vuint32m4_t rs2, vfloat32m4_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_f32m8(float *rs1, vuint32m8_t rs2, vfloat32m8_t vs3,
                              size_t vl);
/*
 * 64-bit indices (index LMUL is twice the data LMUL). The list ends at
 * f32m4, whose index operand is already vuint64m8_t.
 */
void __riscv_vsoxei64_v_f32mf2(float *rs1, vuint64m1_t rs2, vfloat32mf2_t vs3,
                               size_t vl);
void __riscv_vsoxei64_v_f32m1(float *rs1, vuint64m2_t rs2, vfloat32m1_t vs3,
                              size_t vl);
void __riscv_vsoxei64_v_f32m2(float *rs1, vuint64m4_t rs2, vfloat32m2_t vs3,
                              size_t vl);
void __riscv_vsoxei64_v_f32m4(float *rs1, vuint64m8_t rs2, vfloat32m4_t vs3,
                              size_t vl);
/*
 * __riscv_vsoxei{8,16,32,64}_v_f64<lmul>: indexed-store prototypes for
 * `double` data.
 *
 *   rs1 - base pointer of the destination (double *)
 *   rs2 - unsigned index vector; its element width is the <N> in "ei<N>"
 *   vs3 - data vector (vfloat64<lmul>_t)
 *   vl  - size_t length argument (presumably the number of elements to
 *         process -- confirm against the intrinsics spec)
 *
 * The index vector's LMUL is the data LMUL scaled by N/64 (ei8: 1/8,
 * ei16: 1/4, ei32: 1/2, ei64: 1), so all four data LMULs (m1..m8) are
 * listed for every index width.
 *
 * NOTE(review): "vsoxei" is the RVV mnemonic for the indexed-ordered store,
 * and the RVV spec treats index values as byte offsets -- confirm both
 * against the spec before relying on them.
 */
void __riscv_vsoxei8_v_f64m1(double *rs1, vuint8mf8_t rs2, vfloat64m1_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_f64m2(double *rs1, vuint8mf4_t rs2, vfloat64m2_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_f64m4(double *rs1, vuint8mf2_t rs2, vfloat64m4_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_f64m8(double *rs1, vuint8m1_t rs2, vfloat64m8_t vs3,
                             size_t vl);
void __riscv_vsoxei16_v_f64m1(double *rs1, vuint16mf4_t rs2, vfloat64m1_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_f64m2(double *rs1, vuint16mf2_t rs2, vfloat64m2_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_f64m4(double *rs1, vuint16m1_t rs2, vfloat64m4_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_f64m8(double *rs1, vuint16m2_t rs2, vfloat64m8_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_f64m1(double *rs1, vuint32mf2_t rs2, vfloat64m1_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_f64m2(double *rs1, vuint32m1_t rs2, vfloat64m2_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_f64m4(double *rs1, vuint32m2_t rs2, vfloat64m4_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_f64m8(double *rs1, vuint32m4_t rs2, vfloat64m8_t vs3,
                              size_t vl);
void __riscv_vsoxei64_v_f64m1(double *rs1, vuint64m1_t rs2, vfloat64m1_t vs3,
                              size_t vl);
void __riscv_vsoxei64_v_f64m2(double *rs1, vuint64m2_t rs2, vfloat64m2_t vs3,
                              size_t vl);
void __riscv_vsoxei64_v_f64m4(double *rs1, vuint64m4_t rs2, vfloat64m4_t vs3,
                              size_t vl);
void __riscv_vsoxei64_v_f64m8(double *rs1, vuint64m8_t rs2, vfloat64m8_t vs3,
                              size_t vl);
/*
 * __riscv_vsuxei{8,16,32,64}_v_f16<lmul>: indexed-store prototypes for
 * `_Float16` data.
 *
 *   rs1 - base pointer of the destination (_Float16 *)
 *   rs2 - unsigned index vector; its element width is the <N> in "ei<N>"
 *   vs3 - data vector (vfloat16<lmul>_t)
 *   vl  - size_t length argument (presumably the number of elements to
 *         process -- confirm against the intrinsics spec)
 *
 * The index vector's LMUL is the data LMUL scaled by N/16 (ei8: 1/2,
 * ei16: 1, ei32: 2, ei64: 4). Consequently ei32 is listed only up to f16m4
 * and ei64 only up to f16m2.
 *
 * NOTE(review): "vsuxei" is the RVV mnemonic for the indexed-unordered
 * store, and the RVV spec treats index values as byte offsets -- confirm
 * both against the spec before relying on them.
 */
void __riscv_vsuxei8_v_f16mf4(_Float16 *rs1, vuint8mf8_t rs2, vfloat16mf4_t vs3,
                              size_t vl);
void __riscv_vsuxei8_v_f16mf2(_Float16 *rs1, vuint8mf4_t rs2, vfloat16mf2_t vs3,
                              size_t vl);
void __riscv_vsuxei8_v_f16m1(_Float16 *rs1, vuint8mf2_t rs2, vfloat16m1_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_f16m2(_Float16 *rs1, vuint8m1_t rs2, vfloat16m2_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_f16m4(_Float16 *rs1, vuint8m2_t rs2, vfloat16m4_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_f16m8(_Float16 *rs1, vuint8m4_t rs2, vfloat16m8_t vs3,
                             size_t vl);
void __riscv_vsuxei16_v_f16mf4(_Float16 *rs1, vuint16mf4_t rs2,
                               vfloat16mf4_t vs3, size_t vl);
void __riscv_vsuxei16_v_f16mf2(_Float16 *rs1, vuint16mf2_t rs2,
                               vfloat16mf2_t vs3, size_t vl);
void __riscv_vsuxei16_v_f16m1(_Float16 *rs1, vuint16m1_t rs2, vfloat16m1_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_f16m2(_Float16 *rs1, vuint16m2_t rs2, vfloat16m2_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_f16m4(_Float16 *rs1, vuint16m4_t rs2, vfloat16m4_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_f16m8(_Float16 *rs1, vuint16m8_t rs2, vfloat16m8_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_f16mf4(_Float16 *rs1, vuint32mf2_t rs2,
                               vfloat16mf4_t vs3, size_t vl);
void __riscv_vsuxei32_v_f16mf2(_Float16 *rs1, vuint32m1_t rs2,
                               vfloat16mf2_t vs3, size_t vl);
void __riscv_vsuxei32_v_f16m1(_Float16 *rs1, vuint32m2_t rs2, vfloat16m1_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_f16m2(_Float16 *rs1, vuint32m4_t rs2, vfloat16m2_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_f16m4(_Float16 *rs1, vuint32m8_t rs2, vfloat16m4_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_f16mf4(_Float16 *rs1, vuint64m1_t rs2,
                               vfloat16mf4_t vs3, size_t vl);
void __riscv_vsuxei64_v_f16mf2(_Float16 *rs1, vuint64m2_t rs2,
                               vfloat16mf2_t vs3, size_t vl);
void __riscv_vsuxei64_v_f16m1(_Float16 *rs1, vuint64m4_t rs2, vfloat16m1_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_f16m2(_Float16 *rs1, vuint64m8_t rs2, vfloat16m2_t vs3,
                              size_t vl);
/*
 * __riscv_vsuxei{8,16,32,64}_v_f32<lmul>: indexed-store prototypes for
 * `float` data.
 *
 *   rs1 - base pointer of the destination (float *)
 *   rs2 - unsigned index vector; its element width is the <N> in "ei<N>"
 *   vs3 - data vector (vfloat32<lmul>_t)
 *   vl  - size_t length argument (presumably the number of elements to
 *         process -- confirm against the intrinsics spec)
 *
 * The index vector's LMUL is the data LMUL scaled by N/32 (ei8: 1/4,
 * ei16: 1/2, ei32: 1, ei64: 2). Consequently no f32m8 variant is listed
 * for ei64.
 *
 * NOTE(review): "vsuxei" is the RVV mnemonic for the indexed-unordered
 * store, and the RVV spec treats index values as byte offsets -- confirm
 * both against the spec before relying on them.
 */
void __riscv_vsuxei8_v_f32mf2(float *rs1, vuint8mf8_t rs2, vfloat32mf2_t vs3,
                              size_t vl);
void __riscv_vsuxei8_v_f32m1(float *rs1, vuint8mf4_t rs2, vfloat32m1_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_f32m2(float *rs1, vuint8mf2_t rs2, vfloat32m2_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_f32m4(float *rs1, vuint8m1_t rs2, vfloat32m4_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_f32m8(float *rs1, vuint8m2_t rs2, vfloat32m8_t vs3,
                             size_t vl);
void __riscv_vsuxei16_v_f32mf2(float *rs1, vuint16mf4_t rs2, vfloat32mf2_t vs3,
                               size_t vl);
void __riscv_vsuxei16_v_f32m1(float *rs1, vuint16mf2_t rs2, vfloat32m1_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_f32m2(float *rs1, vuint16m1_t rs2, vfloat32m2_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_f32m4(float *rs1, vuint16m2_t rs2, vfloat32m4_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_f32m8(float *rs1, vuint16m4_t rs2, vfloat32m8_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_f32mf2(float *rs1, vuint32mf2_t rs2, vfloat32mf2_t vs3,
                               size_t vl);
void __riscv_vsuxei32_v_f32m1(float *rs1, vuint32m1_t rs2, vfloat32m1_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_f32m2(float *rs1, vuint32m2_t rs2, vfloat32m2_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_f32m4(float *rs1, vuint32m4_t rs2, vfloat32m4_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_f32m8(float *rs1, vuint32m8_t rs2, vfloat32m8_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_f32mf2(float *rs1, vuint64m1_t rs2, vfloat32mf2_t vs3,
                               size_t vl);
void __riscv_vsuxei64_v_f32m1(float *rs1, vuint64m2_t rs2, vfloat32m1_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_f32m2(float *rs1, vuint64m4_t rs2, vfloat32m2_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_f32m4(float *rs1, vuint64m8_t rs2, vfloat32m4_t vs3,
                              size_t vl);
/*
 * __riscv_vsuxei{8,16,32,64}_v_f64<lmul>: indexed-store prototypes for
 * `double` data.
 *
 *   rs1 - base pointer of the destination (double *)
 *   rs2 - unsigned index vector; its element width is the <N> in "ei<N>"
 *   vs3 - data vector (vfloat64<lmul>_t)
 *   vl  - size_t length argument (presumably the number of elements to
 *         process -- confirm against the intrinsics spec)
 *
 * The index vector's LMUL is the data LMUL scaled by N/64 (ei8: 1/8,
 * ei16: 1/4, ei32: 1/2, ei64: 1), so all four data LMULs (m1..m8) are
 * listed for every index width.
 *
 * NOTE(review): "vsuxei" is the RVV mnemonic for the indexed-unordered
 * store, and the RVV spec treats index values as byte offsets -- confirm
 * both against the spec before relying on them.
 */
void __riscv_vsuxei8_v_f64m1(double *rs1, vuint8mf8_t rs2, vfloat64m1_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_f64m2(double *rs1, vuint8mf4_t rs2, vfloat64m2_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_f64m4(double *rs1, vuint8mf2_t rs2, vfloat64m4_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_f64m8(double *rs1, vuint8m1_t rs2, vfloat64m8_t vs3,
                             size_t vl);
void __riscv_vsuxei16_v_f64m1(double *rs1, vuint16mf4_t rs2, vfloat64m1_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_f64m2(double *rs1, vuint16mf2_t rs2, vfloat64m2_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_f64m4(double *rs1, vuint16m1_t rs2, vfloat64m4_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_f64m8(double *rs1, vuint16m2_t rs2, vfloat64m8_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_f64m1(double *rs1, vuint32mf2_t rs2, vfloat64m1_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_f64m2(double *rs1, vuint32m1_t rs2, vfloat64m2_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_f64m4(double *rs1, vuint32m2_t rs2, vfloat64m4_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_f64m8(double *rs1, vuint32m4_t rs2, vfloat64m8_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_f64m1(double *rs1, vuint64m1_t rs2, vfloat64m1_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_f64m2(double *rs1, vuint64m2_t rs2, vfloat64m2_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_f64m4(double *rs1, vuint64m4_t rs2, vfloat64m4_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_f64m8(double *rs1, vuint64m8_t rs2, vfloat64m8_t vs3,
                              size_t vl);
/*
 * __riscv_vsoxei{8,16,32,64}_v_i8<lmul>: indexed-store prototypes for
 * `int8_t` data.
 *
 *   rs1 - base pointer of the destination (int8_t *)
 *   rs2 - unsigned index vector; its element width is the <N> in "ei<N>"
 *   vs3 - data vector (vint8<lmul>_t)
 *   vl  - size_t length argument (presumably the number of elements to
 *         process -- confirm against the intrinsics spec)
 *
 * The index vector's LMUL is the data LMUL scaled by N/8 (ei8: 1, ei16: 2,
 * ei32: 4, ei64: 8). Consequently ei16 is listed only up to i8m4, ei32 up
 * to i8m2, and ei64 up to i8m1.
 *
 * NOTE(review): "vsoxei" is the RVV mnemonic for the indexed-ordered store,
 * and the RVV spec treats index values as byte offsets -- confirm both
 * against the spec before relying on them.
 */
void __riscv_vsoxei8_v_i8mf8(int8_t *rs1, vuint8mf8_t rs2, vint8mf8_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_i8mf4(int8_t *rs1, vuint8mf4_t rs2, vint8mf4_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_i8mf2(int8_t *rs1, vuint8mf2_t rs2, vint8mf2_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_i8m1(int8_t *rs1, vuint8m1_t rs2, vint8m1_t vs3,
                            size_t vl);
void __riscv_vsoxei8_v_i8m2(int8_t *rs1, vuint8m2_t rs2, vint8m2_t vs3,
                            size_t vl);
void __riscv_vsoxei8_v_i8m4(int8_t *rs1, vuint8m4_t rs2, vint8m4_t vs3,
                            size_t vl);
void __riscv_vsoxei8_v_i8m8(int8_t *rs1, vuint8m8_t rs2, vint8m8_t vs3,
                            size_t vl);
void __riscv_vsoxei16_v_i8mf8(int8_t *rs1, vuint16mf4_t rs2, vint8mf8_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_i8mf4(int8_t *rs1, vuint16mf2_t rs2, vint8mf4_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_i8mf2(int8_t *rs1, vuint16m1_t rs2, vint8mf2_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_i8m1(int8_t *rs1, vuint16m2_t rs2, vint8m1_t vs3,
                             size_t vl);
void __riscv_vsoxei16_v_i8m2(int8_t *rs1, vuint16m4_t rs2, vint8m2_t vs3,
                             size_t vl);
void __riscv_vsoxei16_v_i8m4(int8_t *rs1, vuint16m8_t rs2, vint8m4_t vs3,
                             size_t vl);
void __riscv_vsoxei32_v_i8mf8(int8_t *rs1, vuint32mf2_t rs2, vint8mf8_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_i8mf4(int8_t *rs1, vuint32m1_t rs2, vint8mf4_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_i8mf2(int8_t *rs1, vuint32m2_t rs2, vint8mf2_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_i8m1(int8_t *rs1, vuint32m4_t rs2, vint8m1_t vs3,
                             size_t vl);
void __riscv_vsoxei32_v_i8m2(int8_t *rs1, vuint32m8_t rs2, vint8m2_t vs3,
                             size_t vl);
void __riscv_vsoxei64_v_i8mf8(int8_t *rs1, vuint64m1_t rs2, vint8mf8_t vs3,
                              size_t vl);
void __riscv_vsoxei64_v_i8mf4(int8_t *rs1, vuint64m2_t rs2, vint8mf4_t vs3,
                              size_t vl);
void __riscv_vsoxei64_v_i8mf2(int8_t *rs1, vuint64m4_t rs2, vint8mf2_t vs3,
                              size_t vl);
void __riscv_vsoxei64_v_i8m1(int8_t *rs1, vuint64m8_t rs2, vint8m1_t vs3,
                             size_t vl);
/*
 * __riscv_vsoxei{8,16,32,64}_v_i16<lmul>: indexed-store prototypes for
 * `int16_t` data.
 *
 *   rs1 - base pointer of the destination (int16_t *)
 *   rs2 - unsigned index vector; its element width is the <N> in "ei<N>"
 *   vs3 - data vector (vint16<lmul>_t)
 *   vl  - size_t length argument (presumably the number of elements to
 *         process -- confirm against the intrinsics spec)
 *
 * The index vector's LMUL is the data LMUL scaled by N/16 (ei8: 1/2,
 * ei16: 1, ei32: 2, ei64: 4). Consequently ei32 is listed only up to i16m4
 * and ei64 only up to i16m2.
 *
 * NOTE(review): "vsoxei" is the RVV mnemonic for the indexed-ordered store,
 * and the RVV spec treats index values as byte offsets -- confirm both
 * against the spec before relying on them.
 */
void __riscv_vsoxei8_v_i16mf4(int16_t *rs1, vuint8mf8_t rs2, vint16mf4_t vs3,
                              size_t vl);
void __riscv_vsoxei8_v_i16mf2(int16_t *rs1, vuint8mf4_t rs2, vint16mf2_t vs3,
                              size_t vl);
void __riscv_vsoxei8_v_i16m1(int16_t *rs1, vuint8mf2_t rs2, vint16m1_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_i16m2(int16_t *rs1, vuint8m1_t rs2, vint16m2_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_i16m4(int16_t *rs1, vuint8m2_t rs2, vint16m4_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_i16m8(int16_t *rs1, vuint8m4_t rs2, vint16m8_t vs3,
                             size_t vl);
void __riscv_vsoxei16_v_i16mf4(int16_t *rs1, vuint16mf4_t rs2, vint16mf4_t vs3,
                               size_t vl);
void __riscv_vsoxei16_v_i16mf2(int16_t *rs1, vuint16mf2_t rs2, vint16mf2_t vs3,
                               size_t vl);
void __riscv_vsoxei16_v_i16m1(int16_t *rs1, vuint16m1_t rs2, vint16m1_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_i16m2(int16_t *rs1, vuint16m2_t rs2, vint16m2_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_i16m4(int16_t *rs1, vuint16m4_t rs2, vint16m4_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_i16m8(int16_t *rs1, vuint16m8_t rs2, vint16m8_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_i16mf4(int16_t *rs1, vuint32mf2_t rs2, vint16mf4_t vs3,
                               size_t vl);
void __riscv_vsoxei32_v_i16mf2(int16_t *rs1, vuint32m1_t rs2, vint16mf2_t vs3,
                               size_t vl);
void __riscv_vsoxei32_v_i16m1(int16_t *rs1, vuint32m2_t rs2, vint16m1_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_i16m2(int16_t *rs1, vuint32m4_t rs2, vint16m2_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_i16m4(int16_t *rs1, vuint32m8_t rs2, vint16m4_t vs3,
                              size_t vl);
void __riscv_vsoxei64_v_i16mf4(int16_t *rs1, vuint64m1_t rs2, vint16mf4_t vs3,
                               size_t vl);
void __riscv_vsoxei64_v_i16mf2(int16_t *rs1, vuint64m2_t rs2, vint16mf2_t vs3,
                               size_t vl);
void __riscv_vsoxei64_v_i16m1(int16_t *rs1, vuint64m4_t rs2, vint16m1_t vs3,
                              size_t vl);
void __riscv_vsoxei64_v_i16m2(int16_t *rs1, vuint64m8_t rs2, vint16m2_t vs3,
                              size_t vl);
/*
 * __riscv_vsoxei{8,16,32,64}_v_i32<lmul>: indexed-store prototypes for
 * `int32_t` data.
 *
 *   rs1 - base pointer of the destination (int32_t *)
 *   rs2 - unsigned index vector; its element width is the <N> in "ei<N>"
 *   vs3 - data vector (vint32<lmul>_t)
 *   vl  - size_t length argument (presumably the number of elements to
 *         process -- confirm against the intrinsics spec)
 *
 * The index vector's LMUL is the data LMUL scaled by N/32 (ei8: 1/4,
 * ei16: 1/2, ei32: 1, ei64: 2). Consequently no i32m8 variant is listed
 * for ei64.
 *
 * NOTE(review): "vsoxei" is the RVV mnemonic for the indexed-ordered store,
 * and the RVV spec treats index values as byte offsets -- confirm both
 * against the spec before relying on them.
 */
void __riscv_vsoxei8_v_i32mf2(int32_t *rs1, vuint8mf8_t rs2, vint32mf2_t vs3,
                              size_t vl);
void __riscv_vsoxei8_v_i32m1(int32_t *rs1, vuint8mf4_t rs2, vint32m1_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_i32m2(int32_t *rs1, vuint8mf2_t rs2, vint32m2_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_i32m4(int32_t *rs1, vuint8m1_t rs2, vint32m4_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_i32m8(int32_t *rs1, vuint8m2_t rs2, vint32m8_t vs3,
                             size_t vl);
void __riscv_vsoxei16_v_i32mf2(int32_t *rs1, vuint16mf4_t rs2, vint32mf2_t vs3,
                               size_t vl);
void __riscv_vsoxei16_v_i32m1(int32_t *rs1, vuint16mf2_t rs2, vint32m1_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_i32m2(int32_t *rs1, vuint16m1_t rs2, vint32m2_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_i32m4(int32_t *rs1, vuint16m2_t rs2, vint32m4_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_i32m8(int32_t *rs1, vuint16m4_t rs2, vint32m8_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_i32mf2(int32_t *rs1, vuint32mf2_t rs2, vint32mf2_t vs3,
                               size_t vl);
void __riscv_vsoxei32_v_i32m1(int32_t *rs1, vuint32m1_t rs2, vint32m1_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_i32m2(int32_t *rs1, vuint32m2_t rs2, vint32m2_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_i32m4(int32_t *rs1, vuint32m4_t rs2, vint32m4_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_i32m8(int32_t *rs1, vuint32m8_t rs2, vint32m8_t vs3,
                              size_t vl);
void __riscv_vsoxei64_v_i32mf2(int32_t *rs1, vuint64m1_t rs2, vint32mf2_t vs3,
                               size_t vl);
void __riscv_vsoxei64_v_i32m1(int32_t *rs1, vuint64m2_t rs2, vint32m1_t vs3,
                              size_t vl);
void __riscv_vsoxei64_v_i32m2(int32_t *rs1, vuint64m4_t rs2, vint32m2_t vs3,
                              size_t vl);
void __riscv_vsoxei64_v_i32m4(int32_t *rs1, vuint64m8_t rs2, vint32m4_t vs3,
                              size_t vl);
/*
 * __riscv_vsoxei{8,16,32,64}_v_i64<lmul>: indexed-store prototypes for
 * `int64_t` data.
 *
 *   rs1 - base pointer of the destination (int64_t *)
 *   rs2 - unsigned index vector; its element width is the <N> in "ei<N>"
 *   vs3 - data vector (vint64<lmul>_t)
 *   vl  - size_t length argument (presumably the number of elements to
 *         process -- confirm against the intrinsics spec)
 *
 * The index vector's LMUL is the data LMUL scaled by N/64 (ei8: 1/8,
 * ei16: 1/4, ei32: 1/2, ei64: 1), so all four data LMULs (m1..m8) are
 * listed for every index width.
 *
 * NOTE(review): "vsoxei" is the RVV mnemonic for the indexed-ordered store,
 * and the RVV spec treats index values as byte offsets -- confirm both
 * against the spec before relying on them.
 */
void __riscv_vsoxei8_v_i64m1(int64_t *rs1, vuint8mf8_t rs2, vint64m1_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_i64m2(int64_t *rs1, vuint8mf4_t rs2, vint64m2_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_i64m4(int64_t *rs1, vuint8mf2_t rs2, vint64m4_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_i64m8(int64_t *rs1, vuint8m1_t rs2, vint64m8_t vs3,
                             size_t vl);
void __riscv_vsoxei16_v_i64m1(int64_t *rs1, vuint16mf4_t rs2, vint64m1_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_i64m2(int64_t *rs1, vuint16mf2_t rs2, vint64m2_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_i64m4(int64_t *rs1, vuint16m1_t rs2, vint64m4_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_i64m8(int64_t *rs1, vuint16m2_t rs2, vint64m8_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_i64m1(int64_t *rs1, vuint32mf2_t rs2, vint64m1_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_i64m2(int64_t *rs1, vuint32m1_t rs2, vint64m2_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_i64m4(int64_t *rs1, vuint32m2_t rs2, vint64m4_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_i64m8(int64_t *rs1, vuint32m4_t rs2, vint64m8_t vs3,
                              size_t vl);
void __riscv_vsoxei64_v_i64m1(int64_t *rs1, vuint64m1_t rs2, vint64m1_t vs3,
                              size_t vl);
void __riscv_vsoxei64_v_i64m2(int64_t *rs1, vuint64m2_t rs2, vint64m2_t vs3,
                              size_t vl);
void __riscv_vsoxei64_v_i64m4(int64_t *rs1, vuint64m4_t rs2, vint64m4_t vs3,
                              size_t vl);
void __riscv_vsoxei64_v_i64m8(int64_t *rs1, vuint64m8_t rs2, vint64m8_t vs3,
                              size_t vl);
/*
 * __riscv_vsuxei{8,16,32,64}_v_i8<lmul>: indexed-store prototypes for
 * `int8_t` data.
 *
 *   rs1 - base pointer of the destination (int8_t *)
 *   rs2 - unsigned index vector; its element width is the <N> in "ei<N>"
 *   vs3 - data vector (vint8<lmul>_t)
 *   vl  - size_t length argument (presumably the number of elements to
 *         process -- confirm against the intrinsics spec)
 *
 * The index vector's LMUL is the data LMUL scaled by N/8 (ei8: 1, ei16: 2,
 * ei32: 4, ei64: 8). Consequently ei16 is listed only up to i8m4, ei32 up
 * to i8m2, and ei64 up to i8m1.
 *
 * NOTE(review): "vsuxei" is the RVV mnemonic for the indexed-unordered
 * store, and the RVV spec treats index values as byte offsets -- confirm
 * both against the spec before relying on them.
 */
void __riscv_vsuxei8_v_i8mf8(int8_t *rs1, vuint8mf8_t rs2, vint8mf8_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_i8mf4(int8_t *rs1, vuint8mf4_t rs2, vint8mf4_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_i8mf2(int8_t *rs1, vuint8mf2_t rs2, vint8mf2_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_i8m1(int8_t *rs1, vuint8m1_t rs2, vint8m1_t vs3,
                            size_t vl);
void __riscv_vsuxei8_v_i8m2(int8_t *rs1, vuint8m2_t rs2, vint8m2_t vs3,
                            size_t vl);
void __riscv_vsuxei8_v_i8m4(int8_t *rs1, vuint8m4_t rs2, vint8m4_t vs3,
                            size_t vl);
void __riscv_vsuxei8_v_i8m8(int8_t *rs1, vuint8m8_t rs2, vint8m8_t vs3,
                            size_t vl);
void __riscv_vsuxei16_v_i8mf8(int8_t *rs1, vuint16mf4_t rs2, vint8mf8_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_i8mf4(int8_t *rs1, vuint16mf2_t rs2, vint8mf4_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_i8mf2(int8_t *rs1, vuint16m1_t rs2, vint8mf2_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_i8m1(int8_t *rs1, vuint16m2_t rs2, vint8m1_t vs3,
                             size_t vl);
void __riscv_vsuxei16_v_i8m2(int8_t *rs1, vuint16m4_t rs2, vint8m2_t vs3,
                             size_t vl);
void __riscv_vsuxei16_v_i8m4(int8_t *rs1, vuint16m8_t rs2, vint8m4_t vs3,
                             size_t vl);
void __riscv_vsuxei32_v_i8mf8(int8_t *rs1, vuint32mf2_t rs2, vint8mf8_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_i8mf4(int8_t *rs1, vuint32m1_t rs2, vint8mf4_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_i8mf2(int8_t *rs1, vuint32m2_t rs2, vint8mf2_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_i8m1(int8_t *rs1, vuint32m4_t rs2, vint8m1_t vs3,
                             size_t vl);
void __riscv_vsuxei32_v_i8m2(int8_t *rs1, vuint32m8_t rs2, vint8m2_t vs3,
                             size_t vl);
void __riscv_vsuxei64_v_i8mf8(int8_t *rs1, vuint64m1_t rs2, vint8mf8_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_i8mf4(int8_t *rs1, vuint64m2_t rs2, vint8mf4_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_i8mf2(int8_t *rs1, vuint64m4_t rs2, vint8mf2_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_i8m1(int8_t *rs1, vuint64m8_t rs2, vint8m1_t vs3,
                             size_t vl);
/*
 * __riscv_vsuxei{8,16,32,64}_v_i16<lmul>: indexed-store prototypes for
 * `int16_t` data.
 *
 *   rs1 - base pointer of the destination (int16_t *)
 *   rs2 - unsigned index vector; its element width is the <N> in "ei<N>"
 *   vs3 - data vector (vint16<lmul>_t)
 *   vl  - size_t length argument (presumably the number of elements to
 *         process -- confirm against the intrinsics spec)
 *
 * The index vector's LMUL is the data LMUL scaled by N/16 (ei8: 1/2,
 * ei16: 1, ei32: 2, ei64: 4). Consequently ei32 is listed only up to i16m4
 * and ei64 only up to i16m2.
 *
 * NOTE(review): "vsuxei" is the RVV mnemonic for the indexed-unordered
 * store, and the RVV spec treats index values as byte offsets -- confirm
 * both against the spec before relying on them.
 */
void __riscv_vsuxei8_v_i16mf4(int16_t *rs1, vuint8mf8_t rs2, vint16mf4_t vs3,
                              size_t vl);
void __riscv_vsuxei8_v_i16mf2(int16_t *rs1, vuint8mf4_t rs2, vint16mf2_t vs3,
                              size_t vl);
void __riscv_vsuxei8_v_i16m1(int16_t *rs1, vuint8mf2_t rs2, vint16m1_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_i16m2(int16_t *rs1, vuint8m1_t rs2, vint16m2_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_i16m4(int16_t *rs1, vuint8m2_t rs2, vint16m4_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_i16m8(int16_t *rs1, vuint8m4_t rs2, vint16m8_t vs3,
                             size_t vl);
void __riscv_vsuxei16_v_i16mf4(int16_t *rs1, vuint16mf4_t rs2, vint16mf4_t vs3,
                               size_t vl);
void __riscv_vsuxei16_v_i16mf2(int16_t *rs1, vuint16mf2_t rs2, vint16mf2_t vs3,
                               size_t vl);
void __riscv_vsuxei16_v_i16m1(int16_t *rs1, vuint16m1_t rs2, vint16m1_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_i16m2(int16_t *rs1, vuint16m2_t rs2, vint16m2_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_i16m4(int16_t *rs1, vuint16m4_t rs2, vint16m4_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_i16m8(int16_t *rs1, vuint16m8_t rs2, vint16m8_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_i16mf4(int16_t *rs1, vuint32mf2_t rs2, vint16mf4_t vs3,
                               size_t vl);
void __riscv_vsuxei32_v_i16mf2(int16_t *rs1, vuint32m1_t rs2, vint16mf2_t vs3,
                               size_t vl);
void __riscv_vsuxei32_v_i16m1(int16_t *rs1, vuint32m2_t rs2, vint16m1_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_i16m2(int16_t *rs1, vuint32m4_t rs2, vint16m2_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_i16m4(int16_t *rs1, vuint32m8_t rs2, vint16m4_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_i16mf4(int16_t *rs1, vuint64m1_t rs2, vint16mf4_t vs3,
                               size_t vl);
void __riscv_vsuxei64_v_i16mf2(int16_t *rs1, vuint64m2_t rs2, vint16mf2_t vs3,
                               size_t vl);
void __riscv_vsuxei64_v_i16m1(int16_t *rs1, vuint64m4_t rs2, vint16m1_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_i16m2(int16_t *rs1, vuint64m8_t rs2, vint16m2_t vs3,
                              size_t vl);
/*
 * __riscv_vsuxei{8,16,32,64}_v_i32<lmul>: indexed-store prototypes for
 * `int32_t` data.
 *
 *   rs1 - base pointer of the destination (int32_t *)
 *   rs2 - unsigned index vector; its element width is the <N> in "ei<N>"
 *   vs3 - data vector (vint32<lmul>_t)
 *   vl  - size_t length argument (presumably the number of elements to
 *         process -- confirm against the intrinsics spec)
 *
 * The index vector's LMUL is the data LMUL scaled by N/32 (ei8: 1/4,
 * ei16: 1/2, ei32: 1, ei64: 2). Consequently no i32m8 variant is listed
 * for ei64.
 *
 * NOTE(review): "vsuxei" is the RVV mnemonic for the indexed-unordered
 * store, and the RVV spec treats index values as byte offsets -- confirm
 * both against the spec before relying on them.
 */
void __riscv_vsuxei8_v_i32mf2(int32_t *rs1, vuint8mf8_t rs2, vint32mf2_t vs3,
                              size_t vl);
void __riscv_vsuxei8_v_i32m1(int32_t *rs1, vuint8mf4_t rs2, vint32m1_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_i32m2(int32_t *rs1, vuint8mf2_t rs2, vint32m2_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_i32m4(int32_t *rs1, vuint8m1_t rs2, vint32m4_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_i32m8(int32_t *rs1, vuint8m2_t rs2, vint32m8_t vs3,
                             size_t vl);
void __riscv_vsuxei16_v_i32mf2(int32_t *rs1, vuint16mf4_t rs2, vint32mf2_t vs3,
                               size_t vl);
void __riscv_vsuxei16_v_i32m1(int32_t *rs1, vuint16mf2_t rs2, vint32m1_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_i32m2(int32_t *rs1, vuint16m1_t rs2, vint32m2_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_i32m4(int32_t *rs1, vuint16m2_t rs2, vint32m4_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_i32m8(int32_t *rs1, vuint16m4_t rs2, vint32m8_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_i32mf2(int32_t *rs1, vuint32mf2_t rs2, vint32mf2_t vs3,
                               size_t vl);
void __riscv_vsuxei32_v_i32m1(int32_t *rs1, vuint32m1_t rs2, vint32m1_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_i32m2(int32_t *rs1, vuint32m2_t rs2, vint32m2_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_i32m4(int32_t *rs1, vuint32m4_t rs2, vint32m4_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_i32m8(int32_t *rs1, vuint32m8_t rs2, vint32m8_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_i32mf2(int32_t *rs1, vuint64m1_t rs2, vint32mf2_t vs3,
                               size_t vl);
void __riscv_vsuxei64_v_i32m1(int32_t *rs1, vuint64m2_t rs2, vint32m1_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_i32m2(int32_t *rs1, vuint64m4_t rs2, vint32m2_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_i32m4(int32_t *rs1, vuint64m8_t rs2, vint32m4_t vs3,
                              size_t vl);
/*
 * __riscv_vsuxei{8,16,32,64}_v_i64<lmul>: indexed-store prototypes for
 * `int64_t` data.
 *
 *   rs1 - base pointer of the destination (int64_t *)
 *   rs2 - unsigned index vector; its element width is the <N> in "ei<N>"
 *   vs3 - data vector (vint64<lmul>_t)
 *   vl  - size_t length argument (presumably the number of elements to
 *         process -- confirm against the intrinsics spec)
 *
 * The index vector's LMUL is the data LMUL scaled by N/64 (ei8: 1/8,
 * ei16: 1/4, ei32: 1/2, ei64: 1), so all four data LMULs (m1..m8) are
 * listed for every index width.
 *
 * NOTE(review): "vsuxei" is the RVV mnemonic for the indexed-unordered
 * store, and the RVV spec treats index values as byte offsets -- confirm
 * both against the spec before relying on them.
 */
void __riscv_vsuxei8_v_i64m1(int64_t *rs1, vuint8mf8_t rs2, vint64m1_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_i64m2(int64_t *rs1, vuint8mf4_t rs2, vint64m2_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_i64m4(int64_t *rs1, vuint8mf2_t rs2, vint64m4_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_i64m8(int64_t *rs1, vuint8m1_t rs2, vint64m8_t vs3,
                             size_t vl);
void __riscv_vsuxei16_v_i64m1(int64_t *rs1, vuint16mf4_t rs2, vint64m1_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_i64m2(int64_t *rs1, vuint16mf2_t rs2, vint64m2_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_i64m4(int64_t *rs1, vuint16m1_t rs2, vint64m4_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_i64m8(int64_t *rs1, vuint16m2_t rs2, vint64m8_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_i64m1(int64_t *rs1, vuint32mf2_t rs2, vint64m1_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_i64m2(int64_t *rs1, vuint32m1_t rs2, vint64m2_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_i64m4(int64_t *rs1, vuint32m2_t rs2, vint64m4_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_i64m8(int64_t *rs1, vuint32m4_t rs2, vint64m8_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_i64m1(int64_t *rs1, vuint64m1_t rs2, vint64m1_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_i64m2(int64_t *rs1, vuint64m2_t rs2, vint64m2_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_i64m4(int64_t *rs1, vuint64m4_t rs2, vint64m4_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_i64m8(int64_t *rs1, vuint64m8_t rs2, vint64m8_t vs3,
                              size_t vl);
/*
 * __riscv_vsoxei{8,16,32,64}_v_u8<lmul>: indexed-store prototypes for
 * `uint8_t` data.
 *
 *   rs1 - base pointer of the destination (uint8_t *)
 *   rs2 - unsigned index vector; its element width is the <N> in "ei<N>"
 *   vs3 - data vector (vuint8<lmul>_t)
 *   vl  - size_t length argument (presumably the number of elements to
 *         process -- confirm against the intrinsics spec)
 *
 * The index vector's LMUL is the data LMUL scaled by N/8 (ei8: 1, ei16: 2,
 * ei32: 4, ei64: 8). Consequently ei16 is listed only up to u8m4, ei32 up
 * to u8m2, and ei64 up to u8m1. For ei8 the index and data vectors share
 * the same type, so argument order (rs2 = index, vs3 = data) matters.
 *
 * NOTE(review): "vsoxei" is the RVV mnemonic for the indexed-ordered store,
 * and the RVV spec treats index values as byte offsets -- confirm both
 * against the spec before relying on them.
 */
void __riscv_vsoxei8_v_u8mf8(uint8_t *rs1, vuint8mf8_t rs2, vuint8mf8_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_u8mf4(uint8_t *rs1, vuint8mf4_t rs2, vuint8mf4_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_u8mf2(uint8_t *rs1, vuint8mf2_t rs2, vuint8mf2_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_u8m1(uint8_t *rs1, vuint8m1_t rs2, vuint8m1_t vs3,
                            size_t vl);
void __riscv_vsoxei8_v_u8m2(uint8_t *rs1, vuint8m2_t rs2, vuint8m2_t vs3,
                            size_t vl);
void __riscv_vsoxei8_v_u8m4(uint8_t *rs1, vuint8m4_t rs2, vuint8m4_t vs3,
                            size_t vl);
void __riscv_vsoxei8_v_u8m8(uint8_t *rs1, vuint8m8_t rs2, vuint8m8_t vs3,
                            size_t vl);
void __riscv_vsoxei16_v_u8mf8(uint8_t *rs1, vuint16mf4_t rs2, vuint8mf8_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_u8mf4(uint8_t *rs1, vuint16mf2_t rs2, vuint8mf4_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_u8mf2(uint8_t *rs1, vuint16m1_t rs2, vuint8mf2_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_u8m1(uint8_t *rs1, vuint16m2_t rs2, vuint8m1_t vs3,
                             size_t vl);
void __riscv_vsoxei16_v_u8m2(uint8_t *rs1, vuint16m4_t rs2, vuint8m2_t vs3,
                             size_t vl);
void __riscv_vsoxei16_v_u8m4(uint8_t *rs1, vuint16m8_t rs2, vuint8m4_t vs3,
                             size_t vl);
void __riscv_vsoxei32_v_u8mf8(uint8_t *rs1, vuint32mf2_t rs2, vuint8mf8_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_u8mf4(uint8_t *rs1, vuint32m1_t rs2, vuint8mf4_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_u8mf2(uint8_t *rs1, vuint32m2_t rs2, vuint8mf2_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_u8m1(uint8_t *rs1, vuint32m4_t rs2, vuint8m1_t vs3,
                             size_t vl);
void __riscv_vsoxei32_v_u8m2(uint8_t *rs1, vuint32m8_t rs2, vuint8m2_t vs3,
                             size_t vl);
void __riscv_vsoxei64_v_u8mf8(uint8_t *rs1, vuint64m1_t rs2, vuint8mf8_t vs3,
                              size_t vl);
void __riscv_vsoxei64_v_u8mf4(uint8_t *rs1, vuint64m2_t rs2, vuint8mf4_t vs3,
                              size_t vl);
void __riscv_vsoxei64_v_u8mf2(uint8_t *rs1, vuint64m4_t rs2, vuint8mf2_t vs3,
                              size_t vl);
void __riscv_vsoxei64_v_u8m1(uint8_t *rs1, vuint64m8_t rs2, vuint8m1_t vs3,
                             size_t vl);
/*
 * __riscv_vsoxei{8,16,32,64}_v_u16<lmul>: indexed-store prototypes for
 * `uint16_t` data.
 *
 *   rs1 - base pointer of the destination (uint16_t *)
 *   rs2 - unsigned index vector; its element width is the <N> in "ei<N>"
 *   vs3 - data vector (vuint16<lmul>_t)
 *   vl  - size_t length argument (presumably the number of elements to
 *         process -- confirm against the intrinsics spec)
 *
 * The index vector's LMUL is the data LMUL scaled by N/16 (ei8: 1/2,
 * ei16: 1, ei32: 2, ei64: 4). Consequently ei32 is listed only up to u16m4
 * and ei64 only up to u16m2. For ei16 the index and data vectors share the
 * same type, so argument order (rs2 = index, vs3 = data) matters.
 *
 * NOTE(review): "vsoxei" is the RVV mnemonic for the indexed-ordered store,
 * and the RVV spec treats index values as byte offsets -- confirm both
 * against the spec before relying on them.
 */
void __riscv_vsoxei8_v_u16mf4(uint16_t *rs1, vuint8mf8_t rs2, vuint16mf4_t vs3,
                              size_t vl);
void __riscv_vsoxei8_v_u16mf2(uint16_t *rs1, vuint8mf4_t rs2, vuint16mf2_t vs3,
                              size_t vl);
void __riscv_vsoxei8_v_u16m1(uint16_t *rs1, vuint8mf2_t rs2, vuint16m1_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_u16m2(uint16_t *rs1, vuint8m1_t rs2, vuint16m2_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_u16m4(uint16_t *rs1, vuint8m2_t rs2, vuint16m4_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_u16m8(uint16_t *rs1, vuint8m4_t rs2, vuint16m8_t vs3,
                             size_t vl);
void __riscv_vsoxei16_v_u16mf4(uint16_t *rs1, vuint16mf4_t rs2,
                               vuint16mf4_t vs3, size_t vl);
void __riscv_vsoxei16_v_u16mf2(uint16_t *rs1, vuint16mf2_t rs2,
                               vuint16mf2_t vs3, size_t vl);
void __riscv_vsoxei16_v_u16m1(uint16_t *rs1, vuint16m1_t rs2, vuint16m1_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_u16m2(uint16_t *rs1, vuint16m2_t rs2, vuint16m2_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_u16m4(uint16_t *rs1, vuint16m4_t rs2, vuint16m4_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_u16m8(uint16_t *rs1, vuint16m8_t rs2, vuint16m8_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_u16mf4(uint16_t *rs1, vuint32mf2_t rs2,
                               vuint16mf4_t vs3, size_t vl);
void __riscv_vsoxei32_v_u16mf2(uint16_t *rs1, vuint32m1_t rs2, vuint16mf2_t vs3,
                               size_t vl);
void __riscv_vsoxei32_v_u16m1(uint16_t *rs1, vuint32m2_t rs2, vuint16m1_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_u16m2(uint16_t *rs1, vuint32m4_t rs2, vuint16m2_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_u16m4(uint16_t *rs1, vuint32m8_t rs2, vuint16m4_t vs3,
                              size_t vl);
void __riscv_vsoxei64_v_u16mf4(uint16_t *rs1, vuint64m1_t rs2, vuint16mf4_t vs3,
                               size_t vl);
void __riscv_vsoxei64_v_u16mf2(uint16_t *rs1, vuint64m2_t rs2, vuint16mf2_t vs3,
                               size_t vl);
void __riscv_vsoxei64_v_u16m1(uint16_t *rs1, vuint64m4_t rs2, vuint16m1_t vs3,
                              size_t vl);
void __riscv_vsoxei64_v_u16m2(uint16_t *rs1, vuint64m8_t rs2, vuint16m2_t vs3,
                              size_t vl);
// Unmasked __riscv_vsoxei{8,16,32,64}_v_u32* prototypes. Each returns void and
// takes a uint32_t base pointer (rs1), an unsigned index vector (rs2), the
// vuint32 data vector (vs3) and a size_t vl.
// The digits after "vsoxei" are the element width of rs2; its LMUL suffix is
// the data LMUL scaled by (index width / 32). The ei64 form stops at u32m4,
// whose index type is already vuint64m8_t.
// NOTE(review): "vsoxei" presumably names the indexed-ordered store of the RVV
// ISA; the section heading is outside this excerpt -- confirm there.
void __riscv_vsoxei8_v_u32mf2(uint32_t *rs1, vuint8mf8_t rs2, vuint32mf2_t vs3,
                              size_t vl);
void __riscv_vsoxei8_v_u32m1(uint32_t *rs1, vuint8mf4_t rs2, vuint32m1_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_u32m2(uint32_t *rs1, vuint8mf2_t rs2, vuint32m2_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_u32m4(uint32_t *rs1, vuint8m1_t rs2, vuint32m4_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_u32m8(uint32_t *rs1, vuint8m2_t rs2, vuint32m8_t vs3,
                             size_t vl);
void __riscv_vsoxei16_v_u32mf2(uint32_t *rs1, vuint16mf4_t rs2,
                               vuint32mf2_t vs3, size_t vl);
void __riscv_vsoxei16_v_u32m1(uint32_t *rs1, vuint16mf2_t rs2, vuint32m1_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_u32m2(uint32_t *rs1, vuint16m1_t rs2, vuint32m2_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_u32m4(uint32_t *rs1, vuint16m2_t rs2, vuint32m4_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_u32m8(uint32_t *rs1, vuint16m4_t rs2, vuint32m8_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_u32mf2(uint32_t *rs1, vuint32mf2_t rs2,
                               vuint32mf2_t vs3, size_t vl);
void __riscv_vsoxei32_v_u32m1(uint32_t *rs1, vuint32m1_t rs2, vuint32m1_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_u32m2(uint32_t *rs1, vuint32m2_t rs2, vuint32m2_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_u32m4(uint32_t *rs1, vuint32m4_t rs2, vuint32m4_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_u32m8(uint32_t *rs1, vuint32m8_t rs2, vuint32m8_t vs3,
                              size_t vl);
void __riscv_vsoxei64_v_u32mf2(uint32_t *rs1, vuint64m1_t rs2, vuint32mf2_t vs3,
                               size_t vl);
void __riscv_vsoxei64_v_u32m1(uint32_t *rs1, vuint64m2_t rs2, vuint32m1_t vs3,
                              size_t vl);
void __riscv_vsoxei64_v_u32m2(uint32_t *rs1, vuint64m4_t rs2, vuint32m2_t vs3,
                              size_t vl);
void __riscv_vsoxei64_v_u32m4(uint32_t *rs1, vuint64m8_t rs2, vuint32m4_t vs3,
                              size_t vl);
// Unmasked __riscv_vsoxei{8,16,32,64}_v_u64* prototypes. Each returns void and
// takes a uint64_t base pointer (rs1), an unsigned index vector (rs2), the
// vuint64 data vector (vs3) and a size_t vl.
// The digits after "vsoxei" are the element width of rs2; its LMUL suffix is
// the data LMUL scaled by (index width / 64), so every index width is listed
// for all of u64m1, u64m2, u64m4 and u64m8.
// NOTE(review): "vsoxei" presumably names the indexed-ordered store of the RVV
// ISA; the section heading is outside this excerpt -- confirm there.
void __riscv_vsoxei8_v_u64m1(uint64_t *rs1, vuint8mf8_t rs2, vuint64m1_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_u64m2(uint64_t *rs1, vuint8mf4_t rs2, vuint64m2_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_u64m4(uint64_t *rs1, vuint8mf2_t rs2, vuint64m4_t vs3,
                             size_t vl);
void __riscv_vsoxei8_v_u64m8(uint64_t *rs1, vuint8m1_t rs2, vuint64m8_t vs3,
                             size_t vl);
void __riscv_vsoxei16_v_u64m1(uint64_t *rs1, vuint16mf4_t rs2, vuint64m1_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_u64m2(uint64_t *rs1, vuint16mf2_t rs2, vuint64m2_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_u64m4(uint64_t *rs1, vuint16m1_t rs2, vuint64m4_t vs3,
                              size_t vl);
void __riscv_vsoxei16_v_u64m8(uint64_t *rs1, vuint16m2_t rs2, vuint64m8_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_u64m1(uint64_t *rs1, vuint32mf2_t rs2, vuint64m1_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_u64m2(uint64_t *rs1, vuint32m1_t rs2, vuint64m2_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_u64m4(uint64_t *rs1, vuint32m2_t rs2, vuint64m4_t vs3,
                              size_t vl);
void __riscv_vsoxei32_v_u64m8(uint64_t *rs1, vuint32m4_t rs2, vuint64m8_t vs3,
                              size_t vl);
void __riscv_vsoxei64_v_u64m1(uint64_t *rs1, vuint64m1_t rs2, vuint64m1_t vs3,
                              size_t vl);
void __riscv_vsoxei64_v_u64m2(uint64_t *rs1, vuint64m2_t rs2, vuint64m2_t vs3,
                              size_t vl);
void __riscv_vsoxei64_v_u64m4(uint64_t *rs1, vuint64m4_t rs2, vuint64m4_t vs3,
                              size_t vl);
void __riscv_vsoxei64_v_u64m8(uint64_t *rs1, vuint64m8_t rs2, vuint64m8_t vs3,
                              size_t vl);
// Unmasked __riscv_vsuxei{8,16,32,64}_v_u8* prototypes. Each returns void and
// takes a uint8_t base pointer (rs1), an unsigned index vector (rs2), the
// vuint8 data vector (vs3) and a size_t vl.
// The digits after "vsuxei" are the element width of rs2; its LMUL suffix is
// the data LMUL scaled by (index width / 8). Variants that would need an index
// type above m8 do not appear (ei16 stops at u8m4, ei32 at u8m2, ei64 at
// u8m1).
// NOTE(review): "vsuxei" presumably names the indexed-unordered store of the
// RVV ISA; the section heading is outside this excerpt -- confirm there.
void __riscv_vsuxei8_v_u8mf8(uint8_t *rs1, vuint8mf8_t rs2, vuint8mf8_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_u8mf4(uint8_t *rs1, vuint8mf4_t rs2, vuint8mf4_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_u8mf2(uint8_t *rs1, vuint8mf2_t rs2, vuint8mf2_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_u8m1(uint8_t *rs1, vuint8m1_t rs2, vuint8m1_t vs3,
                            size_t vl);
void __riscv_vsuxei8_v_u8m2(uint8_t *rs1, vuint8m2_t rs2, vuint8m2_t vs3,
                            size_t vl);
void __riscv_vsuxei8_v_u8m4(uint8_t *rs1, vuint8m4_t rs2, vuint8m4_t vs3,
                            size_t vl);
void __riscv_vsuxei8_v_u8m8(uint8_t *rs1, vuint8m8_t rs2, vuint8m8_t vs3,
                            size_t vl);
void __riscv_vsuxei16_v_u8mf8(uint8_t *rs1, vuint16mf4_t rs2, vuint8mf8_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_u8mf4(uint8_t *rs1, vuint16mf2_t rs2, vuint8mf4_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_u8mf2(uint8_t *rs1, vuint16m1_t rs2, vuint8mf2_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_u8m1(uint8_t *rs1, vuint16m2_t rs2, vuint8m1_t vs3,
                             size_t vl);
void __riscv_vsuxei16_v_u8m2(uint8_t *rs1, vuint16m4_t rs2, vuint8m2_t vs3,
                             size_t vl);
void __riscv_vsuxei16_v_u8m4(uint8_t *rs1, vuint16m8_t rs2, vuint8m4_t vs3,
                             size_t vl);
void __riscv_vsuxei32_v_u8mf8(uint8_t *rs1, vuint32mf2_t rs2, vuint8mf8_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_u8mf4(uint8_t *rs1, vuint32m1_t rs2, vuint8mf4_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_u8mf2(uint8_t *rs1, vuint32m2_t rs2, vuint8mf2_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_u8m1(uint8_t *rs1, vuint32m4_t rs2, vuint8m1_t vs3,
                             size_t vl);
void __riscv_vsuxei32_v_u8m2(uint8_t *rs1, vuint32m8_t rs2, vuint8m2_t vs3,
                             size_t vl);
void __riscv_vsuxei64_v_u8mf8(uint8_t *rs1, vuint64m1_t rs2, vuint8mf8_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_u8mf4(uint8_t *rs1, vuint64m2_t rs2, vuint8mf4_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_u8mf2(uint8_t *rs1, vuint64m4_t rs2, vuint8mf2_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_u8m1(uint8_t *rs1, vuint64m8_t rs2, vuint8m1_t vs3,
                             size_t vl);
// Unmasked __riscv_vsuxei{8,16,32,64}_v_u16* prototypes. Each returns void and
// takes a uint16_t base pointer (rs1), an unsigned index vector (rs2), the
// vuint16 data vector (vs3) and a size_t vl.
// The digits after "vsuxei" are the element width of rs2; its LMUL suffix is
// the data LMUL scaled by (index width / 16). Variants that would need an
// index type above m8 do not appear (no u16m8 for ei32, no u16m4/u16m8 for
// ei64).
// NOTE(review): "vsuxei" presumably names the indexed-unordered store of the
// RVV ISA; the section heading is outside this excerpt -- confirm there.
void __riscv_vsuxei8_v_u16mf4(uint16_t *rs1, vuint8mf8_t rs2, vuint16mf4_t vs3,
                              size_t vl);
void __riscv_vsuxei8_v_u16mf2(uint16_t *rs1, vuint8mf4_t rs2, vuint16mf2_t vs3,
                              size_t vl);
void __riscv_vsuxei8_v_u16m1(uint16_t *rs1, vuint8mf2_t rs2, vuint16m1_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_u16m2(uint16_t *rs1, vuint8m1_t rs2, vuint16m2_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_u16m4(uint16_t *rs1, vuint8m2_t rs2, vuint16m4_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_u16m8(uint16_t *rs1, vuint8m4_t rs2, vuint16m8_t vs3,
                             size_t vl);
void __riscv_vsuxei16_v_u16mf4(uint16_t *rs1, vuint16mf4_t rs2,
                               vuint16mf4_t vs3, size_t vl);
void __riscv_vsuxei16_v_u16mf2(uint16_t *rs1, vuint16mf2_t rs2,
                               vuint16mf2_t vs3, size_t vl);
void __riscv_vsuxei16_v_u16m1(uint16_t *rs1, vuint16m1_t rs2, vuint16m1_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_u16m2(uint16_t *rs1, vuint16m2_t rs2, vuint16m2_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_u16m4(uint16_t *rs1, vuint16m4_t rs2, vuint16m4_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_u16m8(uint16_t *rs1, vuint16m8_t rs2, vuint16m8_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_u16mf4(uint16_t *rs1, vuint32mf2_t rs2,
                               vuint16mf4_t vs3, size_t vl);
void __riscv_vsuxei32_v_u16mf2(uint16_t *rs1, vuint32m1_t rs2, vuint16mf2_t vs3,
                               size_t vl);
void __riscv_vsuxei32_v_u16m1(uint16_t *rs1, vuint32m2_t rs2, vuint16m1_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_u16m2(uint16_t *rs1, vuint32m4_t rs2, vuint16m2_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_u16m4(uint16_t *rs1, vuint32m8_t rs2, vuint16m4_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_u16mf4(uint16_t *rs1, vuint64m1_t rs2, vuint16mf4_t vs3,
                               size_t vl);
void __riscv_vsuxei64_v_u16mf2(uint16_t *rs1, vuint64m2_t rs2, vuint16mf2_t vs3,
                               size_t vl);
void __riscv_vsuxei64_v_u16m1(uint16_t *rs1, vuint64m4_t rs2, vuint16m1_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_u16m2(uint16_t *rs1, vuint64m8_t rs2, vuint16m2_t vs3,
                              size_t vl);
// Unmasked __riscv_vsuxei{8,16,32,64}_v_u32* prototypes. Each returns void and
// takes a uint32_t base pointer (rs1), an unsigned index vector (rs2), the
// vuint32 data vector (vs3) and a size_t vl.
// The digits after "vsuxei" are the element width of rs2; its LMUL suffix is
// the data LMUL scaled by (index width / 32). The ei64 form stops at u32m4,
// whose index type is already vuint64m8_t.
// NOTE(review): "vsuxei" presumably names the indexed-unordered store of the
// RVV ISA; the section heading is outside this excerpt -- confirm there.
void __riscv_vsuxei8_v_u32mf2(uint32_t *rs1, vuint8mf8_t rs2, vuint32mf2_t vs3,
                              size_t vl);
void __riscv_vsuxei8_v_u32m1(uint32_t *rs1, vuint8mf4_t rs2, vuint32m1_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_u32m2(uint32_t *rs1, vuint8mf2_t rs2, vuint32m2_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_u32m4(uint32_t *rs1, vuint8m1_t rs2, vuint32m4_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_u32m8(uint32_t *rs1, vuint8m2_t rs2, vuint32m8_t vs3,
                             size_t vl);
void __riscv_vsuxei16_v_u32mf2(uint32_t *rs1, vuint16mf4_t rs2,
                               vuint32mf2_t vs3, size_t vl);
void __riscv_vsuxei16_v_u32m1(uint32_t *rs1, vuint16mf2_t rs2, vuint32m1_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_u32m2(uint32_t *rs1, vuint16m1_t rs2, vuint32m2_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_u32m4(uint32_t *rs1, vuint16m2_t rs2, vuint32m4_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_u32m8(uint32_t *rs1, vuint16m4_t rs2, vuint32m8_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_u32mf2(uint32_t *rs1, vuint32mf2_t rs2,
                               vuint32mf2_t vs3, size_t vl);
void __riscv_vsuxei32_v_u32m1(uint32_t *rs1, vuint32m1_t rs2, vuint32m1_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_u32m2(uint32_t *rs1, vuint32m2_t rs2, vuint32m2_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_u32m4(uint32_t *rs1, vuint32m4_t rs2, vuint32m4_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_u32m8(uint32_t *rs1, vuint32m8_t rs2, vuint32m8_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_u32mf2(uint32_t *rs1, vuint64m1_t rs2, vuint32mf2_t vs3,
                               size_t vl);
void __riscv_vsuxei64_v_u32m1(uint32_t *rs1, vuint64m2_t rs2, vuint32m1_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_u32m2(uint32_t *rs1, vuint64m4_t rs2, vuint32m2_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_u32m4(uint32_t *rs1, vuint64m8_t rs2, vuint32m4_t vs3,
                              size_t vl);
// Unmasked __riscv_vsuxei{8,16,32,64}_v_u64* prototypes. Each returns void and
// takes a uint64_t base pointer (rs1), an unsigned index vector (rs2), the
// vuint64 data vector (vs3) and a size_t vl.
// The digits after "vsuxei" are the element width of rs2; its LMUL suffix is
// the data LMUL scaled by (index width / 64), so every index width is listed
// for all of u64m1, u64m2, u64m4 and u64m8.
// NOTE(review): "vsuxei" presumably names the indexed-unordered store of the
// RVV ISA; the section heading is outside this excerpt -- confirm there.
void __riscv_vsuxei8_v_u64m1(uint64_t *rs1, vuint8mf8_t rs2, vuint64m1_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_u64m2(uint64_t *rs1, vuint8mf4_t rs2, vuint64m2_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_u64m4(uint64_t *rs1, vuint8mf2_t rs2, vuint64m4_t vs3,
                             size_t vl);
void __riscv_vsuxei8_v_u64m8(uint64_t *rs1, vuint8m1_t rs2, vuint64m8_t vs3,
                             size_t vl);
void __riscv_vsuxei16_v_u64m1(uint64_t *rs1, vuint16mf4_t rs2, vuint64m1_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_u64m2(uint64_t *rs1, vuint16mf2_t rs2, vuint64m2_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_u64m4(uint64_t *rs1, vuint16m1_t rs2, vuint64m4_t vs3,
                              size_t vl);
void __riscv_vsuxei16_v_u64m8(uint64_t *rs1, vuint16m2_t rs2, vuint64m8_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_u64m1(uint64_t *rs1, vuint32mf2_t rs2, vuint64m1_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_u64m2(uint64_t *rs1, vuint32m1_t rs2, vuint64m2_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_u64m4(uint64_t *rs1, vuint32m2_t rs2, vuint64m4_t vs3,
                              size_t vl);
void __riscv_vsuxei32_v_u64m8(uint64_t *rs1, vuint32m4_t rs2, vuint64m8_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_u64m1(uint64_t *rs1, vuint64m1_t rs2, vuint64m1_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_u64m2(uint64_t *rs1, vuint64m2_t rs2, vuint64m2_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_u64m4(uint64_t *rs1, vuint64m4_t rs2, vuint64m4_t vs3,
                              size_t vl);
void __riscv_vsuxei64_v_u64m8(uint64_t *rs1, vuint64m8_t rs2, vuint64m8_t vs3,
                              size_t vl);
// masked functions
// Masked (_m) __riscv_vsoxei{8,16,32,64}_v_f16* prototypes. Each returns void
// and takes a mask (vm) first, then a _Float16 base pointer (rs1), an unsigned
// index vector (rs2), the vfloat16 data vector (vs3) and a size_t vl.
// The mask type follows the data type: f16mf4 -> vbool64_t, f16mf2 ->
// vbool32_t, f16m1 -> vbool16_t, f16m2 -> vbool8_t, f16m4 -> vbool4_t,
// f16m8 -> vbool2_t.
// The digits after "vsoxei" are the element width of rs2; its LMUL suffix is
// the data LMUL scaled by (index width / 16). Variants that would need an
// index type above m8 do not appear (no f16m8 for ei32, no f16m4/f16m8 for
// ei64).
// NOTE(review): "vsoxei" presumably names the indexed-ordered store of the RVV
// ISA, with vm selecting the active elements -- confirm against the spec.
void __riscv_vsoxei8_v_f16mf4_m(vbool64_t vm, _Float16 *rs1, vuint8mf8_t rs2,
                                vfloat16mf4_t vs3, size_t vl);
void __riscv_vsoxei8_v_f16mf2_m(vbool32_t vm, _Float16 *rs1, vuint8mf4_t rs2,
                                vfloat16mf2_t vs3, size_t vl);
void __riscv_vsoxei8_v_f16m1_m(vbool16_t vm, _Float16 *rs1, vuint8mf2_t rs2,
                               vfloat16m1_t vs3, size_t vl);
void __riscv_vsoxei8_v_f16m2_m(vbool8_t vm, _Float16 *rs1, vuint8m1_t rs2,
                               vfloat16m2_t vs3, size_t vl);
void __riscv_vsoxei8_v_f16m4_m(vbool4_t vm, _Float16 *rs1, vuint8m2_t rs2,
                               vfloat16m4_t vs3, size_t vl);
void __riscv_vsoxei8_v_f16m8_m(vbool2_t vm, _Float16 *rs1, vuint8m4_t rs2,
                               vfloat16m8_t vs3, size_t vl);
void __riscv_vsoxei16_v_f16mf4_m(vbool64_t vm, _Float16 *rs1, vuint16mf4_t rs2,
                                 vfloat16mf4_t vs3, size_t vl);
void __riscv_vsoxei16_v_f16mf2_m(vbool32_t vm, _Float16 *rs1, vuint16mf2_t rs2,
                                 vfloat16mf2_t vs3, size_t vl);
void __riscv_vsoxei16_v_f16m1_m(vbool16_t vm, _Float16 *rs1, vuint16m1_t rs2,
                                vfloat16m1_t vs3, size_t vl);
void __riscv_vsoxei16_v_f16m2_m(vbool8_t vm, _Float16 *rs1, vuint16m2_t rs2,
                                vfloat16m2_t vs3, size_t vl);
void __riscv_vsoxei16_v_f16m4_m(vbool4_t vm, _Float16 *rs1, vuint16m4_t rs2,
                                vfloat16m4_t vs3, size_t vl);
void __riscv_vsoxei16_v_f16m8_m(vbool2_t vm, _Float16 *rs1, vuint16m8_t rs2,
                                vfloat16m8_t vs3, size_t vl);
void __riscv_vsoxei32_v_f16mf4_m(vbool64_t vm, _Float16 *rs1, vuint32mf2_t rs2,
                                 vfloat16mf4_t vs3, size_t vl);
void __riscv_vsoxei32_v_f16mf2_m(vbool32_t vm, _Float16 *rs1, vuint32m1_t rs2,
                                 vfloat16mf2_t vs3, size_t vl);
void __riscv_vsoxei32_v_f16m1_m(vbool16_t vm, _Float16 *rs1, vuint32m2_t rs2,
                                vfloat16m1_t vs3, size_t vl);
void __riscv_vsoxei32_v_f16m2_m(vbool8_t vm, _Float16 *rs1, vuint32m4_t rs2,
                                vfloat16m2_t vs3, size_t vl);
void __riscv_vsoxei32_v_f16m4_m(vbool4_t vm, _Float16 *rs1, vuint32m8_t rs2,
                                vfloat16m4_t vs3, size_t vl);
void __riscv_vsoxei64_v_f16mf4_m(vbool64_t vm, _Float16 *rs1, vuint64m1_t rs2,
                                 vfloat16mf4_t vs3, size_t vl);
void __riscv_vsoxei64_v_f16mf2_m(vbool32_t vm, _Float16 *rs1, vuint64m2_t rs2,
                                 vfloat16mf2_t vs3, size_t vl);
void __riscv_vsoxei64_v_f16m1_m(vbool16_t vm, _Float16 *rs1, vuint64m4_t rs2,
                                vfloat16m1_t vs3, size_t vl);
void __riscv_vsoxei64_v_f16m2_m(vbool8_t vm, _Float16 *rs1, vuint64m8_t rs2,
                                vfloat16m2_t vs3, size_t vl);
// Masked (_m) __riscv_vsoxei{8,16,32,64}_v_f32* prototypes. Each returns void
// and takes a mask (vm) first, then a float base pointer (rs1), an unsigned
// index vector (rs2), the vfloat32 data vector (vs3) and a size_t vl.
// The mask type follows the data type: f32mf2 -> vbool64_t, f32m1 ->
// vbool32_t, f32m2 -> vbool16_t, f32m4 -> vbool8_t, f32m8 -> vbool4_t.
// The digits after "vsoxei" are the element width of rs2; its LMUL suffix is
// the data LMUL scaled by (index width / 32). The ei64 form stops at f32m4,
// whose index type is already vuint64m8_t.
// NOTE(review): "vsoxei" presumably names the indexed-ordered store of the RVV
// ISA, with vm selecting the active elements -- confirm against the spec.
void __riscv_vsoxei8_v_f32mf2_m(vbool64_t vm, float *rs1, vuint8mf8_t rs2,
                                vfloat32mf2_t vs3, size_t vl);
void __riscv_vsoxei8_v_f32m1_m(vbool32_t vm, float *rs1, vuint8mf4_t rs2,
                               vfloat32m1_t vs3, size_t vl);
void __riscv_vsoxei8_v_f32m2_m(vbool16_t vm, float *rs1, vuint8mf2_t rs2,
                               vfloat32m2_t vs3, size_t vl);
void __riscv_vsoxei8_v_f32m4_m(vbool8_t vm, float *rs1, vuint8m1_t rs2,
                               vfloat32m4_t vs3, size_t vl);
void __riscv_vsoxei8_v_f32m8_m(vbool4_t vm, float *rs1, vuint8m2_t rs2,
                               vfloat32m8_t vs3, size_t vl);
void __riscv_vsoxei16_v_f32mf2_m(vbool64_t vm, float *rs1, vuint16mf4_t rs2,
                                 vfloat32mf2_t vs3, size_t vl);
void __riscv_vsoxei16_v_f32m1_m(vbool32_t vm, float *rs1, vuint16mf2_t rs2,
                                vfloat32m1_t vs3, size_t vl);
void __riscv_vsoxei16_v_f32m2_m(vbool16_t vm, float *rs1, vuint16m1_t rs2,
                                vfloat32m2_t vs3, size_t vl);
void __riscv_vsoxei16_v_f32m4_m(vbool8_t vm, float *rs1, vuint16m2_t rs2,
                                vfloat32m4_t vs3, size_t vl);
void __riscv_vsoxei16_v_f32m8_m(vbool4_t vm, float *rs1, vuint16m4_t rs2,
                                vfloat32m8_t vs3, size_t vl);
void __riscv_vsoxei32_v_f32mf2_m(vbool64_t vm, float *rs1, vuint32mf2_t rs2,
                                 vfloat32mf2_t vs3, size_t vl);
void __riscv_vsoxei32_v_f32m1_m(vbool32_t vm, float *rs1, vuint32m1_t rs2,
                                vfloat32m1_t vs3, size_t vl);
void __riscv_vsoxei32_v_f32m2_m(vbool16_t vm, float *rs1, vuint32m2_t rs2,
                                vfloat32m2_t vs3, size_t vl);
void __riscv_vsoxei32_v_f32m4_m(vbool8_t vm, float *rs1, vuint32m4_t rs2,
                                vfloat32m4_t vs3, size_t vl);
void __riscv_vsoxei32_v_f32m8_m(vbool4_t vm, float *rs1, vuint32m8_t rs2,
                                vfloat32m8_t vs3, size_t vl);
void __riscv_vsoxei64_v_f32mf2_m(vbool64_t vm, float *rs1, vuint64m1_t rs2,
                                 vfloat32mf2_t vs3, size_t vl);
void __riscv_vsoxei64_v_f32m1_m(vbool32_t vm, float *rs1, vuint64m2_t rs2,
                                vfloat32m1_t vs3, size_t vl);
void __riscv_vsoxei64_v_f32m2_m(vbool16_t vm, float *rs1, vuint64m4_t rs2,
                                vfloat32m2_t vs3, size_t vl);
void __riscv_vsoxei64_v_f32m4_m(vbool8_t vm, float *rs1, vuint64m8_t rs2,
                                vfloat32m4_t vs3, size_t vl);
// Masked (_m) __riscv_vsoxei{8,16,32,64}_v_f64* prototypes. Each returns void
// and takes a mask (vm) first, then a double base pointer (rs1), an unsigned
// index vector (rs2), the vfloat64 data vector (vs3) and a size_t vl.
// The mask type follows the data type: f64m1 -> vbool64_t, f64m2 ->
// vbool32_t, f64m4 -> vbool16_t, f64m8 -> vbool8_t.
// The digits after "vsoxei" are the element width of rs2; its LMUL suffix is
// the data LMUL scaled by (index width / 64), so every index width is listed
// for all of f64m1, f64m2, f64m4 and f64m8.
// NOTE(review): "vsoxei" presumably names the indexed-ordered store of the RVV
// ISA, with vm selecting the active elements -- confirm against the spec.
void __riscv_vsoxei8_v_f64m1_m(vbool64_t vm, double *rs1, vuint8mf8_t rs2,
                               vfloat64m1_t vs3, size_t vl);
void __riscv_vsoxei8_v_f64m2_m(vbool32_t vm, double *rs1, vuint8mf4_t rs2,
                               vfloat64m2_t vs3, size_t vl);
void __riscv_vsoxei8_v_f64m4_m(vbool16_t vm, double *rs1, vuint8mf2_t rs2,
                               vfloat64m4_t vs3, size_t vl);
void __riscv_vsoxei8_v_f64m8_m(vbool8_t vm, double *rs1, vuint8m1_t rs2,
                               vfloat64m8_t vs3, size_t vl);
void __riscv_vsoxei16_v_f64m1_m(vbool64_t vm, double *rs1, vuint16mf4_t rs2,
                                vfloat64m1_t vs3, size_t vl);
void __riscv_vsoxei16_v_f64m2_m(vbool32_t vm, double *rs1, vuint16mf2_t rs2,
                                vfloat64m2_t vs3, size_t vl);
void __riscv_vsoxei16_v_f64m4_m(vbool16_t vm, double *rs1, vuint16m1_t rs2,
                                vfloat64m4_t vs3, size_t vl);
void __riscv_vsoxei16_v_f64m8_m(vbool8_t vm, double *rs1, vuint16m2_t rs2,
                                vfloat64m8_t vs3, size_t vl);
void __riscv_vsoxei32_v_f64m1_m(vbool64_t vm, double *rs1, vuint32mf2_t rs2,
                                vfloat64m1_t vs3, size_t vl);
void __riscv_vsoxei32_v_f64m2_m(vbool32_t vm, double *rs1, vuint32m1_t rs2,
                                vfloat64m2_t vs3, size_t vl);
void __riscv_vsoxei32_v_f64m4_m(vbool16_t vm, double *rs1, vuint32m2_t rs2,
                                vfloat64m4_t vs3, size_t vl);
void __riscv_vsoxei32_v_f64m8_m(vbool8_t vm, double *rs1, vuint32m4_t rs2,
                                vfloat64m8_t vs3, size_t vl);
void __riscv_vsoxei64_v_f64m1_m(vbool64_t vm, double *rs1, vuint64m1_t rs2,
                                vfloat64m1_t vs3, size_t vl);
void __riscv_vsoxei64_v_f64m2_m(vbool32_t vm, double *rs1, vuint64m2_t rs2,
                                vfloat64m2_t vs3, size_t vl);
void __riscv_vsoxei64_v_f64m4_m(vbool16_t vm, double *rs1, vuint64m4_t rs2,
                                vfloat64m4_t vs3, size_t vl);
void __riscv_vsoxei64_v_f64m8_m(vbool8_t vm, double *rs1, vuint64m8_t rs2,
                                vfloat64m8_t vs3, size_t vl);
// Masked (_m) __riscv_vsuxei{8,16,32,64}_v_f16* prototypes. Each returns void
// and takes a mask (vm) first, then a _Float16 base pointer (rs1), an unsigned
// index vector (rs2), the vfloat16 data vector (vs3) and a size_t vl.
// The mask type follows the data type: f16mf4 -> vbool64_t, f16mf2 ->
// vbool32_t, f16m1 -> vbool16_t, f16m2 -> vbool8_t, f16m4 -> vbool4_t,
// f16m8 -> vbool2_t.
// The digits after "vsuxei" are the element width of rs2; its LMUL suffix is
// the data LMUL scaled by (index width / 16). Variants that would need an
// index type above m8 do not appear (no f16m8 for ei32, no f16m4/f16m8 for
// ei64).
// NOTE(review): "vsuxei" presumably names the indexed-unordered store of the
// RVV ISA, with vm selecting the active elements -- confirm against the spec.
void __riscv_vsuxei8_v_f16mf4_m(vbool64_t vm, _Float16 *rs1, vuint8mf8_t rs2,
                                vfloat16mf4_t vs3, size_t vl);
void __riscv_vsuxei8_v_f16mf2_m(vbool32_t vm, _Float16 *rs1, vuint8mf4_t rs2,
                                vfloat16mf2_t vs3, size_t vl);
void __riscv_vsuxei8_v_f16m1_m(vbool16_t vm, _Float16 *rs1, vuint8mf2_t rs2,
                               vfloat16m1_t vs3, size_t vl);
void __riscv_vsuxei8_v_f16m2_m(vbool8_t vm, _Float16 *rs1, vuint8m1_t rs2,
                               vfloat16m2_t vs3, size_t vl);
void __riscv_vsuxei8_v_f16m4_m(vbool4_t vm, _Float16 *rs1, vuint8m2_t rs2,
                               vfloat16m4_t vs3, size_t vl);
void __riscv_vsuxei8_v_f16m8_m(vbool2_t vm, _Float16 *rs1, vuint8m4_t rs2,
                               vfloat16m8_t vs3, size_t vl);
void __riscv_vsuxei16_v_f16mf4_m(vbool64_t vm, _Float16 *rs1, vuint16mf4_t rs2,
                                 vfloat16mf4_t vs3, size_t vl);
void __riscv_vsuxei16_v_f16mf2_m(vbool32_t vm, _Float16 *rs1, vuint16mf2_t rs2,
                                 vfloat16mf2_t vs3, size_t vl);
void __riscv_vsuxei16_v_f16m1_m(vbool16_t vm, _Float16 *rs1, vuint16m1_t rs2,
                                vfloat16m1_t vs3, size_t vl);
void __riscv_vsuxei16_v_f16m2_m(vbool8_t vm, _Float16 *rs1, vuint16m2_t rs2,
                                vfloat16m2_t vs3, size_t vl);
void __riscv_vsuxei16_v_f16m4_m(vbool4_t vm, _Float16 *rs1, vuint16m4_t rs2,
                                vfloat16m4_t vs3, size_t vl);
void __riscv_vsuxei16_v_f16m8_m(vbool2_t vm, _Float16 *rs1, vuint16m8_t rs2,
                                vfloat16m8_t vs3, size_t vl);
void __riscv_vsuxei32_v_f16mf4_m(vbool64_t vm, _Float16 *rs1, vuint32mf2_t rs2,
                                 vfloat16mf4_t vs3, size_t vl);
void __riscv_vsuxei32_v_f16mf2_m(vbool32_t vm, _Float16 *rs1, vuint32m1_t rs2,
                                 vfloat16mf2_t vs3, size_t vl);
void __riscv_vsuxei32_v_f16m1_m(vbool16_t vm, _Float16 *rs1, vuint32m2_t rs2,
                                vfloat16m1_t vs3, size_t vl);
void __riscv_vsuxei32_v_f16m2_m(vbool8_t vm, _Float16 *rs1, vuint32m4_t rs2,
                                vfloat16m2_t vs3, size_t vl);
void __riscv_vsuxei32_v_f16m4_m(vbool4_t vm, _Float16 *rs1, vuint32m8_t rs2,
                                vfloat16m4_t vs3, size_t vl);
void __riscv_vsuxei64_v_f16mf4_m(vbool64_t vm, _Float16 *rs1, vuint64m1_t rs2,
                                 vfloat16mf4_t vs3, size_t vl);
void __riscv_vsuxei64_v_f16mf2_m(vbool32_t vm, _Float16 *rs1, vuint64m2_t rs2,
                                 vfloat16mf2_t vs3, size_t vl);
void __riscv_vsuxei64_v_f16m1_m(vbool16_t vm, _Float16 *rs1, vuint64m4_t rs2,
                                vfloat16m1_t vs3, size_t vl);
void __riscv_vsuxei64_v_f16m2_m(vbool8_t vm, _Float16 *rs1, vuint64m8_t rs2,
                                vfloat16m2_t vs3, size_t vl);
// Masked (_m) __riscv_vsuxei{8,16,32,64}_v_f32* prototypes. Each returns void
// and takes a mask (vm) first, then a float base pointer (rs1), an unsigned
// index vector (rs2), the vfloat32 data vector (vs3) and a size_t vl.
// The mask type follows the data type: f32mf2 -> vbool64_t, f32m1 ->
// vbool32_t, f32m2 -> vbool16_t, f32m4 -> vbool8_t, f32m8 -> vbool4_t.
// The digits after "vsuxei" are the element width of rs2; its LMUL suffix is
// the data LMUL scaled by (index width / 32). The ei64 form stops at f32m4,
// whose index type is already vuint64m8_t.
// NOTE(review): "vsuxei" presumably names the indexed-unordered store of the
// RVV ISA, with vm selecting the active elements -- confirm against the spec.
void __riscv_vsuxei8_v_f32mf2_m(vbool64_t vm, float *rs1, vuint8mf8_t rs2,
                                vfloat32mf2_t vs3, size_t vl);
void __riscv_vsuxei8_v_f32m1_m(vbool32_t vm, float *rs1, vuint8mf4_t rs2,
                               vfloat32m1_t vs3, size_t vl);
void __riscv_vsuxei8_v_f32m2_m(vbool16_t vm, float *rs1, vuint8mf2_t rs2,
                               vfloat32m2_t vs3, size_t vl);
void __riscv_vsuxei8_v_f32m4_m(vbool8_t vm, float *rs1, vuint8m1_t rs2,
                               vfloat32m4_t vs3, size_t vl);
void __riscv_vsuxei8_v_f32m8_m(vbool4_t vm, float *rs1, vuint8m2_t rs2,
                               vfloat32m8_t vs3, size_t vl);
void __riscv_vsuxei16_v_f32mf2_m(vbool64_t vm, float *rs1, vuint16mf4_t rs2,
                                 vfloat32mf2_t vs3, size_t vl);
void __riscv_vsuxei16_v_f32m1_m(vbool32_t vm, float *rs1, vuint16mf2_t rs2,
                                vfloat32m1_t vs3, size_t vl);
void __riscv_vsuxei16_v_f32m2_m(vbool16_t vm, float *rs1, vuint16m1_t rs2,
                                vfloat32m2_t vs3, size_t vl);
void __riscv_vsuxei16_v_f32m4_m(vbool8_t vm, float *rs1, vuint16m2_t rs2,
                                vfloat32m4_t vs3, size_t vl);
void __riscv_vsuxei16_v_f32m8_m(vbool4_t vm, float *rs1, vuint16m4_t rs2,
                                vfloat32m8_t vs3, size_t vl);
void __riscv_vsuxei32_v_f32mf2_m(vbool64_t vm, float *rs1, vuint32mf2_t rs2,
                                 vfloat32mf2_t vs3, size_t vl);
void __riscv_vsuxei32_v_f32m1_m(vbool32_t vm, float *rs1, vuint32m1_t rs2,
                                vfloat32m1_t vs3, size_t vl);
void __riscv_vsuxei32_v_f32m2_m(vbool16_t vm, float *rs1, vuint32m2_t rs2,
                                vfloat32m2_t vs3, size_t vl);
void __riscv_vsuxei32_v_f32m4_m(vbool8_t vm, float *rs1, vuint32m4_t rs2,
                                vfloat32m4_t vs3, size_t vl);
void __riscv_vsuxei32_v_f32m8_m(vbool4_t vm, float *rs1, vuint32m8_t rs2,
                                vfloat32m8_t vs3, size_t vl);
void __riscv_vsuxei64_v_f32mf2_m(vbool64_t vm, float *rs1, vuint64m1_t rs2,
                                 vfloat32mf2_t vs3, size_t vl);
void __riscv_vsuxei64_v_f32m1_m(vbool32_t vm, float *rs1, vuint64m2_t rs2,
                                vfloat32m1_t vs3, size_t vl);
void __riscv_vsuxei64_v_f32m2_m(vbool16_t vm, float *rs1, vuint64m4_t rs2,
                                vfloat32m2_t vs3, size_t vl);
void __riscv_vsuxei64_v_f32m4_m(vbool8_t vm, float *rs1, vuint64m8_t rs2,
                                vfloat32m4_t vs3, size_t vl);
// Masked (_m) __riscv_vsuxei{8,16,32,64}_v_f64* prototypes. Each returns void
// and takes a mask (vm) first, then a double base pointer (rs1), an unsigned
// index vector (rs2), the vfloat64 data vector (vs3) and a size_t vl.
// The mask type follows the data type: f64m1 -> vbool64_t, f64m2 ->
// vbool32_t, f64m4 -> vbool16_t, f64m8 -> vbool8_t.
// The digits after "vsuxei" are the element width of rs2; its LMUL suffix is
// the data LMUL scaled by (index width / 64), so every index width is listed
// for all of f64m1, f64m2, f64m4 and f64m8.
// NOTE(review): "vsuxei" presumably names the indexed-unordered store of the
// RVV ISA, with vm selecting the active elements -- confirm against the spec.
void __riscv_vsuxei8_v_f64m1_m(vbool64_t vm, double *rs1, vuint8mf8_t rs2,
                               vfloat64m1_t vs3, size_t vl);
void __riscv_vsuxei8_v_f64m2_m(vbool32_t vm, double *rs1, vuint8mf4_t rs2,
                               vfloat64m2_t vs3, size_t vl);
void __riscv_vsuxei8_v_f64m4_m(vbool16_t vm, double *rs1, vuint8mf2_t rs2,
                               vfloat64m4_t vs3, size_t vl);
void __riscv_vsuxei8_v_f64m8_m(vbool8_t vm, double *rs1, vuint8m1_t rs2,
                               vfloat64m8_t vs3, size_t vl);
void __riscv_vsuxei16_v_f64m1_m(vbool64_t vm, double *rs1, vuint16mf4_t rs2,
                                vfloat64m1_t vs3, size_t vl);
void __riscv_vsuxei16_v_f64m2_m(vbool32_t vm, double *rs1, vuint16mf2_t rs2,
                                vfloat64m2_t vs3, size_t vl);
void __riscv_vsuxei16_v_f64m4_m(vbool16_t vm, double *rs1, vuint16m1_t rs2,
                                vfloat64m4_t vs3, size_t vl);
void __riscv_vsuxei16_v_f64m8_m(vbool8_t vm, double *rs1, vuint16m2_t rs2,
                                vfloat64m8_t vs3, size_t vl);
void __riscv_vsuxei32_v_f64m1_m(vbool64_t vm, double *rs1, vuint32mf2_t rs2,
                                vfloat64m1_t vs3, size_t vl);
void __riscv_vsuxei32_v_f64m2_m(vbool32_t vm, double *rs1, vuint32m1_t rs2,
                                vfloat64m2_t vs3, size_t vl);
void __riscv_vsuxei32_v_f64m4_m(vbool16_t vm, double *rs1, vuint32m2_t rs2,
                                vfloat64m4_t vs3, size_t vl);
void __riscv_vsuxei32_v_f64m8_m(vbool8_t vm, double *rs1, vuint32m4_t rs2,
                                vfloat64m8_t vs3, size_t vl);
void __riscv_vsuxei64_v_f64m1_m(vbool64_t vm, double *rs1, vuint64m1_t rs2,
                                vfloat64m1_t vs3, size_t vl);
void __riscv_vsuxei64_v_f64m2_m(vbool32_t vm, double *rs1, vuint64m2_t rs2,
                                vfloat64m2_t vs3, size_t vl);
void __riscv_vsuxei64_v_f64m4_m(vbool16_t vm, double *rs1, vuint64m4_t rs2,
                                vfloat64m4_t vs3, size_t vl);
void __riscv_vsuxei64_v_f64m8_m(vbool8_t vm, double *rs1, vuint64m8_t rs2,
                                vfloat64m8_t vs3, size_t vl);
// Masked (_m) __riscv_vsoxei{8,16,32,64}_v_i8* prototypes. Each returns void
// and takes a mask (vm) first, then an int8_t base pointer (rs1), an unsigned
// index vector (rs2), the vint8 data vector (vs3) and a size_t vl.
// The mask type follows the data type: i8mf8 -> vbool64_t, i8mf4 ->
// vbool32_t, i8mf2 -> vbool16_t, i8m1 -> vbool8_t, i8m2 -> vbool4_t,
// i8m4 -> vbool2_t, i8m8 -> vbool1_t.
// The digits after "vsoxei" are the element width of rs2; its LMUL suffix is
// the data LMUL scaled by (index width / 8). Variants that would need an index
// type above m8 do not appear (ei16 stops at i8m4, ei32 at i8m2, ei64 at
// i8m1). The index vector stays unsigned even though the data is signed.
// NOTE(review): "vsoxei" presumably names the indexed-ordered store of the RVV
// ISA, with vm selecting the active elements -- confirm against the spec.
void __riscv_vsoxei8_v_i8mf8_m(vbool64_t vm, int8_t *rs1, vuint8mf8_t rs2,
                               vint8mf8_t vs3, size_t vl);
void __riscv_vsoxei8_v_i8mf4_m(vbool32_t vm, int8_t *rs1, vuint8mf4_t rs2,
                               vint8mf4_t vs3, size_t vl);
void __riscv_vsoxei8_v_i8mf2_m(vbool16_t vm, int8_t *rs1, vuint8mf2_t rs2,
                               vint8mf2_t vs3, size_t vl);
void __riscv_vsoxei8_v_i8m1_m(vbool8_t vm, int8_t *rs1, vuint8m1_t rs2,
                              vint8m1_t vs3, size_t vl);
void __riscv_vsoxei8_v_i8m2_m(vbool4_t vm, int8_t *rs1, vuint8m2_t rs2,
                              vint8m2_t vs3, size_t vl);
void __riscv_vsoxei8_v_i8m4_m(vbool2_t vm, int8_t *rs1, vuint8m4_t rs2,
                              vint8m4_t vs3, size_t vl);
void __riscv_vsoxei8_v_i8m8_m(vbool1_t vm, int8_t *rs1, vuint8m8_t rs2,
                              vint8m8_t vs3, size_t vl);
void __riscv_vsoxei16_v_i8mf8_m(vbool64_t vm, int8_t *rs1, vuint16mf4_t rs2,
                                vint8mf8_t vs3, size_t vl);
void __riscv_vsoxei16_v_i8mf4_m(vbool32_t vm, int8_t *rs1, vuint16mf2_t rs2,
                                vint8mf4_t vs3, size_t vl);
void __riscv_vsoxei16_v_i8mf2_m(vbool16_t vm, int8_t *rs1, vuint16m1_t rs2,
                                vint8mf2_t vs3, size_t vl);
void __riscv_vsoxei16_v_i8m1_m(vbool8_t vm, int8_t *rs1, vuint16m2_t rs2,
                               vint8m1_t vs3, size_t vl);
void __riscv_vsoxei16_v_i8m2_m(vbool4_t vm, int8_t *rs1, vuint16m4_t rs2,
                               vint8m2_t vs3, size_t vl);
void __riscv_vsoxei16_v_i8m4_m(vbool2_t vm, int8_t *rs1, vuint16m8_t rs2,
                               vint8m4_t vs3, size_t vl);
void __riscv_vsoxei32_v_i8mf8_m(vbool64_t vm, int8_t *rs1, vuint32mf2_t rs2,
                                vint8mf8_t vs3, size_t vl);
void __riscv_vsoxei32_v_i8mf4_m(vbool32_t vm, int8_t *rs1, vuint32m1_t rs2,
                                vint8mf4_t vs3, size_t vl);
void __riscv_vsoxei32_v_i8mf2_m(vbool16_t vm, int8_t *rs1, vuint32m2_t rs2,
                                vint8mf2_t vs3, size_t vl);
void __riscv_vsoxei32_v_i8m1_m(vbool8_t vm, int8_t *rs1, vuint32m4_t rs2,
                               vint8m1_t vs3, size_t vl);
void __riscv_vsoxei32_v_i8m2_m(vbool4_t vm, int8_t *rs1, vuint32m8_t rs2,
                               vint8m2_t vs3, size_t vl);
void __riscv_vsoxei64_v_i8mf8_m(vbool64_t vm, int8_t *rs1, vuint64m1_t rs2,
                                vint8mf8_t vs3, size_t vl);
void __riscv_vsoxei64_v_i8mf4_m(vbool32_t vm, int8_t *rs1, vuint64m2_t rs2,
                                vint8mf4_t vs3, size_t vl);
void __riscv_vsoxei64_v_i8mf2_m(vbool16_t vm, int8_t *rs1, vuint64m4_t rs2,
                                vint8mf2_t vs3, size_t vl);
void __riscv_vsoxei64_v_i8m1_m(vbool8_t vm, int8_t *rs1, vuint64m8_t rs2,
                               vint8m1_t vs3, size_t vl);
/*
 * Masked (_m) vsoxei{8,16,32,64} stores of int16_t data, LMUL mf4 upward.
 * Every prototype takes (vm, rs1, rs2, vs3, vl): a vboolN_t, an int16_t
 * pointer, an unsigned vector whose element width matches the eiN suffix, a
 * signed data vector, and a size_t. The ei8 and ei16 lists run to i16m8; ei32
 * stops at i16m4 and ei64 at i16m2, i.e. where the rs2 type reaches m8.
 * NOTE(review): roles (vm = mask, rs1 = base address, rs2 = index vector,
 * vs3 = store data, vl = element count) and the "ordered indexed store"
 * meaning of vsoxei follow the RVV naming convention -- confirm in the spec.
 */
void __riscv_vsoxei8_v_i16mf4_m(vbool64_t vm, int16_t *rs1, vuint8mf8_t rs2,
                                vint16mf4_t vs3, size_t vl);
void __riscv_vsoxei8_v_i16mf2_m(vbool32_t vm, int16_t *rs1, vuint8mf4_t rs2,
                                vint16mf2_t vs3, size_t vl);
void __riscv_vsoxei8_v_i16m1_m(vbool16_t vm, int16_t *rs1, vuint8mf2_t rs2,
                               vint16m1_t vs3, size_t vl);
void __riscv_vsoxei8_v_i16m2_m(vbool8_t vm, int16_t *rs1, vuint8m1_t rs2,
                               vint16m2_t vs3, size_t vl);
void __riscv_vsoxei8_v_i16m4_m(vbool4_t vm, int16_t *rs1, vuint8m2_t rs2,
                               vint16m4_t vs3, size_t vl);
void __riscv_vsoxei8_v_i16m8_m(vbool2_t vm, int16_t *rs1, vuint8m4_t rs2,
                               vint16m8_t vs3, size_t vl);
void __riscv_vsoxei16_v_i16mf4_m(vbool64_t vm, int16_t *rs1, vuint16mf4_t rs2,
                                 vint16mf4_t vs3, size_t vl);
void __riscv_vsoxei16_v_i16mf2_m(vbool32_t vm, int16_t *rs1, vuint16mf2_t rs2,
                                 vint16mf2_t vs3, size_t vl);
void __riscv_vsoxei16_v_i16m1_m(vbool16_t vm, int16_t *rs1, vuint16m1_t rs2,
                                vint16m1_t vs3, size_t vl);
void __riscv_vsoxei16_v_i16m2_m(vbool8_t vm, int16_t *rs1, vuint16m2_t rs2,
                                vint16m2_t vs3, size_t vl);
void __riscv_vsoxei16_v_i16m4_m(vbool4_t vm, int16_t *rs1, vuint16m4_t rs2,
                                vint16m4_t vs3, size_t vl);
void __riscv_vsoxei16_v_i16m8_m(vbool2_t vm, int16_t *rs1, vuint16m8_t rs2,
                                vint16m8_t vs3, size_t vl);
void __riscv_vsoxei32_v_i16mf4_m(vbool64_t vm, int16_t *rs1, vuint32mf2_t rs2,
                                 vint16mf4_t vs3, size_t vl);
void __riscv_vsoxei32_v_i16mf2_m(vbool32_t vm, int16_t *rs1, vuint32m1_t rs2,
                                 vint16mf2_t vs3, size_t vl);
void __riscv_vsoxei32_v_i16m1_m(vbool16_t vm, int16_t *rs1, vuint32m2_t rs2,
                                vint16m1_t vs3, size_t vl);
void __riscv_vsoxei32_v_i16m2_m(vbool8_t vm, int16_t *rs1, vuint32m4_t rs2,
                                vint16m2_t vs3, size_t vl);
void __riscv_vsoxei32_v_i16m4_m(vbool4_t vm, int16_t *rs1, vuint32m8_t rs2,
                                vint16m4_t vs3, size_t vl);
void __riscv_vsoxei64_v_i16mf4_m(vbool64_t vm, int16_t *rs1, vuint64m1_t rs2,
                                 vint16mf4_t vs3, size_t vl);
void __riscv_vsoxei64_v_i16mf2_m(vbool32_t vm, int16_t *rs1, vuint64m2_t rs2,
                                 vint16mf2_t vs3, size_t vl);
void __riscv_vsoxei64_v_i16m1_m(vbool16_t vm, int16_t *rs1, vuint64m4_t rs2,
                                vint16m1_t vs3, size_t vl);
void __riscv_vsoxei64_v_i16m2_m(vbool8_t vm, int16_t *rs1, vuint64m8_t rs2,
                                vint16m2_t vs3, size_t vl);
/*
 * Masked (_m) vsoxei{8,16,32,64} stores of int32_t data, LMUL mf2 upward.
 * Every prototype takes (vm, rs1, rs2, vs3, vl): a vboolN_t, an int32_t
 * pointer, an unsigned vector whose element width matches the eiN suffix, a
 * signed data vector, and a size_t. The ei8, ei16 and ei32 lists run to i32m8;
 * ei64 stops at i32m4, where the rs2 type reaches vuint64m8_t.
 * NOTE(review): roles (vm = mask, rs1 = base address, rs2 = index vector,
 * vs3 = store data, vl = element count) and the "ordered indexed store"
 * meaning of vsoxei follow the RVV naming convention -- confirm in the spec.
 */
void __riscv_vsoxei8_v_i32mf2_m(vbool64_t vm, int32_t *rs1, vuint8mf8_t rs2,
                                vint32mf2_t vs3, size_t vl);
void __riscv_vsoxei8_v_i32m1_m(vbool32_t vm, int32_t *rs1, vuint8mf4_t rs2,
                               vint32m1_t vs3, size_t vl);
void __riscv_vsoxei8_v_i32m2_m(vbool16_t vm, int32_t *rs1, vuint8mf2_t rs2,
                               vint32m2_t vs3, size_t vl);
void __riscv_vsoxei8_v_i32m4_m(vbool8_t vm, int32_t *rs1, vuint8m1_t rs2,
                               vint32m4_t vs3, size_t vl);
void __riscv_vsoxei8_v_i32m8_m(vbool4_t vm, int32_t *rs1, vuint8m2_t rs2,
                               vint32m8_t vs3, size_t vl);
void __riscv_vsoxei16_v_i32mf2_m(vbool64_t vm, int32_t *rs1, vuint16mf4_t rs2,
                                 vint32mf2_t vs3, size_t vl);
void __riscv_vsoxei16_v_i32m1_m(vbool32_t vm, int32_t *rs1, vuint16mf2_t rs2,
                                vint32m1_t vs3, size_t vl);
void __riscv_vsoxei16_v_i32m2_m(vbool16_t vm, int32_t *rs1, vuint16m1_t rs2,
                                vint32m2_t vs3, size_t vl);
void __riscv_vsoxei16_v_i32m4_m(vbool8_t vm, int32_t *rs1, vuint16m2_t rs2,
                                vint32m4_t vs3, size_t vl);
void __riscv_vsoxei16_v_i32m8_m(vbool4_t vm, int32_t *rs1, vuint16m4_t rs2,
                                vint32m8_t vs3, size_t vl);
void __riscv_vsoxei32_v_i32mf2_m(vbool64_t vm, int32_t *rs1, vuint32mf2_t rs2,
                                 vint32mf2_t vs3, size_t vl);
void __riscv_vsoxei32_v_i32m1_m(vbool32_t vm, int32_t *rs1, vuint32m1_t rs2,
                                vint32m1_t vs3, size_t vl);
void __riscv_vsoxei32_v_i32m2_m(vbool16_t vm, int32_t *rs1, vuint32m2_t rs2,
                                vint32m2_t vs3, size_t vl);
void __riscv_vsoxei32_v_i32m4_m(vbool8_t vm, int32_t *rs1, vuint32m4_t rs2,
                                vint32m4_t vs3, size_t vl);
void __riscv_vsoxei32_v_i32m8_m(vbool4_t vm, int32_t *rs1, vuint32m8_t rs2,
                                vint32m8_t vs3, size_t vl);
void __riscv_vsoxei64_v_i32mf2_m(vbool64_t vm, int32_t *rs1, vuint64m1_t rs2,
                                 vint32mf2_t vs3, size_t vl);
void __riscv_vsoxei64_v_i32m1_m(vbool32_t vm, int32_t *rs1, vuint64m2_t rs2,
                                vint32m1_t vs3, size_t vl);
void __riscv_vsoxei64_v_i32m2_m(vbool16_t vm, int32_t *rs1, vuint64m4_t rs2,
                                vint32m2_t vs3, size_t vl);
void __riscv_vsoxei64_v_i32m4_m(vbool8_t vm, int32_t *rs1, vuint64m8_t rs2,
                                vint32m4_t vs3, size_t vl);
/*
 * Masked (_m) vsoxei{8,16,32,64} stores of int64_t data, LMUL m1 through m8.
 * Every prototype takes (vm, rs1, rs2, vs3, vl): a vboolN_t, an int64_t
 * pointer, an unsigned vector whose element width matches the eiN suffix, a
 * signed data vector, and a size_t. All four index widths are listed for every
 * data LMUL in this group.
 * NOTE(review): roles (vm = mask, rs1 = base address, rs2 = index vector,
 * vs3 = store data, vl = element count) and the "ordered indexed store"
 * meaning of vsoxei follow the RVV naming convention -- confirm in the spec.
 */
void __riscv_vsoxei8_v_i64m1_m(vbool64_t vm, int64_t *rs1, vuint8mf8_t rs2,
                               vint64m1_t vs3, size_t vl);
void __riscv_vsoxei8_v_i64m2_m(vbool32_t vm, int64_t *rs1, vuint8mf4_t rs2,
                               vint64m2_t vs3, size_t vl);
void __riscv_vsoxei8_v_i64m4_m(vbool16_t vm, int64_t *rs1, vuint8mf2_t rs2,
                               vint64m4_t vs3, size_t vl);
void __riscv_vsoxei8_v_i64m8_m(vbool8_t vm, int64_t *rs1, vuint8m1_t rs2,
                               vint64m8_t vs3, size_t vl);
void __riscv_vsoxei16_v_i64m1_m(vbool64_t vm, int64_t *rs1, vuint16mf4_t rs2,
                                vint64m1_t vs3, size_t vl);
void __riscv_vsoxei16_v_i64m2_m(vbool32_t vm, int64_t *rs1, vuint16mf2_t rs2,
                                vint64m2_t vs3, size_t vl);
void __riscv_vsoxei16_v_i64m4_m(vbool16_t vm, int64_t *rs1, vuint16m1_t rs2,
                                vint64m4_t vs3, size_t vl);
void __riscv_vsoxei16_v_i64m8_m(vbool8_t vm, int64_t *rs1, vuint16m2_t rs2,
                                vint64m8_t vs3, size_t vl);
void __riscv_vsoxei32_v_i64m1_m(vbool64_t vm, int64_t *rs1, vuint32mf2_t rs2,
                                vint64m1_t vs3, size_t vl);
void __riscv_vsoxei32_v_i64m2_m(vbool32_t vm, int64_t *rs1, vuint32m1_t rs2,
                                vint64m2_t vs3, size_t vl);
void __riscv_vsoxei32_v_i64m4_m(vbool16_t vm, int64_t *rs1, vuint32m2_t rs2,
                                vint64m4_t vs3, size_t vl);
void __riscv_vsoxei32_v_i64m8_m(vbool8_t vm, int64_t *rs1, vuint32m4_t rs2,
                                vint64m8_t vs3, size_t vl);
void __riscv_vsoxei64_v_i64m1_m(vbool64_t vm, int64_t *rs1, vuint64m1_t rs2,
                                vint64m1_t vs3, size_t vl);
void __riscv_vsoxei64_v_i64m2_m(vbool32_t vm, int64_t *rs1, vuint64m2_t rs2,
                                vint64m2_t vs3, size_t vl);
void __riscv_vsoxei64_v_i64m4_m(vbool16_t vm, int64_t *rs1, vuint64m4_t rs2,
                                vint64m4_t vs3, size_t vl);
void __riscv_vsoxei64_v_i64m8_m(vbool8_t vm, int64_t *rs1, vuint64m8_t rs2,
                                vint64m8_t vs3, size_t vl);
/*
 * Masked (_m) vsuxei{8,16,32,64} stores of int8_t data, LMUL mf8 upward.
 * Every prototype takes (vm, rs1, rs2, vs3, vl): a vboolN_t, an int8_t pointer,
 * an unsigned vector whose element width matches the eiN suffix, a signed data
 * vector, and a size_t. The ei8 list runs to i8m8; ei16 stops at i8m4, ei32 at
 * i8m2 and ei64 at i8m1, i.e. where the rs2 type reaches m8.
 * NOTE(review): roles (vm = mask, rs1 = base address, rs2 = index vector,
 * vs3 = store data, vl = element count) and the "unordered indexed store"
 * meaning of vsuxei follow the RVV naming convention -- confirm in the spec.
 */
void __riscv_vsuxei8_v_i8mf8_m(vbool64_t vm, int8_t *rs1, vuint8mf8_t rs2,
                               vint8mf8_t vs3, size_t vl);
void __riscv_vsuxei8_v_i8mf4_m(vbool32_t vm, int8_t *rs1, vuint8mf4_t rs2,
                               vint8mf4_t vs3, size_t vl);
void __riscv_vsuxei8_v_i8mf2_m(vbool16_t vm, int8_t *rs1, vuint8mf2_t rs2,
                               vint8mf2_t vs3, size_t vl);
void __riscv_vsuxei8_v_i8m1_m(vbool8_t vm, int8_t *rs1, vuint8m1_t rs2,
                              vint8m1_t vs3, size_t vl);
void __riscv_vsuxei8_v_i8m2_m(vbool4_t vm, int8_t *rs1, vuint8m2_t rs2,
                              vint8m2_t vs3, size_t vl);
void __riscv_vsuxei8_v_i8m4_m(vbool2_t vm, int8_t *rs1, vuint8m4_t rs2,
                              vint8m4_t vs3, size_t vl);
void __riscv_vsuxei8_v_i8m8_m(vbool1_t vm, int8_t *rs1, vuint8m8_t rs2,
                              vint8m8_t vs3, size_t vl);
void __riscv_vsuxei16_v_i8mf8_m(vbool64_t vm, int8_t *rs1, vuint16mf4_t rs2,
                                vint8mf8_t vs3, size_t vl);
void __riscv_vsuxei16_v_i8mf4_m(vbool32_t vm, int8_t *rs1, vuint16mf2_t rs2,
                                vint8mf4_t vs3, size_t vl);
void __riscv_vsuxei16_v_i8mf2_m(vbool16_t vm, int8_t *rs1, vuint16m1_t rs2,
                                vint8mf2_t vs3, size_t vl);
void __riscv_vsuxei16_v_i8m1_m(vbool8_t vm, int8_t *rs1, vuint16m2_t rs2,
                               vint8m1_t vs3, size_t vl);
void __riscv_vsuxei16_v_i8m2_m(vbool4_t vm, int8_t *rs1, vuint16m4_t rs2,
                               vint8m2_t vs3, size_t vl);
void __riscv_vsuxei16_v_i8m4_m(vbool2_t vm, int8_t *rs1, vuint16m8_t rs2,
                               vint8m4_t vs3, size_t vl);
void __riscv_vsuxei32_v_i8mf8_m(vbool64_t vm, int8_t *rs1, vuint32mf2_t rs2,
                                vint8mf8_t vs3, size_t vl);
void __riscv_vsuxei32_v_i8mf4_m(vbool32_t vm, int8_t *rs1, vuint32m1_t rs2,
                                vint8mf4_t vs3, size_t vl);
void __riscv_vsuxei32_v_i8mf2_m(vbool16_t vm, int8_t *rs1, vuint32m2_t rs2,
                                vint8mf2_t vs3, size_t vl);
void __riscv_vsuxei32_v_i8m1_m(vbool8_t vm, int8_t *rs1, vuint32m4_t rs2,
                               vint8m1_t vs3, size_t vl);
void __riscv_vsuxei32_v_i8m2_m(vbool4_t vm, int8_t *rs1, vuint32m8_t rs2,
                               vint8m2_t vs3, size_t vl);
void __riscv_vsuxei64_v_i8mf8_m(vbool64_t vm, int8_t *rs1, vuint64m1_t rs2,
                                vint8mf8_t vs3, size_t vl);
void __riscv_vsuxei64_v_i8mf4_m(vbool32_t vm, int8_t *rs1, vuint64m2_t rs2,
                                vint8mf4_t vs3, size_t vl);
void __riscv_vsuxei64_v_i8mf2_m(vbool16_t vm, int8_t *rs1, vuint64m4_t rs2,
                                vint8mf2_t vs3, size_t vl);
void __riscv_vsuxei64_v_i8m1_m(vbool8_t vm, int8_t *rs1, vuint64m8_t rs2,
                               vint8m1_t vs3, size_t vl);
/*
 * Masked (_m) vsuxei{8,16,32,64} stores of int16_t data, LMUL mf4 upward.
 * Every prototype takes (vm, rs1, rs2, vs3, vl): a vboolN_t, an int16_t
 * pointer, an unsigned vector whose element width matches the eiN suffix, a
 * signed data vector, and a size_t. The ei8 and ei16 lists run to i16m8; ei32
 * stops at i16m4 and ei64 at i16m2, i.e. where the rs2 type reaches m8.
 * NOTE(review): roles (vm = mask, rs1 = base address, rs2 = index vector,
 * vs3 = store data, vl = element count) and the "unordered indexed store"
 * meaning of vsuxei follow the RVV naming convention -- confirm in the spec.
 */
void __riscv_vsuxei8_v_i16mf4_m(vbool64_t vm, int16_t *rs1, vuint8mf8_t rs2,
                                vint16mf4_t vs3, size_t vl);
void __riscv_vsuxei8_v_i16mf2_m(vbool32_t vm, int16_t *rs1, vuint8mf4_t rs2,
                                vint16mf2_t vs3, size_t vl);
void __riscv_vsuxei8_v_i16m1_m(vbool16_t vm, int16_t *rs1, vuint8mf2_t rs2,
                               vint16m1_t vs3, size_t vl);
void __riscv_vsuxei8_v_i16m2_m(vbool8_t vm, int16_t *rs1, vuint8m1_t rs2,
                               vint16m2_t vs3, size_t vl);
void __riscv_vsuxei8_v_i16m4_m(vbool4_t vm, int16_t *rs1, vuint8m2_t rs2,
                               vint16m4_t vs3, size_t vl);
void __riscv_vsuxei8_v_i16m8_m(vbool2_t vm, int16_t *rs1, vuint8m4_t rs2,
                               vint16m8_t vs3, size_t vl);
void __riscv_vsuxei16_v_i16mf4_m(vbool64_t vm, int16_t *rs1, vuint16mf4_t rs2,
                                 vint16mf4_t vs3, size_t vl);
void __riscv_vsuxei16_v_i16mf2_m(vbool32_t vm, int16_t *rs1, vuint16mf2_t rs2,
                                 vint16mf2_t vs3, size_t vl);
void __riscv_vsuxei16_v_i16m1_m(vbool16_t vm, int16_t *rs1, vuint16m1_t rs2,
                                vint16m1_t vs3, size_t vl);
void __riscv_vsuxei16_v_i16m2_m(vbool8_t vm, int16_t *rs1, vuint16m2_t rs2,
                                vint16m2_t vs3, size_t vl);
void __riscv_vsuxei16_v_i16m4_m(vbool4_t vm, int16_t *rs1, vuint16m4_t rs2,
                                vint16m4_t vs3, size_t vl);
void __riscv_vsuxei16_v_i16m8_m(vbool2_t vm, int16_t *rs1, vuint16m8_t rs2,
                                vint16m8_t vs3, size_t vl);
void __riscv_vsuxei32_v_i16mf4_m(vbool64_t vm, int16_t *rs1, vuint32mf2_t rs2,
                                 vint16mf4_t vs3, size_t vl);
void __riscv_vsuxei32_v_i16mf2_m(vbool32_t vm, int16_t *rs1, vuint32m1_t rs2,
                                 vint16mf2_t vs3, size_t vl);
void __riscv_vsuxei32_v_i16m1_m(vbool16_t vm, int16_t *rs1, vuint32m2_t rs2,
                                vint16m1_t vs3, size_t vl);
void __riscv_vsuxei32_v_i16m2_m(vbool8_t vm, int16_t *rs1, vuint32m4_t rs2,
                                vint16m2_t vs3, size_t vl);
void __riscv_vsuxei32_v_i16m4_m(vbool4_t vm, int16_t *rs1, vuint32m8_t rs2,
                                vint16m4_t vs3, size_t vl);
void __riscv_vsuxei64_v_i16mf4_m(vbool64_t vm, int16_t *rs1, vuint64m1_t rs2,
                                 vint16mf4_t vs3, size_t vl);
void __riscv_vsuxei64_v_i16mf2_m(vbool32_t vm, int16_t *rs1, vuint64m2_t rs2,
                                 vint16mf2_t vs3, size_t vl);
void __riscv_vsuxei64_v_i16m1_m(vbool16_t vm, int16_t *rs1, vuint64m4_t rs2,
                                vint16m1_t vs3, size_t vl);
void __riscv_vsuxei64_v_i16m2_m(vbool8_t vm, int16_t *rs1, vuint64m8_t rs2,
                                vint16m2_t vs3, size_t vl);
/*
 * Masked (_m) vsuxei{8,16,32,64} stores of int32_t data, LMUL mf2 upward.
 * Every prototype takes (vm, rs1, rs2, vs3, vl): a vboolN_t, an int32_t
 * pointer, an unsigned vector whose element width matches the eiN suffix, a
 * signed data vector, and a size_t. The ei8, ei16 and ei32 lists run to i32m8;
 * ei64 stops at i32m4, where the rs2 type reaches vuint64m8_t.
 * NOTE(review): roles (vm = mask, rs1 = base address, rs2 = index vector,
 * vs3 = store data, vl = element count) and the "unordered indexed store"
 * meaning of vsuxei follow the RVV naming convention -- confirm in the spec.
 */
void __riscv_vsuxei8_v_i32mf2_m(vbool64_t vm, int32_t *rs1, vuint8mf8_t rs2,
                                vint32mf2_t vs3, size_t vl);
void __riscv_vsuxei8_v_i32m1_m(vbool32_t vm, int32_t *rs1, vuint8mf4_t rs2,
                               vint32m1_t vs3, size_t vl);
void __riscv_vsuxei8_v_i32m2_m(vbool16_t vm, int32_t *rs1, vuint8mf2_t rs2,
                               vint32m2_t vs3, size_t vl);
void __riscv_vsuxei8_v_i32m4_m(vbool8_t vm, int32_t *rs1, vuint8m1_t rs2,
                               vint32m4_t vs3, size_t vl);
void __riscv_vsuxei8_v_i32m8_m(vbool4_t vm, int32_t *rs1, vuint8m2_t rs2,
                               vint32m8_t vs3, size_t vl);
void __riscv_vsuxei16_v_i32mf2_m(vbool64_t vm, int32_t *rs1, vuint16mf4_t rs2,
                                 vint32mf2_t vs3, size_t vl);
void __riscv_vsuxei16_v_i32m1_m(vbool32_t vm, int32_t *rs1, vuint16mf2_t rs2,
                                vint32m1_t vs3, size_t vl);
void __riscv_vsuxei16_v_i32m2_m(vbool16_t vm, int32_t *rs1, vuint16m1_t rs2,
                                vint32m2_t vs3, size_t vl);
void __riscv_vsuxei16_v_i32m4_m(vbool8_t vm, int32_t *rs1, vuint16m2_t rs2,
                                vint32m4_t vs3, size_t vl);
void __riscv_vsuxei16_v_i32m8_m(vbool4_t vm, int32_t *rs1, vuint16m4_t rs2,
                                vint32m8_t vs3, size_t vl);
void __riscv_vsuxei32_v_i32mf2_m(vbool64_t vm, int32_t *rs1, vuint32mf2_t rs2,
                                 vint32mf2_t vs3, size_t vl);
void __riscv_vsuxei32_v_i32m1_m(vbool32_t vm, int32_t *rs1, vuint32m1_t rs2,
                                vint32m1_t vs3, size_t vl);
void __riscv_vsuxei32_v_i32m2_m(vbool16_t vm, int32_t *rs1, vuint32m2_t rs2,
                                vint32m2_t vs3, size_t vl);
void __riscv_vsuxei32_v_i32m4_m(vbool8_t vm, int32_t *rs1, vuint32m4_t rs2,
                                vint32m4_t vs3, size_t vl);
void __riscv_vsuxei32_v_i32m8_m(vbool4_t vm, int32_t *rs1, vuint32m8_t rs2,
                                vint32m8_t vs3, size_t vl);
void __riscv_vsuxei64_v_i32mf2_m(vbool64_t vm, int32_t *rs1, vuint64m1_t rs2,
                                 vint32mf2_t vs3, size_t vl);
void __riscv_vsuxei64_v_i32m1_m(vbool32_t vm, int32_t *rs1, vuint64m2_t rs2,
                                vint32m1_t vs3, size_t vl);
void __riscv_vsuxei64_v_i32m2_m(vbool16_t vm, int32_t *rs1, vuint64m4_t rs2,
                                vint32m2_t vs3, size_t vl);
void __riscv_vsuxei64_v_i32m4_m(vbool8_t vm, int32_t *rs1, vuint64m8_t rs2,
                                vint32m4_t vs3, size_t vl);
/*
 * Masked (_m) vsuxei{8,16,32,64} stores of int64_t data, LMUL m1 through m8.
 * Every prototype takes (vm, rs1, rs2, vs3, vl): a vboolN_t, an int64_t
 * pointer, an unsigned vector whose element width matches the eiN suffix, a
 * signed data vector, and a size_t. All four index widths are listed for every
 * data LMUL in this group.
 * NOTE(review): roles (vm = mask, rs1 = base address, rs2 = index vector,
 * vs3 = store data, vl = element count) and the "unordered indexed store"
 * meaning of vsuxei follow the RVV naming convention -- confirm in the spec.
 */
void __riscv_vsuxei8_v_i64m1_m(vbool64_t vm, int64_t *rs1, vuint8mf8_t rs2,
                               vint64m1_t vs3, size_t vl);
void __riscv_vsuxei8_v_i64m2_m(vbool32_t vm, int64_t *rs1, vuint8mf4_t rs2,
                               vint64m2_t vs3, size_t vl);
void __riscv_vsuxei8_v_i64m4_m(vbool16_t vm, int64_t *rs1, vuint8mf2_t rs2,
                               vint64m4_t vs3, size_t vl);
void __riscv_vsuxei8_v_i64m8_m(vbool8_t vm, int64_t *rs1, vuint8m1_t rs2,
                               vint64m8_t vs3, size_t vl);
void __riscv_vsuxei16_v_i64m1_m(vbool64_t vm, int64_t *rs1, vuint16mf4_t rs2,
                                vint64m1_t vs3, size_t vl);
void __riscv_vsuxei16_v_i64m2_m(vbool32_t vm, int64_t *rs1, vuint16mf2_t rs2,
                                vint64m2_t vs3, size_t vl);
void __riscv_vsuxei16_v_i64m4_m(vbool16_t vm, int64_t *rs1, vuint16m1_t rs2,
                                vint64m4_t vs3, size_t vl);
void __riscv_vsuxei16_v_i64m8_m(vbool8_t vm, int64_t *rs1, vuint16m2_t rs2,
                                vint64m8_t vs3, size_t vl);
void __riscv_vsuxei32_v_i64m1_m(vbool64_t vm, int64_t *rs1, vuint32mf2_t rs2,
                                vint64m1_t vs3, size_t vl);
void __riscv_vsuxei32_v_i64m2_m(vbool32_t vm, int64_t *rs1, vuint32m1_t rs2,
                                vint64m2_t vs3, size_t vl);
void __riscv_vsuxei32_v_i64m4_m(vbool16_t vm, int64_t *rs1, vuint32m2_t rs2,
                                vint64m4_t vs3, size_t vl);
void __riscv_vsuxei32_v_i64m8_m(vbool8_t vm, int64_t *rs1, vuint32m4_t rs2,
                                vint64m8_t vs3, size_t vl);
void __riscv_vsuxei64_v_i64m1_m(vbool64_t vm, int64_t *rs1, vuint64m1_t rs2,
                                vint64m1_t vs3, size_t vl);
void __riscv_vsuxei64_v_i64m2_m(vbool32_t vm, int64_t *rs1, vuint64m2_t rs2,
                                vint64m2_t vs3, size_t vl);
void __riscv_vsuxei64_v_i64m4_m(vbool16_t vm, int64_t *rs1, vuint64m4_t rs2,
                                vint64m4_t vs3, size_t vl);
void __riscv_vsuxei64_v_i64m8_m(vbool8_t vm, int64_t *rs1, vuint64m8_t rs2,
                                vint64m8_t vs3, size_t vl);
/*
 * Masked (_m) vsoxei{8,16,32,64} stores of uint8_t data, LMUL mf8 upward.
 * Every prototype takes (vm, rs1, rs2, vs3, vl): a vboolN_t, a uint8_t pointer,
 * an unsigned vector whose element width matches the eiN suffix, an unsigned
 * data vector, and a size_t. The ei8 list runs to u8m8; ei16 stops at u8m4,
 * ei32 at u8m2 and ei64 at u8m1, i.e. where the rs2 type reaches m8.
 * NOTE(review): roles (vm = mask, rs1 = base address, rs2 = index vector,
 * vs3 = store data, vl = element count) and the "ordered indexed store"
 * meaning of vsoxei follow the RVV naming convention -- confirm in the spec.
 */
void __riscv_vsoxei8_v_u8mf8_m(vbool64_t vm, uint8_t *rs1, vuint8mf8_t rs2,
                               vuint8mf8_t vs3, size_t vl);
void __riscv_vsoxei8_v_u8mf4_m(vbool32_t vm, uint8_t *rs1, vuint8mf4_t rs2,
                               vuint8mf4_t vs3, size_t vl);
void __riscv_vsoxei8_v_u8mf2_m(vbool16_t vm, uint8_t *rs1, vuint8mf2_t rs2,
                               vuint8mf2_t vs3, size_t vl);
void __riscv_vsoxei8_v_u8m1_m(vbool8_t vm, uint8_t *rs1, vuint8m1_t rs2,
                              vuint8m1_t vs3, size_t vl);
void __riscv_vsoxei8_v_u8m2_m(vbool4_t vm, uint8_t *rs1, vuint8m2_t rs2,
                              vuint8m2_t vs3, size_t vl);
void __riscv_vsoxei8_v_u8m4_m(vbool2_t vm, uint8_t *rs1, vuint8m4_t rs2,
                              vuint8m4_t vs3, size_t vl);
void __riscv_vsoxei8_v_u8m8_m(vbool1_t vm, uint8_t *rs1, vuint8m8_t rs2,
                              vuint8m8_t vs3, size_t vl);
void __riscv_vsoxei16_v_u8mf8_m(vbool64_t vm, uint8_t *rs1, vuint16mf4_t rs2,
                                vuint8mf8_t vs3, size_t vl);
void __riscv_vsoxei16_v_u8mf4_m(vbool32_t vm, uint8_t *rs1, vuint16mf2_t rs2,
                                vuint8mf4_t vs3, size_t vl);
void __riscv_vsoxei16_v_u8mf2_m(vbool16_t vm, uint8_t *rs1, vuint16m1_t rs2,
                                vuint8mf2_t vs3, size_t vl);
void __riscv_vsoxei16_v_u8m1_m(vbool8_t vm, uint8_t *rs1, vuint16m2_t rs2,
                               vuint8m1_t vs3, size_t vl);
void __riscv_vsoxei16_v_u8m2_m(vbool4_t vm, uint8_t *rs1, vuint16m4_t rs2,
                               vuint8m2_t vs3, size_t vl);
void __riscv_vsoxei16_v_u8m4_m(vbool2_t vm, uint8_t *rs1, vuint16m8_t rs2,
                               vuint8m4_t vs3, size_t vl);
void __riscv_vsoxei32_v_u8mf8_m(vbool64_t vm, uint8_t *rs1, vuint32mf2_t rs2,
                                vuint8mf8_t vs3, size_t vl);
void __riscv_vsoxei32_v_u8mf4_m(vbool32_t vm, uint8_t *rs1, vuint32m1_t rs2,
                                vuint8mf4_t vs3, size_t vl);
void __riscv_vsoxei32_v_u8mf2_m(vbool16_t vm, uint8_t *rs1, vuint32m2_t rs2,
                                vuint8mf2_t vs3, size_t vl);
void __riscv_vsoxei32_v_u8m1_m(vbool8_t vm, uint8_t *rs1, vuint32m4_t rs2,
                               vuint8m1_t vs3, size_t vl);
void __riscv_vsoxei32_v_u8m2_m(vbool4_t vm, uint8_t *rs1, vuint32m8_t rs2,
                               vuint8m2_t vs3, size_t vl);
void __riscv_vsoxei64_v_u8mf8_m(vbool64_t vm, uint8_t *rs1, vuint64m1_t rs2,
                                vuint8mf8_t vs3, size_t vl);
void __riscv_vsoxei64_v_u8mf4_m(vbool32_t vm, uint8_t *rs1, vuint64m2_t rs2,
                                vuint8mf4_t vs3, size_t vl);
void __riscv_vsoxei64_v_u8mf2_m(vbool16_t vm, uint8_t *rs1, vuint64m4_t rs2,
                                vuint8mf2_t vs3, size_t vl);
void __riscv_vsoxei64_v_u8m1_m(vbool8_t vm, uint8_t *rs1, vuint64m8_t rs2,
                               vuint8m1_t vs3, size_t vl);
/*
 * Masked (_m) vsoxei{8,16,32,64} stores of uint16_t data, LMUL mf4 upward.
 * Every prototype takes (vm, rs1, rs2, vs3, vl): a vboolN_t, a uint16_t
 * pointer, an unsigned vector whose element width matches the eiN suffix, an
 * unsigned data vector, and a size_t. The ei8 and ei16 lists run to u16m8;
 * ei32 stops at u16m4 and ei64 at u16m2, i.e. where the rs2 type reaches m8.
 * NOTE(review): roles (vm = mask, rs1 = base address, rs2 = index vector,
 * vs3 = store data, vl = element count) and the "ordered indexed store"
 * meaning of vsoxei follow the RVV naming convention -- confirm in the spec.
 */
void __riscv_vsoxei8_v_u16mf4_m(vbool64_t vm, uint16_t *rs1, vuint8mf8_t rs2,
                                vuint16mf4_t vs3, size_t vl);
void __riscv_vsoxei8_v_u16mf2_m(vbool32_t vm, uint16_t *rs1, vuint8mf4_t rs2,
                                vuint16mf2_t vs3, size_t vl);
void __riscv_vsoxei8_v_u16m1_m(vbool16_t vm, uint16_t *rs1, vuint8mf2_t rs2,
                               vuint16m1_t vs3, size_t vl);
void __riscv_vsoxei8_v_u16m2_m(vbool8_t vm, uint16_t *rs1, vuint8m1_t rs2,
                               vuint16m2_t vs3, size_t vl);
void __riscv_vsoxei8_v_u16m4_m(vbool4_t vm, uint16_t *rs1, vuint8m2_t rs2,
                               vuint16m4_t vs3, size_t vl);
void __riscv_vsoxei8_v_u16m8_m(vbool2_t vm, uint16_t *rs1, vuint8m4_t rs2,
                               vuint16m8_t vs3, size_t vl);
void __riscv_vsoxei16_v_u16mf4_m(vbool64_t vm, uint16_t *rs1, vuint16mf4_t rs2,
                                 vuint16mf4_t vs3, size_t vl);
void __riscv_vsoxei16_v_u16mf2_m(vbool32_t vm, uint16_t *rs1, vuint16mf2_t rs2,
                                 vuint16mf2_t vs3, size_t vl);
void __riscv_vsoxei16_v_u16m1_m(vbool16_t vm, uint16_t *rs1, vuint16m1_t rs2,
                                vuint16m1_t vs3, size_t vl);
void __riscv_vsoxei16_v_u16m2_m(vbool8_t vm, uint16_t *rs1, vuint16m2_t rs2,
                                vuint16m2_t vs3, size_t vl);
void __riscv_vsoxei16_v_u16m4_m(vbool4_t vm, uint16_t *rs1, vuint16m4_t rs2,
                                vuint16m4_t vs3, size_t vl);
void __riscv_vsoxei16_v_u16m8_m(vbool2_t vm, uint16_t *rs1, vuint16m8_t rs2,
                                vuint16m8_t vs3, size_t vl);
void __riscv_vsoxei32_v_u16mf4_m(vbool64_t vm, uint16_t *rs1, vuint32mf2_t rs2,
                                 vuint16mf4_t vs3, size_t vl);
void __riscv_vsoxei32_v_u16mf2_m(vbool32_t vm, uint16_t *rs1, vuint32m1_t rs2,
                                 vuint16mf2_t vs3, size_t vl);
void __riscv_vsoxei32_v_u16m1_m(vbool16_t vm, uint16_t *rs1, vuint32m2_t rs2,
                                vuint16m1_t vs3, size_t vl);
void __riscv_vsoxei32_v_u16m2_m(vbool8_t vm, uint16_t *rs1, vuint32m4_t rs2,
                                vuint16m2_t vs3, size_t vl);
void __riscv_vsoxei32_v_u16m4_m(vbool4_t vm, uint16_t *rs1, vuint32m8_t rs2,
                                vuint16m4_t vs3, size_t vl);
void __riscv_vsoxei64_v_u16mf4_m(vbool64_t vm, uint16_t *rs1, vuint64m1_t rs2,
                                 vuint16mf4_t vs3, size_t vl);
void __riscv_vsoxei64_v_u16mf2_m(vbool32_t vm, uint16_t *rs1, vuint64m2_t rs2,
                                 vuint16mf2_t vs3, size_t vl);
void __riscv_vsoxei64_v_u16m1_m(vbool16_t vm, uint16_t *rs1, vuint64m4_t rs2,
                                vuint16m1_t vs3, size_t vl);
void __riscv_vsoxei64_v_u16m2_m(vbool8_t vm, uint16_t *rs1, vuint64m8_t rs2,
                                vuint16m2_t vs3, size_t vl);
/*
 * Masked (_m) vsoxei{8,16,32,64} stores of uint32_t data, LMUL mf2 upward.
 * Every prototype takes (vm, rs1, rs2, vs3, vl): a vboolN_t, a uint32_t
 * pointer, an unsigned vector whose element width matches the eiN suffix, an
 * unsigned data vector, and a size_t. The ei8, ei16 and ei32 lists run to
 * u32m8; ei64 stops at u32m4, where the rs2 type reaches vuint64m8_t.
 * NOTE(review): roles (vm = mask, rs1 = base address, rs2 = index vector,
 * vs3 = store data, vl = element count) and the "ordered indexed store"
 * meaning of vsoxei follow the RVV naming convention -- confirm in the spec.
 */
void __riscv_vsoxei8_v_u32mf2_m(vbool64_t vm, uint32_t *rs1, vuint8mf8_t rs2,
                                vuint32mf2_t vs3, size_t vl);
void __riscv_vsoxei8_v_u32m1_m(vbool32_t vm, uint32_t *rs1, vuint8mf4_t rs2,
                               vuint32m1_t vs3, size_t vl);
void __riscv_vsoxei8_v_u32m2_m(vbool16_t vm, uint32_t *rs1, vuint8mf2_t rs2,
                               vuint32m2_t vs3, size_t vl);
void __riscv_vsoxei8_v_u32m4_m(vbool8_t vm, uint32_t *rs1, vuint8m1_t rs2,
                               vuint32m4_t vs3, size_t vl);
void __riscv_vsoxei8_v_u32m8_m(vbool4_t vm, uint32_t *rs1, vuint8m2_t rs2,
                               vuint32m8_t vs3, size_t vl);
void __riscv_vsoxei16_v_u32mf2_m(vbool64_t vm, uint32_t *rs1, vuint16mf4_t rs2,
                                 vuint32mf2_t vs3, size_t vl);
void __riscv_vsoxei16_v_u32m1_m(vbool32_t vm, uint32_t *rs1, vuint16mf2_t rs2,
                                vuint32m1_t vs3, size_t vl);
void __riscv_vsoxei16_v_u32m2_m(vbool16_t vm, uint32_t *rs1, vuint16m1_t rs2,
                                vuint32m2_t vs3, size_t vl);
void __riscv_vsoxei16_v_u32m4_m(vbool8_t vm, uint32_t *rs1, vuint16m2_t rs2,
                                vuint32m4_t vs3, size_t vl);
void __riscv_vsoxei16_v_u32m8_m(vbool4_t vm, uint32_t *rs1, vuint16m4_t rs2,
                                vuint32m8_t vs3, size_t vl);
void __riscv_vsoxei32_v_u32mf2_m(vbool64_t vm, uint32_t *rs1, vuint32mf2_t rs2,
                                 vuint32mf2_t vs3, size_t vl);
void __riscv_vsoxei32_v_u32m1_m(vbool32_t vm, uint32_t *rs1, vuint32m1_t rs2,
                                vuint32m1_t vs3, size_t vl);
void __riscv_vsoxei32_v_u32m2_m(vbool16_t vm, uint32_t *rs1, vuint32m2_t rs2,
                                vuint32m2_t vs3, size_t vl);
void __riscv_vsoxei32_v_u32m4_m(vbool8_t vm, uint32_t *rs1, vuint32m4_t rs2,
                                vuint32m4_t vs3, size_t vl);
void __riscv_vsoxei32_v_u32m8_m(vbool4_t vm, uint32_t *rs1, vuint32m8_t rs2,
                                vuint32m8_t vs3, size_t vl);
void __riscv_vsoxei64_v_u32mf2_m(vbool64_t vm, uint32_t *rs1, vuint64m1_t rs2,
                                 vuint32mf2_t vs3, size_t vl);
void __riscv_vsoxei64_v_u32m1_m(vbool32_t vm, uint32_t *rs1, vuint64m2_t rs2,
                                vuint32m1_t vs3, size_t vl);
void __riscv_vsoxei64_v_u32m2_m(vbool16_t vm, uint32_t *rs1, vuint64m4_t rs2,
                                vuint32m2_t vs3, size_t vl);
void __riscv_vsoxei64_v_u32m4_m(vbool8_t vm, uint32_t *rs1, vuint64m8_t rs2,
                                vuint32m4_t vs3, size_t vl);
/*
 * Masked (_m) vsoxei{8,16,32,64} stores of uint64_t data, LMUL m1 through m8.
 * Every prototype takes (vm, rs1, rs2, vs3, vl): a vboolN_t, a uint64_t
 * pointer, an unsigned vector whose element width matches the eiN suffix, an
 * unsigned data vector, and a size_t. All four index widths are listed for
 * every data LMUL in this group.
 * NOTE(review): roles (vm = mask, rs1 = base address, rs2 = index vector,
 * vs3 = store data, vl = element count) and the "ordered indexed store"
 * meaning of vsoxei follow the RVV naming convention -- confirm in the spec.
 */
void __riscv_vsoxei8_v_u64m1_m(vbool64_t vm, uint64_t *rs1, vuint8mf8_t rs2,
                               vuint64m1_t vs3, size_t vl);
void __riscv_vsoxei8_v_u64m2_m(vbool32_t vm, uint64_t *rs1, vuint8mf4_t rs2,
                               vuint64m2_t vs3, size_t vl);
void __riscv_vsoxei8_v_u64m4_m(vbool16_t vm, uint64_t *rs1, vuint8mf2_t rs2,
                               vuint64m4_t vs3, size_t vl);
void __riscv_vsoxei8_v_u64m8_m(vbool8_t vm, uint64_t *rs1, vuint8m1_t rs2,
                               vuint64m8_t vs3, size_t vl);
void __riscv_vsoxei16_v_u64m1_m(vbool64_t vm, uint64_t *rs1, vuint16mf4_t rs2,
                                vuint64m1_t vs3, size_t vl);
void __riscv_vsoxei16_v_u64m2_m(vbool32_t vm, uint64_t *rs1, vuint16mf2_t rs2,
                                vuint64m2_t vs3, size_t vl);
void __riscv_vsoxei16_v_u64m4_m(vbool16_t vm, uint64_t *rs1, vuint16m1_t rs2,
                                vuint64m4_t vs3, size_t vl);
void __riscv_vsoxei16_v_u64m8_m(vbool8_t vm, uint64_t *rs1, vuint16m2_t rs2,
                                vuint64m8_t vs3, size_t vl);
void __riscv_vsoxei32_v_u64m1_m(vbool64_t vm, uint64_t *rs1, vuint32mf2_t rs2,
                                vuint64m1_t vs3, size_t vl);
void __riscv_vsoxei32_v_u64m2_m(vbool32_t vm, uint64_t *rs1, vuint32m1_t rs2,
                                vuint64m2_t vs3, size_t vl);
void __riscv_vsoxei32_v_u64m4_m(vbool16_t vm, uint64_t *rs1, vuint32m2_t rs2,
                                vuint64m4_t vs3, size_t vl);
void __riscv_vsoxei32_v_u64m8_m(vbool8_t vm, uint64_t *rs1, vuint32m4_t rs2,
                                vuint64m8_t vs3, size_t vl);
void __riscv_vsoxei64_v_u64m1_m(vbool64_t vm, uint64_t *rs1, vuint64m1_t rs2,
                                vuint64m1_t vs3, size_t vl);
void __riscv_vsoxei64_v_u64m2_m(vbool32_t vm, uint64_t *rs1, vuint64m2_t rs2,
                                vuint64m2_t vs3, size_t vl);
void __riscv_vsoxei64_v_u64m4_m(vbool16_t vm, uint64_t *rs1, vuint64m4_t rs2,
                                vuint64m4_t vs3, size_t vl);
void __riscv_vsoxei64_v_u64m8_m(vbool8_t vm, uint64_t *rs1, vuint64m8_t rs2,
                                vuint64m8_t vs3, size_t vl);
/*
 * Masked (_m) vsuxei{8,16,32,64} stores of uint8_t data, LMUL mf8 upward.
 * Every prototype takes (vm, rs1, rs2, vs3, vl): a vboolN_t, a uint8_t pointer,
 * an unsigned vector whose element width matches the eiN suffix, an unsigned
 * data vector, and a size_t. The ei8 list runs to u8m8; ei16 stops at u8m4,
 * ei32 at u8m2 and ei64 at u8m1, i.e. where the rs2 type reaches m8.
 * NOTE(review): roles (vm = mask, rs1 = base address, rs2 = index vector,
 * vs3 = store data, vl = element count) and the "unordered indexed store"
 * meaning of vsuxei follow the RVV naming convention -- confirm in the spec.
 */
void __riscv_vsuxei8_v_u8mf8_m(vbool64_t vm, uint8_t *rs1, vuint8mf8_t rs2,
                               vuint8mf8_t vs3, size_t vl);
void __riscv_vsuxei8_v_u8mf4_m(vbool32_t vm, uint8_t *rs1, vuint8mf4_t rs2,
                               vuint8mf4_t vs3, size_t vl);
void __riscv_vsuxei8_v_u8mf2_m(vbool16_t vm, uint8_t *rs1, vuint8mf2_t rs2,
                               vuint8mf2_t vs3, size_t vl);
void __riscv_vsuxei8_v_u8m1_m(vbool8_t vm, uint8_t *rs1, vuint8m1_t rs2,
                              vuint8m1_t vs3, size_t vl);
void __riscv_vsuxei8_v_u8m2_m(vbool4_t vm, uint8_t *rs1, vuint8m2_t rs2,
                              vuint8m2_t vs3, size_t vl);
void __riscv_vsuxei8_v_u8m4_m(vbool2_t vm, uint8_t *rs1, vuint8m4_t rs2,
                              vuint8m4_t vs3, size_t vl);
void __riscv_vsuxei8_v_u8m8_m(vbool1_t vm, uint8_t *rs1, vuint8m8_t rs2,
                              vuint8m8_t vs3, size_t vl);
void __riscv_vsuxei16_v_u8mf8_m(vbool64_t vm, uint8_t *rs1, vuint16mf4_t rs2,
                                vuint8mf8_t vs3, size_t vl);
void __riscv_vsuxei16_v_u8mf4_m(vbool32_t vm, uint8_t *rs1, vuint16mf2_t rs2,
                                vuint8mf4_t vs3, size_t vl);
void __riscv_vsuxei16_v_u8mf2_m(vbool16_t vm, uint8_t *rs1, vuint16m1_t rs2,
                                vuint8mf2_t vs3, size_t vl);
void __riscv_vsuxei16_v_u8m1_m(vbool8_t vm, uint8_t *rs1, vuint16m2_t rs2,
                               vuint8m1_t vs3, size_t vl);
void __riscv_vsuxei16_v_u8m2_m(vbool4_t vm, uint8_t *rs1, vuint16m4_t rs2,
                               vuint8m2_t vs3, size_t vl);
void __riscv_vsuxei16_v_u8m4_m(vbool2_t vm, uint8_t *rs1, vuint16m8_t rs2,
                               vuint8m4_t vs3, size_t vl);
void __riscv_vsuxei32_v_u8mf8_m(vbool64_t vm, uint8_t *rs1, vuint32mf2_t rs2,
                                vuint8mf8_t vs3, size_t vl);
void __riscv_vsuxei32_v_u8mf4_m(vbool32_t vm, uint8_t *rs1, vuint32m1_t rs2,
                                vuint8mf4_t vs3, size_t vl);
void __riscv_vsuxei32_v_u8mf2_m(vbool16_t vm, uint8_t *rs1, vuint32m2_t rs2,
                                vuint8mf2_t vs3, size_t vl);
void __riscv_vsuxei32_v_u8m1_m(vbool8_t vm, uint8_t *rs1, vuint32m4_t rs2,
                               vuint8m1_t vs3, size_t vl);
void __riscv_vsuxei32_v_u8m2_m(vbool4_t vm, uint8_t *rs1, vuint32m8_t rs2,
                               vuint8m2_t vs3, size_t vl);
void __riscv_vsuxei64_v_u8mf8_m(vbool64_t vm, uint8_t *rs1, vuint64m1_t rs2,
                                vuint8mf8_t vs3, size_t vl);
void __riscv_vsuxei64_v_u8mf4_m(vbool32_t vm, uint8_t *rs1, vuint64m2_t rs2,
                                vuint8mf4_t vs3, size_t vl);
void __riscv_vsuxei64_v_u8mf2_m(vbool16_t vm, uint8_t *rs1, vuint64m4_t rs2,
                                vuint8mf2_t vs3, size_t vl);
void __riscv_vsuxei64_v_u8m1_m(vbool8_t vm, uint8_t *rs1, vuint64m8_t rs2,
                               vuint8m1_t vs3, size_t vl);
// Masked (`_m`) vsuxei8 / 16 / 32 / 64 store prototypes for uint16_t data.
// Parameters: vm = mask, rs1 = writable base pointer, rs2 = index vector,
// vs3 = data vector, vl = vector length.
// Index LMUL relative to the data LMUL: 1/2x for ei8, 1x for ei16, 2x for
// ei32, 4x for ei64. The ei32 and ei64 sub-lists stop at u16m4 and u16m2
// respectively, where the index vector reaches m8.
// Mask type: vbool<N>_t with N = 16 / LMUL (vbool64_t for mf4 ... vbool2_t
// for m8).
void __riscv_vsuxei8_v_u16mf4_m(vbool64_t vm, uint16_t *rs1, vuint8mf8_t rs2,
                                vuint16mf4_t vs3, size_t vl);
void __riscv_vsuxei8_v_u16mf2_m(vbool32_t vm, uint16_t *rs1, vuint8mf4_t rs2,
                                vuint16mf2_t vs3, size_t vl);
void __riscv_vsuxei8_v_u16m1_m(vbool16_t vm, uint16_t *rs1, vuint8mf2_t rs2,
                               vuint16m1_t vs3, size_t vl);
void __riscv_vsuxei8_v_u16m2_m(vbool8_t vm, uint16_t *rs1, vuint8m1_t rs2,
                               vuint16m2_t vs3, size_t vl);
void __riscv_vsuxei8_v_u16m4_m(vbool4_t vm, uint16_t *rs1, vuint8m2_t rs2,
                               vuint16m4_t vs3, size_t vl);
void __riscv_vsuxei8_v_u16m8_m(vbool2_t vm, uint16_t *rs1, vuint8m4_t rs2,
                               vuint16m8_t vs3, size_t vl);
void __riscv_vsuxei16_v_u16mf4_m(vbool64_t vm, uint16_t *rs1, vuint16mf4_t rs2,
                                 vuint16mf4_t vs3, size_t vl);
void __riscv_vsuxei16_v_u16mf2_m(vbool32_t vm, uint16_t *rs1, vuint16mf2_t rs2,
                                 vuint16mf2_t vs3, size_t vl);
void __riscv_vsuxei16_v_u16m1_m(vbool16_t vm, uint16_t *rs1, vuint16m1_t rs2,
                                vuint16m1_t vs3, size_t vl);
void __riscv_vsuxei16_v_u16m2_m(vbool8_t vm, uint16_t *rs1, vuint16m2_t rs2,
                                vuint16m2_t vs3, size_t vl);
void __riscv_vsuxei16_v_u16m4_m(vbool4_t vm, uint16_t *rs1, vuint16m4_t rs2,
                                vuint16m4_t vs3, size_t vl);
void __riscv_vsuxei16_v_u16m8_m(vbool2_t vm, uint16_t *rs1, vuint16m8_t rs2,
                                vuint16m8_t vs3, size_t vl);
void __riscv_vsuxei32_v_u16mf4_m(vbool64_t vm, uint16_t *rs1, vuint32mf2_t rs2,
                                 vuint16mf4_t vs3, size_t vl);
void __riscv_vsuxei32_v_u16mf2_m(vbool32_t vm, uint16_t *rs1, vuint32m1_t rs2,
                                 vuint16mf2_t vs3, size_t vl);
void __riscv_vsuxei32_v_u16m1_m(vbool16_t vm, uint16_t *rs1, vuint32m2_t rs2,
                                vuint16m1_t vs3, size_t vl);
void __riscv_vsuxei32_v_u16m2_m(vbool8_t vm, uint16_t *rs1, vuint32m4_t rs2,
                                vuint16m2_t vs3, size_t vl);
void __riscv_vsuxei32_v_u16m4_m(vbool4_t vm, uint16_t *rs1, vuint32m8_t rs2,
                                vuint16m4_t vs3, size_t vl);
void __riscv_vsuxei64_v_u16mf4_m(vbool64_t vm, uint16_t *rs1, vuint64m1_t rs2,
                                 vuint16mf4_t vs3, size_t vl);
void __riscv_vsuxei64_v_u16mf2_m(vbool32_t vm, uint16_t *rs1, vuint64m2_t rs2,
                                 vuint16mf2_t vs3, size_t vl);
void __riscv_vsuxei64_v_u16m1_m(vbool16_t vm, uint16_t *rs1, vuint64m4_t rs2,
                                vuint16m1_t vs3, size_t vl);
void __riscv_vsuxei64_v_u16m2_m(vbool8_t vm, uint16_t *rs1, vuint64m8_t rs2,
                                vuint16m2_t vs3, size_t vl);
// Masked (`_m`) vsuxei8 / 16 / 32 / 64 store prototypes for uint32_t data.
// Parameters: vm = mask, rs1 = writable base pointer, rs2 = index vector,
// vs3 = data vector, vl = vector length.
// Index LMUL relative to the data LMUL: 1/4x for ei8, 1/2x for ei16, 1x for
// ei32, 2x for ei64. Only the ei64 sub-list is shortened (it stops at u32m4,
// where the index vector reaches m8).
// Mask type: vbool<N>_t with N = 32 / LMUL (vbool64_t for mf2 ... vbool4_t
// for m8).
void __riscv_vsuxei8_v_u32mf2_m(vbool64_t vm, uint32_t *rs1, vuint8mf8_t rs2,
                                vuint32mf2_t vs3, size_t vl);
void __riscv_vsuxei8_v_u32m1_m(vbool32_t vm, uint32_t *rs1, vuint8mf4_t rs2,
                               vuint32m1_t vs3, size_t vl);
void __riscv_vsuxei8_v_u32m2_m(vbool16_t vm, uint32_t *rs1, vuint8mf2_t rs2,
                               vuint32m2_t vs3, size_t vl);
void __riscv_vsuxei8_v_u32m4_m(vbool8_t vm, uint32_t *rs1, vuint8m1_t rs2,
                               vuint32m4_t vs3, size_t vl);
void __riscv_vsuxei8_v_u32m8_m(vbool4_t vm, uint32_t *rs1, vuint8m2_t rs2,
                               vuint32m8_t vs3, size_t vl);
void __riscv_vsuxei16_v_u32mf2_m(vbool64_t vm, uint32_t *rs1, vuint16mf4_t rs2,
                                 vuint32mf2_t vs3, size_t vl);
void __riscv_vsuxei16_v_u32m1_m(vbool32_t vm, uint32_t *rs1, vuint16mf2_t rs2,
                                vuint32m1_t vs3, size_t vl);
void __riscv_vsuxei16_v_u32m2_m(vbool16_t vm, uint32_t *rs1, vuint16m1_t rs2,
                                vuint32m2_t vs3, size_t vl);
void __riscv_vsuxei16_v_u32m4_m(vbool8_t vm, uint32_t *rs1, vuint16m2_t rs2,
                                vuint32m4_t vs3, size_t vl);
void __riscv_vsuxei16_v_u32m8_m(vbool4_t vm, uint32_t *rs1, vuint16m4_t rs2,
                                vuint32m8_t vs3, size_t vl);
void __riscv_vsuxei32_v_u32mf2_m(vbool64_t vm, uint32_t *rs1, vuint32mf2_t rs2,
                                 vuint32mf2_t vs3, size_t vl);
void __riscv_vsuxei32_v_u32m1_m(vbool32_t vm, uint32_t *rs1, vuint32m1_t rs2,
                                vuint32m1_t vs3, size_t vl);
void __riscv_vsuxei32_v_u32m2_m(vbool16_t vm, uint32_t *rs1, vuint32m2_t rs2,
                                vuint32m2_t vs3, size_t vl);
void __riscv_vsuxei32_v_u32m4_m(vbool8_t vm, uint32_t *rs1, vuint32m4_t rs2,
                                vuint32m4_t vs3, size_t vl);
void __riscv_vsuxei32_v_u32m8_m(vbool4_t vm, uint32_t *rs1, vuint32m8_t rs2,
                                vuint32m8_t vs3, size_t vl);
void __riscv_vsuxei64_v_u32mf2_m(vbool64_t vm, uint32_t *rs1, vuint64m1_t rs2,
                                 vuint32mf2_t vs3, size_t vl);
void __riscv_vsuxei64_v_u32m1_m(vbool32_t vm, uint32_t *rs1, vuint64m2_t rs2,
                                vuint32m1_t vs3, size_t vl);
void __riscv_vsuxei64_v_u32m2_m(vbool16_t vm, uint32_t *rs1, vuint64m4_t rs2,
                                vuint32m2_t vs3, size_t vl);
void __riscv_vsuxei64_v_u32m4_m(vbool8_t vm, uint32_t *rs1, vuint64m8_t rs2,
                                vuint32m4_t vs3, size_t vl);
// Masked (`_m`) vsuxei8 / 16 / 32 / 64 store prototypes for uint64_t data.
// Parameters: vm = mask, rs1 = writable base pointer, rs2 = index vector,
// vs3 = data vector, vl = vector length.
// Index LMUL relative to the data LMUL: 1/8x for ei8, 1/4x for ei16, 1/2x for
// ei32, 1x for ei64. The index vector never exceeds the data LMUL, so every
// index width is listed for all of m1, m2, m4 and m8.
// Mask type: vbool<N>_t with N = 64 / LMUL (vbool64_t for m1 ... vbool8_t
// for m8).
void __riscv_vsuxei8_v_u64m1_m(vbool64_t vm, uint64_t *rs1, vuint8mf8_t rs2,
                               vuint64m1_t vs3, size_t vl);
void __riscv_vsuxei8_v_u64m2_m(vbool32_t vm, uint64_t *rs1, vuint8mf4_t rs2,
                               vuint64m2_t vs3, size_t vl);
void __riscv_vsuxei8_v_u64m4_m(vbool16_t vm, uint64_t *rs1, vuint8mf2_t rs2,
                               vuint64m4_t vs3, size_t vl);
void __riscv_vsuxei8_v_u64m8_m(vbool8_t vm, uint64_t *rs1, vuint8m1_t rs2,
                               vuint64m8_t vs3, size_t vl);
void __riscv_vsuxei16_v_u64m1_m(vbool64_t vm, uint64_t *rs1, vuint16mf4_t rs2,
                                vuint64m1_t vs3, size_t vl);
void __riscv_vsuxei16_v_u64m2_m(vbool32_t vm, uint64_t *rs1, vuint16mf2_t rs2,
                                vuint64m2_t vs3, size_t vl);
void __riscv_vsuxei16_v_u64m4_m(vbool16_t vm, uint64_t *rs1, vuint16m1_t rs2,
                                vuint64m4_t vs3, size_t vl);
void __riscv_vsuxei16_v_u64m8_m(vbool8_t vm, uint64_t *rs1, vuint16m2_t rs2,
                                vuint64m8_t vs3, size_t vl);
void __riscv_vsuxei32_v_u64m1_m(vbool64_t vm, uint64_t *rs1, vuint32mf2_t rs2,
                                vuint64m1_t vs3, size_t vl);
void __riscv_vsuxei32_v_u64m2_m(vbool32_t vm, uint64_t *rs1, vuint32m1_t rs2,
                                vuint64m2_t vs3, size_t vl);
void __riscv_vsuxei32_v_u64m4_m(vbool16_t vm, uint64_t *rs1, vuint32m2_t rs2,
                                vuint64m4_t vs3, size_t vl);
void __riscv_vsuxei32_v_u64m8_m(vbool8_t vm, uint64_t *rs1, vuint32m4_t rs2,
                                vuint64m8_t vs3, size_t vl);
void __riscv_vsuxei64_v_u64m1_m(vbool64_t vm, uint64_t *rs1, vuint64m1_t rs2,
                                vuint64m1_t vs3, size_t vl);
void __riscv_vsuxei64_v_u64m2_m(vbool32_t vm, uint64_t *rs1, vuint64m2_t rs2,
                                vuint64m2_t vs3, size_t vl);
void __riscv_vsuxei64_v_u64m4_m(vbool16_t vm, uint64_t *rs1, vuint64m4_t rs2,
                                vuint64m4_t vs3, size_t vl);
void __riscv_vsuxei64_v_u64m8_m(vbool8_t vm, uint64_t *rs1, vuint64m8_t rs2,
                                vuint64m8_t vs3, size_t vl);

Vector Unit-Stride Fault-Only-First Load Intrinsics

// Unmasked fault-only-first load prototypes for floating-point elements
// (_Float16, float, double). The `vle<N>ff` width in the name matches the
// element width of the returned vector type.
// Parameters: rs1 = read-only source pointer, new_vl = writable size_t
// output, vl = requested vector length.
// NOTE(review): new_vl presumably receives the element count actually
// loaded when a fault truncates the access — confirm against the RVV
// intrinsics specification.
vfloat16mf4_t __riscv_vle16ff_v_f16mf4(const _Float16 *rs1, size_t *new_vl,
                                       size_t vl);
vfloat16mf2_t __riscv_vle16ff_v_f16mf2(const _Float16 *rs1, size_t *new_vl,
                                       size_t vl);
vfloat16m1_t __riscv_vle16ff_v_f16m1(const _Float16 *rs1, size_t *new_vl,
                                     size_t vl);
vfloat16m2_t __riscv_vle16ff_v_f16m2(const _Float16 *rs1, size_t *new_vl,
                                     size_t vl);
vfloat16m4_t __riscv_vle16ff_v_f16m4(const _Float16 *rs1, size_t *new_vl,
                                     size_t vl);
vfloat16m8_t __riscv_vle16ff_v_f16m8(const _Float16 *rs1, size_t *new_vl,
                                     size_t vl);
vfloat32mf2_t __riscv_vle32ff_v_f32mf2(const float *rs1, size_t *new_vl,
                                       size_t vl);
vfloat32m1_t __riscv_vle32ff_v_f32m1(const float *rs1, size_t *new_vl,
                                     size_t vl);
vfloat32m2_t __riscv_vle32ff_v_f32m2(const float *rs1, size_t *new_vl,
                                     size_t vl);
vfloat32m4_t __riscv_vle32ff_v_f32m4(const float *rs1, size_t *new_vl,
                                     size_t vl);
vfloat32m8_t __riscv_vle32ff_v_f32m8(const float *rs1, size_t *new_vl,
                                     size_t vl);
vfloat64m1_t __riscv_vle64ff_v_f64m1(const double *rs1, size_t *new_vl,
                                     size_t vl);
vfloat64m2_t __riscv_vle64ff_v_f64m2(const double *rs1, size_t *new_vl,
                                     size_t vl);
vfloat64m4_t __riscv_vle64ff_v_f64m4(const double *rs1, size_t *new_vl,
                                     size_t vl);
vfloat64m8_t __riscv_vle64ff_v_f64m8(const double *rs1, size_t *new_vl,
                                     size_t vl);
// Unmasked fault-only-first load prototypes for signed integer elements
// (int8_t through int64_t). The `vle<N>ff` width in the name matches the
// element width of the returned vector type.
// Parameters: rs1 = read-only source pointer, new_vl = writable size_t
// output, vl = requested vector length.
// NOTE(review): new_vl presumably receives the element count actually
// loaded when a fault truncates the access — confirm against the RVV
// intrinsics specification.
vint8mf8_t __riscv_vle8ff_v_i8mf8(const int8_t *rs1, size_t *new_vl, size_t vl);
vint8mf4_t __riscv_vle8ff_v_i8mf4(const int8_t *rs1, size_t *new_vl, size_t vl);
vint8mf2_t __riscv_vle8ff_v_i8mf2(const int8_t *rs1, size_t *new_vl, size_t vl);
vint8m1_t __riscv_vle8ff_v_i8m1(const int8_t *rs1, size_t *new_vl, size_t vl);
vint8m2_t __riscv_vle8ff_v_i8m2(const int8_t *rs1, size_t *new_vl, size_t vl);
vint8m4_t __riscv_vle8ff_v_i8m4(const int8_t *rs1, size_t *new_vl, size_t vl);
vint8m8_t __riscv_vle8ff_v_i8m8(const int8_t *rs1, size_t *new_vl, size_t vl);
vint16mf4_t __riscv_vle16ff_v_i16mf4(const int16_t *rs1, size_t *new_vl,
                                     size_t vl);
vint16mf2_t __riscv_vle16ff_v_i16mf2(const int16_t *rs1, size_t *new_vl,
                                     size_t vl);
vint16m1_t __riscv_vle16ff_v_i16m1(const int16_t *rs1, size_t *new_vl,
                                   size_t vl);
vint16m2_t __riscv_vle16ff_v_i16m2(const int16_t *rs1, size_t *new_vl,
                                   size_t vl);
vint16m4_t __riscv_vle16ff_v_i16m4(const int16_t *rs1, size_t *new_vl,
                                   size_t vl);
vint16m8_t __riscv_vle16ff_v_i16m8(const int16_t *rs1, size_t *new_vl,
                                   size_t vl);
vint32mf2_t __riscv_vle32ff_v_i32mf2(const int32_t *rs1, size_t *new_vl,
                                     size_t vl);
vint32m1_t __riscv_vle32ff_v_i32m1(const int32_t *rs1, size_t *new_vl,
                                   size_t vl);
vint32m2_t __riscv_vle32ff_v_i32m2(const int32_t *rs1, size_t *new_vl,
                                   size_t vl);
vint32m4_t __riscv_vle32ff_v_i32m4(const int32_t *rs1, size_t *new_vl,
                                   size_t vl);
vint32m8_t __riscv_vle32ff_v_i32m8(const int32_t *rs1, size_t *new_vl,
                                   size_t vl);
vint64m1_t __riscv_vle64ff_v_i64m1(const int64_t *rs1, size_t *new_vl,
                                   size_t vl);
vint64m2_t __riscv_vle64ff_v_i64m2(const int64_t *rs1, size_t *new_vl,
                                   size_t vl);
vint64m4_t __riscv_vle64ff_v_i64m4(const int64_t *rs1, size_t *new_vl,
                                   size_t vl);
vint64m8_t __riscv_vle64ff_v_i64m8(const int64_t *rs1, size_t *new_vl,
                                   size_t vl);
// Unmasked fault-only-first load prototypes for unsigned integer elements
// (uint8_t through uint64_t). The `vle<N>ff` width in the name matches the
// element width of the returned vector type.
// Parameters: rs1 = read-only source pointer, new_vl = writable size_t
// output, vl = requested vector length.
// NOTE(review): new_vl presumably receives the element count actually
// loaded when a fault truncates the access — confirm against the RVV
// intrinsics specification.
vuint8mf8_t __riscv_vle8ff_v_u8mf8(const uint8_t *rs1, size_t *new_vl,
                                   size_t vl);
vuint8mf4_t __riscv_vle8ff_v_u8mf4(const uint8_t *rs1, size_t *new_vl,
                                   size_t vl);
vuint8mf2_t __riscv_vle8ff_v_u8mf2(const uint8_t *rs1, size_t *new_vl,
                                   size_t vl);
vuint8m1_t __riscv_vle8ff_v_u8m1(const uint8_t *rs1, size_t *new_vl, size_t vl);
vuint8m2_t __riscv_vle8ff_v_u8m2(const uint8_t *rs1, size_t *new_vl, size_t vl);
vuint8m4_t __riscv_vle8ff_v_u8m4(const uint8_t *rs1, size_t *new_vl, size_t vl);
vuint8m8_t __riscv_vle8ff_v_u8m8(const uint8_t *rs1, size_t *new_vl, size_t vl);
vuint16mf4_t __riscv_vle16ff_v_u16mf4(const uint16_t *rs1, size_t *new_vl,
                                      size_t vl);
vuint16mf2_t __riscv_vle16ff_v_u16mf2(const uint16_t *rs1, size_t *new_vl,
                                      size_t vl);
vuint16m1_t __riscv_vle16ff_v_u16m1(const uint16_t *rs1, size_t *new_vl,
                                    size_t vl);
vuint16m2_t __riscv_vle16ff_v_u16m2(const uint16_t *rs1, size_t *new_vl,
                                    size_t vl);
vuint16m4_t __riscv_vle16ff_v_u16m4(const uint16_t *rs1, size_t *new_vl,
                                    size_t vl);
vuint16m8_t __riscv_vle16ff_v_u16m8(const uint16_t *rs1, size_t *new_vl,
                                    size_t vl);
vuint32mf2_t __riscv_vle32ff_v_u32mf2(const uint32_t *rs1, size_t *new_vl,
                                      size_t vl);
vuint32m1_t __riscv_vle32ff_v_u32m1(const uint32_t *rs1, size_t *new_vl,
                                    size_t vl);
vuint32m2_t __riscv_vle32ff_v_u32m2(const uint32_t *rs1, size_t *new_vl,
                                    size_t vl);
vuint32m4_t __riscv_vle32ff_v_u32m4(const uint32_t *rs1, size_t *new_vl,
                                    size_t vl);
vuint32m8_t __riscv_vle32ff_v_u32m8(const uint32_t *rs1, size_t *new_vl,
                                    size_t vl);
vuint64m1_t __riscv_vle64ff_v_u64m1(const uint64_t *rs1, size_t *new_vl,
                                    size_t vl);
vuint64m2_t __riscv_vle64ff_v_u64m2(const uint64_t *rs1, size_t *new_vl,
                                    size_t vl);
vuint64m4_t __riscv_vle64ff_v_u64m4(const uint64_t *rs1, size_t *new_vl,
                                    size_t vl);
vuint64m8_t __riscv_vle64ff_v_u64m8(const uint64_t *rs1, size_t *new_vl,
                                    size_t vl);
// masked functions
// Each `_m` variant mirrors the unmasked prototype of the same name and adds
// a leading mask parameter `vm`; the remaining parameters (rs1, new_vl, vl)
// keep their order and types.
// Floating-point element types follow. The mask type is vbool<N>_t with
// N = element bits / LMUL (e.g. f16mf4 -> vbool64_t, f32m8 -> vbool4_t).
// NOTE(review): what inactive (masked-off) result elements contain is not
// expressed by these signatures — confirm against the RVV intrinsics
// specification.
vfloat16mf4_t __riscv_vle16ff_v_f16mf4_m(vbool64_t vm, const _Float16 *rs1,
                                         size_t *new_vl, size_t vl);
vfloat16mf2_t __riscv_vle16ff_v_f16mf2_m(vbool32_t vm, const _Float16 *rs1,
                                         size_t *new_vl, size_t vl);
vfloat16m1_t __riscv_vle16ff_v_f16m1_m(vbool16_t vm, const _Float16 *rs1,
                                       size_t *new_vl, size_t vl);
vfloat16m2_t __riscv_vle16ff_v_f16m2_m(vbool8_t vm, const _Float16 *rs1,
                                       size_t *new_vl, size_t vl);
vfloat16m4_t __riscv_vle16ff_v_f16m4_m(vbool4_t vm, const _Float16 *rs1,
                                       size_t *new_vl, size_t vl);
vfloat16m8_t __riscv_vle16ff_v_f16m8_m(vbool2_t vm, const _Float16 *rs1,
                                       size_t *new_vl, size_t vl);
vfloat32mf2_t __riscv_vle32ff_v_f32mf2_m(vbool64_t vm, const float *rs1,
                                         size_t *new_vl, size_t vl);
vfloat32m1_t __riscv_vle32ff_v_f32m1_m(vbool32_t vm, const float *rs1,
                                       size_t *new_vl, size_t vl);
vfloat32m2_t __riscv_vle32ff_v_f32m2_m(vbool16_t vm, const float *rs1,
                                       size_t *new_vl, size_t vl);
vfloat32m4_t __riscv_vle32ff_v_f32m4_m(vbool8_t vm, const float *rs1,
                                       size_t *new_vl, size_t vl);
vfloat32m8_t __riscv_vle32ff_v_f32m8_m(vbool4_t vm, const float *rs1,
                                       size_t *new_vl, size_t vl);
vfloat64m1_t __riscv_vle64ff_v_f64m1_m(vbool64_t vm, const double *rs1,
                                       size_t *new_vl, size_t vl);
vfloat64m2_t __riscv_vle64ff_v_f64m2_m(vbool32_t vm, const double *rs1,
                                       size_t *new_vl, size_t vl);
vfloat64m4_t __riscv_vle64ff_v_f64m4_m(vbool16_t vm, const double *rs1,
                                       size_t *new_vl, size_t vl);
vfloat64m8_t __riscv_vle64ff_v_f64m8_m(vbool8_t vm, const double *rs1,
                                       size_t *new_vl, size_t vl);
// Masked (`_m`) fault-only-first load prototypes for signed integer
// elements (int8_t through int64_t).
// Parameters: vm = mask, rs1 = read-only source pointer, new_vl = writable
// size_t output, vl = requested vector length.
// Mask type: vbool<N>_t with N = element bits / LMUL, so i8mf8, i16mf4,
// i32mf2 and i64m1 all use vbool64_t, while i8m8 uses vbool1_t.
vint8mf8_t __riscv_vle8ff_v_i8mf8_m(vbool64_t vm, const int8_t *rs1,
                                    size_t *new_vl, size_t vl);
vint8mf4_t __riscv_vle8ff_v_i8mf4_m(vbool32_t vm, const int8_t *rs1,
                                    size_t *new_vl, size_t vl);
vint8mf2_t __riscv_vle8ff_v_i8mf2_m(vbool16_t vm, const int8_t *rs1,
                                    size_t *new_vl, size_t vl);
vint8m1_t __riscv_vle8ff_v_i8m1_m(vbool8_t vm, const int8_t *rs1,
                                  size_t *new_vl, size_t vl);
vint8m2_t __riscv_vle8ff_v_i8m2_m(vbool4_t vm, const int8_t *rs1,
                                  size_t *new_vl, size_t vl);
vint8m4_t __riscv_vle8ff_v_i8m4_m(vbool2_t vm, const int8_t *rs1,
                                  size_t *new_vl, size_t vl);
vint8m8_t __riscv_vle8ff_v_i8m8_m(vbool1_t vm, const int8_t *rs1,
                                  size_t *new_vl, size_t vl);
vint16mf4_t __riscv_vle16ff_v_i16mf4_m(vbool64_t vm, const int16_t *rs1,
                                       size_t *new_vl, size_t vl);
vint16mf2_t __riscv_vle16ff_v_i16mf2_m(vbool32_t vm, const int16_t *rs1,
                                       size_t *new_vl, size_t vl);
vint16m1_t __riscv_vle16ff_v_i16m1_m(vbool16_t vm, const int16_t *rs1,
                                     size_t *new_vl, size_t vl);
vint16m2_t __riscv_vle16ff_v_i16m2_m(vbool8_t vm, const int16_t *rs1,
                                     size_t *new_vl, size_t vl);
vint16m4_t __riscv_vle16ff_v_i16m4_m(vbool4_t vm, const int16_t *rs1,
                                     size_t *new_vl, size_t vl);
vint16m8_t __riscv_vle16ff_v_i16m8_m(vbool2_t vm, const int16_t *rs1,
                                     size_t *new_vl, size_t vl);
vint32mf2_t __riscv_vle32ff_v_i32mf2_m(vbool64_t vm, const int32_t *rs1,
                                       size_t *new_vl, size_t vl);
vint32m1_t __riscv_vle32ff_v_i32m1_m(vbool32_t vm, const int32_t *rs1,
                                     size_t *new_vl, size_t vl);
vint32m2_t __riscv_vle32ff_v_i32m2_m(vbool16_t vm, const int32_t *rs1,
                                     size_t *new_vl, size_t vl);
vint32m4_t __riscv_vle32ff_v_i32m4_m(vbool8_t vm, const int32_t *rs1,
                                     size_t *new_vl, size_t vl);
vint32m8_t __riscv_vle32ff_v_i32m8_m(vbool4_t vm, const int32_t *rs1,
                                     size_t *new_vl, size_t vl);
vint64m1_t __riscv_vle64ff_v_i64m1_m(vbool64_t vm, const int64_t *rs1,
                                     size_t *new_vl, size_t vl);
vint64m2_t __riscv_vle64ff_v_i64m2_m(vbool32_t vm, const int64_t *rs1,
                                     size_t *new_vl, size_t vl);
vint64m4_t __riscv_vle64ff_v_i64m4_m(vbool16_t vm, const int64_t *rs1,
                                     size_t *new_vl, size_t vl);
vint64m8_t __riscv_vle64ff_v_i64m8_m(vbool8_t vm, const int64_t *rs1,
                                     size_t *new_vl, size_t vl);
// Masked (`_m`) fault-only-first load prototypes for unsigned integer
// elements (uint8_t through uint64_t).
// Parameters: vm = mask, rs1 = read-only source pointer, new_vl = writable
// size_t output, vl = requested vector length.
// Mask type: vbool<N>_t with N = element bits / LMUL, so u8mf8, u16mf4,
// u32mf2 and u64m1 all use vbool64_t, while u8m8 uses vbool1_t.
vuint8mf8_t __riscv_vle8ff_v_u8mf8_m(vbool64_t vm, const uint8_t *rs1,
                                     size_t *new_vl, size_t vl);
vuint8mf4_t __riscv_vle8ff_v_u8mf4_m(vbool32_t vm, const uint8_t *rs1,
                                     size_t *new_vl, size_t vl);
vuint8mf2_t __riscv_vle8ff_v_u8mf2_m(vbool16_t vm, const uint8_t *rs1,
                                     size_t *new_vl, size_t vl);
vuint8m1_t __riscv_vle8ff_v_u8m1_m(vbool8_t vm, const uint8_t *rs1,
                                   size_t *new_vl, size_t vl);
vuint8m2_t __riscv_vle8ff_v_u8m2_m(vbool4_t vm, const uint8_t *rs1,
                                   size_t *new_vl, size_t vl);
vuint8m4_t __riscv_vle8ff_v_u8m4_m(vbool2_t vm, const uint8_t *rs1,
                                   size_t *new_vl, size_t vl);
vuint8m8_t __riscv_vle8ff_v_u8m8_m(vbool1_t vm, const uint8_t *rs1,
                                   size_t *new_vl, size_t vl);
vuint16mf4_t __riscv_vle16ff_v_u16mf4_m(vbool64_t vm, const uint16_t *rs1,
                                        size_t *new_vl, size_t vl);
vuint16mf2_t __riscv_vle16ff_v_u16mf2_m(vbool32_t vm, const uint16_t *rs1,
                                        size_t *new_vl, size_t vl);
vuint16m1_t __riscv_vle16ff_v_u16m1_m(vbool16_t vm, const uint16_t *rs1,
                                      size_t *new_vl, size_t vl);
vuint16m2_t __riscv_vle16ff_v_u16m2_m(vbool8_t vm, const uint16_t *rs1,
                                      size_t *new_vl, size_t vl);
vuint16m4_t __riscv_vle16ff_v_u16m4_m(vbool4_t vm, const uint16_t *rs1,
                                      size_t *new_vl, size_t vl);
vuint16m8_t __riscv_vle16ff_v_u16m8_m(vbool2_t vm, const uint16_t *rs1,
                                      size_t *new_vl, size_t vl);
vuint32mf2_t __riscv_vle32ff_v_u32mf2_m(vbool64_t vm, const uint32_t *rs1,
                                        size_t *new_vl, size_t vl);
vuint32m1_t __riscv_vle32ff_v_u32m1_m(vbool32_t vm, const uint32_t *rs1,
                                      size_t *new_vl, size_t vl);
vuint32m2_t __riscv_vle32ff_v_u32m2_m(vbool16_t vm, const uint32_t *rs1,
                                      size_t *new_vl, size_t vl);
vuint32m4_t __riscv_vle32ff_v_u32m4_m(vbool8_t vm, const uint32_t *rs1,
                                      size_t *new_vl, size_t vl);
vuint32m8_t __riscv_vle32ff_v_u32m8_m(vbool4_t vm, const uint32_t *rs1,
                                      size_t *new_vl, size_t vl);
vuint64m1_t __riscv_vle64ff_v_u64m1_m(vbool64_t vm, const uint64_t *rs1,
                                      size_t *new_vl, size_t vl);
vuint64m2_t __riscv_vle64ff_v_u64m2_m(vbool32_t vm, const uint64_t *rs1,
                                      size_t *new_vl, size_t vl);
vuint64m4_t __riscv_vle64ff_v_u64m4_m(vbool16_t vm, const uint64_t *rs1,
                                      size_t *new_vl, size_t vl);
vuint64m8_t __riscv_vle64ff_v_u64m8_m(vbool8_t vm, const uint64_t *rs1,
                                      size_t *new_vl, size_t vl);