
Vector Reduction Operations

Vector Single-Width Integer Reduction Intrinsics
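
Each of these intrinsics follows the same pattern: vs2 supplies the vl source elements being reduced, element 0 of vs1 supplies the initial (accumulator) value, and element 0 of the returned LMUL=1 vector holds the reduction result. As a minimal usage sketch (the helper name sum_i32 and its loop structure are illustrative assumptions, not part of this listing), a strip-mined array sum built on __riscv_vredsum_vs_i32m1_i32m1 could look like:

#include <riscv_vector.h>
#include <stddef.h>
#include <stdint.h>

// Illustrative helper: sum an int32_t array with the unmasked vredsum
// intrinsic at LMUL=1, strip-mining over the array with vsetvl.
static inline int32_t sum_i32(const int32_t *a, size_t n) {
  vint32m1_t acc = __riscv_vmv_s_x_i32m1(0, 1);        // acc[0] = 0, the initial value
  for (size_t vl; n > 0; n -= vl, a += vl) {
    vl = __riscv_vsetvl_e32m1(n);                      // elements processed this pass
    vint32m1_t v = __riscv_vle32_v_i32m1(a, vl);       // load vl elements
    acc = __riscv_vredsum_vs_i32m1_i32m1(v, acc, vl);  // acc[0] += v[0] + ... + v[vl-1]
  }
  return __riscv_vmv_x_s_i32m1_i32(acc);               // extract element 0 as a scalar
}

The same shape applies to the vredmax, vredmin, vredand, vredor, and vredxor prototypes below; only the combining operation differs.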

vint8m1_t __riscv_vredsum_vs_i8mf8_i8m1(vint8mf8_t vs2, vint8m1_t vs1,
                                        size_t vl);
vint8m1_t __riscv_vredsum_vs_i8mf4_i8m1(vint8mf4_t vs2, vint8m1_t vs1,
                                        size_t vl);
vint8m1_t __riscv_vredsum_vs_i8mf2_i8m1(vint8mf2_t vs2, vint8m1_t vs1,
                                        size_t vl);
vint8m1_t __riscv_vredsum_vs_i8m1_i8m1(vint8m1_t vs2, vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredsum_vs_i8m2_i8m1(vint8m2_t vs2, vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredsum_vs_i8m4_i8m1(vint8m4_t vs2, vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredsum_vs_i8m8_i8m1(vint8m8_t vs2, vint8m1_t vs1, size_t vl);
vint16m1_t __riscv_vredsum_vs_i16mf4_i16m1(vint16mf4_t vs2, vint16m1_t vs1,
                                           size_t vl);
vint16m1_t __riscv_vredsum_vs_i16mf2_i16m1(vint16mf2_t vs2, vint16m1_t vs1,
                                           size_t vl);
vint16m1_t __riscv_vredsum_vs_i16m1_i16m1(vint16m1_t vs2, vint16m1_t vs1,
                                          size_t vl);
vint16m1_t __riscv_vredsum_vs_i16m2_i16m1(vint16m2_t vs2, vint16m1_t vs1,
                                          size_t vl);
vint16m1_t __riscv_vredsum_vs_i16m4_i16m1(vint16m4_t vs2, vint16m1_t vs1,
                                          size_t vl);
vint16m1_t __riscv_vredsum_vs_i16m8_i16m1(vint16m8_t vs2, vint16m1_t vs1,
                                          size_t vl);
vint32m1_t __riscv_vredsum_vs_i32mf2_i32m1(vint32mf2_t vs2, vint32m1_t vs1,
                                           size_t vl);
vint32m1_t __riscv_vredsum_vs_i32m1_i32m1(vint32m1_t vs2, vint32m1_t vs1,
                                          size_t vl);
vint32m1_t __riscv_vredsum_vs_i32m2_i32m1(vint32m2_t vs2, vint32m1_t vs1,
                                          size_t vl);
vint32m1_t __riscv_vredsum_vs_i32m4_i32m1(vint32m4_t vs2, vint32m1_t vs1,
                                          size_t vl);
vint32m1_t __riscv_vredsum_vs_i32m8_i32m1(vint32m8_t vs2, vint32m1_t vs1,
                                          size_t vl);
vint64m1_t __riscv_vredsum_vs_i64m1_i64m1(vint64m1_t vs2, vint64m1_t vs1,
                                          size_t vl);
vint64m1_t __riscv_vredsum_vs_i64m2_i64m1(vint64m2_t vs2, vint64m1_t vs1,
                                          size_t vl);
vint64m1_t __riscv_vredsum_vs_i64m4_i64m1(vint64m4_t vs2, vint64m1_t vs1,
                                          size_t vl);
vint64m1_t __riscv_vredsum_vs_i64m8_i64m1(vint64m8_t vs2, vint64m1_t vs1,
                                          size_t vl);
vint8m1_t __riscv_vredmax_vs_i8mf8_i8m1(vint8mf8_t vs2, vint8m1_t vs1,
                                        size_t vl);
vint8m1_t __riscv_vredmax_vs_i8mf4_i8m1(vint8mf4_t vs2, vint8m1_t vs1,
                                        size_t vl);
vint8m1_t __riscv_vredmax_vs_i8mf2_i8m1(vint8mf2_t vs2, vint8m1_t vs1,
                                        size_t vl);
vint8m1_t __riscv_vredmax_vs_i8m1_i8m1(vint8m1_t vs2, vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredmax_vs_i8m2_i8m1(vint8m2_t vs2, vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredmax_vs_i8m4_i8m1(vint8m4_t vs2, vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredmax_vs_i8m8_i8m1(vint8m8_t vs2, vint8m1_t vs1, size_t vl);
vint16m1_t __riscv_vredmax_vs_i16mf4_i16m1(vint16mf4_t vs2, vint16m1_t vs1,
                                           size_t vl);
vint16m1_t __riscv_vredmax_vs_i16mf2_i16m1(vint16mf2_t vs2, vint16m1_t vs1,
                                           size_t vl);
vint16m1_t __riscv_vredmax_vs_i16m1_i16m1(vint16m1_t vs2, vint16m1_t vs1,
                                          size_t vl);
vint16m1_t __riscv_vredmax_vs_i16m2_i16m1(vint16m2_t vs2, vint16m1_t vs1,
                                          size_t vl);
vint16m1_t __riscv_vredmax_vs_i16m4_i16m1(vint16m4_t vs2, vint16m1_t vs1,
                                          size_t vl);
vint16m1_t __riscv_vredmax_vs_i16m8_i16m1(vint16m8_t vs2, vint16m1_t vs1,
                                          size_t vl);
vint32m1_t __riscv_vredmax_vs_i32mf2_i32m1(vint32mf2_t vs2, vint32m1_t vs1,
                                           size_t vl);
vint32m1_t __riscv_vredmax_vs_i32m1_i32m1(vint32m1_t vs2, vint32m1_t vs1,
                                          size_t vl);
vint32m1_t __riscv_vredmax_vs_i32m2_i32m1(vint32m2_t vs2, vint32m1_t vs1,
                                          size_t vl);
vint32m1_t __riscv_vredmax_vs_i32m4_i32m1(vint32m4_t vs2, vint32m1_t vs1,
                                          size_t vl);
vint32m1_t __riscv_vredmax_vs_i32m8_i32m1(vint32m8_t vs2, vint32m1_t vs1,
                                          size_t vl);
vint64m1_t __riscv_vredmax_vs_i64m1_i64m1(vint64m1_t vs2, vint64m1_t vs1,
                                          size_t vl);
vint64m1_t __riscv_vredmax_vs_i64m2_i64m1(vint64m2_t vs2, vint64m1_t vs1,
                                          size_t vl);
vint64m1_t __riscv_vredmax_vs_i64m4_i64m1(vint64m4_t vs2, vint64m1_t vs1,
                                          size_t vl);
vint64m1_t __riscv_vredmax_vs_i64m8_i64m1(vint64m8_t vs2, vint64m1_t vs1,
                                          size_t vl);
vint8m1_t __riscv_vredmin_vs_i8mf8_i8m1(vint8mf8_t vs2, vint8m1_t vs1,
                                        size_t vl);
vint8m1_t __riscv_vredmin_vs_i8mf4_i8m1(vint8mf4_t vs2, vint8m1_t vs1,
                                        size_t vl);
vint8m1_t __riscv_vredmin_vs_i8mf2_i8m1(vint8mf2_t vs2, vint8m1_t vs1,
                                        size_t vl);
vint8m1_t __riscv_vredmin_vs_i8m1_i8m1(vint8m1_t vs2, vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredmin_vs_i8m2_i8m1(vint8m2_t vs2, vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredmin_vs_i8m4_i8m1(vint8m4_t vs2, vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredmin_vs_i8m8_i8m1(vint8m8_t vs2, vint8m1_t vs1, size_t vl);
vint16m1_t __riscv_vredmin_vs_i16mf4_i16m1(vint16mf4_t vs2, vint16m1_t vs1,
                                           size_t vl);
vint16m1_t __riscv_vredmin_vs_i16mf2_i16m1(vint16mf2_t vs2, vint16m1_t vs1,
                                           size_t vl);
vint16m1_t __riscv_vredmin_vs_i16m1_i16m1(vint16m1_t vs2, vint16m1_t vs1,
                                          size_t vl);
vint16m1_t __riscv_vredmin_vs_i16m2_i16m1(vint16m2_t vs2, vint16m1_t vs1,
                                          size_t vl);
vint16m1_t __riscv_vredmin_vs_i16m4_i16m1(vint16m4_t vs2, vint16m1_t vs1,
                                          size_t vl);
vint16m1_t __riscv_vredmin_vs_i16m8_i16m1(vint16m8_t vs2, vint16m1_t vs1,
                                          size_t vl);
vint32m1_t __riscv_vredmin_vs_i32mf2_i32m1(vint32mf2_t vs2, vint32m1_t vs1,
                                           size_t vl);
vint32m1_t __riscv_vredmin_vs_i32m1_i32m1(vint32m1_t vs2, vint32m1_t vs1,
                                          size_t vl);
vint32m1_t __riscv_vredmin_vs_i32m2_i32m1(vint32m2_t vs2, vint32m1_t vs1,
                                          size_t vl);
vint32m1_t __riscv_vredmin_vs_i32m4_i32m1(vint32m4_t vs2, vint32m1_t vs1,
                                          size_t vl);
vint32m1_t __riscv_vredmin_vs_i32m8_i32m1(vint32m8_t vs2, vint32m1_t vs1,
                                          size_t vl);
vint64m1_t __riscv_vredmin_vs_i64m1_i64m1(vint64m1_t vs2, vint64m1_t vs1,
                                          size_t vl);
vint64m1_t __riscv_vredmin_vs_i64m2_i64m1(vint64m2_t vs2, vint64m1_t vs1,
                                          size_t vl);
vint64m1_t __riscv_vredmin_vs_i64m4_i64m1(vint64m4_t vs2, vint64m1_t vs1,
                                          size_t vl);
vint64m1_t __riscv_vredmin_vs_i64m8_i64m1(vint64m8_t vs2, vint64m1_t vs1,
                                          size_t vl);
vint8m1_t __riscv_vredand_vs_i8mf8_i8m1(vint8mf8_t vs2, vint8m1_t vs1,
                                        size_t vl);
vint8m1_t __riscv_vredand_vs_i8mf4_i8m1(vint8mf4_t vs2, vint8m1_t vs1,
                                        size_t vl);
vint8m1_t __riscv_vredand_vs_i8mf2_i8m1(vint8mf2_t vs2, vint8m1_t vs1,
                                        size_t vl);
vint8m1_t __riscv_vredand_vs_i8m1_i8m1(vint8m1_t vs2, vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredand_vs_i8m2_i8m1(vint8m2_t vs2, vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredand_vs_i8m4_i8m1(vint8m4_t vs2, vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredand_vs_i8m8_i8m1(vint8m8_t vs2, vint8m1_t vs1, size_t vl);
vint16m1_t __riscv_vredand_vs_i16mf4_i16m1(vint16mf4_t vs2, vint16m1_t vs1,
                                           size_t vl);
vint16m1_t __riscv_vredand_vs_i16mf2_i16m1(vint16mf2_t vs2, vint16m1_t vs1,
                                           size_t vl);
vint16m1_t __riscv_vredand_vs_i16m1_i16m1(vint16m1_t vs2, vint16m1_t vs1,
                                          size_t vl);
vint16m1_t __riscv_vredand_vs_i16m2_i16m1(vint16m2_t vs2, vint16m1_t vs1,
                                          size_t vl);
vint16m1_t __riscv_vredand_vs_i16m4_i16m1(vint16m4_t vs2, vint16m1_t vs1,
                                          size_t vl);
vint16m1_t __riscv_vredand_vs_i16m8_i16m1(vint16m8_t vs2, vint16m1_t vs1,
                                          size_t vl);
vint32m1_t __riscv_vredand_vs_i32mf2_i32m1(vint32mf2_t vs2, vint32m1_t vs1,
                                           size_t vl);
vint32m1_t __riscv_vredand_vs_i32m1_i32m1(vint32m1_t vs2, vint32m1_t vs1,
                                          size_t vl);
vint32m1_t __riscv_vredand_vs_i32m2_i32m1(vint32m2_t vs2, vint32m1_t vs1,
                                          size_t vl);
vint32m1_t __riscv_vredand_vs_i32m4_i32m1(vint32m4_t vs2, vint32m1_t vs1,
                                          size_t vl);
vint32m1_t __riscv_vredand_vs_i32m8_i32m1(vint32m8_t vs2, vint32m1_t vs1,
                                          size_t vl);
vint64m1_t __riscv_vredand_vs_i64m1_i64m1(vint64m1_t vs2, vint64m1_t vs1,
                                          size_t vl);
vint64m1_t __riscv_vredand_vs_i64m2_i64m1(vint64m2_t vs2, vint64m1_t vs1,
                                          size_t vl);
vint64m1_t __riscv_vredand_vs_i64m4_i64m1(vint64m4_t vs2, vint64m1_t vs1,
                                          size_t vl);
vint64m1_t __riscv_vredand_vs_i64m8_i64m1(vint64m8_t vs2, vint64m1_t vs1,
                                          size_t vl);
vint8m1_t __riscv_vredor_vs_i8mf8_i8m1(vint8mf8_t vs2, vint8m1_t vs1,
                                       size_t vl);
vint8m1_t __riscv_vredor_vs_i8mf4_i8m1(vint8mf4_t vs2, vint8m1_t vs1,
                                       size_t vl);
vint8m1_t __riscv_vredor_vs_i8mf2_i8m1(vint8mf2_t vs2, vint8m1_t vs1,
                                       size_t vl);
vint8m1_t __riscv_vredor_vs_i8m1_i8m1(vint8m1_t vs2, vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredor_vs_i8m2_i8m1(vint8m2_t vs2, vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredor_vs_i8m4_i8m1(vint8m4_t vs2, vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredor_vs_i8m8_i8m1(vint8m8_t vs2, vint8m1_t vs1, size_t vl);
vint16m1_t __riscv_vredor_vs_i16mf4_i16m1(vint16mf4_t vs2, vint16m1_t vs1,
                                          size_t vl);
vint16m1_t __riscv_vredor_vs_i16mf2_i16m1(vint16mf2_t vs2, vint16m1_t vs1,
                                          size_t vl);
vint16m1_t __riscv_vredor_vs_i16m1_i16m1(vint16m1_t vs2, vint16m1_t vs1,
                                         size_t vl);
vint16m1_t __riscv_vredor_vs_i16m2_i16m1(vint16m2_t vs2, vint16m1_t vs1,
                                         size_t vl);
vint16m1_t __riscv_vredor_vs_i16m4_i16m1(vint16m4_t vs2, vint16m1_t vs1,
                                         size_t vl);
vint16m1_t __riscv_vredor_vs_i16m8_i16m1(vint16m8_t vs2, vint16m1_t vs1,
                                         size_t vl);
vint32m1_t __riscv_vredor_vs_i32mf2_i32m1(vint32mf2_t vs2, vint32m1_t vs1,
                                          size_t vl);
vint32m1_t __riscv_vredor_vs_i32m1_i32m1(vint32m1_t vs2, vint32m1_t vs1,
                                         size_t vl);
vint32m1_t __riscv_vredor_vs_i32m2_i32m1(vint32m2_t vs2, vint32m1_t vs1,
                                         size_t vl);
vint32m1_t __riscv_vredor_vs_i32m4_i32m1(vint32m4_t vs2, vint32m1_t vs1,
                                         size_t vl);
vint32m1_t __riscv_vredor_vs_i32m8_i32m1(vint32m8_t vs2, vint32m1_t vs1,
                                         size_t vl);
vint64m1_t __riscv_vredor_vs_i64m1_i64m1(vint64m1_t vs2, vint64m1_t vs1,
                                         size_t vl);
vint64m1_t __riscv_vredor_vs_i64m2_i64m1(vint64m2_t vs2, vint64m1_t vs1,
                                         size_t vl);
vint64m1_t __riscv_vredor_vs_i64m4_i64m1(vint64m4_t vs2, vint64m1_t vs1,
                                         size_t vl);
vint64m1_t __riscv_vredor_vs_i64m8_i64m1(vint64m8_t vs2, vint64m1_t vs1,
                                         size_t vl);
vint8m1_t __riscv_vredxor_vs_i8mf8_i8m1(vint8mf8_t vs2, vint8m1_t vs1,
                                        size_t vl);
vint8m1_t __riscv_vredxor_vs_i8mf4_i8m1(vint8mf4_t vs2, vint8m1_t vs1,
                                        size_t vl);
vint8m1_t __riscv_vredxor_vs_i8mf2_i8m1(vint8mf2_t vs2, vint8m1_t vs1,
                                        size_t vl);
vint8m1_t __riscv_vredxor_vs_i8m1_i8m1(vint8m1_t vs2, vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredxor_vs_i8m2_i8m1(vint8m2_t vs2, vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredxor_vs_i8m4_i8m1(vint8m4_t vs2, vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredxor_vs_i8m8_i8m1(vint8m8_t vs2, vint8m1_t vs1, size_t vl);
vint16m1_t __riscv_vredxor_vs_i16mf4_i16m1(vint16mf4_t vs2, vint16m1_t vs1,
                                           size_t vl);
vint16m1_t __riscv_vredxor_vs_i16mf2_i16m1(vint16mf2_t vs2, vint16m1_t vs1,
                                           size_t vl);
vint16m1_t __riscv_vredxor_vs_i16m1_i16m1(vint16m1_t vs2, vint16m1_t vs1,
                                          size_t vl);
vint16m1_t __riscv_vredxor_vs_i16m2_i16m1(vint16m2_t vs2, vint16m1_t vs1,
                                          size_t vl);
vint16m1_t __riscv_vredxor_vs_i16m4_i16m1(vint16m4_t vs2, vint16m1_t vs1,
                                          size_t vl);
vint16m1_t __riscv_vredxor_vs_i16m8_i16m1(vint16m8_t vs2, vint16m1_t vs1,
                                          size_t vl);
vint32m1_t __riscv_vredxor_vs_i32mf2_i32m1(vint32mf2_t vs2, vint32m1_t vs1,
                                           size_t vl);
vint32m1_t __riscv_vredxor_vs_i32m1_i32m1(vint32m1_t vs2, vint32m1_t vs1,
                                          size_t vl);
vint32m1_t __riscv_vredxor_vs_i32m2_i32m1(vint32m2_t vs2, vint32m1_t vs1,
                                          size_t vl);
vint32m1_t __riscv_vredxor_vs_i32m4_i32m1(vint32m4_t vs2, vint32m1_t vs1,
                                          size_t vl);
vint32m1_t __riscv_vredxor_vs_i32m8_i32m1(vint32m8_t vs2, vint32m1_t vs1,
                                          size_t vl);
vint64m1_t __riscv_vredxor_vs_i64m1_i64m1(vint64m1_t vs2, vint64m1_t vs1,
                                          size_t vl);
vint64m1_t __riscv_vredxor_vs_i64m2_i64m1(vint64m2_t vs2, vint64m1_t vs1,
                                          size_t vl);
vint64m1_t __riscv_vredxor_vs_i64m4_i64m1(vint64m4_t vs2, vint64m1_t vs1,
                                          size_t vl);
vint64m1_t __riscv_vredxor_vs_i64m8_i64m1(vint64m8_t vs2, vint64m1_t vs1,
                                          size_t vl);
vuint8m1_t __riscv_vredsum_vs_u8mf8_u8m1(vuint8mf8_t vs2, vuint8m1_t vs1,
                                         size_t vl);
vuint8m1_t __riscv_vredsum_vs_u8mf4_u8m1(vuint8mf4_t vs2, vuint8m1_t vs1,
                                         size_t vl);
vuint8m1_t __riscv_vredsum_vs_u8mf2_u8m1(vuint8mf2_t vs2, vuint8m1_t vs1,
                                         size_t vl);
vuint8m1_t __riscv_vredsum_vs_u8m1_u8m1(vuint8m1_t vs2, vuint8m1_t vs1,
                                        size_t vl);
vuint8m1_t __riscv_vredsum_vs_u8m2_u8m1(vuint8m2_t vs2, vuint8m1_t vs1,
                                        size_t vl);
vuint8m1_t __riscv_vredsum_vs_u8m4_u8m1(vuint8m4_t vs2, vuint8m1_t vs1,
                                        size_t vl);
vuint8m1_t __riscv_vredsum_vs_u8m8_u8m1(vuint8m8_t vs2, vuint8m1_t vs1,
                                        size_t vl);
vuint16m1_t __riscv_vredsum_vs_u16mf4_u16m1(vuint16mf4_t vs2, vuint16m1_t vs1,
                                            size_t vl);
vuint16m1_t __riscv_vredsum_vs_u16mf2_u16m1(vuint16mf2_t vs2, vuint16m1_t vs1,
                                            size_t vl);
vuint16m1_t __riscv_vredsum_vs_u16m1_u16m1(vuint16m1_t vs2, vuint16m1_t vs1,
                                           size_t vl);
vuint16m1_t __riscv_vredsum_vs_u16m2_u16m1(vuint16m2_t vs2, vuint16m1_t vs1,
                                           size_t vl);
vuint16m1_t __riscv_vredsum_vs_u16m4_u16m1(vuint16m4_t vs2, vuint16m1_t vs1,
                                           size_t vl);
vuint16m1_t __riscv_vredsum_vs_u16m8_u16m1(vuint16m8_t vs2, vuint16m1_t vs1,
                                           size_t vl);
vuint32m1_t __riscv_vredsum_vs_u32mf2_u32m1(vuint32mf2_t vs2, vuint32m1_t vs1,
                                            size_t vl);
vuint32m1_t __riscv_vredsum_vs_u32m1_u32m1(vuint32m1_t vs2, vuint32m1_t vs1,
                                           size_t vl);
vuint32m1_t __riscv_vredsum_vs_u32m2_u32m1(vuint32m2_t vs2, vuint32m1_t vs1,
                                           size_t vl);
vuint32m1_t __riscv_vredsum_vs_u32m4_u32m1(vuint32m4_t vs2, vuint32m1_t vs1,
                                           size_t vl);
vuint32m1_t __riscv_vredsum_vs_u32m8_u32m1(vuint32m8_t vs2, vuint32m1_t vs1,
                                           size_t vl);
vuint64m1_t __riscv_vredsum_vs_u64m1_u64m1(vuint64m1_t vs2, vuint64m1_t vs1,
                                           size_t vl);
vuint64m1_t __riscv_vredsum_vs_u64m2_u64m1(vuint64m2_t vs2, vuint64m1_t vs1,
                                           size_t vl);
vuint64m1_t __riscv_vredsum_vs_u64m4_u64m1(vuint64m4_t vs2, vuint64m1_t vs1,
                                           size_t vl);
vuint64m1_t __riscv_vredsum_vs_u64m8_u64m1(vuint64m8_t vs2, vuint64m1_t vs1,
                                           size_t vl);
vuint8m1_t __riscv_vredmaxu_vs_u8mf8_u8m1(vuint8mf8_t vs2, vuint8m1_t vs1,
                                          size_t vl);
vuint8m1_t __riscv_vredmaxu_vs_u8mf4_u8m1(vuint8mf4_t vs2, vuint8m1_t vs1,
                                          size_t vl);
vuint8m1_t __riscv_vredmaxu_vs_u8mf2_u8m1(vuint8mf2_t vs2, vuint8m1_t vs1,
                                          size_t vl);
vuint8m1_t __riscv_vredmaxu_vs_u8m1_u8m1(vuint8m1_t vs2, vuint8m1_t vs1,
                                         size_t vl);
vuint8m1_t __riscv_vredmaxu_vs_u8m2_u8m1(vuint8m2_t vs2, vuint8m1_t vs1,
                                         size_t vl);
vuint8m1_t __riscv_vredmaxu_vs_u8m4_u8m1(vuint8m4_t vs2, vuint8m1_t vs1,
                                         size_t vl);
vuint8m1_t __riscv_vredmaxu_vs_u8m8_u8m1(vuint8m8_t vs2, vuint8m1_t vs1,
                                         size_t vl);
vuint16m1_t __riscv_vredmaxu_vs_u16mf4_u16m1(vuint16mf4_t vs2, vuint16m1_t vs1,
                                             size_t vl);
vuint16m1_t __riscv_vredmaxu_vs_u16mf2_u16m1(vuint16mf2_t vs2, vuint16m1_t vs1,
                                             size_t vl);
vuint16m1_t __riscv_vredmaxu_vs_u16m1_u16m1(vuint16m1_t vs2, vuint16m1_t vs1,
                                            size_t vl);
vuint16m1_t __riscv_vredmaxu_vs_u16m2_u16m1(vuint16m2_t vs2, vuint16m1_t vs1,
                                            size_t vl);
vuint16m1_t __riscv_vredmaxu_vs_u16m4_u16m1(vuint16m4_t vs2, vuint16m1_t vs1,
                                            size_t vl);
vuint16m1_t __riscv_vredmaxu_vs_u16m8_u16m1(vuint16m8_t vs2, vuint16m1_t vs1,
                                            size_t vl);
vuint32m1_t __riscv_vredmaxu_vs_u32mf2_u32m1(vuint32mf2_t vs2, vuint32m1_t vs1,
                                             size_t vl);
vuint32m1_t __riscv_vredmaxu_vs_u32m1_u32m1(vuint32m1_t vs2, vuint32m1_t vs1,
                                            size_t vl);
vuint32m1_t __riscv_vredmaxu_vs_u32m2_u32m1(vuint32m2_t vs2, vuint32m1_t vs1,
                                            size_t vl);
vuint32m1_t __riscv_vredmaxu_vs_u32m4_u32m1(vuint32m4_t vs2, vuint32m1_t vs1,
                                            size_t vl);
vuint32m1_t __riscv_vredmaxu_vs_u32m8_u32m1(vuint32m8_t vs2, vuint32m1_t vs1,
                                            size_t vl);
vuint64m1_t __riscv_vredmaxu_vs_u64m1_u64m1(vuint64m1_t vs2, vuint64m1_t vs1,
                                            size_t vl);
vuint64m1_t __riscv_vredmaxu_vs_u64m2_u64m1(vuint64m2_t vs2, vuint64m1_t vs1,
                                            size_t vl);
vuint64m1_t __riscv_vredmaxu_vs_u64m4_u64m1(vuint64m4_t vs2, vuint64m1_t vs1,
                                            size_t vl);
vuint64m1_t __riscv_vredmaxu_vs_u64m8_u64m1(vuint64m8_t vs2, vuint64m1_t vs1,
                                            size_t vl);
vuint8m1_t __riscv_vredminu_vs_u8mf8_u8m1(vuint8mf8_t vs2, vuint8m1_t vs1,
                                          size_t vl);
vuint8m1_t __riscv_vredminu_vs_u8mf4_u8m1(vuint8mf4_t vs2, vuint8m1_t vs1,
                                          size_t vl);
vuint8m1_t __riscv_vredminu_vs_u8mf2_u8m1(vuint8mf2_t vs2, vuint8m1_t vs1,
                                          size_t vl);
vuint8m1_t __riscv_vredminu_vs_u8m1_u8m1(vuint8m1_t vs2, vuint8m1_t vs1,
                                         size_t vl);
vuint8m1_t __riscv_vredminu_vs_u8m2_u8m1(vuint8m2_t vs2, vuint8m1_t vs1,
                                         size_t vl);
vuint8m1_t __riscv_vredminu_vs_u8m4_u8m1(vuint8m4_t vs2, vuint8m1_t vs1,
                                         size_t vl);
vuint8m1_t __riscv_vredminu_vs_u8m8_u8m1(vuint8m8_t vs2, vuint8m1_t vs1,
                                         size_t vl);
vuint16m1_t __riscv_vredminu_vs_u16mf4_u16m1(vuint16mf4_t vs2, vuint16m1_t vs1,
                                             size_t vl);
vuint16m1_t __riscv_vredminu_vs_u16mf2_u16m1(vuint16mf2_t vs2, vuint16m1_t vs1,
                                             size_t vl);
vuint16m1_t __riscv_vredminu_vs_u16m1_u16m1(vuint16m1_t vs2, vuint16m1_t vs1,
                                            size_t vl);
vuint16m1_t __riscv_vredminu_vs_u16m2_u16m1(vuint16m2_t vs2, vuint16m1_t vs1,
                                            size_t vl);
vuint16m1_t __riscv_vredminu_vs_u16m4_u16m1(vuint16m4_t vs2, vuint16m1_t vs1,
                                            size_t vl);
vuint16m1_t __riscv_vredminu_vs_u16m8_u16m1(vuint16m8_t vs2, vuint16m1_t vs1,
                                            size_t vl);
vuint32m1_t __riscv_vredminu_vs_u32mf2_u32m1(vuint32mf2_t vs2, vuint32m1_t vs1,
                                             size_t vl);
vuint32m1_t __riscv_vredminu_vs_u32m1_u32m1(vuint32m1_t vs2, vuint32m1_t vs1,
                                            size_t vl);
vuint32m1_t __riscv_vredminu_vs_u32m2_u32m1(vuint32m2_t vs2, vuint32m1_t vs1,
                                            size_t vl);
vuint32m1_t __riscv_vredminu_vs_u32m4_u32m1(vuint32m4_t vs2, vuint32m1_t vs1,
                                            size_t vl);
vuint32m1_t __riscv_vredminu_vs_u32m8_u32m1(vuint32m8_t vs2, vuint32m1_t vs1,
                                            size_t vl);
vuint64m1_t __riscv_vredminu_vs_u64m1_u64m1(vuint64m1_t vs2, vuint64m1_t vs1,
                                            size_t vl);
vuint64m1_t __riscv_vredminu_vs_u64m2_u64m1(vuint64m2_t vs2, vuint64m1_t vs1,
                                            size_t vl);
vuint64m1_t __riscv_vredminu_vs_u64m4_u64m1(vuint64m4_t vs2, vuint64m1_t vs1,
                                            size_t vl);
vuint64m1_t __riscv_vredminu_vs_u64m8_u64m1(vuint64m8_t vs2, vuint64m1_t vs1,
                                            size_t vl);
vuint8m1_t __riscv_vredand_vs_u8mf8_u8m1(vuint8mf8_t vs2, vuint8m1_t vs1,
                                         size_t vl);
vuint8m1_t __riscv_vredand_vs_u8mf4_u8m1(vuint8mf4_t vs2, vuint8m1_t vs1,
                                         size_t vl);
vuint8m1_t __riscv_vredand_vs_u8mf2_u8m1(vuint8mf2_t vs2, vuint8m1_t vs1,
                                         size_t vl);
vuint8m1_t __riscv_vredand_vs_u8m1_u8m1(vuint8m1_t vs2, vuint8m1_t vs1,
                                        size_t vl);
vuint8m1_t __riscv_vredand_vs_u8m2_u8m1(vuint8m2_t vs2, vuint8m1_t vs1,
                                        size_t vl);
vuint8m1_t __riscv_vredand_vs_u8m4_u8m1(vuint8m4_t vs2, vuint8m1_t vs1,
                                        size_t vl);
vuint8m1_t __riscv_vredand_vs_u8m8_u8m1(vuint8m8_t vs2, vuint8m1_t vs1,
                                        size_t vl);
vuint16m1_t __riscv_vredand_vs_u16mf4_u16m1(vuint16mf4_t vs2, vuint16m1_t vs1,
                                            size_t vl);
vuint16m1_t __riscv_vredand_vs_u16mf2_u16m1(vuint16mf2_t vs2, vuint16m1_t vs1,
                                            size_t vl);
vuint16m1_t __riscv_vredand_vs_u16m1_u16m1(vuint16m1_t vs2, vuint16m1_t vs1,
                                           size_t vl);
vuint16m1_t __riscv_vredand_vs_u16m2_u16m1(vuint16m2_t vs2, vuint16m1_t vs1,
                                           size_t vl);
vuint16m1_t __riscv_vredand_vs_u16m4_u16m1(vuint16m4_t vs2, vuint16m1_t vs1,
                                           size_t vl);
vuint16m1_t __riscv_vredand_vs_u16m8_u16m1(vuint16m8_t vs2, vuint16m1_t vs1,
                                           size_t vl);
vuint32m1_t __riscv_vredand_vs_u32mf2_u32m1(vuint32mf2_t vs2, vuint32m1_t vs1,
                                            size_t vl);
vuint32m1_t __riscv_vredand_vs_u32m1_u32m1(vuint32m1_t vs2, vuint32m1_t vs1,
                                           size_t vl);
vuint32m1_t __riscv_vredand_vs_u32m2_u32m1(vuint32m2_t vs2, vuint32m1_t vs1,
                                           size_t vl);
vuint32m1_t __riscv_vredand_vs_u32m4_u32m1(vuint32m4_t vs2, vuint32m1_t vs1,
                                           size_t vl);
vuint32m1_t __riscv_vredand_vs_u32m8_u32m1(vuint32m8_t vs2, vuint32m1_t vs1,
                                           size_t vl);
vuint64m1_t __riscv_vredand_vs_u64m1_u64m1(vuint64m1_t vs2, vuint64m1_t vs1,
                                           size_t vl);
vuint64m1_t __riscv_vredand_vs_u64m2_u64m1(vuint64m2_t vs2, vuint64m1_t vs1,
                                           size_t vl);
vuint64m1_t __riscv_vredand_vs_u64m4_u64m1(vuint64m4_t vs2, vuint64m1_t vs1,
                                           size_t vl);
vuint64m1_t __riscv_vredand_vs_u64m8_u64m1(vuint64m8_t vs2, vuint64m1_t vs1,
                                           size_t vl);
vuint8m1_t __riscv_vredor_vs_u8mf8_u8m1(vuint8mf8_t vs2, vuint8m1_t vs1,
                                        size_t vl);
vuint8m1_t __riscv_vredor_vs_u8mf4_u8m1(vuint8mf4_t vs2, vuint8m1_t vs1,
                                        size_t vl);
vuint8m1_t __riscv_vredor_vs_u8mf2_u8m1(vuint8mf2_t vs2, vuint8m1_t vs1,
                                        size_t vl);
vuint8m1_t __riscv_vredor_vs_u8m1_u8m1(vuint8m1_t vs2, vuint8m1_t vs1,
                                       size_t vl);
vuint8m1_t __riscv_vredor_vs_u8m2_u8m1(vuint8m2_t vs2, vuint8m1_t vs1,
                                       size_t vl);
vuint8m1_t __riscv_vredor_vs_u8m4_u8m1(vuint8m4_t vs2, vuint8m1_t vs1,
                                       size_t vl);
vuint8m1_t __riscv_vredor_vs_u8m8_u8m1(vuint8m8_t vs2, vuint8m1_t vs1,
                                       size_t vl);
vuint16m1_t __riscv_vredor_vs_u16mf4_u16m1(vuint16mf4_t vs2, vuint16m1_t vs1,
                                           size_t vl);
vuint16m1_t __riscv_vredor_vs_u16mf2_u16m1(vuint16mf2_t vs2, vuint16m1_t vs1,
                                           size_t vl);
vuint16m1_t __riscv_vredor_vs_u16m1_u16m1(vuint16m1_t vs2, vuint16m1_t vs1,
                                          size_t vl);
vuint16m1_t __riscv_vredor_vs_u16m2_u16m1(vuint16m2_t vs2, vuint16m1_t vs1,
                                          size_t vl);
vuint16m1_t __riscv_vredor_vs_u16m4_u16m1(vuint16m4_t vs2, vuint16m1_t vs1,
                                          size_t vl);
vuint16m1_t __riscv_vredor_vs_u16m8_u16m1(vuint16m8_t vs2, vuint16m1_t vs1,
                                          size_t vl);
vuint32m1_t __riscv_vredor_vs_u32mf2_u32m1(vuint32mf2_t vs2, vuint32m1_t vs1,
                                           size_t vl);
vuint32m1_t __riscv_vredor_vs_u32m1_u32m1(vuint32m1_t vs2, vuint32m1_t vs1,
                                          size_t vl);
vuint32m1_t __riscv_vredor_vs_u32m2_u32m1(vuint32m2_t vs2, vuint32m1_t vs1,
                                          size_t vl);
vuint32m1_t __riscv_vredor_vs_u32m4_u32m1(vuint32m4_t vs2, vuint32m1_t vs1,
                                          size_t vl);
vuint32m1_t __riscv_vredor_vs_u32m8_u32m1(vuint32m8_t vs2, vuint32m1_t vs1,
                                          size_t vl);
vuint64m1_t __riscv_vredor_vs_u64m1_u64m1(vuint64m1_t vs2, vuint64m1_t vs1,
                                          size_t vl);
vuint64m1_t __riscv_vredor_vs_u64m2_u64m1(vuint64m2_t vs2, vuint64m1_t vs1,
                                          size_t vl);
vuint64m1_t __riscv_vredor_vs_u64m4_u64m1(vuint64m4_t vs2, vuint64m1_t vs1,
                                          size_t vl);
vuint64m1_t __riscv_vredor_vs_u64m8_u64m1(vuint64m8_t vs2, vuint64m1_t vs1,
                                          size_t vl);
vuint8m1_t __riscv_vredxor_vs_u8mf8_u8m1(vuint8mf8_t vs2, vuint8m1_t vs1,
                                         size_t vl);
vuint8m1_t __riscv_vredxor_vs_u8mf4_u8m1(vuint8mf4_t vs2, vuint8m1_t vs1,
                                         size_t vl);
vuint8m1_t __riscv_vredxor_vs_u8mf2_u8m1(vuint8mf2_t vs2, vuint8m1_t vs1,
                                         size_t vl);
vuint8m1_t __riscv_vredxor_vs_u8m1_u8m1(vuint8m1_t vs2, vuint8m1_t vs1,
                                        size_t vl);
vuint8m1_t __riscv_vredxor_vs_u8m2_u8m1(vuint8m2_t vs2, vuint8m1_t vs1,
                                        size_t vl);
vuint8m1_t __riscv_vredxor_vs_u8m4_u8m1(vuint8m4_t vs2, vuint8m1_t vs1,
                                        size_t vl);
vuint8m1_t __riscv_vredxor_vs_u8m8_u8m1(vuint8m8_t vs2, vuint8m1_t vs1,
                                        size_t vl);
vuint16m1_t __riscv_vredxor_vs_u16mf4_u16m1(vuint16mf4_t vs2, vuint16m1_t vs1,
                                            size_t vl);
vuint16m1_t __riscv_vredxor_vs_u16mf2_u16m1(vuint16mf2_t vs2, vuint16m1_t vs1,
                                            size_t vl);
vuint16m1_t __riscv_vredxor_vs_u16m1_u16m1(vuint16m1_t vs2, vuint16m1_t vs1,
                                           size_t vl);
vuint16m1_t __riscv_vredxor_vs_u16m2_u16m1(vuint16m2_t vs2, vuint16m1_t vs1,
                                           size_t vl);
vuint16m1_t __riscv_vredxor_vs_u16m4_u16m1(vuint16m4_t vs2, vuint16m1_t vs1,
                                           size_t vl);
vuint16m1_t __riscv_vredxor_vs_u16m8_u16m1(vuint16m8_t vs2, vuint16m1_t vs1,
                                           size_t vl);
vuint32m1_t __riscv_vredxor_vs_u32mf2_u32m1(vuint32mf2_t vs2, vuint32m1_t vs1,
                                            size_t vl);
vuint32m1_t __riscv_vredxor_vs_u32m1_u32m1(vuint32m1_t vs2, vuint32m1_t vs1,
                                           size_t vl);
vuint32m1_t __riscv_vredxor_vs_u32m2_u32m1(vuint32m2_t vs2, vuint32m1_t vs1,
                                           size_t vl);
vuint32m1_t __riscv_vredxor_vs_u32m4_u32m1(vuint32m4_t vs2, vuint32m1_t vs1,
                                           size_t vl);
vuint32m1_t __riscv_vredxor_vs_u32m8_u32m1(vuint32m8_t vs2, vuint32m1_t vs1,
                                           size_t vl);
vuint64m1_t __riscv_vredxor_vs_u64m1_u64m1(vuint64m1_t vs2, vuint64m1_t vs1,
                                           size_t vl);
vuint64m1_t __riscv_vredxor_vs_u64m2_u64m1(vuint64m2_t vs2, vuint64m1_t vs1,
                                           size_t vl);
vuint64m1_t __riscv_vredxor_vs_u64m4_u64m1(vuint64m4_t vs2, vuint64m1_t vs1,
                                           size_t vl);
vuint64m1_t __riscv_vredxor_vs_u64m8_u64m1(vuint64m8_t vs2, vuint64m1_t vs1,
                                           size_t vl);
// masked functions
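// Hedged usage sketch (the helper below is illustrative, not part of this
// listing): the _m variants take a mask vm as their first operand, so only
// the elements of vs2 whose mask bit is set take part in the reduction,
// while vs1[0] still provides the initial value. Assumes the same headers
// as the unmasked example above (<riscv_vector.h>, <stddef.h>, <stdint.h>).
static inline int32_t sum_nonneg_i32(const int32_t *a, size_t n) {
  vint32m1_t acc = __riscv_vmv_s_x_i32m1(0, 1);
  for (size_t vl; n > 0; n -= vl, a += vl) {
    vl = __riscv_vsetvl_e32m1(n);
    vint32m1_t v = __riscv_vle32_v_i32m1(a, vl);
    vbool32_t keep = __riscv_vmsge_vx_i32m1_b32(v, 0, vl);     // keep only a[i] >= 0
    acc = __riscv_vredsum_vs_i32m1_i32m1_m(keep, v, acc, vl);  // masked sum into acc[0]
  }
  return __riscv_vmv_x_s_i32m1_i32(acc);
}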
vint8m1_t __riscv_vredsum_vs_i8mf8_i8m1_m(vbool64_t vm, vint8mf8_t vs2,
                                          vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredsum_vs_i8mf4_i8m1_m(vbool32_t vm, vint8mf4_t vs2,
                                          vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredsum_vs_i8mf2_i8m1_m(vbool16_t vm, vint8mf2_t vs2,
                                          vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredsum_vs_i8m1_i8m1_m(vbool8_t vm, vint8m1_t vs2,
                                         vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredsum_vs_i8m2_i8m1_m(vbool4_t vm, vint8m2_t vs2,
                                         vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredsum_vs_i8m4_i8m1_m(vbool2_t vm, vint8m4_t vs2,
                                         vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredsum_vs_i8m8_i8m1_m(vbool1_t vm, vint8m8_t vs2,
                                         vint8m1_t vs1, size_t vl);
vint16m1_t __riscv_vredsum_vs_i16mf4_i16m1_m(vbool64_t vm, vint16mf4_t vs2,
                                             vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredsum_vs_i16mf2_i16m1_m(vbool32_t vm, vint16mf2_t vs2,
                                             vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredsum_vs_i16m1_i16m1_m(vbool16_t vm, vint16m1_t vs2,
                                            vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredsum_vs_i16m2_i16m1_m(vbool8_t vm, vint16m2_t vs2,
                                            vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredsum_vs_i16m4_i16m1_m(vbool4_t vm, vint16m4_t vs2,
                                            vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredsum_vs_i16m8_i16m1_m(vbool2_t vm, vint16m8_t vs2,
                                            vint16m1_t vs1, size_t vl);
vint32m1_t __riscv_vredsum_vs_i32mf2_i32m1_m(vbool64_t vm, vint32mf2_t vs2,
                                             vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredsum_vs_i32m1_i32m1_m(vbool32_t vm, vint32m1_t vs2,
                                            vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredsum_vs_i32m2_i32m1_m(vbool16_t vm, vint32m2_t vs2,
                                            vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredsum_vs_i32m4_i32m1_m(vbool8_t vm, vint32m4_t vs2,
                                            vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredsum_vs_i32m8_i32m1_m(vbool4_t vm, vint32m8_t vs2,
                                            vint32m1_t vs1, size_t vl);
vint64m1_t __riscv_vredsum_vs_i64m1_i64m1_m(vbool64_t vm, vint64m1_t vs2,
                                            vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredsum_vs_i64m2_i64m1_m(vbool32_t vm, vint64m2_t vs2,
                                            vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredsum_vs_i64m4_i64m1_m(vbool16_t vm, vint64m4_t vs2,
                                            vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredsum_vs_i64m8_i64m1_m(vbool8_t vm, vint64m8_t vs2,
                                            vint64m1_t vs1, size_t vl);
vint8m1_t __riscv_vredmax_vs_i8mf8_i8m1_m(vbool64_t vm, vint8mf8_t vs2,
                                          vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredmax_vs_i8mf4_i8m1_m(vbool32_t vm, vint8mf4_t vs2,
                                          vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredmax_vs_i8mf2_i8m1_m(vbool16_t vm, vint8mf2_t vs2,
                                          vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredmax_vs_i8m1_i8m1_m(vbool8_t vm, vint8m1_t vs2,
                                         vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredmax_vs_i8m2_i8m1_m(vbool4_t vm, vint8m2_t vs2,
                                         vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredmax_vs_i8m4_i8m1_m(vbool2_t vm, vint8m4_t vs2,
                                         vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredmax_vs_i8m8_i8m1_m(vbool1_t vm, vint8m8_t vs2,
                                         vint8m1_t vs1, size_t vl);
vint16m1_t __riscv_vredmax_vs_i16mf4_i16m1_m(vbool64_t vm, vint16mf4_t vs2,
                                             vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredmax_vs_i16mf2_i16m1_m(vbool32_t vm, vint16mf2_t vs2,
                                             vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredmax_vs_i16m1_i16m1_m(vbool16_t vm, vint16m1_t vs2,
                                            vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredmax_vs_i16m2_i16m1_m(vbool8_t vm, vint16m2_t vs2,
                                            vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredmax_vs_i16m4_i16m1_m(vbool4_t vm, vint16m4_t vs2,
                                            vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredmax_vs_i16m8_i16m1_m(vbool2_t vm, vint16m8_t vs2,
                                            vint16m1_t vs1, size_t vl);
vint32m1_t __riscv_vredmax_vs_i32mf2_i32m1_m(vbool64_t vm, vint32mf2_t vs2,
                                             vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredmax_vs_i32m1_i32m1_m(vbool32_t vm, vint32m1_t vs2,
                                            vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredmax_vs_i32m2_i32m1_m(vbool16_t vm, vint32m2_t vs2,
                                            vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredmax_vs_i32m4_i32m1_m(vbool8_t vm, vint32m4_t vs2,
                                            vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredmax_vs_i32m8_i32m1_m(vbool4_t vm, vint32m8_t vs2,
                                            vint32m1_t vs1, size_t vl);
vint64m1_t __riscv_vredmax_vs_i64m1_i64m1_m(vbool64_t vm, vint64m1_t vs2,
                                            vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredmax_vs_i64m2_i64m1_m(vbool32_t vm, vint64m2_t vs2,
                                            vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredmax_vs_i64m4_i64m1_m(vbool16_t vm, vint64m4_t vs2,
                                            vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredmax_vs_i64m8_i64m1_m(vbool8_t vm, vint64m8_t vs2,
                                            vint64m1_t vs1, size_t vl);
vint8m1_t __riscv_vredmin_vs_i8mf8_i8m1_m(vbool64_t vm, vint8mf8_t vs2,
                                          vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredmin_vs_i8mf4_i8m1_m(vbool32_t vm, vint8mf4_t vs2,
                                          vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredmin_vs_i8mf2_i8m1_m(vbool16_t vm, vint8mf2_t vs2,
                                          vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredmin_vs_i8m1_i8m1_m(vbool8_t vm, vint8m1_t vs2,
                                         vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredmin_vs_i8m2_i8m1_m(vbool4_t vm, vint8m2_t vs2,
                                         vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredmin_vs_i8m4_i8m1_m(vbool2_t vm, vint8m4_t vs2,
                                         vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredmin_vs_i8m8_i8m1_m(vbool1_t vm, vint8m8_t vs2,
                                         vint8m1_t vs1, size_t vl);
vint16m1_t __riscv_vredmin_vs_i16mf4_i16m1_m(vbool64_t vm, vint16mf4_t vs2,
                                             vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredmin_vs_i16mf2_i16m1_m(vbool32_t vm, vint16mf2_t vs2,
                                             vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredmin_vs_i16m1_i16m1_m(vbool16_t vm, vint16m1_t vs2,
                                            vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredmin_vs_i16m2_i16m1_m(vbool8_t vm, vint16m2_t vs2,
                                            vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredmin_vs_i16m4_i16m1_m(vbool4_t vm, vint16m4_t vs2,
                                            vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredmin_vs_i16m8_i16m1_m(vbool2_t vm, vint16m8_t vs2,
                                            vint16m1_t vs1, size_t vl);
vint32m1_t __riscv_vredmin_vs_i32mf2_i32m1_m(vbool64_t vm, vint32mf2_t vs2,
                                             vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredmin_vs_i32m1_i32m1_m(vbool32_t vm, vint32m1_t vs2,
                                            vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredmin_vs_i32m2_i32m1_m(vbool16_t vm, vint32m2_t vs2,
                                            vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredmin_vs_i32m4_i32m1_m(vbool8_t vm, vint32m4_t vs2,
                                            vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredmin_vs_i32m8_i32m1_m(vbool4_t vm, vint32m8_t vs2,
                                            vint32m1_t vs1, size_t vl);
vint64m1_t __riscv_vredmin_vs_i64m1_i64m1_m(vbool64_t vm, vint64m1_t vs2,
                                            vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredmin_vs_i64m2_i64m1_m(vbool32_t vm, vint64m2_t vs2,
                                            vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredmin_vs_i64m4_i64m1_m(vbool16_t vm, vint64m4_t vs2,
                                            vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredmin_vs_i64m8_i64m1_m(vbool8_t vm, vint64m8_t vs2,
                                            vint64m1_t vs1, size_t vl);
vint8m1_t __riscv_vredand_vs_i8mf8_i8m1_m(vbool64_t vm, vint8mf8_t vs2,
                                          vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredand_vs_i8mf4_i8m1_m(vbool32_t vm, vint8mf4_t vs2,
                                          vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredand_vs_i8mf2_i8m1_m(vbool16_t vm, vint8mf2_t vs2,
                                          vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredand_vs_i8m1_i8m1_m(vbool8_t vm, vint8m1_t vs2,
                                         vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredand_vs_i8m2_i8m1_m(vbool4_t vm, vint8m2_t vs2,
                                         vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredand_vs_i8m4_i8m1_m(vbool2_t vm, vint8m4_t vs2,
                                         vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredand_vs_i8m8_i8m1_m(vbool1_t vm, vint8m8_t vs2,
                                         vint8m1_t vs1, size_t vl);
vint16m1_t __riscv_vredand_vs_i16mf4_i16m1_m(vbool64_t vm, vint16mf4_t vs2,
                                             vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredand_vs_i16mf2_i16m1_m(vbool32_t vm, vint16mf2_t vs2,
                                             vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredand_vs_i16m1_i16m1_m(vbool16_t vm, vint16m1_t vs2,
                                            vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredand_vs_i16m2_i16m1_m(vbool8_t vm, vint16m2_t vs2,
                                            vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredand_vs_i16m4_i16m1_m(vbool4_t vm, vint16m4_t vs2,
                                            vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredand_vs_i16m8_i16m1_m(vbool2_t vm, vint16m8_t vs2,
                                            vint16m1_t vs1, size_t vl);
vint32m1_t __riscv_vredand_vs_i32mf2_i32m1_m(vbool64_t vm, vint32mf2_t vs2,
                                             vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredand_vs_i32m1_i32m1_m(vbool32_t vm, vint32m1_t vs2,
                                            vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredand_vs_i32m2_i32m1_m(vbool16_t vm, vint32m2_t vs2,
                                            vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredand_vs_i32m4_i32m1_m(vbool8_t vm, vint32m4_t vs2,
                                            vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredand_vs_i32m8_i32m1_m(vbool4_t vm, vint32m8_t vs2,
                                            vint32m1_t vs1, size_t vl);
vint64m1_t __riscv_vredand_vs_i64m1_i64m1_m(vbool64_t vm, vint64m1_t vs2,
                                            vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredand_vs_i64m2_i64m1_m(vbool32_t vm, vint64m2_t vs2,
                                            vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredand_vs_i64m4_i64m1_m(vbool16_t vm, vint64m4_t vs2,
                                            vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredand_vs_i64m8_i64m1_m(vbool8_t vm, vint64m8_t vs2,
                                            vint64m1_t vs1, size_t vl);
vint8m1_t __riscv_vredor_vs_i8mf8_i8m1_m(vbool64_t vm, vint8mf8_t vs2,
                                         vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredor_vs_i8mf4_i8m1_m(vbool32_t vm, vint8mf4_t vs2,
                                         vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredor_vs_i8mf2_i8m1_m(vbool16_t vm, vint8mf2_t vs2,
                                         vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredor_vs_i8m1_i8m1_m(vbool8_t vm, vint8m1_t vs2,
                                        vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredor_vs_i8m2_i8m1_m(vbool4_t vm, vint8m2_t vs2,
                                        vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredor_vs_i8m4_i8m1_m(vbool2_t vm, vint8m4_t vs2,
                                        vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredor_vs_i8m8_i8m1_m(vbool1_t vm, vint8m8_t vs2,
                                        vint8m1_t vs1, size_t vl);
vint16m1_t __riscv_vredor_vs_i16mf4_i16m1_m(vbool64_t vm, vint16mf4_t vs2,
                                            vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredor_vs_i16mf2_i16m1_m(vbool32_t vm, vint16mf2_t vs2,
                                            vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredor_vs_i16m1_i16m1_m(vbool16_t vm, vint16m1_t vs2,
                                           vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredor_vs_i16m2_i16m1_m(vbool8_t vm, vint16m2_t vs2,
                                           vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredor_vs_i16m4_i16m1_m(vbool4_t vm, vint16m4_t vs2,
                                           vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredor_vs_i16m8_i16m1_m(vbool2_t vm, vint16m8_t vs2,
                                           vint16m1_t vs1, size_t vl);
vint32m1_t __riscv_vredor_vs_i32mf2_i32m1_m(vbool64_t vm, vint32mf2_t vs2,
                                            vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredor_vs_i32m1_i32m1_m(vbool32_t vm, vint32m1_t vs2,
                                           vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredor_vs_i32m2_i32m1_m(vbool16_t vm, vint32m2_t vs2,
                                           vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredor_vs_i32m4_i32m1_m(vbool8_t vm, vint32m4_t vs2,
                                           vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredor_vs_i32m8_i32m1_m(vbool4_t vm, vint32m8_t vs2,
                                           vint32m1_t vs1, size_t vl);
vint64m1_t __riscv_vredor_vs_i64m1_i64m1_m(vbool64_t vm, vint64m1_t vs2,
                                           vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredor_vs_i64m2_i64m1_m(vbool32_t vm, vint64m2_t vs2,
                                           vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredor_vs_i64m4_i64m1_m(vbool16_t vm, vint64m4_t vs2,
                                           vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredor_vs_i64m8_i64m1_m(vbool8_t vm, vint64m8_t vs2,
                                           vint64m1_t vs1, size_t vl);
vint8m1_t __riscv_vredxor_vs_i8mf8_i8m1_m(vbool64_t vm, vint8mf8_t vs2,
                                          vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredxor_vs_i8mf4_i8m1_m(vbool32_t vm, vint8mf4_t vs2,
                                          vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredxor_vs_i8mf2_i8m1_m(vbool16_t vm, vint8mf2_t vs2,
                                          vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredxor_vs_i8m1_i8m1_m(vbool8_t vm, vint8m1_t vs2,
                                         vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredxor_vs_i8m2_i8m1_m(vbool4_t vm, vint8m2_t vs2,
                                         vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredxor_vs_i8m4_i8m1_m(vbool2_t vm, vint8m4_t vs2,
                                         vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredxor_vs_i8m8_i8m1_m(vbool1_t vm, vint8m8_t vs2,
                                         vint8m1_t vs1, size_t vl);
vint16m1_t __riscv_vredxor_vs_i16mf4_i16m1_m(vbool64_t vm, vint16mf4_t vs2,
                                             vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredxor_vs_i16mf2_i16m1_m(vbool32_t vm, vint16mf2_t vs2,
                                             vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredxor_vs_i16m1_i16m1_m(vbool16_t vm, vint16m1_t vs2,
                                            vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredxor_vs_i16m2_i16m1_m(vbool8_t vm, vint16m2_t vs2,
                                            vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredxor_vs_i16m4_i16m1_m(vbool4_t vm, vint16m4_t vs2,
                                            vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredxor_vs_i16m8_i16m1_m(vbool2_t vm, vint16m8_t vs2,
                                            vint16m1_t vs1, size_t vl);
vint32m1_t __riscv_vredxor_vs_i32mf2_i32m1_m(vbool64_t vm, vint32mf2_t vs2,
                                             vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredxor_vs_i32m1_i32m1_m(vbool32_t vm, vint32m1_t vs2,
                                            vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredxor_vs_i32m2_i32m1_m(vbool16_t vm, vint32m2_t vs2,
                                            vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredxor_vs_i32m4_i32m1_m(vbool8_t vm, vint32m4_t vs2,
                                            vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredxor_vs_i32m8_i32m1_m(vbool4_t vm, vint32m8_t vs2,
                                            vint32m1_t vs1, size_t vl);
vint64m1_t __riscv_vredxor_vs_i64m1_i64m1_m(vbool64_t vm, vint64m1_t vs2,
                                            vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredxor_vs_i64m2_i64m1_m(vbool32_t vm, vint64m2_t vs2,
                                            vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredxor_vs_i64m4_i64m1_m(vbool16_t vm, vint64m4_t vs2,
                                            vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredxor_vs_i64m8_i64m1_m(vbool8_t vm, vint64m8_t vs2,
                                            vint64m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredsum_vs_u8mf8_u8m1_m(vbool64_t vm, vuint8mf8_t vs2,
                                           vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredsum_vs_u8mf4_u8m1_m(vbool32_t vm, vuint8mf4_t vs2,
                                           vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredsum_vs_u8mf2_u8m1_m(vbool16_t vm, vuint8mf2_t vs2,
                                           vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredsum_vs_u8m1_u8m1_m(vbool8_t vm, vuint8m1_t vs2,
                                          vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredsum_vs_u8m2_u8m1_m(vbool4_t vm, vuint8m2_t vs2,
                                          vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredsum_vs_u8m4_u8m1_m(vbool2_t vm, vuint8m4_t vs2,
                                          vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredsum_vs_u8m8_u8m1_m(vbool1_t vm, vuint8m8_t vs2,
                                          vuint8m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredsum_vs_u16mf4_u16m1_m(vbool64_t vm, vuint16mf4_t vs2,
                                              vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredsum_vs_u16mf2_u16m1_m(vbool32_t vm, vuint16mf2_t vs2,
                                              vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredsum_vs_u16m1_u16m1_m(vbool16_t vm, vuint16m1_t vs2,
                                             vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredsum_vs_u16m2_u16m1_m(vbool8_t vm, vuint16m2_t vs2,
                                             vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredsum_vs_u16m4_u16m1_m(vbool4_t vm, vuint16m4_t vs2,
                                             vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredsum_vs_u16m8_u16m1_m(vbool2_t vm, vuint16m8_t vs2,
                                             vuint16m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredsum_vs_u32mf2_u32m1_m(vbool64_t vm, vuint32mf2_t vs2,
                                              vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredsum_vs_u32m1_u32m1_m(vbool32_t vm, vuint32m1_t vs2,
                                             vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredsum_vs_u32m2_u32m1_m(vbool16_t vm, vuint32m2_t vs2,
                                             vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredsum_vs_u32m4_u32m1_m(vbool8_t vm, vuint32m4_t vs2,
                                             vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredsum_vs_u32m8_u32m1_m(vbool4_t vm, vuint32m8_t vs2,
                                             vuint32m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredsum_vs_u64m1_u64m1_m(vbool64_t vm, vuint64m1_t vs2,
                                             vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredsum_vs_u64m2_u64m1_m(vbool32_t vm, vuint64m2_t vs2,
                                             vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredsum_vs_u64m4_u64m1_m(vbool16_t vm, vuint64m4_t vs2,
                                             vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredsum_vs_u64m8_u64m1_m(vbool8_t vm, vuint64m8_t vs2,
                                             vuint64m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredmaxu_vs_u8mf8_u8m1_m(vbool64_t vm, vuint8mf8_t vs2,
                                            vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredmaxu_vs_u8mf4_u8m1_m(vbool32_t vm, vuint8mf4_t vs2,
                                            vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredmaxu_vs_u8mf2_u8m1_m(vbool16_t vm, vuint8mf2_t vs2,
                                            vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredmaxu_vs_u8m1_u8m1_m(vbool8_t vm, vuint8m1_t vs2,
                                           vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredmaxu_vs_u8m2_u8m1_m(vbool4_t vm, vuint8m2_t vs2,
                                           vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredmaxu_vs_u8m4_u8m1_m(vbool2_t vm, vuint8m4_t vs2,
                                           vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredmaxu_vs_u8m8_u8m1_m(vbool1_t vm, vuint8m8_t vs2,
                                           vuint8m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredmaxu_vs_u16mf4_u16m1_m(vbool64_t vm, vuint16mf4_t vs2,
                                               vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredmaxu_vs_u16mf2_u16m1_m(vbool32_t vm, vuint16mf2_t vs2,
                                               vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredmaxu_vs_u16m1_u16m1_m(vbool16_t vm, vuint16m1_t vs2,
                                              vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredmaxu_vs_u16m2_u16m1_m(vbool8_t vm, vuint16m2_t vs2,
                                              vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredmaxu_vs_u16m4_u16m1_m(vbool4_t vm, vuint16m4_t vs2,
                                              vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredmaxu_vs_u16m8_u16m1_m(vbool2_t vm, vuint16m8_t vs2,
                                              vuint16m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredmaxu_vs_u32mf2_u32m1_m(vbool64_t vm, vuint32mf2_t vs2,
                                               vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredmaxu_vs_u32m1_u32m1_m(vbool32_t vm, vuint32m1_t vs2,
                                              vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredmaxu_vs_u32m2_u32m1_m(vbool16_t vm, vuint32m2_t vs2,
                                              vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredmaxu_vs_u32m4_u32m1_m(vbool8_t vm, vuint32m4_t vs2,
                                              vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredmaxu_vs_u32m8_u32m1_m(vbool4_t vm, vuint32m8_t vs2,
                                              vuint32m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredmaxu_vs_u64m1_u64m1_m(vbool64_t vm, vuint64m1_t vs2,
                                              vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredmaxu_vs_u64m2_u64m1_m(vbool32_t vm, vuint64m2_t vs2,
                                              vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredmaxu_vs_u64m4_u64m1_m(vbool16_t vm, vuint64m4_t vs2,
                                              vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredmaxu_vs_u64m8_u64m1_m(vbool8_t vm, vuint64m8_t vs2,
                                              vuint64m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredminu_vs_u8mf8_u8m1_m(vbool64_t vm, vuint8mf8_t vs2,
                                            vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredminu_vs_u8mf4_u8m1_m(vbool32_t vm, vuint8mf4_t vs2,
                                            vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredminu_vs_u8mf2_u8m1_m(vbool16_t vm, vuint8mf2_t vs2,
                                            vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredminu_vs_u8m1_u8m1_m(vbool8_t vm, vuint8m1_t vs2,
                                           vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredminu_vs_u8m2_u8m1_m(vbool4_t vm, vuint8m2_t vs2,
                                           vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredminu_vs_u8m4_u8m1_m(vbool2_t vm, vuint8m4_t vs2,
                                           vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredminu_vs_u8m8_u8m1_m(vbool1_t vm, vuint8m8_t vs2,
                                           vuint8m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredminu_vs_u16mf4_u16m1_m(vbool64_t vm, vuint16mf4_t vs2,
                                               vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredminu_vs_u16mf2_u16m1_m(vbool32_t vm, vuint16mf2_t vs2,
                                               vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredminu_vs_u16m1_u16m1_m(vbool16_t vm, vuint16m1_t vs2,
                                              vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredminu_vs_u16m2_u16m1_m(vbool8_t vm, vuint16m2_t vs2,
                                              vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredminu_vs_u16m4_u16m1_m(vbool4_t vm, vuint16m4_t vs2,
                                              vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredminu_vs_u16m8_u16m1_m(vbool2_t vm, vuint16m8_t vs2,
                                              vuint16m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredminu_vs_u32mf2_u32m1_m(vbool64_t vm, vuint32mf2_t vs2,
                                               vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredminu_vs_u32m1_u32m1_m(vbool32_t vm, vuint32m1_t vs2,
                                              vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredminu_vs_u32m2_u32m1_m(vbool16_t vm, vuint32m2_t vs2,
                                              vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredminu_vs_u32m4_u32m1_m(vbool8_t vm, vuint32m4_t vs2,
                                              vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredminu_vs_u32m8_u32m1_m(vbool4_t vm, vuint32m8_t vs2,
                                              vuint32m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredminu_vs_u64m1_u64m1_m(vbool64_t vm, vuint64m1_t vs2,
                                              vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredminu_vs_u64m2_u64m1_m(vbool32_t vm, vuint64m2_t vs2,
                                              vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredminu_vs_u64m4_u64m1_m(vbool16_t vm, vuint64m4_t vs2,
                                              vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredminu_vs_u64m8_u64m1_m(vbool8_t vm, vuint64m8_t vs2,
                                              vuint64m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredand_vs_u8mf8_u8m1_m(vbool64_t vm, vuint8mf8_t vs2,
                                           vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredand_vs_u8mf4_u8m1_m(vbool32_t vm, vuint8mf4_t vs2,
                                           vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredand_vs_u8mf2_u8m1_m(vbool16_t vm, vuint8mf2_t vs2,
                                           vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredand_vs_u8m1_u8m1_m(vbool8_t vm, vuint8m1_t vs2,
                                          vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredand_vs_u8m2_u8m1_m(vbool4_t vm, vuint8m2_t vs2,
                                          vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredand_vs_u8m4_u8m1_m(vbool2_t vm, vuint8m4_t vs2,
                                          vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredand_vs_u8m8_u8m1_m(vbool1_t vm, vuint8m8_t vs2,
                                          vuint8m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredand_vs_u16mf4_u16m1_m(vbool64_t vm, vuint16mf4_t vs2,
                                              vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredand_vs_u16mf2_u16m1_m(vbool32_t vm, vuint16mf2_t vs2,
                                              vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredand_vs_u16m1_u16m1_m(vbool16_t vm, vuint16m1_t vs2,
                                             vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredand_vs_u16m2_u16m1_m(vbool8_t vm, vuint16m2_t vs2,
                                             vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredand_vs_u16m4_u16m1_m(vbool4_t vm, vuint16m4_t vs2,
                                             vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredand_vs_u16m8_u16m1_m(vbool2_t vm, vuint16m8_t vs2,
                                             vuint16m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredand_vs_u32mf2_u32m1_m(vbool64_t vm, vuint32mf2_t vs2,
                                              vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredand_vs_u32m1_u32m1_m(vbool32_t vm, vuint32m1_t vs2,
                                             vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredand_vs_u32m2_u32m1_m(vbool16_t vm, vuint32m2_t vs2,
                                             vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredand_vs_u32m4_u32m1_m(vbool8_t vm, vuint32m4_t vs2,
                                             vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredand_vs_u32m8_u32m1_m(vbool4_t vm, vuint32m8_t vs2,
                                             vuint32m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredand_vs_u64m1_u64m1_m(vbool64_t vm, vuint64m1_t vs2,
                                             vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredand_vs_u64m2_u64m1_m(vbool32_t vm, vuint64m2_t vs2,
                                             vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredand_vs_u64m4_u64m1_m(vbool16_t vm, vuint64m4_t vs2,
                                             vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredand_vs_u64m8_u64m1_m(vbool8_t vm, vuint64m8_t vs2,
                                             vuint64m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredor_vs_u8mf8_u8m1_m(vbool64_t vm, vuint8mf8_t vs2,
                                          vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredor_vs_u8mf4_u8m1_m(vbool32_t vm, vuint8mf4_t vs2,
                                          vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredor_vs_u8mf2_u8m1_m(vbool16_t vm, vuint8mf2_t vs2,
                                          vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredor_vs_u8m1_u8m1_m(vbool8_t vm, vuint8m1_t vs2,
                                         vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredor_vs_u8m2_u8m1_m(vbool4_t vm, vuint8m2_t vs2,
                                         vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredor_vs_u8m4_u8m1_m(vbool2_t vm, vuint8m4_t vs2,
                                         vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredor_vs_u8m8_u8m1_m(vbool1_t vm, vuint8m8_t vs2,
                                         vuint8m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredor_vs_u16mf4_u16m1_m(vbool64_t vm, vuint16mf4_t vs2,
                                             vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredor_vs_u16mf2_u16m1_m(vbool32_t vm, vuint16mf2_t vs2,
                                             vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredor_vs_u16m1_u16m1_m(vbool16_t vm, vuint16m1_t vs2,
                                            vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredor_vs_u16m2_u16m1_m(vbool8_t vm, vuint16m2_t vs2,
                                            vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredor_vs_u16m4_u16m1_m(vbool4_t vm, vuint16m4_t vs2,
                                            vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredor_vs_u16m8_u16m1_m(vbool2_t vm, vuint16m8_t vs2,
                                            vuint16m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredor_vs_u32mf2_u32m1_m(vbool64_t vm, vuint32mf2_t vs2,
                                             vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredor_vs_u32m1_u32m1_m(vbool32_t vm, vuint32m1_t vs2,
                                            vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredor_vs_u32m2_u32m1_m(vbool16_t vm, vuint32m2_t vs2,
                                            vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredor_vs_u32m4_u32m1_m(vbool8_t vm, vuint32m4_t vs2,
                                            vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredor_vs_u32m8_u32m1_m(vbool4_t vm, vuint32m8_t vs2,
                                            vuint32m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredor_vs_u64m1_u64m1_m(vbool64_t vm, vuint64m1_t vs2,
                                            vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredor_vs_u64m2_u64m1_m(vbool32_t vm, vuint64m2_t vs2,
                                            vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredor_vs_u64m4_u64m1_m(vbool16_t vm, vuint64m4_t vs2,
                                            vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredor_vs_u64m8_u64m1_m(vbool8_t vm, vuint64m8_t vs2,
                                            vuint64m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredxor_vs_u8mf8_u8m1_m(vbool64_t vm, vuint8mf8_t vs2,
                                           vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredxor_vs_u8mf4_u8m1_m(vbool32_t vm, vuint8mf4_t vs2,
                                           vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredxor_vs_u8mf2_u8m1_m(vbool16_t vm, vuint8mf2_t vs2,
                                           vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredxor_vs_u8m1_u8m1_m(vbool8_t vm, vuint8m1_t vs2,
                                          vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredxor_vs_u8m2_u8m1_m(vbool4_t vm, vuint8m2_t vs2,
                                          vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredxor_vs_u8m4_u8m1_m(vbool2_t vm, vuint8m4_t vs2,
                                          vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredxor_vs_u8m8_u8m1_m(vbool1_t vm, vuint8m8_t vs2,
                                          vuint8m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredxor_vs_u16mf4_u16m1_m(vbool64_t vm, vuint16mf4_t vs2,
                                              vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredxor_vs_u16mf2_u16m1_m(vbool32_t vm, vuint16mf2_t vs2,
                                              vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredxor_vs_u16m1_u16m1_m(vbool16_t vm, vuint16m1_t vs2,
                                             vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredxor_vs_u16m2_u16m1_m(vbool8_t vm, vuint16m2_t vs2,
                                             vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredxor_vs_u16m4_u16m1_m(vbool4_t vm, vuint16m4_t vs2,
                                             vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredxor_vs_u16m8_u16m1_m(vbool2_t vm, vuint16m8_t vs2,
                                             vuint16m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredxor_vs_u32mf2_u32m1_m(vbool64_t vm, vuint32mf2_t vs2,
                                              vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredxor_vs_u32m1_u32m1_m(vbool32_t vm, vuint32m1_t vs2,
                                             vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredxor_vs_u32m2_u32m1_m(vbool16_t vm, vuint32m2_t vs2,
                                             vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredxor_vs_u32m4_u32m1_m(vbool8_t vm, vuint32m4_t vs2,
                                             vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredxor_vs_u32m8_u32m1_m(vbool4_t vm, vuint32m8_t vs2,
                                             vuint32m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredxor_vs_u64m1_u64m1_m(vbool64_t vm, vuint64m1_t vs2,
                                             vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredxor_vs_u64m2_u64m1_m(vbool32_t vm, vuint64m2_t vs2,
                                             vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredxor_vs_u64m4_u64m1_m(vbool16_t vm, vuint64m4_t vs2,
                                             vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredxor_vs_u64m8_u64m1_m(vbool8_t vm, vuint64m8_t vs2,
                                             vuint64m1_t vs1, size_t vl);
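
The masked forms above reduce only the elements of vs2 whose bit in vm is set; vs1[0] still seeds the accumulation and the result is written to element 0 of the destination. The following is a minimal sketch that sums the uint32_t elements above a threshold; the vsetvl, load, compare, and scalar-move intrinsics it uses are assumed from the other sections of this API.

#include <riscv_vector.h>
#include <stdint.h>
#include <stddef.h>

// Sum only the elements of src[] that are greater than threshold.
uint32_t masked_sum_u32(const uint32_t *src, size_t n, uint32_t threshold) {
  uint32_t sum = 0;
  for (size_t i = 0; i < n;) {
    size_t vl = __riscv_vsetvl_e32m1(n - i);
    vuint32m1_t v = __riscv_vle32_v_u32m1(src + i, vl);
    // Mask selects which elements participate in the reduction.
    vbool32_t vm = __riscv_vmsgtu_vx_u32m1_b32(v, threshold, vl);
    // vs1[0] carries the running sum into the reduction.
    vuint32m1_t acc = __riscv_vmv_s_x_u32m1(sum, vl);
    vuint32m1_t red = __riscv_vredsum_vs_u32m1_u32m1_m(vm, v, acc, vl);
    sum = __riscv_vmv_x_s_u32m1_u32(red);
    i += vl;
  }
  return sum;
}

If the mask is all zero for a strip, the reduction simply returns vs1[0], so the running sum is preserved.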

Vector Widening Integer Reduction Intrinsics

vint16m1_t __riscv_vwredsum_vs_i8mf8_i16m1(vint8mf8_t vs2, vint16m1_t vs1,
                                           size_t vl);
vint16m1_t __riscv_vwredsum_vs_i8mf4_i16m1(vint8mf4_t vs2, vint16m1_t vs1,
                                           size_t vl);
vint16m1_t __riscv_vwredsum_vs_i8mf2_i16m1(vint8mf2_t vs2, vint16m1_t vs1,
                                           size_t vl);
vint16m1_t __riscv_vwredsum_vs_i8m1_i16m1(vint8m1_t vs2, vint16m1_t vs1,
                                          size_t vl);
vint16m1_t __riscv_vwredsum_vs_i8m2_i16m1(vint8m2_t vs2, vint16m1_t vs1,
                                          size_t vl);
vint16m1_t __riscv_vwredsum_vs_i8m4_i16m1(vint8m4_t vs2, vint16m1_t vs1,
                                          size_t vl);
vint16m1_t __riscv_vwredsum_vs_i8m8_i16m1(vint8m8_t vs2, vint16m1_t vs1,
                                          size_t vl);
vint32m1_t __riscv_vwredsum_vs_i16mf4_i32m1(vint16mf4_t vs2, vint32m1_t vs1,
                                            size_t vl);
vint32m1_t __riscv_vwredsum_vs_i16mf2_i32m1(vint16mf2_t vs2, vint32m1_t vs1,
                                            size_t vl);
vint32m1_t __riscv_vwredsum_vs_i16m1_i32m1(vint16m1_t vs2, vint32m1_t vs1,
                                           size_t vl);
vint32m1_t __riscv_vwredsum_vs_i16m2_i32m1(vint16m2_t vs2, vint32m1_t vs1,
                                           size_t vl);
vint32m1_t __riscv_vwredsum_vs_i16m4_i32m1(vint16m4_t vs2, vint32m1_t vs1,
                                           size_t vl);
vint32m1_t __riscv_vwredsum_vs_i16m8_i32m1(vint16m8_t vs2, vint32m1_t vs1,
                                           size_t vl);
vint64m1_t __riscv_vwredsum_vs_i32mf2_i64m1(vint32mf2_t vs2, vint64m1_t vs1,
                                            size_t vl);
vint64m1_t __riscv_vwredsum_vs_i32m1_i64m1(vint32m1_t vs2, vint64m1_t vs1,
                                           size_t vl);
vint64m1_t __riscv_vwredsum_vs_i32m2_i64m1(vint32m2_t vs2, vint64m1_t vs1,
                                           size_t vl);
vint64m1_t __riscv_vwredsum_vs_i32m4_i64m1(vint32m4_t vs2, vint64m1_t vs1,
                                           size_t vl);
vint64m1_t __riscv_vwredsum_vs_i32m8_i64m1(vint32m8_t vs2, vint64m1_t vs1,
                                           size_t vl);
vuint16m1_t __riscv_vwredsumu_vs_u8mf8_u16m1(vuint8mf8_t vs2, vuint16m1_t vs1,
                                             size_t vl);
vuint16m1_t __riscv_vwredsumu_vs_u8mf4_u16m1(vuint8mf4_t vs2, vuint16m1_t vs1,
                                             size_t vl);
vuint16m1_t __riscv_vwredsumu_vs_u8mf2_u16m1(vuint8mf2_t vs2, vuint16m1_t vs1,
                                             size_t vl);
vuint16m1_t __riscv_vwredsumu_vs_u8m1_u16m1(vuint8m1_t vs2, vuint16m1_t vs1,
                                            size_t vl);
vuint16m1_t __riscv_vwredsumu_vs_u8m2_u16m1(vuint8m2_t vs2, vuint16m1_t vs1,
                                            size_t vl);
vuint16m1_t __riscv_vwredsumu_vs_u8m4_u16m1(vuint8m4_t vs2, vuint16m1_t vs1,
                                            size_t vl);
vuint16m1_t __riscv_vwredsumu_vs_u8m8_u16m1(vuint8m8_t vs2, vuint16m1_t vs1,
                                            size_t vl);
vuint32m1_t __riscv_vwredsumu_vs_u16mf4_u32m1(vuint16mf4_t vs2, vuint32m1_t vs1,
                                              size_t vl);
vuint32m1_t __riscv_vwredsumu_vs_u16mf2_u32m1(vuint16mf2_t vs2, vuint32m1_t vs1,
                                              size_t vl);
vuint32m1_t __riscv_vwredsumu_vs_u16m1_u32m1(vuint16m1_t vs2, vuint32m1_t vs1,
                                             size_t vl);
vuint32m1_t __riscv_vwredsumu_vs_u16m2_u32m1(vuint16m2_t vs2, vuint32m1_t vs1,
                                             size_t vl);
vuint32m1_t __riscv_vwredsumu_vs_u16m4_u32m1(vuint16m4_t vs2, vuint32m1_t vs1,
                                             size_t vl);
vuint32m1_t __riscv_vwredsumu_vs_u16m8_u32m1(vuint16m8_t vs2, vuint32m1_t vs1,
                                             size_t vl);
vuint64m1_t __riscv_vwredsumu_vs_u32mf2_u64m1(vuint32mf2_t vs2, vuint64m1_t vs1,
                                              size_t vl);
vuint64m1_t __riscv_vwredsumu_vs_u32m1_u64m1(vuint32m1_t vs2, vuint64m1_t vs1,
                                             size_t vl);
vuint64m1_t __riscv_vwredsumu_vs_u32m2_u64m1(vuint32m2_t vs2, vuint64m1_t vs1,
                                             size_t vl);
vuint64m1_t __riscv_vwredsumu_vs_u32m4_u64m1(vuint32m4_t vs2, vuint64m1_t vs1,
                                             size_t vl);
vuint64m1_t __riscv_vwredsumu_vs_u32m8_u64m1(vuint32m8_t vs2, vuint64m1_t vs1,
                                             size_t vl);
// masked functions
vint16m1_t __riscv_vwredsum_vs_i8mf8_i16m1_m(vbool64_t vm, vint8mf8_t vs2,
                                             vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vwredsum_vs_i8mf4_i16m1_m(vbool32_t vm, vint8mf4_t vs2,
                                             vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vwredsum_vs_i8mf2_i16m1_m(vbool16_t vm, vint8mf2_t vs2,
                                             vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vwredsum_vs_i8m1_i16m1_m(vbool8_t vm, vint8m1_t vs2,
                                            vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vwredsum_vs_i8m2_i16m1_m(vbool4_t vm, vint8m2_t vs2,
                                            vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vwredsum_vs_i8m4_i16m1_m(vbool2_t vm, vint8m4_t vs2,
                                            vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vwredsum_vs_i8m8_i16m1_m(vbool1_t vm, vint8m8_t vs2,
                                            vint16m1_t vs1, size_t vl);
vint32m1_t __riscv_vwredsum_vs_i16mf4_i32m1_m(vbool64_t vm, vint16mf4_t vs2,
                                              vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vwredsum_vs_i16mf2_i32m1_m(vbool32_t vm, vint16mf2_t vs2,
                                              vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vwredsum_vs_i16m1_i32m1_m(vbool16_t vm, vint16m1_t vs2,
                                             vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vwredsum_vs_i16m2_i32m1_m(vbool8_t vm, vint16m2_t vs2,
                                             vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vwredsum_vs_i16m4_i32m1_m(vbool4_t vm, vint16m4_t vs2,
                                             vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vwredsum_vs_i16m8_i32m1_m(vbool2_t vm, vint16m8_t vs2,
                                             vint32m1_t vs1, size_t vl);
vint64m1_t __riscv_vwredsum_vs_i32mf2_i64m1_m(vbool64_t vm, vint32mf2_t vs2,
                                              vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vwredsum_vs_i32m1_i64m1_m(vbool32_t vm, vint32m1_t vs2,
                                             vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vwredsum_vs_i32m2_i64m1_m(vbool16_t vm, vint32m2_t vs2,
                                             vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vwredsum_vs_i32m4_i64m1_m(vbool8_t vm, vint32m4_t vs2,
                                             vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vwredsum_vs_i32m8_i64m1_m(vbool4_t vm, vint32m8_t vs2,
                                             vint64m1_t vs1, size_t vl);
vuint16m1_t __riscv_vwredsumu_vs_u8mf8_u16m1_m(vbool64_t vm, vuint8mf8_t vs2,
                                               vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vwredsumu_vs_u8mf4_u16m1_m(vbool32_t vm, vuint8mf4_t vs2,
                                               vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vwredsumu_vs_u8mf2_u16m1_m(vbool16_t vm, vuint8mf2_t vs2,
                                               vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vwredsumu_vs_u8m1_u16m1_m(vbool8_t vm, vuint8m1_t vs2,
                                              vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vwredsumu_vs_u8m2_u16m1_m(vbool4_t vm, vuint8m2_t vs2,
                                              vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vwredsumu_vs_u8m4_u16m1_m(vbool2_t vm, vuint8m4_t vs2,
                                              vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vwredsumu_vs_u8m8_u16m1_m(vbool1_t vm, vuint8m8_t vs2,
                                              vuint16m1_t vs1, size_t vl);
vuint32m1_t __riscv_vwredsumu_vs_u16mf4_u32m1_m(vbool64_t vm, vuint16mf4_t vs2,
                                                vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vwredsumu_vs_u16mf2_u32m1_m(vbool32_t vm, vuint16mf2_t vs2,
                                                vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vwredsumu_vs_u16m1_u32m1_m(vbool16_t vm, vuint16m1_t vs2,
                                               vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vwredsumu_vs_u16m2_u32m1_m(vbool8_t vm, vuint16m2_t vs2,
                                               vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vwredsumu_vs_u16m4_u32m1_m(vbool4_t vm, vuint16m4_t vs2,
                                               vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vwredsumu_vs_u16m8_u32m1_m(vbool2_t vm, vuint16m8_t vs2,
                                               vuint32m1_t vs1, size_t vl);
vuint64m1_t __riscv_vwredsumu_vs_u32mf2_u64m1_m(vbool64_t vm, vuint32mf2_t vs2,
                                                vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vwredsumu_vs_u32m1_u64m1_m(vbool32_t vm, vuint32m1_t vs2,
                                               vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vwredsumu_vs_u32m2_u64m1_m(vbool16_t vm, vuint32m2_t vs2,
                                               vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vwredsumu_vs_u32m4_u64m1_m(vbool8_t vm, vuint32m4_t vs2,
                                               vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vwredsumu_vs_u32m8_u64m1_m(vbool4_t vm, vuint32m8_t vs2,
                                               vuint64m1_t vs1, size_t vl);
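
A widening reduction accumulates SEW-wide source elements into a 2*SEW-wide scalar held in vs1[0], so no separate widening add is needed before reducing. Below is a minimal sketch that folds uint32_t data into a uint64_t running sum; the vsetvl, load, and scalar-move intrinsics are assumed from the other sections of this API.

#include <riscv_vector.h>
#include <stdint.h>
#include <stddef.h>

// Accumulate 32-bit unsigned elements into a 64-bit sum.
uint64_t wide_sum_u32(const uint32_t *src, size_t n) {
  uint64_t sum = 0;
  for (size_t i = 0; i < n;) {
    size_t vl = __riscv_vsetvl_e32m8(n - i);
    vuint32m8_t v = __riscv_vle32_v_u32m8(src + i, vl);
    // vs1 holds the 64-bit running sum in element 0.
    vuint64m1_t acc = __riscv_vmv_s_x_u64m1(sum, 1);
    vuint64m1_t red = __riscv_vwredsumu_vs_u32m8_u64m1(v, acc, vl);
    sum = __riscv_vmv_x_s_u64m1_u64(red);
    i += vl;
  }
  return sum;
}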

Vector Single-Width Floating-Point Reduction Intrinsics

vfloat16m1_t __riscv_vfredosum_vs_f16mf4_f16m1(vfloat16mf4_t vs2,
                                               vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredosum_vs_f16mf2_f16m1(vfloat16mf2_t vs2,
                                               vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredosum_vs_f16m1_f16m1(vfloat16m1_t vs2,
                                              vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredosum_vs_f16m2_f16m1(vfloat16m2_t vs2,
                                              vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredosum_vs_f16m4_f16m1(vfloat16m4_t vs2,
                                              vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredosum_vs_f16m8_f16m1(vfloat16m8_t vs2,
                                              vfloat16m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredosum_vs_f32mf2_f32m1(vfloat32mf2_t vs2,
                                               vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredosum_vs_f32m1_f32m1(vfloat32m1_t vs2,
                                              vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredosum_vs_f32m2_f32m1(vfloat32m2_t vs2,
                                              vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredosum_vs_f32m4_f32m1(vfloat32m4_t vs2,
                                              vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredosum_vs_f32m8_f32m1(vfloat32m8_t vs2,
                                              vfloat32m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredosum_vs_f64m1_f64m1(vfloat64m1_t vs2,
                                              vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredosum_vs_f64m2_f64m1(vfloat64m2_t vs2,
                                              vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredosum_vs_f64m4_f64m1(vfloat64m4_t vs2,
                                              vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredosum_vs_f64m8_f64m1(vfloat64m8_t vs2,
                                              vfloat64m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredusum_vs_f16mf4_f16m1(vfloat16mf4_t vs2,
                                               vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredusum_vs_f16mf2_f16m1(vfloat16mf2_t vs2,
                                               vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredusum_vs_f16m1_f16m1(vfloat16m1_t vs2,
                                              vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredusum_vs_f16m2_f16m1(vfloat16m2_t vs2,
                                              vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredusum_vs_f16m4_f16m1(vfloat16m4_t vs2,
                                              vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredusum_vs_f16m8_f16m1(vfloat16m8_t vs2,
                                              vfloat16m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredusum_vs_f32mf2_f32m1(vfloat32mf2_t vs2,
                                               vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredusum_vs_f32m1_f32m1(vfloat32m1_t vs2,
                                              vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredusum_vs_f32m2_f32m1(vfloat32m2_t vs2,
                                              vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredusum_vs_f32m4_f32m1(vfloat32m4_t vs2,
                                              vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredusum_vs_f32m8_f32m1(vfloat32m8_t vs2,
                                              vfloat32m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredusum_vs_f64m1_f64m1(vfloat64m1_t vs2,
                                              vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredusum_vs_f64m2_f64m1(vfloat64m2_t vs2,
                                              vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredusum_vs_f64m4_f64m1(vfloat64m4_t vs2,
                                              vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredusum_vs_f64m8_f64m1(vfloat64m8_t vs2,
                                              vfloat64m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredmax_vs_f16mf4_f16m1(vfloat16mf4_t vs2,
                                              vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredmax_vs_f16mf2_f16m1(vfloat16mf2_t vs2,
                                              vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredmax_vs_f16m1_f16m1(vfloat16m1_t vs2, vfloat16m1_t vs1,
                                             size_t vl);
vfloat16m1_t __riscv_vfredmax_vs_f16m2_f16m1(vfloat16m2_t vs2, vfloat16m1_t vs1,
                                             size_t vl);
vfloat16m1_t __riscv_vfredmax_vs_f16m4_f16m1(vfloat16m4_t vs2, vfloat16m1_t vs1,
                                             size_t vl);
vfloat16m1_t __riscv_vfredmax_vs_f16m8_f16m1(vfloat16m8_t vs2, vfloat16m1_t vs1,
                                             size_t vl);
vfloat32m1_t __riscv_vfredmax_vs_f32mf2_f32m1(vfloat32mf2_t vs2,
                                              vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredmax_vs_f32m1_f32m1(vfloat32m1_t vs2, vfloat32m1_t vs1,
                                             size_t vl);
vfloat32m1_t __riscv_vfredmax_vs_f32m2_f32m1(vfloat32m2_t vs2, vfloat32m1_t vs1,
                                             size_t vl);
vfloat32m1_t __riscv_vfredmax_vs_f32m4_f32m1(vfloat32m4_t vs2, vfloat32m1_t vs1,
                                             size_t vl);
vfloat32m1_t __riscv_vfredmax_vs_f32m8_f32m1(vfloat32m8_t vs2, vfloat32m1_t vs1,
                                             size_t vl);
vfloat64m1_t __riscv_vfredmax_vs_f64m1_f64m1(vfloat64m1_t vs2, vfloat64m1_t vs1,
                                             size_t vl);
vfloat64m1_t __riscv_vfredmax_vs_f64m2_f64m1(vfloat64m2_t vs2, vfloat64m1_t vs1,
                                             size_t vl);
vfloat64m1_t __riscv_vfredmax_vs_f64m4_f64m1(vfloat64m4_t vs2, vfloat64m1_t vs1,
                                             size_t vl);
vfloat64m1_t __riscv_vfredmax_vs_f64m8_f64m1(vfloat64m8_t vs2, vfloat64m1_t vs1,
                                             size_t vl);
vfloat16m1_t __riscv_vfredmin_vs_f16mf4_f16m1(vfloat16mf4_t vs2,
                                              vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredmin_vs_f16mf2_f16m1(vfloat16mf2_t vs2,
                                              vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredmin_vs_f16m1_f16m1(vfloat16m1_t vs2, vfloat16m1_t vs1,
                                             size_t vl);
vfloat16m1_t __riscv_vfredmin_vs_f16m2_f16m1(vfloat16m2_t vs2, vfloat16m1_t vs1,
                                             size_t vl);
vfloat16m1_t __riscv_vfredmin_vs_f16m4_f16m1(vfloat16m4_t vs2, vfloat16m1_t vs1,
                                             size_t vl);
vfloat16m1_t __riscv_vfredmin_vs_f16m8_f16m1(vfloat16m8_t vs2, vfloat16m1_t vs1,
                                             size_t vl);
vfloat32m1_t __riscv_vfredmin_vs_f32mf2_f32m1(vfloat32mf2_t vs2,
                                              vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredmin_vs_f32m1_f32m1(vfloat32m1_t vs2, vfloat32m1_t vs1,
                                             size_t vl);
vfloat32m1_t __riscv_vfredmin_vs_f32m2_f32m1(vfloat32m2_t vs2, vfloat32m1_t vs1,
                                             size_t vl);
vfloat32m1_t __riscv_vfredmin_vs_f32m4_f32m1(vfloat32m4_t vs2, vfloat32m1_t vs1,
                                             size_t vl);
vfloat32m1_t __riscv_vfredmin_vs_f32m8_f32m1(vfloat32m8_t vs2, vfloat32m1_t vs1,
                                             size_t vl);
vfloat64m1_t __riscv_vfredmin_vs_f64m1_f64m1(vfloat64m1_t vs2, vfloat64m1_t vs1,
                                             size_t vl);
vfloat64m1_t __riscv_vfredmin_vs_f64m2_f64m1(vfloat64m2_t vs2, vfloat64m1_t vs1,
                                             size_t vl);
vfloat64m1_t __riscv_vfredmin_vs_f64m4_f64m1(vfloat64m4_t vs2, vfloat64m1_t vs1,
                                             size_t vl);
vfloat64m1_t __riscv_vfredmin_vs_f64m8_f64m1(vfloat64m8_t vs2, vfloat64m1_t vs1,
                                             size_t vl);
// masked functions
vfloat16m1_t __riscv_vfredosum_vs_f16mf4_f16m1_m(vbool64_t vm,
                                                 vfloat16mf4_t vs2,
                                                 vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredosum_vs_f16mf2_f16m1_m(vbool32_t vm,
                                                 vfloat16mf2_t vs2,
                                                 vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredosum_vs_f16m1_f16m1_m(vbool16_t vm, vfloat16m1_t vs2,
                                                vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredosum_vs_f16m2_f16m1_m(vbool8_t vm, vfloat16m2_t vs2,
                                                vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredosum_vs_f16m4_f16m1_m(vbool4_t vm, vfloat16m4_t vs2,
                                                vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredosum_vs_f16m8_f16m1_m(vbool2_t vm, vfloat16m8_t vs2,
                                                vfloat16m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredosum_vs_f32mf2_f32m1_m(vbool64_t vm,
                                                 vfloat32mf2_t vs2,
                                                 vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredosum_vs_f32m1_f32m1_m(vbool32_t vm, vfloat32m1_t vs2,
                                                vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredosum_vs_f32m2_f32m1_m(vbool16_t vm, vfloat32m2_t vs2,
                                                vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredosum_vs_f32m4_f32m1_m(vbool8_t vm, vfloat32m4_t vs2,
                                                vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredosum_vs_f32m8_f32m1_m(vbool4_t vm, vfloat32m8_t vs2,
                                                vfloat32m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredosum_vs_f64m1_f64m1_m(vbool64_t vm, vfloat64m1_t vs2,
                                                vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredosum_vs_f64m2_f64m1_m(vbool32_t vm, vfloat64m2_t vs2,
                                                vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredosum_vs_f64m4_f64m1_m(vbool16_t vm, vfloat64m4_t vs2,
                                                vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredosum_vs_f64m8_f64m1_m(vbool8_t vm, vfloat64m8_t vs2,
                                                vfloat64m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredusum_vs_f16mf4_f16m1_m(vbool64_t vm,
                                                 vfloat16mf4_t vs2,
                                                 vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredusum_vs_f16mf2_f16m1_m(vbool32_t vm,
                                                 vfloat16mf2_t vs2,
                                                 vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredusum_vs_f16m1_f16m1_m(vbool16_t vm, vfloat16m1_t vs2,
                                                vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredusum_vs_f16m2_f16m1_m(vbool8_t vm, vfloat16m2_t vs2,
                                                vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredusum_vs_f16m4_f16m1_m(vbool4_t vm, vfloat16m4_t vs2,
                                                vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredusum_vs_f16m8_f16m1_m(vbool2_t vm, vfloat16m8_t vs2,
                                                vfloat16m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredusum_vs_f32mf2_f32m1_m(vbool64_t vm,
                                                 vfloat32mf2_t vs2,
                                                 vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredusum_vs_f32m1_f32m1_m(vbool32_t vm, vfloat32m1_t vs2,
                                                vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredusum_vs_f32m2_f32m1_m(vbool16_t vm, vfloat32m2_t vs2,
                                                vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredusum_vs_f32m4_f32m1_m(vbool8_t vm, vfloat32m4_t vs2,
                                                vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredusum_vs_f32m8_f32m1_m(vbool4_t vm, vfloat32m8_t vs2,
                                                vfloat32m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredusum_vs_f64m1_f64m1_m(vbool64_t vm, vfloat64m1_t vs2,
                                                vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredusum_vs_f64m2_f64m1_m(vbool32_t vm, vfloat64m2_t vs2,
                                                vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredusum_vs_f64m4_f64m1_m(vbool16_t vm, vfloat64m4_t vs2,
                                                vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredusum_vs_f64m8_f64m1_m(vbool8_t vm, vfloat64m8_t vs2,
                                                vfloat64m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredmax_vs_f16mf4_f16m1_m(vbool64_t vm, vfloat16mf4_t vs2,
                                                vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredmax_vs_f16mf2_f16m1_m(vbool32_t vm, vfloat16mf2_t vs2,
                                                vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredmax_vs_f16m1_f16m1_m(vbool16_t vm, vfloat16m1_t vs2,
                                               vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredmax_vs_f16m2_f16m1_m(vbool8_t vm, vfloat16m2_t vs2,
                                               vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredmax_vs_f16m4_f16m1_m(vbool4_t vm, vfloat16m4_t vs2,
                                               vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredmax_vs_f16m8_f16m1_m(vbool2_t vm, vfloat16m8_t vs2,
                                               vfloat16m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredmax_vs_f32mf2_f32m1_m(vbool64_t vm, vfloat32mf2_t vs2,
                                                vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredmax_vs_f32m1_f32m1_m(vbool32_t vm, vfloat32m1_t vs2,
                                               vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredmax_vs_f32m2_f32m1_m(vbool16_t vm, vfloat32m2_t vs2,
                                               vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredmax_vs_f32m4_f32m1_m(vbool8_t vm, vfloat32m4_t vs2,
                                               vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredmax_vs_f32m8_f32m1_m(vbool4_t vm, vfloat32m8_t vs2,
                                               vfloat32m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredmax_vs_f64m1_f64m1_m(vbool64_t vm, vfloat64m1_t vs2,
                                               vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredmax_vs_f64m2_f64m1_m(vbool32_t vm, vfloat64m2_t vs2,
                                               vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredmax_vs_f64m4_f64m1_m(vbool16_t vm, vfloat64m4_t vs2,
                                               vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredmax_vs_f64m8_f64m1_m(vbool8_t vm, vfloat64m8_t vs2,
                                               vfloat64m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredmin_vs_f16mf4_f16m1_m(vbool64_t vm, vfloat16mf4_t vs2,
                                                vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredmin_vs_f16mf2_f16m1_m(vbool32_t vm, vfloat16mf2_t vs2,
                                                vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredmin_vs_f16m1_f16m1_m(vbool16_t vm, vfloat16m1_t vs2,
                                               vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredmin_vs_f16m2_f16m1_m(vbool8_t vm, vfloat16m2_t vs2,
                                               vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredmin_vs_f16m4_f16m1_m(vbool4_t vm, vfloat16m4_t vs2,
                                               vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredmin_vs_f16m8_f16m1_m(vbool2_t vm, vfloat16m8_t vs2,
                                               vfloat16m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredmin_vs_f32mf2_f32m1_m(vbool64_t vm, vfloat32mf2_t vs2,
                                                vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredmin_vs_f32m1_f32m1_m(vbool32_t vm, vfloat32m1_t vs2,
                                               vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredmin_vs_f32m2_f32m1_m(vbool16_t vm, vfloat32m2_t vs2,
                                               vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredmin_vs_f32m4_f32m1_m(vbool8_t vm, vfloat32m4_t vs2,
                                               vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredmin_vs_f32m8_f32m1_m(vbool4_t vm, vfloat32m8_t vs2,
                                               vfloat32m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredmin_vs_f64m1_f64m1_m(vbool64_t vm, vfloat64m1_t vs2,
                                               vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredmin_vs_f64m2_f64m1_m(vbool32_t vm, vfloat64m2_t vs2,
                                               vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredmin_vs_f64m4_f64m1_m(vbool16_t vm, vfloat64m4_t vs2,
                                               vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredmin_vs_f64m8_f64m1_m(vbool8_t vm, vfloat64m8_t vs2,
                                               vfloat64m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredosum_vs_f16mf4_f16m1_rm(vfloat16mf4_t vs2,
                                                  vfloat16m1_t vs1,
                                                  unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfredosum_vs_f16mf2_f16m1_rm(vfloat16mf2_t vs2,
                                                  vfloat16m1_t vs1,
                                                  unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfredosum_vs_f16m1_f16m1_rm(vfloat16m1_t vs2,
                                                 vfloat16m1_t vs1,
                                                 unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfredosum_vs_f16m2_f16m1_rm(vfloat16m2_t vs2,
                                                 vfloat16m1_t vs1,
                                                 unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfredosum_vs_f16m4_f16m1_rm(vfloat16m4_t vs2,
                                                 vfloat16m1_t vs1,
                                                 unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfredosum_vs_f16m8_f16m1_rm(vfloat16m8_t vs2,
                                                 vfloat16m1_t vs1,
                                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfredosum_vs_f32mf2_f32m1_rm(vfloat32mf2_t vs2,
                                                  vfloat32m1_t vs1,
                                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfredosum_vs_f32m1_f32m1_rm(vfloat32m1_t vs2,
                                                 vfloat32m1_t vs1,
                                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfredosum_vs_f32m2_f32m1_rm(vfloat32m2_t vs2,
                                                 vfloat32m1_t vs1,
                                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfredosum_vs_f32m4_f32m1_rm(vfloat32m4_t vs2,
                                                 vfloat32m1_t vs1,
                                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfredosum_vs_f32m8_f32m1_rm(vfloat32m8_t vs2,
                                                 vfloat32m1_t vs1,
                                                 unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfredosum_vs_f64m1_f64m1_rm(vfloat64m1_t vs2,
                                                 vfloat64m1_t vs1,
                                                 unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfredosum_vs_f64m2_f64m1_rm(vfloat64m2_t vs2,
                                                 vfloat64m1_t vs1,
                                                 unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfredosum_vs_f64m4_f64m1_rm(vfloat64m4_t vs2,
                                                 vfloat64m1_t vs1,
                                                 unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfredosum_vs_f64m8_f64m1_rm(vfloat64m8_t vs2,
                                                 vfloat64m1_t vs1,
                                                 unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfredusum_vs_f16mf4_f16m1_rm(vfloat16mf4_t vs2,
                                                  vfloat16m1_t vs1,
                                                  unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfredusum_vs_f16mf2_f16m1_rm(vfloat16mf2_t vs2,
                                                  vfloat16m1_t vs1,
                                                  unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfredusum_vs_f16m1_f16m1_rm(vfloat16m1_t vs2,
                                                 vfloat16m1_t vs1,
                                                 unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfredusum_vs_f16m2_f16m1_rm(vfloat16m2_t vs2,
                                                 vfloat16m1_t vs1,
                                                 unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfredusum_vs_f16m4_f16m1_rm(vfloat16m4_t vs2,
                                                 vfloat16m1_t vs1,
                                                 unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfredusum_vs_f16m8_f16m1_rm(vfloat16m8_t vs2,
                                                 vfloat16m1_t vs1,
                                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfredusum_vs_f32mf2_f32m1_rm(vfloat32mf2_t vs2,
                                                  vfloat32m1_t vs1,
                                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfredusum_vs_f32m1_f32m1_rm(vfloat32m1_t vs2,
                                                 vfloat32m1_t vs1,
                                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfredusum_vs_f32m2_f32m1_rm(vfloat32m2_t vs2,
                                                 vfloat32m1_t vs1,
                                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfredusum_vs_f32m4_f32m1_rm(vfloat32m4_t vs2,
                                                 vfloat32m1_t vs1,
                                                 unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfredusum_vs_f32m8_f32m1_rm(vfloat32m8_t vs2,
                                                 vfloat32m1_t vs1,
                                                 unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfredusum_vs_f64m1_f64m1_rm(vfloat64m1_t vs2,
                                                 vfloat64m1_t vs1,
                                                 unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfredusum_vs_f64m2_f64m1_rm(vfloat64m2_t vs2,
                                                 vfloat64m1_t vs1,
                                                 unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfredusum_vs_f64m4_f64m1_rm(vfloat64m4_t vs2,
                                                 vfloat64m1_t vs1,
                                                 unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfredusum_vs_f64m8_f64m1_rm(vfloat64m8_t vs2,
                                                 vfloat64m1_t vs1,
                                                 unsigned int frm, size_t vl);
// masked functions
vfloat16m1_t __riscv_vfredosum_vs_f16mf4_f16m1_rm_m(vbool64_t vm,
                                                    vfloat16mf4_t vs2,
                                                    vfloat16m1_t vs1,
                                                    unsigned int frm,
                                                    size_t vl);
vfloat16m1_t __riscv_vfredosum_vs_f16mf2_f16m1_rm_m(vbool32_t vm,
                                                    vfloat16mf2_t vs2,
                                                    vfloat16m1_t vs1,
                                                    unsigned int frm,
                                                    size_t vl);
vfloat16m1_t __riscv_vfredosum_vs_f16m1_f16m1_rm_m(vbool16_t vm,
                                                   vfloat16m1_t vs2,
                                                   vfloat16m1_t vs1,
                                                   unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfredosum_vs_f16m2_f16m1_rm_m(vbool8_t vm,
                                                   vfloat16m2_t vs2,
                                                   vfloat16m1_t vs1,
                                                   unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfredosum_vs_f16m4_f16m1_rm_m(vbool4_t vm,
                                                   vfloat16m4_t vs2,
                                                   vfloat16m1_t vs1,
                                                   unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfredosum_vs_f16m8_f16m1_rm_m(vbool2_t vm,
                                                   vfloat16m8_t vs2,
                                                   vfloat16m1_t vs1,
                                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfredosum_vs_f32mf2_f32m1_rm_m(vbool64_t vm,
                                                    vfloat32mf2_t vs2,
                                                    vfloat32m1_t vs1,
                                                    unsigned int frm,
                                                    size_t vl);
vfloat32m1_t __riscv_vfredosum_vs_f32m1_f32m1_rm_m(vbool32_t vm,
                                                   vfloat32m1_t vs2,
                                                   vfloat32m1_t vs1,
                                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfredosum_vs_f32m2_f32m1_rm_m(vbool16_t vm,
                                                   vfloat32m2_t vs2,
                                                   vfloat32m1_t vs1,
                                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfredosum_vs_f32m4_f32m1_rm_m(vbool8_t vm,
                                                   vfloat32m4_t vs2,
                                                   vfloat32m1_t vs1,
                                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfredosum_vs_f32m8_f32m1_rm_m(vbool4_t vm,
                                                   vfloat32m8_t vs2,
                                                   vfloat32m1_t vs1,
                                                   unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfredosum_vs_f64m1_f64m1_rm_m(vbool64_t vm,
                                                   vfloat64m1_t vs2,
                                                   vfloat64m1_t vs1,
                                                   unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfredosum_vs_f64m2_f64m1_rm_m(vbool32_t vm,
                                                   vfloat64m2_t vs2,
                                                   vfloat64m1_t vs1,
                                                   unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfredosum_vs_f64m4_f64m1_rm_m(vbool16_t vm,
                                                   vfloat64m4_t vs2,
                                                   vfloat64m1_t vs1,
                                                   unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfredosum_vs_f64m8_f64m1_rm_m(vbool8_t vm,
                                                   vfloat64m8_t vs2,
                                                   vfloat64m1_t vs1,
                                                   unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfredusum_vs_f16mf4_f16m1_rm_m(vbool64_t vm,
                                                    vfloat16mf4_t vs2,
                                                    vfloat16m1_t vs1,
                                                    unsigned int frm,
                                                    size_t vl);
vfloat16m1_t __riscv_vfredusum_vs_f16mf2_f16m1_rm_m(vbool32_t vm,
                                                    vfloat16mf2_t vs2,
                                                    vfloat16m1_t vs1,
                                                    unsigned int frm,
                                                    size_t vl);
vfloat16m1_t __riscv_vfredusum_vs_f16m1_f16m1_rm_m(vbool16_t vm,
                                                   vfloat16m1_t vs2,
                                                   vfloat16m1_t vs1,
                                                   unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfredusum_vs_f16m2_f16m1_rm_m(vbool8_t vm,
                                                   vfloat16m2_t vs2,
                                                   vfloat16m1_t vs1,
                                                   unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfredusum_vs_f16m4_f16m1_rm_m(vbool4_t vm,
                                                   vfloat16m4_t vs2,
                                                   vfloat16m1_t vs1,
                                                   unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfredusum_vs_f16m8_f16m1_rm_m(vbool2_t vm,
                                                   vfloat16m8_t vs2,
                                                   vfloat16m1_t vs1,
                                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfredusum_vs_f32mf2_f32m1_rm_m(vbool64_t vm,
                                                    vfloat32mf2_t vs2,
                                                    vfloat32m1_t vs1,
                                                    unsigned int frm,
                                                    size_t vl);
vfloat32m1_t __riscv_vfredusum_vs_f32m1_f32m1_rm_m(vbool32_t vm,
                                                   vfloat32m1_t vs2,
                                                   vfloat32m1_t vs1,
                                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfredusum_vs_f32m2_f32m1_rm_m(vbool16_t vm,
                                                   vfloat32m2_t vs2,
                                                   vfloat32m1_t vs1,
                                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfredusum_vs_f32m4_f32m1_rm_m(vbool8_t vm,
                                                   vfloat32m4_t vs2,
                                                   vfloat32m1_t vs1,
                                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfredusum_vs_f32m8_f32m1_rm_m(vbool4_t vm,
                                                   vfloat32m8_t vs2,
                                                   vfloat32m1_t vs1,
                                                   unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfredusum_vs_f64m1_f64m1_rm_m(vbool64_t vm,
                                                   vfloat64m1_t vs2,
                                                   vfloat64m1_t vs1,
                                                   unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfredusum_vs_f64m2_f64m1_rm_m(vbool32_t vm,
                                                   vfloat64m2_t vs2,
                                                   vfloat64m1_t vs1,
                                                   unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfredusum_vs_f64m4_f64m1_rm_m(vbool16_t vm,
                                                   vfloat64m4_t vs2,
                                                   vfloat64m1_t vs1,
                                                   unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfredusum_vs_f64m8_f64m1_rm_m(vbool8_t vm,
                                                   vfloat64m8_t vs2,
                                                   vfloat64m1_t vs1,
                                                   unsigned int frm, size_t vl);

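A minimal usage sketch (not part of the listing above, and assuming a toolchain with the `v` extension enabled, e.g. `-march=rv64gcv`): the masked, rounding-mode variants use the explicit `frm` argument instead of the current `frm` CSR, add only the active elements of `vs2` to element 0 of `vs1`, and return the sum in element 0 of the result. The helper intrinsics used here (`__riscv_vsetvl_e32m1`, `__riscv_vle32_v_f32m1`, `__riscv_vmfgt_vf_f32m1_b32`, `__riscv_vfmv_v_f_f32m1`, `__riscv_vfmv_f_s_f32m1_f32`) and the `__RISCV_FRM_RNE` constant are taken from `<riscv_vector.h>`; the function name is hypothetical.

#include <riscv_vector.h>

// Sketch: masked, round-to-nearest-even sum of the strictly positive
// elements of src[0..n), strip-mined over the hardware vector length.
float sum_positive_f32(const float *src, size_t n) {
  // The running sum lives in element 0 of an f32m1 register;
  // the reduction only reads element 0 of vs1.
  vfloat32m1_t acc = __riscv_vfmv_v_f_f32m1(0.0f, 1);
  for (size_t i = 0; i < n;) {
    size_t vl = __riscv_vsetvl_e32m1(n - i);
    vfloat32m1_t v = __riscv_vle32_v_f32m1(src + i, vl);
    // Mask selects the active elements: those greater than zero.
    vbool32_t vm = __riscv_vmfgt_vf_f32m1_b32(v, 0.0f, vl);
    // acc[0] += sum of active elements of v, rounded to nearest-even.
    acc = __riscv_vfredusum_vs_f32m1_f32m1_rm_m(vm, v, acc,
                                                __RISCV_FRM_RNE, vl);
    i += vl;
  }
  return __riscv_vfmv_f_s_f32m1_f32(acc);
}
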
Vector Widening Floating-Point Reduction Intrinsics

vfloat32m1_t __riscv_vfwredosum_vs_f16mf4_f32m1(vfloat16mf4_t vs2,
                                                vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredosum_vs_f16mf2_f32m1(vfloat16mf2_t vs2,
                                                vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredosum_vs_f16m1_f32m1(vfloat16m1_t vs2,
                                               vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredosum_vs_f16m2_f32m1(vfloat16m2_t vs2,
                                               vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredosum_vs_f16m4_f32m1(vfloat16m4_t vs2,
                                               vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredosum_vs_f16m8_f32m1(vfloat16m8_t vs2,
                                               vfloat32m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwredosum_vs_f32mf2_f64m1(vfloat32mf2_t vs2,
                                                vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwredosum_vs_f32m1_f64m1(vfloat32m1_t vs2,
                                               vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwredosum_vs_f32m2_f64m1(vfloat32m2_t vs2,
                                               vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwredosum_vs_f32m4_f64m1(vfloat32m4_t vs2,
                                               vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwredosum_vs_f32m8_f64m1(vfloat32m8_t vs2,
                                               vfloat64m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredusum_vs_f16mf4_f32m1(vfloat16mf4_t vs2,
                                                vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredusum_vs_f16mf2_f32m1(vfloat16mf2_t vs2,
                                                vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredusum_vs_f16m1_f32m1(vfloat16m1_t vs2,
                                               vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredusum_vs_f16m2_f32m1(vfloat16m2_t vs2,
                                               vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredusum_vs_f16m4_f32m1(vfloat16m4_t vs2,
                                               vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredusum_vs_f16m8_f32m1(vfloat16m8_t vs2,
                                               vfloat32m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwredusum_vs_f32mf2_f64m1(vfloat32mf2_t vs2,
                                                vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwredusum_vs_f32m1_f64m1(vfloat32m1_t vs2,
                                               vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwredusum_vs_f32m2_f64m1(vfloat32m2_t vs2,
                                               vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwredusum_vs_f32m4_f64m1(vfloat32m4_t vs2,
                                               vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwredusum_vs_f32m8_f64m1(vfloat32m8_t vs2,
                                               vfloat64m1_t vs1, size_t vl);
// masked functions
vfloat32m1_t __riscv_vfwredosum_vs_f16mf4_f32m1_m(vbool64_t vm,
                                                  vfloat16mf4_t vs2,
                                                  vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredosum_vs_f16mf2_f32m1_m(vbool32_t vm,
                                                  vfloat16mf2_t vs2,
                                                  vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredosum_vs_f16m1_f32m1_m(vbool16_t vm, vfloat16m1_t vs2,
                                                 vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredosum_vs_f16m2_f32m1_m(vbool8_t vm, vfloat16m2_t vs2,
                                                 vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredosum_vs_f16m4_f32m1_m(vbool4_t vm, vfloat16m4_t vs2,
                                                 vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredosum_vs_f16m8_f32m1_m(vbool2_t vm, vfloat16m8_t vs2,
                                                 vfloat32m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwredosum_vs_f32mf2_f64m1_m(vbool64_t vm,
                                                  vfloat32mf2_t vs2,
                                                  vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwredosum_vs_f32m1_f64m1_m(vbool32_t vm, vfloat32m1_t vs2,
                                                 vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwredosum_vs_f32m2_f64m1_m(vbool16_t vm, vfloat32m2_t vs2,
                                                 vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwredosum_vs_f32m4_f64m1_m(vbool8_t vm, vfloat32m4_t vs2,
                                                 vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwredosum_vs_f32m8_f64m1_m(vbool4_t vm, vfloat32m8_t vs2,
                                                 vfloat64m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredusum_vs_f16mf4_f32m1_m(vbool64_t vm,
                                                  vfloat16mf4_t vs2,
                                                  vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredusum_vs_f16mf2_f32m1_m(vbool32_t vm,
                                                  vfloat16mf2_t vs2,
                                                  vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredusum_vs_f16m1_f32m1_m(vbool16_t vm, vfloat16m1_t vs2,
                                                 vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredusum_vs_f16m2_f32m1_m(vbool8_t vm, vfloat16m2_t vs2,
                                                 vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredusum_vs_f16m4_f32m1_m(vbool4_t vm, vfloat16m4_t vs2,
                                                 vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredusum_vs_f16m8_f32m1_m(vbool2_t vm, vfloat16m8_t vs2,
                                                 vfloat32m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwredusum_vs_f32mf2_f64m1_m(vbool64_t vm,
                                                  vfloat32mf2_t vs2,
                                                  vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwredusum_vs_f32m1_f64m1_m(vbool32_t vm, vfloat32m1_t vs2,
                                                 vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwredusum_vs_f32m2_f64m1_m(vbool16_t vm, vfloat32m2_t vs2,
                                                 vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwredusum_vs_f32m4_f64m1_m(vbool8_t vm, vfloat32m4_t vs2,
                                                 vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwredusum_vs_f32m8_f64m1_m(vbool4_t vm, vfloat32m8_t vs2,
                                                 vfloat64m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredosum_vs_f16mf4_f32m1_rm(vfloat16mf4_t vs2,
                                                   vfloat32m1_t vs1,
                                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwredosum_vs_f16mf2_f32m1_rm(vfloat16mf2_t vs2,
                                                   vfloat32m1_t vs1,
                                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwredosum_vs_f16m1_f32m1_rm(vfloat16m1_t vs2,
                                                  vfloat32m1_t vs1,
                                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwredosum_vs_f16m2_f32m1_rm(vfloat16m2_t vs2,
                                                  vfloat32m1_t vs1,
                                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwredosum_vs_f16m4_f32m1_rm(vfloat16m4_t vs2,
                                                  vfloat32m1_t vs1,
                                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwredosum_vs_f16m8_f32m1_rm(vfloat16m8_t vs2,
                                                  vfloat32m1_t vs1,
                                                  unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwredosum_vs_f32mf2_f64m1_rm(vfloat32mf2_t vs2,
                                                   vfloat64m1_t vs1,
                                                   unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwredosum_vs_f32m1_f64m1_rm(vfloat32m1_t vs2,
                                                  vfloat64m1_t vs1,
                                                  unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwredosum_vs_f32m2_f64m1_rm(vfloat32m2_t vs2,
                                                  vfloat64m1_t vs1,
                                                  unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwredosum_vs_f32m4_f64m1_rm(vfloat32m4_t vs2,
                                                  vfloat64m1_t vs1,
                                                  unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwredosum_vs_f32m8_f64m1_rm(vfloat32m8_t vs2,
                                                  vfloat64m1_t vs1,
                                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwredusum_vs_f16mf4_f32m1_rm(vfloat16mf4_t vs2,
                                                   vfloat32m1_t vs1,
                                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwredusum_vs_f16mf2_f32m1_rm(vfloat16mf2_t vs2,
                                                   vfloat32m1_t vs1,
                                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwredusum_vs_f16m1_f32m1_rm(vfloat16m1_t vs2,
                                                  vfloat32m1_t vs1,
                                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwredusum_vs_f16m2_f32m1_rm(vfloat16m2_t vs2,
                                                  vfloat32m1_t vs1,
                                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwredusum_vs_f16m4_f32m1_rm(vfloat16m4_t vs2,
                                                  vfloat32m1_t vs1,
                                                  unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwredusum_vs_f16m8_f32m1_rm(vfloat16m8_t vs2,
                                                  vfloat32m1_t vs1,
                                                  unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwredusum_vs_f32mf2_f64m1_rm(vfloat32mf2_t vs2,
                                                   vfloat64m1_t vs1,
                                                   unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwredusum_vs_f32m1_f64m1_rm(vfloat32m1_t vs2,
                                                  vfloat64m1_t vs1,
                                                  unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwredusum_vs_f32m2_f64m1_rm(vfloat32m2_t vs2,
                                                  vfloat64m1_t vs1,
                                                  unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwredusum_vs_f32m4_f64m1_rm(vfloat32m4_t vs2,
                                                  vfloat64m1_t vs1,
                                                  unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwredusum_vs_f32m8_f64m1_rm(vfloat32m8_t vs2,
                                                  vfloat64m1_t vs1,
                                                  unsigned int frm, size_t vl);
// masked functions
vfloat32m1_t __riscv_vfwredosum_vs_f16mf4_f32m1_rm_m(vbool64_t vm,
                                                     vfloat16mf4_t vs2,
                                                     vfloat32m1_t vs1,
                                                     unsigned int frm,
                                                     size_t vl);
vfloat32m1_t __riscv_vfwredosum_vs_f16mf2_f32m1_rm_m(vbool32_t vm,
                                                     vfloat16mf2_t vs2,
                                                     vfloat32m1_t vs1,
                                                     unsigned int frm,
                                                     size_t vl);
vfloat32m1_t __riscv_vfwredosum_vs_f16m1_f32m1_rm_m(vbool16_t vm,
                                                    vfloat16m1_t vs2,
                                                    vfloat32m1_t vs1,
                                                    unsigned int frm,
                                                    size_t vl);
vfloat32m1_t __riscv_vfwredosum_vs_f16m2_f32m1_rm_m(vbool8_t vm,
                                                    vfloat16m2_t vs2,
                                                    vfloat32m1_t vs1,
                                                    unsigned int frm,
                                                    size_t vl);
vfloat32m1_t __riscv_vfwredosum_vs_f16m4_f32m1_rm_m(vbool4_t vm,
                                                    vfloat16m4_t vs2,
                                                    vfloat32m1_t vs1,
                                                    unsigned int frm,
                                                    size_t vl);
vfloat32m1_t __riscv_vfwredosum_vs_f16m8_f32m1_rm_m(vbool2_t vm,
                                                    vfloat16m8_t vs2,
                                                    vfloat32m1_t vs1,
                                                    unsigned int frm,
                                                    size_t vl);
vfloat64m1_t __riscv_vfwredosum_vs_f32mf2_f64m1_rm_m(vbool64_t vm,
                                                     vfloat32mf2_t vs2,
                                                     vfloat64m1_t vs1,
                                                     unsigned int frm,
                                                     size_t vl);
vfloat64m1_t __riscv_vfwredosum_vs_f32m1_f64m1_rm_m(vbool32_t vm,
                                                    vfloat32m1_t vs2,
                                                    vfloat64m1_t vs1,
                                                    unsigned int frm,
                                                    size_t vl);
vfloat64m1_t __riscv_vfwredosum_vs_f32m2_f64m1_rm_m(vbool16_t vm,
                                                    vfloat32m2_t vs2,
                                                    vfloat64m1_t vs1,
                                                    unsigned int frm,
                                                    size_t vl);
vfloat64m1_t __riscv_vfwredosum_vs_f32m4_f64m1_rm_m(vbool8_t vm,
                                                    vfloat32m4_t vs2,
                                                    vfloat64m1_t vs1,
                                                    unsigned int frm,
                                                    size_t vl);
vfloat64m1_t __riscv_vfwredosum_vs_f32m8_f64m1_rm_m(vbool4_t vm,
                                                    vfloat32m8_t vs2,
                                                    vfloat64m1_t vs1,
                                                    unsigned int frm,
                                                    size_t vl);
vfloat32m1_t __riscv_vfwredusum_vs_f16mf4_f32m1_rm_m(vbool64_t vm,
                                                     vfloat16mf4_t vs2,
                                                     vfloat32m1_t vs1,
                                                     unsigned int frm,
                                                     size_t vl);
vfloat32m1_t __riscv_vfwredusum_vs_f16mf2_f32m1_rm_m(vbool32_t vm,
                                                     vfloat16mf2_t vs2,
                                                     vfloat32m1_t vs1,
                                                     unsigned int frm,
                                                     size_t vl);
vfloat32m1_t __riscv_vfwredusum_vs_f16m1_f32m1_rm_m(vbool16_t vm,
                                                    vfloat16m1_t vs2,
                                                    vfloat32m1_t vs1,
                                                    unsigned int frm,
                                                    size_t vl);
vfloat32m1_t __riscv_vfwredusum_vs_f16m2_f32m1_rm_m(vbool8_t vm,
                                                    vfloat16m2_t vs2,
                                                    vfloat32m1_t vs1,
                                                    unsigned int frm,
                                                    size_t vl);
vfloat32m1_t __riscv_vfwredusum_vs_f16m4_f32m1_rm_m(vbool4_t vm,
                                                    vfloat16m4_t vs2,
                                                    vfloat32m1_t vs1,
                                                    unsigned int frm,
                                                    size_t vl);
vfloat32m1_t __riscv_vfwredusum_vs_f16m8_f32m1_rm_m(vbool2_t vm,
                                                    vfloat16m8_t vs2,
                                                    vfloat32m1_t vs1,
                                                    unsigned int frm,
                                                    size_t vl);
vfloat64m1_t __riscv_vfwredusum_vs_f32mf2_f64m1_rm_m(vbool64_t vm,
                                                     vfloat32mf2_t vs2,
                                                     vfloat64m1_t vs1,
                                                     unsigned int frm,
                                                     size_t vl);
vfloat64m1_t __riscv_vfwredusum_vs_f32m1_f64m1_rm_m(vbool32_t vm,
                                                    vfloat32m1_t vs2,
                                                    vfloat64m1_t vs1,
                                                    unsigned int frm,
                                                    size_t vl);
vfloat64m1_t __riscv_vfwredusum_vs_f32m2_f64m1_rm_m(vbool16_t vm,
                                                    vfloat32m2_t vs2,
                                                    vfloat64m1_t vs1,
                                                    unsigned int frm,
                                                    size_t vl);
vfloat64m1_t __riscv_vfwredusum_vs_f32m4_f64m1_rm_m(vbool8_t vm,
                                                    vfloat32m4_t vs2,
                                                    vfloat64m1_t vs1,
                                                    unsigned int frm,
                                                    size_t vl);
vfloat64m1_t __riscv_vfwredusum_vs_f32m8_f64m1_rm_m(vbool4_t vm,
                                                    vfloat32m8_t vs2,
                                                    vfloat64m1_t vs1,
                                                    unsigned int frm,
                                                    size_t vl);