Skip to content

Latest commit

 

History

History
1958 lines (1949 loc) · 121 KB

05_vector_reduction_operations.adoc

File metadata and controls

1958 lines (1949 loc) · 121 KB

Vector Reduction Operations

Vector Single-Width Integer Reduction Intrinsics

// __riscv_vredsum_tu -- signed integer overloads.
// One prototype per vs2 type: int8 (mf8..m8), int16 (mf4..m8), int32 (mf2..m8)
// and int64 (m1..m8). vd, vs1 and the return value are always the m1 type of
// the same element width as vs2; vl is a size_t. The name is overloaded on the
// operand types.
// NOTE(review): "_tu" presumably selects the tail-undisturbed policy, with vd
// supplying the preserved elements -- confirm against the RVV intrinsics spec.
vint8m1_t __riscv_vredsum_tu(vint8m1_t vd, vint8mf8_t vs2, vint8m1_t vs1,
                             size_t vl);
vint8m1_t __riscv_vredsum_tu(vint8m1_t vd, vint8mf4_t vs2, vint8m1_t vs1,
                             size_t vl);
vint8m1_t __riscv_vredsum_tu(vint8m1_t vd, vint8mf2_t vs2, vint8m1_t vs1,
                             size_t vl);
vint8m1_t __riscv_vredsum_tu(vint8m1_t vd, vint8m1_t vs2, vint8m1_t vs1,
                             size_t vl);
vint8m1_t __riscv_vredsum_tu(vint8m1_t vd, vint8m2_t vs2, vint8m1_t vs1,
                             size_t vl);
vint8m1_t __riscv_vredsum_tu(vint8m1_t vd, vint8m4_t vs2, vint8m1_t vs1,
                             size_t vl);
vint8m1_t __riscv_vredsum_tu(vint8m1_t vd, vint8m8_t vs2, vint8m1_t vs1,
                             size_t vl);
vint16m1_t __riscv_vredsum_tu(vint16m1_t vd, vint16mf4_t vs2, vint16m1_t vs1,
                              size_t vl);
vint16m1_t __riscv_vredsum_tu(vint16m1_t vd, vint16mf2_t vs2, vint16m1_t vs1,
                              size_t vl);
vint16m1_t __riscv_vredsum_tu(vint16m1_t vd, vint16m1_t vs2, vint16m1_t vs1,
                              size_t vl);
vint16m1_t __riscv_vredsum_tu(vint16m1_t vd, vint16m2_t vs2, vint16m1_t vs1,
                              size_t vl);
vint16m1_t __riscv_vredsum_tu(vint16m1_t vd, vint16m4_t vs2, vint16m1_t vs1,
                              size_t vl);
vint16m1_t __riscv_vredsum_tu(vint16m1_t vd, vint16m8_t vs2, vint16m1_t vs1,
                              size_t vl);
vint32m1_t __riscv_vredsum_tu(vint32m1_t vd, vint32mf2_t vs2, vint32m1_t vs1,
                              size_t vl);
vint32m1_t __riscv_vredsum_tu(vint32m1_t vd, vint32m1_t vs2, vint32m1_t vs1,
                              size_t vl);
vint32m1_t __riscv_vredsum_tu(vint32m1_t vd, vint32m2_t vs2, vint32m1_t vs1,
                              size_t vl);
vint32m1_t __riscv_vredsum_tu(vint32m1_t vd, vint32m4_t vs2, vint32m1_t vs1,
                              size_t vl);
vint32m1_t __riscv_vredsum_tu(vint32m1_t vd, vint32m8_t vs2, vint32m1_t vs1,
                              size_t vl);
vint64m1_t __riscv_vredsum_tu(vint64m1_t vd, vint64m1_t vs2, vint64m1_t vs1,
                              size_t vl);
vint64m1_t __riscv_vredsum_tu(vint64m1_t vd, vint64m2_t vs2, vint64m1_t vs1,
                              size_t vl);
vint64m1_t __riscv_vredsum_tu(vint64m1_t vd, vint64m4_t vs2, vint64m1_t vs1,
                              size_t vl);
vint64m1_t __riscv_vredsum_tu(vint64m1_t vd, vint64m8_t vs2, vint64m1_t vs1,
                              size_t vl);
// __riscv_vredmax_tu -- signed integer overloads.
// One prototype per vs2 type: int8 (mf8..m8), int16 (mf4..m8), int32 (mf2..m8)
// and int64 (m1..m8). vd, vs1 and the return value are always the m1 type of
// the same element width as vs2; vl is a size_t. Only signed types appear
// under this name; the unsigned prototypes in this listing use
// __riscv_vredmaxu_tu.
vint8m1_t __riscv_vredmax_tu(vint8m1_t vd, vint8mf8_t vs2, vint8m1_t vs1,
                             size_t vl);
vint8m1_t __riscv_vredmax_tu(vint8m1_t vd, vint8mf4_t vs2, vint8m1_t vs1,
                             size_t vl);
vint8m1_t __riscv_vredmax_tu(vint8m1_t vd, vint8mf2_t vs2, vint8m1_t vs1,
                             size_t vl);
vint8m1_t __riscv_vredmax_tu(vint8m1_t vd, vint8m1_t vs2, vint8m1_t vs1,
                             size_t vl);
vint8m1_t __riscv_vredmax_tu(vint8m1_t vd, vint8m2_t vs2, vint8m1_t vs1,
                             size_t vl);
vint8m1_t __riscv_vredmax_tu(vint8m1_t vd, vint8m4_t vs2, vint8m1_t vs1,
                             size_t vl);
vint8m1_t __riscv_vredmax_tu(vint8m1_t vd, vint8m8_t vs2, vint8m1_t vs1,
                             size_t vl);
vint16m1_t __riscv_vredmax_tu(vint16m1_t vd, vint16mf4_t vs2, vint16m1_t vs1,
                              size_t vl);
vint16m1_t __riscv_vredmax_tu(vint16m1_t vd, vint16mf2_t vs2, vint16m1_t vs1,
                              size_t vl);
vint16m1_t __riscv_vredmax_tu(vint16m1_t vd, vint16m1_t vs2, vint16m1_t vs1,
                              size_t vl);
vint16m1_t __riscv_vredmax_tu(vint16m1_t vd, vint16m2_t vs2, vint16m1_t vs1,
                              size_t vl);
vint16m1_t __riscv_vredmax_tu(vint16m1_t vd, vint16m4_t vs2, vint16m1_t vs1,
                              size_t vl);
vint16m1_t __riscv_vredmax_tu(vint16m1_t vd, vint16m8_t vs2, vint16m1_t vs1,
                              size_t vl);
vint32m1_t __riscv_vredmax_tu(vint32m1_t vd, vint32mf2_t vs2, vint32m1_t vs1,
                              size_t vl);
vint32m1_t __riscv_vredmax_tu(vint32m1_t vd, vint32m1_t vs2, vint32m1_t vs1,
                              size_t vl);
vint32m1_t __riscv_vredmax_tu(vint32m1_t vd, vint32m2_t vs2, vint32m1_t vs1,
                              size_t vl);
vint32m1_t __riscv_vredmax_tu(vint32m1_t vd, vint32m4_t vs2, vint32m1_t vs1,
                              size_t vl);
vint32m1_t __riscv_vredmax_tu(vint32m1_t vd, vint32m8_t vs2, vint32m1_t vs1,
                              size_t vl);
vint64m1_t __riscv_vredmax_tu(vint64m1_t vd, vint64m1_t vs2, vint64m1_t vs1,
                              size_t vl);
vint64m1_t __riscv_vredmax_tu(vint64m1_t vd, vint64m2_t vs2, vint64m1_t vs1,
                              size_t vl);
vint64m1_t __riscv_vredmax_tu(vint64m1_t vd, vint64m4_t vs2, vint64m1_t vs1,
                              size_t vl);
vint64m1_t __riscv_vredmax_tu(vint64m1_t vd, vint64m8_t vs2, vint64m1_t vs1,
                              size_t vl);
// __riscv_vredmin_tu -- signed integer overloads.
// One prototype per vs2 type: int8 (mf8..m8), int16 (mf4..m8), int32 (mf2..m8)
// and int64 (m1..m8). vd, vs1 and the return value are always the m1 type of
// the same element width as vs2; vl is a size_t. Only signed types appear
// under this name; the unsigned prototypes in this listing use
// __riscv_vredminu_tu.
vint8m1_t __riscv_vredmin_tu(vint8m1_t vd, vint8mf8_t vs2, vint8m1_t vs1,
                             size_t vl);
vint8m1_t __riscv_vredmin_tu(vint8m1_t vd, vint8mf4_t vs2, vint8m1_t vs1,
                             size_t vl);
vint8m1_t __riscv_vredmin_tu(vint8m1_t vd, vint8mf2_t vs2, vint8m1_t vs1,
                             size_t vl);
vint8m1_t __riscv_vredmin_tu(vint8m1_t vd, vint8m1_t vs2, vint8m1_t vs1,
                             size_t vl);
vint8m1_t __riscv_vredmin_tu(vint8m1_t vd, vint8m2_t vs2, vint8m1_t vs1,
                             size_t vl);
vint8m1_t __riscv_vredmin_tu(vint8m1_t vd, vint8m4_t vs2, vint8m1_t vs1,
                             size_t vl);
vint8m1_t __riscv_vredmin_tu(vint8m1_t vd, vint8m8_t vs2, vint8m1_t vs1,
                             size_t vl);
vint16m1_t __riscv_vredmin_tu(vint16m1_t vd, vint16mf4_t vs2, vint16m1_t vs1,
                              size_t vl);
vint16m1_t __riscv_vredmin_tu(vint16m1_t vd, vint16mf2_t vs2, vint16m1_t vs1,
                              size_t vl);
vint16m1_t __riscv_vredmin_tu(vint16m1_t vd, vint16m1_t vs2, vint16m1_t vs1,
                              size_t vl);
vint16m1_t __riscv_vredmin_tu(vint16m1_t vd, vint16m2_t vs2, vint16m1_t vs1,
                              size_t vl);
vint16m1_t __riscv_vredmin_tu(vint16m1_t vd, vint16m4_t vs2, vint16m1_t vs1,
                              size_t vl);
vint16m1_t __riscv_vredmin_tu(vint16m1_t vd, vint16m8_t vs2, vint16m1_t vs1,
                              size_t vl);
vint32m1_t __riscv_vredmin_tu(vint32m1_t vd, vint32mf2_t vs2, vint32m1_t vs1,
                              size_t vl);
vint32m1_t __riscv_vredmin_tu(vint32m1_t vd, vint32m1_t vs2, vint32m1_t vs1,
                              size_t vl);
vint32m1_t __riscv_vredmin_tu(vint32m1_t vd, vint32m2_t vs2, vint32m1_t vs1,
                              size_t vl);
vint32m1_t __riscv_vredmin_tu(vint32m1_t vd, vint32m4_t vs2, vint32m1_t vs1,
                              size_t vl);
vint32m1_t __riscv_vredmin_tu(vint32m1_t vd, vint32m8_t vs2, vint32m1_t vs1,
                              size_t vl);
vint64m1_t __riscv_vredmin_tu(vint64m1_t vd, vint64m1_t vs2, vint64m1_t vs1,
                              size_t vl);
vint64m1_t __riscv_vredmin_tu(vint64m1_t vd, vint64m2_t vs2, vint64m1_t vs1,
                              size_t vl);
vint64m1_t __riscv_vredmin_tu(vint64m1_t vd, vint64m4_t vs2, vint64m1_t vs1,
                              size_t vl);
vint64m1_t __riscv_vredmin_tu(vint64m1_t vd, vint64m8_t vs2, vint64m1_t vs1,
                              size_t vl);
// __riscv_vredand_tu -- signed integer overloads.
// One prototype per vs2 type: int8 (mf8..m8), int16 (mf4..m8), int32 (mf2..m8)
// and int64 (m1..m8). vd, vs1 and the return value are always the m1 type of
// the same element width as vs2; vl is a size_t. The same name is also
// declared for the unsigned types in this listing (overloaded on operand type).
vint8m1_t __riscv_vredand_tu(vint8m1_t vd, vint8mf8_t vs2, vint8m1_t vs1,
                             size_t vl);
vint8m1_t __riscv_vredand_tu(vint8m1_t vd, vint8mf4_t vs2, vint8m1_t vs1,
                             size_t vl);
vint8m1_t __riscv_vredand_tu(vint8m1_t vd, vint8mf2_t vs2, vint8m1_t vs1,
                             size_t vl);
vint8m1_t __riscv_vredand_tu(vint8m1_t vd, vint8m1_t vs2, vint8m1_t vs1,
                             size_t vl);
vint8m1_t __riscv_vredand_tu(vint8m1_t vd, vint8m2_t vs2, vint8m1_t vs1,
                             size_t vl);
vint8m1_t __riscv_vredand_tu(vint8m1_t vd, vint8m4_t vs2, vint8m1_t vs1,
                             size_t vl);
vint8m1_t __riscv_vredand_tu(vint8m1_t vd, vint8m8_t vs2, vint8m1_t vs1,
                             size_t vl);
vint16m1_t __riscv_vredand_tu(vint16m1_t vd, vint16mf4_t vs2, vint16m1_t vs1,
                              size_t vl);
vint16m1_t __riscv_vredand_tu(vint16m1_t vd, vint16mf2_t vs2, vint16m1_t vs1,
                              size_t vl);
vint16m1_t __riscv_vredand_tu(vint16m1_t vd, vint16m1_t vs2, vint16m1_t vs1,
                              size_t vl);
vint16m1_t __riscv_vredand_tu(vint16m1_t vd, vint16m2_t vs2, vint16m1_t vs1,
                              size_t vl);
vint16m1_t __riscv_vredand_tu(vint16m1_t vd, vint16m4_t vs2, vint16m1_t vs1,
                              size_t vl);
vint16m1_t __riscv_vredand_tu(vint16m1_t vd, vint16m8_t vs2, vint16m1_t vs1,
                              size_t vl);
vint32m1_t __riscv_vredand_tu(vint32m1_t vd, vint32mf2_t vs2, vint32m1_t vs1,
                              size_t vl);
vint32m1_t __riscv_vredand_tu(vint32m1_t vd, vint32m1_t vs2, vint32m1_t vs1,
                              size_t vl);
vint32m1_t __riscv_vredand_tu(vint32m1_t vd, vint32m2_t vs2, vint32m1_t vs1,
                              size_t vl);
vint32m1_t __riscv_vredand_tu(vint32m1_t vd, vint32m4_t vs2, vint32m1_t vs1,
                              size_t vl);
vint32m1_t __riscv_vredand_tu(vint32m1_t vd, vint32m8_t vs2, vint32m1_t vs1,
                              size_t vl);
vint64m1_t __riscv_vredand_tu(vint64m1_t vd, vint64m1_t vs2, vint64m1_t vs1,
                              size_t vl);
vint64m1_t __riscv_vredand_tu(vint64m1_t vd, vint64m2_t vs2, vint64m1_t vs1,
                              size_t vl);
vint64m1_t __riscv_vredand_tu(vint64m1_t vd, vint64m4_t vs2, vint64m1_t vs1,
                              size_t vl);
vint64m1_t __riscv_vredand_tu(vint64m1_t vd, vint64m8_t vs2, vint64m1_t vs1,
                              size_t vl);
// __riscv_vredor_tu -- signed integer overloads.
// One prototype per vs2 type: int8 (mf8..m8), int16 (mf4..m8), int32 (mf2..m8)
// and int64 (m1..m8). vd, vs1 and the return value are always the m1 type of
// the same element width as vs2; vl is a size_t. The same name is also
// declared for the unsigned types in this listing (overloaded on operand type).
vint8m1_t __riscv_vredor_tu(vint8m1_t vd, vint8mf8_t vs2, vint8m1_t vs1,
                            size_t vl);
vint8m1_t __riscv_vredor_tu(vint8m1_t vd, vint8mf4_t vs2, vint8m1_t vs1,
                            size_t vl);
vint8m1_t __riscv_vredor_tu(vint8m1_t vd, vint8mf2_t vs2, vint8m1_t vs1,
                            size_t vl);
vint8m1_t __riscv_vredor_tu(vint8m1_t vd, vint8m1_t vs2, vint8m1_t vs1,
                            size_t vl);
vint8m1_t __riscv_vredor_tu(vint8m1_t vd, vint8m2_t vs2, vint8m1_t vs1,
                            size_t vl);
vint8m1_t __riscv_vredor_tu(vint8m1_t vd, vint8m4_t vs2, vint8m1_t vs1,
                            size_t vl);
vint8m1_t __riscv_vredor_tu(vint8m1_t vd, vint8m8_t vs2, vint8m1_t vs1,
                            size_t vl);
vint16m1_t __riscv_vredor_tu(vint16m1_t vd, vint16mf4_t vs2, vint16m1_t vs1,
                             size_t vl);
vint16m1_t __riscv_vredor_tu(vint16m1_t vd, vint16mf2_t vs2, vint16m1_t vs1,
                             size_t vl);
vint16m1_t __riscv_vredor_tu(vint16m1_t vd, vint16m1_t vs2, vint16m1_t vs1,
                             size_t vl);
vint16m1_t __riscv_vredor_tu(vint16m1_t vd, vint16m2_t vs2, vint16m1_t vs1,
                             size_t vl);
vint16m1_t __riscv_vredor_tu(vint16m1_t vd, vint16m4_t vs2, vint16m1_t vs1,
                             size_t vl);
vint16m1_t __riscv_vredor_tu(vint16m1_t vd, vint16m8_t vs2, vint16m1_t vs1,
                             size_t vl);
vint32m1_t __riscv_vredor_tu(vint32m1_t vd, vint32mf2_t vs2, vint32m1_t vs1,
                             size_t vl);
vint32m1_t __riscv_vredor_tu(vint32m1_t vd, vint32m1_t vs2, vint32m1_t vs1,
                             size_t vl);
vint32m1_t __riscv_vredor_tu(vint32m1_t vd, vint32m2_t vs2, vint32m1_t vs1,
                             size_t vl);
vint32m1_t __riscv_vredor_tu(vint32m1_t vd, vint32m4_t vs2, vint32m1_t vs1,
                             size_t vl);
vint32m1_t __riscv_vredor_tu(vint32m1_t vd, vint32m8_t vs2, vint32m1_t vs1,
                             size_t vl);
vint64m1_t __riscv_vredor_tu(vint64m1_t vd, vint64m1_t vs2, vint64m1_t vs1,
                             size_t vl);
vint64m1_t __riscv_vredor_tu(vint64m1_t vd, vint64m2_t vs2, vint64m1_t vs1,
                             size_t vl);
vint64m1_t __riscv_vredor_tu(vint64m1_t vd, vint64m4_t vs2, vint64m1_t vs1,
                             size_t vl);
vint64m1_t __riscv_vredor_tu(vint64m1_t vd, vint64m8_t vs2, vint64m1_t vs1,
                             size_t vl);
// __riscv_vredxor_tu -- signed integer overloads.
// One prototype per vs2 type: int8 (mf8..m8), int16 (mf4..m8), int32 (mf2..m8)
// and int64 (m1..m8). vd, vs1 and the return value are always the m1 type of
// the same element width as vs2; vl is a size_t. The same name is also
// declared for the unsigned types in this listing (overloaded on operand type).
vint8m1_t __riscv_vredxor_tu(vint8m1_t vd, vint8mf8_t vs2, vint8m1_t vs1,
                             size_t vl);
vint8m1_t __riscv_vredxor_tu(vint8m1_t vd, vint8mf4_t vs2, vint8m1_t vs1,
                             size_t vl);
vint8m1_t __riscv_vredxor_tu(vint8m1_t vd, vint8mf2_t vs2, vint8m1_t vs1,
                             size_t vl);
vint8m1_t __riscv_vredxor_tu(vint8m1_t vd, vint8m1_t vs2, vint8m1_t vs1,
                             size_t vl);
vint8m1_t __riscv_vredxor_tu(vint8m1_t vd, vint8m2_t vs2, vint8m1_t vs1,
                             size_t vl);
vint8m1_t __riscv_vredxor_tu(vint8m1_t vd, vint8m4_t vs2, vint8m1_t vs1,
                             size_t vl);
vint8m1_t __riscv_vredxor_tu(vint8m1_t vd, vint8m8_t vs2, vint8m1_t vs1,
                             size_t vl);
vint16m1_t __riscv_vredxor_tu(vint16m1_t vd, vint16mf4_t vs2, vint16m1_t vs1,
                              size_t vl);
vint16m1_t __riscv_vredxor_tu(vint16m1_t vd, vint16mf2_t vs2, vint16m1_t vs1,
                              size_t vl);
vint16m1_t __riscv_vredxor_tu(vint16m1_t vd, vint16m1_t vs2, vint16m1_t vs1,
                              size_t vl);
vint16m1_t __riscv_vredxor_tu(vint16m1_t vd, vint16m2_t vs2, vint16m1_t vs1,
                              size_t vl);
vint16m1_t __riscv_vredxor_tu(vint16m1_t vd, vint16m4_t vs2, vint16m1_t vs1,
                              size_t vl);
vint16m1_t __riscv_vredxor_tu(vint16m1_t vd, vint16m8_t vs2, vint16m1_t vs1,
                              size_t vl);
vint32m1_t __riscv_vredxor_tu(vint32m1_t vd, vint32mf2_t vs2, vint32m1_t vs1,
                              size_t vl);
vint32m1_t __riscv_vredxor_tu(vint32m1_t vd, vint32m1_t vs2, vint32m1_t vs1,
                              size_t vl);
vint32m1_t __riscv_vredxor_tu(vint32m1_t vd, vint32m2_t vs2, vint32m1_t vs1,
                              size_t vl);
vint32m1_t __riscv_vredxor_tu(vint32m1_t vd, vint32m4_t vs2, vint32m1_t vs1,
                              size_t vl);
vint32m1_t __riscv_vredxor_tu(vint32m1_t vd, vint32m8_t vs2, vint32m1_t vs1,
                              size_t vl);
vint64m1_t __riscv_vredxor_tu(vint64m1_t vd, vint64m1_t vs2, vint64m1_t vs1,
                              size_t vl);
vint64m1_t __riscv_vredxor_tu(vint64m1_t vd, vint64m2_t vs2, vint64m1_t vs1,
                              size_t vl);
vint64m1_t __riscv_vredxor_tu(vint64m1_t vd, vint64m4_t vs2, vint64m1_t vs1,
                              size_t vl);
vint64m1_t __riscv_vredxor_tu(vint64m1_t vd, vint64m8_t vs2, vint64m1_t vs1,
                              size_t vl);
// __riscv_vredsum_tu -- unsigned integer overloads.
// One prototype per vs2 type: uint8 (mf8..m8), uint16 (mf4..m8),
// uint32 (mf2..m8) and uint64 (m1..m8). vd, vs1 and the return value are
// always the m1 type of the same element width as vs2; vl is a size_t. The
// name is shared with the signed prototypes (overloaded on operand type).
vuint8m1_t __riscv_vredsum_tu(vuint8m1_t vd, vuint8mf8_t vs2, vuint8m1_t vs1,
                              size_t vl);
vuint8m1_t __riscv_vredsum_tu(vuint8m1_t vd, vuint8mf4_t vs2, vuint8m1_t vs1,
                              size_t vl);
vuint8m1_t __riscv_vredsum_tu(vuint8m1_t vd, vuint8mf2_t vs2, vuint8m1_t vs1,
                              size_t vl);
vuint8m1_t __riscv_vredsum_tu(vuint8m1_t vd, vuint8m1_t vs2, vuint8m1_t vs1,
                              size_t vl);
vuint8m1_t __riscv_vredsum_tu(vuint8m1_t vd, vuint8m2_t vs2, vuint8m1_t vs1,
                              size_t vl);
vuint8m1_t __riscv_vredsum_tu(vuint8m1_t vd, vuint8m4_t vs2, vuint8m1_t vs1,
                              size_t vl);
vuint8m1_t __riscv_vredsum_tu(vuint8m1_t vd, vuint8m8_t vs2, vuint8m1_t vs1,
                              size_t vl);
vuint16m1_t __riscv_vredsum_tu(vuint16m1_t vd, vuint16mf4_t vs2,
                               vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredsum_tu(vuint16m1_t vd, vuint16mf2_t vs2,
                               vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredsum_tu(vuint16m1_t vd, vuint16m1_t vs2, vuint16m1_t vs1,
                               size_t vl);
vuint16m1_t __riscv_vredsum_tu(vuint16m1_t vd, vuint16m2_t vs2, vuint16m1_t vs1,
                               size_t vl);
vuint16m1_t __riscv_vredsum_tu(vuint16m1_t vd, vuint16m4_t vs2, vuint16m1_t vs1,
                               size_t vl);
vuint16m1_t __riscv_vredsum_tu(vuint16m1_t vd, vuint16m8_t vs2, vuint16m1_t vs1,
                               size_t vl);
vuint32m1_t __riscv_vredsum_tu(vuint32m1_t vd, vuint32mf2_t vs2,
                               vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredsum_tu(vuint32m1_t vd, vuint32m1_t vs2, vuint32m1_t vs1,
                               size_t vl);
vuint32m1_t __riscv_vredsum_tu(vuint32m1_t vd, vuint32m2_t vs2, vuint32m1_t vs1,
                               size_t vl);
vuint32m1_t __riscv_vredsum_tu(vuint32m1_t vd, vuint32m4_t vs2, vuint32m1_t vs1,
                               size_t vl);
vuint32m1_t __riscv_vredsum_tu(vuint32m1_t vd, vuint32m8_t vs2, vuint32m1_t vs1,
                               size_t vl);
vuint64m1_t __riscv_vredsum_tu(vuint64m1_t vd, vuint64m1_t vs2, vuint64m1_t vs1,
                               size_t vl);
vuint64m1_t __riscv_vredsum_tu(vuint64m1_t vd, vuint64m2_t vs2, vuint64m1_t vs1,
                               size_t vl);
vuint64m1_t __riscv_vredsum_tu(vuint64m1_t vd, vuint64m4_t vs2, vuint64m1_t vs1,
                               size_t vl);
vuint64m1_t __riscv_vredsum_tu(vuint64m1_t vd, vuint64m8_t vs2, vuint64m1_t vs1,
                               size_t vl);
// __riscv_vredmaxu_tu -- unsigned integer overloads.
// One prototype per vs2 type: uint8 (mf8..m8), uint16 (mf4..m8),
// uint32 (mf2..m8) and uint64 (m1..m8). vd, vs1 and the return value are
// always the m1 type of the same element width as vs2; vl is a size_t. Unlike
// sum/and/or/xor, the unsigned prototypes carry a distinct name ("maxu")
// rather than sharing __riscv_vredmax_tu with the signed types.
vuint8m1_t __riscv_vredmaxu_tu(vuint8m1_t vd, vuint8mf8_t vs2, vuint8m1_t vs1,
                               size_t vl);
vuint8m1_t __riscv_vredmaxu_tu(vuint8m1_t vd, vuint8mf4_t vs2, vuint8m1_t vs1,
                               size_t vl);
vuint8m1_t __riscv_vredmaxu_tu(vuint8m1_t vd, vuint8mf2_t vs2, vuint8m1_t vs1,
                               size_t vl);
vuint8m1_t __riscv_vredmaxu_tu(vuint8m1_t vd, vuint8m1_t vs2, vuint8m1_t vs1,
                               size_t vl);
vuint8m1_t __riscv_vredmaxu_tu(vuint8m1_t vd, vuint8m2_t vs2, vuint8m1_t vs1,
                               size_t vl);
vuint8m1_t __riscv_vredmaxu_tu(vuint8m1_t vd, vuint8m4_t vs2, vuint8m1_t vs1,
                               size_t vl);
vuint8m1_t __riscv_vredmaxu_tu(vuint8m1_t vd, vuint8m8_t vs2, vuint8m1_t vs1,
                               size_t vl);
vuint16m1_t __riscv_vredmaxu_tu(vuint16m1_t vd, vuint16mf4_t vs2,
                                vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredmaxu_tu(vuint16m1_t vd, vuint16mf2_t vs2,
                                vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredmaxu_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredmaxu_tu(vuint16m1_t vd, vuint16m2_t vs2,
                                vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredmaxu_tu(vuint16m1_t vd, vuint16m4_t vs2,
                                vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredmaxu_tu(vuint16m1_t vd, vuint16m8_t vs2,
                                vuint16m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredmaxu_tu(vuint32m1_t vd, vuint32mf2_t vs2,
                                vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredmaxu_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredmaxu_tu(vuint32m1_t vd, vuint32m2_t vs2,
                                vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredmaxu_tu(vuint32m1_t vd, vuint32m4_t vs2,
                                vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredmaxu_tu(vuint32m1_t vd, vuint32m8_t vs2,
                                vuint32m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredmaxu_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredmaxu_tu(vuint64m1_t vd, vuint64m2_t vs2,
                                vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredmaxu_tu(vuint64m1_t vd, vuint64m4_t vs2,
                                vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredmaxu_tu(vuint64m1_t vd, vuint64m8_t vs2,
                                vuint64m1_t vs1, size_t vl);
// __riscv_vredminu_tu -- unsigned integer overloads.
// One prototype per vs2 type: uint8 (mf8..m8), uint16 (mf4..m8),
// uint32 (mf2..m8) and uint64 (m1..m8). vd, vs1 and the return value are
// always the m1 type of the same element width as vs2; vl is a size_t. Unlike
// sum/and/or/xor, the unsigned prototypes carry a distinct name ("minu")
// rather than sharing __riscv_vredmin_tu with the signed types.
vuint8m1_t __riscv_vredminu_tu(vuint8m1_t vd, vuint8mf8_t vs2, vuint8m1_t vs1,
                               size_t vl);
vuint8m1_t __riscv_vredminu_tu(vuint8m1_t vd, vuint8mf4_t vs2, vuint8m1_t vs1,
                               size_t vl);
vuint8m1_t __riscv_vredminu_tu(vuint8m1_t vd, vuint8mf2_t vs2, vuint8m1_t vs1,
                               size_t vl);
vuint8m1_t __riscv_vredminu_tu(vuint8m1_t vd, vuint8m1_t vs2, vuint8m1_t vs1,
                               size_t vl);
vuint8m1_t __riscv_vredminu_tu(vuint8m1_t vd, vuint8m2_t vs2, vuint8m1_t vs1,
                               size_t vl);
vuint8m1_t __riscv_vredminu_tu(vuint8m1_t vd, vuint8m4_t vs2, vuint8m1_t vs1,
                               size_t vl);
vuint8m1_t __riscv_vredminu_tu(vuint8m1_t vd, vuint8m8_t vs2, vuint8m1_t vs1,
                               size_t vl);
vuint16m1_t __riscv_vredminu_tu(vuint16m1_t vd, vuint16mf4_t vs2,
                                vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredminu_tu(vuint16m1_t vd, vuint16mf2_t vs2,
                                vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredminu_tu(vuint16m1_t vd, vuint16m1_t vs2,
                                vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredminu_tu(vuint16m1_t vd, vuint16m2_t vs2,
                                vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredminu_tu(vuint16m1_t vd, vuint16m4_t vs2,
                                vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredminu_tu(vuint16m1_t vd, vuint16m8_t vs2,
                                vuint16m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredminu_tu(vuint32m1_t vd, vuint32mf2_t vs2,
                                vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredminu_tu(vuint32m1_t vd, vuint32m1_t vs2,
                                vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredminu_tu(vuint32m1_t vd, vuint32m2_t vs2,
                                vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredminu_tu(vuint32m1_t vd, vuint32m4_t vs2,
                                vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredminu_tu(vuint32m1_t vd, vuint32m8_t vs2,
                                vuint32m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredminu_tu(vuint64m1_t vd, vuint64m1_t vs2,
                                vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredminu_tu(vuint64m1_t vd, vuint64m2_t vs2,
                                vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredminu_tu(vuint64m1_t vd, vuint64m4_t vs2,
                                vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredminu_tu(vuint64m1_t vd, vuint64m8_t vs2,
                                vuint64m1_t vs1, size_t vl);
// __riscv_vredand_tu -- unsigned integer overloads.
// One prototype per vs2 type: uint8 (mf8..m8), uint16 (mf4..m8),
// uint32 (mf2..m8) and uint64 (m1..m8). vd, vs1 and the return value are
// always the m1 type of the same element width as vs2; vl is a size_t. The
// name is shared with the signed prototypes (overloaded on operand type).
vuint8m1_t __riscv_vredand_tu(vuint8m1_t vd, vuint8mf8_t vs2, vuint8m1_t vs1,
                              size_t vl);
vuint8m1_t __riscv_vredand_tu(vuint8m1_t vd, vuint8mf4_t vs2, vuint8m1_t vs1,
                              size_t vl);
vuint8m1_t __riscv_vredand_tu(vuint8m1_t vd, vuint8mf2_t vs2, vuint8m1_t vs1,
                              size_t vl);
vuint8m1_t __riscv_vredand_tu(vuint8m1_t vd, vuint8m1_t vs2, vuint8m1_t vs1,
                              size_t vl);
vuint8m1_t __riscv_vredand_tu(vuint8m1_t vd, vuint8m2_t vs2, vuint8m1_t vs1,
                              size_t vl);
vuint8m1_t __riscv_vredand_tu(vuint8m1_t vd, vuint8m4_t vs2, vuint8m1_t vs1,
                              size_t vl);
vuint8m1_t __riscv_vredand_tu(vuint8m1_t vd, vuint8m8_t vs2, vuint8m1_t vs1,
                              size_t vl);
vuint16m1_t __riscv_vredand_tu(vuint16m1_t vd, vuint16mf4_t vs2,
                               vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredand_tu(vuint16m1_t vd, vuint16mf2_t vs2,
                               vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredand_tu(vuint16m1_t vd, vuint16m1_t vs2, vuint16m1_t vs1,
                               size_t vl);
vuint16m1_t __riscv_vredand_tu(vuint16m1_t vd, vuint16m2_t vs2, vuint16m1_t vs1,
                               size_t vl);
vuint16m1_t __riscv_vredand_tu(vuint16m1_t vd, vuint16m4_t vs2, vuint16m1_t vs1,
                               size_t vl);
vuint16m1_t __riscv_vredand_tu(vuint16m1_t vd, vuint16m8_t vs2, vuint16m1_t vs1,
                               size_t vl);
vuint32m1_t __riscv_vredand_tu(vuint32m1_t vd, vuint32mf2_t vs2,
                               vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredand_tu(vuint32m1_t vd, vuint32m1_t vs2, vuint32m1_t vs1,
                               size_t vl);
vuint32m1_t __riscv_vredand_tu(vuint32m1_t vd, vuint32m2_t vs2, vuint32m1_t vs1,
                               size_t vl);
vuint32m1_t __riscv_vredand_tu(vuint32m1_t vd, vuint32m4_t vs2, vuint32m1_t vs1,
                               size_t vl);
vuint32m1_t __riscv_vredand_tu(vuint32m1_t vd, vuint32m8_t vs2, vuint32m1_t vs1,
                               size_t vl);
vuint64m1_t __riscv_vredand_tu(vuint64m1_t vd, vuint64m1_t vs2, vuint64m1_t vs1,
                               size_t vl);
vuint64m1_t __riscv_vredand_tu(vuint64m1_t vd, vuint64m2_t vs2, vuint64m1_t vs1,
                               size_t vl);
vuint64m1_t __riscv_vredand_tu(vuint64m1_t vd, vuint64m4_t vs2, vuint64m1_t vs1,
                               size_t vl);
vuint64m1_t __riscv_vredand_tu(vuint64m1_t vd, vuint64m8_t vs2, vuint64m1_t vs1,
                               size_t vl);
// __riscv_vredor_tu -- unsigned integer overloads.
// One prototype per vs2 type: uint8 (mf8..m8), uint16 (mf4..m8),
// uint32 (mf2..m8) and uint64 (m1..m8). vd, vs1 and the return value are
// always the m1 type of the same element width as vs2; vl is a size_t. The
// name is shared with the signed prototypes (overloaded on operand type).
vuint8m1_t __riscv_vredor_tu(vuint8m1_t vd, vuint8mf8_t vs2, vuint8m1_t vs1,
                             size_t vl);
vuint8m1_t __riscv_vredor_tu(vuint8m1_t vd, vuint8mf4_t vs2, vuint8m1_t vs1,
                             size_t vl);
vuint8m1_t __riscv_vredor_tu(vuint8m1_t vd, vuint8mf2_t vs2, vuint8m1_t vs1,
                             size_t vl);
vuint8m1_t __riscv_vredor_tu(vuint8m1_t vd, vuint8m1_t vs2, vuint8m1_t vs1,
                             size_t vl);
vuint8m1_t __riscv_vredor_tu(vuint8m1_t vd, vuint8m2_t vs2, vuint8m1_t vs1,
                             size_t vl);
vuint8m1_t __riscv_vredor_tu(vuint8m1_t vd, vuint8m4_t vs2, vuint8m1_t vs1,
                             size_t vl);
vuint8m1_t __riscv_vredor_tu(vuint8m1_t vd, vuint8m8_t vs2, vuint8m1_t vs1,
                             size_t vl);
vuint16m1_t __riscv_vredor_tu(vuint16m1_t vd, vuint16mf4_t vs2, vuint16m1_t vs1,
                              size_t vl);
vuint16m1_t __riscv_vredor_tu(vuint16m1_t vd, vuint16mf2_t vs2, vuint16m1_t vs1,
                              size_t vl);
vuint16m1_t __riscv_vredor_tu(vuint16m1_t vd, vuint16m1_t vs2, vuint16m1_t vs1,
                              size_t vl);
vuint16m1_t __riscv_vredor_tu(vuint16m1_t vd, vuint16m2_t vs2, vuint16m1_t vs1,
                              size_t vl);
vuint16m1_t __riscv_vredor_tu(vuint16m1_t vd, vuint16m4_t vs2, vuint16m1_t vs1,
                              size_t vl);
vuint16m1_t __riscv_vredor_tu(vuint16m1_t vd, vuint16m8_t vs2, vuint16m1_t vs1,
                              size_t vl);
vuint32m1_t __riscv_vredor_tu(vuint32m1_t vd, vuint32mf2_t vs2, vuint32m1_t vs1,
                              size_t vl);
vuint32m1_t __riscv_vredor_tu(vuint32m1_t vd, vuint32m1_t vs2, vuint32m1_t vs1,
                              size_t vl);
vuint32m1_t __riscv_vredor_tu(vuint32m1_t vd, vuint32m2_t vs2, vuint32m1_t vs1,
                              size_t vl);
vuint32m1_t __riscv_vredor_tu(vuint32m1_t vd, vuint32m4_t vs2, vuint32m1_t vs1,
                              size_t vl);
vuint32m1_t __riscv_vredor_tu(vuint32m1_t vd, vuint32m8_t vs2, vuint32m1_t vs1,
                              size_t vl);
vuint64m1_t __riscv_vredor_tu(vuint64m1_t vd, vuint64m1_t vs2, vuint64m1_t vs1,
                              size_t vl);
vuint64m1_t __riscv_vredor_tu(vuint64m1_t vd, vuint64m2_t vs2, vuint64m1_t vs1,
                              size_t vl);
vuint64m1_t __riscv_vredor_tu(vuint64m1_t vd, vuint64m4_t vs2, vuint64m1_t vs1,
                              size_t vl);
vuint64m1_t __riscv_vredor_tu(vuint64m1_t vd, vuint64m8_t vs2, vuint64m1_t vs1,
                              size_t vl);
// __riscv_vredxor_tu -- unsigned integer overloads.
// One prototype per vs2 type: uint8 (mf8..m8), uint16 (mf4..m8),
// uint32 (mf2..m8) and uint64 (m1..m8). vd, vs1 and the return value are
// always the m1 type of the same element width as vs2; vl is a size_t. The
// name is shared with the signed prototypes (overloaded on operand type).
vuint8m1_t __riscv_vredxor_tu(vuint8m1_t vd, vuint8mf8_t vs2, vuint8m1_t vs1,
                              size_t vl);
vuint8m1_t __riscv_vredxor_tu(vuint8m1_t vd, vuint8mf4_t vs2, vuint8m1_t vs1,
                              size_t vl);
vuint8m1_t __riscv_vredxor_tu(vuint8m1_t vd, vuint8mf2_t vs2, vuint8m1_t vs1,
                              size_t vl);
vuint8m1_t __riscv_vredxor_tu(vuint8m1_t vd, vuint8m1_t vs2, vuint8m1_t vs1,
                              size_t vl);
vuint8m1_t __riscv_vredxor_tu(vuint8m1_t vd, vuint8m2_t vs2, vuint8m1_t vs1,
                              size_t vl);
vuint8m1_t __riscv_vredxor_tu(vuint8m1_t vd, vuint8m4_t vs2, vuint8m1_t vs1,
                              size_t vl);
vuint8m1_t __riscv_vredxor_tu(vuint8m1_t vd, vuint8m8_t vs2, vuint8m1_t vs1,
                              size_t vl);
vuint16m1_t __riscv_vredxor_tu(vuint16m1_t vd, vuint16mf4_t vs2,
                               vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredxor_tu(vuint16m1_t vd, vuint16mf2_t vs2,
                               vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredxor_tu(vuint16m1_t vd, vuint16m1_t vs2, vuint16m1_t vs1,
                               size_t vl);
vuint16m1_t __riscv_vredxor_tu(vuint16m1_t vd, vuint16m2_t vs2, vuint16m1_t vs1,
                               size_t vl);
vuint16m1_t __riscv_vredxor_tu(vuint16m1_t vd, vuint16m4_t vs2, vuint16m1_t vs1,
                               size_t vl);
vuint16m1_t __riscv_vredxor_tu(vuint16m1_t vd, vuint16m8_t vs2, vuint16m1_t vs1,
                               size_t vl);
vuint32m1_t __riscv_vredxor_tu(vuint32m1_t vd, vuint32mf2_t vs2,
                               vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredxor_tu(vuint32m1_t vd, vuint32m1_t vs2, vuint32m1_t vs1,
                               size_t vl);
vuint32m1_t __riscv_vredxor_tu(vuint32m1_t vd, vuint32m2_t vs2, vuint32m1_t vs1,
                               size_t vl);
vuint32m1_t __riscv_vredxor_tu(vuint32m1_t vd, vuint32m4_t vs2, vuint32m1_t vs1,
                               size_t vl);
vuint32m1_t __riscv_vredxor_tu(vuint32m1_t vd, vuint32m8_t vs2, vuint32m1_t vs1,
                               size_t vl);
vuint64m1_t __riscv_vredxor_tu(vuint64m1_t vd, vuint64m1_t vs2, vuint64m1_t vs1,
                               size_t vl);
vuint64m1_t __riscv_vredxor_tu(vuint64m1_t vd, vuint64m2_t vs2, vuint64m1_t vs1,
                               size_t vl);
vuint64m1_t __riscv_vredxor_tu(vuint64m1_t vd, vuint64m4_t vs2, vuint64m1_t vs1,
                               size_t vl);
vuint64m1_t __riscv_vredxor_tu(vuint64m1_t vd, vuint64m8_t vs2, vuint64m1_t vs1,
                               size_t vl);
// masked functions
// Signed overloads of __riscv_vredsum_tum(vm, vd, vs2, vs1, vl).
// Within each vintN family the return type, vd and vs1 are the same m1 type;
// only vs2 (and with it the vbool type of vm) changes between overloads.
// NOTE(review): the reduction and `_tum` policy semantics are not spelled out
// in this listing; confirm against the RISC-V vector specification.
// vint8: vs2 vint8mf8_t..vint8m8_t, vm vbool64_t..vbool1_t
vint8m1_t __riscv_vredsum_tum(vbool64_t vm, vint8m1_t vd, vint8mf8_t vs2,
                              vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredsum_tum(vbool32_t vm, vint8m1_t vd, vint8mf4_t vs2,
                              vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredsum_tum(vbool16_t vm, vint8m1_t vd, vint8mf2_t vs2,
                              vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredsum_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                              vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredsum_tum(vbool4_t vm, vint8m1_t vd, vint8m2_t vs2,
                              vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredsum_tum(vbool2_t vm, vint8m1_t vd, vint8m4_t vs2,
                              vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredsum_tum(vbool1_t vm, vint8m1_t vd, vint8m8_t vs2,
                              vint8m1_t vs1, size_t vl);
// vint16: vs2 vint16mf4_t..vint16m8_t, vm vbool64_t..vbool2_t
vint16m1_t __riscv_vredsum_tum(vbool64_t vm, vint16m1_t vd, vint16mf4_t vs2,
                               vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredsum_tum(vbool32_t vm, vint16m1_t vd, vint16mf2_t vs2,
                               vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredsum_tum(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                               vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredsum_tum(vbool8_t vm, vint16m1_t vd, vint16m2_t vs2,
                               vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredsum_tum(vbool4_t vm, vint16m1_t vd, vint16m4_t vs2,
                               vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredsum_tum(vbool2_t vm, vint16m1_t vd, vint16m8_t vs2,
                               vint16m1_t vs1, size_t vl);
// vint32: vs2 vint32mf2_t..vint32m8_t, vm vbool64_t..vbool4_t
vint32m1_t __riscv_vredsum_tum(vbool64_t vm, vint32m1_t vd, vint32mf2_t vs2,
                               vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredsum_tum(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                               vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredsum_tum(vbool16_t vm, vint32m1_t vd, vint32m2_t vs2,
                               vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredsum_tum(vbool8_t vm, vint32m1_t vd, vint32m4_t vs2,
                               vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredsum_tum(vbool4_t vm, vint32m1_t vd, vint32m8_t vs2,
                               vint32m1_t vs1, size_t vl);
// vint64: vs2 vint64m1_t..vint64m8_t, vm vbool64_t..vbool8_t
vint64m1_t __riscv_vredsum_tum(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                               vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredsum_tum(vbool32_t vm, vint64m1_t vd, vint64m2_t vs2,
                               vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredsum_tum(vbool16_t vm, vint64m1_t vd, vint64m4_t vs2,
                               vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredsum_tum(vbool8_t vm, vint64m1_t vd, vint64m8_t vs2,
                               vint64m1_t vs1, size_t vl);
// Signed overloads of __riscv_vredmax_tum(vm, vd, vs2, vs1, vl).
// Within each vintN family the return type, vd and vs1 are the same m1 type;
// only vs2 (and with it the vbool type of vm) changes between overloads.
// NOTE(review): the reduction and `_tum` policy semantics are not spelled out
// in this listing; confirm against the RISC-V vector specification.
// vint8: vs2 vint8mf8_t..vint8m8_t, vm vbool64_t..vbool1_t
vint8m1_t __riscv_vredmax_tum(vbool64_t vm, vint8m1_t vd, vint8mf8_t vs2,
                              vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredmax_tum(vbool32_t vm, vint8m1_t vd, vint8mf4_t vs2,
                              vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredmax_tum(vbool16_t vm, vint8m1_t vd, vint8mf2_t vs2,
                              vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredmax_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                              vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredmax_tum(vbool4_t vm, vint8m1_t vd, vint8m2_t vs2,
                              vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredmax_tum(vbool2_t vm, vint8m1_t vd, vint8m4_t vs2,
                              vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredmax_tum(vbool1_t vm, vint8m1_t vd, vint8m8_t vs2,
                              vint8m1_t vs1, size_t vl);
// vint16: vs2 vint16mf4_t..vint16m8_t, vm vbool64_t..vbool2_t
vint16m1_t __riscv_vredmax_tum(vbool64_t vm, vint16m1_t vd, vint16mf4_t vs2,
                               vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredmax_tum(vbool32_t vm, vint16m1_t vd, vint16mf2_t vs2,
                               vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredmax_tum(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                               vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredmax_tum(vbool8_t vm, vint16m1_t vd, vint16m2_t vs2,
                               vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredmax_tum(vbool4_t vm, vint16m1_t vd, vint16m4_t vs2,
                               vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredmax_tum(vbool2_t vm, vint16m1_t vd, vint16m8_t vs2,
                               vint16m1_t vs1, size_t vl);
// vint32: vs2 vint32mf2_t..vint32m8_t, vm vbool64_t..vbool4_t
vint32m1_t __riscv_vredmax_tum(vbool64_t vm, vint32m1_t vd, vint32mf2_t vs2,
                               vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredmax_tum(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                               vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredmax_tum(vbool16_t vm, vint32m1_t vd, vint32m2_t vs2,
                               vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredmax_tum(vbool8_t vm, vint32m1_t vd, vint32m4_t vs2,
                               vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredmax_tum(vbool4_t vm, vint32m1_t vd, vint32m8_t vs2,
                               vint32m1_t vs1, size_t vl);
// vint64: vs2 vint64m1_t..vint64m8_t, vm vbool64_t..vbool8_t
vint64m1_t __riscv_vredmax_tum(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                               vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredmax_tum(vbool32_t vm, vint64m1_t vd, vint64m2_t vs2,
                               vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredmax_tum(vbool16_t vm, vint64m1_t vd, vint64m4_t vs2,
                               vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredmax_tum(vbool8_t vm, vint64m1_t vd, vint64m8_t vs2,
                               vint64m1_t vs1, size_t vl);
// Signed overloads of __riscv_vredmin_tum(vm, vd, vs2, vs1, vl).
// Within each vintN family the return type, vd and vs1 are the same m1 type;
// only vs2 (and with it the vbool type of vm) changes between overloads.
// NOTE(review): the reduction and `_tum` policy semantics are not spelled out
// in this listing; confirm against the RISC-V vector specification.
// vint8: vs2 vint8mf8_t..vint8m8_t, vm vbool64_t..vbool1_t
vint8m1_t __riscv_vredmin_tum(vbool64_t vm, vint8m1_t vd, vint8mf8_t vs2,
                              vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredmin_tum(vbool32_t vm, vint8m1_t vd, vint8mf4_t vs2,
                              vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredmin_tum(vbool16_t vm, vint8m1_t vd, vint8mf2_t vs2,
                              vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredmin_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                              vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredmin_tum(vbool4_t vm, vint8m1_t vd, vint8m2_t vs2,
                              vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredmin_tum(vbool2_t vm, vint8m1_t vd, vint8m4_t vs2,
                              vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredmin_tum(vbool1_t vm, vint8m1_t vd, vint8m8_t vs2,
                              vint8m1_t vs1, size_t vl);
// vint16: vs2 vint16mf4_t..vint16m8_t, vm vbool64_t..vbool2_t
vint16m1_t __riscv_vredmin_tum(vbool64_t vm, vint16m1_t vd, vint16mf4_t vs2,
                               vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredmin_tum(vbool32_t vm, vint16m1_t vd, vint16mf2_t vs2,
                               vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredmin_tum(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                               vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredmin_tum(vbool8_t vm, vint16m1_t vd, vint16m2_t vs2,
                               vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredmin_tum(vbool4_t vm, vint16m1_t vd, vint16m4_t vs2,
                               vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredmin_tum(vbool2_t vm, vint16m1_t vd, vint16m8_t vs2,
                               vint16m1_t vs1, size_t vl);
// vint32: vs2 vint32mf2_t..vint32m8_t, vm vbool64_t..vbool4_t
vint32m1_t __riscv_vredmin_tum(vbool64_t vm, vint32m1_t vd, vint32mf2_t vs2,
                               vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredmin_tum(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                               vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredmin_tum(vbool16_t vm, vint32m1_t vd, vint32m2_t vs2,
                               vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredmin_tum(vbool8_t vm, vint32m1_t vd, vint32m4_t vs2,
                               vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredmin_tum(vbool4_t vm, vint32m1_t vd, vint32m8_t vs2,
                               vint32m1_t vs1, size_t vl);
// vint64: vs2 vint64m1_t..vint64m8_t, vm vbool64_t..vbool8_t
vint64m1_t __riscv_vredmin_tum(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                               vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredmin_tum(vbool32_t vm, vint64m1_t vd, vint64m2_t vs2,
                               vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredmin_tum(vbool16_t vm, vint64m1_t vd, vint64m4_t vs2,
                               vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredmin_tum(vbool8_t vm, vint64m1_t vd, vint64m8_t vs2,
                               vint64m1_t vs1, size_t vl);
// Signed overloads of __riscv_vredand_tum(vm, vd, vs2, vs1, vl).
// Within each vintN family the return type, vd and vs1 are the same m1 type;
// only vs2 (and with it the vbool type of vm) changes between overloads.
// NOTE(review): the reduction and `_tum` policy semantics are not spelled out
// in this listing; confirm against the RISC-V vector specification.
// vint8: vs2 vint8mf8_t..vint8m8_t, vm vbool64_t..vbool1_t
vint8m1_t __riscv_vredand_tum(vbool64_t vm, vint8m1_t vd, vint8mf8_t vs2,
                              vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredand_tum(vbool32_t vm, vint8m1_t vd, vint8mf4_t vs2,
                              vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredand_tum(vbool16_t vm, vint8m1_t vd, vint8mf2_t vs2,
                              vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredand_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                              vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredand_tum(vbool4_t vm, vint8m1_t vd, vint8m2_t vs2,
                              vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredand_tum(vbool2_t vm, vint8m1_t vd, vint8m4_t vs2,
                              vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredand_tum(vbool1_t vm, vint8m1_t vd, vint8m8_t vs2,
                              vint8m1_t vs1, size_t vl);
// vint16: vs2 vint16mf4_t..vint16m8_t, vm vbool64_t..vbool2_t
vint16m1_t __riscv_vredand_tum(vbool64_t vm, vint16m1_t vd, vint16mf4_t vs2,
                               vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredand_tum(vbool32_t vm, vint16m1_t vd, vint16mf2_t vs2,
                               vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredand_tum(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                               vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredand_tum(vbool8_t vm, vint16m1_t vd, vint16m2_t vs2,
                               vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredand_tum(vbool4_t vm, vint16m1_t vd, vint16m4_t vs2,
                               vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredand_tum(vbool2_t vm, vint16m1_t vd, vint16m8_t vs2,
                               vint16m1_t vs1, size_t vl);
// vint32: vs2 vint32mf2_t..vint32m8_t, vm vbool64_t..vbool4_t
vint32m1_t __riscv_vredand_tum(vbool64_t vm, vint32m1_t vd, vint32mf2_t vs2,
                               vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredand_tum(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                               vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredand_tum(vbool16_t vm, vint32m1_t vd, vint32m2_t vs2,
                               vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredand_tum(vbool8_t vm, vint32m1_t vd, vint32m4_t vs2,
                               vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredand_tum(vbool4_t vm, vint32m1_t vd, vint32m8_t vs2,
                               vint32m1_t vs1, size_t vl);
// vint64: vs2 vint64m1_t..vint64m8_t, vm vbool64_t..vbool8_t
vint64m1_t __riscv_vredand_tum(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                               vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredand_tum(vbool32_t vm, vint64m1_t vd, vint64m2_t vs2,
                               vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredand_tum(vbool16_t vm, vint64m1_t vd, vint64m4_t vs2,
                               vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredand_tum(vbool8_t vm, vint64m1_t vd, vint64m8_t vs2,
                               vint64m1_t vs1, size_t vl);
// Signed overloads of __riscv_vredor_tum(vm, vd, vs2, vs1, vl).
// Within each vintN family the return type, vd and vs1 are the same m1 type;
// only vs2 (and with it the vbool type of vm) changes between overloads.
// NOTE(review): the reduction and `_tum` policy semantics are not spelled out
// in this listing; confirm against the RISC-V vector specification.
// vint8: vs2 vint8mf8_t..vint8m8_t, vm vbool64_t..vbool1_t
vint8m1_t __riscv_vredor_tum(vbool64_t vm, vint8m1_t vd, vint8mf8_t vs2,
                             vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredor_tum(vbool32_t vm, vint8m1_t vd, vint8mf4_t vs2,
                             vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredor_tum(vbool16_t vm, vint8m1_t vd, vint8mf2_t vs2,
                             vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredor_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                             vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredor_tum(vbool4_t vm, vint8m1_t vd, vint8m2_t vs2,
                             vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredor_tum(vbool2_t vm, vint8m1_t vd, vint8m4_t vs2,
                             vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredor_tum(vbool1_t vm, vint8m1_t vd, vint8m8_t vs2,
                             vint8m1_t vs1, size_t vl);
// vint16: vs2 vint16mf4_t..vint16m8_t, vm vbool64_t..vbool2_t
vint16m1_t __riscv_vredor_tum(vbool64_t vm, vint16m1_t vd, vint16mf4_t vs2,
                              vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredor_tum(vbool32_t vm, vint16m1_t vd, vint16mf2_t vs2,
                              vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredor_tum(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                              vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredor_tum(vbool8_t vm, vint16m1_t vd, vint16m2_t vs2,
                              vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredor_tum(vbool4_t vm, vint16m1_t vd, vint16m4_t vs2,
                              vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredor_tum(vbool2_t vm, vint16m1_t vd, vint16m8_t vs2,
                              vint16m1_t vs1, size_t vl);
// vint32: vs2 vint32mf2_t..vint32m8_t, vm vbool64_t..vbool4_t
vint32m1_t __riscv_vredor_tum(vbool64_t vm, vint32m1_t vd, vint32mf2_t vs2,
                              vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredor_tum(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                              vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredor_tum(vbool16_t vm, vint32m1_t vd, vint32m2_t vs2,
                              vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredor_tum(vbool8_t vm, vint32m1_t vd, vint32m4_t vs2,
                              vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredor_tum(vbool4_t vm, vint32m1_t vd, vint32m8_t vs2,
                              vint32m1_t vs1, size_t vl);
// vint64: vs2 vint64m1_t..vint64m8_t, vm vbool64_t..vbool8_t
vint64m1_t __riscv_vredor_tum(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                              vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredor_tum(vbool32_t vm, vint64m1_t vd, vint64m2_t vs2,
                              vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredor_tum(vbool16_t vm, vint64m1_t vd, vint64m4_t vs2,
                              vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredor_tum(vbool8_t vm, vint64m1_t vd, vint64m8_t vs2,
                              vint64m1_t vs1, size_t vl);
// Signed overloads of __riscv_vredxor_tum(vm, vd, vs2, vs1, vl).
// Within each vintN family the return type, vd and vs1 are the same m1 type;
// only vs2 (and with it the vbool type of vm) changes between overloads.
// NOTE(review): the reduction and `_tum` policy semantics are not spelled out
// in this listing; confirm against the RISC-V vector specification.
// vint8: vs2 vint8mf8_t..vint8m8_t, vm vbool64_t..vbool1_t
vint8m1_t __riscv_vredxor_tum(vbool64_t vm, vint8m1_t vd, vint8mf8_t vs2,
                              vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredxor_tum(vbool32_t vm, vint8m1_t vd, vint8mf4_t vs2,
                              vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredxor_tum(vbool16_t vm, vint8m1_t vd, vint8mf2_t vs2,
                              vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredxor_tum(vbool8_t vm, vint8m1_t vd, vint8m1_t vs2,
                              vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredxor_tum(vbool4_t vm, vint8m1_t vd, vint8m2_t vs2,
                              vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredxor_tum(vbool2_t vm, vint8m1_t vd, vint8m4_t vs2,
                              vint8m1_t vs1, size_t vl);
vint8m1_t __riscv_vredxor_tum(vbool1_t vm, vint8m1_t vd, vint8m8_t vs2,
                              vint8m1_t vs1, size_t vl);
// vint16: vs2 vint16mf4_t..vint16m8_t, vm vbool64_t..vbool2_t
vint16m1_t __riscv_vredxor_tum(vbool64_t vm, vint16m1_t vd, vint16mf4_t vs2,
                               vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredxor_tum(vbool32_t vm, vint16m1_t vd, vint16mf2_t vs2,
                               vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredxor_tum(vbool16_t vm, vint16m1_t vd, vint16m1_t vs2,
                               vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredxor_tum(vbool8_t vm, vint16m1_t vd, vint16m2_t vs2,
                               vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredxor_tum(vbool4_t vm, vint16m1_t vd, vint16m4_t vs2,
                               vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vredxor_tum(vbool2_t vm, vint16m1_t vd, vint16m8_t vs2,
                               vint16m1_t vs1, size_t vl);
// vint32: vs2 vint32mf2_t..vint32m8_t, vm vbool64_t..vbool4_t
vint32m1_t __riscv_vredxor_tum(vbool64_t vm, vint32m1_t vd, vint32mf2_t vs2,
                               vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredxor_tum(vbool32_t vm, vint32m1_t vd, vint32m1_t vs2,
                               vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredxor_tum(vbool16_t vm, vint32m1_t vd, vint32m2_t vs2,
                               vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredxor_tum(vbool8_t vm, vint32m1_t vd, vint32m4_t vs2,
                               vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vredxor_tum(vbool4_t vm, vint32m1_t vd, vint32m8_t vs2,
                               vint32m1_t vs1, size_t vl);
// vint64: vs2 vint64m1_t..vint64m8_t, vm vbool64_t..vbool8_t
vint64m1_t __riscv_vredxor_tum(vbool64_t vm, vint64m1_t vd, vint64m1_t vs2,
                               vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredxor_tum(vbool32_t vm, vint64m1_t vd, vint64m2_t vs2,
                               vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredxor_tum(vbool16_t vm, vint64m1_t vd, vint64m4_t vs2,
                               vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vredxor_tum(vbool8_t vm, vint64m1_t vd, vint64m8_t vs2,
                               vint64m1_t vs1, size_t vl);
// Unsigned overloads of __riscv_vredsum_tum(vm, vd, vs2, vs1, vl).
// Within each vuintN family the return type, vd and vs1 are the same m1 type;
// only vs2 (and with it the vbool type of vm) changes between overloads.
// NOTE(review): the reduction and `_tum` policy semantics are not spelled out
// in this listing; confirm against the RISC-V vector specification.
// vuint8: vs2 vuint8mf8_t..vuint8m8_t, vm vbool64_t..vbool1_t
vuint8m1_t __riscv_vredsum_tum(vbool64_t vm, vuint8m1_t vd, vuint8mf8_t vs2,
                               vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredsum_tum(vbool32_t vm, vuint8m1_t vd, vuint8mf4_t vs2,
                               vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredsum_tum(vbool16_t vm, vuint8m1_t vd, vuint8mf2_t vs2,
                               vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredsum_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                               vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredsum_tum(vbool4_t vm, vuint8m1_t vd, vuint8m2_t vs2,
                               vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredsum_tum(vbool2_t vm, vuint8m1_t vd, vuint8m4_t vs2,
                               vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredsum_tum(vbool1_t vm, vuint8m1_t vd, vuint8m8_t vs2,
                               vuint8m1_t vs1, size_t vl);
// vuint16: vs2 vuint16mf4_t..vuint16m8_t, vm vbool64_t..vbool2_t
vuint16m1_t __riscv_vredsum_tum(vbool64_t vm, vuint16m1_t vd, vuint16mf4_t vs2,
                                vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredsum_tum(vbool32_t vm, vuint16m1_t vd, vuint16mf2_t vs2,
                                vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredsum_tum(vbool16_t vm, vuint16m1_t vd, vuint16m1_t vs2,
                                vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredsum_tum(vbool8_t vm, vuint16m1_t vd, vuint16m2_t vs2,
                                vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredsum_tum(vbool4_t vm, vuint16m1_t vd, vuint16m4_t vs2,
                                vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredsum_tum(vbool2_t vm, vuint16m1_t vd, vuint16m8_t vs2,
                                vuint16m1_t vs1, size_t vl);
// vuint32: vs2 vuint32mf2_t..vuint32m8_t, vm vbool64_t..vbool4_t
vuint32m1_t __riscv_vredsum_tum(vbool64_t vm, vuint32m1_t vd, vuint32mf2_t vs2,
                                vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredsum_tum(vbool32_t vm, vuint32m1_t vd, vuint32m1_t vs2,
                                vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredsum_tum(vbool16_t vm, vuint32m1_t vd, vuint32m2_t vs2,
                                vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredsum_tum(vbool8_t vm, vuint32m1_t vd, vuint32m4_t vs2,
                                vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredsum_tum(vbool4_t vm, vuint32m1_t vd, vuint32m8_t vs2,
                                vuint32m1_t vs1, size_t vl);
// vuint64: vs2 vuint64m1_t..vuint64m8_t, vm vbool64_t..vbool8_t
vuint64m1_t __riscv_vredsum_tum(vbool64_t vm, vuint64m1_t vd, vuint64m1_t vs2,
                                vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredsum_tum(vbool32_t vm, vuint64m1_t vd, vuint64m2_t vs2,
                                vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredsum_tum(vbool16_t vm, vuint64m1_t vd, vuint64m4_t vs2,
                                vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredsum_tum(vbool8_t vm, vuint64m1_t vd, vuint64m8_t vs2,
                                vuint64m1_t vs1, size_t vl);
// Unsigned overloads of __riscv_vredmaxu_tum(vm, vd, vs2, vs1, vl).
// Within each vuintN family the return type, vd and vs1 are the same m1 type;
// only vs2 (and with it the vbool type of vm) changes between overloads.
// NOTE(review): the reduction and `_tum` policy semantics are not spelled out
// in this listing; confirm against the RISC-V vector specification.
// vuint8: vs2 vuint8mf8_t..vuint8m8_t, vm vbool64_t..vbool1_t
vuint8m1_t __riscv_vredmaxu_tum(vbool64_t vm, vuint8m1_t vd, vuint8mf8_t vs2,
                                vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredmaxu_tum(vbool32_t vm, vuint8m1_t vd, vuint8mf4_t vs2,
                                vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredmaxu_tum(vbool16_t vm, vuint8m1_t vd, vuint8mf2_t vs2,
                                vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredmaxu_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredmaxu_tum(vbool4_t vm, vuint8m1_t vd, vuint8m2_t vs2,
                                vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredmaxu_tum(vbool2_t vm, vuint8m1_t vd, vuint8m4_t vs2,
                                vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredmaxu_tum(vbool1_t vm, vuint8m1_t vd, vuint8m8_t vs2,
                                vuint8m1_t vs1, size_t vl);
// vuint16: vs2 vuint16mf4_t..vuint16m8_t, vm vbool64_t..vbool2_t
vuint16m1_t __riscv_vredmaxu_tum(vbool64_t vm, vuint16m1_t vd, vuint16mf4_t vs2,
                                 vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredmaxu_tum(vbool32_t vm, vuint16m1_t vd, vuint16mf2_t vs2,
                                 vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredmaxu_tum(vbool16_t vm, vuint16m1_t vd, vuint16m1_t vs2,
                                 vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredmaxu_tum(vbool8_t vm, vuint16m1_t vd, vuint16m2_t vs2,
                                 vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredmaxu_tum(vbool4_t vm, vuint16m1_t vd, vuint16m4_t vs2,
                                 vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredmaxu_tum(vbool2_t vm, vuint16m1_t vd, vuint16m8_t vs2,
                                 vuint16m1_t vs1, size_t vl);
// vuint32: vs2 vuint32mf2_t..vuint32m8_t, vm vbool64_t..vbool4_t
vuint32m1_t __riscv_vredmaxu_tum(vbool64_t vm, vuint32m1_t vd, vuint32mf2_t vs2,
                                 vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredmaxu_tum(vbool32_t vm, vuint32m1_t vd, vuint32m1_t vs2,
                                 vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredmaxu_tum(vbool16_t vm, vuint32m1_t vd, vuint32m2_t vs2,
                                 vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredmaxu_tum(vbool8_t vm, vuint32m1_t vd, vuint32m4_t vs2,
                                 vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredmaxu_tum(vbool4_t vm, vuint32m1_t vd, vuint32m8_t vs2,
                                 vuint32m1_t vs1, size_t vl);
// vuint64: vs2 vuint64m1_t..vuint64m8_t, vm vbool64_t..vbool8_t
vuint64m1_t __riscv_vredmaxu_tum(vbool64_t vm, vuint64m1_t vd, vuint64m1_t vs2,
                                 vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredmaxu_tum(vbool32_t vm, vuint64m1_t vd, vuint64m2_t vs2,
                                 vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredmaxu_tum(vbool16_t vm, vuint64m1_t vd, vuint64m4_t vs2,
                                 vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredmaxu_tum(vbool8_t vm, vuint64m1_t vd, vuint64m8_t vs2,
                                 vuint64m1_t vs1, size_t vl);
// Unsigned overloads of __riscv_vredminu_tum(vm, vd, vs2, vs1, vl).
// Within each vuintN family the return type, vd and vs1 are the same m1 type;
// only vs2 (and with it the vbool type of vm) changes between overloads.
// NOTE(review): the reduction and `_tum` policy semantics are not spelled out
// in this listing; confirm against the RISC-V vector specification.
// vuint8: vs2 vuint8mf8_t..vuint8m8_t, vm vbool64_t..vbool1_t
vuint8m1_t __riscv_vredminu_tum(vbool64_t vm, vuint8m1_t vd, vuint8mf8_t vs2,
                                vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredminu_tum(vbool32_t vm, vuint8m1_t vd, vuint8mf4_t vs2,
                                vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredminu_tum(vbool16_t vm, vuint8m1_t vd, vuint8mf2_t vs2,
                                vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredminu_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                                vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredminu_tum(vbool4_t vm, vuint8m1_t vd, vuint8m2_t vs2,
                                vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredminu_tum(vbool2_t vm, vuint8m1_t vd, vuint8m4_t vs2,
                                vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredminu_tum(vbool1_t vm, vuint8m1_t vd, vuint8m8_t vs2,
                                vuint8m1_t vs1, size_t vl);
// vuint16: vs2 vuint16mf4_t..vuint16m8_t, vm vbool64_t..vbool2_t
vuint16m1_t __riscv_vredminu_tum(vbool64_t vm, vuint16m1_t vd, vuint16mf4_t vs2,
                                 vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredminu_tum(vbool32_t vm, vuint16m1_t vd, vuint16mf2_t vs2,
                                 vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredminu_tum(vbool16_t vm, vuint16m1_t vd, vuint16m1_t vs2,
                                 vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredminu_tum(vbool8_t vm, vuint16m1_t vd, vuint16m2_t vs2,
                                 vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredminu_tum(vbool4_t vm, vuint16m1_t vd, vuint16m4_t vs2,
                                 vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredminu_tum(vbool2_t vm, vuint16m1_t vd, vuint16m8_t vs2,
                                 vuint16m1_t vs1, size_t vl);
// vuint32: vs2 vuint32mf2_t..vuint32m8_t, vm vbool64_t..vbool4_t
vuint32m1_t __riscv_vredminu_tum(vbool64_t vm, vuint32m1_t vd, vuint32mf2_t vs2,
                                 vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredminu_tum(vbool32_t vm, vuint32m1_t vd, vuint32m1_t vs2,
                                 vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredminu_tum(vbool16_t vm, vuint32m1_t vd, vuint32m2_t vs2,
                                 vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredminu_tum(vbool8_t vm, vuint32m1_t vd, vuint32m4_t vs2,
                                 vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredminu_tum(vbool4_t vm, vuint32m1_t vd, vuint32m8_t vs2,
                                 vuint32m1_t vs1, size_t vl);
// vuint64: vs2 vuint64m1_t..vuint64m8_t, vm vbool64_t..vbool8_t
vuint64m1_t __riscv_vredminu_tum(vbool64_t vm, vuint64m1_t vd, vuint64m1_t vs2,
                                 vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredminu_tum(vbool32_t vm, vuint64m1_t vd, vuint64m2_t vs2,
                                 vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredminu_tum(vbool16_t vm, vuint64m1_t vd, vuint64m4_t vs2,
                                 vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredminu_tum(vbool8_t vm, vuint64m1_t vd, vuint64m8_t vs2,
                                 vuint64m1_t vs1, size_t vl);
// Unsigned overloads of __riscv_vredand_tum(vm, vd, vs2, vs1, vl).
// Within each vuintN family the return type, vd and vs1 are the same m1 type;
// only vs2 (and with it the vbool type of vm) changes between overloads.
// NOTE(review): the reduction and `_tum` policy semantics are not spelled out
// in this listing; confirm against the RISC-V vector specification.
// vuint8: vs2 vuint8mf8_t..vuint8m8_t, vm vbool64_t..vbool1_t
vuint8m1_t __riscv_vredand_tum(vbool64_t vm, vuint8m1_t vd, vuint8mf8_t vs2,
                               vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredand_tum(vbool32_t vm, vuint8m1_t vd, vuint8mf4_t vs2,
                               vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredand_tum(vbool16_t vm, vuint8m1_t vd, vuint8mf2_t vs2,
                               vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredand_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                               vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredand_tum(vbool4_t vm, vuint8m1_t vd, vuint8m2_t vs2,
                               vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredand_tum(vbool2_t vm, vuint8m1_t vd, vuint8m4_t vs2,
                               vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredand_tum(vbool1_t vm, vuint8m1_t vd, vuint8m8_t vs2,
                               vuint8m1_t vs1, size_t vl);
// vuint16: vs2 vuint16mf4_t..vuint16m8_t, vm vbool64_t..vbool2_t
vuint16m1_t __riscv_vredand_tum(vbool64_t vm, vuint16m1_t vd, vuint16mf4_t vs2,
                                vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredand_tum(vbool32_t vm, vuint16m1_t vd, vuint16mf2_t vs2,
                                vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredand_tum(vbool16_t vm, vuint16m1_t vd, vuint16m1_t vs2,
                                vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredand_tum(vbool8_t vm, vuint16m1_t vd, vuint16m2_t vs2,
                                vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredand_tum(vbool4_t vm, vuint16m1_t vd, vuint16m4_t vs2,
                                vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredand_tum(vbool2_t vm, vuint16m1_t vd, vuint16m8_t vs2,
                                vuint16m1_t vs1, size_t vl);
// vuint32: vs2 vuint32mf2_t..vuint32m8_t, vm vbool64_t..vbool4_t
vuint32m1_t __riscv_vredand_tum(vbool64_t vm, vuint32m1_t vd, vuint32mf2_t vs2,
                                vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredand_tum(vbool32_t vm, vuint32m1_t vd, vuint32m1_t vs2,
                                vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredand_tum(vbool16_t vm, vuint32m1_t vd, vuint32m2_t vs2,
                                vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredand_tum(vbool8_t vm, vuint32m1_t vd, vuint32m4_t vs2,
                                vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredand_tum(vbool4_t vm, vuint32m1_t vd, vuint32m8_t vs2,
                                vuint32m1_t vs1, size_t vl);
// vuint64: vs2 vuint64m1_t..vuint64m8_t, vm vbool64_t..vbool8_t
vuint64m1_t __riscv_vredand_tum(vbool64_t vm, vuint64m1_t vd, vuint64m1_t vs2,
                                vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredand_tum(vbool32_t vm, vuint64m1_t vd, vuint64m2_t vs2,
                                vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredand_tum(vbool16_t vm, vuint64m1_t vd, vuint64m4_t vs2,
                                vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredand_tum(vbool8_t vm, vuint64m1_t vd, vuint64m8_t vs2,
                                vuint64m1_t vs1, size_t vl);
// Unsigned overloads of __riscv_vredor_tum(vm, vd, vs2, vs1, vl).
// Within each vuintN family the return type, vd and vs1 are the same m1 type;
// only vs2 (and with it the vbool type of vm) changes between overloads.
// NOTE(review): the reduction and `_tum` policy semantics are not spelled out
// in this listing; confirm against the RISC-V vector specification.
// vuint8: vs2 vuint8mf8_t..vuint8m8_t, vm vbool64_t..vbool1_t
vuint8m1_t __riscv_vredor_tum(vbool64_t vm, vuint8m1_t vd, vuint8mf8_t vs2,
                              vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredor_tum(vbool32_t vm, vuint8m1_t vd, vuint8mf4_t vs2,
                              vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredor_tum(vbool16_t vm, vuint8m1_t vd, vuint8mf2_t vs2,
                              vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredor_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                              vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredor_tum(vbool4_t vm, vuint8m1_t vd, vuint8m2_t vs2,
                              vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredor_tum(vbool2_t vm, vuint8m1_t vd, vuint8m4_t vs2,
                              vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredor_tum(vbool1_t vm, vuint8m1_t vd, vuint8m8_t vs2,
                              vuint8m1_t vs1, size_t vl);
// vuint16: vs2 vuint16mf4_t..vuint16m8_t, vm vbool64_t..vbool2_t
vuint16m1_t __riscv_vredor_tum(vbool64_t vm, vuint16m1_t vd, vuint16mf4_t vs2,
                               vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredor_tum(vbool32_t vm, vuint16m1_t vd, vuint16mf2_t vs2,
                               vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredor_tum(vbool16_t vm, vuint16m1_t vd, vuint16m1_t vs2,
                               vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredor_tum(vbool8_t vm, vuint16m1_t vd, vuint16m2_t vs2,
                               vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredor_tum(vbool4_t vm, vuint16m1_t vd, vuint16m4_t vs2,
                               vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredor_tum(vbool2_t vm, vuint16m1_t vd, vuint16m8_t vs2,
                               vuint16m1_t vs1, size_t vl);
// vuint32: vs2 vuint32mf2_t..vuint32m8_t, vm vbool64_t..vbool4_t
vuint32m1_t __riscv_vredor_tum(vbool64_t vm, vuint32m1_t vd, vuint32mf2_t vs2,
                               vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredor_tum(vbool32_t vm, vuint32m1_t vd, vuint32m1_t vs2,
                               vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredor_tum(vbool16_t vm, vuint32m1_t vd, vuint32m2_t vs2,
                               vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredor_tum(vbool8_t vm, vuint32m1_t vd, vuint32m4_t vs2,
                               vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredor_tum(vbool4_t vm, vuint32m1_t vd, vuint32m8_t vs2,
                               vuint32m1_t vs1, size_t vl);
// vuint64: vs2 vuint64m1_t..vuint64m8_t, vm vbool64_t..vbool8_t
vuint64m1_t __riscv_vredor_tum(vbool64_t vm, vuint64m1_t vd, vuint64m1_t vs2,
                               vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredor_tum(vbool32_t vm, vuint64m1_t vd, vuint64m2_t vs2,
                               vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredor_tum(vbool16_t vm, vuint64m1_t vd, vuint64m4_t vs2,
                               vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredor_tum(vbool8_t vm, vuint64m1_t vd, vuint64m8_t vs2,
                               vuint64m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredxor_tum(vbool64_t vm, vuint8m1_t vd, vuint8mf8_t vs2,
                               vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredxor_tum(vbool32_t vm, vuint8m1_t vd, vuint8mf4_t vs2,
                               vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredxor_tum(vbool16_t vm, vuint8m1_t vd, vuint8mf2_t vs2,
                               vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredxor_tum(vbool8_t vm, vuint8m1_t vd, vuint8m1_t vs2,
                               vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredxor_tum(vbool4_t vm, vuint8m1_t vd, vuint8m2_t vs2,
                               vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredxor_tum(vbool2_t vm, vuint8m1_t vd, vuint8m4_t vs2,
                               vuint8m1_t vs1, size_t vl);
vuint8m1_t __riscv_vredxor_tum(vbool1_t vm, vuint8m1_t vd, vuint8m8_t vs2,
                               vuint8m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredxor_tum(vbool64_t vm, vuint16m1_t vd, vuint16mf4_t vs2,
                                vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredxor_tum(vbool32_t vm, vuint16m1_t vd, vuint16mf2_t vs2,
                                vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredxor_tum(vbool16_t vm, vuint16m1_t vd, vuint16m1_t vs2,
                                vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredxor_tum(vbool8_t vm, vuint16m1_t vd, vuint16m2_t vs2,
                                vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredxor_tum(vbool4_t vm, vuint16m1_t vd, vuint16m4_t vs2,
                                vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vredxor_tum(vbool2_t vm, vuint16m1_t vd, vuint16m8_t vs2,
                                vuint16m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredxor_tum(vbool64_t vm, vuint32m1_t vd, vuint32mf2_t vs2,
                                vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredxor_tum(vbool32_t vm, vuint32m1_t vd, vuint32m1_t vs2,
                                vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredxor_tum(vbool16_t vm, vuint32m1_t vd, vuint32m2_t vs2,
                                vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredxor_tum(vbool8_t vm, vuint32m1_t vd, vuint32m4_t vs2,
                                vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vredxor_tum(vbool4_t vm, vuint32m1_t vd, vuint32m8_t vs2,
                                vuint32m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredxor_tum(vbool64_t vm, vuint64m1_t vd, vuint64m1_t vs2,
                                vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredxor_tum(vbool32_t vm, vuint64m1_t vd, vuint64m2_t vs2,
                                vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredxor_tum(vbool16_t vm, vuint64m1_t vd, vuint64m4_t vs2,
                                vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vredxor_tum(vbool8_t vm, vuint64m1_t vd, vuint64m8_t vs2,
                                vuint64m1_t vs1, size_t vl);

Vector Widening Integer Reduction Intrinsics

vint16m1_t __riscv_vwredsum_tu(vint16m1_t vd, vint8mf8_t vs2, vint16m1_t vs1,
                               size_t vl);
vint16m1_t __riscv_vwredsum_tu(vint16m1_t vd, vint8mf4_t vs2, vint16m1_t vs1,
                               size_t vl);
vint16m1_t __riscv_vwredsum_tu(vint16m1_t vd, vint8mf2_t vs2, vint16m1_t vs1,
                               size_t vl);
vint16m1_t __riscv_vwredsum_tu(vint16m1_t vd, vint8m1_t vs2, vint16m1_t vs1,
                               size_t vl);
vint16m1_t __riscv_vwredsum_tu(vint16m1_t vd, vint8m2_t vs2, vint16m1_t vs1,
                               size_t vl);
vint16m1_t __riscv_vwredsum_tu(vint16m1_t vd, vint8m4_t vs2, vint16m1_t vs1,
                               size_t vl);
vint16m1_t __riscv_vwredsum_tu(vint16m1_t vd, vint8m8_t vs2, vint16m1_t vs1,
                               size_t vl);
vint32m1_t __riscv_vwredsum_tu(vint32m1_t vd, vint16mf4_t vs2, vint32m1_t vs1,
                               size_t vl);
vint32m1_t __riscv_vwredsum_tu(vint32m1_t vd, vint16mf2_t vs2, vint32m1_t vs1,
                               size_t vl);
vint32m1_t __riscv_vwredsum_tu(vint32m1_t vd, vint16m1_t vs2, vint32m1_t vs1,
                               size_t vl);
vint32m1_t __riscv_vwredsum_tu(vint32m1_t vd, vint16m2_t vs2, vint32m1_t vs1,
                               size_t vl);
vint32m1_t __riscv_vwredsum_tu(vint32m1_t vd, vint16m4_t vs2, vint32m1_t vs1,
                               size_t vl);
vint32m1_t __riscv_vwredsum_tu(vint32m1_t vd, vint16m8_t vs2, vint32m1_t vs1,
                               size_t vl);
vint64m1_t __riscv_vwredsum_tu(vint64m1_t vd, vint32mf2_t vs2, vint64m1_t vs1,
                               size_t vl);
vint64m1_t __riscv_vwredsum_tu(vint64m1_t vd, vint32m1_t vs2, vint64m1_t vs1,
                               size_t vl);
vint64m1_t __riscv_vwredsum_tu(vint64m1_t vd, vint32m2_t vs2, vint64m1_t vs1,
                               size_t vl);
vint64m1_t __riscv_vwredsum_tu(vint64m1_t vd, vint32m4_t vs2, vint64m1_t vs1,
                               size_t vl);
vint64m1_t __riscv_vwredsum_tu(vint64m1_t vd, vint32m8_t vs2, vint64m1_t vs1,
                               size_t vl);
vuint16m1_t __riscv_vwredsumu_tu(vuint16m1_t vd, vuint8mf8_t vs2,
                                 vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vwredsumu_tu(vuint16m1_t vd, vuint8mf4_t vs2,
                                 vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vwredsumu_tu(vuint16m1_t vd, vuint8mf2_t vs2,
                                 vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vwredsumu_tu(vuint16m1_t vd, vuint8m1_t vs2,
                                 vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vwredsumu_tu(vuint16m1_t vd, vuint8m2_t vs2,
                                 vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vwredsumu_tu(vuint16m1_t vd, vuint8m4_t vs2,
                                 vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vwredsumu_tu(vuint16m1_t vd, vuint8m8_t vs2,
                                 vuint16m1_t vs1, size_t vl);
vuint32m1_t __riscv_vwredsumu_tu(vuint32m1_t vd, vuint16mf4_t vs2,
                                 vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vwredsumu_tu(vuint32m1_t vd, vuint16mf2_t vs2,
                                 vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vwredsumu_tu(vuint32m1_t vd, vuint16m1_t vs2,
                                 vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vwredsumu_tu(vuint32m1_t vd, vuint16m2_t vs2,
                                 vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vwredsumu_tu(vuint32m1_t vd, vuint16m4_t vs2,
                                 vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vwredsumu_tu(vuint32m1_t vd, vuint16m8_t vs2,
                                 vuint32m1_t vs1, size_t vl);
vuint64m1_t __riscv_vwredsumu_tu(vuint64m1_t vd, vuint32mf2_t vs2,
                                 vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vwredsumu_tu(vuint64m1_t vd, vuint32m1_t vs2,
                                 vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vwredsumu_tu(vuint64m1_t vd, vuint32m2_t vs2,
                                 vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vwredsumu_tu(vuint64m1_t vd, vuint32m4_t vs2,
                                 vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vwredsumu_tu(vuint64m1_t vd, vuint32m8_t vs2,
                                 vuint64m1_t vs1, size_t vl);
// masked functions
vint16m1_t __riscv_vwredsum_tum(vbool64_t vm, vint16m1_t vd, vint8mf8_t vs2,
                                vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vwredsum_tum(vbool32_t vm, vint16m1_t vd, vint8mf4_t vs2,
                                vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vwredsum_tum(vbool16_t vm, vint16m1_t vd, vint8mf2_t vs2,
                                vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vwredsum_tum(vbool8_t vm, vint16m1_t vd, vint8m1_t vs2,
                                vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vwredsum_tum(vbool4_t vm, vint16m1_t vd, vint8m2_t vs2,
                                vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vwredsum_tum(vbool2_t vm, vint16m1_t vd, vint8m4_t vs2,
                                vint16m1_t vs1, size_t vl);
vint16m1_t __riscv_vwredsum_tum(vbool1_t vm, vint16m1_t vd, vint8m8_t vs2,
                                vint16m1_t vs1, size_t vl);
vint32m1_t __riscv_vwredsum_tum(vbool64_t vm, vint32m1_t vd, vint16mf4_t vs2,
                                vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vwredsum_tum(vbool32_t vm, vint32m1_t vd, vint16mf2_t vs2,
                                vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vwredsum_tum(vbool16_t vm, vint32m1_t vd, vint16m1_t vs2,
                                vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vwredsum_tum(vbool8_t vm, vint32m1_t vd, vint16m2_t vs2,
                                vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vwredsum_tum(vbool4_t vm, vint32m1_t vd, vint16m4_t vs2,
                                vint32m1_t vs1, size_t vl);
vint32m1_t __riscv_vwredsum_tum(vbool2_t vm, vint32m1_t vd, vint16m8_t vs2,
                                vint32m1_t vs1, size_t vl);
vint64m1_t __riscv_vwredsum_tum(vbool64_t vm, vint64m1_t vd, vint32mf2_t vs2,
                                vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vwredsum_tum(vbool32_t vm, vint64m1_t vd, vint32m1_t vs2,
                                vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vwredsum_tum(vbool16_t vm, vint64m1_t vd, vint32m2_t vs2,
                                vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vwredsum_tum(vbool8_t vm, vint64m1_t vd, vint32m4_t vs2,
                                vint64m1_t vs1, size_t vl);
vint64m1_t __riscv_vwredsum_tum(vbool4_t vm, vint64m1_t vd, vint32m8_t vs2,
                                vint64m1_t vs1, size_t vl);
vuint16m1_t __riscv_vwredsumu_tum(vbool64_t vm, vuint16m1_t vd, vuint8mf8_t vs2,
                                  vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vwredsumu_tum(vbool32_t vm, vuint16m1_t vd, vuint8mf4_t vs2,
                                  vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vwredsumu_tum(vbool16_t vm, vuint16m1_t vd, vuint8mf2_t vs2,
                                  vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vwredsumu_tum(vbool8_t vm, vuint16m1_t vd, vuint8m1_t vs2,
                                  vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vwredsumu_tum(vbool4_t vm, vuint16m1_t vd, vuint8m2_t vs2,
                                  vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vwredsumu_tum(vbool2_t vm, vuint16m1_t vd, vuint8m4_t vs2,
                                  vuint16m1_t vs1, size_t vl);
vuint16m1_t __riscv_vwredsumu_tum(vbool1_t vm, vuint16m1_t vd, vuint8m8_t vs2,
                                  vuint16m1_t vs1, size_t vl);
vuint32m1_t __riscv_vwredsumu_tum(vbool64_t vm, vuint32m1_t vd,
                                  vuint16mf4_t vs2, vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vwredsumu_tum(vbool32_t vm, vuint32m1_t vd,
                                  vuint16mf2_t vs2, vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vwredsumu_tum(vbool16_t vm, vuint32m1_t vd, vuint16m1_t vs2,
                                  vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vwredsumu_tum(vbool8_t vm, vuint32m1_t vd, vuint16m2_t vs2,
                                  vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vwredsumu_tum(vbool4_t vm, vuint32m1_t vd, vuint16m4_t vs2,
                                  vuint32m1_t vs1, size_t vl);
vuint32m1_t __riscv_vwredsumu_tum(vbool2_t vm, vuint32m1_t vd, vuint16m8_t vs2,
                                  vuint32m1_t vs1, size_t vl);
vuint64m1_t __riscv_vwredsumu_tum(vbool64_t vm, vuint64m1_t vd,
                                  vuint32mf2_t vs2, vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vwredsumu_tum(vbool32_t vm, vuint64m1_t vd, vuint32m1_t vs2,
                                  vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vwredsumu_tum(vbool16_t vm, vuint64m1_t vd, vuint32m2_t vs2,
                                  vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vwredsumu_tum(vbool8_t vm, vuint64m1_t vd, vuint32m4_t vs2,
                                  vuint64m1_t vs1, size_t vl);
vuint64m1_t __riscv_vwredsumu_tum(vbool4_t vm, vuint64m1_t vd, vuint32m8_t vs2,
                                  vuint64m1_t vs1, size_t vl);

Vector Single-Width Floating-Point Reduction Intrinsics

vfloat16m1_t __riscv_vfredosum_tu(vfloat16m1_t vd, vfloat16mf4_t vs2,
                                  vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredosum_tu(vfloat16m1_t vd, vfloat16mf2_t vs2,
                                  vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredosum_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                  vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredosum_tu(vfloat16m1_t vd, vfloat16m2_t vs2,
                                  vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredosum_tu(vfloat16m1_t vd, vfloat16m4_t vs2,
                                  vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredosum_tu(vfloat16m1_t vd, vfloat16m8_t vs2,
                                  vfloat16m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredosum_tu(vfloat32m1_t vd, vfloat32mf2_t vs2,
                                  vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredosum_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                  vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredosum_tu(vfloat32m1_t vd, vfloat32m2_t vs2,
                                  vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredosum_tu(vfloat32m1_t vd, vfloat32m4_t vs2,
                                  vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredosum_tu(vfloat32m1_t vd, vfloat32m8_t vs2,
                                  vfloat32m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredosum_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                  vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredosum_tu(vfloat64m1_t vd, vfloat64m2_t vs2,
                                  vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredosum_tu(vfloat64m1_t vd, vfloat64m4_t vs2,
                                  vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredosum_tu(vfloat64m1_t vd, vfloat64m8_t vs2,
                                  vfloat64m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredusum_tu(vfloat16m1_t vd, vfloat16mf4_t vs2,
                                  vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredusum_tu(vfloat16m1_t vd, vfloat16mf2_t vs2,
                                  vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredusum_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                  vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredusum_tu(vfloat16m1_t vd, vfloat16m2_t vs2,
                                  vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredusum_tu(vfloat16m1_t vd, vfloat16m4_t vs2,
                                  vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredusum_tu(vfloat16m1_t vd, vfloat16m8_t vs2,
                                  vfloat16m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredusum_tu(vfloat32m1_t vd, vfloat32mf2_t vs2,
                                  vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredusum_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                  vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredusum_tu(vfloat32m1_t vd, vfloat32m2_t vs2,
                                  vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredusum_tu(vfloat32m1_t vd, vfloat32m4_t vs2,
                                  vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredusum_tu(vfloat32m1_t vd, vfloat32m8_t vs2,
                                  vfloat32m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredusum_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                  vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredusum_tu(vfloat64m1_t vd, vfloat64m2_t vs2,
                                  vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredusum_tu(vfloat64m1_t vd, vfloat64m4_t vs2,
                                  vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredusum_tu(vfloat64m1_t vd, vfloat64m8_t vs2,
                                  vfloat64m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredmax_tu(vfloat16m1_t vd, vfloat16mf4_t vs2,
                                 vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredmax_tu(vfloat16m1_t vd, vfloat16mf2_t vs2,
                                 vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredmax_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                 vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredmax_tu(vfloat16m1_t vd, vfloat16m2_t vs2,
                                 vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredmax_tu(vfloat16m1_t vd, vfloat16m4_t vs2,
                                 vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredmax_tu(vfloat16m1_t vd, vfloat16m8_t vs2,
                                 vfloat16m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredmax_tu(vfloat32m1_t vd, vfloat32mf2_t vs2,
                                 vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredmax_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                 vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredmax_tu(vfloat32m1_t vd, vfloat32m2_t vs2,
                                 vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredmax_tu(vfloat32m1_t vd, vfloat32m4_t vs2,
                                 vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredmax_tu(vfloat32m1_t vd, vfloat32m8_t vs2,
                                 vfloat32m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredmax_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                 vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredmax_tu(vfloat64m1_t vd, vfloat64m2_t vs2,
                                 vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredmax_tu(vfloat64m1_t vd, vfloat64m4_t vs2,
                                 vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredmax_tu(vfloat64m1_t vd, vfloat64m8_t vs2,
                                 vfloat64m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredmin_tu(vfloat16m1_t vd, vfloat16mf4_t vs2,
                                 vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredmin_tu(vfloat16m1_t vd, vfloat16mf2_t vs2,
                                 vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredmin_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                 vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredmin_tu(vfloat16m1_t vd, vfloat16m2_t vs2,
                                 vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredmin_tu(vfloat16m1_t vd, vfloat16m4_t vs2,
                                 vfloat16m1_t vs1, size_t vl);
vfloat16m1_t __riscv_vfredmin_tu(vfloat16m1_t vd, vfloat16m8_t vs2,
                                 vfloat16m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredmin_tu(vfloat32m1_t vd, vfloat32mf2_t vs2,
                                 vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredmin_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                 vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredmin_tu(vfloat32m1_t vd, vfloat32m2_t vs2,
                                 vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredmin_tu(vfloat32m1_t vd, vfloat32m4_t vs2,
                                 vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfredmin_tu(vfloat32m1_t vd, vfloat32m8_t vs2,
                                 vfloat32m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredmin_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                 vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredmin_tu(vfloat64m1_t vd, vfloat64m2_t vs2,
                                 vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredmin_tu(vfloat64m1_t vd, vfloat64m4_t vs2,
                                 vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfredmin_tu(vfloat64m1_t vd, vfloat64m8_t vs2,
                                 vfloat64m1_t vs1, size_t vl);
// masked functions
vfloat16m1_t __riscv_vfredosum_tum(vbool64_t vm, vfloat16m1_t vd,
                                   vfloat16mf4_t vs2, vfloat16m1_t vs1,
                                   size_t vl);
vfloat16m1_t __riscv_vfredosum_tum(vbool32_t vm, vfloat16m1_t vd,
                                   vfloat16mf2_t vs2, vfloat16m1_t vs1,
                                   size_t vl);
vfloat16m1_t __riscv_vfredosum_tum(vbool16_t vm, vfloat16m1_t vd,
                                   vfloat16m1_t vs2, vfloat16m1_t vs1,
                                   size_t vl);
vfloat16m1_t __riscv_vfredosum_tum(vbool8_t vm, vfloat16m1_t vd,
                                   vfloat16m2_t vs2, vfloat16m1_t vs1,
                                   size_t vl);
vfloat16m1_t __riscv_vfredosum_tum(vbool4_t vm, vfloat16m1_t vd,
                                   vfloat16m4_t vs2, vfloat16m1_t vs1,
                                   size_t vl);
vfloat16m1_t __riscv_vfredosum_tum(vbool2_t vm, vfloat16m1_t vd,
                                   vfloat16m8_t vs2, vfloat16m1_t vs1,
                                   size_t vl);
vfloat32m1_t __riscv_vfredosum_tum(vbool64_t vm, vfloat32m1_t vd,
                                   vfloat32mf2_t vs2, vfloat32m1_t vs1,
                                   size_t vl);
vfloat32m1_t __riscv_vfredosum_tum(vbool32_t vm, vfloat32m1_t vd,
                                   vfloat32m1_t vs2, vfloat32m1_t vs1,
                                   size_t vl);
vfloat32m1_t __riscv_vfredosum_tum(vbool16_t vm, vfloat32m1_t vd,
                                   vfloat32m2_t vs2, vfloat32m1_t vs1,
                                   size_t vl);
vfloat32m1_t __riscv_vfredosum_tum(vbool8_t vm, vfloat32m1_t vd,
                                   vfloat32m4_t vs2, vfloat32m1_t vs1,
                                   size_t vl);
vfloat32m1_t __riscv_vfredosum_tum(vbool4_t vm, vfloat32m1_t vd,
                                   vfloat32m8_t vs2, vfloat32m1_t vs1,
                                   size_t vl);
vfloat64m1_t __riscv_vfredosum_tum(vbool64_t vm, vfloat64m1_t vd,
                                   vfloat64m1_t vs2, vfloat64m1_t vs1,
                                   size_t vl);
vfloat64m1_t __riscv_vfredosum_tum(vbool32_t vm, vfloat64m1_t vd,
                                   vfloat64m2_t vs2, vfloat64m1_t vs1,
                                   size_t vl);
vfloat64m1_t __riscv_vfredosum_tum(vbool16_t vm, vfloat64m1_t vd,
                                   vfloat64m4_t vs2, vfloat64m1_t vs1,
                                   size_t vl);
vfloat64m1_t __riscv_vfredosum_tum(vbool8_t vm, vfloat64m1_t vd,
                                   vfloat64m8_t vs2, vfloat64m1_t vs1,
                                   size_t vl);
vfloat16m1_t __riscv_vfredusum_tum(vbool64_t vm, vfloat16m1_t vd,
                                   vfloat16mf4_t vs2, vfloat16m1_t vs1,
                                   size_t vl);
vfloat16m1_t __riscv_vfredusum_tum(vbool32_t vm, vfloat16m1_t vd,
                                   vfloat16mf2_t vs2, vfloat16m1_t vs1,
                                   size_t vl);
vfloat16m1_t __riscv_vfredusum_tum(vbool16_t vm, vfloat16m1_t vd,
                                   vfloat16m1_t vs2, vfloat16m1_t vs1,
                                   size_t vl);
vfloat16m1_t __riscv_vfredusum_tum(vbool8_t vm, vfloat16m1_t vd,
                                   vfloat16m2_t vs2, vfloat16m1_t vs1,
                                   size_t vl);
vfloat16m1_t __riscv_vfredusum_tum(vbool4_t vm, vfloat16m1_t vd,
                                   vfloat16m4_t vs2, vfloat16m1_t vs1,
                                   size_t vl);
vfloat16m1_t __riscv_vfredusum_tum(vbool2_t vm, vfloat16m1_t vd,
                                   vfloat16m8_t vs2, vfloat16m1_t vs1,
                                   size_t vl);
vfloat32m1_t __riscv_vfredusum_tum(vbool64_t vm, vfloat32m1_t vd,
                                   vfloat32mf2_t vs2, vfloat32m1_t vs1,
                                   size_t vl);
vfloat32m1_t __riscv_vfredusum_tum(vbool32_t vm, vfloat32m1_t vd,
                                   vfloat32m1_t vs2, vfloat32m1_t vs1,
                                   size_t vl);
vfloat32m1_t __riscv_vfredusum_tum(vbool16_t vm, vfloat32m1_t vd,
                                   vfloat32m2_t vs2, vfloat32m1_t vs1,
                                   size_t vl);
vfloat32m1_t __riscv_vfredusum_tum(vbool8_t vm, vfloat32m1_t vd,
                                   vfloat32m4_t vs2, vfloat32m1_t vs1,
                                   size_t vl);
vfloat32m1_t __riscv_vfredusum_tum(vbool4_t vm, vfloat32m1_t vd,
                                   vfloat32m8_t vs2, vfloat32m1_t vs1,
                                   size_t vl);
vfloat64m1_t __riscv_vfredusum_tum(vbool64_t vm, vfloat64m1_t vd,
                                   vfloat64m1_t vs2, vfloat64m1_t vs1,
                                   size_t vl);
vfloat64m1_t __riscv_vfredusum_tum(vbool32_t vm, vfloat64m1_t vd,
                                   vfloat64m2_t vs2, vfloat64m1_t vs1,
                                   size_t vl);
vfloat64m1_t __riscv_vfredusum_tum(vbool16_t vm, vfloat64m1_t vd,
                                   vfloat64m4_t vs2, vfloat64m1_t vs1,
                                   size_t vl);
vfloat64m1_t __riscv_vfredusum_tum(vbool8_t vm, vfloat64m1_t vd,
                                   vfloat64m8_t vs2, vfloat64m1_t vs1,
                                   size_t vl);
vfloat16m1_t __riscv_vfredmax_tum(vbool64_t vm, vfloat16m1_t vd,
                                  vfloat16mf4_t vs2, vfloat16m1_t vs1,
                                  size_t vl);
vfloat16m1_t __riscv_vfredmax_tum(vbool32_t vm, vfloat16m1_t vd,
                                  vfloat16mf2_t vs2, vfloat16m1_t vs1,
                                  size_t vl);
vfloat16m1_t __riscv_vfredmax_tum(vbool16_t vm, vfloat16m1_t vd,
                                  vfloat16m1_t vs2, vfloat16m1_t vs1,
                                  size_t vl);
vfloat16m1_t __riscv_vfredmax_tum(vbool8_t vm, vfloat16m1_t vd,
                                  vfloat16m2_t vs2, vfloat16m1_t vs1,
                                  size_t vl);
vfloat16m1_t __riscv_vfredmax_tum(vbool4_t vm, vfloat16m1_t vd,
                                  vfloat16m4_t vs2, vfloat16m1_t vs1,
                                  size_t vl);
vfloat16m1_t __riscv_vfredmax_tum(vbool2_t vm, vfloat16m1_t vd,
                                  vfloat16m8_t vs2, vfloat16m1_t vs1,
                                  size_t vl);
vfloat32m1_t __riscv_vfredmax_tum(vbool64_t vm, vfloat32m1_t vd,
                                  vfloat32mf2_t vs2, vfloat32m1_t vs1,
                                  size_t vl);
vfloat32m1_t __riscv_vfredmax_tum(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat32m1_t vs2, vfloat32m1_t vs1,
                                  size_t vl);
vfloat32m1_t __riscv_vfredmax_tum(vbool16_t vm, vfloat32m1_t vd,
                                  vfloat32m2_t vs2, vfloat32m1_t vs1,
                                  size_t vl);
vfloat32m1_t __riscv_vfredmax_tum(vbool8_t vm, vfloat32m1_t vd,
                                  vfloat32m4_t vs2, vfloat32m1_t vs1,
                                  size_t vl);
vfloat32m1_t __riscv_vfredmax_tum(vbool4_t vm, vfloat32m1_t vd,
                                  vfloat32m8_t vs2, vfloat32m1_t vs1,
                                  size_t vl);
vfloat64m1_t __riscv_vfredmax_tum(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat64m1_t vs2, vfloat64m1_t vs1,
                                  size_t vl);
vfloat64m1_t __riscv_vfredmax_tum(vbool32_t vm, vfloat64m1_t vd,
                                  vfloat64m2_t vs2, vfloat64m1_t vs1,
                                  size_t vl);
vfloat64m1_t __riscv_vfredmax_tum(vbool16_t vm, vfloat64m1_t vd,
                                  vfloat64m4_t vs2, vfloat64m1_t vs1,
                                  size_t vl);
vfloat64m1_t __riscv_vfredmax_tum(vbool8_t vm, vfloat64m1_t vd,
                                  vfloat64m8_t vs2, vfloat64m1_t vs1,
                                  size_t vl);
vfloat16m1_t __riscv_vfredmin_tum(vbool64_t vm, vfloat16m1_t vd,
                                  vfloat16mf4_t vs2, vfloat16m1_t vs1,
                                  size_t vl);
vfloat16m1_t __riscv_vfredmin_tum(vbool32_t vm, vfloat16m1_t vd,
                                  vfloat16mf2_t vs2, vfloat16m1_t vs1,
                                  size_t vl);
// (continued) __riscv_vfredmin_tum overloads: the remaining f16 sources
// (m1..m8), then f32 (mf2..m8) and f64 (m1..m8). In every overload below the
// mask `vm` is vbool<N>_t with N = element width / LMUL of vs2, and vd, vs1
// and the result are the LMUL=1 vector of the same element type as vs2.
vfloat16m1_t __riscv_vfredmin_tum(vbool16_t vm, vfloat16m1_t vd,
                                  vfloat16m1_t vs2, vfloat16m1_t vs1,
                                  size_t vl);
vfloat16m1_t __riscv_vfredmin_tum(vbool8_t vm, vfloat16m1_t vd,
                                  vfloat16m2_t vs2, vfloat16m1_t vs1,
                                  size_t vl);
vfloat16m1_t __riscv_vfredmin_tum(vbool4_t vm, vfloat16m1_t vd,
                                  vfloat16m4_t vs2, vfloat16m1_t vs1,
                                  size_t vl);
vfloat16m1_t __riscv_vfredmin_tum(vbool2_t vm, vfloat16m1_t vd,
                                  vfloat16m8_t vs2, vfloat16m1_t vs1,
                                  size_t vl);
vfloat32m1_t __riscv_vfredmin_tum(vbool64_t vm, vfloat32m1_t vd,
                                  vfloat32mf2_t vs2, vfloat32m1_t vs1,
                                  size_t vl);
vfloat32m1_t __riscv_vfredmin_tum(vbool32_t vm, vfloat32m1_t vd,
                                  vfloat32m1_t vs2, vfloat32m1_t vs1,
                                  size_t vl);
vfloat32m1_t __riscv_vfredmin_tum(vbool16_t vm, vfloat32m1_t vd,
                                  vfloat32m2_t vs2, vfloat32m1_t vs1,
                                  size_t vl);
vfloat32m1_t __riscv_vfredmin_tum(vbool8_t vm, vfloat32m1_t vd,
                                  vfloat32m4_t vs2, vfloat32m1_t vs1,
                                  size_t vl);
vfloat32m1_t __riscv_vfredmin_tum(vbool4_t vm, vfloat32m1_t vd,
                                  vfloat32m8_t vs2, vfloat32m1_t vs1,
                                  size_t vl);
vfloat64m1_t __riscv_vfredmin_tum(vbool64_t vm, vfloat64m1_t vd,
                                  vfloat64m1_t vs2, vfloat64m1_t vs1,
                                  size_t vl);
vfloat64m1_t __riscv_vfredmin_tum(vbool32_t vm, vfloat64m1_t vd,
                                  vfloat64m2_t vs2, vfloat64m1_t vs1,
                                  size_t vl);
vfloat64m1_t __riscv_vfredmin_tum(vbool16_t vm, vfloat64m1_t vd,
                                  vfloat64m4_t vs2, vfloat64m1_t vs1,
                                  size_t vl);
vfloat64m1_t __riscv_vfredmin_tum(vbool8_t vm, vfloat64m1_t vd,
                                  vfloat64m8_t vs2, vfloat64m1_t vs1,
                                  size_t vl);
// Unmasked (no `vm` parameter) __riscv_vfredosum_tu overloads that take an
// explicit `unsigned int frm` argument, placed just before `vl`. One overload
// per vs2 type: f16 mf4..m8, f32 mf2..m8, f64 m1..m8; vd, vs1 and the result
// are always the LMUL=1 vector of the same element type as vs2.
// NOTE(review): `frm` is presumably the floating-point rounding mode --
// confirm the accepted values against the RVV intrinsics specification.
vfloat16m1_t __riscv_vfredosum_tu(vfloat16m1_t vd, vfloat16mf4_t vs2,
                                  vfloat16m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat16m1_t __riscv_vfredosum_tu(vfloat16m1_t vd, vfloat16mf2_t vs2,
                                  vfloat16m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat16m1_t __riscv_vfredosum_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                  vfloat16m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat16m1_t __riscv_vfredosum_tu(vfloat16m1_t vd, vfloat16m2_t vs2,
                                  vfloat16m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat16m1_t __riscv_vfredosum_tu(vfloat16m1_t vd, vfloat16m4_t vs2,
                                  vfloat16m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat16m1_t __riscv_vfredosum_tu(vfloat16m1_t vd, vfloat16m8_t vs2,
                                  vfloat16m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat32m1_t __riscv_vfredosum_tu(vfloat32m1_t vd, vfloat32mf2_t vs2,
                                  vfloat32m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat32m1_t __riscv_vfredosum_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                  vfloat32m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat32m1_t __riscv_vfredosum_tu(vfloat32m1_t vd, vfloat32m2_t vs2,
                                  vfloat32m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat32m1_t __riscv_vfredosum_tu(vfloat32m1_t vd, vfloat32m4_t vs2,
                                  vfloat32m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat32m1_t __riscv_vfredosum_tu(vfloat32m1_t vd, vfloat32m8_t vs2,
                                  vfloat32m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat64m1_t __riscv_vfredosum_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                  vfloat64m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat64m1_t __riscv_vfredosum_tu(vfloat64m1_t vd, vfloat64m2_t vs2,
                                  vfloat64m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat64m1_t __riscv_vfredosum_tu(vfloat64m1_t vd, vfloat64m4_t vs2,
                                  vfloat64m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat64m1_t __riscv_vfredosum_tu(vfloat64m1_t vd, vfloat64m8_t vs2,
                                  vfloat64m1_t vs1, unsigned int frm,
                                  size_t vl);
// Unmasked (no `vm` parameter) __riscv_vfredusum_tu overloads that take an
// explicit `unsigned int frm` argument, placed just before `vl`. One overload
// per vs2 type: f16 mf4..m8, f32 mf2..m8, f64 m1..m8; vd, vs1 and the result
// are always the LMUL=1 vector of the same element type as vs2.
// NOTE(review): `frm` is presumably the floating-point rounding mode --
// confirm the accepted values against the RVV intrinsics specification.
vfloat16m1_t __riscv_vfredusum_tu(vfloat16m1_t vd, vfloat16mf4_t vs2,
                                  vfloat16m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat16m1_t __riscv_vfredusum_tu(vfloat16m1_t vd, vfloat16mf2_t vs2,
                                  vfloat16m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat16m1_t __riscv_vfredusum_tu(vfloat16m1_t vd, vfloat16m1_t vs2,
                                  vfloat16m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat16m1_t __riscv_vfredusum_tu(vfloat16m1_t vd, vfloat16m2_t vs2,
                                  vfloat16m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat16m1_t __riscv_vfredusum_tu(vfloat16m1_t vd, vfloat16m4_t vs2,
                                  vfloat16m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat16m1_t __riscv_vfredusum_tu(vfloat16m1_t vd, vfloat16m8_t vs2,
                                  vfloat16m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat32m1_t __riscv_vfredusum_tu(vfloat32m1_t vd, vfloat32mf2_t vs2,
                                  vfloat32m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat32m1_t __riscv_vfredusum_tu(vfloat32m1_t vd, vfloat32m1_t vs2,
                                  vfloat32m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat32m1_t __riscv_vfredusum_tu(vfloat32m1_t vd, vfloat32m2_t vs2,
                                  vfloat32m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat32m1_t __riscv_vfredusum_tu(vfloat32m1_t vd, vfloat32m4_t vs2,
                                  vfloat32m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat32m1_t __riscv_vfredusum_tu(vfloat32m1_t vd, vfloat32m8_t vs2,
                                  vfloat32m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat64m1_t __riscv_vfredusum_tu(vfloat64m1_t vd, vfloat64m1_t vs2,
                                  vfloat64m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat64m1_t __riscv_vfredusum_tu(vfloat64m1_t vd, vfloat64m2_t vs2,
                                  vfloat64m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat64m1_t __riscv_vfredusum_tu(vfloat64m1_t vd, vfloat64m4_t vs2,
                                  vfloat64m1_t vs1, unsigned int frm,
                                  size_t vl);
vfloat64m1_t __riscv_vfredusum_tu(vfloat64m1_t vd, vfloat64m8_t vs2,
                                  vfloat64m1_t vs1, unsigned int frm,
                                  size_t vl);
// masked functions
// __riscv_vfredosum_tum overloads with an explicit `unsigned int frm`
// argument (between vs1 and vl). The leading mask `vm` is vbool<N>_t with
// N = element width / LMUL of vs2 (e.g. vbool64_t for f16mf4, vbool2_t for
// f16m8); vd, vs1 and the result are the LMUL=1 vector of vs2's element type.
// NOTE(review): `frm` is presumably the floating-point rounding mode --
// confirm the accepted values against the RVV intrinsics specification.
vfloat16m1_t __riscv_vfredosum_tum(vbool64_t vm, vfloat16m1_t vd,
                                   vfloat16mf4_t vs2, vfloat16m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfredosum_tum(vbool32_t vm, vfloat16m1_t vd,
                                   vfloat16mf2_t vs2, vfloat16m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfredosum_tum(vbool16_t vm, vfloat16m1_t vd,
                                   vfloat16m1_t vs2, vfloat16m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfredosum_tum(vbool8_t vm, vfloat16m1_t vd,
                                   vfloat16m2_t vs2, vfloat16m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfredosum_tum(vbool4_t vm, vfloat16m1_t vd,
                                   vfloat16m4_t vs2, vfloat16m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfredosum_tum(vbool2_t vm, vfloat16m1_t vd,
                                   vfloat16m8_t vs2, vfloat16m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfredosum_tum(vbool64_t vm, vfloat32m1_t vd,
                                   vfloat32mf2_t vs2, vfloat32m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfredosum_tum(vbool32_t vm, vfloat32m1_t vd,
                                   vfloat32m1_t vs2, vfloat32m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfredosum_tum(vbool16_t vm, vfloat32m1_t vd,
                                   vfloat32m2_t vs2, vfloat32m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfredosum_tum(vbool8_t vm, vfloat32m1_t vd,
                                   vfloat32m4_t vs2, vfloat32m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfredosum_tum(vbool4_t vm, vfloat32m1_t vd,
                                   vfloat32m8_t vs2, vfloat32m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfredosum_tum(vbool64_t vm, vfloat64m1_t vd,
                                   vfloat64m1_t vs2, vfloat64m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfredosum_tum(vbool32_t vm, vfloat64m1_t vd,
                                   vfloat64m2_t vs2, vfloat64m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfredosum_tum(vbool16_t vm, vfloat64m1_t vd,
                                   vfloat64m4_t vs2, vfloat64m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfredosum_tum(vbool8_t vm, vfloat64m1_t vd,
                                   vfloat64m8_t vs2, vfloat64m1_t vs1,
                                   unsigned int frm, size_t vl);
// Masked __riscv_vfredusum_tum overloads with an explicit `unsigned int frm`
// argument (between vs1 and vl). The leading mask `vm` is vbool<N>_t with
// N = element width / LMUL of vs2 (e.g. vbool64_t for f16mf4, vbool2_t for
// f16m8); vd, vs1 and the result are the LMUL=1 vector of vs2's element type.
// NOTE(review): `frm` is presumably the floating-point rounding mode --
// confirm the accepted values against the RVV intrinsics specification.
vfloat16m1_t __riscv_vfredusum_tum(vbool64_t vm, vfloat16m1_t vd,
                                   vfloat16mf4_t vs2, vfloat16m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfredusum_tum(vbool32_t vm, vfloat16m1_t vd,
                                   vfloat16mf2_t vs2, vfloat16m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfredusum_tum(vbool16_t vm, vfloat16m1_t vd,
                                   vfloat16m1_t vs2, vfloat16m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfredusum_tum(vbool8_t vm, vfloat16m1_t vd,
                                   vfloat16m2_t vs2, vfloat16m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfredusum_tum(vbool4_t vm, vfloat16m1_t vd,
                                   vfloat16m4_t vs2, vfloat16m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat16m1_t __riscv_vfredusum_tum(vbool2_t vm, vfloat16m1_t vd,
                                   vfloat16m8_t vs2, vfloat16m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfredusum_tum(vbool64_t vm, vfloat32m1_t vd,
                                   vfloat32mf2_t vs2, vfloat32m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfredusum_tum(vbool32_t vm, vfloat32m1_t vd,
                                   vfloat32m1_t vs2, vfloat32m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfredusum_tum(vbool16_t vm, vfloat32m1_t vd,
                                   vfloat32m2_t vs2, vfloat32m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfredusum_tum(vbool8_t vm, vfloat32m1_t vd,
                                   vfloat32m4_t vs2, vfloat32m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfredusum_tum(vbool4_t vm, vfloat32m1_t vd,
                                   vfloat32m8_t vs2, vfloat32m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfredusum_tum(vbool64_t vm, vfloat64m1_t vd,
                                   vfloat64m1_t vs2, vfloat64m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfredusum_tum(vbool32_t vm, vfloat64m1_t vd,
                                   vfloat64m2_t vs2, vfloat64m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfredusum_tum(vbool16_t vm, vfloat64m1_t vd,
                                   vfloat64m4_t vs2, vfloat64m1_t vs1,
                                   unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfredusum_tum(vbool8_t vm, vfloat64m1_t vd,
                                   vfloat64m8_t vs2, vfloat64m1_t vs1,
                                   unsigned int frm, size_t vl);

Vector Widening Floating-Point Reduction Intrinsics

// Unmasked __riscv_vfwredosum_tu overloads without a `frm` argument. The
// source vs2 is f16 (mf4..m8) or f32 (mf2..m8); vd, vs1 and the result are
// the LMUL=1 vector of twice the source element width (f32m1 for f16 sources,
// f64m1 for f32 sources).
vfloat32m1_t __riscv_vfwredosum_tu(vfloat32m1_t vd, vfloat16mf4_t vs2,
                                   vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredosum_tu(vfloat32m1_t vd, vfloat16mf2_t vs2,
                                   vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredosum_tu(vfloat32m1_t vd, vfloat16m1_t vs2,
                                   vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredosum_tu(vfloat32m1_t vd, vfloat16m2_t vs2,
                                   vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredosum_tu(vfloat32m1_t vd, vfloat16m4_t vs2,
                                   vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredosum_tu(vfloat32m1_t vd, vfloat16m8_t vs2,
                                   vfloat32m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwredosum_tu(vfloat64m1_t vd, vfloat32mf2_t vs2,
                                   vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwredosum_tu(vfloat64m1_t vd, vfloat32m1_t vs2,
                                   vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwredosum_tu(vfloat64m1_t vd, vfloat32m2_t vs2,
                                   vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwredosum_tu(vfloat64m1_t vd, vfloat32m4_t vs2,
                                   vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwredosum_tu(vfloat64m1_t vd, vfloat32m8_t vs2,
                                   vfloat64m1_t vs1, size_t vl);
// Unmasked __riscv_vfwredusum_tu overloads without a `frm` argument. The
// source vs2 is f16 (mf4..m8) or f32 (mf2..m8); vd, vs1 and the result are
// the LMUL=1 vector of twice the source element width (f32m1 for f16 sources,
// f64m1 for f32 sources).
vfloat32m1_t __riscv_vfwredusum_tu(vfloat32m1_t vd, vfloat16mf4_t vs2,
                                   vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredusum_tu(vfloat32m1_t vd, vfloat16mf2_t vs2,
                                   vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredusum_tu(vfloat32m1_t vd, vfloat16m1_t vs2,
                                   vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredusum_tu(vfloat32m1_t vd, vfloat16m2_t vs2,
                                   vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredusum_tu(vfloat32m1_t vd, vfloat16m4_t vs2,
                                   vfloat32m1_t vs1, size_t vl);
vfloat32m1_t __riscv_vfwredusum_tu(vfloat32m1_t vd, vfloat16m8_t vs2,
                                   vfloat32m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwredusum_tu(vfloat64m1_t vd, vfloat32mf2_t vs2,
                                   vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwredusum_tu(vfloat64m1_t vd, vfloat32m1_t vs2,
                                   vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwredusum_tu(vfloat64m1_t vd, vfloat32m2_t vs2,
                                   vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwredusum_tu(vfloat64m1_t vd, vfloat32m4_t vs2,
                                   vfloat64m1_t vs1, size_t vl);
vfloat64m1_t __riscv_vfwredusum_tu(vfloat64m1_t vd, vfloat32m8_t vs2,
                                   vfloat64m1_t vs1, size_t vl);
// masked functions
// __riscv_vfwredosum_tum overloads without a `frm` argument. The leading mask
// `vm` is vbool<N>_t with N = element width / LMUL of the *source* vs2 (e.g.
// vbool64_t for f16mf4, vbool4_t for f32m8); vd, vs1 and the result are the
// LMUL=1 vector of twice the source element width.
vfloat32m1_t __riscv_vfwredosum_tum(vbool64_t vm, vfloat32m1_t vd,
                                    vfloat16mf4_t vs2, vfloat32m1_t vs1,
                                    size_t vl);
vfloat32m1_t __riscv_vfwredosum_tum(vbool32_t vm, vfloat32m1_t vd,
                                    vfloat16mf2_t vs2, vfloat32m1_t vs1,
                                    size_t vl);
vfloat32m1_t __riscv_vfwredosum_tum(vbool16_t vm, vfloat32m1_t vd,
                                    vfloat16m1_t vs2, vfloat32m1_t vs1,
                                    size_t vl);
vfloat32m1_t __riscv_vfwredosum_tum(vbool8_t vm, vfloat32m1_t vd,
                                    vfloat16m2_t vs2, vfloat32m1_t vs1,
                                    size_t vl);
vfloat32m1_t __riscv_vfwredosum_tum(vbool4_t vm, vfloat32m1_t vd,
                                    vfloat16m4_t vs2, vfloat32m1_t vs1,
                                    size_t vl);
vfloat32m1_t __riscv_vfwredosum_tum(vbool2_t vm, vfloat32m1_t vd,
                                    vfloat16m8_t vs2, vfloat32m1_t vs1,
                                    size_t vl);
vfloat64m1_t __riscv_vfwredosum_tum(vbool64_t vm, vfloat64m1_t vd,
                                    vfloat32mf2_t vs2, vfloat64m1_t vs1,
                                    size_t vl);
vfloat64m1_t __riscv_vfwredosum_tum(vbool32_t vm, vfloat64m1_t vd,
                                    vfloat32m1_t vs2, vfloat64m1_t vs1,
                                    size_t vl);
vfloat64m1_t __riscv_vfwredosum_tum(vbool16_t vm, vfloat64m1_t vd,
                                    vfloat32m2_t vs2, vfloat64m1_t vs1,
                                    size_t vl);
vfloat64m1_t __riscv_vfwredosum_tum(vbool8_t vm, vfloat64m1_t vd,
                                    vfloat32m4_t vs2, vfloat64m1_t vs1,
                                    size_t vl);
vfloat64m1_t __riscv_vfwredosum_tum(vbool4_t vm, vfloat64m1_t vd,
                                    vfloat32m8_t vs2, vfloat64m1_t vs1,
                                    size_t vl);
// Masked __riscv_vfwredusum_tum overloads without a `frm` argument. The
// leading mask `vm` is vbool<N>_t with N = element width / LMUL of the
// *source* vs2 (e.g. vbool64_t for f16mf4, vbool4_t for f32m8); vd, vs1 and
// the result are the LMUL=1 vector of twice the source element width.
vfloat32m1_t __riscv_vfwredusum_tum(vbool64_t vm, vfloat32m1_t vd,
                                    vfloat16mf4_t vs2, vfloat32m1_t vs1,
                                    size_t vl);
vfloat32m1_t __riscv_vfwredusum_tum(vbool32_t vm, vfloat32m1_t vd,
                                    vfloat16mf2_t vs2, vfloat32m1_t vs1,
                                    size_t vl);
vfloat32m1_t __riscv_vfwredusum_tum(vbool16_t vm, vfloat32m1_t vd,
                                    vfloat16m1_t vs2, vfloat32m1_t vs1,
                                    size_t vl);
vfloat32m1_t __riscv_vfwredusum_tum(vbool8_t vm, vfloat32m1_t vd,
                                    vfloat16m2_t vs2, vfloat32m1_t vs1,
                                    size_t vl);
vfloat32m1_t __riscv_vfwredusum_tum(vbool4_t vm, vfloat32m1_t vd,
                                    vfloat16m4_t vs2, vfloat32m1_t vs1,
                                    size_t vl);
vfloat32m1_t __riscv_vfwredusum_tum(vbool2_t vm, vfloat32m1_t vd,
                                    vfloat16m8_t vs2, vfloat32m1_t vs1,
                                    size_t vl);
vfloat64m1_t __riscv_vfwredusum_tum(vbool64_t vm, vfloat64m1_t vd,
                                    vfloat32mf2_t vs2, vfloat64m1_t vs1,
                                    size_t vl);
vfloat64m1_t __riscv_vfwredusum_tum(vbool32_t vm, vfloat64m1_t vd,
                                    vfloat32m1_t vs2, vfloat64m1_t vs1,
                                    size_t vl);
vfloat64m1_t __riscv_vfwredusum_tum(vbool16_t vm, vfloat64m1_t vd,
                                    vfloat32m2_t vs2, vfloat64m1_t vs1,
                                    size_t vl);
vfloat64m1_t __riscv_vfwredusum_tum(vbool8_t vm, vfloat64m1_t vd,
                                    vfloat32m4_t vs2, vfloat64m1_t vs1,
                                    size_t vl);
vfloat64m1_t __riscv_vfwredusum_tum(vbool4_t vm, vfloat64m1_t vd,
                                    vfloat32m8_t vs2, vfloat64m1_t vs1,
                                    size_t vl);
// Unmasked (no `vm` parameter) __riscv_vfwredosum_tu overloads that add an
// explicit `unsigned int frm` argument just before `vl`; the vector parameter
// types match the frm-less overloads of the same name (f16 mf4..m8 -> f32m1,
// f32 mf2..m8 -> f64m1).
// NOTE(review): `frm` is presumably the floating-point rounding mode --
// confirm the accepted values against the RVV intrinsics specification.
vfloat32m1_t __riscv_vfwredosum_tu(vfloat32m1_t vd, vfloat16mf4_t vs2,
                                   vfloat32m1_t vs1, unsigned int frm,
                                   size_t vl);
vfloat32m1_t __riscv_vfwredosum_tu(vfloat32m1_t vd, vfloat16mf2_t vs2,
                                   vfloat32m1_t vs1, unsigned int frm,
                                   size_t vl);
vfloat32m1_t __riscv_vfwredosum_tu(vfloat32m1_t vd, vfloat16m1_t vs2,
                                   vfloat32m1_t vs1, unsigned int frm,
                                   size_t vl);
vfloat32m1_t __riscv_vfwredosum_tu(vfloat32m1_t vd, vfloat16m2_t vs2,
                                   vfloat32m1_t vs1, unsigned int frm,
                                   size_t vl);
vfloat32m1_t __riscv_vfwredosum_tu(vfloat32m1_t vd, vfloat16m4_t vs2,
                                   vfloat32m1_t vs1, unsigned int frm,
                                   size_t vl);
vfloat32m1_t __riscv_vfwredosum_tu(vfloat32m1_t vd, vfloat16m8_t vs2,
                                   vfloat32m1_t vs1, unsigned int frm,
                                   size_t vl);
vfloat64m1_t __riscv_vfwredosum_tu(vfloat64m1_t vd, vfloat32mf2_t vs2,
                                   vfloat64m1_t vs1, unsigned int frm,
                                   size_t vl);
vfloat64m1_t __riscv_vfwredosum_tu(vfloat64m1_t vd, vfloat32m1_t vs2,
                                   vfloat64m1_t vs1, unsigned int frm,
                                   size_t vl);
vfloat64m1_t __riscv_vfwredosum_tu(vfloat64m1_t vd, vfloat32m2_t vs2,
                                   vfloat64m1_t vs1, unsigned int frm,
                                   size_t vl);
vfloat64m1_t __riscv_vfwredosum_tu(vfloat64m1_t vd, vfloat32m4_t vs2,
                                   vfloat64m1_t vs1, unsigned int frm,
                                   size_t vl);
vfloat64m1_t __riscv_vfwredosum_tu(vfloat64m1_t vd, vfloat32m8_t vs2,
                                   vfloat64m1_t vs1, unsigned int frm,
                                   size_t vl);
// Unmasked (no `vm` parameter) __riscv_vfwredusum_tu overloads that add an
// explicit `unsigned int frm` argument just before `vl`; the vector parameter
// types match the frm-less overloads of the same name (f16 mf4..m8 -> f32m1,
// f32 mf2..m8 -> f64m1).
// NOTE(review): `frm` is presumably the floating-point rounding mode --
// confirm the accepted values against the RVV intrinsics specification.
vfloat32m1_t __riscv_vfwredusum_tu(vfloat32m1_t vd, vfloat16mf4_t vs2,
                                   vfloat32m1_t vs1, unsigned int frm,
                                   size_t vl);
vfloat32m1_t __riscv_vfwredusum_tu(vfloat32m1_t vd, vfloat16mf2_t vs2,
                                   vfloat32m1_t vs1, unsigned int frm,
                                   size_t vl);
vfloat32m1_t __riscv_vfwredusum_tu(vfloat32m1_t vd, vfloat16m1_t vs2,
                                   vfloat32m1_t vs1, unsigned int frm,
                                   size_t vl);
vfloat32m1_t __riscv_vfwredusum_tu(vfloat32m1_t vd, vfloat16m2_t vs2,
                                   vfloat32m1_t vs1, unsigned int frm,
                                   size_t vl);
vfloat32m1_t __riscv_vfwredusum_tu(vfloat32m1_t vd, vfloat16m4_t vs2,
                                   vfloat32m1_t vs1, unsigned int frm,
                                   size_t vl);
vfloat32m1_t __riscv_vfwredusum_tu(vfloat32m1_t vd, vfloat16m8_t vs2,
                                   vfloat32m1_t vs1, unsigned int frm,
                                   size_t vl);
vfloat64m1_t __riscv_vfwredusum_tu(vfloat64m1_t vd, vfloat32mf2_t vs2,
                                   vfloat64m1_t vs1, unsigned int frm,
                                   size_t vl);
vfloat64m1_t __riscv_vfwredusum_tu(vfloat64m1_t vd, vfloat32m1_t vs2,
                                   vfloat64m1_t vs1, unsigned int frm,
                                   size_t vl);
vfloat64m1_t __riscv_vfwredusum_tu(vfloat64m1_t vd, vfloat32m2_t vs2,
                                   vfloat64m1_t vs1, unsigned int frm,
                                   size_t vl);
vfloat64m1_t __riscv_vfwredusum_tu(vfloat64m1_t vd, vfloat32m4_t vs2,
                                   vfloat64m1_t vs1, unsigned int frm,
                                   size_t vl);
vfloat64m1_t __riscv_vfwredusum_tu(vfloat64m1_t vd, vfloat32m8_t vs2,
                                   vfloat64m1_t vs1, unsigned int frm,
                                   size_t vl);
// masked functions
// __riscv_vfwredosum_tum overloads with an explicit `unsigned int frm`
// argument (between vs1 and vl). The leading mask `vm` is vbool<N>_t with
// N = element width / LMUL of the *source* vs2; vd, vs1 and the result are
// the LMUL=1 vector of twice the source element width.
// NOTE(review): `frm` is presumably the floating-point rounding mode --
// confirm the accepted values against the RVV intrinsics specification.
vfloat32m1_t __riscv_vfwredosum_tum(vbool64_t vm, vfloat32m1_t vd,
                                    vfloat16mf4_t vs2, vfloat32m1_t vs1,
                                    unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwredosum_tum(vbool32_t vm, vfloat32m1_t vd,
                                    vfloat16mf2_t vs2, vfloat32m1_t vs1,
                                    unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwredosum_tum(vbool16_t vm, vfloat32m1_t vd,
                                    vfloat16m1_t vs2, vfloat32m1_t vs1,
                                    unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwredosum_tum(vbool8_t vm, vfloat32m1_t vd,
                                    vfloat16m2_t vs2, vfloat32m1_t vs1,
                                    unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwredosum_tum(vbool4_t vm, vfloat32m1_t vd,
                                    vfloat16m4_t vs2, vfloat32m1_t vs1,
                                    unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwredosum_tum(vbool2_t vm, vfloat32m1_t vd,
                                    vfloat16m8_t vs2, vfloat32m1_t vs1,
                                    unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwredosum_tum(vbool64_t vm, vfloat64m1_t vd,
                                    vfloat32mf2_t vs2, vfloat64m1_t vs1,
                                    unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwredosum_tum(vbool32_t vm, vfloat64m1_t vd,
                                    vfloat32m1_t vs2, vfloat64m1_t vs1,
                                    unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwredosum_tum(vbool16_t vm, vfloat64m1_t vd,
                                    vfloat32m2_t vs2, vfloat64m1_t vs1,
                                    unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwredosum_tum(vbool8_t vm, vfloat64m1_t vd,
                                    vfloat32m4_t vs2, vfloat64m1_t vs1,
                                    unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwredosum_tum(vbool4_t vm, vfloat64m1_t vd,
                                    vfloat32m8_t vs2, vfloat64m1_t vs1,
                                    unsigned int frm, size_t vl);
// Masked __riscv_vfwredusum_tum overloads with an explicit `unsigned int frm`
// argument (between vs1 and vl). The leading mask `vm` is vbool<N>_t with
// N = element width / LMUL of the *source* vs2; vd, vs1 and the result are
// the LMUL=1 vector of twice the source element width.
// NOTE(review): `frm` is presumably the floating-point rounding mode --
// confirm the accepted values against the RVV intrinsics specification.
vfloat32m1_t __riscv_vfwredusum_tum(vbool64_t vm, vfloat32m1_t vd,
                                    vfloat16mf4_t vs2, vfloat32m1_t vs1,
                                    unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwredusum_tum(vbool32_t vm, vfloat32m1_t vd,
                                    vfloat16mf2_t vs2, vfloat32m1_t vs1,
                                    unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwredusum_tum(vbool16_t vm, vfloat32m1_t vd,
                                    vfloat16m1_t vs2, vfloat32m1_t vs1,
                                    unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwredusum_tum(vbool8_t vm, vfloat32m1_t vd,
                                    vfloat16m2_t vs2, vfloat32m1_t vs1,
                                    unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwredusum_tum(vbool4_t vm, vfloat32m1_t vd,
                                    vfloat16m4_t vs2, vfloat32m1_t vs1,
                                    unsigned int frm, size_t vl);
vfloat32m1_t __riscv_vfwredusum_tum(vbool2_t vm, vfloat32m1_t vd,
                                    vfloat16m8_t vs2, vfloat32m1_t vs1,
                                    unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwredusum_tum(vbool64_t vm, vfloat64m1_t vd,
                                    vfloat32mf2_t vs2, vfloat64m1_t vs1,
                                    unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwredusum_tum(vbool32_t vm, vfloat64m1_t vd,
                                    vfloat32m1_t vs2, vfloat64m1_t vs1,
                                    unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwredusum_tum(vbool16_t vm, vfloat64m1_t vd,
                                    vfloat32m2_t vs2, vfloat64m1_t vs1,
                                    unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwredusum_tum(vbool8_t vm, vfloat64m1_t vd,
                                    vfloat32m4_t vs2, vfloat64m1_t vs1,
                                    unsigned int frm, size_t vl);
vfloat64m1_t __riscv_vfwredusum_tum(vbool4_t vm, vfloat64m1_t vd,
                                    vfloat32m8_t vs2, vfloat64m1_t vs1,
                                    unsigned int frm, size_t vl);