}
};
+/* Implements Andes vdot. */
+template<rtx_code EXTEND>
+class nds_vd4dot : public function_base
+{
+public:
+ bool has_merge_operand_p () const override { return false; }
+
+ rtx expand (function_expander &e) const override
+ {
+ return e.use_widen_ternop_insn
+ (code_for_pred_nds_vd4dot (EXTEND, e.vector_mode ()));
+ }
+};
+
+/* Implements vwmacc<su><su>. */
+class nds_vd4dotsu : public function_base
+{
+public:
+ bool has_merge_operand_p () const override { return false; }
+
+ rtx expand (function_expander &e) const override
+ {
+ return e.use_widen_ternop_insn
+ (code_for_pred_nds_vd4dotsu (e.vector_mode ()));
+ }
+};
+
static CONSTEXPR const nds_vfwcvtbf16_f nds_vfwcvt_s_obj;
static CONSTEXPR const nds_vfncvtbf16_f<NO_FRM> nds_vfncvt_bf16_obj;
static CONSTEXPR const nds_vfncvtbf16_f<HAS_FRM> nds_vfncvt_bf16_frm_obj;
static CONSTEXPR const nds_vfpmad <UNSPEC_NDS_VFPMADB, NO_FRM> nds_vfpmadb_obj;
static CONSTEXPR const nds_vfpmad <UNSPEC_NDS_VFPMADT, HAS_FRM> nds_vfpmadt_frm_obj;
static CONSTEXPR const nds_vfpmad <UNSPEC_NDS_VFPMADB, HAS_FRM> nds_vfpmadb_frm_obj;
+static CONSTEXPR const nds_vd4dot<SIGN_EXTEND> nds_vd4dots_obj;
+static CONSTEXPR const nds_vd4dot<ZERO_EXTEND> nds_vd4dotu_obj;
+static CONSTEXPR const nds_vd4dotsu nds_vd4dotsu_obj;
/* Declare the function base NAME, pointing it to an instance
of class <NAME>_obj. */
BASE (nds_vfpmadb)
BASE (nds_vfpmadt_frm)
BASE (nds_vfpmadb_frm)
+BASE (nds_vd4dots)
+BASE (nds_vd4dotu)
+BASE (nds_vd4dotsu)
} // end namespace riscv_vector
extern const function_base *const nds_vfpmadb;
extern const function_base *const nds_vfpmadt_frm;
extern const function_base *const nds_vfpmadb_frm;
+extern const function_base *const nds_vd4dots;
+extern const function_base *const nds_vd4dotu;
+extern const function_base *const nds_vd4dotsu;
}
} // end namespace riscv_vector
DEF_RVV_FUNCTION (nds_vfpmadb_frm, alu_frm, full_preds, f16_vvw_ops)
#undef REQUIRED_EXTENSIONS
+/* Andes Vector Dot Product Extension (XAndesVDot). */
+#define REQUIRED_EXTENSIONS XANDESVDOT_EXT
+DEF_RVV_FUNCTION (nds_vd4dots, alu, full_preds, qexti_vvvv_ops)
+DEF_RVV_FUNCTION (nds_vd4dotsu, alu, full_preds, qexti_su_vvvv_ops)
+DEF_RVV_FUNCTION (nds_vd4dotu, alu, full_preds, qextu_vvvv_ops)
+#undef REQUIRED_EXTENSIONS
+
#undef DEF_RVV_FUNCTION
UNSPEC_NDS_INTLOAD
UNSPEC_NDS_VFPMADT
UNSPEC_NDS_VFPMADB
+ UNSPEC_NDS_VD4DOT
])
(define_int_iterator NDS_VFPMAD [UNSPEC_NDS_VFPMADT UNSPEC_NDS_VFPMADB])
(set_attr "enabled" "yes")
(set (attr "frm_mode")
(symbol_ref "riscv_vector::get_frm_mode (operands[9])"))])
+
+;; Vector Dot Product Extension
+
+(define_insn "@pred_nds_vd4dot<su><mode>"
+ [(set (match_operand:VQEXTI 0 "register_operand" "=&vr")
+ (if_then_else:VQEXTI
+ (unspec:<VM>
+ [(match_operand:<VM> 1 "vector_mask_operand" "vmWc1")
+ (match_operand 5 "vector_length_operand" " rK")
+ (match_operand 6 "const_int_operand" " i")
+ (match_operand 7 "const_int_operand" " i")
+ (match_operand 8 "const_int_operand" " i")
+ (reg:SI VL_REGNUM)
+ (reg:SI VTYPE_REGNUM)] UNSPEC_VPREDICATE)
+ (unspec:VQEXTI
+ [(any_extend:VQEXTI
+ (match_operand:<NDS_QUAD_FIX> 3 "register_operand" " vr"))
+ (any_extend:VQEXTI
+ (match_operand:<NDS_QUAD_FIX> 4 "register_operand" " vr"))
+ (any_extend:VQEXTI
+ (match_operand:VQEXTI 2 "register_operand" " 0"))]
+ UNSPEC_NDS_VD4DOT)
+ (match_dup 2)))]
+ "TARGET_VECTOR && TARGET_XANDESVDOT"
+ "nds.vd4dot<su>.vv\t%0,%3,%4%p1"
+ [(set_attr "type" "viwmuladd")
+ (set_attr "mode" "<MODE>")])
+
+(define_insn "@pred_nds_vd4dotsu<mode>"
+ [(set (match_operand:VQEXTI 0 "register_operand" "=&vr")
+ (if_then_else:VQEXTI
+ (unspec:<VM>
+ [(match_operand:<VM> 1 "vector_mask_operand" "vmWc1")
+ (match_operand 5 "vector_length_operand" " rK")
+ (match_operand 6 "const_int_operand" " i")
+ (match_operand 7 "const_int_operand" " i")
+ (match_operand 8 "const_int_operand" " i")
+ (reg:SI VL_REGNUM)
+ (reg:SI VTYPE_REGNUM)] UNSPEC_VPREDICATE)
+ (unspec:VQEXTI
+ [(sign_extend:VQEXTI
+ (match_operand:<NDS_QUAD_FIX> 3 "register_operand" " vr"))
+ (zero_extend:VQEXTI
+ (match_operand:<NDS_QUAD_FIX> 4 "register_operand" " vr"))
+ (sign_extend:VQEXTI
+ (match_operand:VQEXTI 2 "register_operand" " 0"))]
+ UNSPEC_NDS_VD4DOT)
+ (match_dup 2)))]
+ "TARGET_VECTOR && TARGET_XANDESVDOT"
+ "nds.vd4dotsu.vv\t%0,%3,%4%p1"
+ [(set_attr "type" "viwmuladd")
+ (set_attr "mode" "<MODE>")])
fprintf (fp, " /*QUAD_EMUL_UNSIGNED*/ %s,\n",
inttype (8, lmul_log2 - 1, true).c_str ());
fprintf (fp, " /*QUAD_FIX*/ %s,\n",
- inttype (8, lmul_log2, unsigned_p).c_str ());
+ inttype (sew / 4, lmul_log2, unsigned_p).c_str ());
fprintf (fp, " /*QUAD_FIX_SIGNED*/ %s,\n",
- inttype (8, lmul_log2, false).c_str ());
+ inttype (sew / 4, lmul_log2, false).c_str ());
fprintf (fp, " /*QUAD_FIX_UNSIGNED*/ %s,\n",
- inttype (8, lmul_log2, true).c_str ());
+ inttype (sew / 4, lmul_log2, true).c_str ());
fprintf (fp, " /*OCT_TRUNC*/ %s,\n",
same_ratio_eew_type (sew, lmul_log2, sew / 8, unsigned_p,
false)
= {rvv_arg_type_info (RVV_BASE_vector), rvv_arg_type_info (RVV_BASE_vector),
rvv_arg_type_info (RVV_BASE_vector), rvv_arg_type_info_end};
+/* A list of args for vector_type func (vector_type, vector_type, vector_type)
+ * function. */
+static CONSTEXPR const rvv_arg_type_info vqq_args[]
+ = {rvv_arg_type_info (RVV_BASE_vector),
+ rvv_arg_type_info (RVV_BASE_quad_fixed_vector),
+ rvv_arg_type_info (RVV_BASE_quad_fixed_vector), rvv_arg_type_info_end};
+
+static CONSTEXPR const rvv_arg_type_info su_vqq_args[]
+ = {rvv_arg_type_info (RVV_BASE_vector),
+ rvv_arg_type_info (RVV_BASE_quad_fixed_vector),
+ rvv_arg_type_info (RVV_BASE_quad_fixed_unsigned_vector),
+ rvv_arg_type_info_end};
+
/* A list of args for vector_type func (vector_type, vector_type, vector_type)
* function. */
static CONSTEXPR const rvv_arg_type_info vxv_args[]
rvv_arg_type_info (RVV_BASE_vector), /* Return type */
vw_args /* Args */};
+static CONSTEXPR const rvv_op_info qexti_vvvv_ops
+ = {qexti_ops, /* Types */
+ OP_TYPE_vv, /* Suffix */
+ rvv_arg_type_info (RVV_BASE_vector), /* Return type */
+ vqq_args /* Args */};
+
+static CONSTEXPR const rvv_op_info qexti_su_vvvv_ops
+ = {qexti_ops, /* Types */
+ OP_TYPE_vv, /* Suffix */
+ rvv_arg_type_info (RVV_BASE_vector), /* Return type */
+ su_vqq_args /* Args */};
+
+static CONSTEXPR const rvv_op_info qextu_vvvv_ops
+ = {qextu_ops, /* Types */
+ OP_TYPE_vv, /* Suffix */
+ rvv_arg_type_info (RVV_BASE_vector), /* Return type */
+ vqq_args /* Args */};
+
/* A static operand information for vector_type func (vector_type).
Some insns just supports SEW=32, such as the crypto vector Zvkg extension.
* function registration. */
XANDESVBFHCVT_EXT, /* XANDESVBFHCVT extension */
XANDESVSINTLOAD_EXT, /* XANDESVSINTLOAD extension */
XANDESVPACKFPH_EXT, /* XANDESVPACKFPH extension */
+ XANDESVDOT_EXT, /* XANDESVDOT extension */
/* Please update below to isa_name func when add or remove enum type(s). */
};
return "xandesvsintload";
case XANDESVPACKFPH_EXT:
return "xandesvpackfph";
+ case XANDESVDOT_EXT:
+ return "xandesvdot";
default:
gcc_unreachable ();
}
return TARGET_XANDESVSINTLOAD;
case XANDESVPACKFPH_EXT:
return TARGET_XANDESVPACKFPH;
+ case XANDESVDOT_EXT:
+ return TARGET_XANDESVDOT;
default:
gcc_unreachable ();
}
RVVM8HF RVVM4HF RVVM2HF RVVM1HF RVVMF2HF
(RVVMF4HF "TARGET_MIN_VLEN > 32")
])
+
+(define_mode_attr NDS_QUAD_FIX [
+ (RVVM8SI "RVVM8QI") (RVVM4SI "RVVM4QI") (RVVM2SI "RVVM2QI")
+ (RVVM1SI "RVVM1QI") (RVVMF2SI "RVVMF2QI") (RVVM8DI "RVVM8HI")
+ (RVVM4DI "RVVM4HI") (RVVM2DI "RVVM2HI") (RVVM1DI "RVVM1HI")
+
+ (V1SI "V1QI") (V2SI "V2QI") (V4SI "V4QI") (V8SI "V8QI") (V16SI "V16QI")
+ (V32SI "V32QI") (V64SI "V64QI") (V128SI "V128QI") (V256SI "V256QI")
+ (V512SI "V512QI") (V1024SI "V1024QI")
+ (V1DI "V1HI") (V2DI "V2HI") (V4DI "V4HI") (V8DI "V8HI") (V16DI "V16HI")
+ (V32DI "V32HI") (V64DI "V64HI") (V128DI "V128HI") (V256DI "V256HI")
+ (V512DI "V512HI")
+])
--- /dev/null
+/* { dg-do compile } */
+/* { dg-options "-march=rv32gv_xandesvdot -O3 -mabi=ilp32" { target { rv32 } } } */
+/* { dg-options "-march=rv64gv_xandesvdot -O3 -mabi=lp64" { target { rv64 } } } */
+
+#include "andes_vector.h"
+
+vint32mf2_t
+test_nds_vd4dots_vv_i32mf2 (vint32mf2_t vd, vint8mf2_t vs1, vint8mf2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i32mf2(vd, vs1, vs2, vl);
+}
+
+vint32m1_t
+test_nds_vd4dots_vv_i32m1 (vint32m1_t vd, vint8m1_t vs1, vint8m1_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i32m1(vd, vs1, vs2, vl);
+}
+
+vint32m2_t
+test_nds_vd4dots_vv_i32m2 (vint32m2_t vd, vint8m2_t vs1, vint8m2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i32m2(vd, vs1, vs2, vl);
+}
+
+vint32m4_t
+test_nds_vd4dots_vv_i32m4 (vint32m4_t vd, vint8m4_t vs1, vint8m4_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i32m4(vd, vs1, vs2, vl);
+}
+
+vint32m8_t
+test_nds_vd4dots_vv_i32m8 (vint32m8_t vd, vint8m8_t vs1, vint8m8_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i32m8(vd, vs1, vs2, vl);
+}
+
+vint64m1_t
+test_nds_vd4dots_vv_i64m1 (vint64m1_t vd, vint16m1_t vs1, vint16m1_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i64m1(vd, vs1, vs2, vl);
+}
+
+vint64m2_t
+test_nds_vd4dots_vv_i64m2 (vint64m2_t vd, vint16m2_t vs1, vint16m2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i64m2(vd, vs1, vs2, vl);
+}
+
+vint64m4_t
+test_nds_vd4dots_vv_i64m4 (vint64m4_t vd, vint16m4_t vs1, vint16m4_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i64m4(vd, vs1, vs2, vl);
+}
+
+vint64m8_t
+test_nds_vd4dots_vv_i64m8 (vint64m8_t vd, vint16m8_t vs1, vint16m8_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i64m8(vd, vs1, vs2, vl);
+}
+
+vint32mf2_t
+test_nds_vd4dots_vv_i32mf2_m (vbool64_t vm, vint32mf2_t vd, vint8mf2_t vs1,
+ vint8mf2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i32mf2_m (vm, vd, vs1, vs2, vl);
+}
+
+vint32m1_t
+test_nds_vd4dots_vv_i32m1_m (vbool32_t vm, vint32m1_t vd, vint8m1_t vs1,
+ vint8m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i32m1_m (vm, vd, vs1, vs2, vl);
+}
+
+vint32m2_t
+test_nds_vd4dots_vv_i32m2_m (vbool16_t vm, vint32m2_t vd, vint8m2_t vs1,
+ vint8m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i32m2_m (vm, vd, vs1, vs2, vl);
+}
+
+vint32m4_t
+test_nds_vd4dots_vv_i32m4_m (vbool8_t vm, vint32m4_t vd, vint8m4_t vs1,
+ vint8m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i32m4_m (vm, vd, vs1, vs2, vl);
+}
+
+vint32m8_t
+test_nds_vd4dots_vv_i32m8_m (vbool4_t vm, vint32m8_t vd, vint8m8_t vs1,
+ vint8m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i32m8_m (vm, vd, vs1, vs2, vl);
+}
+
+vint64m1_t
+test_nds_vd4dots_vv_i64m1_m (vbool64_t vm, vint64m1_t vd, vint16m1_t vs1,
+ vint16m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i64m1_m (vm, vd, vs1, vs2, vl);
+}
+
+vint64m2_t
+test_nds_vd4dots_vv_i64m2_m (vbool32_t vm, vint64m2_t vd, vint16m2_t vs1,
+ vint16m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i64m2_m (vm, vd, vs1, vs2, vl);
+}
+
+vint64m4_t
+test_nds_vd4dots_vv_i64m4_m (vbool16_t vm, vint64m4_t vd, vint16m4_t vs1,
+ vint16m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i64m4_m (vm, vd, vs1, vs2, vl);
+}
+
+vint64m8_t
+test_nds_vd4dots_vv_i64m8_m (vbool8_t vm, vint64m8_t vd, vint16m8_t vs1,
+ vint16m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i64m8_m (vm, vd, vs1, vs2, vl);
+}
+/* { dg-final { scan-assembler-times {vseti?vli\s+[a-z0-9]+,\s*[a-z0-9]+,\s*e[0-9]+,\s*mf?[1248],\s*t[au],\s*m[au]\s+nds\.vd4dots[ivxfswum.]*\s+} 18 } } */
--- /dev/null
+/* { dg-do compile } */
+/* { dg-options "-march=rv32gv_xandesvdot -O3 -mabi=ilp32" { target { rv32 } } } */
+/* { dg-options "-march=rv64gv_xandesvdot -O3 -mabi=lp64" { target { rv64 } } } */
+
+#include "andes_vector.h"
+
+vint32mf2_t
+test_nds_vd4dotsu_vv_i32mf2 (vint32mf2_t vd, vint8mf2_t vs1, vuint8mf2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i32mf2(vd, vs1, vs2, vl);
+}
+
+vint32m1_t
+test_nds_vd4dotsu_vv_i32m1 (vint32m1_t vd, vint8m1_t vs1, vuint8m1_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i32m1(vd, vs1, vs2, vl);
+}
+
+vint32m2_t
+test_nds_vd4dotsu_vv_i32m2 (vint32m2_t vd, vint8m2_t vs1, vuint8m2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i32m2(vd, vs1, vs2, vl);
+}
+
+vint32m4_t
+test_nds_vd4dotsu_vv_i32m4 (vint32m4_t vd, vint8m4_t vs1, vuint8m4_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i32m4(vd, vs1, vs2, vl);
+}
+
+vint32m8_t
+test_nds_vd4dotsu_vv_i32m8 (vint32m8_t vd, vint8m8_t vs1, vuint8m8_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i32m8(vd, vs1, vs2, vl);
+}
+
+vint64m1_t
+test_nds_vd4dotsu_vv_i64m1 (vint64m1_t vd, vint16m1_t vs1, vuint16m1_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i64m1(vd, vs1, vs2, vl);
+}
+
+vint64m2_t
+test_nds_vd4dotsu_vv_i64m2 (vint64m2_t vd, vint16m2_t vs1, vuint16m2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i64m2(vd, vs1, vs2, vl);
+}
+
+vint64m4_t
+test_nds_vd4dotsu_vv_i64m4 (vint64m4_t vd, vint16m4_t vs1, vuint16m4_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i64m4(vd, vs1, vs2, vl);
+}
+
+vint64m8_t
+test_nds_vd4dotsu_vv_i64m8 (vint64m8_t vd, vint16m8_t vs1, vuint16m8_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i64m8(vd, vs1, vs2, vl);
+}
+
+vint32mf2_t
+test_nds_vd4dotsu_vv_i32mf2_m (vbool64_t vm, vint32mf2_t vd, vint8mf2_t vs1,
+ vuint8mf2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i32mf2_m (vm, vd, vs1, vs2, vl);
+}
+
+vint32m1_t
+test_nds_vd4dotsu_vv_i32m1_m (vbool32_t vm, vint32m1_t vd, vint8m1_t vs1,
+ vuint8m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i32m1_m (vm, vd, vs1, vs2, vl);
+}
+
+vint32m2_t
+test_nds_vd4dotsu_vv_i32m2_m (vbool16_t vm, vint32m2_t vd, vint8m2_t vs1,
+ vuint8m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i32m2_m (vm, vd, vs1, vs2, vl);
+}
+
+vint32m4_t
+test_nds_vd4dotsu_vv_i32m4_m (vbool8_t vm, vint32m4_t vd, vint8m4_t vs1,
+ vuint8m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i32m4_m (vm, vd, vs1, vs2, vl);
+}
+
+vint32m8_t
+test_nds_vd4dotsu_vv_i32m8_m (vbool4_t vm, vint32m8_t vd, vint8m8_t vs1,
+ vuint8m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i32m8_m (vm, vd, vs1, vs2, vl);
+}
+
+vint64m1_t
+test_nds_vd4dotsu_vv_i64m1_m (vbool64_t vm, vint64m1_t vd, vint16m1_t vs1,
+ vuint16m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i64m1_m (vm, vd, vs1, vs2, vl);
+}
+
+vint64m2_t
+test_nds_vd4dotsu_vv_i64m2_m (vbool32_t vm, vint64m2_t vd, vint16m2_t vs1,
+ vuint16m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i64m2_m (vm, vd, vs1, vs2, vl);
+}
+
+vint64m4_t
+test_nds_vd4dotsu_vv_i64m4_m (vbool16_t vm, vint64m4_t vd, vint16m4_t vs1,
+ vuint16m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i64m4_m (vm, vd, vs1, vs2, vl);
+}
+
+vint64m8_t
+test_nds_vd4dotsu_vv_i64m8_m (vbool8_t vm, vint64m8_t vd, vint16m8_t vs1,
+ vuint16m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i64m8_m (vm, vd, vs1, vs2, vl);
+}
+/* { dg-final { scan-assembler-times {vseti?vli\s+[a-z0-9]+,\s*[a-z0-9]+,\s*e[0-9]+,\s*mf?[1248],\s*t[au],\s*m[au]\s+nds\.vd4dotsu[ivxfswum.]*\s+} 18 } } */
--- /dev/null
+/* { dg-do compile } */
+/* { dg-options "-march=rv32gv_xandesvdot -O3 -mabi=ilp32" { target { rv32 } } } */
+/* { dg-options "-march=rv64gv_xandesvdot -O3 -mabi=lp64" { target { rv64 } } } */
+
+#include "andes_vector.h"
+
+vuint32mf2_t
+test_nds_vd4dotu_vv_u32mf2 (vuint32mf2_t vd, vuint8mf2_t vs1, vuint8mf2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u32mf2(vd, vs1, vs2, vl);
+}
+
+vuint32m1_t
+test_nds_vd4dotu_vv_u32m1 (vuint32m1_t vd, vuint8m1_t vs1, vuint8m1_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u32m1(vd, vs1, vs2, vl);
+}
+
+vuint32m2_t
+test_nds_vd4dotu_vv_u32m2 (vuint32m2_t vd, vuint8m2_t vs1, vuint8m2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u32m2(vd, vs1, vs2, vl);
+}
+
+vuint32m4_t
+test_nds_vd4dotu_vv_u32m4 (vuint32m4_t vd, vuint8m4_t vs1, vuint8m4_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u32m4(vd, vs1, vs2, vl);
+}
+
+vuint32m8_t
+test_nds_vd4dotu_vv_u32m8 (vuint32m8_t vd, vuint8m8_t vs1, vuint8m8_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u32m8(vd, vs1, vs2, vl);
+}
+
+vuint64m1_t
+test_nds_vd4dotu_vv_u64m1 (vuint64m1_t vd, vuint16m1_t vs1, vuint16m1_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u64m1(vd, vs1, vs2, vl);
+}
+
+vuint64m2_t
+test_nds_vd4dotu_vv_u64m2 (vuint64m2_t vd, vuint16m2_t vs1, vuint16m2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u64m2(vd, vs1, vs2, vl);
+}
+
+vuint64m4_t
+test_nds_vd4dotu_vv_u64m4 (vuint64m4_t vd, vuint16m4_t vs1, vuint16m4_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u64m4(vd, vs1, vs2, vl);
+}
+
+vuint64m8_t
+test_nds_vd4dotu_vv_u64m8 (vuint64m8_t vd, vuint16m8_t vs1, vuint16m8_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u64m8(vd, vs1, vs2, vl);
+}
+
+vuint32mf2_t
+test_nds_vd4dotu_vv_u32mf2_m (vbool64_t vm, vuint32mf2_t vd, vuint8mf2_t vs1,
+ vuint8mf2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u32mf2_m (vm, vd, vs1, vs2, vl);
+}
+
+vuint32m1_t
+test_nds_vd4dotu_vv_u32m1_m (vbool32_t vm, vuint32m1_t vd, vuint8m1_t vs1,
+ vuint8m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u32m1_m (vm, vd, vs1, vs2, vl);
+}
+
+vuint32m2_t
+test_nds_vd4dotu_vv_u32m2_m (vbool16_t vm, vuint32m2_t vd, vuint8m2_t vs1,
+ vuint8m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u32m2_m (vm, vd, vs1, vs2, vl);
+}
+
+vuint32m4_t
+test_nds_vd4dotu_vv_u32m4_m (vbool8_t vm, vuint32m4_t vd, vuint8m4_t vs1,
+ vuint8m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u32m4_m (vm, vd, vs1, vs2, vl);
+}
+
+vuint32m8_t
+test_nds_vd4dotu_vv_u32m8_m (vbool4_t vm, vuint32m8_t vd, vuint8m8_t vs1,
+ vuint8m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u32m8_m (vm, vd, vs1, vs2, vl);
+}
+
+vuint64m1_t
+test_nds_vd4dotu_vv_u64m1_m (vbool64_t vm, vuint64m1_t vd, vuint16m1_t vs1,
+ vuint16m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u64m1_m (vm, vd, vs1, vs2, vl);
+}
+
+vuint64m2_t
+test_nds_vd4dotu_vv_u64m2_m (vbool32_t vm, vuint64m2_t vd, vuint16m2_t vs1,
+ vuint16m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u64m2_m (vm, vd, vs1, vs2, vl);
+}
+
+vuint64m4_t
+test_nds_vd4dotu_vv_u64m4_m (vbool16_t vm, vuint64m4_t vd, vuint16m4_t vs1,
+ vuint16m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u64m4_m (vm, vd, vs1, vs2, vl);
+}
+
+vuint64m8_t
+test_nds_vd4dotu_vv_u64m8_m (vbool8_t vm, vuint64m8_t vd, vuint16m8_t vs1,
+ vuint16m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u64m8_m (vm, vd, vs1, vs2, vl);
+}
+/* { dg-final { scan-assembler-times {vseti?vli\s+[a-z0-9]+,\s*[a-z0-9]+,\s*e[0-9]+,\s*mf?[1248],\s*t[au],\s*m[au]\s+nds\.vd4dotu[ivxfswum.]*\s+} 18 } } */
--- /dev/null
+/* { dg-do compile } */
+/* { dg-options "-march=rv32gv_xandesvdot -O3 -mabi=ilp32" { target { rv32 } } } */
+/* { dg-options "-march=rv64gv_xandesvdot -O3 -mabi=lp64" { target { rv64 } } } */
+
+#include "andes_vector.h"
+
+vint32mf2_t
+test_nds_vd4dots_vv_i32mf2 (vint32mf2_t vd, vint8mf2_t vs1, vint8mf2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots(vd, vs1, vs2, vl);
+}
+
+vint32m1_t
+test_nds_vd4dots_vv_i32m1 (vint32m1_t vd, vint8m1_t vs1, vint8m1_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots(vd, vs1, vs2, vl);
+}
+
+vint32m2_t
+test_nds_vd4dots_vv_i32m2 (vint32m2_t vd, vint8m2_t vs1, vint8m2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots(vd, vs1, vs2, vl);
+}
+
+vint32m4_t
+test_nds_vd4dots_vv_i32m4 (vint32m4_t vd, vint8m4_t vs1, vint8m4_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots(vd, vs1, vs2, vl);
+}
+
+vint32m8_t
+test_nds_vd4dots_vv_i32m8 (vint32m8_t vd, vint8m8_t vs1, vint8m8_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots(vd, vs1, vs2, vl);
+}
+
+vint64m1_t
+test_nds_vd4dots_vv_i64m1 (vint64m1_t vd, vint16m1_t vs1, vint16m1_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots(vd, vs1, vs2, vl);
+}
+
+vint64m2_t
+test_nds_vd4dots_vv_i64m2 (vint64m2_t vd, vint16m2_t vs1, vint16m2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots(vd, vs1, vs2, vl);
+}
+
+vint64m4_t
+test_nds_vd4dots_vv_i64m4 (vint64m4_t vd, vint16m4_t vs1, vint16m4_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots(vd, vs1, vs2, vl);
+}
+
+vint64m8_t
+test_nds_vd4dots_vv_i64m8 (vint64m8_t vd, vint16m8_t vs1, vint16m8_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots(vd, vs1, vs2, vl);
+}
+
+vint32mf2_t
+test_nds_vd4dots_vv_i32mf2_m (vbool64_t vm, vint32mf2_t vd, vint8mf2_t vs1,
+ vint8mf2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots (vm, vd, vs1, vs2, vl);
+}
+
+vint32m1_t
+test_nds_vd4dots_vv_i32m1_m (vbool32_t vm, vint32m1_t vd, vint8m1_t vs1,
+ vint8m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots (vm, vd, vs1, vs2, vl);
+}
+
+vint32m2_t
+test_nds_vd4dots_vv_i32m2_m (vbool16_t vm, vint32m2_t vd, vint8m2_t vs1,
+ vint8m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots (vm, vd, vs1, vs2, vl);
+}
+
+vint32m4_t
+test_nds_vd4dots_vv_i32m4_m (vbool8_t vm, vint32m4_t vd, vint8m4_t vs1,
+ vint8m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots (vm, vd, vs1, vs2, vl);
+}
+
+vint32m8_t
+test_nds_vd4dots_vv_i32m8_m (vbool4_t vm, vint32m8_t vd, vint8m8_t vs1,
+ vint8m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots (vm, vd, vs1, vs2, vl);
+}
+
+vint64m1_t
+test_nds_vd4dots_vv_i64m1_m (vbool64_t vm, vint64m1_t vd, vint16m1_t vs1,
+ vint16m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots (vm, vd, vs1, vs2, vl);
+}
+
+vint64m2_t
+test_nds_vd4dots_vv_i64m2_m (vbool32_t vm, vint64m2_t vd, vint16m2_t vs1,
+ vint16m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots (vm, vd, vs1, vs2, vl);
+}
+
+vint64m4_t
+test_nds_vd4dots_vv_i64m4_m (vbool16_t vm, vint64m4_t vd, vint16m4_t vs1,
+ vint16m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots (vm, vd, vs1, vs2, vl);
+}
+
+vint64m8_t
+test_nds_vd4dots_vv_i64m8_m (vbool8_t vm, vint64m8_t vd, vint16m8_t vs1,
+ vint16m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots (vm, vd, vs1, vs2, vl);
+}
+/* { dg-final { scan-assembler-times {vseti?vli\s+[a-z0-9]+,\s*[a-z0-9]+,\s*e[0-9]+,\s*mf?[1248],\s*t[au],\s*m[au]\s+nds\.vd4dots[ivxfswum.]*\s+} 18 } } */
--- /dev/null
+/* { dg-do compile } */
+/* { dg-options "-march=rv32gv_xandesvdot -O3 -mabi=ilp32" { target { rv32 } } } */
+/* { dg-options "-march=rv64gv_xandesvdot -O3 -mabi=lp64" { target { rv64 } } } */
+
+#include "andes_vector.h"
+
+vint32mf2_t
+test_nds_vd4dotsu_vv_i32mf2 (vint32mf2_t vd, vint8mf2_t vs1, vuint8mf2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu(vd, vs1, vs2, vl);
+}
+
+vint32m1_t
+test_nds_vd4dotsu_vv_i32m1 (vint32m1_t vd, vint8m1_t vs1, vuint8m1_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu(vd, vs1, vs2, vl);
+}
+
+vint32m2_t
+test_nds_vd4dotsu_vv_i32m2 (vint32m2_t vd, vint8m2_t vs1, vuint8m2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu(vd, vs1, vs2, vl);
+}
+
+vint32m4_t
+test_nds_vd4dotsu_vv_i32m4 (vint32m4_t vd, vint8m4_t vs1, vuint8m4_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu(vd, vs1, vs2, vl);
+}
+
+vint32m8_t
+test_nds_vd4dotsu_vv_i32m8 (vint32m8_t vd, vint8m8_t vs1, vuint8m8_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu(vd, vs1, vs2, vl);
+}
+
+vint64m1_t
+test_nds_vd4dotsu_vv_i64m1 (vint64m1_t vd, vint16m1_t vs1, vuint16m1_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu(vd, vs1, vs2, vl);
+}
+
+vint64m2_t
+test_nds_vd4dotsu_vv_i64m2 (vint64m2_t vd, vint16m2_t vs1, vuint16m2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu(vd, vs1, vs2, vl);
+}
+
+vint64m4_t
+test_nds_vd4dotsu_vv_i64m4 (vint64m4_t vd, vint16m4_t vs1, vuint16m4_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu(vd, vs1, vs2, vl);
+}
+
+vint64m8_t
+test_nds_vd4dotsu_vv_i64m8 (vint64m8_t vd, vint16m8_t vs1, vuint16m8_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu(vd, vs1, vs2, vl);
+}
+
+vint32mf2_t
+test_nds_vd4dotsu_vv_i32mf2_m (vbool64_t vm, vint32mf2_t vd, vint8mf2_t vs1,
+ vuint8mf2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m1_t
+test_nds_vd4dotsu_vv_i32m1_m (vbool32_t vm, vint32m1_t vd, vint8m1_t vs1,
+ vuint8m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m2_t
+test_nds_vd4dotsu_vv_i32m2_m (vbool16_t vm, vint32m2_t vd, vint8m2_t vs1,
+ vuint8m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m4_t
+test_nds_vd4dotsu_vv_i32m4_m (vbool8_t vm, vint32m4_t vd, vint8m4_t vs1,
+ vuint8m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m8_t
+test_nds_vd4dotsu_vv_i32m8_m (vbool4_t vm, vint32m8_t vd, vint8m8_t vs1,
+ vuint8m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m1_t
+test_nds_vd4dotsu_vv_i64m1_m (vbool64_t vm, vint64m1_t vd, vint16m1_t vs1,
+ vuint16m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m2_t
+test_nds_vd4dotsu_vv_i64m2_m (vbool32_t vm, vint64m2_t vd, vint16m2_t vs1,
+ vuint16m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m4_t
+test_nds_vd4dotsu_vv_i64m4_m (vbool16_t vm, vint64m4_t vd, vint16m4_t vs1,
+ vuint16m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m8_t
+test_nds_vd4dotsu_vv_i64m8_m (vbool8_t vm, vint64m8_t vd, vint16m8_t vs1,
+ vuint16m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu (vm, vd, vs1, vs2, vl);
+}
+/* { dg-final { scan-assembler-times {vseti?vli\s+[a-z0-9]+,\s*[a-z0-9]+,\s*e[0-9]+,\s*mf?[1248],\s*t[au],\s*m[au]\s+nds\.vd4dotsu[ivxfswum.]*\s+} 18 } } */
--- /dev/null
+/* { dg-do compile } */
+/* { dg-options "-march=rv32gv_xandesvdot -O3 -mabi=ilp32" { target { rv32 } } } */
+/* { dg-options "-march=rv64gv_xandesvdot -O3 -mabi=lp64" { target { rv64 } } } */
+
+#include "andes_vector.h"
+
+vuint32mf2_t
+test_vd4dotu_vv_u32mf2 (vuint32mf2_t vd, vuint8mf2_t vs1, vuint8mf2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu (vd, vs1, vs2, vl);
+}
+
+vuint32m1_t
+test_vd4dotu_vv_u32m1 (vuint32m1_t vd, vuint8m1_t vs1, vuint8m1_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu (vd, vs1, vs2, vl);
+}
+
+vuint32m2_t
+test_vd4dotu_vv_u32m2 (vuint32m2_t vd, vuint8m2_t vs1, vuint8m2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu (vd, vs1, vs2, vl);
+}
+
+vuint32m4_t
+test_vd4dotu_vv_u32m4 (vuint32m4_t vd, vuint8m4_t vs1, vuint8m4_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu (vd, vs1, vs2, vl);
+}
+
+vuint32m8_t
+test_vd4dotu_vv_u32m8 (vuint32m8_t vd, vuint8m8_t vs1, vuint8m8_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu (vd, vs1, vs2, vl);
+}
+
+vuint64m1_t
+test_vd4dotu_vv_u64m1 (vuint64m1_t vd, vuint16m1_t vs1, vuint16m1_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu (vd, vs1, vs2, vl);
+}
+
+vuint64m2_t
+test_vd4dotu_vv_u64m2 (vuint64m2_t vd, vuint16m2_t vs1, vuint16m2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu (vd, vs1, vs2, vl);
+}
+
+vuint64m4_t
+test_vd4dotu_vv_u64m4 (vuint64m4_t vd, vuint16m4_t vs1, vuint16m4_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu (vd, vs1, vs2, vl);
+}
+
+vuint64m8_t
+test_vd4dotu_vv_u64m8 (vuint64m8_t vd, vuint16m8_t vs1, vuint16m8_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu (vd, vs1, vs2, vl);
+}
+
+vuint32mf2_t
+test_vd4dotu_vv_u32mf2_m (vbool64_t vm, vuint32mf2_t vd, vuint8mf2_t vs1,
+ vuint8mf2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu (vm, vd, vs1, vs2, vl);
+}
+
+vuint32m1_t
+test_vd4dotu_vv_u32m1_m (vbool32_t vm, vuint32m1_t vd, vuint8m1_t vs1,
+ vuint8m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu (vm, vd, vs1, vs2, vl);
+}
+
+vuint32m2_t
+test_vd4dotu_vv_u32m2_m (vbool16_t vm, vuint32m2_t vd, vuint8m2_t vs1,
+ vuint8m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu (vm, vd, vs1, vs2, vl);
+}
+
+vuint32m4_t
+test_vd4dotu_vv_u32m4_m (vbool8_t vm, vuint32m4_t vd, vuint8m4_t vs1,
+ vuint8m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu (vm, vd, vs1, vs2, vl);
+}
+
+vuint32m8_t
+test_vd4dotu_vv_u32m8_m (vbool4_t vm, vuint32m8_t vd, vuint8m8_t vs1,
+ vuint8m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu (vm, vd, vs1, vs2, vl);
+}
+
+vuint64m1_t
+test_vd4dotu_vv_u64m1_m (vbool64_t vm, vuint64m1_t vd, vuint16m1_t vs1,
+ vuint16m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu (vm, vd, vs1, vs2, vl);
+}
+
+vuint64m2_t
+test_vd4dotu_vv_u64m2_m (vbool32_t vm, vuint64m2_t vd, vuint16m2_t vs1,
+ vuint16m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu (vm, vd, vs1, vs2, vl);
+}
+
+vuint64m4_t
+test_vd4dotu_vv_u64m4_m (vbool16_t vm, vuint64m4_t vd, vuint16m4_t vs1,
+ vuint16m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu (vm, vd, vs1, vs2, vl);
+}
+
+vuint64m8_t
+test_vd4dotu_vv_u64m8_m (vbool8_t vm, vuint64m8_t vd, vuint16m8_t vs1,
+ vuint16m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu (vm, vd, vs1, vs2, vl);
+}
+/* { dg-final { scan-assembler-times {vseti?vli\s+[a-z0-9]+,\s*[a-z0-9]+,\s*e[0-9]+,\s*mf?[1248],\s*t[au],\s*m[au]\s+nds\.vd4dotu[ivxfswum.]*\s+} 18 } } */
--- /dev/null
+/* { dg-do compile } */
+/* { dg-options "-march=rv32gv_xandesvdot -O3 -mabi=ilp32" { target { rv32 } } } */
+/* { dg-options "-march=rv64gv_xandesvdot -O3 -mabi=lp64" { target { rv64 } } } */
+
+#include "andes_vector.h"
+
+vint32mf2_t
+test_nds_vd4dots_vv_i32mf2_tu (vint32mf2_t vd, vint8mf2_t vs1, vint8mf2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i32mf2_tu(vd, vs1, vs2, vl);
+}
+
+vint32m1_t
+test_nds_vd4dots_vv_i32m1_tu (vint32m1_t vd, vint8m1_t vs1, vint8m1_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i32m1_tu(vd, vs1, vs2, vl);
+}
+
+vint32m2_t
+test_nds_vd4dots_vv_i32m2_tu (vint32m2_t vd, vint8m2_t vs1, vint8m2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i32m2_tu(vd, vs1, vs2, vl);
+}
+
+vint32m4_t
+test_nds_vd4dots_vv_i32m4_tu (vint32m4_t vd, vint8m4_t vs1, vint8m4_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i32m4_tu(vd, vs1, vs2, vl);
+}
+
+vint32m8_t
+test_nds_vd4dots_vv_i32m8_tu (vint32m8_t vd, vint8m8_t vs1, vint8m8_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i32m8_tu(vd, vs1, vs2, vl);
+}
+
+vint64m1_t
+test_nds_vd4dots_vv_i64m1_tu (vint64m1_t vd, vint16m1_t vs1, vint16m1_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i64m1_tu(vd, vs1, vs2, vl);
+}
+
+vint64m2_t
+test_nds_vd4dots_vv_i64m2_tu (vint64m2_t vd, vint16m2_t vs1, vint16m2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i64m2_tu(vd, vs1, vs2, vl);
+}
+
+vint64m4_t
+test_nds_vd4dots_vv_i64m4_tu (vint64m4_t vd, vint16m4_t vs1, vint16m4_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i64m4_tu(vd, vs1, vs2, vl);
+}
+
+vint64m8_t
+test_nds_vd4dots_vv_i64m8_tu (vint64m8_t vd, vint16m8_t vs1, vint16m8_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i64m8_tu(vd, vs1, vs2, vl);
+}
+
+vint32mf2_t
+test_nds_vd4dots_vv_i32mf2_tum (vbool64_t vm, vint32mf2_t vd, vint8mf2_t vs1,
+ vint8mf2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i32mf2_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint32m1_t
+test_nds_vd4dots_vv_i32m1_tum (vbool32_t vm, vint32m1_t vd, vint8m1_t vs1,
+ vint8m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i32m1_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint32m2_t
+test_nds_vd4dots_vv_i32m2_tum (vbool16_t vm, vint32m2_t vd, vint8m2_t vs1,
+ vint8m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i32m2_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint32m4_t
+test_nds_vd4dots_vv_i32m4_tum (vbool8_t vm, vint32m4_t vd, vint8m4_t vs1,
+ vint8m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i32m4_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint32m8_t
+test_nds_vd4dots_vv_i32m8_tum (vbool4_t vm, vint32m8_t vd, vint8m8_t vs1,
+ vint8m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i32m8_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint64m1_t
+test_nds_vd4dots_vv_i64m1_tum (vbool64_t vm, vint64m1_t vd, vint16m1_t vs1,
+ vint16m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i64m1_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint64m2_t
+test_nds_vd4dots_vv_i64m2_tum (vbool32_t vm, vint64m2_t vd, vint16m2_t vs1,
+ vint16m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i64m2_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint64m4_t
+test_nds_vd4dots_vv_i64m4_tum (vbool16_t vm, vint64m4_t vd, vint16m4_t vs1,
+ vint16m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i64m4_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint64m8_t
+test_nds_vd4dots_vv_i64m8_tum (vbool8_t vm, vint64m8_t vd, vint16m8_t vs1,
+ vint16m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i64m8_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint32mf2_t
+test_nds_vd4dots_vv_i32mf2_tumu (vbool64_t vm, vint32mf2_t vd, vint8mf2_t vs1,
+ vint8mf2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i32mf2_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m1_t
+test_nds_vd4dots_vv_i32m1_tumu (vbool32_t vm, vint32m1_t vd, vint8m1_t vs1,
+ vint8m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i32m1_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m2_t
+test_nds_vd4dots_vv_i32m2_tumu (vbool16_t vm, vint32m2_t vd, vint8m2_t vs1,
+ vint8m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i32m2_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m4_t
+test_nds_vd4dots_vv_i32m4_tumu (vbool8_t vm, vint32m4_t vd, vint8m4_t vs1,
+ vint8m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i32m4_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m8_t
+test_nds_vd4dots_vv_i32m8_tumu (vbool4_t vm, vint32m8_t vd, vint8m8_t vs1,
+ vint8m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i32m8_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m1_t
+test_nds_vd4dots_vv_i64m1_tumu (vbool64_t vm, vint64m1_t vd, vint16m1_t vs1,
+ vint16m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i64m1_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m2_t
+test_nds_vd4dots_vv_i64m2_tumu (vbool32_t vm, vint64m2_t vd, vint16m2_t vs1,
+ vint16m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i64m2_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m4_t
+test_nds_vd4dots_vv_i64m4_tumu (vbool16_t vm, vint64m4_t vd, vint16m4_t vs1,
+ vint16m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i64m4_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m8_t
+test_nds_vd4dots_vv_i64m8_tumu (vbool8_t vm, vint64m8_t vd, vint16m8_t vs1,
+ vint16m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i64m8_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint32mf2_t
+test_nds_vd4dots_vv_i32mf2_mu (vbool64_t vm, vint32mf2_t vd, vint8mf2_t vs1,
+ vint8mf2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i32mf2_mu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m1_t
+test_nds_vd4dots_vv_i32m1_mu (vbool32_t vm, vint32m1_t vd, vint8m1_t vs1,
+ vint8m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i32m1_mu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m2_t
+test_nds_vd4dots_vv_i32m2_mu (vbool16_t vm, vint32m2_t vd, vint8m2_t vs1,
+ vint8m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i32m2_mu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m4_t
+test_nds_vd4dots_vv_i32m4_mu (vbool8_t vm, vint32m4_t vd, vint8m4_t vs1,
+ vint8m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i32m4_mu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m8_t
+test_nds_vd4dots_vv_i32m8_mu (vbool4_t vm, vint32m8_t vd, vint8m8_t vs1,
+ vint8m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i32m8_mu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m1_t
+test_nds_vd4dots_vv_i64m1_mu (vbool64_t vm, vint64m1_t vd, vint16m1_t vs1,
+ vint16m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i64m1_mu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m2_t
+test_nds_vd4dots_vv_i64m2_mu (vbool32_t vm, vint64m2_t vd, vint16m2_t vs1,
+ vint16m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i64m2_mu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m4_t
+test_nds_vd4dots_vv_i64m4_mu (vbool16_t vm, vint64m4_t vd, vint16m4_t vs1,
+ vint16m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i64m4_mu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m8_t
+test_nds_vd4dots_vv_i64m8_mu (vbool8_t vm, vint64m8_t vd, vint16m8_t vs1,
+ vint16m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_vv_i64m8_mu (vm, vd, vs1, vs2, vl);
+}
+/* { dg-final { scan-assembler-times {vseti?vli\s+[a-z0-9]+,\s*[a-z0-9]+,\s*e[0-9]+,\s*mf?[1248],\s*t[au],\s*m[au]\s+nds\.vd4dots[ivxfswum.]*\s+} 36 } } */
--- /dev/null
+/* { dg-do compile } */
+/* { dg-options "-march=rv32gv_xandesvdot -O3 -mabi=ilp32" { target { rv32 } } } */
+/* { dg-options "-march=rv64gv_xandesvdot -O3 -mabi=lp64" { target { rv64 } } } */
+
+#include "andes_vector.h"
+
+vint32mf2_t
+test_nds_vd4dotsu_vv_i32mf2_tu (vint32mf2_t vd, vint8mf2_t vs1, vuint8mf2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i32mf2_tu(vd, vs1, vs2, vl);
+}
+
+vint32m1_t
+test_nds_vd4dotsu_vv_i32m1_tu (vint32m1_t vd, vint8m1_t vs1, vuint8m1_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i32m1_tu(vd, vs1, vs2, vl);
+}
+
+vint32m2_t
+test_nds_vd4dotsu_vv_i32m2_tu (vint32m2_t vd, vint8m2_t vs1, vuint8m2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i32m2_tu(vd, vs1, vs2, vl);
+}
+
+vint32m4_t
+test_nds_vd4dotsu_vv_i32m4_tu (vint32m4_t vd, vint8m4_t vs1, vuint8m4_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i32m4_tu(vd, vs1, vs2, vl);
+}
+
+vint32m8_t
+test_nds_vd4dotsu_vv_i32m8_tu (vint32m8_t vd, vint8m8_t vs1, vuint8m8_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i32m8_tu(vd, vs1, vs2, vl);
+}
+
+vint64m1_t
+test_nds_vd4dotsu_vv_i64m1_tu (vint64m1_t vd, vint16m1_t vs1, vuint16m1_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i64m1_tu(vd, vs1, vs2, vl);
+}
+
+vint64m2_t
+test_nds_vd4dotsu_vv_i64m2_tu (vint64m2_t vd, vint16m2_t vs1, vuint16m2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i64m2_tu(vd, vs1, vs2, vl);
+}
+
+vint64m4_t
+test_nds_vd4dotsu_vv_i64m4_tu (vint64m4_t vd, vint16m4_t vs1, vuint16m4_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i64m4_tu(vd, vs1, vs2, vl);
+}
+
+vint64m8_t
+test_nds_vd4dotsu_vv_i64m8_tu (vint64m8_t vd, vint16m8_t vs1, vuint16m8_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i64m8_tu(vd, vs1, vs2, vl);
+}
+
+vint32mf2_t
+test_nds_vd4dotsu_vv_i32mf2_tum (vbool64_t vm, vint32mf2_t vd, vint8mf2_t vs1,
+ vuint8mf2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i32mf2_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint32m1_t
+test_nds_vd4dotsu_vv_i32m1_tum (vbool32_t vm, vint32m1_t vd, vint8m1_t vs1,
+ vuint8m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i32m1_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint32m2_t
+test_nds_vd4dotsu_vv_i32m2_tum (vbool16_t vm, vint32m2_t vd, vint8m2_t vs1,
+ vuint8m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i32m2_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint32m4_t
+test_nds_vd4dotsu_vv_i32m4_tum (vbool8_t vm, vint32m4_t vd, vint8m4_t vs1,
+ vuint8m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i32m4_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint32m8_t
+test_nds_vd4dotsu_vv_i32m8_tum (vbool4_t vm, vint32m8_t vd, vint8m8_t vs1,
+ vuint8m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i32m8_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint64m1_t
+test_nds_vd4dotsu_vv_i64m1_tum (vbool64_t vm, vint64m1_t vd, vint16m1_t vs1,
+ vuint16m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i64m1_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint64m2_t
+test_nds_vd4dotsu_vv_i64m2_tum (vbool32_t vm, vint64m2_t vd, vint16m2_t vs1,
+ vuint16m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i64m2_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint64m4_t
+test_nds_vd4dotsu_vv_i64m4_tum (vbool16_t vm, vint64m4_t vd, vint16m4_t vs1,
+ vuint16m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i64m4_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint64m8_t
+test_nds_vd4dotsu_vv_i64m8_tum (vbool8_t vm, vint64m8_t vd, vint16m8_t vs1,
+ vuint16m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i64m8_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint32mf2_t
+test_nds_vd4dotsu_vv_i32mf2_tumu (vbool64_t vm, vint32mf2_t vd, vint8mf2_t vs1,
+ vuint8mf2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i32mf2_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m1_t
+test_nds_vd4dotsu_vv_i32m1_tumu (vbool32_t vm, vint32m1_t vd, vint8m1_t vs1,
+ vuint8m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i32m1_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m2_t
+test_nds_vd4dotsu_vv_i32m2_tumu (vbool16_t vm, vint32m2_t vd, vint8m2_t vs1,
+ vuint8m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i32m2_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m4_t
+test_nds_vd4dotsu_vv_i32m4_tumu (vbool8_t vm, vint32m4_t vd, vint8m4_t vs1,
+ vuint8m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i32m4_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m8_t
+test_nds_vd4dotsu_vv_i32m8_tumu (vbool4_t vm, vint32m8_t vd, vint8m8_t vs1,
+ vuint8m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i32m8_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m1_t
+test_nds_vd4dotsu_vv_i64m1_tumu (vbool64_t vm, vint64m1_t vd, vint16m1_t vs1,
+ vuint16m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i64m1_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m2_t
+test_nds_vd4dotsu_vv_i64m2_tumu (vbool32_t vm, vint64m2_t vd, vint16m2_t vs1,
+ vuint16m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i64m2_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m4_t
+test_nds_vd4dotsu_vv_i64m4_tumu (vbool16_t vm, vint64m4_t vd, vint16m4_t vs1,
+ vuint16m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i64m4_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m8_t
+test_nds_vd4dotsu_vv_i64m8_tumu (vbool8_t vm, vint64m8_t vd, vint16m8_t vs1,
+ vuint16m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i64m8_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint32mf2_t
+test_nds_vd4dotsu_vv_i32mf2_mu (vbool64_t vm, vint32mf2_t vd, vint8mf2_t vs1,
+ vuint8mf2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i32mf2_mu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m1_t
+test_nds_vd4dotsu_vv_i32m1_mu (vbool32_t vm, vint32m1_t vd, vint8m1_t vs1,
+ vuint8m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i32m1_mu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m2_t
+test_nds_vd4dotsu_vv_i32m2_mu (vbool16_t vm, vint32m2_t vd, vint8m2_t vs1,
+ vuint8m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i32m2_mu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m4_t
+test_nds_vd4dotsu_vv_i32m4_mu (vbool8_t vm, vint32m4_t vd, vint8m4_t vs1,
+ vuint8m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i32m4_mu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m8_t
+test_nds_vd4dotsu_vv_i32m8_mu (vbool4_t vm, vint32m8_t vd, vint8m8_t vs1,
+ vuint8m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i32m8_mu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m1_t
+test_nds_vd4dotsu_vv_i64m1_mu (vbool64_t vm, vint64m1_t vd, vint16m1_t vs1,
+ vuint16m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i64m1_mu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m2_t
+test_nds_vd4dotsu_vv_i64m2_mu (vbool32_t vm, vint64m2_t vd, vint16m2_t vs1,
+ vuint16m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i64m2_mu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m4_t
+test_nds_vd4dotsu_vv_i64m4_mu (vbool16_t vm, vint64m4_t vd, vint16m4_t vs1,
+ vuint16m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i64m4_mu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m8_t
+test_nds_vd4dotsu_vv_i64m8_mu (vbool8_t vm, vint64m8_t vd, vint16m8_t vs1,
+ vuint16m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_vv_i64m8_mu (vm, vd, vs1, vs2, vl);
+}
+/* { dg-final { scan-assembler-times {vseti?vli\s+[a-z0-9]+,\s*[a-z0-9]+,\s*e[0-9]+,\s*mf?[1248],\s*t[au],\s*m[au]\s+nds\.vd4dotsu[ivxfswum.]*\s+} 36 } } */
--- /dev/null
+/* { dg-do compile } */
+/* { dg-options "-march=rv32gv_xandesvdot -O3 -mabi=ilp32" { target { rv32 } } } */
+/* { dg-options "-march=rv64gv_xandesvdot -O3 -mabi=lp64" { target { rv64 } } } */
+
+#include "andes_vector.h"
+
+vuint32mf2_t
+test_nds_vd4dotu_vv_u32mf2_tu (vuint32mf2_t vd, vuint8mf2_t vs1,
+ vuint8mf2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u32mf2_tu(vd, vs1, vs2, vl);
+}
+
+vuint32m1_t
+test_nds_vd4dotu_vv_u32m1_tu (vuint32m1_t vd, vuint8m1_t vs1, vuint8m1_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u32m1_tu(vd, vs1, vs2, vl);
+}
+
+vuint32m2_t
+test_nds_vd4dotu_vv_u32m2_tu (vuint32m2_t vd, vuint8m2_t vs1, vuint8m2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u32m2_tu(vd, vs1, vs2, vl);
+}
+
+vuint32m4_t
+test_nds_vd4dotu_vv_u32m4_tu (vuint32m4_t vd, vuint8m4_t vs1, vuint8m4_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u32m4_tu(vd, vs1, vs2, vl);
+}
+
+vuint32m8_t
+test_nds_vd4dotu_vv_u32m8_tu (vuint32m8_t vd, vuint8m8_t vs1, vuint8m8_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u32m8_tu(vd, vs1, vs2, vl);
+}
+
+vuint64m1_t
+test_nds_vd4dotu_vv_u64m1_tu (vuint64m1_t vd, vuint16m1_t vs1, vuint16m1_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u64m1_tu(vd, vs1, vs2, vl);
+}
+
+vuint64m2_t
+test_nds_vd4dotu_vv_u64m2_tu (vuint64m2_t vd, vuint16m2_t vs1, vuint16m2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u64m2_tu(vd, vs1, vs2, vl);
+}
+
+vuint64m4_t
+test_nds_vd4dotu_vv_u64m4_tu (vuint64m4_t vd, vuint16m4_t vs1, vuint16m4_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u64m4_tu(vd, vs1, vs2, vl);
+}
+
+vuint64m8_t
+test_nds_vd4dotu_vv_u64m8_tu (vuint64m8_t vd, vuint16m8_t vs1, vuint16m8_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u64m8_tu(vd, vs1, vs2, vl);
+}
+
+vuint32mf2_t
+test_nds_vd4dotu_vv_u32mf2_tum (vbool64_t vm, vuint32mf2_t vd, vuint8mf2_t vs1,
+ vuint8mf2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u32mf2_tum (vm, vd, vs1, vs2, vl);
+}
+
+vuint32m1_t
+test_nds_vd4dotu_vv_u32m1_tum (vbool32_t vm, vuint32m1_t vd, vuint8m1_t vs1,
+ vuint8m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u32m1_tum (vm, vd, vs1, vs2, vl);
+}
+
+vuint32m2_t
+test_nds_vd4dotu_vv_u32m2_tum (vbool16_t vm, vuint32m2_t vd, vuint8m2_t vs1,
+ vuint8m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u32m2_tum (vm, vd, vs1, vs2, vl);
+}
+
+vuint32m4_t
+test_nds_vd4dotu_vv_u32m4_tum (vbool8_t vm, vuint32m4_t vd, vuint8m4_t vs1,
+ vuint8m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u32m4_tum (vm, vd, vs1, vs2, vl);
+}
+
+vuint32m8_t
+test_nds_vd4dotu_vv_u32m8_tum (vbool4_t vm, vuint32m8_t vd, vuint8m8_t vs1,
+ vuint8m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u32m8_tum (vm, vd, vs1, vs2, vl);
+}
+
+vuint64m1_t
+test_nds_vd4dotu_vv_u64m1_tum (vbool64_t vm, vuint64m1_t vd, vuint16m1_t vs1,
+ vuint16m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u64m1_tum (vm, vd, vs1, vs2, vl);
+}
+
+vuint64m2_t
+test_nds_vd4dotu_vv_u64m2_tum (vbool32_t vm, vuint64m2_t vd, vuint16m2_t vs1,
+ vuint16m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u64m2_tum (vm, vd, vs1, vs2, vl);
+}
+
+vuint64m4_t
+test_nds_vd4dotu_vv_u64m4_tum (vbool16_t vm, vuint64m4_t vd, vuint16m4_t vs1,
+ vuint16m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u64m4_tum (vm, vd, vs1, vs2, vl);
+}
+
+vuint64m8_t
+test_nds_vd4dotu_vv_u64m8_tum (vbool8_t vm, vuint64m8_t vd, vuint16m8_t vs1,
+ vuint16m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u64m8_tum (vm, vd, vs1, vs2, vl);
+}
+
+vuint32mf2_t
+test_nds_vd4dotu_vv_u32mf2_tumu (vbool64_t vm, vuint32mf2_t vd, vuint8mf2_t vs1,
+ vuint8mf2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u32mf2_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vuint32m1_t
+test_nds_vd4dotu_vv_u32m1_tumu (vbool32_t vm, vuint32m1_t vd, vuint8m1_t vs1,
+ vuint8m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u32m1_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vuint32m2_t
+test_nds_vd4dotu_vv_u32m2_tumu (vbool16_t vm, vuint32m2_t vd, vuint8m2_t vs1,
+ vuint8m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u32m2_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vuint32m4_t
+test_nds_vd4dotu_vv_u32m4_tumu (vbool8_t vm, vuint32m4_t vd, vuint8m4_t vs1,
+ vuint8m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u32m4_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vuint32m8_t
+test_nds_vd4dotu_vv_u32m8_tumu (vbool4_t vm, vuint32m8_t vd, vuint8m8_t vs1,
+ vuint8m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u32m8_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vuint64m1_t
+test_nds_vd4dotu_vv_u64m1_tumu (vbool64_t vm, vuint64m1_t vd, vuint16m1_t vs1,
+ vuint16m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u64m1_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vuint64m2_t
+test_nds_vd4dotu_vv_u64m2_tumu (vbool32_t vm, vuint64m2_t vd, vuint16m2_t vs1,
+ vuint16m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u64m2_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vuint64m4_t
+test_nds_vd4dotu_vv_u64m4_tumu (vbool16_t vm, vuint64m4_t vd, vuint16m4_t vs1,
+ vuint16m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u64m4_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vuint64m8_t
+test_nds_vd4dotu_vv_u64m8_tumu (vbool8_t vm, vuint64m8_t vd, vuint16m8_t vs1,
+ vuint16m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u64m8_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vuint32mf2_t
+test_nds_vd4dotu_vv_u32mf2_mu (vbool64_t vm, vuint32mf2_t vd, vuint8mf2_t vs1,
+ vuint8mf2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u32mf2_mu (vm, vd, vs1, vs2, vl);
+}
+
+vuint32m1_t
+test_nds_vd4dotu_vv_u32m1_mu (vbool32_t vm, vuint32m1_t vd, vuint8m1_t vs1,
+ vuint8m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u32m1_mu (vm, vd, vs1, vs2, vl);
+}
+
+vuint32m2_t
+test_nds_vd4dotu_vv_u32m2_mu (vbool16_t vm, vuint32m2_t vd, vuint8m2_t vs1,
+ vuint8m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u32m2_mu (vm, vd, vs1, vs2, vl);
+}
+
+vuint32m4_t
+test_nds_vd4dotu_vv_u32m4_mu (vbool8_t vm, vuint32m4_t vd, vuint8m4_t vs1,
+ vuint8m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u32m4_mu (vm, vd, vs1, vs2, vl);
+}
+
+vuint32m8_t
+test_nds_vd4dotu_vv_u32m8_mu (vbool4_t vm, vuint32m8_t vd, vuint8m8_t vs1,
+ vuint8m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u32m8_mu (vm, vd, vs1, vs2, vl);
+}
+
+vuint64m1_t
+test_nds_vd4dotu_vv_u64m1_mu (vbool64_t vm, vuint64m1_t vd, vuint16m1_t vs1,
+ vuint16m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u64m1_mu (vm, vd, vs1, vs2, vl);
+}
+
+vuint64m2_t
+test_nds_vd4dotu_vv_u64m2_mu (vbool32_t vm, vuint64m2_t vd, vuint16m2_t vs1,
+ vuint16m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u64m2_mu (vm, vd, vs1, vs2, vl);
+}
+
+vuint64m4_t
+test_nds_vd4dotu_vv_u64m4_mu (vbool16_t vm, vuint64m4_t vd, vuint16m4_t vs1,
+ vuint16m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u64m4_mu (vm, vd, vs1, vs2, vl);
+}
+
+vuint64m8_t
+test_nds_vd4dotu_vv_u64m8_mu (vbool8_t vm, vuint64m8_t vd, vuint16m8_t vs1,
+ vuint16m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_vv_u64m8_mu (vm, vd, vs1, vs2, vl);
+}
+/* { dg-final { scan-assembler-times {vseti?vli\s+[a-z0-9]+,\s*[a-z0-9]+,\s*e[0-9]+,\s*mf?[1248],\s*t[au],\s*m[au]\s+nds\.vd4dotu[ivxfswum.]*\s+} 36 } } */
--- /dev/null
+/* { dg-do compile } */
+/* { dg-options "-march=rv32gv_xandesvdot -O3 -mabi=ilp32" { target { rv32 } } } */
+/* { dg-options "-march=rv64gv_xandesvdot -O3 -mabi=lp64" { target { rv64 } } } */
+
+#include "andes_vector.h"
+
+vint32mf2_t
+test_nds_vd4dots_vv_i32mf2_tu (vint32mf2_t vd, vint8mf2_t vs1, vint8mf2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots_tu(vd, vs1, vs2, vl);
+}
+
+vint32m1_t
+test_nds_vd4dots_vv_i32m1_tu (vint32m1_t vd, vint8m1_t vs1, vint8m1_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots_tu(vd, vs1, vs2, vl);
+}
+
+vint32m2_t
+test_nds_vd4dots_vv_i32m2_tu (vint32m2_t vd, vint8m2_t vs1, vint8m2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots_tu(vd, vs1, vs2, vl);
+}
+
+vint32m4_t
+test_nds_vd4dots_vv_i32m4_tu (vint32m4_t vd, vint8m4_t vs1, vint8m4_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots_tu(vd, vs1, vs2, vl);
+}
+
+vint32m8_t
+test_nds_vd4dots_vv_i32m8_tu (vint32m8_t vd, vint8m8_t vs1, vint8m8_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots_tu(vd, vs1, vs2, vl);
+}
+
+vint64m1_t
+test_nds_vd4dots_vv_i64m1_tu (vint64m1_t vd, vint16m1_t vs1, vint16m1_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots_tu(vd, vs1, vs2, vl);
+}
+
+vint64m2_t
+test_nds_vd4dots_vv_i64m2_tu (vint64m2_t vd, vint16m2_t vs1, vint16m2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots_tu(vd, vs1, vs2, vl);
+}
+
+vint64m4_t
+test_nds_vd4dots_vv_i64m4_tu (vint64m4_t vd, vint16m4_t vs1, vint16m4_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots_tu(vd, vs1, vs2, vl);
+}
+
+vint64m8_t
+test_nds_vd4dots_vv_i64m8_tu (vint64m8_t vd, vint16m8_t vs1, vint16m8_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dots_tu(vd, vs1, vs2, vl);
+}
+
+vint32mf2_t
+test_nds_vd4dots_vv_i32mf2_tum (vbool64_t vm, vint32mf2_t vd, vint8mf2_t vs1,
+ vint8mf2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint32m1_t
+test_nds_vd4dots_vv_i32m1_tum (vbool32_t vm, vint32m1_t vd, vint8m1_t vs1,
+ vint8m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint32m2_t
+test_nds_vd4dots_vv_i32m2_tum (vbool16_t vm, vint32m2_t vd, vint8m2_t vs1,
+ vint8m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint32m4_t
+test_nds_vd4dots_vv_i32m4_tum (vbool8_t vm, vint32m4_t vd, vint8m4_t vs1,
+ vint8m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint32m8_t
+test_nds_vd4dots_vv_i32m8_tum (vbool4_t vm, vint32m8_t vd, vint8m8_t vs1,
+ vint8m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint64m1_t
+test_nds_vd4dots_vv_i64m1_tum (vbool64_t vm, vint64m1_t vd, vint16m1_t vs1,
+ vint16m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint64m2_t
+test_nds_vd4dots_vv_i64m2_tum (vbool32_t vm, vint64m2_t vd, vint16m2_t vs1,
+ vint16m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint64m4_t
+test_nds_vd4dots_vv_i64m4_tum (vbool16_t vm, vint64m4_t vd, vint16m4_t vs1,
+ vint16m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint64m8_t
+test_nds_vd4dots_vv_i64m8_tum (vbool8_t vm, vint64m8_t vd, vint16m8_t vs1,
+ vint16m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint32mf2_t
+test_nds_vd4dots_vv_i32mf2_tumu (vbool64_t vm, vint32mf2_t vd, vint8mf2_t vs1,
+ vint8mf2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m1_t
+test_nds_vd4dots_vv_i32m1_tumu (vbool32_t vm, vint32m1_t vd, vint8m1_t vs1,
+ vint8m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m2_t
+test_nds_vd4dots_vv_i32m2_tumu (vbool16_t vm, vint32m2_t vd, vint8m2_t vs1,
+ vint8m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m4_t
+test_nds_vd4dots_vv_i32m4_tumu (vbool8_t vm, vint32m4_t vd, vint8m4_t vs1,
+ vint8m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m8_t
+test_nds_vd4dots_vv_i32m8_tumu (vbool4_t vm, vint32m8_t vd, vint8m8_t vs1,
+ vint8m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m1_t
+test_nds_vd4dots_vv_i64m1_tumu (vbool64_t vm, vint64m1_t vd, vint16m1_t vs1,
+ vint16m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m2_t
+test_nds_vd4dots_vv_i64m2_tumu (vbool32_t vm, vint64m2_t vd, vint16m2_t vs1,
+ vint16m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m4_t
+test_nds_vd4dots_vv_i64m4_tumu (vbool16_t vm, vint64m4_t vd, vint16m4_t vs1,
+ vint16m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m8_t
+test_nds_vd4dots_vv_i64m8_tumu (vbool8_t vm, vint64m8_t vd, vint16m8_t vs1,
+ vint16m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint32mf2_t
+test_nds_vd4dots_vv_i32mf2_mu (vbool64_t vm, vint32mf2_t vd, vint8mf2_t vs1,
+ vint8mf2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_mu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m1_t
+test_nds_vd4dots_vv_i32m1_mu (vbool32_t vm, vint32m1_t vd, vint8m1_t vs1,
+ vint8m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_mu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m2_t
+test_nds_vd4dots_vv_i32m2_mu (vbool16_t vm, vint32m2_t vd, vint8m2_t vs1,
+ vint8m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_mu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m4_t
+test_nds_vd4dots_vv_i32m4_mu (vbool8_t vm, vint32m4_t vd, vint8m4_t vs1,
+ vint8m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_mu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m8_t
+test_nds_vd4dots_vv_i32m8_mu (vbool4_t vm, vint32m8_t vd, vint8m8_t vs1,
+ vint8m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_mu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m1_t
+test_nds_vd4dots_vv_i64m1_mu (vbool64_t vm, vint64m1_t vd, vint16m1_t vs1,
+ vint16m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_mu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m2_t
+test_nds_vd4dots_vv_i64m2_mu (vbool32_t vm, vint64m2_t vd, vint16m2_t vs1,
+ vint16m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_mu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m4_t
+test_nds_vd4dots_vv_i64m4_mu (vbool16_t vm, vint64m4_t vd, vint16m4_t vs1,
+ vint16m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_mu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m8_t
+test_nds_vd4dots_vv_i64m8_mu (vbool8_t vm, vint64m8_t vd, vint16m8_t vs1,
+ vint16m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dots_mu (vm, vd, vs1, vs2, vl);
+}
+/* { dg-final { scan-assembler-times {vseti?vli\s+[a-z0-9]+,\s*[a-z0-9]+,\s*e[0-9]+,\s*mf?[1248],\s*t[au],\s*m[au]\s+nds\.vd4dots[ivxfswum.]*\s+} 36 } } */
--- /dev/null
+/* { dg-do compile } */
+/* { dg-options "-march=rv32gv_xandesvdot -O3 -mabi=ilp32" { target { rv32 } } } */
+/* { dg-options "-march=rv64gv_xandesvdot -O3 -mabi=lp64" { target { rv64 } } } */
+
+#include "andes_vector.h"
+
+vint32mf2_t
+test_nds_vd4dotsu_vv_i32mf2_tu (vint32mf2_t vd, vint8mf2_t vs1, vuint8mf2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu_tu(vd, vs1, vs2, vl);
+}
+
+vint32m1_t
+test_nds_vd4dotsu_vv_i32m1_tu (vint32m1_t vd, vint8m1_t vs1, vuint8m1_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu_tu(vd, vs1, vs2, vl);
+}
+
+vint32m2_t
+test_nds_vd4dotsu_vv_i32m2_tu (vint32m2_t vd, vint8m2_t vs1, vuint8m2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu_tu(vd, vs1, vs2, vl);
+}
+
+vint32m4_t
+test_nds_vd4dotsu_vv_i32m4_tu (vint32m4_t vd, vint8m4_t vs1, vuint8m4_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu_tu(vd, vs1, vs2, vl);
+}
+
+vint32m8_t
+test_nds_vd4dotsu_vv_i32m8_tu (vint32m8_t vd, vint8m8_t vs1, vuint8m8_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu_tu(vd, vs1, vs2, vl);
+}
+
+vint64m1_t
+test_nds_vd4dotsu_vv_i64m1_tu (vint64m1_t vd, vint16m1_t vs1, vuint16m1_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu_tu(vd, vs1, vs2, vl);
+}
+
+vint64m2_t
+test_nds_vd4dotsu_vv_i64m2_tu (vint64m2_t vd, vint16m2_t vs1, vuint16m2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu_tu(vd, vs1, vs2, vl);
+}
+
+vint64m4_t
+test_nds_vd4dotsu_vv_i64m4_tu (vint64m4_t vd, vint16m4_t vs1, vuint16m4_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu_tu(vd, vs1, vs2, vl);
+}
+
+vint64m8_t
+test_nds_vd4dotsu_vv_i64m8_tu (vint64m8_t vd, vint16m8_t vs1, vuint16m8_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotsu_tu(vd, vs1, vs2, vl);
+}
+
+vint32mf2_t
+test_nds_vd4dotsu_vv_i32mf2_tum (vbool64_t vm, vint32mf2_t vd, vint8mf2_t vs1,
+ vuint8mf2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint32m1_t
+test_nds_vd4dotsu_vv_i32m1_tum (vbool32_t vm, vint32m1_t vd, vint8m1_t vs1,
+ vuint8m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint32m2_t
+test_nds_vd4dotsu_vv_i32m2_tum (vbool16_t vm, vint32m2_t vd, vint8m2_t vs1,
+ vuint8m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint32m4_t
+test_nds_vd4dotsu_vv_i32m4_tum (vbool8_t vm, vint32m4_t vd, vint8m4_t vs1,
+ vuint8m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint32m8_t
+test_nds_vd4dotsu_vv_i32m8_tum (vbool4_t vm, vint32m8_t vd, vint8m8_t vs1,
+ vuint8m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint64m1_t
+test_nds_vd4dotsu_vv_i64m1_tum (vbool64_t vm, vint64m1_t vd, vint16m1_t vs1,
+ vuint16m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint64m2_t
+test_nds_vd4dotsu_vv_i64m2_tum (vbool32_t vm, vint64m2_t vd, vint16m2_t vs1,
+ vuint16m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint64m4_t
+test_nds_vd4dotsu_vv_i64m4_tum (vbool16_t vm, vint64m4_t vd, vint16m4_t vs1,
+ vuint16m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint64m8_t
+test_nds_vd4dotsu_vv_i64m8_tum (vbool8_t vm, vint64m8_t vd, vint16m8_t vs1,
+ vuint16m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_tum (vm, vd, vs1, vs2, vl);
+}
+
+vint32mf2_t
+test_nds_vd4dotsu_vv_i32mf2_tumu (vbool64_t vm, vint32mf2_t vd, vint8mf2_t vs1,
+ vuint8mf2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m1_t
+test_nds_vd4dotsu_vv_i32m1_tumu (vbool32_t vm, vint32m1_t vd, vint8m1_t vs1,
+ vuint8m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m2_t
+test_nds_vd4dotsu_vv_i32m2_tumu (vbool16_t vm, vint32m2_t vd, vint8m2_t vs1,
+ vuint8m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m4_t
+test_nds_vd4dotsu_vv_i32m4_tumu (vbool8_t vm, vint32m4_t vd, vint8m4_t vs1,
+ vuint8m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m8_t
+test_nds_vd4dotsu_vv_i32m8_tumu (vbool4_t vm, vint32m8_t vd, vint8m8_t vs1,
+ vuint8m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m1_t
+test_nds_vd4dotsu_vv_i64m1_tumu (vbool64_t vm, vint64m1_t vd, vint16m1_t vs1,
+ vuint16m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m2_t
+test_nds_vd4dotsu_vv_i64m2_tumu (vbool32_t vm, vint64m2_t vd, vint16m2_t vs1,
+ vuint16m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m4_t
+test_nds_vd4dotsu_vv_i64m4_tumu (vbool16_t vm, vint64m4_t vd, vint16m4_t vs1,
+ vuint16m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m8_t
+test_nds_vd4dotsu_vv_i64m8_tumu (vbool8_t vm, vint64m8_t vd, vint16m8_t vs1,
+ vuint16m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vint32mf2_t
+test_nds_vd4dotsu_vv_i32mf2_mu (vbool64_t vm, vint32mf2_t vd, vint8mf2_t vs1,
+ vuint8mf2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_mu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m1_t
+test_nds_vd4dotsu_vv_i32m1_mu (vbool32_t vm, vint32m1_t vd, vint8m1_t vs1,
+ vuint8m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_mu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m2_t
+test_nds_vd4dotsu_vv_i32m2_mu (vbool16_t vm, vint32m2_t vd, vint8m2_t vs1,
+ vuint8m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_mu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m4_t
+test_nds_vd4dotsu_vv_i32m4_mu (vbool8_t vm, vint32m4_t vd, vint8m4_t vs1,
+ vuint8m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_mu (vm, vd, vs1, vs2, vl);
+}
+
+vint32m8_t
+test_nds_vd4dotsu_vv_i32m8_mu (vbool4_t vm, vint32m8_t vd, vint8m8_t vs1,
+ vuint8m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_mu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m1_t
+test_nds_vd4dotsu_vv_i64m1_mu (vbool64_t vm, vint64m1_t vd, vint16m1_t vs1,
+ vuint16m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_mu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m2_t
+test_nds_vd4dotsu_vv_i64m2_mu (vbool32_t vm, vint64m2_t vd, vint16m2_t vs1,
+ vuint16m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_mu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m4_t
+test_nds_vd4dotsu_vv_i64m4_mu (vbool16_t vm, vint64m4_t vd, vint16m4_t vs1,
+ vuint16m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_mu (vm, vd, vs1, vs2, vl);
+}
+
+vint64m8_t
+test_nds_vd4dotsu_vv_i64m8_mu (vbool8_t vm, vint64m8_t vd, vint16m8_t vs1,
+ vuint16m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotsu_mu (vm, vd, vs1, vs2, vl);
+}
+/* { dg-final { scan-assembler-times {vseti?vli\s+[a-z0-9]+,\s*[a-z0-9]+,\s*e[0-9]+,\s*mf?[1248],\s*t[au],\s*m[au]\s+nds\.vd4dotsu[ivxfswum.]*\s+} 36 } } */
--- /dev/null
+/* { dg-do compile } */
+/* { dg-options "-march=rv32gv_xandesvdot -O3 -mabi=ilp32" { target { rv32 } } } */
+/* { dg-options "-march=rv64gv_xandesvdot -O3 -mabi=lp64" { target { rv64 } } } */
+
+#include "andes_vector.h"
+
+vuint32mf2_t
+test_nds_vd4dotu_vv_u32mf2_tu (vuint32mf2_t vd, vuint8mf2_t vs1,
+ vuint8mf2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_tu(vd, vs1, vs2, vl);
+}
+
+vuint32m1_t
+test_nds_vd4dotu_vv_u32m1_tu (vuint32m1_t vd, vuint8m1_t vs1, vuint8m1_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu_tu(vd, vs1, vs2, vl);
+}
+
+vuint32m2_t
+test_nds_vd4dotu_vv_u32m2_tu (vuint32m2_t vd, vuint8m2_t vs1, vuint8m2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu_tu(vd, vs1, vs2, vl);
+}
+
+vuint32m4_t
+test_nds_vd4dotu_vv_u32m4_tu (vuint32m4_t vd, vuint8m4_t vs1, vuint8m4_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu_tu(vd, vs1, vs2, vl);
+}
+
+vuint32m8_t
+test_nds_vd4dotu_vv_u32m8_tu (vuint32m8_t vd, vuint8m8_t vs1, vuint8m8_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu_tu(vd, vs1, vs2, vl);
+}
+
+vuint64m1_t
+test_nds_vd4dotu_vv_u64m1_tu (vuint64m1_t vd, vuint16m1_t vs1, vuint16m1_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu_tu(vd, vs1, vs2, vl);
+}
+
+vuint64m2_t
+test_nds_vd4dotu_vv_u64m2_tu (vuint64m2_t vd, vuint16m2_t vs1, vuint16m2_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu_tu(vd, vs1, vs2, vl);
+}
+
+vuint64m4_t
+test_nds_vd4dotu_vv_u64m4_tu (vuint64m4_t vd, vuint16m4_t vs1, vuint16m4_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu_tu(vd, vs1, vs2, vl);
+}
+
+vuint64m8_t
+test_nds_vd4dotu_vv_u64m8_tu (vuint64m8_t vd, vuint16m8_t vs1, vuint16m8_t vs2,
+ size_t vl)
+{
+ return __riscv_nds_vd4dotu_tu(vd, vs1, vs2, vl);
+}
+
+vuint32mf2_t
+test_nds_vd4dotu_vv_u32mf2_tum (vbool64_t vm, vuint32mf2_t vd, vuint8mf2_t vs1,
+ vuint8mf2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_tum (vm, vd, vs1, vs2, vl);
+}
+
+vuint32m1_t
+test_nds_vd4dotu_vv_u32m1_tum (vbool32_t vm, vuint32m1_t vd, vuint8m1_t vs1,
+ vuint8m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_tum (vm, vd, vs1, vs2, vl);
+}
+
+vuint32m2_t
+test_nds_vd4dotu_vv_u32m2_tum (vbool16_t vm, vuint32m2_t vd, vuint8m2_t vs1,
+ vuint8m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_tum (vm, vd, vs1, vs2, vl);
+}
+
+vuint32m4_t
+test_nds_vd4dotu_vv_u32m4_tum (vbool8_t vm, vuint32m4_t vd, vuint8m4_t vs1,
+ vuint8m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_tum (vm, vd, vs1, vs2, vl);
+}
+
+vuint32m8_t
+test_nds_vd4dotu_vv_u32m8_tum (vbool4_t vm, vuint32m8_t vd, vuint8m8_t vs1,
+ vuint8m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_tum (vm, vd, vs1, vs2, vl);
+}
+
+vuint64m1_t
+test_nds_vd4dotu_vv_u64m1_tum (vbool64_t vm, vuint64m1_t vd, vuint16m1_t vs1,
+ vuint16m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_tum (vm, vd, vs1, vs2, vl);
+}
+
+vuint64m2_t
+test_nds_vd4dotu_vv_u64m2_tum (vbool32_t vm, vuint64m2_t vd, vuint16m2_t vs1,
+ vuint16m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_tum (vm, vd, vs1, vs2, vl);
+}
+
+vuint64m4_t
+test_nds_vd4dotu_vv_u64m4_tum (vbool16_t vm, vuint64m4_t vd, vuint16m4_t vs1,
+ vuint16m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_tum (vm, vd, vs1, vs2, vl);
+}
+
+vuint64m8_t
+test_nds_vd4dotu_vv_u64m8_tum (vbool8_t vm, vuint64m8_t vd, vuint16m8_t vs1,
+ vuint16m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_tum (vm, vd, vs1, vs2, vl);
+}
+
+vuint32mf2_t
+test_nds_vd4dotu_vv_u32mf2_tumu (vbool64_t vm, vuint32mf2_t vd, vuint8mf2_t vs1,
+ vuint8mf2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vuint32m1_t
+test_nds_vd4dotu_vv_u32m1_tumu (vbool32_t vm, vuint32m1_t vd, vuint8m1_t vs1,
+ vuint8m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vuint32m2_t
+test_nds_vd4dotu_vv_u32m2_tumu (vbool16_t vm, vuint32m2_t vd, vuint8m2_t vs1,
+ vuint8m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vuint32m4_t
+test_nds_vd4dotu_vv_u32m4_tumu (vbool8_t vm, vuint32m4_t vd, vuint8m4_t vs1,
+ vuint8m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vuint32m8_t
+test_nds_vd4dotu_vv_u32m8_tumu (vbool4_t vm, vuint32m8_t vd, vuint8m8_t vs1,
+ vuint8m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vuint64m1_t
+test_nds_vd4dotu_vv_u64m1_tumu (vbool64_t vm, vuint64m1_t vd, vuint16m1_t vs1,
+ vuint16m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vuint64m2_t
+test_nds_vd4dotu_vv_u64m2_tumu (vbool32_t vm, vuint64m2_t vd, vuint16m2_t vs1,
+ vuint16m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vuint64m4_t
+test_nds_vd4dotu_vv_u64m4_tumu (vbool16_t vm, vuint64m4_t vd, vuint16m4_t vs1,
+ vuint16m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vuint64m8_t
+test_nds_vd4dotu_vv_u64m8_tumu (vbool8_t vm, vuint64m8_t vd, vuint16m8_t vs1,
+ vuint16m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_tumu (vm, vd, vs1, vs2, vl);
+}
+
+vuint32mf2_t
+test_nds_vd4dotu_vv_u32mf2_mu (vbool64_t vm, vuint32mf2_t vd, vuint8mf2_t vs1,
+ vuint8mf2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_mu (vm, vd, vs1, vs2, vl);
+}
+
+vuint32m1_t
+test_nds_vd4dotu_vv_u32m1_mu (vbool32_t vm, vuint32m1_t vd, vuint8m1_t vs1,
+ vuint8m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_mu (vm, vd, vs1, vs2, vl);
+}
+
+vuint32m2_t
+test_nds_vd4dotu_vv_u32m2_mu (vbool16_t vm, vuint32m2_t vd, vuint8m2_t vs1,
+ vuint8m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_mu (vm, vd, vs1, vs2, vl);
+}
+
+vuint32m4_t
+test_nds_vd4dotu_vv_u32m4_mu (vbool8_t vm, vuint32m4_t vd, vuint8m4_t vs1,
+ vuint8m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_mu (vm, vd, vs1, vs2, vl);
+}
+
+vuint32m8_t
+test_nds_vd4dotu_vv_u32m8_mu (vbool4_t vm, vuint32m8_t vd, vuint8m8_t vs1,
+ vuint8m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_mu (vm, vd, vs1, vs2, vl);
+}
+
+vuint64m1_t
+test_nds_vd4dotu_vv_u64m1_mu (vbool64_t vm, vuint64m1_t vd, vuint16m1_t vs1,
+ vuint16m1_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_mu (vm, vd, vs1, vs2, vl);
+}
+
+vuint64m2_t
+test_nds_vd4dotu_vv_u64m2_mu (vbool32_t vm, vuint64m2_t vd, vuint16m2_t vs1,
+ vuint16m2_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_mu (vm, vd, vs1, vs2, vl);
+}
+
+vuint64m4_t
+test_nds_vd4dotu_vv_u64m4_mu (vbool16_t vm, vuint64m4_t vd, vuint16m4_t vs1,
+ vuint16m4_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_mu (vm, vd, vs1, vs2, vl);
+}
+
+vuint64m8_t
+test_nds_vd4dotu_vv_u64m8_mu (vbool8_t vm, vuint64m8_t vd, vuint16m8_t vs1,
+ vuint16m8_t vs2, size_t vl)
+{
+ return __riscv_nds_vd4dotu_mu (vm, vd, vs1, vs2, vl);
+}
+/* { dg-final { scan-assembler-times {vseti?vli\s+[a-z0-9]+,\s*[a-z0-9]+,\s*e[0-9]+,\s*mf?[1248],\s*t[au],\s*m[au]\s+nds\.vd4dotu[ivxfswum.]*\s+} 36 } } */