// blob: 6fa305734f1945d8a0a74f979336e44daaa79310 [file] [log] [blame]
// Copyright 2023 Google LLC
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
//
// clang-format off
// Kelvin instruction intrinsics
#ifndef CRT_KELVIN_INTRINSICS_H_
#define CRT_KELVIN_INTRINSICS_H_
// Core-control instructions: each macro emits exactly one operand-less
// inline-asm instruction (eexit, eyield, ectxsw, mpause).
// The expansions deliberately carry NO trailing semicolon; the call site
// supplies it (`eexit();`). A semicolon baked into the macro turns
// `if (c) eexit(); else other();` into a syntax error, because the extra empty
// statement orphans the `else`. It is also inconsistent with the
// operand-taking macros in this header (flog, flushat, ...), which already
// rely on the caller's `;`.
// `__volatile_always__` is a project-defined qualifier declared outside this
// section of the header.
#define eexit() __asm__ __volatile_always__("eexit")
#define eyield() __asm__ __volatile_always__("eyield")
#define ectxsw() __asm__ __volatile_always__("ectxsw")
#define mpause() __asm__ __volatile_always__("mpause")
// flog / slog / clog / klog: each macro emits one instruction whose single
// operand `s` is passed in a general-purpose register ("r" input, referenced
// as %0). No outputs and no clobbers are declared. The expansion has no
// trailing semicolon, so the caller writes `flog(x);`.
// NOTE(review): presumably these are the core's logging instructions and `s`
// is the value/pointer to log — confirm the per-variant meaning against the
// Kelvin ISA spec; it is not visible in this header.
#define flog(s) __asm__ __volatile_always__(ARGS_F_A("flog", %0) : : "r"(s))
#define slog(s) __asm__ __volatile_always__(ARGS_F_A("slog", %0) : : "r"(s))
#define clog(s) __asm__ __volatile_always__(ARGS_F_A("clog", %0) : : "r"(s))
#define klog(s) __asm__ __volatile_always__(ARGS_F_A("klog", %0) : : "r"(s))
// flushall / flushat: each macro emits one instruction.
//   flushall()  - no operands.
//   flushat(s)  - `s` is passed in a general-purpose register ("r" input, %0).
// Neither expansion ends in a semicolon; the caller supplies it
// (`flushall();`). A semicolon inside the macro would break
// `if (c) flushall(); else ...` and would be inconsistent with flushat.
// NOTE(review): no "memory" clobber is declared, so the compiler is not
// prevented from moving ordinary loads/stores across these statements —
// confirm that is intended for a flush operation.
#define flushall() __asm__ __volatile__("flushall")
#define flushat(s) __asm__ __volatile__(ARGS_F_A("flushat", %0) : : "r"(s))
// getmaxvl / getvl: each macro emits one instruction that writes a scalar
// result into `d`.
//   d     - output operand ("=r", %0); must be a modifiable lvalue.
//   s, t  - scalar register inputs ("r"); %1 and %2 respectively when present.
// Variants:
//   getmaxvl_{b,h,w}[_m](d)        - no inputs.
//   getvl_{b,h,w}_x[_m](d, s)      - one input.
//   getvl_{b,h,w}_xx[_m](d, s, t)  - two inputs.
// No clobbers are declared.
// NOTE(review): b/h/w presumably select 8/16/32-bit element width and the `_m`
// suffix presumably selects the stripmine form — confirm against the Kelvin
// ISA spec.
#define getmaxvl_b(d) __asm__ __volatile__(ARGS_F_A("getmaxvl.b", %0) : "=r"(d) : )
#define getmaxvl_h(d) __asm__ __volatile__(ARGS_F_A("getmaxvl.h", %0) : "=r"(d) : )
#define getmaxvl_w(d) __asm__ __volatile__(ARGS_F_A("getmaxvl.w", %0) : "=r"(d) : )
#define getvl_b_x(d, s) __asm__ __volatile__(ARGS_F_A_A("getvl.b.x", %0, %1) : "=r"(d) : "r"(s))
#define getvl_h_x(d, s) __asm__ __volatile__(ARGS_F_A_A("getvl.h.x", %0, %1) : "=r"(d) : "r"(s))
#define getvl_w_x(d, s) __asm__ __volatile__(ARGS_F_A_A("getvl.w.x", %0, %1) : "=r"(d) : "r"(s))
#define getvl_b_xx(d, s, t) __asm__ __volatile__(ARGS_F_A_A_A("getvl.b.xx", %0, %1, %2) : "=r"(d) : "r"(s), "r"(t))
#define getvl_h_xx(d, s, t) __asm__ __volatile__(ARGS_F_A_A_A("getvl.h.xx", %0, %1, %2) : "=r"(d) : "r"(s), "r"(t))
#define getvl_w_xx(d, s, t) __asm__ __volatile__(ARGS_F_A_A_A("getvl.w.xx", %0, %1, %2) : "=r"(d) : "r"(s), "r"(t))
#define getmaxvl_b_m(d) __asm__ __volatile__(ARGS_F_A("getmaxvl.b.m", %0) : "=r"(d) : )
#define getmaxvl_h_m(d) __asm__ __volatile__(ARGS_F_A("getmaxvl.h.m", %0) : "=r"(d) : )
#define getmaxvl_w_m(d) __asm__ __volatile__(ARGS_F_A("getmaxvl.w.m", %0) : "=r"(d) : )
#define getvl_b_x_m(d, s) __asm__ __volatile__(ARGS_F_A_A("getvl.b.x.m", %0, %1) : "=r"(d) : "r"(s))
#define getvl_h_x_m(d, s) __asm__ __volatile__(ARGS_F_A_A("getvl.h.x.m", %0, %1) : "=r"(d) : "r"(s))
#define getvl_w_x_m(d, s) __asm__ __volatile__(ARGS_F_A_A("getvl.w.x.m", %0, %1) : "=r"(d) : "r"(s))
#define getvl_b_xx_m(d, s, t) __asm__ __volatile__(ARGS_F_A_A_A("getvl.b.xx.m", %0, %1, %2) : "=r"(d) : "r"(s), "r"(t))
#define getvl_h_xx_m(d, s, t) __asm__ __volatile__(ARGS_F_A_A_A("getvl.h.xx.m", %0, %1, %2) : "=r"(d) : "r"(s), "r"(t))
#define getvl_w_xx_m(d, s, t) __asm__ __volatile__(ARGS_F_A_A_A("getvl.w.xx.m", %0, %1, %2) : "=r"(d) : "r"(s), "r"(t))
// 111 Load/Store
// vld.b.*: vector loads, one instruction per macro. Every variant declares a
// "memory" clobber.
//   Vd  - passed straight to the ARGS_F_* helper (defined outside this
//         section); it is not bound as an asm operand, so the compiler is not
//         told which vector register is written.
//   s   - scalar register operand %0.
//   t   - scalar register input %1 (the `_xx` forms only).
// Operand direction by variant:
//   _x, _l_xx, _s_xx              - `s` (and `t`) are inputs only.
//   _p_x, _p_xx, _lp_xx, _sp_xx,
//   _tp_xx                        - `s` is both read and written ("=r"(s) tied
//                                   to input "0"(s)); it must be a modifiable
//                                   lvalue and holds a new value afterwards.
// NOTE(review): `p` presumably means post-increment of the address in `s`,
// l/s/t presumably length/stride modes, and `_m` the stripmine form — confirm
// against the Kelvin ISA spec.
#define vld_b_x(Vd, s) __asm__ __volatile_always__(ARGS_F_A_A("vld.b.x", Vd, %0) : : "r"(s) : "memory")
#define vld_b_p_x(Vd, s) __asm__ __volatile_always__(ARGS_F_A_A("vld.b.p.x", Vd, %0) : "=r"(s) : "0"(s) : "memory")
#define vld_b_l_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.b.l.xx", Vd, %0, %1) : : "r"(s), "r"(t) : "memory")
#define vld_b_s_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.b.s.xx", Vd, %0, %1) : : "r"(s), "r"(t) : "memory")
#define vld_b_p_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.b.p.xx", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vld_b_lp_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.b.lp.xx", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vld_b_sp_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.b.sp.xx", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vld_b_tp_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.b.tp.xx", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vld_b_x_m(Vd, s) __asm__ __volatile_always__(ARGS_F_A_A("vld.b.x.m", Vd, %0) : : "r"(s) : "memory")
#define vld_b_p_x_m(Vd, s) __asm__ __volatile_always__(ARGS_F_A_A("vld.b.p.x.m", Vd, %0) : "=r"(s) : "0"(s) : "memory")
#define vld_b_l_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.b.l.xx.m", Vd, %0, %1) : : "r"(s), "r"(t) : "memory")
#define vld_b_s_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.b.s.xx.m", Vd, %0, %1) : : "r"(s), "r"(t) : "memory")
#define vld_b_p_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.b.p.xx.m", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vld_b_lp_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.b.lp.xx.m", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vld_b_sp_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.b.sp.xx.m", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vld_b_tp_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.b.tp.xx.m", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
// vld.h.*: vector loads, one instruction per macro, each with a "memory"
// clobber. `Vd` is handed to the ARGS_F_* helper as-is (not an asm operand);
// `s` is scalar operand %0 and `t` (the `_xx` forms) is scalar input %1.
// In the `_p_x`, `_p_xx`, `_lp_xx`, `_sp_xx` and `_tp_xx` forms `s` is a tied
// input/output ("=r"(s) with "0"(s)), so it must be a modifiable lvalue and is
// overwritten; in the remaining forms `s` and `t` are read-only inputs.
// NOTE(review): suffix meanings (h = 16-bit elements, p = post-increment,
// _m = stripmine, ...) are presumed — confirm against the Kelvin ISA spec.
#define vld_h_x(Vd, s) __asm__ __volatile_always__(ARGS_F_A_A("vld.h.x", Vd, %0) : : "r"(s) : "memory")
#define vld_h_p_x(Vd, s) __asm__ __volatile_always__(ARGS_F_A_A("vld.h.p.x", Vd, %0) : "=r"(s) : "0"(s) : "memory")
#define vld_h_l_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.h.l.xx", Vd, %0, %1) : : "r"(s), "r"(t) : "memory")
#define vld_h_s_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.h.s.xx", Vd, %0, %1) : : "r"(s), "r"(t) : "memory")
#define vld_h_p_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.h.p.xx", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vld_h_lp_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.h.lp.xx", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vld_h_sp_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.h.sp.xx", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vld_h_tp_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.h.tp.xx", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vld_h_x_m(Vd, s) __asm__ __volatile_always__(ARGS_F_A_A("vld.h.x.m", Vd, %0) : : "r"(s) : "memory")
#define vld_h_p_x_m(Vd, s) __asm__ __volatile_always__(ARGS_F_A_A("vld.h.p.x.m", Vd, %0) : "=r"(s) : "0"(s) : "memory")
#define vld_h_l_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.h.l.xx.m", Vd, %0, %1) : : "r"(s), "r"(t) : "memory")
#define vld_h_s_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.h.s.xx.m", Vd, %0, %1) : : "r"(s), "r"(t) : "memory")
#define vld_h_p_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.h.p.xx.m", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vld_h_lp_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.h.lp.xx.m", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vld_h_sp_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.h.sp.xx.m", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vld_h_tp_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.h.tp.xx.m", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
// vld.w.*: vector loads, one instruction per macro, each with a "memory"
// clobber. `Vd` is handed to the ARGS_F_* helper as-is (not an asm operand);
// `s` is scalar operand %0 and `t` (the `_xx` forms) is scalar input %1.
// In the `_p_x`, `_p_xx`, `_lp_xx`, `_sp_xx` and `_tp_xx` forms `s` is a tied
// input/output ("=r"(s) with "0"(s)), so it must be a modifiable lvalue and is
// overwritten; in the remaining forms `s` and `t` are read-only inputs.
// NOTE(review): suffix meanings (w = 32-bit elements, p = post-increment,
// _m = stripmine, ...) are presumed — confirm against the Kelvin ISA spec.
#define vld_w_x(Vd, s) __asm__ __volatile_always__(ARGS_F_A_A("vld.w.x", Vd, %0) : : "r"(s) : "memory")
#define vld_w_p_x(Vd, s) __asm__ __volatile_always__(ARGS_F_A_A("vld.w.p.x", Vd, %0) : "=r"(s) : "0"(s) : "memory")
#define vld_w_l_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.w.l.xx", Vd, %0, %1) : : "r"(s), "r"(t) : "memory")
#define vld_w_s_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.w.s.xx", Vd, %0, %1) : : "r"(s), "r"(t) : "memory")
#define vld_w_p_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.w.p.xx", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vld_w_lp_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.w.lp.xx", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vld_w_sp_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.w.sp.xx", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vld_w_tp_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.w.tp.xx", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vld_w_x_m(Vd, s) __asm__ __volatile_always__(ARGS_F_A_A("vld.w.x.m", Vd, %0) : : "r"(s) : "memory")
#define vld_w_p_x_m(Vd, s) __asm__ __volatile_always__(ARGS_F_A_A("vld.w.p.x.m", Vd, %0) : "=r"(s) : "0"(s) : "memory")
#define vld_w_l_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.w.l.xx.m", Vd, %0, %1) : : "r"(s), "r"(t) : "memory")
#define vld_w_s_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.w.s.xx.m", Vd, %0, %1) : : "r"(s), "r"(t) : "memory")
#define vld_w_p_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.w.p.xx.m", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vld_w_lp_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.w.lp.xx.m", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vld_w_sp_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.w.sp.xx.m", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vld_w_tp_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vld.w.tp.xx.m", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
// vst.b.*: vector stores, one instruction per macro. Every variant declares a
// "memory" clobber.
//   Vd  - passed straight to the ARGS_F_* helper (defined outside this
//         section); it is not bound as an asm operand. The parameter keeps the
//         name `Vd` even though these are stores.
//   s   - scalar register operand %0.
//   t   - scalar register input %1 (the `_xx` forms only).
// Operand direction by variant:
//   _x, _l_xx, _s_xx              - `s` (and `t`) are inputs only.
//   _p_x, _p_xx, _lp_xx, _sp_xx,
//   _tp_xx                        - `s` is both read and written ("=r"(s) tied
//                                   to input "0"(s)); it must be a modifiable
//                                   lvalue and holds a new value afterwards.
// NOTE(review): `p` presumably means post-increment of the address in `s`,
// l/s/t presumably length/stride modes, and `_m` the stripmine form — confirm
// against the Kelvin ISA spec.
#define vst_b_x(Vd, s) __asm__ __volatile_always__(ARGS_F_A_A("vst.b.x", Vd, %0) : : "r"(s) : "memory")
#define vst_b_p_x(Vd, s) __asm__ __volatile_always__(ARGS_F_A_A("vst.b.p.x", Vd, %0) : "=r"(s) : "0"(s) : "memory")
#define vst_b_l_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.b.l.xx", Vd, %0, %1) : : "r"(s), "r"(t) : "memory")
#define vst_b_s_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.b.s.xx", Vd, %0, %1) : : "r"(s), "r"(t) : "memory")
#define vst_b_p_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.b.p.xx", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vst_b_lp_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.b.lp.xx", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vst_b_sp_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.b.sp.xx", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vst_b_tp_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.b.tp.xx", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vst_b_x_m(Vd, s) __asm__ __volatile_always__(ARGS_F_A_A("vst.b.x.m", Vd, %0) : : "r"(s) : "memory")
#define vst_b_p_x_m(Vd, s) __asm__ __volatile_always__(ARGS_F_A_A("vst.b.p.x.m", Vd, %0) : "=r"(s) : "0"(s) : "memory")
#define vst_b_l_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.b.l.xx.m", Vd, %0, %1) : : "r"(s), "r"(t) : "memory")
#define vst_b_s_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.b.s.xx.m", Vd, %0, %1) : : "r"(s), "r"(t) : "memory")
#define vst_b_p_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.b.p.xx.m", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vst_b_lp_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.b.lp.xx.m", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vst_b_sp_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.b.sp.xx.m", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vst_b_tp_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.b.tp.xx.m", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
// vst.h.*: vector stores, one instruction per macro, each with a "memory"
// clobber. `Vd` is handed to the ARGS_F_* helper as-is (not an asm operand);
// `s` is scalar operand %0 and `t` (the `_xx` forms) is scalar input %1.
// In the `_p_x`, `_p_xx`, `_lp_xx`, `_sp_xx` and `_tp_xx` forms `s` is a tied
// input/output ("=r"(s) with "0"(s)), so it must be a modifiable lvalue and is
// overwritten; in the remaining forms `s` and `t` are read-only inputs.
// NOTE(review): suffix meanings (h = 16-bit elements, p = post-increment,
// _m = stripmine, ...) are presumed — confirm against the Kelvin ISA spec.
#define vst_h_x(Vd, s) __asm__ __volatile_always__(ARGS_F_A_A("vst.h.x", Vd, %0) : : "r"(s) : "memory")
#define vst_h_p_x(Vd, s) __asm__ __volatile_always__(ARGS_F_A_A("vst.h.p.x", Vd, %0) : "=r"(s) : "0"(s) : "memory")
#define vst_h_l_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.h.l.xx", Vd, %0, %1) : : "r"(s), "r"(t) : "memory")
#define vst_h_s_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.h.s.xx", Vd, %0, %1) : : "r"(s), "r"(t) : "memory")
#define vst_h_p_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.h.p.xx", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vst_h_lp_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.h.lp.xx", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vst_h_sp_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.h.sp.xx", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vst_h_tp_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.h.tp.xx", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vst_h_x_m(Vd, s) __asm__ __volatile_always__(ARGS_F_A_A("vst.h.x.m", Vd, %0) : : "r"(s) : "memory")
#define vst_h_p_x_m(Vd, s) __asm__ __volatile_always__(ARGS_F_A_A("vst.h.p.x.m", Vd, %0) : "=r"(s) : "0"(s) : "memory")
#define vst_h_l_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.h.l.xx.m", Vd, %0, %1) : : "r"(s), "r"(t) : "memory")
#define vst_h_s_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.h.s.xx.m", Vd, %0, %1) : : "r"(s), "r"(t) : "memory")
#define vst_h_p_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.h.p.xx.m", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vst_h_lp_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.h.lp.xx.m", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vst_h_sp_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.h.sp.xx.m", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vst_h_tp_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.h.tp.xx.m", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
// vst.w.*: vector stores, one instruction per macro, each with a "memory"
// clobber. `Vd` is handed to the ARGS_F_* helper as-is (not an asm operand);
// `s` is scalar operand %0 and `t` (the `_xx` forms) is scalar input %1.
// In the `_p_x`, `_p_xx`, `_lp_xx`, `_sp_xx` and `_tp_xx` forms `s` is a tied
// input/output ("=r"(s) with "0"(s)), so it must be a modifiable lvalue and is
// overwritten; in the remaining forms `s` and `t` are read-only inputs.
// NOTE(review): suffix meanings (w = 32-bit elements, p = post-increment,
// _m = stripmine, ...) are presumed — confirm against the Kelvin ISA spec.
#define vst_w_x(Vd, s) __asm__ __volatile_always__(ARGS_F_A_A("vst.w.x", Vd, %0) : : "r"(s) : "memory")
#define vst_w_p_x(Vd, s) __asm__ __volatile_always__(ARGS_F_A_A("vst.w.p.x", Vd, %0) : "=r"(s) : "0"(s) : "memory")
#define vst_w_l_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.w.l.xx", Vd, %0, %1) : : "r"(s), "r"(t) : "memory")
#define vst_w_s_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.w.s.xx", Vd, %0, %1) : : "r"(s), "r"(t) : "memory")
#define vst_w_p_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.w.p.xx", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vst_w_lp_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.w.lp.xx", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vst_w_sp_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.w.sp.xx", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vst_w_tp_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.w.tp.xx", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vst_w_x_m(Vd, s) __asm__ __volatile_always__(ARGS_F_A_A("vst.w.x.m", Vd, %0) : : "r"(s) : "memory")
#define vst_w_p_x_m(Vd, s) __asm__ __volatile_always__(ARGS_F_A_A("vst.w.p.x.m", Vd, %0) : "=r"(s) : "0"(s) : "memory")
#define vst_w_l_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.w.l.xx.m", Vd, %0, %1) : : "r"(s), "r"(t) : "memory")
#define vst_w_s_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.w.s.xx.m", Vd, %0, %1) : : "r"(s), "r"(t) : "memory")
#define vst_w_p_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.w.p.xx.m", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vst_w_lp_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.w.lp.xx.m", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vst_w_sp_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.w.sp.xx.m", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vst_w_tp_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vst.w.tp.xx.m", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
// vdup.{b,h,w}.x[.m] and vcget: one instruction per macro.
//   Vd - passed straight to the ARGS_F_* helper (defined outside this
//        section); not bound as an asm operand.
//   t  - scalar register input ("r", %0) for the vdup forms. vcget takes no
//        scalar operand.
// No outputs or clobbers are declared, and these use `__volatile__` rather
// than the `__volatile_always__` qualifier used by the load/store macros.
// NOTE(review): vdup presumably broadcasts `t` into every element of Vd —
// confirm against the Kelvin ISA spec; vcget's semantics are not visible here.
#define vdup_b_x(Vd, t) __asm__ __volatile__(ARGS_F_A_A("vdup.b.x", Vd, %0) : : "r"(t))
#define vdup_b_x_m(Vd, t) __asm__ __volatile__(ARGS_F_A_A("vdup.b.x.m", Vd, %0) : : "r"(t))
#define vdup_h_x(Vd, t) __asm__ __volatile__(ARGS_F_A_A("vdup.h.x", Vd, %0) : : "r"(t))
#define vdup_h_x_m(Vd, t) __asm__ __volatile__(ARGS_F_A_A("vdup.h.x.m", Vd, %0) : : "r"(t))
#define vdup_w_x(Vd, t) __asm__ __volatile__(ARGS_F_A_A("vdup.w.x", Vd, %0) : : "r"(t))
#define vdup_w_x_m(Vd, t) __asm__ __volatile__(ARGS_F_A_A("vdup.w.x.m", Vd, %0) : : "r"(t))
#define vcget(Vd) __asm__ __volatile__(ARGS_F_A("vcget", Vd) : : )
// vstq.{b,h,w}.{s,sp}.xx[.m]: one instruction per macro, each with a "memory"
// clobber. `Vd` is handed to the ARGS_F_A_A_A helper as-is (not an asm
// operand); `s` is scalar operand %0 and `t` is scalar input %1.
//   _s_xx  - `s` and `t` are read-only inputs.
//   _sp_xx - `s` is a tied input/output ("=r"(s) with "0"(s)); it must be a
//            modifiable lvalue and is overwritten.
// NOTE(review): presumably a quad/strided store variant of vst — confirm the
// exact semantics against the Kelvin ISA spec.
#define vstq_b_s_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vstq.b.s.xx", Vd, %0, %1) : : "r"(s), "r"(t) : "memory")
#define vstq_b_sp_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vstq.b.sp.xx", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vstq_b_s_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vstq.b.s.xx.m", Vd, %0, %1) : : "r"(s), "r"(t) : "memory")
#define vstq_b_sp_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vstq.b.sp.xx.m", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vstq_h_s_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vstq.h.s.xx", Vd, %0, %1) : : "r"(s), "r"(t) : "memory")
#define vstq_h_sp_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vstq.h.sp.xx", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vstq_h_s_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vstq.h.s.xx.m", Vd, %0, %1) : : "r"(s), "r"(t) : "memory")
#define vstq_h_sp_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vstq.h.sp.xx.m", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vstq_w_s_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vstq.w.s.xx", Vd, %0, %1) : : "r"(s), "r"(t) : "memory")
#define vstq_w_sp_xx(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vstq.w.sp.xx", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
#define vstq_w_s_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vstq.w.s.xx.m", Vd, %0, %1) : : "r"(s), "r"(t) : "memory")
#define vstq_w_sp_xx_m(Vd, s, t) __asm__ __volatile_always__(ARGS_F_A_A_A("vstq.w.sp.xx.m", Vd, %0, %1) : "=r"(s) : "r"(t), "0"(s) : "memory")
// 000 Arithmetic
// vadd / vsub / vrsub for b/h/w element sizes: one instruction per macro.
//   *_vv[_m](Vd, Vs, Vt) - all three names are passed straight to the
//                          ARGS_F_A_A_A helper (defined outside this section);
//                          the asm statement declares no operands or clobbers.
//   *_vx[_m](Vd, Vs, t)  - Vd and Vs are passed to the helper; scalar `t` is a
//                          register input ("r", %0).
// vrsub is provided in the `_vx` form only.
// Because no vector operand is bound, the compiler is not told which vector
// registers an instruction reads or writes.
// NOTE(review): vrsub presumably computes `t - Vs` (reverse subtract) and `_m`
// presumably selects the stripmine form — confirm against the Kelvin ISA spec.
#define vadd_b_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vadd.b.vv", Vd, Vs, Vt))
#define vadd_b_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vadd.b.vx", Vd, Vs, %0) : : "r"(t))
#define vadd_b_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vadd.b.vv.m", Vd, Vs, Vt))
#define vadd_b_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vadd.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vadd_h_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vadd.h.vv", Vd, Vs, Vt))
#define vadd_h_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vadd.h.vx", Vd, Vs, %0) : : "r"(t))
#define vadd_h_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vadd.h.vv.m", Vd, Vs, Vt))
#define vadd_h_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vadd.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vadd_w_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vadd.w.vv", Vd, Vs, Vt))
#define vadd_w_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vadd.w.vx", Vd, Vs, %0) : : "r"(t))
#define vadd_w_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vadd.w.vv.m", Vd, Vs, Vt))
#define vadd_w_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vadd.w.vx.m", Vd, Vs, %0) : : "r"(t))
#define vsub_b_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsub.b.vv", Vd, Vs, Vt))
#define vsub_b_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsub.b.vx", Vd, Vs, %0) : : "r"(t))
#define vsub_b_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsub.b.vv.m", Vd, Vs, Vt))
#define vsub_b_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsub.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vsub_h_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsub.h.vv", Vd, Vs, Vt))
#define vsub_h_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsub.h.vx", Vd, Vs, %0) : : "r"(t))
#define vsub_h_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsub.h.vv.m", Vd, Vs, Vt))
#define vsub_h_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsub.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vsub_w_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsub.w.vv", Vd, Vs, Vt))
#define vsub_w_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsub.w.vx", Vd, Vs, %0) : : "r"(t))
#define vsub_w_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsub.w.vv.m", Vd, Vs, Vt))
#define vsub_w_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsub.w.vx.m", Vd, Vs, %0) : : "r"(t))
#define vrsub_b_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vrsub.b.vx", Vd, Vs, %0) : : "r"(t))
#define vrsub_b_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vrsub.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vrsub_h_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vrsub.h.vx", Vd, Vs, %0) : : "r"(t))
#define vrsub_h_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vrsub.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vrsub_w_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vrsub.w.vx", Vd, Vs, %0) : : "r"(t))
#define vrsub_w_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vrsub.w.vx.m", Vd, Vs, %0) : : "r"(t))
// veq / vne for b/h/w element sizes: one instruction per macro.
//   *_vv[_m](Vd, Vs, Vt) - all three names go straight to the ARGS_F_A_A_A
//                          helper; no asm operands or clobbers are declared.
//   *_vx[_m](Vd, Vs, t)  - Vd and Vs go to the helper; scalar `t` is a
//                          register input ("r", %0).
// NOTE(review): presumably element-wise equal / not-equal comparisons writing
// a per-element result into Vd — confirm the result encoding against the
// Kelvin ISA spec.
#define veq_b_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("veq.b.vv", Vd, Vs, Vt))
#define veq_b_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("veq.b.vx", Vd, Vs, %0) : : "r"(t))
#define veq_b_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("veq.b.vv.m", Vd, Vs, Vt))
#define veq_b_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("veq.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define veq_h_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("veq.h.vv", Vd, Vs, Vt))
#define veq_h_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("veq.h.vx", Vd, Vs, %0) : : "r"(t))
#define veq_h_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("veq.h.vv.m", Vd, Vs, Vt))
#define veq_h_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("veq.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define veq_w_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("veq.w.vv", Vd, Vs, Vt))
#define veq_w_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("veq.w.vx", Vd, Vs, %0) : : "r"(t))
#define veq_w_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("veq.w.vv.m", Vd, Vs, Vt))
#define veq_w_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("veq.w.vx.m", Vd, Vs, %0) : : "r"(t))
#define vne_b_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vne.b.vv", Vd, Vs, Vt))
#define vne_b_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vne.b.vx", Vd, Vs, %0) : : "r"(t))
#define vne_b_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vne.b.vv.m", Vd, Vs, Vt))
#define vne_b_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vne.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vne_h_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vne.h.vv", Vd, Vs, Vt))
#define vne_h_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vne.h.vx", Vd, Vs, %0) : : "r"(t))
#define vne_h_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vne.h.vv.m", Vd, Vs, Vt))
#define vne_h_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vne.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vne_w_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vne.w.vv", Vd, Vs, Vt))
#define vne_w_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vne.w.vx", Vd, Vs, %0) : : "r"(t))
#define vne_w_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vne.w.vv.m", Vd, Vs, Vt))
#define vne_w_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vne.w.vx.m", Vd, Vs, %0) : : "r"(t))
// vlt for b/h/w element sizes, with and without the `.u` modifier: one
// instruction per macro.
//   *_vv[_m](Vd, Vs, Vt) - all three names go straight to the ARGS_F_A_A_A
//                          helper; no asm operands or clobbers are declared.
//   *_vx[_m](Vd, Vs, t)  - Vd and Vs go to the helper; scalar `t` is a
//                          register input ("r", %0).
// NOTE(review): presumably element-wise "less than", with `_u` selecting the
// unsigned comparison — confirm against the Kelvin ISA spec.
#define vlt_b_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vlt.b.vv", Vd, Vs, Vt))
#define vlt_b_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vlt.b.vx", Vd, Vs, %0) : : "r"(t))
#define vlt_b_u_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vlt.b.u.vv", Vd, Vs, Vt))
#define vlt_b_u_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vlt.b.u.vx", Vd, Vs, %0) : : "r"(t))
#define vlt_b_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vlt.b.vv.m", Vd, Vs, Vt))
#define vlt_b_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vlt.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vlt_b_u_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vlt.b.u.vv.m", Vd, Vs, Vt))
#define vlt_b_u_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vlt.b.u.vx.m", Vd, Vs, %0) : : "r"(t))
#define vlt_h_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vlt.h.vv", Vd, Vs, Vt))
#define vlt_h_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vlt.h.vx", Vd, Vs, %0) : : "r"(t))
#define vlt_h_u_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vlt.h.u.vv", Vd, Vs, Vt))
#define vlt_h_u_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vlt.h.u.vx", Vd, Vs, %0) : : "r"(t))
#define vlt_h_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vlt.h.vv.m", Vd, Vs, Vt))
#define vlt_h_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vlt.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vlt_h_u_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vlt.h.u.vv.m", Vd, Vs, Vt))
#define vlt_h_u_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vlt.h.u.vx.m", Vd, Vs, %0) : : "r"(t))
#define vlt_w_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vlt.w.vv", Vd, Vs, Vt))
#define vlt_w_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vlt.w.vx", Vd, Vs, %0) : : "r"(t))
#define vlt_w_u_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vlt.w.u.vv", Vd, Vs, Vt))
#define vlt_w_u_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vlt.w.u.vx", Vd, Vs, %0) : : "r"(t))
#define vlt_w_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vlt.w.vv.m", Vd, Vs, Vt))
#define vlt_w_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vlt.w.vx.m", Vd, Vs, %0) : : "r"(t))
#define vlt_w_u_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vlt.w.u.vv.m", Vd, Vs, Vt))
#define vlt_w_u_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vlt.w.u.vx.m", Vd, Vs, %0) : : "r"(t))
// vle for b/h/w element sizes, with and without the `.u` modifier: one
// instruction per macro.
//   *_vv[_m](Vd, Vs, Vt) - all three names go straight to the ARGS_F_A_A_A
//                          helper; no asm operands or clobbers are declared.
//   *_vx[_m](Vd, Vs, t)  - Vd and Vs go to the helper; scalar `t` is a
//                          register input ("r", %0).
// NOTE(review): presumably element-wise "less than or equal", with `_u`
// selecting the unsigned comparison — confirm against the Kelvin ISA spec.
#define vle_b_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vle.b.vv", Vd, Vs, Vt))
#define vle_b_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vle.b.vx", Vd, Vs, %0) : : "r"(t))
#define vle_b_u_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vle.b.u.vv", Vd, Vs, Vt))
#define vle_b_u_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vle.b.u.vx", Vd, Vs, %0) : : "r"(t))
#define vle_b_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vle.b.vv.m", Vd, Vs, Vt))
#define vle_b_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vle.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vle_b_u_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vle.b.u.vv.m", Vd, Vs, Vt))
#define vle_b_u_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vle.b.u.vx.m", Vd, Vs, %0) : : "r"(t))
#define vle_h_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vle.h.vv", Vd, Vs, Vt))
#define vle_h_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vle.h.vx", Vd, Vs, %0) : : "r"(t))
#define vle_h_u_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vle.h.u.vv", Vd, Vs, Vt))
#define vle_h_u_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vle.h.u.vx", Vd, Vs, %0) : : "r"(t))
#define vle_h_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vle.h.vv.m", Vd, Vs, Vt))
#define vle_h_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vle.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vle_h_u_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vle.h.u.vv.m", Vd, Vs, Vt))
#define vle_h_u_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vle.h.u.vx.m", Vd, Vs, %0) : : "r"(t))
#define vle_w_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vle.w.vv", Vd, Vs, Vt))
#define vle_w_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vle.w.vx", Vd, Vs, %0) : : "r"(t))
#define vle_w_u_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vle.w.u.vv", Vd, Vs, Vt))
#define vle_w_u_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vle.w.u.vx", Vd, Vs, %0) : : "r"(t))
#define vle_w_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vle.w.vv.m", Vd, Vs, Vt))
#define vle_w_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vle.w.vx.m", Vd, Vs, %0) : : "r"(t))
#define vle_w_u_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vle.w.u.vv.m", Vd, Vs, Vt))
#define vle_w_u_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vle.w.u.vx.m", Vd, Vs, %0) : : "r"(t))
// vgt for b/h/w element sizes, with and without the `.u` modifier: one
// instruction per macro.
//   *_vv[_m](Vd, Vs, Vt) - all three names go straight to the ARGS_F_A_A_A
//                          helper; no asm operands or clobbers are declared.
//   *_vx[_m](Vd, Vs, t)  - Vd and Vs go to the helper; scalar `t` is a
//                          register input ("r", %0).
// NOTE(review): presumably element-wise "greater than", with `_u` selecting
// the unsigned comparison — confirm against the Kelvin ISA spec.
#define vgt_b_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vgt.b.vv", Vd, Vs, Vt))
#define vgt_b_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vgt.b.vx", Vd, Vs, %0) : : "r"(t))
#define vgt_b_u_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vgt.b.u.vv", Vd, Vs, Vt))
#define vgt_b_u_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vgt.b.u.vx", Vd, Vs, %0) : : "r"(t))
#define vgt_b_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vgt.b.vv.m", Vd, Vs, Vt))
#define vgt_b_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vgt.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vgt_b_u_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vgt.b.u.vv.m", Vd, Vs, Vt))
#define vgt_b_u_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vgt.b.u.vx.m", Vd, Vs, %0) : : "r"(t))
#define vgt_h_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vgt.h.vv", Vd, Vs, Vt))
#define vgt_h_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vgt.h.vx", Vd, Vs, %0) : : "r"(t))
#define vgt_h_u_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vgt.h.u.vv", Vd, Vs, Vt))
#define vgt_h_u_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vgt.h.u.vx", Vd, Vs, %0) : : "r"(t))
#define vgt_h_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vgt.h.vv.m", Vd, Vs, Vt))
#define vgt_h_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vgt.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vgt_h_u_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vgt.h.u.vv.m", Vd, Vs, Vt))
#define vgt_h_u_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vgt.h.u.vx.m", Vd, Vs, %0) : : "r"(t))
#define vgt_w_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vgt.w.vv", Vd, Vs, Vt))
#define vgt_w_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vgt.w.vx", Vd, Vs, %0) : : "r"(t))
#define vgt_w_u_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vgt.w.u.vv", Vd, Vs, Vt))
#define vgt_w_u_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vgt.w.u.vx", Vd, Vs, %0) : : "r"(t))
#define vgt_w_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vgt.w.vv.m", Vd, Vs, Vt))
#define vgt_w_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vgt.w.vx.m", Vd, Vs, %0) : : "r"(t))
#define vgt_w_u_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vgt.w.u.vv.m", Vd, Vs, Vt))
#define vgt_w_u_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vgt.w.u.vx.m", Vd, Vs, %0) : : "r"(t))
// vge for b/h/w element sizes, with and without the `.u` modifier: one
// instruction per macro.
//   *_vv[_m](Vd, Vs, Vt) - all three names go straight to the ARGS_F_A_A_A
//                          helper; no asm operands or clobbers are declared.
//   *_vx[_m](Vd, Vs, t)  - Vd and Vs go to the helper; scalar `t` is a
//                          register input ("r", %0).
// NOTE(review): presumably element-wise "greater than or equal", with `_u`
// selecting the unsigned comparison — confirm against the Kelvin ISA spec.
#define vge_b_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vge.b.vv", Vd, Vs, Vt))
#define vge_b_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vge.b.vx", Vd, Vs, %0) : : "r"(t))
#define vge_b_u_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vge.b.u.vv", Vd, Vs, Vt))
#define vge_b_u_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vge.b.u.vx", Vd, Vs, %0) : : "r"(t))
#define vge_b_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vge.b.vv.m", Vd, Vs, Vt))
#define vge_b_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vge.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vge_b_u_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vge.b.u.vv.m", Vd, Vs, Vt))
#define vge_b_u_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vge.b.u.vx.m", Vd, Vs, %0) : : "r"(t))
#define vge_h_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vge.h.vv", Vd, Vs, Vt))
#define vge_h_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vge.h.vx", Vd, Vs, %0) : : "r"(t))
#define vge_h_u_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vge.h.u.vv", Vd, Vs, Vt))
#define vge_h_u_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vge.h.u.vx", Vd, Vs, %0) : : "r"(t))
#define vge_h_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vge.h.vv.m", Vd, Vs, Vt))
#define vge_h_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vge.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vge_h_u_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vge.h.u.vv.m", Vd, Vs, Vt))
#define vge_h_u_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vge.h.u.vx.m", Vd, Vs, %0) : : "r"(t))
#define vge_w_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vge.w.vv", Vd, Vs, Vt))
#define vge_w_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vge.w.vx", Vd, Vs, %0) : : "r"(t))
#define vge_w_u_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vge.w.u.vv", Vd, Vs, Vt))
#define vge_w_u_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vge.w.u.vx", Vd, Vs, %0) : : "r"(t))
#define vge_w_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vge.w.vv.m", Vd, Vs, Vt))
#define vge_w_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vge.w.vx.m", Vd, Vs, %0) : : "r"(t))
#define vge_w_u_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vge.w.u.vv.m", Vd, Vs, Vt))
#define vge_w_u_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vge.w.u.vx.m", Vd, Vs, %0) : : "r"(t))
// vabsd.{b,h,w}[.u].{vv,vx}[.m] wrappers; macro names mirror the mnemonics
// with '.' written as '_'. Register-register (.vv) forms hand Vd, Vs, Vt to
// ARGS_F_A_A_A as-is; register-scalar (.vx) forms reference `t` as %0, an "r"
// input operand of the asm statement.
#define vabsd_b_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vabsd.b.vv", Vd, Vs, Vt))
#define vabsd_b_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vabsd.b.vx", Vd, Vs, %0) : : "r"(t))
#define vabsd_b_u_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vabsd.b.u.vv", Vd, Vs, Vt))
#define vabsd_b_u_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vabsd.b.u.vx", Vd, Vs, %0) : : "r"(t))
#define vabsd_b_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vabsd.b.vv.m", Vd, Vs, Vt))
#define vabsd_b_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vabsd.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vabsd_b_u_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vabsd.b.u.vv.m", Vd, Vs, Vt))
#define vabsd_b_u_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vabsd.b.u.vx.m", Vd, Vs, %0) : : "r"(t))
#define vabsd_h_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vabsd.h.vv", Vd, Vs, Vt))
#define vabsd_h_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vabsd.h.vx", Vd, Vs, %0) : : "r"(t))
#define vabsd_h_u_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vabsd.h.u.vv", Vd, Vs, Vt))
#define vabsd_h_u_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vabsd.h.u.vx", Vd, Vs, %0) : : "r"(t))
#define vabsd_h_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vabsd.h.vv.m", Vd, Vs, Vt))
#define vabsd_h_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vabsd.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vabsd_h_u_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vabsd.h.u.vv.m", Vd, Vs, Vt))
#define vabsd_h_u_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vabsd.h.u.vx.m", Vd, Vs, %0) : : "r"(t))
#define vabsd_w_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vabsd.w.vv", Vd, Vs, Vt))
#define vabsd_w_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vabsd.w.vx", Vd, Vs, %0) : : "r"(t))
#define vabsd_w_u_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vabsd.w.u.vv", Vd, Vs, Vt))
#define vabsd_w_u_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vabsd.w.u.vx", Vd, Vs, %0) : : "r"(t))
#define vabsd_w_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vabsd.w.vv.m", Vd, Vs, Vt))
#define vabsd_w_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vabsd.w.vx.m", Vd, Vs, %0) : : "r"(t))
#define vabsd_w_u_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vabsd.w.u.vv.m", Vd, Vs, Vt))
#define vabsd_w_u_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vabsd.w.u.vx.m", Vd, Vs, %0) : : "r"(t))
// vmax.{b,h,w}[.u].{vv,vx}[.m] wrappers. Naming rule: macro name == mnemonic
// with '.' -> '_'. `.vv` variants take three operands that are forwarded
// verbatim to ARGS_F_A_A_A; `.vx` variants take two plus a value `t` that is
// supplied to the asm statement as "r" input operand %0.
#define vmax_b_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmax.b.vv", Vd, Vs, Vt))
#define vmax_b_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmax.b.vx", Vd, Vs, %0) : : "r"(t))
#define vmax_b_u_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmax.b.u.vv", Vd, Vs, Vt))
#define vmax_b_u_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmax.b.u.vx", Vd, Vs, %0) : : "r"(t))
#define vmax_b_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmax.b.vv.m", Vd, Vs, Vt))
#define vmax_b_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmax.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmax_b_u_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmax.b.u.vv.m", Vd, Vs, Vt))
#define vmax_b_u_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmax.b.u.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmax_h_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmax.h.vv", Vd, Vs, Vt))
#define vmax_h_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmax.h.vx", Vd, Vs, %0) : : "r"(t))
#define vmax_h_u_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmax.h.u.vv", Vd, Vs, Vt))
#define vmax_h_u_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmax.h.u.vx", Vd, Vs, %0) : : "r"(t))
#define vmax_h_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmax.h.vv.m", Vd, Vs, Vt))
#define vmax_h_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmax.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmax_h_u_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmax.h.u.vv.m", Vd, Vs, Vt))
#define vmax_h_u_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmax.h.u.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmax_w_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmax.w.vv", Vd, Vs, Vt))
#define vmax_w_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmax.w.vx", Vd, Vs, %0) : : "r"(t))
#define vmax_w_u_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmax.w.u.vv", Vd, Vs, Vt))
#define vmax_w_u_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmax.w.u.vx", Vd, Vs, %0) : : "r"(t))
#define vmax_w_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmax.w.vv.m", Vd, Vs, Vt))
#define vmax_w_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmax.w.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmax_w_u_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmax.w.u.vv.m", Vd, Vs, Vt))
#define vmax_w_u_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmax.w.u.vx.m", Vd, Vs, %0) : : "r"(t))
// vmin.{b,h,w}[.u].{vv,vx}[.m] wrappers, one per mnemonic ('.' in the
// mnemonic becomes '_' in the macro name). Operands named Vd/Vs/Vt are passed
// through to ARGS_F_A_A_A untouched; in the .vx forms the last template
// operand is %0, which the asm statement ties to `t` with an "r" constraint.
#define vmin_b_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmin.b.vv", Vd, Vs, Vt))
#define vmin_b_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmin.b.vx", Vd, Vs, %0) : : "r"(t))
#define vmin_b_u_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmin.b.u.vv", Vd, Vs, Vt))
#define vmin_b_u_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmin.b.u.vx", Vd, Vs, %0) : : "r"(t))
#define vmin_b_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmin.b.vv.m", Vd, Vs, Vt))
#define vmin_b_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmin.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmin_b_u_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmin.b.u.vv.m", Vd, Vs, Vt))
#define vmin_b_u_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmin.b.u.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmin_h_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmin.h.vv", Vd, Vs, Vt))
#define vmin_h_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmin.h.vx", Vd, Vs, %0) : : "r"(t))
#define vmin_h_u_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmin.h.u.vv", Vd, Vs, Vt))
#define vmin_h_u_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmin.h.u.vx", Vd, Vs, %0) : : "r"(t))
#define vmin_h_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmin.h.vv.m", Vd, Vs, Vt))
#define vmin_h_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmin.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmin_h_u_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmin.h.u.vv.m", Vd, Vs, Vt))
#define vmin_h_u_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmin.h.u.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmin_w_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmin.w.vv", Vd, Vs, Vt))
#define vmin_w_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmin.w.vx", Vd, Vs, %0) : : "r"(t))
#define vmin_w_u_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmin.w.u.vv", Vd, Vs, Vt))
#define vmin_w_u_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmin.w.u.vx", Vd, Vs, %0) : : "r"(t))
#define vmin_w_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmin.w.vv.m", Vd, Vs, Vt))
#define vmin_w_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmin.w.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmin_w_u_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmin.w.u.vv.m", Vd, Vs, Vt))
#define vmin_w_u_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmin.w.u.vx.m", Vd, Vs, %0) : : "r"(t))
// vadd3.{b,h,w}.{vv,vx}[.m] wrappers (no ".u" variants are defined for this
// family). The .vv forms forward Vd, Vs, Vt to ARGS_F_A_A_A unchanged; the
// .vx forms pass %0 in the last slot and feed `t` in as an "r" input operand.
#define vadd3_b_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadd3.b.vv", Vd, Vs, Vt))
#define vadd3_b_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadd3.b.vx", Vd, Vs, %0) : : "r"(t))
#define vadd3_b_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadd3.b.vv.m", Vd, Vs, Vt))
#define vadd3_b_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadd3.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vadd3_h_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadd3.h.vv", Vd, Vs, Vt))
#define vadd3_h_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadd3.h.vx", Vd, Vs, %0) : : "r"(t))
#define vadd3_h_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadd3.h.vv.m", Vd, Vs, Vt))
#define vadd3_h_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadd3.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vadd3_w_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadd3.w.vv", Vd, Vs, Vt))
#define vadd3_w_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadd3.w.vx", Vd, Vs, %0) : : "r"(t))
#define vadd3_w_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadd3.w.vv.m", Vd, Vs, Vt))
#define vadd3_w_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadd3.w.vx.m", Vd, Vs, %0) : : "r"(t))
// 100 Arithmetic2
// vadds.{b,h,w}[.u].{vv,vx}[.m] wrappers; macro names are the mnemonics with
// '.' spelled '_'. Three-register (.vv) forms forward Vd, Vs, Vt unchanged to
// ARGS_F_A_A_A; .vx forms substitute %0 for the third operand and bind `t` to
// it via an "r" input constraint.
#define vadds_b_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadds.b.vv", Vd, Vs, Vt))
#define vadds_b_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadds.b.vx", Vd, Vs, %0) : : "r"(t))
#define vadds_b_u_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadds.b.u.vv", Vd, Vs, Vt))
#define vadds_b_u_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadds.b.u.vx", Vd, Vs, %0) : : "r"(t))
#define vadds_b_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadds.b.vv.m", Vd, Vs, Vt))
#define vadds_b_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadds.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vadds_b_u_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadds.b.u.vv.m", Vd, Vs, Vt))
#define vadds_b_u_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadds.b.u.vx.m", Vd, Vs, %0) : : "r"(t))
#define vadds_h_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadds.h.vv", Vd, Vs, Vt))
#define vadds_h_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadds.h.vx", Vd, Vs, %0) : : "r"(t))
#define vadds_h_u_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadds.h.u.vv", Vd, Vs, Vt))
#define vadds_h_u_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadds.h.u.vx", Vd, Vs, %0) : : "r"(t))
#define vadds_h_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadds.h.vv.m", Vd, Vs, Vt))
#define vadds_h_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadds.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vadds_h_u_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadds.h.u.vv.m", Vd, Vs, Vt))
#define vadds_h_u_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadds.h.u.vx.m", Vd, Vs, %0) : : "r"(t))
#define vadds_w_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadds.w.vv", Vd, Vs, Vt))
#define vadds_w_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadds.w.vx", Vd, Vs, %0) : : "r"(t))
#define vadds_w_u_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadds.w.u.vv", Vd, Vs, Vt))
#define vadds_w_u_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadds.w.u.vx", Vd, Vs, %0) : : "r"(t))
#define vadds_w_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadds.w.vv.m", Vd, Vs, Vt))
#define vadds_w_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadds.w.vx.m", Vd, Vs, %0) : : "r"(t))
#define vadds_w_u_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadds.w.u.vv.m", Vd, Vs, Vt))
#define vadds_w_u_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vadds.w.u.vx.m", Vd, Vs, %0) : : "r"(t))
// vsubs.{b,h,w}[.u].{vv,vx}[.m] wrappers, named after their mnemonics
// ('.' -> '_'). .vv: Vd, Vs, Vt go to ARGS_F_A_A_A as written by the caller.
// .vx: the third template operand is %0 and `t` is the matching "r" input.
#define vsubs_b_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubs.b.vv", Vd, Vs, Vt))
#define vsubs_b_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubs.b.vx", Vd, Vs, %0) : : "r"(t))
#define vsubs_b_u_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubs.b.u.vv", Vd, Vs, Vt))
#define vsubs_b_u_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubs.b.u.vx", Vd, Vs, %0) : : "r"(t))
#define vsubs_b_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubs.b.vv.m", Vd, Vs, Vt))
#define vsubs_b_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubs.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vsubs_b_u_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubs.b.u.vv.m", Vd, Vs, Vt))
#define vsubs_b_u_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubs.b.u.vx.m", Vd, Vs, %0) : : "r"(t))
#define vsubs_h_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubs.h.vv", Vd, Vs, Vt))
#define vsubs_h_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubs.h.vx", Vd, Vs, %0) : : "r"(t))
#define vsubs_h_u_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubs.h.u.vv", Vd, Vs, Vt))
#define vsubs_h_u_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubs.h.u.vx", Vd, Vs, %0) : : "r"(t))
#define vsubs_h_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubs.h.vv.m", Vd, Vs, Vt))
#define vsubs_h_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubs.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vsubs_h_u_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubs.h.u.vv.m", Vd, Vs, Vt))
#define vsubs_h_u_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubs.h.u.vx.m", Vd, Vs, %0) : : "r"(t))
#define vsubs_w_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubs.w.vv", Vd, Vs, Vt))
#define vsubs_w_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubs.w.vx", Vd, Vs, %0) : : "r"(t))
#define vsubs_w_u_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubs.w.u.vv", Vd, Vs, Vt))
#define vsubs_w_u_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubs.w.u.vx", Vd, Vs, %0) : : "r"(t))
#define vsubs_w_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubs.w.vv.m", Vd, Vs, Vt))
#define vsubs_w_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubs.w.vx.m", Vd, Vs, %0) : : "r"(t))
#define vsubs_w_u_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubs.w.u.vv.m", Vd, Vs, Vt))
#define vsubs_w_u_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubs.w.u.vx.m", Vd, Vs, %0) : : "r"(t))
// vaddw.{h,w}[.u].{vv,vx}[.m] wrappers (only ".h" and ".w" sizes are defined
// for this family). .vv forms forward Vd, Vs, Vt unchanged to ARGS_F_A_A_A;
// .vx forms use %0 as the last operand, bound to `t` by an "r" input.
#define vaddw_h_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vaddw.h.vv", Vd, Vs, Vt))
#define vaddw_h_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vaddw.h.vx", Vd, Vs, %0) : : "r"(t))
#define vaddw_h_u_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vaddw.h.u.vv", Vd, Vs, Vt))
#define vaddw_h_u_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vaddw.h.u.vx", Vd, Vs, %0) : : "r"(t))
#define vaddw_h_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vaddw.h.vv.m", Vd, Vs, Vt))
#define vaddw_h_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vaddw.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vaddw_h_u_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vaddw.h.u.vv.m", Vd, Vs, Vt))
#define vaddw_h_u_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vaddw.h.u.vx.m", Vd, Vs, %0) : : "r"(t))
#define vaddw_w_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vaddw.w.vv", Vd, Vs, Vt))
#define vaddw_w_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vaddw.w.vx", Vd, Vs, %0) : : "r"(t))
#define vaddw_w_u_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vaddw.w.u.vv", Vd, Vs, Vt))
#define vaddw_w_u_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vaddw.w.u.vx", Vd, Vs, %0) : : "r"(t))
#define vaddw_w_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vaddw.w.vv.m", Vd, Vs, Vt))
#define vaddw_w_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vaddw.w.vx.m", Vd, Vs, %0) : : "r"(t))
#define vaddw_w_u_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vaddw.w.u.vv.m", Vd, Vs, Vt))
#define vaddw_w_u_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vaddw.w.u.vx.m", Vd, Vs, %0) : : "r"(t))
// vsubw.{h,w}[.u].{vv,vx}[.m] wrappers (".h" and ".w" sizes only). Macro
// names mirror the mnemonics. Vd/Vs/Vt are forwarded as-is to ARGS_F_A_A_A;
// in .vx forms `t` is an "r" input operand referenced as %0.
#define vsubw_h_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubw.h.vv", Vd, Vs, Vt))
#define vsubw_h_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubw.h.vx", Vd, Vs, %0) : : "r"(t))
#define vsubw_h_u_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubw.h.u.vv", Vd, Vs, Vt))
#define vsubw_h_u_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubw.h.u.vx", Vd, Vs, %0) : : "r"(t))
#define vsubw_h_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubw.h.vv.m", Vd, Vs, Vt))
#define vsubw_h_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubw.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vsubw_h_u_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubw.h.u.vv.m", Vd, Vs, Vt))
#define vsubw_h_u_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubw.h.u.vx.m", Vd, Vs, %0) : : "r"(t))
#define vsubw_w_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubw.w.vv", Vd, Vs, Vt))
#define vsubw_w_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubw.w.vx", Vd, Vs, %0) : : "r"(t))
#define vsubw_w_u_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubw.w.u.vv", Vd, Vs, Vt))
#define vsubw_w_u_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubw.w.u.vx", Vd, Vs, %0) : : "r"(t))
#define vsubw_w_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubw.w.vv.m", Vd, Vs, Vt))
#define vsubw_w_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubw.w.vx.m", Vd, Vs, %0) : : "r"(t))
#define vsubw_w_u_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubw.w.u.vv.m", Vd, Vs, Vt))
#define vsubw_w_u_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsubw.w.u.vx.m", Vd, Vs, %0) : : "r"(t))
// vacc.{h,w}[.u].{vv,vx}[.m] wrappers (".h" and ".w" sizes only); each macro
// is named after its mnemonic with '.' replaced by '_'. .vv forms pass Vd,
// Vs, Vt straight to ARGS_F_A_A_A; .vx forms pass %0 last and supply `t` as
// the corresponding "r" input operand.
#define vacc_h_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vacc.h.vv", Vd, Vs, Vt))
#define vacc_h_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vacc.h.vx", Vd, Vs, %0) : : "r"(t))
#define vacc_h_u_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vacc.h.u.vv", Vd, Vs, Vt))
#define vacc_h_u_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vacc.h.u.vx", Vd, Vs, %0) : : "r"(t))
#define vacc_h_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vacc.h.vv.m", Vd, Vs, Vt))
#define vacc_h_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vacc.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vacc_h_u_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vacc.h.u.vv.m", Vd, Vs, Vt))
#define vacc_h_u_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vacc.h.u.vx.m", Vd, Vs, %0) : : "r"(t))
#define vacc_w_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vacc.w.vv", Vd, Vs, Vt))
#define vacc_w_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vacc.w.vx", Vd, Vs, %0) : : "r"(t))
#define vacc_w_u_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vacc.w.u.vv", Vd, Vs, Vt))
#define vacc_w_u_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vacc.w.u.vx", Vd, Vs, %0) : : "r"(t))
#define vacc_w_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vacc.w.vv.m", Vd, Vs, Vt))
#define vacc_w_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vacc.w.vx.m", Vd, Vs, %0) : : "r"(t))
#define vacc_w_u_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vacc.w.u.vv.m", Vd, Vs, Vt))
#define vacc_w_u_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vacc.w.u.vx.m", Vd, Vs, %0) : : "r"(t))
// vpadd.{h,w}[.u].v[.m] wrappers. These are two-operand forms: Vd and Vs are
// forwarded unchanged to ARGS_F_A_A (defined outside this section), whose
// expansion is used as the asm template. No asm input operands are declared.
#define vpadd_h_v(Vd, Vs) \
  __asm__ __volatile__(ARGS_F_A_A("vpadd.h.v", Vd, Vs))
#define vpadd_h_u_v(Vd, Vs) \
  __asm__ __volatile__(ARGS_F_A_A("vpadd.h.u.v", Vd, Vs))
#define vpadd_h_v_m(Vd, Vs) \
  __asm__ __volatile__(ARGS_F_A_A("vpadd.h.v.m", Vd, Vs))
#define vpadd_h_u_v_m(Vd, Vs) \
  __asm__ __volatile__(ARGS_F_A_A("vpadd.h.u.v.m", Vd, Vs))
#define vpadd_w_v(Vd, Vs) \
  __asm__ __volatile__(ARGS_F_A_A("vpadd.w.v", Vd, Vs))
#define vpadd_w_u_v(Vd, Vs) \
  __asm__ __volatile__(ARGS_F_A_A("vpadd.w.u.v", Vd, Vs))
#define vpadd_w_v_m(Vd, Vs) \
  __asm__ __volatile__(ARGS_F_A_A("vpadd.w.v.m", Vd, Vs))
#define vpadd_w_u_v_m(Vd, Vs) \
  __asm__ __volatile__(ARGS_F_A_A("vpadd.w.u.v.m", Vd, Vs))
// vpsub.{h,w}[.u].v[.m] wrappers. Two-operand forms: Vd and Vs are handed
// as-is to ARGS_F_A_A (defined outside this section), and its expansion is the
// asm template. The asm statements declare no inputs, outputs or clobbers.
#define vpsub_h_v(Vd, Vs) \
  __asm__ __volatile__(ARGS_F_A_A("vpsub.h.v", Vd, Vs))
#define vpsub_h_u_v(Vd, Vs) \
  __asm__ __volatile__(ARGS_F_A_A("vpsub.h.u.v", Vd, Vs))
#define vpsub_h_v_m(Vd, Vs) \
  __asm__ __volatile__(ARGS_F_A_A("vpsub.h.v.m", Vd, Vs))
#define vpsub_h_u_v_m(Vd, Vs) \
  __asm__ __volatile__(ARGS_F_A_A("vpsub.h.u.v.m", Vd, Vs))
#define vpsub_w_v(Vd, Vs) \
  __asm__ __volatile__(ARGS_F_A_A("vpsub.w.v", Vd, Vs))
#define vpsub_w_u_v(Vd, Vs) \
  __asm__ __volatile__(ARGS_F_A_A("vpsub.w.u.v", Vd, Vs))
#define vpsub_w_v_m(Vd, Vs) \
  __asm__ __volatile__(ARGS_F_A_A("vpsub.w.v.m", Vd, Vs))
#define vpsub_w_u_v_m(Vd, Vs) \
  __asm__ __volatile__(ARGS_F_A_A("vpsub.w.u.v.m", Vd, Vs))
// vhadd.{b,h,w}[.r|.u|.ur].{vv,vx}[.m] wrappers; macro names are the
// mnemonics with '.' written as '_'. The .vv forms forward Vd, Vs, Vt
// unchanged to ARGS_F_A_A_A (defined outside this section), whose expansion
// is the asm template. The .vx forms pass %0 as the last operand and bind `t`
// to it through an "r" input constraint.
#define vhadd_b_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.b.vv", Vd, Vs, Vt))
#define vhadd_b_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.b.vx", Vd, Vs, %0) : : "r"(t))
#define vhadd_b_r_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.b.r.vv", Vd, Vs, Vt))
#define vhadd_b_r_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.b.r.vx", Vd, Vs, %0) : : "r"(t))
#define vhadd_b_u_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.b.u.vv", Vd, Vs, Vt))
#define vhadd_b_u_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.b.u.vx", Vd, Vs, %0) : : "r"(t))
#define vhadd_b_ur_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.b.ur.vv", Vd, Vs, Vt))
#define vhadd_b_ur_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.b.ur.vx", Vd, Vs, %0) : : "r"(t))
#define vhadd_b_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.b.vv.m", Vd, Vs, Vt))
#define vhadd_b_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vhadd_b_r_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.b.r.vv.m", Vd, Vs, Vt))
#define vhadd_b_r_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.b.r.vx.m", Vd, Vs, %0) : : "r"(t))
#define vhadd_b_u_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.b.u.vv.m", Vd, Vs, Vt))
#define vhadd_b_u_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.b.u.vx.m", Vd, Vs, %0) : : "r"(t))
#define vhadd_b_ur_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.b.ur.vv.m", Vd, Vs, Vt))
#define vhadd_b_ur_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.b.ur.vx.m", Vd, Vs, %0) : : "r"(t))
#define vhadd_h_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.h.vv", Vd, Vs, Vt))
#define vhadd_h_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.h.vx", Vd, Vs, %0) : : "r"(t))
#define vhadd_h_r_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.h.r.vv", Vd, Vs, Vt))
#define vhadd_h_r_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.h.r.vx", Vd, Vs, %0) : : "r"(t))
#define vhadd_h_u_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.h.u.vv", Vd, Vs, Vt))
#define vhadd_h_u_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.h.u.vx", Vd, Vs, %0) : : "r"(t))
#define vhadd_h_ur_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.h.ur.vv", Vd, Vs, Vt))
#define vhadd_h_ur_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.h.ur.vx", Vd, Vs, %0) : : "r"(t))
#define vhadd_h_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.h.vv.m", Vd, Vs, Vt))
#define vhadd_h_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vhadd_h_r_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.h.r.vv.m", Vd, Vs, Vt))
#define vhadd_h_r_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.h.r.vx.m", Vd, Vs, %0) : : "r"(t))
#define vhadd_h_u_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.h.u.vv.m", Vd, Vs, Vt))
#define vhadd_h_u_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.h.u.vx.m", Vd, Vs, %0) : : "r"(t))
#define vhadd_h_ur_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.h.ur.vv.m", Vd, Vs, Vt))
#define vhadd_h_ur_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.h.ur.vx.m", Vd, Vs, %0) : : "r"(t))
#define vhadd_w_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.w.vv", Vd, Vs, Vt))
#define vhadd_w_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.w.vx", Vd, Vs, %0) : : "r"(t))
#define vhadd_w_r_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.w.r.vv", Vd, Vs, Vt))
#define vhadd_w_r_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.w.r.vx", Vd, Vs, %0) : : "r"(t))
#define vhadd_w_u_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.w.u.vv", Vd, Vs, Vt))
#define vhadd_w_u_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.w.u.vx", Vd, Vs, %0) : : "r"(t))
#define vhadd_w_ur_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.w.ur.vv", Vd, Vs, Vt))
#define vhadd_w_ur_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.w.ur.vx", Vd, Vs, %0) : : "r"(t))
#define vhadd_w_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.w.vv.m", Vd, Vs, Vt))
#define vhadd_w_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.w.vx.m", Vd, Vs, %0) : : "r"(t))
#define vhadd_w_r_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.w.r.vv.m", Vd, Vs, Vt))
#define vhadd_w_r_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.w.r.vx.m", Vd, Vs, %0) : : "r"(t))
#define vhadd_w_u_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.w.u.vv.m", Vd, Vs, Vt))
#define vhadd_w_u_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.w.u.vx.m", Vd, Vs, %0) : : "r"(t))
#define vhadd_w_ur_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.w.ur.vv.m", Vd, Vs, Vt))
#define vhadd_w_ur_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhadd.w.ur.vx.m", Vd, Vs, %0) : : "r"(t))
// vhsub.{b,h,w}[.r|.u|.ur].{vv,vx}[.m] wrappers, one macro per mnemonic
// ('.' -> '_' in the macro name). .vv forms hand Vd, Vs, Vt to ARGS_F_A_A_A
// as written by the caller; .vx forms pass %0 in the third slot and supply
// `t` as the matching "r" input operand of the asm statement.
#define vhsub_b_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.b.vv", Vd, Vs, Vt))
#define vhsub_b_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.b.vx", Vd, Vs, %0) : : "r"(t))
#define vhsub_b_r_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.b.r.vv", Vd, Vs, Vt))
#define vhsub_b_r_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.b.r.vx", Vd, Vs, %0) : : "r"(t))
#define vhsub_b_u_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.b.u.vv", Vd, Vs, Vt))
#define vhsub_b_u_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.b.u.vx", Vd, Vs, %0) : : "r"(t))
#define vhsub_b_ur_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.b.ur.vv", Vd, Vs, Vt))
#define vhsub_b_ur_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.b.ur.vx", Vd, Vs, %0) : : "r"(t))
#define vhsub_b_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.b.vv.m", Vd, Vs, Vt))
#define vhsub_b_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vhsub_b_r_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.b.r.vv.m", Vd, Vs, Vt))
#define vhsub_b_r_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.b.r.vx.m", Vd, Vs, %0) : : "r"(t))
#define vhsub_b_u_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.b.u.vv.m", Vd, Vs, Vt))
#define vhsub_b_u_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.b.u.vx.m", Vd, Vs, %0) : : "r"(t))
#define vhsub_b_ur_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.b.ur.vv.m", Vd, Vs, Vt))
#define vhsub_b_ur_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.b.ur.vx.m", Vd, Vs, %0) : : "r"(t))
#define vhsub_h_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.h.vv", Vd, Vs, Vt))
#define vhsub_h_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.h.vx", Vd, Vs, %0) : : "r"(t))
#define vhsub_h_r_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.h.r.vv", Vd, Vs, Vt))
#define vhsub_h_r_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.h.r.vx", Vd, Vs, %0) : : "r"(t))
#define vhsub_h_u_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.h.u.vv", Vd, Vs, Vt))
#define vhsub_h_u_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.h.u.vx", Vd, Vs, %0) : : "r"(t))
#define vhsub_h_ur_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.h.ur.vv", Vd, Vs, Vt))
#define vhsub_h_ur_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.h.ur.vx", Vd, Vs, %0) : : "r"(t))
#define vhsub_h_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.h.vv.m", Vd, Vs, Vt))
#define vhsub_h_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vhsub_h_r_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.h.r.vv.m", Vd, Vs, Vt))
#define vhsub_h_r_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.h.r.vx.m", Vd, Vs, %0) : : "r"(t))
#define vhsub_h_u_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.h.u.vv.m", Vd, Vs, Vt))
#define vhsub_h_u_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.h.u.vx.m", Vd, Vs, %0) : : "r"(t))
#define vhsub_h_ur_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.h.ur.vv.m", Vd, Vs, Vt))
#define vhsub_h_ur_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.h.ur.vx.m", Vd, Vs, %0) : : "r"(t))
#define vhsub_w_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.w.vv", Vd, Vs, Vt))
#define vhsub_w_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.w.vx", Vd, Vs, %0) : : "r"(t))
#define vhsub_w_r_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.w.r.vv", Vd, Vs, Vt))
#define vhsub_w_r_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.w.r.vx", Vd, Vs, %0) : : "r"(t))
#define vhsub_w_u_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.w.u.vv", Vd, Vs, Vt))
#define vhsub_w_u_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.w.u.vx", Vd, Vs, %0) : : "r"(t))
#define vhsub_w_ur_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.w.ur.vv", Vd, Vs, Vt))
#define vhsub_w_ur_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.w.ur.vx", Vd, Vs, %0) : : "r"(t))
#define vhsub_w_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.w.vv.m", Vd, Vs, Vt))
#define vhsub_w_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.w.vx.m", Vd, Vs, %0) : : "r"(t))
#define vhsub_w_r_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.w.r.vv.m", Vd, Vs, Vt))
#define vhsub_w_r_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.w.r.vx.m", Vd, Vs, %0) : : "r"(t))
#define vhsub_w_u_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.w.u.vv.m", Vd, Vs, Vt))
#define vhsub_w_u_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.w.u.vx.m", Vd, Vs, %0) : : "r"(t))
#define vhsub_w_ur_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.w.ur.vv.m", Vd, Vs, Vt))
#define vhsub_w_ur_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vhsub.w.ur.vx.m", Vd, Vs, %0) : : "r"(t))
// 001 Logical
// vand wrappers. The .vv forms carry no size suffix ("vand.vv", "vand.vv.m");
// the .vx forms exist per size (.b/.h/.w). .vv forwards Vd, Vs, Vt unchanged
// to ARGS_F_A_A_A (defined outside this section); .vx passes %0 as the last
// operand and binds `t` to it through an "r" input constraint.
#define vand_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vand.vv", Vd, Vs, Vt))
#define vand_b_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vand.b.vx", Vd, Vs, %0) : : "r"(t))
#define vand_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vand.vv.m", Vd, Vs, Vt))
#define vand_b_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vand.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vand_h_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vand.h.vx", Vd, Vs, %0) : : "r"(t))
#define vand_h_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vand.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vand_w_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vand.w.vx", Vd, Vs, %0) : : "r"(t))
#define vand_w_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vand.w.vx.m", Vd, Vs, %0) : : "r"(t))
// vor wrappers. Size-less .vv forms ("vor.vv", "vor.vv.m") plus per-size
// (.b/.h/.w) .vx forms. Vd/Vs/Vt are passed through to ARGS_F_A_A_A as-is;
// in the .vx forms the last template operand is %0, tied to `t` by an "r"
// input constraint.
#define vor_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vor.vv", Vd, Vs, Vt))
#define vor_b_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vor.b.vx", Vd, Vs, %0) : : "r"(t))
#define vor_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vor.vv.m", Vd, Vs, Vt))
#define vor_b_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vor.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vor_h_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vor.h.vx", Vd, Vs, %0) : : "r"(t))
#define vor_h_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vor.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vor_w_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vor.w.vx", Vd, Vs, %0) : : "r"(t))
#define vor_w_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vor.w.vx.m", Vd, Vs, %0) : : "r"(t))
// vxor wrappers. Size-less .vv forms ("vxor.vv", "vxor.vv.m") and per-size
// (.b/.h/.w) .vx forms. The .vv forms forward Vd, Vs, Vt unchanged to
// ARGS_F_A_A_A; the .vx forms pass %0 last and feed `t` in as an "r" input.
#define vxor_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vxor.vv", Vd, Vs, Vt))
#define vxor_b_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vxor.b.vx", Vd, Vs, %0) : : "r"(t))
#define vxor_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vxor.vv.m", Vd, Vs, Vt))
#define vxor_b_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vxor.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vxor_h_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vxor.h.vx", Vd, Vs, %0) : : "r"(t))
#define vxor_h_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vxor.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vxor_w_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vxor.w.vx", Vd, Vs, %0) : : "r"(t))
#define vxor_w_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vxor.w.vx.m", Vd, Vs, %0) : : "r"(t))
// "vnot.v" / "vnot.v.m" wrappers: two-operand forms. Vd and Vs are forwarded
// as macro tokens to ARGS_F_A_A; the asm statement has no C operands.
#define vnot_v(Vd, Vs) __asm__ __volatile__(ARGS_F_A_A("vnot.v", Vd, Vs))
#define vnot_v_m(Vd, Vs) __asm__ __volatile__(ARGS_F_A_A("vnot.v.m", Vd, Vs))
// "vrev.{b,h,w}.*" wrappers, one __asm__ __volatile__ statement each.
//   _vv forms: Vd, Vs, Vt are forwarded as macro tokens (no asm operands).
//   _vx forms: Vd, Vs are forwarded as tokens; t is asm input %0 ("r").
//   A trailing _m in the macro name maps to the ".m" mnemonic suffix.
#define vrev_b_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vrev.b.vv", Vd, Vs, Vt))
#define vrev_b_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vrev.b.vx", Vd, Vs, %0) : : "r"(t))
#define vrev_b_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vrev.b.vv.m", Vd, Vs, Vt))
#define vrev_b_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vrev.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vrev_h_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vrev.h.vv", Vd, Vs, Vt))
#define vrev_h_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vrev.h.vx", Vd, Vs, %0) : : "r"(t))
#define vrev_h_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vrev.h.vv.m", Vd, Vs, Vt))
#define vrev_h_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vrev.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vrev_w_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vrev.w.vv", Vd, Vs, Vt))
#define vrev_w_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vrev.w.vx", Vd, Vs, %0) : : "r"(t))
#define vrev_w_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vrev.w.vv.m", Vd, Vs, Vt))
#define vrev_w_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vrev.w.vx.m", Vd, Vs, %0) : : "r"(t))
// "vror.{b,h,w}.*" wrappers, one __asm__ __volatile__ statement each.
//   _vv forms: Vd, Vs, Vt are forwarded as macro tokens (no asm operands).
//   _vx forms: Vd, Vs are forwarded as tokens; t is asm input %0 ("r").
//   A trailing _m in the macro name maps to the ".m" mnemonic suffix.
#define vror_b_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vror.b.vv", Vd, Vs, Vt))
#define vror_b_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vror.b.vx", Vd, Vs, %0) : : "r"(t))
#define vror_b_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vror.b.vv.m", Vd, Vs, Vt))
#define vror_b_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vror.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vror_h_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vror.h.vv", Vd, Vs, Vt))
#define vror_h_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vror.h.vx", Vd, Vs, %0) : : "r"(t))
#define vror_h_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vror.h.vv.m", Vd, Vs, Vt))
#define vror_h_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vror.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vror_w_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vror.w.vv", Vd, Vs, Vt))
#define vror_w_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vror.w.vx", Vd, Vs, %0) : : "r"(t))
#define vror_w_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vror.w.vv.m", Vd, Vs, Vt))
#define vror_w_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vror.w.vx.m", Vd, Vs, %0) : : "r"(t))
// "vclb.{b,h,w}.v[.m]" wrappers: two-operand forms. Vd and Vs are forwarded
// as macro tokens to ARGS_F_A_A; the asm statement has no C operands.
#define vclb_b_v(Vd, Vs) __asm__ __volatile__(ARGS_F_A_A("vclb.b.v", Vd, Vs))
#define vclb_b_v_m(Vd, Vs) __asm__ __volatile__(ARGS_F_A_A("vclb.b.v.m", Vd, Vs))
#define vclb_h_v(Vd, Vs) __asm__ __volatile__(ARGS_F_A_A("vclb.h.v", Vd, Vs))
#define vclb_h_v_m(Vd, Vs) __asm__ __volatile__(ARGS_F_A_A("vclb.h.v.m", Vd, Vs))
#define vclb_w_v(Vd, Vs) __asm__ __volatile__(ARGS_F_A_A("vclb.w.v", Vd, Vs))
#define vclb_w_v_m(Vd, Vs) __asm__ __volatile__(ARGS_F_A_A("vclb.w.v.m", Vd, Vs))
// "vclz.{b,h,w}.v[.m]" wrappers: two-operand forms. Vd and Vs are forwarded
// as macro tokens to ARGS_F_A_A; the asm statement has no C operands.
#define vclz_b_v(Vd, Vs) __asm__ __volatile__(ARGS_F_A_A("vclz.b.v", Vd, Vs))
#define vclz_b_v_m(Vd, Vs) __asm__ __volatile__(ARGS_F_A_A("vclz.b.v.m", Vd, Vs))
#define vclz_h_v(Vd, Vs) __asm__ __volatile__(ARGS_F_A_A("vclz.h.v", Vd, Vs))
#define vclz_h_v_m(Vd, Vs) __asm__ __volatile__(ARGS_F_A_A("vclz.h.v.m", Vd, Vs))
#define vclz_w_v(Vd, Vs) __asm__ __volatile__(ARGS_F_A_A("vclz.w.v", Vd, Vs))
#define vclz_w_v_m(Vd, Vs) __asm__ __volatile__(ARGS_F_A_A("vclz.w.v.m", Vd, Vs))
// "vcpop.{b,h,w}.v[.m]" wrappers: two-operand forms. Vd and Vs are forwarded
// as macro tokens to ARGS_F_A_A; the asm statement has no C operands.
#define vcpop_b_v(Vd, Vs) __asm__ __volatile__(ARGS_F_A_A("vcpop.b.v", Vd, Vs))
#define vcpop_b_v_m(Vd, Vs) __asm__ __volatile__(ARGS_F_A_A("vcpop.b.v.m", Vd, Vs))
#define vcpop_h_v(Vd, Vs) __asm__ __volatile__(ARGS_F_A_A("vcpop.h.v", Vd, Vs))
#define vcpop_h_v_m(Vd, Vs) __asm__ __volatile__(ARGS_F_A_A("vcpop.h.v.m", Vd, Vs))
#define vcpop_w_v(Vd, Vs) __asm__ __volatile__(ARGS_F_A_A("vcpop.w.v", Vd, Vs))
#define vcpop_w_v_m(Vd, Vs) __asm__ __volatile__(ARGS_F_A_A("vcpop.w.v.m", Vd, Vs))
// "vmv.v" / "vmv.v.m" wrappers: two-operand forms. Vd and Vs are forwarded
// as macro tokens to ARGS_F_A_A; the asm statement has no C operands.
#define vmv_v(Vd, Vs) __asm__ __volatile__(ARGS_F_A_A("vmv.v", Vd, Vs))
#define vmv_v_m(Vd, Vs) __asm__ __volatile__(ARGS_F_A_A("vmv.v.m", Vd, Vs))
// "vmvp.*" wrappers, one __asm__ __volatile__ statement each.
//   _vv forms: Vd, Vs, Vt are forwarded as macro tokens (no asm operands).
//   _vx forms: Vd, Vs are forwarded as tokens; t is asm input %0 ("r").
//   A trailing _m in the macro name maps to the ".m" mnemonic suffix.
// The _vv forms carry no element-size component in the mnemonic; the _vx
// forms come in .b/.h/.w variants.
#define vmvp_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmvp.vv", Vd, Vs, Vt))
#define vmvp_b_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmvp.b.vx", Vd, Vs, %0) : : "r"(t))
#define vmvp_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmvp.vv.m", Vd, Vs, Vt))
#define vmvp_b_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmvp.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmvp_h_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmvp.h.vx", Vd, Vs, %0) : : "r"(t))
#define vmvp_h_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmvp.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmvp_w_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmvp.w.vx", Vd, Vs, %0) : : "r"(t))
#define vmvp_w_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmvp.w.vx.m", Vd, Vs, %0) : : "r"(t))
// "acset.v", "actr.v" and "adwinit.v" wrappers: two-operand forms with no
// ".m" variant in this group. Vd and Vs are forwarded as macro tokens to
// ARGS_F_A_A; the asm statement has no C operands.
#define acset_v(Vd, Vs) __asm__ __volatile__(ARGS_F_A_A("acset.v", Vd, Vs))
#define actr_v(Vd, Vs) __asm__ __volatile__(ARGS_F_A_A("actr.v", Vd, Vs))
#define adwinit_v(Vd, Vs) __asm__ __volatile__(ARGS_F_A_A("adwinit.v", Vd, Vs))
// 010 Shift
// "vsll.{b,h,w}.*" wrappers, one __asm__ __volatile__ statement each.
//   _vv forms: Vd, Vs, Vt are forwarded as macro tokens (no asm operands).
//   _vx forms: Vd, Vs are forwarded as tokens; t is asm input %0 ("r").
//   A trailing _m in the macro name maps to the ".m" mnemonic suffix.
#define vsll_b_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsll.b.vv", Vd, Vs, Vt))
#define vsll_b_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsll.b.vx", Vd, Vs, %0) : : "r"(t))
#define vsll_b_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsll.b.vv.m", Vd, Vs, Vt))
#define vsll_b_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsll.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vsll_h_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsll.h.vv", Vd, Vs, Vt))
#define vsll_h_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsll.h.vx", Vd, Vs, %0) : : "r"(t))
#define vsll_h_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsll.h.vv.m", Vd, Vs, Vt))
#define vsll_h_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsll.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vsll_w_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsll.w.vv", Vd, Vs, Vt))
#define vsll_w_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsll.w.vx", Vd, Vs, %0) : : "r"(t))
#define vsll_w_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsll.w.vv.m", Vd, Vs, Vt))
#define vsll_w_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsll.w.vx.m", Vd, Vs, %0) : : "r"(t))
// "vsra.{b,h,w}.*" wrappers, one __asm__ __volatile__ statement each.
//   _vv forms: Vd, Vs, Vt are forwarded as macro tokens (no asm operands).
//   _vx forms: Vd, Vs are forwarded as tokens; t is asm input %0 ("r").
//   A trailing _m in the macro name maps to the ".m" mnemonic suffix.
#define vsra_b_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsra.b.vv", Vd, Vs, Vt))
#define vsra_b_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsra.b.vx", Vd, Vs, %0) : : "r"(t))
#define vsra_b_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsra.b.vv.m", Vd, Vs, Vt))
#define vsra_b_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsra.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vsra_h_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsra.h.vv", Vd, Vs, Vt))
#define vsra_h_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsra.h.vx", Vd, Vs, %0) : : "r"(t))
#define vsra_h_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsra.h.vv.m", Vd, Vs, Vt))
#define vsra_h_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsra.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vsra_w_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsra.w.vv", Vd, Vs, Vt))
#define vsra_w_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsra.w.vx", Vd, Vs, %0) : : "r"(t))
#define vsra_w_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsra.w.vv.m", Vd, Vs, Vt))
#define vsra_w_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsra.w.vx.m", Vd, Vs, %0) : : "r"(t))
// "vsrl.{b,h,w}.*" wrappers, one __asm__ __volatile__ statement each.
//   _vv forms: Vd, Vs, Vt are forwarded as macro tokens (no asm operands).
//   _vx forms: Vd, Vs are forwarded as tokens; t is asm input %0 ("r").
//   A trailing _m in the macro name maps to the ".m" mnemonic suffix.
#define vsrl_b_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsrl.b.vv", Vd, Vs, Vt))
#define vsrl_b_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsrl.b.vx", Vd, Vs, %0) : : "r"(t))
#define vsrl_b_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsrl.b.vv.m", Vd, Vs, Vt))
#define vsrl_b_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsrl.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vsrl_h_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsrl.h.vv", Vd, Vs, Vt))
#define vsrl_h_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsrl.h.vx", Vd, Vs, %0) : : "r"(t))
#define vsrl_h_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsrl.h.vv.m", Vd, Vs, Vt))
#define vsrl_h_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsrl.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vsrl_w_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsrl.w.vv", Vd, Vs, Vt))
#define vsrl_w_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsrl.w.vx", Vd, Vs, %0) : : "r"(t))
#define vsrl_w_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsrl.w.vv.m", Vd, Vs, Vt))
#define vsrl_w_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsrl.w.vx.m", Vd, Vs, %0) : : "r"(t))
// "vsha.{b,h,w}.*" wrappers, one __asm__ __volatile__ statement each.
//   _vv forms: Vd, Vs, Vt are forwarded as macro tokens (no asm operands).
//   _vx forms: Vd, Vs are forwarded as tokens; t is asm input %0 ("r").
//   _r in the macro name maps to the ".r" mnemonic component
//     (NOTE(review): presumably a rounding variant -- confirm in the ISA spec).
//   A trailing _m in the macro name maps to the ".m" mnemonic suffix.
#define vsha_b_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsha.b.vv", Vd, Vs, Vt))
#define vsha_b_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsha.b.vx", Vd, Vs, %0) : : "r"(t))
#define vsha_b_r_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsha.b.r.vv", Vd, Vs, Vt))
#define vsha_b_r_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsha.b.r.vx", Vd, Vs, %0) : : "r"(t))
#define vsha_b_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsha.b.vv.m", Vd, Vs, Vt))
#define vsha_b_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsha.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vsha_b_r_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsha.b.r.vv.m", Vd, Vs, Vt))
#define vsha_b_r_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsha.b.r.vx.m", Vd, Vs, %0) : : "r"(t))
#define vsha_h_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsha.h.vv", Vd, Vs, Vt))
#define vsha_h_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsha.h.vx", Vd, Vs, %0) : : "r"(t))
#define vsha_h_r_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsha.h.r.vv", Vd, Vs, Vt))
#define vsha_h_r_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsha.h.r.vx", Vd, Vs, %0) : : "r"(t))
#define vsha_h_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsha.h.vv.m", Vd, Vs, Vt))
#define vsha_h_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsha.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vsha_h_r_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsha.h.r.vv.m", Vd, Vs, Vt))
#define vsha_h_r_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsha.h.r.vx.m", Vd, Vs, %0) : : "r"(t))
#define vsha_w_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsha.w.vv", Vd, Vs, Vt))
#define vsha_w_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsha.w.vx", Vd, Vs, %0) : : "r"(t))
#define vsha_w_r_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsha.w.r.vv", Vd, Vs, Vt))
#define vsha_w_r_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsha.w.r.vx", Vd, Vs, %0) : : "r"(t))
#define vsha_w_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsha.w.vv.m", Vd, Vs, Vt))
#define vsha_w_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsha.w.vx.m", Vd, Vs, %0) : : "r"(t))
#define vsha_w_r_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsha.w.r.vv.m", Vd, Vs, Vt))
#define vsha_w_r_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsha.w.r.vx.m", Vd, Vs, %0) : : "r"(t))
// "vshl.{b,h,w}.*" wrappers, one __asm__ __volatile__ statement each.
//   _vv forms: Vd, Vs, Vt are forwarded as macro tokens (no asm operands).
//   _vx forms: Vd, Vs are forwarded as tokens; t is asm input %0 ("r").
//   _r in the macro name maps to the ".r" mnemonic component
//     (NOTE(review): presumably a rounding variant -- confirm in the ISA spec).
//   A trailing _m in the macro name maps to the ".m" mnemonic suffix.
#define vshl_b_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vshl.b.vv", Vd, Vs, Vt))
#define vshl_b_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vshl.b.vx", Vd, Vs, %0) : : "r"(t))
#define vshl_b_r_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vshl.b.r.vv", Vd, Vs, Vt))
#define vshl_b_r_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vshl.b.r.vx", Vd, Vs, %0) : : "r"(t))
#define vshl_b_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vshl.b.vv.m", Vd, Vs, Vt))
#define vshl_b_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vshl.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vshl_b_r_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vshl.b.r.vv.m", Vd, Vs, Vt))
#define vshl_b_r_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vshl.b.r.vx.m", Vd, Vs, %0) : : "r"(t))
#define vshl_h_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vshl.h.vv", Vd, Vs, Vt))
#define vshl_h_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vshl.h.vx", Vd, Vs, %0) : : "r"(t))
#define vshl_h_r_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vshl.h.r.vv", Vd, Vs, Vt))
#define vshl_h_r_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vshl.h.r.vx", Vd, Vs, %0) : : "r"(t))
#define vshl_h_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vshl.h.vv.m", Vd, Vs, Vt))
#define vshl_h_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vshl.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vshl_h_r_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vshl.h.r.vv.m", Vd, Vs, Vt))
#define vshl_h_r_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vshl.h.r.vx.m", Vd, Vs, %0) : : "r"(t))
#define vshl_w_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vshl.w.vv", Vd, Vs, Vt))
#define vshl_w_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vshl.w.vx", Vd, Vs, %0) : : "r"(t))
#define vshl_w_r_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vshl.w.r.vv", Vd, Vs, Vt))
#define vshl_w_r_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vshl.w.r.vx", Vd, Vs, %0) : : "r"(t))
#define vshl_w_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vshl.w.vv.m", Vd, Vs, Vt))
#define vshl_w_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vshl.w.vx.m", Vd, Vs, %0) : : "r"(t))
#define vshl_w_r_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vshl.w.r.vv.m", Vd, Vs, Vt))
#define vshl_w_r_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vshl.w.r.vx.m", Vd, Vs, %0) : : "r"(t))
// "vsrans.{b,h}.*" wrappers, one __asm__ __volatile__ statement each
// (only .b and .h element sizes are defined in this group).
//   _vv forms: Vd, Vs, Vt are forwarded as macro tokens (no asm operands).
//   _vx forms: Vd, Vs are forwarded as tokens; t is asm input %0 ("r").
//   _r in the macro name maps to the ".r" mnemonic component.
//   A trailing _m in the macro name maps to the ".m" mnemonic suffix.
#define vsrans_b_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsrans.b.vv", Vd, Vs, Vt))
#define vsrans_b_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsrans.b.vx", Vd, Vs, %0) : : "r"(t))
#define vsrans_b_r_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsrans.b.r.vv", Vd, Vs, Vt))
#define vsrans_b_r_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsrans.b.r.vx", Vd, Vs, %0) : : "r"(t))
#define vsrans_b_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsrans.b.vv.m", Vd, Vs, Vt))
#define vsrans_b_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsrans.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vsrans_b_r_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsrans.b.r.vv.m", Vd, Vs, Vt))
#define vsrans_b_r_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsrans.b.r.vx.m", Vd, Vs, %0) : : "r"(t))
#define vsrans_h_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsrans.h.vv", Vd, Vs, Vt))
#define vsrans_h_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsrans.h.vx", Vd, Vs, %0) : : "r"(t))
#define vsrans_h_r_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsrans.h.r.vv", Vd, Vs, Vt))
#define vsrans_h_r_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsrans.h.r.vx", Vd, Vs, %0) : : "r"(t))
#define vsrans_h_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsrans.h.vv.m", Vd, Vs, Vt))
#define vsrans_h_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsrans.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vsrans_h_r_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsrans.h.r.vv.m", Vd, Vs, Vt))
#define vsrans_h_r_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsrans.h.r.vx.m", Vd, Vs, %0) : : "r"(t))
// "vsransu.{b,h}.*" wrappers, one __asm__ __volatile__ statement each
// (only .b and .h element sizes are defined in this group).
//   _vv forms: Vd, Vs, Vt are forwarded as macro tokens (no asm operands).
//   _vx forms: Vd, Vs are forwarded as tokens; t is asm input %0 ("r").
//   _r in the macro name maps to the ".r" mnemonic component.
//   A trailing _m in the macro name maps to the ".m" mnemonic suffix.
// Every definition keeps a space between the parameter list and the
// replacement list so the table reads uniformly.
#define vsransu_b_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsransu.b.vv", Vd, Vs, Vt))
#define vsransu_b_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsransu.b.vx", Vd, Vs, %0) : : "r"(t))
#define vsransu_b_r_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsransu.b.r.vv", Vd, Vs, Vt))
#define vsransu_b_r_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsransu.b.r.vx", Vd, Vs, %0) : : "r"(t))
#define vsransu_b_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsransu.b.vv.m", Vd, Vs, Vt))
#define vsransu_b_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsransu.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vsransu_b_r_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsransu.b.r.vv.m", Vd, Vs, Vt))
#define vsransu_b_r_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsransu.b.r.vx.m", Vd, Vs, %0) : : "r"(t))
#define vsransu_h_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsransu.h.vv", Vd, Vs, Vt))
#define vsransu_h_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsransu.h.vx", Vd, Vs, %0) : : "r"(t))
#define vsransu_h_r_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsransu.h.r.vv", Vd, Vs, Vt))
#define vsransu_h_r_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsransu.h.r.vx", Vd, Vs, %0) : : "r"(t))
#define vsransu_h_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsransu.h.vv.m", Vd, Vs, Vt))
#define vsransu_h_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsransu.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vsransu_h_r_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsransu.h.r.vv.m", Vd, Vs, Vt))
#define vsransu_h_r_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsransu.h.r.vx.m", Vd, Vs, %0) : : "r"(t))
// "vsraqs.b.*" wrappers, one __asm__ __volatile__ statement each
// (only the .b element size is defined in this group).
//   _vv forms: Vd, Vs, Vt are forwarded as macro tokens (no asm operands).
//   _vx forms: Vd, Vs are forwarded as tokens; t is asm input %0 ("r").
//   _r in the macro name maps to the ".r" mnemonic component.
//   A trailing _m in the macro name maps to the ".m" mnemonic suffix.
#define vsraqs_b_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsraqs.b.vv", Vd, Vs, Vt))
#define vsraqs_b_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsraqs.b.vx", Vd, Vs, %0) : : "r"(t))
#define vsraqs_b_r_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsraqs.b.r.vv", Vd, Vs, Vt))
#define vsraqs_b_r_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsraqs.b.r.vx", Vd, Vs, %0) : : "r"(t))
#define vsraqs_b_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsraqs.b.vv.m", Vd, Vs, Vt))
#define vsraqs_b_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsraqs.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vsraqs_b_r_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsraqs.b.r.vv.m", Vd, Vs, Vt))
#define vsraqs_b_r_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsraqs.b.r.vx.m", Vd, Vs, %0) : : "r"(t))
// "vsraqsu.b.*" wrappers, one __asm__ __volatile__ statement each
// (only the .b element size is defined in this group).
//   _vv forms: Vd, Vs, Vt are forwarded as macro tokens (no asm operands).
//   _vx forms: Vd, Vs are forwarded as tokens; t is asm input %0 ("r").
//   _r in the macro name maps to the ".r" mnemonic component.
//   A trailing _m in the macro name maps to the ".m" mnemonic suffix.
// Every definition keeps a space between the parameter list and the
// replacement list so the table reads uniformly.
#define vsraqsu_b_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsraqsu.b.vv", Vd, Vs, Vt))
#define vsraqsu_b_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsraqsu.b.vx", Vd, Vs, %0) : : "r"(t))
#define vsraqsu_b_r_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsraqsu.b.r.vv", Vd, Vs, Vt))
#define vsraqsu_b_r_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsraqsu.b.r.vx", Vd, Vs, %0) : : "r"(t))
#define vsraqsu_b_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsraqsu.b.vv.m", Vd, Vs, Vt))
#define vsraqsu_b_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsraqsu.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vsraqsu_b_r_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vsraqsu.b.r.vv.m", Vd, Vs, Vt))
#define vsraqsu_b_r_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vsraqsu.b.r.vx.m", Vd, Vs, %0) : : "r"(t))
// 011 Mul/Div
// "vmul.{b,h,w}.*" wrappers, one __asm__ __volatile__ statement each.
//   _vv forms: Vd, Vs, Vt are forwarded as macro tokens (no asm operands).
//   _vx forms: Vd, Vs are forwarded as tokens; t is asm input %0 ("r").
//   A trailing _m in the macro name maps to the ".m" mnemonic suffix.
#define vmul_b_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmul.b.vv", Vd, Vs, Vt))
#define vmul_b_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmul.b.vx", Vd, Vs, %0) : : "r"(t))
#define vmul_b_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmul.b.vv.m", Vd, Vs, Vt))
#define vmul_b_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmul.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmul_h_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmul.h.vv", Vd, Vs, Vt))
#define vmul_h_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmul.h.vx", Vd, Vs, %0) : : "r"(t))
#define vmul_h_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmul.h.vv.m", Vd, Vs, Vt))
#define vmul_h_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmul.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmul_w_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmul.w.vv", Vd, Vs, Vt))
#define vmul_w_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmul.w.vx", Vd, Vs, %0) : : "r"(t))
#define vmul_w_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmul.w.vv.m", Vd, Vs, Vt))
#define vmul_w_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmul.w.vx.m", Vd, Vs, %0) : : "r"(t))
// "vmuls.{b,h,w}.*" wrappers, one __asm__ __volatile__ statement each.
//   _vv forms: Vd, Vs, Vt are forwarded as macro tokens (no asm operands).
//   _vx forms: Vd, Vs are forwarded as tokens; t is asm input %0 ("r").
//   _u in the macro name maps to the ".u" mnemonic component
//     (NOTE(review): presumably the unsigned variant -- confirm in the ISA spec).
//   A trailing _m in the macro name maps to the ".m" mnemonic suffix.
#define vmuls_b_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmuls.b.vv", Vd, Vs, Vt))
#define vmuls_b_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmuls.b.vx", Vd, Vs, %0) : : "r"(t))
#define vmuls_b_u_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmuls.b.u.vv", Vd, Vs, Vt))
#define vmuls_b_u_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmuls.b.u.vx", Vd, Vs, %0) : : "r"(t))
#define vmuls_b_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmuls.b.vv.m", Vd, Vs, Vt))
#define vmuls_b_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmuls.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmuls_b_u_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmuls.b.u.vv.m", Vd, Vs, Vt))
#define vmuls_b_u_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmuls.b.u.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmuls_h_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmuls.h.vv", Vd, Vs, Vt))
#define vmuls_h_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmuls.h.vx", Vd, Vs, %0) : : "r"(t))
#define vmuls_h_u_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmuls.h.u.vv", Vd, Vs, Vt))
#define vmuls_h_u_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmuls.h.u.vx", Vd, Vs, %0) : : "r"(t))
#define vmuls_h_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmuls.h.vv.m", Vd, Vs, Vt))
#define vmuls_h_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmuls.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmuls_h_u_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmuls.h.u.vv.m", Vd, Vs, Vt))
#define vmuls_h_u_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmuls.h.u.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmuls_w_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmuls.w.vv", Vd, Vs, Vt))
#define vmuls_w_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmuls.w.vx", Vd, Vs, %0) : : "r"(t))
#define vmuls_w_u_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmuls.w.u.vv", Vd, Vs, Vt))
#define vmuls_w_u_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmuls.w.u.vx", Vd, Vs, %0) : : "r"(t))
#define vmuls_w_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmuls.w.vv.m", Vd, Vs, Vt))
#define vmuls_w_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmuls.w.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmuls_w_u_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmuls.w.u.vv.m", Vd, Vs, Vt))
#define vmuls_w_u_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmuls.w.u.vx.m", Vd, Vs, %0) : : "r"(t))
// "vmulw.{b,h,w}.*" wrappers, one __asm__ __volatile__ statement each.
//   _vv forms: Vd, Vs, Vt are forwarded as macro tokens (no asm operands).
//   _vx forms: Vd, Vs are forwarded as tokens; t is asm input %0 ("r").
//   _u in the macro name maps to the ".u" mnemonic component
//     (NOTE(review): presumably the unsigned variant -- confirm in the ISA spec).
//   A trailing _m in the macro name maps to the ".m" mnemonic suffix.
#define vmulw_b_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulw.b.vv", Vd, Vs, Vt))
#define vmulw_b_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulw.b.vx", Vd, Vs, %0) : : "r"(t))
#define vmulw_b_u_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulw.b.u.vv", Vd, Vs, Vt))
#define vmulw_b_u_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulw.b.u.vx", Vd, Vs, %0) : : "r"(t))
#define vmulw_b_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulw.b.vv.m", Vd, Vs, Vt))
#define vmulw_b_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulw.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmulw_b_u_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulw.b.u.vv.m", Vd, Vs, Vt))
#define vmulw_b_u_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulw.b.u.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmulw_h_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulw.h.vv", Vd, Vs, Vt))
#define vmulw_h_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulw.h.vx", Vd, Vs, %0) : : "r"(t))
#define vmulw_h_u_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulw.h.u.vv", Vd, Vs, Vt))
#define vmulw_h_u_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulw.h.u.vx", Vd, Vs, %0) : : "r"(t))
#define vmulw_h_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulw.h.vv.m", Vd, Vs, Vt))
#define vmulw_h_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulw.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmulw_h_u_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulw.h.u.vv.m", Vd, Vs, Vt))
#define vmulw_h_u_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulw.h.u.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmulw_w_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulw.w.vv", Vd, Vs, Vt))
#define vmulw_w_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulw.w.vx", Vd, Vs, %0) : : "r"(t))
#define vmulw_w_u_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulw.w.u.vv", Vd, Vs, Vt))
#define vmulw_w_u_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulw.w.u.vx", Vd, Vs, %0) : : "r"(t))
#define vmulw_w_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulw.w.vv.m", Vd, Vs, Vt))
#define vmulw_w_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulw.w.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmulw_w_u_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulw.w.u.vv.m", Vd, Vs, Vt))
#define vmulw_w_u_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulw.w.u.vx.m", Vd, Vs, %0) : : "r"(t))
// "vmulh.{b,h,w}.*" wrappers, one __asm__ __volatile__ statement each.
//   _vv forms: Vd, Vs, Vt are forwarded as macro tokens (no asm operands).
//   _vx forms: Vd, Vs are forwarded as tokens; t is asm input %0 ("r").
//   _r in the macro name maps to the ".r" mnemonic component
//     (NOTE(review): presumably a rounding variant -- confirm in the ISA spec).
//   A trailing _m in the macro name maps to the ".m" mnemonic suffix.
#define vmulh_b_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulh.b.vv", Vd, Vs, Vt))
#define vmulh_b_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulh.b.vx", Vd, Vs, %0) : : "r"(t))
#define vmulh_b_r_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulh.b.r.vv", Vd, Vs, Vt))
#define vmulh_b_r_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulh.b.r.vx", Vd, Vs, %0) : : "r"(t))
#define vmulh_b_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulh.b.vv.m", Vd, Vs, Vt))
#define vmulh_b_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulh.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmulh_b_r_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulh.b.r.vv.m", Vd, Vs, Vt))
#define vmulh_b_r_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulh.b.r.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmulh_h_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulh.h.vv", Vd, Vs, Vt))
#define vmulh_h_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulh.h.vx", Vd, Vs, %0) : : "r"(t))
#define vmulh_h_r_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulh.h.r.vv", Vd, Vs, Vt))
#define vmulh_h_r_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulh.h.r.vx", Vd, Vs, %0) : : "r"(t))
#define vmulh_h_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulh.h.vv.m", Vd, Vs, Vt))
#define vmulh_h_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulh.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmulh_h_r_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulh.h.r.vv.m", Vd, Vs, Vt))
#define vmulh_h_r_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulh.h.r.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmulh_w_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulh.w.vv", Vd, Vs, Vt))
#define vmulh_w_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulh.w.vx", Vd, Vs, %0) : : "r"(t))
#define vmulh_w_r_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulh.w.r.vv", Vd, Vs, Vt))
#define vmulh_w_r_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulh.w.r.vx", Vd, Vs, %0) : : "r"(t))
#define vmulh_w_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulh.w.vv.m", Vd, Vs, Vt))
#define vmulh_w_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulh.w.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmulh_w_r_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulh.w.r.vv.m", Vd, Vs, Vt))
#define vmulh_w_r_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulh.w.r.vx.m", Vd, Vs, %0) : : "r"(t))
// "vmulhu.{b,h,w}.*" wrappers, one __asm__ __volatile__ statement each.
//   _vv forms: Vd, Vs, Vt are forwarded as macro tokens (no asm operands).
//   _vx forms: Vd, Vs are forwarded as tokens; t is asm input %0 ("r").
//   _r in the macro name maps to the ".r" mnemonic component
//     (NOTE(review): presumably a rounding variant -- confirm in the ISA spec).
//   A trailing _m in the macro name maps to the ".m" mnemonic suffix.
#define vmulhu_b_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulhu.b.vv", Vd, Vs, Vt))
#define vmulhu_b_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulhu.b.vx", Vd, Vs, %0) : : "r"(t))
#define vmulhu_b_r_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulhu.b.r.vv", Vd, Vs, Vt))
#define vmulhu_b_r_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulhu.b.r.vx", Vd, Vs, %0) : : "r"(t))
#define vmulhu_b_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulhu.b.vv.m", Vd, Vs, Vt))
#define vmulhu_b_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulhu.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmulhu_b_r_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulhu.b.r.vv.m", Vd, Vs, Vt))
#define vmulhu_b_r_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulhu.b.r.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmulhu_h_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulhu.h.vv", Vd, Vs, Vt))
#define vmulhu_h_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulhu.h.vx", Vd, Vs, %0) : : "r"(t))
#define vmulhu_h_r_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulhu.h.r.vv", Vd, Vs, Vt))
#define vmulhu_h_r_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulhu.h.r.vx", Vd, Vs, %0) : : "r"(t))
#define vmulhu_h_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulhu.h.vv.m", Vd, Vs, Vt))
#define vmulhu_h_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulhu.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmulhu_h_r_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulhu.h.r.vv.m", Vd, Vs, Vt))
#define vmulhu_h_r_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulhu.h.r.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmulhu_w_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulhu.w.vv", Vd, Vs, Vt))
#define vmulhu_w_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulhu.w.vx", Vd, Vs, %0) : : "r"(t))
#define vmulhu_w_r_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulhu.w.r.vv", Vd, Vs, Vt))
#define vmulhu_w_r_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulhu.w.r.vx", Vd, Vs, %0) : : "r"(t))
#define vmulhu_w_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulhu.w.vv.m", Vd, Vs, Vt))
#define vmulhu_w_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulhu.w.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmulhu_w_r_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vmulhu.w.r.vv.m", Vd, Vs, Vt))
#define vmulhu_w_r_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vmulhu.w.r.vx.m", Vd, Vs, %0) : : "r"(t))
// "vdmulh.{b,h,w}.*" wrappers, one __asm__ __volatile__ statement each.
//   _vv forms: Vd, Vs, Vt are forwarded as macro tokens (no asm operands).
//   _vx forms: Vd, Vs are forwarded as tokens; t is asm input %0 ("r").
//   _r / _rn in the macro name map to the ".r" / ".rn" mnemonic components
//     (NOTE(review): presumably rounding-mode variants -- confirm in the ISA spec).
//   A trailing _m in the macro name maps to the ".m" mnemonic suffix.
// Every definition keeps a space between the parameter list and the
// replacement list so the table reads uniformly.
#define vdmulh_b_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.b.vv", Vd, Vs, Vt))
#define vdmulh_b_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.b.vx", Vd, Vs, %0) : : "r"(t))
#define vdmulh_b_r_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.b.r.vv", Vd, Vs, Vt))
#define vdmulh_b_r_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.b.r.vx", Vd, Vs, %0) : : "r"(t))
#define vdmulh_b_rn_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.b.rn.vv", Vd, Vs, Vt))
#define vdmulh_b_rn_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.b.rn.vx", Vd, Vs, %0) : : "r"(t))
#define vdmulh_b_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.b.vv.m", Vd, Vs, Vt))
#define vdmulh_b_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vdmulh_b_r_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.b.r.vv.m", Vd, Vs, Vt))
#define vdmulh_b_r_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.b.r.vx.m", Vd, Vs, %0) : : "r"(t))
#define vdmulh_b_rn_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.b.rn.vv.m", Vd, Vs, Vt))
#define vdmulh_b_rn_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.b.rn.vx.m", Vd, Vs, %0) : : "r"(t))
#define vdmulh_h_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.h.vv", Vd, Vs, Vt))
#define vdmulh_h_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.h.vx", Vd, Vs, %0) : : "r"(t))
#define vdmulh_h_r_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.h.r.vv", Vd, Vs, Vt))
#define vdmulh_h_r_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.h.r.vx", Vd, Vs, %0) : : "r"(t))
#define vdmulh_h_rn_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.h.rn.vv", Vd, Vs, Vt))
#define vdmulh_h_rn_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.h.rn.vx", Vd, Vs, %0) : : "r"(t))
#define vdmulh_h_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.h.vv.m", Vd, Vs, Vt))
#define vdmulh_h_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vdmulh_h_r_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.h.r.vv.m", Vd, Vs, Vt))
#define vdmulh_h_r_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.h.r.vx.m", Vd, Vs, %0) : : "r"(t))
#define vdmulh_h_rn_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.h.rn.vv.m", Vd, Vs, Vt))
#define vdmulh_h_rn_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.h.rn.vx.m", Vd, Vs, %0) : : "r"(t))
#define vdmulh_w_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.w.vv", Vd, Vs, Vt))
#define vdmulh_w_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.w.vx", Vd, Vs, %0) : : "r"(t))
#define vdmulh_w_r_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.w.r.vv", Vd, Vs, Vt))
#define vdmulh_w_r_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.w.r.vx", Vd, Vs, %0) : : "r"(t))
#define vdmulh_w_rn_vv(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.w.rn.vv", Vd, Vs, Vt))
#define vdmulh_w_rn_vx(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.w.rn.vx", Vd, Vs, %0) : : "r"(t))
#define vdmulh_w_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.w.vv.m", Vd, Vs, Vt))
#define vdmulh_w_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.w.vx.m", Vd, Vs, %0) : : "r"(t))
#define vdmulh_w_r_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.w.r.vv.m", Vd, Vs, Vt))
#define vdmulh_w_r_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.w.r.vx.m", Vd, Vs, %0) : : "r"(t))
#define vdmulh_w_rn_vv_m(Vd, Vs, Vt) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.w.rn.vv.m", Vd, Vs, Vt))
#define vdmulh_w_rn_vx_m(Vd, Vs, t) __asm__ __volatile__(ARGS_F_A_A_A("vdmulh.w.rn.vx.m", Vd, Vs, %0) : : "r"(t))
// vmacc.{b,h,w}.* wrappers, with and without the ".m" suffix. `_vv` macros
// forward Vd/Vs/Vt verbatim to ARGS_F_A_A_A; `_vx` macros bind `t` to operand
// %0 through an "r" input constraint.
#define vmacc_b_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmacc.b.vv", Vd, Vs, Vt))
#define vmacc_b_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmacc.b.vx", Vd, Vs, %0) : : "r"(t))
#define vmacc_b_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmacc.b.vv.m", Vd, Vs, Vt))
#define vmacc_b_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmacc.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmacc_h_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmacc.h.vv", Vd, Vs, Vt))
#define vmacc_h_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmacc.h.vx", Vd, Vs, %0) : : "r"(t))
#define vmacc_h_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmacc.h.vv.m", Vd, Vs, Vt))
#define vmacc_h_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmacc.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmacc_w_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmacc.w.vv", Vd, Vs, Vt))
#define vmacc_w_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmacc.w.vx", Vd, Vs, %0) : : "r"(t))
#define vmacc_w_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmacc.w.vv.m", Vd, Vs, Vt))
#define vmacc_w_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmacc.w.vx.m", Vd, Vs, %0) : : "r"(t))
// vmadd.{b,h,w}.* wrappers, with and without the ".m" suffix. `_vv` macros
// forward Vd/Vs/Vt verbatim to ARGS_F_A_A_A; `_vx` macros bind `t` to operand
// %0 through an "r" input constraint.
#define vmadd_b_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmadd.b.vv", Vd, Vs, Vt))
#define vmadd_b_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmadd.b.vx", Vd, Vs, %0) : : "r"(t))
#define vmadd_b_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmadd.b.vv.m", Vd, Vs, Vt))
#define vmadd_b_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmadd.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmadd_h_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmadd.h.vv", Vd, Vs, Vt))
#define vmadd_h_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmadd.h.vx", Vd, Vs, %0) : : "r"(t))
#define vmadd_h_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmadd.h.vv.m", Vd, Vs, Vt))
#define vmadd_h_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmadd.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vmadd_w_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmadd.w.vv", Vd, Vs, Vt))
#define vmadd_w_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmadd.w.vx", Vd, Vs, %0) : : "r"(t))
#define vmadd_w_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmadd.w.vv.m", Vd, Vs, Vt))
#define vmadd_w_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vmadd.w.vx.m", Vd, Vs, %0) : : "r"(t))
// 110 Shuffle
// vsliden.{b,h,w}.{1,2,3,4}.{vv,vx} wrappers. `_vv` macros forward Vd/Vs/Vt
// verbatim to ARGS_F_A_A_A; `_vx` macros bind `t` to operand %0 through an
// "r" input constraint.
#define vsliden_b_1_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsliden.b.1.vv", Vd, Vs, Vt))
#define vsliden_b_1_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsliden.b.1.vx", Vd, Vs, %0) : : "r"(t))
#define vsliden_b_2_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsliden.b.2.vv", Vd, Vs, Vt))
#define vsliden_b_2_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsliden.b.2.vx", Vd, Vs, %0) : : "r"(t))
#define vsliden_b_3_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsliden.b.3.vv", Vd, Vs, Vt))
#define vsliden_b_3_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsliden.b.3.vx", Vd, Vs, %0) : : "r"(t))
#define vsliden_b_4_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsliden.b.4.vv", Vd, Vs, Vt))
#define vsliden_b_4_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsliden.b.4.vx", Vd, Vs, %0) : : "r"(t))
#define vsliden_h_1_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsliden.h.1.vv", Vd, Vs, Vt))
#define vsliden_h_1_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsliden.h.1.vx", Vd, Vs, %0) : : "r"(t))
#define vsliden_h_2_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsliden.h.2.vv", Vd, Vs, Vt))
#define vsliden_h_2_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsliden.h.2.vx", Vd, Vs, %0) : : "r"(t))
#define vsliden_h_3_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsliden.h.3.vv", Vd, Vs, Vt))
#define vsliden_h_3_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsliden.h.3.vx", Vd, Vs, %0) : : "r"(t))
#define vsliden_h_4_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsliden.h.4.vv", Vd, Vs, Vt))
#define vsliden_h_4_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsliden.h.4.vx", Vd, Vs, %0) : : "r"(t))
#define vsliden_w_1_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsliden.w.1.vv", Vd, Vs, Vt))
#define vsliden_w_1_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsliden.w.1.vx", Vd, Vs, %0) : : "r"(t))
#define vsliden_w_2_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsliden.w.2.vv", Vd, Vs, Vt))
#define vsliden_w_2_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsliden.w.2.vx", Vd, Vs, %0) : : "r"(t))
#define vsliden_w_3_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsliden.w.3.vv", Vd, Vs, Vt))
#define vsliden_w_3_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsliden.w.3.vx", Vd, Vs, %0) : : "r"(t))
#define vsliden_w_4_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsliden.w.4.vv", Vd, Vs, Vt))
#define vsliden_w_4_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsliden.w.4.vx", Vd, Vs, %0) : : "r"(t))
// vslidevn.{b,h,w}.{1,2,3,4}.{vv,vx}.m wrappers. `_vv_m` macros forward
// Vd/Vs/Vt verbatim to ARGS_F_A_A_A; `_vx_m` macros bind `t` to operand %0
// through an "r" input constraint.
#define vslidevn_b_1_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevn.b.1.vv.m", Vd, Vs, Vt))
#define vslidevn_b_1_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevn.b.1.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidevn_b_2_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevn.b.2.vv.m", Vd, Vs, Vt))
#define vslidevn_b_2_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevn.b.2.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidevn_b_3_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevn.b.3.vv.m", Vd, Vs, Vt))
#define vslidevn_b_3_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevn.b.3.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidevn_b_4_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevn.b.4.vv.m", Vd, Vs, Vt))
#define vslidevn_b_4_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevn.b.4.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidevn_h_1_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevn.h.1.vv.m", Vd, Vs, Vt))
#define vslidevn_h_1_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevn.h.1.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidevn_h_2_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevn.h.2.vv.m", Vd, Vs, Vt))
#define vslidevn_h_2_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevn.h.2.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidevn_h_3_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevn.h.3.vv.m", Vd, Vs, Vt))
#define vslidevn_h_3_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevn.h.3.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidevn_h_4_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevn.h.4.vv.m", Vd, Vs, Vt))
#define vslidevn_h_4_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevn.h.4.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidevn_w_1_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevn.w.1.vv.m", Vd, Vs, Vt))
#define vslidevn_w_1_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevn.w.1.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidevn_w_2_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevn.w.2.vv.m", Vd, Vs, Vt))
#define vslidevn_w_2_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevn.w.2.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidevn_w_3_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevn.w.3.vv.m", Vd, Vs, Vt))
#define vslidevn_w_3_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevn.w.3.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidevn_w_4_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevn.w.4.vv.m", Vd, Vs, Vt))
#define vslidevn_w_4_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevn.w.4.vx.m", Vd, Vs, %0) : : "r"(t))
// vslidehn.{b,h,w}.{1,2,3,4}.{vv,vx}.m wrappers. `_vv_m` macros forward
// Vd/Vs/Vt verbatim to ARGS_F_A_A_A; `_vx_m` macros bind `t` to operand %0
// through an "r" input constraint.
#define vslidehn_b_1_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehn.b.1.vv.m", Vd, Vs, Vt))
#define vslidehn_b_1_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehn.b.1.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidehn_b_2_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehn.b.2.vv.m", Vd, Vs, Vt))
#define vslidehn_b_2_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehn.b.2.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidehn_b_3_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehn.b.3.vv.m", Vd, Vs, Vt))
#define vslidehn_b_3_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehn.b.3.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidehn_b_4_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehn.b.4.vv.m", Vd, Vs, Vt))
#define vslidehn_b_4_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehn.b.4.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidehn_h_1_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehn.h.1.vv.m", Vd, Vs, Vt))
#define vslidehn_h_1_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehn.h.1.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidehn_h_2_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehn.h.2.vv.m", Vd, Vs, Vt))
#define vslidehn_h_2_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehn.h.2.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidehn_h_3_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehn.h.3.vv.m", Vd, Vs, Vt))
#define vslidehn_h_3_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehn.h.3.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidehn_h_4_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehn.h.4.vv.m", Vd, Vs, Vt))
#define vslidehn_h_4_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehn.h.4.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidehn_w_1_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehn.w.1.vv.m", Vd, Vs, Vt))
#define vslidehn_w_1_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehn.w.1.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidehn_w_2_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehn.w.2.vv.m", Vd, Vs, Vt))
#define vslidehn_w_2_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehn.w.2.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidehn_w_3_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehn.w.3.vv.m", Vd, Vs, Vt))
#define vslidehn_w_3_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehn.w.3.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidehn_w_4_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehn.w.4.vv.m", Vd, Vs, Vt))
#define vslidehn_w_4_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehn.w.4.vx.m", Vd, Vs, %0) : : "r"(t))
// vslidep.{b,h,w}.{1,2,3,4}.{vv,vx} wrappers. `_vv` macros forward Vd/Vs/Vt
// verbatim to ARGS_F_A_A_A; `_vx` macros bind `t` to operand %0 through an
// "r" input constraint.
#define vslidep_b_1_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidep.b.1.vv", Vd, Vs, Vt))
#define vslidep_b_1_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidep.b.1.vx", Vd, Vs, %0) : : "r"(t))
#define vslidep_b_2_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidep.b.2.vv", Vd, Vs, Vt))
#define vslidep_b_2_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidep.b.2.vx", Vd, Vs, %0) : : "r"(t))
#define vslidep_b_3_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidep.b.3.vv", Vd, Vs, Vt))
#define vslidep_b_3_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidep.b.3.vx", Vd, Vs, %0) : : "r"(t))
#define vslidep_b_4_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidep.b.4.vv", Vd, Vs, Vt))
#define vslidep_b_4_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidep.b.4.vx", Vd, Vs, %0) : : "r"(t))
#define vslidep_h_1_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidep.h.1.vv", Vd, Vs, Vt))
#define vslidep_h_1_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidep.h.1.vx", Vd, Vs, %0) : : "r"(t))
#define vslidep_h_2_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidep.h.2.vv", Vd, Vs, Vt))
#define vslidep_h_2_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidep.h.2.vx", Vd, Vs, %0) : : "r"(t))
#define vslidep_h_3_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidep.h.3.vv", Vd, Vs, Vt))
#define vslidep_h_3_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidep.h.3.vx", Vd, Vs, %0) : : "r"(t))
#define vslidep_h_4_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidep.h.4.vv", Vd, Vs, Vt))
#define vslidep_h_4_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidep.h.4.vx", Vd, Vs, %0) : : "r"(t))
#define vslidep_w_1_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidep.w.1.vv", Vd, Vs, Vt))
#define vslidep_w_1_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidep.w.1.vx", Vd, Vs, %0) : : "r"(t))
#define vslidep_w_2_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidep.w.2.vv", Vd, Vs, Vt))
#define vslidep_w_2_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidep.w.2.vx", Vd, Vs, %0) : : "r"(t))
#define vslidep_w_3_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidep.w.3.vv", Vd, Vs, Vt))
#define vslidep_w_3_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidep.w.3.vx", Vd, Vs, %0) : : "r"(t))
#define vslidep_w_4_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidep.w.4.vv", Vd, Vs, Vt))
#define vslidep_w_4_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidep.w.4.vx", Vd, Vs, %0) : : "r"(t))
// vslidevp.{b,h,w}.{1,2,3,4}.{vv,vx}.m wrappers. `_vv_m` macros forward
// Vd/Vs/Vt verbatim to ARGS_F_A_A_A; `_vx_m` macros bind `t` to operand %0
// through an "r" input constraint.
#define vslidevp_b_1_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevp.b.1.vv.m", Vd, Vs, Vt))
#define vslidevp_b_1_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevp.b.1.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidevp_b_2_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevp.b.2.vv.m", Vd, Vs, Vt))
#define vslidevp_b_2_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevp.b.2.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidevp_b_3_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevp.b.3.vv.m", Vd, Vs, Vt))
#define vslidevp_b_3_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevp.b.3.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidevp_b_4_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevp.b.4.vv.m", Vd, Vs, Vt))
#define vslidevp_b_4_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevp.b.4.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidevp_h_1_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevp.h.1.vv.m", Vd, Vs, Vt))
#define vslidevp_h_1_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevp.h.1.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidevp_h_2_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevp.h.2.vv.m", Vd, Vs, Vt))
#define vslidevp_h_2_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevp.h.2.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidevp_h_3_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevp.h.3.vv.m", Vd, Vs, Vt))
#define vslidevp_h_3_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevp.h.3.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidevp_h_4_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevp.h.4.vv.m", Vd, Vs, Vt))
#define vslidevp_h_4_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevp.h.4.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidevp_w_1_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevp.w.1.vv.m", Vd, Vs, Vt))
#define vslidevp_w_1_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevp.w.1.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidevp_w_2_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevp.w.2.vv.m", Vd, Vs, Vt))
#define vslidevp_w_2_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevp.w.2.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidevp_w_3_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevp.w.3.vv.m", Vd, Vs, Vt))
#define vslidevp_w_3_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevp.w.3.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidevp_w_4_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevp.w.4.vv.m", Vd, Vs, Vt))
#define vslidevp_w_4_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidevp.w.4.vx.m", Vd, Vs, %0) : : "r"(t))
// vslidehp.{b,h,w}.{1,2,3,4}.{vv,vx}.m wrappers. `_vv_m` macros forward
// Vd/Vs/Vt verbatim to ARGS_F_A_A_A; `_vx_m` macros bind `t` to operand %0
// through an "r" input constraint.
#define vslidehp_b_1_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehp.b.1.vv.m", Vd, Vs, Vt))
#define vslidehp_b_1_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehp.b.1.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidehp_b_2_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehp.b.2.vv.m", Vd, Vs, Vt))
#define vslidehp_b_2_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehp.b.2.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidehp_b_3_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehp.b.3.vv.m", Vd, Vs, Vt))
#define vslidehp_b_3_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehp.b.3.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidehp_b_4_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehp.b.4.vv.m", Vd, Vs, Vt))
#define vslidehp_b_4_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehp.b.4.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidehp_h_1_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehp.h.1.vv.m", Vd, Vs, Vt))
#define vslidehp_h_1_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehp.h.1.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidehp_h_2_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehp.h.2.vv.m", Vd, Vs, Vt))
#define vslidehp_h_2_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehp.h.2.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidehp_h_3_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehp.h.3.vv.m", Vd, Vs, Vt))
#define vslidehp_h_3_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehp.h.3.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidehp_h_4_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehp.h.4.vv.m", Vd, Vs, Vt))
#define vslidehp_h_4_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehp.h.4.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidehp_w_1_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehp.w.1.vv.m", Vd, Vs, Vt))
#define vslidehp_w_1_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehp.w.1.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidehp_w_2_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehp.w.2.vv.m", Vd, Vs, Vt))
#define vslidehp_w_2_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehp.w.2.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidehp_w_3_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehp.w.3.vv.m", Vd, Vs, Vt))
#define vslidehp_w_3_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehp.w.3.vx.m", Vd, Vs, %0) : : "r"(t))
#define vslidehp_w_4_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehp.w.4.vv.m", Vd, Vs, Vt))
#define vslidehp_w_4_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vslidehp.w.4.vx.m", Vd, Vs, %0) : : "r"(t))
// vsel.{b,h,w}.* wrappers, with and without the ".m" suffix. `_vv` macros
// forward Vd/Vs/Vt verbatim to ARGS_F_A_A_A; `_vx` macros bind `t` to operand
// %0 through an "r" input constraint.
#define vsel_b_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsel.b.vv", Vd, Vs, Vt))
#define vsel_b_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsel.b.vx", Vd, Vs, %0) : : "r"(t))
#define vsel_b_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsel.b.vv.m", Vd, Vs, Vt))
#define vsel_b_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsel.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vsel_h_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsel.h.vv", Vd, Vs, Vt))
#define vsel_h_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsel.h.vx", Vd, Vs, %0) : : "r"(t))
#define vsel_h_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsel.h.vv.m", Vd, Vs, Vt))
#define vsel_h_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsel.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vsel_w_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsel.w.vv", Vd, Vs, Vt))
#define vsel_w_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsel.w.vx", Vd, Vs, %0) : : "r"(t))
#define vsel_w_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsel.w.vv.m", Vd, Vs, Vt))
#define vsel_w_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vsel.w.vx.m", Vd, Vs, %0) : : "r"(t))
// vevn.{b,h,w}.* wrappers, with and without the ".m" suffix. `_vv` macros
// forward Vd/Vs/Vt verbatim to ARGS_F_A_A_A; `_vx` macros bind `t` to operand
// %0 through an "r" input constraint.
#define vevn_b_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vevn.b.vv", Vd, Vs, Vt))
#define vevn_b_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vevn.b.vx", Vd, Vs, %0) : : "r"(t))
#define vevn_b_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vevn.b.vv.m", Vd, Vs, Vt))
#define vevn_b_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vevn.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vevn_h_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vevn.h.vv", Vd, Vs, Vt))
#define vevn_h_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vevn.h.vx", Vd, Vs, %0) : : "r"(t))
#define vevn_h_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vevn.h.vv.m", Vd, Vs, Vt))
#define vevn_h_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vevn.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vevn_w_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vevn.w.vv", Vd, Vs, Vt))
#define vevn_w_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vevn.w.vx", Vd, Vs, %0) : : "r"(t))
#define vevn_w_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vevn.w.vv.m", Vd, Vs, Vt))
#define vevn_w_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vevn.w.vx.m", Vd, Vs, %0) : : "r"(t))
// vodd.{b,h,w}.* wrappers, with and without the ".m" suffix. `_vv` macros
// forward Vd/Vs/Vt verbatim to ARGS_F_A_A_A; `_vx` macros bind `t` to operand
// %0 through an "r" input constraint.
#define vodd_b_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vodd.b.vv", Vd, Vs, Vt))
#define vodd_b_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vodd.b.vx", Vd, Vs, %0) : : "r"(t))
#define vodd_b_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vodd.b.vv.m", Vd, Vs, Vt))
#define vodd_b_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vodd.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vodd_h_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vodd.h.vv", Vd, Vs, Vt))
#define vodd_h_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vodd.h.vx", Vd, Vs, %0) : : "r"(t))
#define vodd_h_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vodd.h.vv.m", Vd, Vs, Vt))
#define vodd_h_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vodd.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vodd_w_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vodd.w.vv", Vd, Vs, Vt))
#define vodd_w_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vodd.w.vx", Vd, Vs, %0) : : "r"(t))
#define vodd_w_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vodd.w.vv.m", Vd, Vs, Vt))
#define vodd_w_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vodd.w.vx.m", Vd, Vs, %0) : : "r"(t))
// vevnodd.{b,h,w}.* wrappers, with and without the ".m" suffix. `_vv` macros
// forward Vd/Vs/Vt verbatim to ARGS_F_A_A_A; `_vx` macros bind `t` to operand
// %0 through an "r" input constraint.
#define vevnodd_b_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vevnodd.b.vv", Vd, Vs, Vt))
#define vevnodd_b_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vevnodd.b.vx", Vd, Vs, %0) : : "r"(t))
#define vevnodd_b_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vevnodd.b.vv.m", Vd, Vs, Vt))
#define vevnodd_b_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vevnodd.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vevnodd_h_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vevnodd.h.vv", Vd, Vs, Vt))
#define vevnodd_h_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vevnodd.h.vx", Vd, Vs, %0) : : "r"(t))
#define vevnodd_h_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vevnodd.h.vv.m", Vd, Vs, Vt))
#define vevnodd_h_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vevnodd.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vevnodd_w_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vevnodd.w.vv", Vd, Vs, Vt))
#define vevnodd_w_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vevnodd.w.vx", Vd, Vs, %0) : : "r"(t))
#define vevnodd_w_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vevnodd.w.vv.m", Vd, Vs, Vt))
#define vevnodd_w_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vevnodd.w.vx.m", Vd, Vs, %0) : : "r"(t))
// vzip.{b,h,w}.* wrappers, with and without the ".m" suffix. `_vv` macros
// forward Vd/Vs/Vt verbatim to ARGS_F_A_A_A; `_vx` macros bind `t` to operand
// %0 through an "r" input constraint.
#define vzip_b_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vzip.b.vv", Vd, Vs, Vt))
#define vzip_b_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vzip.b.vx", Vd, Vs, %0) : : "r"(t))
#define vzip_b_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vzip.b.vv.m", Vd, Vs, Vt))
#define vzip_b_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vzip.b.vx.m", Vd, Vs, %0) : : "r"(t))
#define vzip_h_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vzip.h.vv", Vd, Vs, Vt))
#define vzip_h_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vzip.h.vx", Vd, Vs, %0) : : "r"(t))
#define vzip_h_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vzip.h.vv.m", Vd, Vs, Vt))
#define vzip_h_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vzip.h.vx.m", Vd, Vs, %0) : : "r"(t))
#define vzip_w_vv(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vzip.w.vv", Vd, Vs, Vt))
#define vzip_w_vx(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vzip.w.vx", Vd, Vs, %0) : : "r"(t))
#define vzip_w_vv_m(Vd, Vs, Vt) \
  __asm__ __volatile__(ARGS_F_A_A_A("vzip.w.vv.m", Vd, Vs, Vt))
#define vzip_w_vx_m(Vd, Vs, t) \
  __asm__ __volatile__(ARGS_F_A_A_A("vzip.w.vx.m", Vd, Vs, %0) : : "r"(t))
// 3arg
// Four-operand ".vxv" wrappers built with ARGS_F_A_A_A_A: Vd, Vs and Vr are
// forwarded verbatim, while `t` is bound to operand %0 (third position)
// through an "r" input constraint.
#define aconv_vxv(Vd, Vs, t, Vr) \
  __asm__ __volatile__(ARGS_F_A_A_A_A("aconv.vxv", Vd, Vs, %0, Vr) : : "r"(t))
#define adwconv_vxv(Vd, Vs, t, Vr) \
  __asm__ __volatile__(ARGS_F_A_A_A_A("adwconv.vxv", Vd, Vs, %0, Vr) : : "r"(t))
#define vdwconv_vxv(Vd, Vs, t, Vr) \
  __asm__ __volatile__(ARGS_F_A_A_A_A("vdwconv.vxv", Vd, Vs, %0, Vr) : : "r"(t))
#endif // CRT_KELVIN_INTRINSICS_H_
// clang-format on