src - FreeBSD source tree

diff options


context:
space:
mode:

author	Dimitry Andric <dim@FreeBSD.org>	2021-08-25 18:31:14 +0000
committer	Dimitry Andric <dim@FreeBSD.org>	2021-12-25 11:51:35 +0000
commit	0fa51cfc680260c79257f065769557b2988d7ff9 (patch)
tree	3c18c3440b6f09ebf3cafe783af80e9bc9cbc8d8 /contrib/llvm-project/llvm/lib/Target/RISCV/RISCVInstrInfoV.td
parent	c7893a8deb0057939976283af6e9c283b53f32d0 (diff)
download	src-0fa51cfc680260c79257f065769557b2988d7ff9.tar.gz src-0fa51cfc680260c79257f065769557b2988d7ff9.zip

Merge llvm-project release/13.x llvmorg-13.0.0-rc1-97-g23ba3732246a

This updates llvm, clang, compiler-rt, libc++, libunwind, lld, lldb and openmp to llvmorg-13.0.0-rc1-97-g23ba3732246a.

PR: 258209
MFC after: 2 weeks

(cherry picked from commit 6e75b2fbf9a03e6876e0a3c089e0b3ad71876125)

Diffstat (limited to 'contrib/llvm-project/llvm/lib/Target/RISCV/RISCVInstrInfoV.td')

-rw-r--r--

contrib/llvm-project/llvm/lib/Target/RISCV/RISCVInstrInfoV.td

1003

1 files changed, 715 insertions, 288 deletions

diff --git a/contrib/llvm-project/llvm/lib/Target/RISCV/RISCVInstrInfoV.td b/contrib/llvm-project/llvm/lib/Target/RISCV/RISCVInstrInfoV.td
index 342497150d49..8af3c8f5cfdb 100644
--- a/contrib/llvm-project/llvm/lib/Target/RISCV/RISCVInstrInfoV.td
+++ b/contrib/llvm-project/llvm/lib/Target/RISCV/RISCVInstrInfoV.td

@@ -78,6 +78,39 @@ def simm5_plus1 : Operand<XLenVT>, ImmLeaf<XLenVT,

}

//===----------------------------------------------------------------------===//

+// Scheduling definitions.

+//===----------------------------------------------------------------------===//

+class VMVRSched<int n>: Sched <[!cast<SchedReadWrite>("WriteVMov" # n # "V"),

+ !cast<SchedReadWrite>("ReadVMov" # n # "V")]>;

+class VLESched<int n> : Sched <[!cast<SchedReadWrite>("WriteVLDE" # n),

+ ReadVLDX, ReadVMask]>;

+class VSESched<int n> : Sched <[!cast<SchedReadWrite>("WriteVSTE" # n),

+ !cast<SchedReadWrite>("ReadVSTE" # n # "V"),

+ ReadVSTX, ReadVMask]>;

+class VLSSched<int n> : Sched <[!cast<SchedReadWrite>("WriteVLDS" # n),

+ ReadVLDX, ReadVLDSX, ReadVMask]>;

+class VSSSched<int n> : Sched <[!cast<SchedReadWrite>("WriteVSTS" # n),

+ !cast<SchedReadWrite>("ReadVSTS" # n # "V"),

+ ReadVSTX, ReadVSTSX, ReadVMask]>;

+class VLXSched<int n, string o> :

+ Sched <[!cast<SchedReadWrite>("WriteVLD" # o # "X" # n),

+ ReadVLDX, !cast<SchedReadWrite>("ReadVLD" # o # "XV"), ReadVMask]>;

+class VSXSched<int n, string o> :

+ Sched <[!cast<SchedReadWrite>("WriteVST" # o # "X" # n),

+ !cast<SchedReadWrite>("ReadVST" # o # "X" # n),

+ ReadVSTX, !cast<SchedReadWrite>("ReadVST" # o # "XV"), ReadVMask]>;

+class VLFSched<int n> : Sched <[!cast<SchedReadWrite>("WriteVLDFF" # n),

+ ReadVLDX, ReadVMask]>;

+//===----------------------------------------------------------------------===//

// Instruction class templates

//===----------------------------------------------------------------------===//

@@ -328,106 +361,417 @@ class VAMONoWd<RISCVAMOOP amoop, RISCVWidth width, string opcodestr>

// Use these multiclasses to define instructions more easily.

//===----------------------------------------------------------------------===//

multiclass VALU_IV_V_X_I<string opcodestr, bits<6> funct6, Operand optype = simm5, string vw = "v"> {

- def V : VALUVV<funct6, OPIVV, opcodestr # "." # vw # "v">;

- def X : VALUVX<funct6, OPIVX, opcodestr # "." # vw # "x">;

- def I : VALUVI<funct6, opcodestr # "." # vw # "i", optype>;

+ def V : VALUVV<funct6, OPIVV, opcodestr # "." # vw # "v">,

+ Sched<[WriteVIALUV, ReadVIALUV, ReadVIALUV, ReadVMask]>;

+ def X : VALUVX<funct6, OPIVX, opcodestr # "." # vw # "x">,

+ Sched<[WriteVIALUX, ReadVIALUV, ReadVIALUX, ReadVMask]>;

+ def I : VALUVI<funct6, opcodestr # "." # vw # "i", optype>,

+ Sched<[WriteVIALUI, ReadVIALUV, ReadVMask]>;

}

multiclass VALU_IV_V_X<string opcodestr, bits<6> funct6, string vw = "v"> {

- def V : VALUVV<funct6, OPIVV, opcodestr # "." # vw # "v">;

- def X : VALUVX<funct6, OPIVX, opcodestr # "." # vw # "x">;

+ def V : VALUVV<funct6, OPIVV, opcodestr # "." # vw # "v">,

+ Sched<[WriteVIALUV, ReadVIALUV, ReadVIALUV, ReadVMask]>;

+ def X : VALUVX<funct6, OPIVX, opcodestr # "." # vw # "x">,

+ Sched<[WriteVIALUX, ReadVIALUV, ReadVIALUX, ReadVMask]>;

}

-multiclass VALUr_IV_V_X<string opcodestr, bits<6> funct6, string vw = "v"> {

- def V : VALUrVV<funct6, OPIVV, opcodestr # "." # vw # "v">;

- def X : VALUrVX<funct6, OPIVX, opcodestr # "." # vw # "x">;

+multiclass VALU_IV_X_I<string opcodestr, bits<6> funct6, Operand optype = simm5, string vw = "v"> {

+ def X : VALUVX<funct6, OPIVX, opcodestr # "." # vw # "x">,

+ Sched<[WriteVIALUV, ReadVIALUV, ReadVIALUX, ReadVMask]>;

+ def I : VALUVI<funct6, opcodestr # "." # vw # "i", optype>,

+ Sched<[WriteVIALUI, ReadVIALUV, ReadVMask]>;

}

-multiclass VALU_IV_X_I<string opcodestr, bits<6> funct6, Operand optype = simm5, string vw = "v"> {

- def X : VALUVX<funct6, OPIVX, opcodestr # "." # vw # "x">;

- def I : VALUVI<funct6, opcodestr # "." # vw # "i", optype>;

+multiclass VALU_MV_V_X<string opcodestr, bits<6> funct6, string vw = "v"> {

+ def V : VALUVV<funct6, OPMVV, opcodestr # "." # vw # "v">,

+ Sched<[WriteVIWALUV, ReadVIWALUV, ReadVIWALUV, ReadVMask]>;

+ def X : VALUVX<funct6, OPMVX, opcodestr # "." # vw # "x">,

+ Sched<[WriteVIWALUX, ReadVIWALUV, ReadVIWALUX, ReadVMask]>;

}

-multiclass VALU_IV_V<string opcodestr, bits<6> funct6> {

- def _VS : VALUVV<funct6, OPIVV, opcodestr # ".vs">;

+multiclass VMAC_MV_V_X<string opcodestr, bits<6> funct6, string vw = "v"> {

+ def V : VALUrVV<funct6, OPMVV, opcodestr # "." # vw # "v">,

+ Sched<[WriteVIMulAddV, ReadVIMulAddV, ReadVIMulAddV, ReadVMask]>;

+ def X : VALUrVX<funct6, OPMVX, opcodestr # "." # vw # "x">,

+ Sched<[WriteVIMulAddX, ReadVIMulAddV, ReadVIMulAddX, ReadVMask]>;

}

-multiclass VALUr_IV_X<string opcodestr, bits<6> funct6, string vw = "v"> {

- def X : VALUrVX<funct6, OPIVX, opcodestr # "." # vw # "x">;

+multiclass VWMAC_MV_V_X<string opcodestr, bits<6> funct6, string vw = "v"> {

+ def V : VALUrVV<funct6, OPMVV, opcodestr # "." # vw # "v">,

+ Sched<[WriteVIWMulAddV, ReadVIWMulAddV, ReadVIWMulAddV, ReadVMask]>;

+ def X : VALUrVX<funct6, OPMVX, opcodestr # "." # vw # "x">,

+ Sched<[WriteVIWMulAddX, ReadVIWMulAddV, ReadVIWMulAddX, ReadVMask]>;

}

-multiclass VALU_MV_V_X<string opcodestr, bits<6> funct6, string vw = "v"> {

- def V : VALUVV<funct6, OPMVV, opcodestr # "." # vw # "v">;

- def X : VALUVX<funct6, OPMVX, opcodestr # "." # vw # "x">;

+multiclass VWMAC_MV_X<string opcodestr, bits<6> funct6, string vw = "v"> {

+ def X : VALUrVX<funct6, OPMVX, opcodestr # "." # vw # "x">,

+ Sched<[WriteVIWMulAddX, ReadVIWMulAddV, ReadVIWMulAddX, ReadVMask]>;

+multiclass VALU_MV_VS2<string opcodestr, bits<6> funct6, bits<5> vs1> {

+ def "" : VALUVs2<funct6, vs1, OPMVV, opcodestr>,

+ Sched<[WriteVExtV, ReadVExtV, ReadVMask]>;

+multiclass VALUm_IV_V_X_I<string opcodestr, bits<6> funct6> {

+ def VM : VALUmVV<funct6, OPIVV, opcodestr # ".vvm">,

+ Sched<[WriteVICALUV, ReadVIALUCV, ReadVIALUCV, ReadVMask]>;

+ def XM : VALUmVX<funct6, OPIVX, opcodestr # ".vxm">,

+ Sched<[WriteVICALUX, ReadVIALUCV, ReadVIALUCX, ReadVMask]>;

+ def IM : VALUmVI<funct6, opcodestr # ".vim">,

+ Sched<[WriteVICALUI, ReadVIALUCV, ReadVMask]>;

}

-multiclass VALU_MV_V<string opcodestr, bits<6> funct6> {

- def _VS : VALUVV<funct6, OPMVV, opcodestr # ".vs">;

+multiclass VMRG_IV_V_X_I<string opcodestr, bits<6> funct6> {

+ def VM : VALUmVV<funct6, OPIVV, opcodestr # ".vvm">,

+ Sched<[WriteVIMergeV, ReadVIMergeV, ReadVIMergeV, ReadVMask]>;

+ def XM : VALUmVX<funct6, OPIVX, opcodestr # ".vxm">,

+ Sched<[WriteVIMergeX, ReadVIMergeV, ReadVIMergeX, ReadVMask]>;

+ def IM : VALUmVI<funct6, opcodestr # ".vim">,

+ Sched<[WriteVIMergeI, ReadVIMergeV, ReadVMask]>;

}

-multiclass VALU_MV_Mask<string opcodestr, bits<6> funct6, string vm = "v"> {

- def M : VALUVVNoVm<funct6, OPMVV, opcodestr # "." # vm # "m">;

+multiclass VALUm_IV_V_X<string opcodestr, bits<6> funct6> {

+ def VM : VALUmVV<funct6, OPIVV, opcodestr # ".vvm">,

+ Sched<[WriteVICALUV, ReadVIALUCV, ReadVIALUCV, ReadVMask]>;

+ def XM : VALUmVX<funct6, OPIVX, opcodestr # ".vxm">,

+ Sched<[WriteVICALUX, ReadVIALUCV, ReadVIALUCX, ReadVMask]>;

}

-multiclass VALU_MV_X<string opcodestr, bits<6> funct6, string vw = "v"> {

- def X : VALUVX<funct6, OPMVX, opcodestr # "." # vw # "x">;

+multiclass VALUNoVm_IV_V_X_I<string opcodestr, bits<6> funct6, Operand optype = simm5> {

+ def V : VALUVVNoVm<funct6, OPIVV, opcodestr # ".vv">,

+ Sched<[WriteVICALUV, ReadVIALUCV, ReadVIALUCV]>;

+ def X : VALUVXNoVm<funct6, OPIVX, opcodestr # ".vx">,

+ Sched<[WriteVICALUX, ReadVIALUCV, ReadVIALUCX]>;

+ def I : VALUVINoVm<funct6, opcodestr # ".vi", optype>,

+ Sched<[WriteVICALUI, ReadVIALUCV]>;

}

-multiclass VALUr_MV_V_X<string opcodestr, bits<6> funct6, string vw = "v"> {

- def V : VALUrVV<funct6, OPMVV, opcodestr # "." # vw # "v">;

- def X : VALUrVX<funct6, OPMVX, opcodestr # "." # vw # "x">;

+multiclass VALUNoVm_IV_V_X<string opcodestr, bits<6> funct6> {

+ def V : VALUVVNoVm<funct6, OPIVV, opcodestr # ".vv">,

+ Sched<[WriteVICALUV, ReadVIALUCV, ReadVIALUCV]>;

+ def X : VALUVXNoVm<funct6, OPIVX, opcodestr # ".vx">,

+ Sched<[WriteVICALUX, ReadVIALUCV, ReadVIALUCX]>;

}

-multiclass VALUr_MV_X<string opcodestr, bits<6> funct6, string vw = "v"> {

- def X : VALUrVX<funct6, OPMVX, opcodestr # "." # vw # "x">;

+multiclass VALU_FV_V_F<string opcodestr, bits<6> funct6, string vw = "v"> {

+ def V : VALUVV<funct6, OPFVV, opcodestr # "." # vw # "v">,

+ Sched<[WriteVFALUV, ReadVFALUV, ReadVFALUV, ReadVMask]>;

+ def F : VALUVF<funct6, OPFVF, opcodestr # "." # vw # "f">,

+ Sched<[WriteVFALUF, ReadVFALUV, ReadVFALUF, ReadVMask]>;

}

-multiclass VALU_MV_VS2<string opcodestr, bits<6> funct6, bits<5> vs1> {

- def "" : VALUVs2<funct6, vs1, OPMVV, opcodestr>;

+multiclass VALU_FV_F<string opcodestr, bits<6> funct6, string vw = "v"> {

+ def F : VALUVF<funct6, OPFVF, opcodestr # "." # vw # "f">,

+ Sched<[WriteVFALUF, ReadVFALUV, ReadVFALUF, ReadVMask]>;

}

-multiclass VALUm_IV_V_X_I<string opcodestr, bits<6> funct6> {

- def VM : VALUmVV<funct6, OPIVV, opcodestr # ".vvm">;

- def XM : VALUmVX<funct6, OPIVX, opcodestr # ".vxm">;

- def IM : VALUmVI<funct6, opcodestr # ".vim">;

+multiclass VWALU_FV_V_F<string opcodestr, bits<6> funct6, string vw = "v"> {

+ def V : VALUVV<funct6, OPFVV, opcodestr # "." # vw # "v">,

+ Sched<[WriteVFWALUV, ReadVFWALUV, ReadVFWALUV, ReadVMask]>;

+ def F : VALUVF<funct6, OPFVF, opcodestr # "." # vw # "f">,

+ Sched<[WriteVFWALUF, ReadVFWALUV, ReadVFWALUF, ReadVMask]>;

}

-multiclass VALUm_IV_V_X<string opcodestr, bits<6> funct6> {

- def VM : VALUmVV<funct6, OPIVV, opcodestr # ".vvm">;

- def XM : VALUmVX<funct6, OPIVX, opcodestr # ".vxm">;

+multiclass VMUL_FV_V_F<string opcodestr, bits<6> funct6, string vw = "v"> {

+ def V : VALUVV<funct6, OPFVV, opcodestr # "." # vw # "v">,

+ Sched<[WriteVFMulV, ReadVFMulV, ReadVFMulV, ReadVMask]>;

+ def F : VALUVF<funct6, OPFVF, opcodestr # "." # vw # "f">,

+ Sched<[WriteVFMulF, ReadVFMulV, ReadVFMulF, ReadVMask]>;

}

-multiclass VALUNoVm_IV_V_X_I<string opcodestr, bits<6> funct6, Operand optype = simm5> {

- def V : VALUVVNoVm<funct6, OPIVV, opcodestr # ".vv">;

- def X : VALUVXNoVm<funct6, OPIVX, opcodestr # ".vx">;

- def I : VALUVINoVm<funct6, opcodestr # ".vi", optype>;

+multiclass VDIV_FV_V_F<string opcodestr, bits<6> funct6, string vw = "v"> {

+ def V : VALUVV<funct6, OPFVV, opcodestr # "." # vw # "v">,

+ Sched<[WriteVFDivV, ReadVFDivV, ReadVFDivV, ReadVMask]>;

+ def F : VALUVF<funct6, OPFVF, opcodestr # "." # vw # "f">,

+ Sched<[WriteVFDivF, ReadVFDivV, ReadVFDivF, ReadVMask]>;

}

-multiclass VALUNoVm_IV_V_X<string opcodestr, bits<6> funct6> {

- def V : VALUVVNoVm<funct6, OPIVV, opcodestr # ".vv">;

- def X : VALUVXNoVm<funct6, OPIVX, opcodestr # ".vx">;

+multiclass VRDIV_FV_F<string opcodestr, bits<6> funct6, string vw = "v"> {

+ def F : VALUVF<funct6, OPFVF, opcodestr # "." # vw # "f">,

+ Sched<[WriteVFDivF, ReadVFDivV, ReadVFDivF, ReadVMask]>;

}

-multiclass VALU_FV_V_F<string opcodestr, bits<6> funct6, string vw = "v"> {

- def V : VALUVV<funct6, OPFVV, opcodestr # "." # vw # "v">;

- def F : VALUVF<funct6, OPFVF, opcodestr # "." # vw # "f">;

+multiclass VWMUL_FV_V_F<string opcodestr, bits<6> funct6, string vw = "v"> {

+ def V : VALUVV<funct6, OPFVV, opcodestr # "." # vw # "v">,

+ Sched<[WriteVFWMulV, ReadVFWMulV, ReadVFWMulV, ReadVMask]>;

+ def F : VALUVF<funct6, OPFVF, opcodestr # "." # vw # "f">,

+ Sched<[WriteVFWMulF, ReadVFWMulV, ReadVFWMulF, ReadVMask]>;

}

-multiclass VALU_FV_F<string opcodestr, bits<6> funct6, string vw = "v"> {

- def F : VALUVF<funct6, OPFVF, opcodestr # "." # vw # "f">;

+multiclass VMAC_FV_V_F<string opcodestr, bits<6> funct6, string vw = "v"> {

+ def V : VALUrVV<funct6, OPFVV, opcodestr # "." # vw # "v">,

+ Sched<[WriteVFMulAddV, ReadVFMulAddV, ReadVFMulAddV, ReadVMask]>;

+ def F : VALUrVF<funct6, OPFVF, opcodestr # "." # vw # "f">,

+ Sched<[WriteVFMulAddF, ReadVFMulAddV, ReadVFMulAddF, ReadVMask]>;

+multiclass VWMAC_FV_V_F<string opcodestr, bits<6> funct6, string vw = "v"> {

+ def V : VALUrVV<funct6, OPFVV, opcodestr # "." # vw # "v">,

+ Sched<[WriteVFWMulAddV, ReadVFWMulAddV, ReadVFWMulAddV, ReadVMask]>;

+ def F : VALUrVF<funct6, OPFVF, opcodestr # "." # vw # "f">,

+ Sched<[WriteVFWMulAddF, ReadVFWMulAddV, ReadVFWMulAddF, ReadVMask]>;

+multiclass VSQR_FV_VS2<string opcodestr, bits<6> funct6, bits<5> vs1> {

+ def "" : VALUVs2<funct6, vs1, OPFVV, opcodestr>,

+ Sched<[WriteVFSqrtV, ReadVFSqrtV, ReadVMask]>;

+multiclass VRCP_FV_VS2<string opcodestr, bits<6> funct6, bits<5> vs1> {

+ def "" : VALUVs2<funct6, vs1, OPFVV, opcodestr>,

+ Sched<[WriteVFRecpV, ReadVFRecpV, ReadVMask]>;

+multiclass VCMP_FV_V_F<string opcodestr, bits<6> funct6, string vw = "v"> {

+ def V : VALUVV<funct6, OPFVV, opcodestr # "." # vw # "v">,

+ Sched<[WriteVFCmpV, ReadVFCmpV, ReadVFCmpV, ReadVMask]>;

+ def F : VALUVF<funct6, OPFVF, opcodestr # "." # vw # "f">,

+ Sched<[WriteVFCmpF, ReadVFCmpV, ReadVFCmpF, ReadVMask]>;

+multiclass VCMP_FV_F<string opcodestr, bits<6> funct6, string vw = "v"> {

+ def F : VALUVF<funct6, OPFVF, opcodestr # "." # vw # "f">,

+ Sched<[WriteVFCmpF, ReadVFCmpV, ReadVFCmpF, ReadVMask]>;

+multiclass VSGNJ_FV_V_F<string opcodestr, bits<6> funct6, string vw = "v"> {

+ def V : VALUVV<funct6, OPFVV, opcodestr # "." # vw # "v">,

+ Sched<[WriteVFSgnjV, ReadVFSgnjV, ReadVFSgnjV, ReadVMask]>;

+ def F : VALUVF<funct6, OPFVF, opcodestr # "." # vw # "f">,

+ Sched<[WriteVFSgnjF, ReadVFSgnjV, ReadVFSgnjF, ReadVMask]>;

+multiclass VCLS_FV_VS2<string opcodestr, bits<6> funct6, bits<5> vs1> {

+ def "" : VALUVs2<funct6, vs1, OPFVV, opcodestr>,

+ Sched<[WriteVFClassV, ReadVFClassV, ReadVMask]>;

+multiclass VCVTF_IV_VS2<string opcodestr, bits<6> funct6, bits<5> vs1> {

+ def "" : VALUVs2<funct6, vs1, OPFVV, opcodestr>,

+ Sched<[WriteVFCvtIToFV, ReadVFCvtIToFV, ReadVMask]>;

+multiclass VCVTI_FV_VS2<string opcodestr, bits<6> funct6, bits<5> vs1> {

+ def "" : VALUVs2<funct6, vs1, OPFVV, opcodestr>,

+ Sched<[WriteVFCvtFToIV, ReadVFCvtFToIV, ReadVMask]>;

+multiclass VWCVTF_IV_VS2<string opcodestr, bits<6> funct6, bits<5> vs1> {

+ def "" : VALUVs2<funct6, vs1, OPFVV, opcodestr>,

+ Sched<[WriteVFWCvtIToFV, ReadVFWCvtIToFV, ReadVMask]>;

+multiclass VWCVTI_FV_VS2<string opcodestr, bits<6> funct6, bits<5> vs1> {

+ def "" : VALUVs2<funct6, vs1, OPFVV, opcodestr>,

+ Sched<[WriteVFWCvtFToIV, ReadVFWCvtFToIV, ReadVMask]>;

+multiclass VWCVTF_FV_VS2<string opcodestr, bits<6> funct6, bits<5> vs1> {

+ def "" : VALUVs2<funct6, vs1, OPFVV, opcodestr>,

+ Sched<[WriteVFWCvtFToFV, ReadVFWCvtFToFV, ReadVMask]>;

+multiclass VNCVTF_IV_VS2<string opcodestr, bits<6> funct6, bits<5> vs1> {

+ def "" : VALUVs2<funct6, vs1, OPFVV, opcodestr>,

+ Sched<[WriteVFNCvtIToFV, ReadVFNCvtIToFV, ReadVMask]>;

+multiclass VNCVTI_FV_VS2<string opcodestr, bits<6> funct6, bits<5> vs1> {

+ def "" : VALUVs2<funct6, vs1, OPFVV, opcodestr>,

+ Sched<[WriteVFNCvtFToIV, ReadVFNCvtFToIV, ReadVMask]>;

+multiclass VNCVTF_FV_VS2<string opcodestr, bits<6> funct6, bits<5> vs1> {

+ def "" : VALUVs2<funct6, vs1, OPFVV, opcodestr>,

+ Sched<[WriteVFNCvtFToFV, ReadVFNCvtFToFV, ReadVMask]>;

+multiclass VRED_MV_V<string opcodestr, bits<6> funct6> {

+ def _VS : VALUVV<funct6, OPMVV, opcodestr # ".vs">,

+ Sched<[WriteVIRedV, ReadVIRedV, ReadVIRedV0, ReadVMask]>;

+multiclass VWRED_IV_V<string opcodestr, bits<6> funct6> {

+ def _VS : VALUVV<funct6, OPIVV, opcodestr # ".vs">,

+ Sched<[WriteVIWRedV, ReadVIWRedV, ReadVIWRedV0, ReadVMask]>;

+multiclass VRED_FV_V<string opcodestr, bits<6> funct6> {

+ def _VS : VALUVV<funct6, OPFVV, opcodestr # ".vs">,

+ Sched<[WriteVFRedV, ReadVFRedV, ReadVFRedV0, ReadVMask]>;

+multiclass VREDO_FV_V<string opcodestr, bits<6> funct6> {

+ def _VS : VALUVV<funct6, OPFVV, opcodestr # ".vs">,

+ Sched<[WriteVFRedOV, ReadVFRedOV, ReadVFRedOV0, ReadVMask]>;

+multiclass VWRED_FV_V<string opcodestr, bits<6> funct6> {

+ def _VS : VALUVV<funct6, OPFVV, opcodestr # ".vs">,

+ Sched<[WriteVFWRedV, ReadVFWRedV, ReadVFWRedV0, ReadVMask]>;

+multiclass VWREDO_FV_V<string opcodestr, bits<6> funct6> {

+ def _VS : VALUVV<funct6, OPFVV, opcodestr # ".vs">,

+ Sched<[WriteVFWRedOV, ReadVFWRedOV, ReadVFWRedOV0, ReadVMask]>;

}

-multiclass VALUr_FV_V_F<string opcodestr, bits<6> funct6, string vw = "v"> {

- def V : VALUrVV<funct6, OPFVV, opcodestr # "." # vw # "v">;

- def F : VALUrVF<funct6, OPFVF, opcodestr # "." # vw # "f">;

+multiclass VMALU_MV_Mask<string opcodestr, bits<6> funct6, string vm = "v"> {

+ def M : VALUVVNoVm<funct6, OPMVV, opcodestr # "." # vm # "m">,

+ Sched<[WriteVMALUV, ReadVMALUV, ReadVMALUV]>;

}

-multiclass VALU_FV_V<string opcodestr, bits<6> funct6> {

- def _VS : VALUVV<funct6, OPFVV, opcodestr # ".vs">;

+multiclass VMSFS_MV_V<string opcodestr, bits<6> funct6, bits<5> vs1> {

+ def "" : VALUVs2<funct6, vs1, OPMVV, opcodestr>,

+ Sched<[WriteVMSFSV, ReadVMSFSV, ReadVMask]>;

}

-multiclass VALU_FV_VS2<string opcodestr, bits<6> funct6, bits<5> vs1> {

- def "" : VALUVs2<funct6, vs1, OPFVV, opcodestr>;

+multiclass VMIOT_MV_V<string opcodestr, bits<6> funct6, bits<5> vs1> {

+ def "" : VALUVs2<funct6, vs1, OPMVV, opcodestr>,

+ Sched<[WriteVMIotV, ReadVMIotV, ReadVMask]>;

+multiclass VSHT_IV_V_X_I<string opcodestr, bits<6> funct6, Operand optype = simm5, string vw = "v"> {

+ def V : VALUVV<funct6, OPIVV, opcodestr # "." # vw # "v">,

+ Sched<[WriteVShiftV, ReadVShiftV, ReadVShiftV, ReadVMask]>;

+ def X : VALUVX<funct6, OPIVX, opcodestr # "." # vw # "x">,

+ Sched<[WriteVShiftX, ReadVShiftV, ReadVShiftX, ReadVMask]>;

+ def I : VALUVI<funct6, opcodestr # "." # vw # "i", optype>,

+ Sched<[WriteVShiftI, ReadVShiftV, ReadVMask]>;

+multiclass VNSHT_IV_V_X_I<string opcodestr, bits<6> funct6, Operand optype = simm5, string vw = "v"> {

+ def V : VALUVV<funct6, OPIVV, opcodestr # "." # vw # "v">,

+ Sched<[WriteVNShiftV, ReadVNShiftV, ReadVNShiftV, ReadVMask]>;

+ def X : VALUVX<funct6, OPIVX, opcodestr # "." # vw # "x">,

+ Sched<[WriteVNShiftX, ReadVNShiftV, ReadVNShiftX, ReadVMask]>;

+ def I : VALUVI<funct6, opcodestr # "." # vw # "i", optype>,

+ Sched<[WriteVNShiftI, ReadVNShiftV, ReadVMask]>;

+multiclass VCMP_IV_V_X_I<string opcodestr, bits<6> funct6, Operand optype = simm5, string vw = "v"> {

+ def V : VALUVV<funct6, OPIVV, opcodestr # "." # vw # "v">,

+ Sched<[WriteVICmpV, ReadVICmpV, ReadVICmpV, ReadVMask]>;

+ def X : VALUVX<funct6, OPIVX, opcodestr # "." # vw # "x">,

+ Sched<[WriteVICmpX, ReadVICmpV, ReadVICmpX, ReadVMask]>;

+ def I : VALUVI<funct6, opcodestr # "." # vw # "i", optype>,

+ Sched<[WriteVICmpI, ReadVICmpV, ReadVMask]>;

+multiclass VCMP_IV_X_I<string opcodestr, bits<6> funct6, Operand optype = simm5, string vw = "v"> {

+ def X : VALUVX<funct6, OPIVX, opcodestr # "." # vw # "x">,

+ Sched<[WriteVICmpV, ReadVICmpV, ReadVICmpX, ReadVMask]>;

+ def I : VALUVI<funct6, opcodestr # "." # vw # "i", optype>,

+ Sched<[WriteVICmpI, ReadVICmpV, ReadVMask]>;

+multiclass VCMP_IV_V_X<string opcodestr, bits<6> funct6, Operand optype = simm5, string vw = "v"> {

+ def V : VALUVV<funct6, OPIVV, opcodestr # "." # vw # "v">,

+ Sched<[WriteVICmpV, ReadVICmpV, ReadVICmpV, ReadVMask]>;

+ def X : VALUVX<funct6, OPIVX, opcodestr # "." # vw # "x">,

+ Sched<[WriteVICmpX, ReadVICmpV, ReadVICmpX, ReadVMask]>;

+multiclass VMUL_MV_V_X<string opcodestr, bits<6> funct6, string vw = "v"> {

+ def V : VALUVV<funct6, OPMVV, opcodestr # "." # vw # "v">,

+ Sched<[WriteVIMulV, ReadVIMulV, ReadVIMulV, ReadVMask]>;

+ def X : VALUVX<funct6, OPMVX, opcodestr # "." # vw # "x">,

+ Sched<[WriteVIMulX, ReadVIMulV, ReadVIMulX, ReadVMask]>;

+multiclass VWMUL_MV_V_X<string opcodestr, bits<6> funct6, string vw = "v"> {

+ def V : VALUVV<funct6, OPMVV, opcodestr # "." # vw # "v">,

+ Sched<[WriteVIWMulV, ReadVIWMulV, ReadVIWMulV, ReadVMask]>;

+ def X : VALUVX<funct6, OPMVX, opcodestr # "." # vw # "x">,

+ Sched<[WriteVIWMulX, ReadVIWMulV, ReadVIWMulX, ReadVMask]>;

+multiclass VDIV_MV_V_X<string opcodestr, bits<6> funct6, string vw = "v"> {

+ def V : VALUVV<funct6, OPMVV, opcodestr # "." # vw # "v">,

+ Sched<[WriteVIDivV, ReadVIDivV, ReadVIDivV, ReadVMask]>;

+ def X : VALUVX<funct6, OPMVX, opcodestr # "." # vw # "x">,

+ Sched<[WriteVIDivX, ReadVIDivV, ReadVIDivX, ReadVMask]>;

+multiclass VSALU_IV_V_X_I<string opcodestr, bits<6> funct6, Operand optype = simm5, string vw = "v"> {

+ def V : VALUVV<funct6, OPIVV, opcodestr # "." # vw # "v">,

+ Sched<[WriteVSALUV, ReadVSALUV, ReadVSALUV, ReadVMask]>;

+ def X : VALUVX<funct6, OPIVX, opcodestr # "." # vw # "x">,

+ Sched<[WriteVSALUX, ReadVSALUV, ReadVSALUX, ReadVMask]>;

+ def I : VALUVI<funct6, opcodestr # "." # vw # "i", optype>,

+ Sched<[WriteVSALUI, ReadVSALUV, ReadVMask]>;

+multiclass VSALU_IV_V_X<string opcodestr, bits<6> funct6, string vw = "v"> {

+ def V : VALUVV<funct6, OPIVV, opcodestr # "." # vw # "v">,

+ Sched<[WriteVSALUV, ReadVSALUV, ReadVSALUV, ReadVMask]>;

+ def X : VALUVX<funct6, OPIVX, opcodestr # "." # vw # "x">,

+ Sched<[WriteVSALUX, ReadVSALUV, ReadVSALUX, ReadVMask]>;

+multiclass VAALU_MV_V_X<string opcodestr, bits<6> funct6, string vw = "v"> {

+ def V : VALUVV<funct6, OPMVV, opcodestr # "." # vw # "v">,

+ Sched<[WriteVAALUV, ReadVAALUV, ReadVAALUV, ReadVMask]>;

+ def X : VALUVX<funct6, OPMVX, opcodestr # "." # vw # "x">,

+ Sched<[WriteVAALUX, ReadVAALUV, ReadVAALUX, ReadVMask]>;

+multiclass VSMUL_IV_V_X<string opcodestr, bits<6> funct6, string vw = "v"> {

+ def V : VALUVV<funct6, OPIVV, opcodestr # "." # vw # "v">,

+ Sched<[WriteVSMulV, ReadVSMulV, ReadVSMulV, ReadVMask]>;

+ def X : VALUVX<funct6, OPIVX, opcodestr # "." # vw # "x">,

+ Sched<[WriteVSMulX, ReadVSMulV, ReadVSMulX, ReadVMask]>;

+multiclass VSSHF_IV_V_X_I<string opcodestr, bits<6> funct6, Operand optype = simm5, string vw = "v"> {

+ def V : VALUVV<funct6, OPIVV, opcodestr # "." # vw # "v">,

+ Sched<[WriteVSShiftV, ReadVSShiftV, ReadVSShiftV, ReadVMask]>;

+ def X : VALUVX<funct6, OPIVX, opcodestr # "." # vw # "x">,

+ Sched<[WriteVSShiftX, ReadVSShiftV, ReadVSShiftX, ReadVMask]>;

+ def I : VALUVI<funct6, opcodestr # "." # vw # "i", optype>,

+ Sched<[WriteVSShiftI, ReadVSShiftV, ReadVMask]>;

+multiclass VNCLP_IV_V_X_I<string opcodestr, bits<6> funct6, Operand optype = simm5, string vw = "v"> {

+ def V : VALUVV<funct6, OPIVV, opcodestr # "." # vw # "v">,

+ Sched<[WriteVNClipV, ReadVNClipV, ReadVNClipV, ReadVMask]>;

+ def X : VALUVX<funct6, OPIVX, opcodestr # "." # vw # "x">,

+ Sched<[WriteVNClipX, ReadVNClipV, ReadVNClipX, ReadVMask]>;

+ def I : VALUVI<funct6, opcodestr # "." # vw # "i", optype>,

+ Sched<[WriteVNClipI, ReadVNClipV, ReadVMask]>;

+multiclass VSLD_IV_X_I<string opcodestr, bits<6> funct6, Operand optype = simm5, string vw = "v"> {

+ def X : VALUVX<funct6, OPIVX, opcodestr # "." # vw # "x">,

+ Sched<[WriteVISlideX, ReadVISlideV, ReadVISlideX, ReadVMask]>;

+ def I : VALUVI<funct6, opcodestr # "." # vw # "i", optype>,

+ Sched<[WriteVISlideI, ReadVISlideV, ReadVMask]>;

+multiclass VSLD1_MV_X<string opcodestr, bits<6> funct6, string vw = "v"> {

+ def X : VALUVX<funct6, OPMVX, opcodestr # "." # vw # "x">,

+ Sched<[WriteVISlide1X, ReadVISlideV, ReadVISlideX, ReadVMask]>;

+multiclass VSLD1_FV_F<string opcodestr, bits<6> funct6, string vw = "v"> {

+ def F : VALUVF<funct6, OPFVF, opcodestr # "." # vw # "f">,

+ Sched<[WriteVFSlide1F, ReadVFSlideV, ReadVFSlideF, ReadVMask]>;

+multiclass VGTR_IV_V_X_I<string opcodestr, bits<6> funct6, Operand optype = simm5, string vw = "v"> {

+ def V : VALUVV<funct6, OPIVV, opcodestr # "." # vw # "v">,

+ Sched<[WriteVGatherV, ReadVGatherV, ReadVGatherV, ReadVMask]>;

+ def X : VALUVX<funct6, OPIVX, opcodestr # "." # vw # "x">,

+ Sched<[WriteVGatherX, ReadVGatherV, ReadVGatherX, ReadVMask]>;

+ def I : VALUVI<funct6, opcodestr # "." # vw # "i", optype>,

+ Sched<[WriteVGatherI, ReadVGatherV, ReadVMask]>;

+multiclass VCPR_MV_Mask<string opcodestr, bits<6> funct6, string vm = "v"> {

+ def M : VALUVVNoVm<funct6, OPMVV, opcodestr # "." # vm # "m">,

+ Sched<[WriteVCompressV, ReadVCompressV, ReadVCompressV]>;

}

multiclass VAMO<RISCVAMOOP amoop, RISCVWidth width, string opcodestr> {

@@ -435,11 +779,48 @@ multiclass VAMO<RISCVAMOOP amoop, RISCVWidth width, string opcodestr> {

def _UNWD : VAMONoWd<amoop, width, opcodestr>;

}

-multiclass VWholeLoad<bits<3> nf, string opcodestr, RegisterClass VRC> {

- def E8_V : VWholeLoad<nf, LSWidth8, opcodestr # "e8.v", VRC>;

- def E16_V : VWholeLoad<nf, LSWidth16, opcodestr # "e16.v", VRC>;

- def E32_V : VWholeLoad<nf, LSWidth32, opcodestr # "e32.v", VRC>;

- def E64_V : VWholeLoad<nf, LSWidth64, opcodestr # "e64.v", VRC>;

+multiclass VWholeLoad1<string opcodestr, RegisterClass VRC> {

+ def E8_V : VWholeLoad<0, LSWidth8, opcodestr # "e8.v", VRC>,

+ Sched<[WriteVLD1R8, ReadVLDX]>;

+ def E16_V : VWholeLoad<0, LSWidth16, opcodestr # "e16.v", VRC>,

+ Sched<[WriteVLD1R16, ReadVLDX]>;

+ def E32_V : VWholeLoad<0, LSWidth32, opcodestr # "e32.v", VRC>,

+ Sched<[WriteVLD1R32, ReadVLDX]>;

+ def E64_V : VWholeLoad<0, LSWidth64, opcodestr # "e64.v", VRC>,

+ Sched<[WriteVLD1R64, ReadVLDX]>;

+multiclass VWholeLoad2<string opcodestr, RegisterClass VRC> {

+ def E8_V : VWholeLoad<1, LSWidth8, opcodestr # "e8.v", VRC>,

+ Sched<[WriteVLD2R8, ReadVLDX]>;

+ def E16_V : VWholeLoad<1, LSWidth16, opcodestr # "e16.v", VRC>,

+ Sched<[WriteVLD2R16, ReadVLDX]>;

+ def E32_V : VWholeLoad<1, LSWidth32, opcodestr # "e32.v", VRC>,

+ Sched<[WriteVLD2R32, ReadVLDX]>;

+ def E64_V : VWholeLoad<1, LSWidth64, opcodestr # "e64.v", VRC>,

+ Sched<[WriteVLD2R64, ReadVLDX]>;

+multiclass VWholeLoad4<string opcodestr, RegisterClass VRC> {

+ def E8_V : VWholeLoad<3, LSWidth8, opcodestr # "e8.v", VRC>,

+ Sched<[WriteVLD4R8, ReadVLDX]>;

+ def E16_V : VWholeLoad<3, LSWidth16, opcodestr # "e16.v", VRC>,

+ Sched<[WriteVLD4R16, ReadVLDX]>;

+ def E32_V : VWholeLoad<3, LSWidth32, opcodestr # "e32.v", VRC>,

+ Sched<[WriteVLD4R32, ReadVLDX]>;

+ def E64_V : VWholeLoad<3, LSWidth64, opcodestr # "e64.v", VRC>,

+ Sched<[WriteVLD1R64, ReadVLDX]>;

+multiclass VWholeLoad8<string opcodestr, RegisterClass VRC> {

+ def E8_V : VWholeLoad<7, LSWidth8, opcodestr # "e8.v", VRC>,

+ Sched<[WriteVLD8R8, ReadVLDX]>;

+ def E16_V : VWholeLoad<7, LSWidth16, opcodestr # "e16.v", VRC>,

+ Sched<[WriteVLD8R16, ReadVLDX]>;

+ def E32_V : VWholeLoad<7, LSWidth32, opcodestr # "e32.v", VRC>,

+ Sched<[WriteVLD8R32, ReadVLDX]>;

+ def E64_V : VWholeLoad<7, LSWidth64, opcodestr # "e64.v", VRC>,

+ Sched<[WriteVLD8R64, ReadVLDX]>;

}

//===----------------------------------------------------------------------===//

@@ -459,69 +840,94 @@ def VSETVL : RVInstSetVL<(outs GPR:$rd), (ins GPR:$rs1, GPR:$rs2),

} // hasSideEffects = 1, mayLoad = 0, mayStore = 0

// Vector Unit-Stride Instructions

-def VLE8_V : VUnitStrideLoad<LUMOPUnitStride, LSWidth8, "vle8.v">;

-def VLE16_V : VUnitStrideLoad<LUMOPUnitStride, LSWidth16, "vle16.v">;

-def VLE32_V : VUnitStrideLoad<LUMOPUnitStride, LSWidth32, "vle32.v">;

-def VLE64_V : VUnitStrideLoad<LUMOPUnitStride, LSWidth64, "vle64.v">;

-def VLE8FF_V : VUnitStrideLoad<LUMOPUnitStrideFF, LSWidth8, "vle8ff.v">;

-def VLE16FF_V : VUnitStrideLoad<LUMOPUnitStrideFF, LSWidth16, "vle16ff.v">;

-def VLE32FF_V : VUnitStrideLoad<LUMOPUnitStrideFF, LSWidth32, "vle32ff.v">;

-def VLE64FF_V : VUnitStrideLoad<LUMOPUnitStrideFF, LSWidth64, "vle64ff.v">;

-def VLE1_V : VUnitStrideLoadMask<"vle1.v">;

-def VSE1_V : VUnitStrideStoreMask<"vse1.v">;

-def VSE8_V : VUnitStrideStore<SUMOPUnitStride, LSWidth8, "vse8.v">;

-def VSE16_V : VUnitStrideStore<SUMOPUnitStride, LSWidth16, "vse16.v">;

-def VSE32_V : VUnitStrideStore<SUMOPUnitStride, LSWidth32, "vse32.v">;

-def VSE64_V : VUnitStrideStore<SUMOPUnitStride, LSWidth64, "vse64.v">;

+def VLE8_V : VUnitStrideLoad<LUMOPUnitStride, LSWidth8, "vle8.v">,

+ VLESched<8>;

+def VLE16_V : VUnitStrideLoad<LUMOPUnitStride, LSWidth16, "vle16.v">,

+ VLESched<16>;

+def VLE32_V : VUnitStrideLoad<LUMOPUnitStride, LSWidth32, "vle32.v">,

+ VLESched<32>;

+def VLE64_V : VUnitStrideLoad<LUMOPUnitStride, LSWidth64, "vle64.v">,

+ VLESched<64>;

+def VLE8FF_V : VUnitStrideLoad<LUMOPUnitStrideFF, LSWidth8, "vle8ff.v">,

+ VLFSched<8>;

+def VLE16FF_V : VUnitStrideLoad<LUMOPUnitStrideFF, LSWidth16, "vle16ff.v">,

+ VLFSched<16>;

+def VLE32FF_V : VUnitStrideLoad<LUMOPUnitStrideFF, LSWidth32, "vle32ff.v">,

+ VLFSched<32>;

+def VLE64FF_V : VUnitStrideLoad<LUMOPUnitStrideFF, LSWidth64, "vle64ff.v">,

+ VLFSched<64>;

+def VLE1_V : VUnitStrideLoadMask<"vle1.v">,

+ Sched<[WriteVLDM, ReadVLDX]>;

+def VSE1_V : VUnitStrideStoreMask<"vse1.v">,

+ Sched<[WriteVSTM, ReadVSTM, ReadVSTX]>;

+def VSE8_V : VUnitStrideStore<SUMOPUnitStride, LSWidth8, "vse8.v">,

+ VSESched<8>;

+def VSE16_V : VUnitStrideStore<SUMOPUnitStride, LSWidth16, "vse16.v">,

+ VSESched<16>;

+def VSE32_V : VUnitStrideStore<SUMOPUnitStride, LSWidth32, "vse32.v">,

+ VSESched<32>;

+def VSE64_V : VUnitStrideStore<SUMOPUnitStride, LSWidth64, "vse64.v">,

+ VSESched<64>;

// Vector Strided Instructions

-def VLSE8_V : VStridedLoad<LSWidth8, "vlse8.v">;

-def VLSE16_V : VStridedLoad<LSWidth16, "vlse16.v">;

-def VLSE32_V : VStridedLoad<LSWidth32, "vlse32.v">;

-def VLSE64_V : VStridedLoad<LSWidth64, "vlse64.v">;

-def VSSE8_V : VStridedStore<LSWidth8, "vsse8.v">;

-def VSSE16_V : VStridedStore<LSWidth16, "vsse16.v">;

-def VSSE32_V : VStridedStore<LSWidth32, "vsse32.v">;

-def VSSE64_V : VStridedStore<LSWidth64, "vsse64.v">;

+def VLSE8_V : VStridedLoad<LSWidth8, "vlse8.v">,

+ VLSSched<8>;

+def VLSE16_V : VStridedLoad<LSWidth16, "vlse16.v">,

+ VLSSched<16>;

+def VLSE32_V : VStridedLoad<LSWidth32, "vlse32.v">,

+ VLSSched<32>;

+def VLSE64_V : VStridedLoad<LSWidth64, "vlse64.v">,

+ VLSSched<32>;

+def VSSE8_V : VStridedStore<LSWidth8, "vsse8.v">,

+ VSSSched<8>;

+def VSSE16_V : VStridedStore<LSWidth16, "vsse16.v">,

+ VSSSched<16>;

+def VSSE32_V : VStridedStore<LSWidth32, "vsse32.v">,

+ VSSSched<32>;

+def VSSE64_V : VStridedStore<LSWidth64, "vsse64.v">,

+ VSSSched<64>;

// Vector Indexed Instructions

-def VLUXEI8_V : VIndexedLoad<MOPLDIndexedUnord, LSWidth8, "vluxei8.v">;

-def VLUXEI16_V : VIndexedLoad<MOPLDIndexedUnord, LSWidth16, "vluxei16.v">;

-def VLUXEI32_V : VIndexedLoad<MOPLDIndexedUnord, LSWidth32, "vluxei32.v">;

-def VLUXEI64_V : VIndexedLoad<MOPLDIndexedUnord, LSWidth64, "vluxei64.v">;

-def VLOXEI8_V : VIndexedLoad<MOPLDIndexedOrder, LSWidth8, "vloxei8.v">;

-def VLOXEI16_V : VIndexedLoad<MOPLDIndexedOrder, LSWidth16, "vloxei16.v">;

-def VLOXEI32_V : VIndexedLoad<MOPLDIndexedOrder, LSWidth32, "vloxei32.v">;

-def VLOXEI64_V : VIndexedLoad<MOPLDIndexedOrder, LSWidth64, "vloxei64.v">;

-def VSUXEI8_V : VIndexedStore<MOPSTIndexedUnord, LSWidth8, "vsuxei8.v">;

-def VSUXEI16_V : VIndexedStore<MOPSTIndexedUnord, LSWidth16, "vsuxei16.v">;

-def VSUXEI32_V : VIndexedStore<MOPSTIndexedUnord, LSWidth32, "vsuxei32.v">;

-def VSUXEI64_V : VIndexedStore<MOPSTIndexedUnord, LSWidth64, "vsuxei64.v">;

-def VSOXEI8_V : VIndexedStore<MOPSTIndexedOrder, LSWidth8, "vsoxei8.v">;

-def VSOXEI16_V : VIndexedStore<MOPSTIndexedOrder, LSWidth16, "vsoxei16.v">;

-def VSOXEI32_V : VIndexedStore<MOPSTIndexedOrder, LSWidth32, "vsoxei32.v">;

-def VSOXEI64_V : VIndexedStore<MOPSTIndexedOrder, LSWidth64, "vsoxei64.v">;

-defm VL1R : VWholeLoad<0, "vl1r", VR>;

-defm VL2R : VWholeLoad<1, "vl2r", VRM2>;

-defm VL4R : VWholeLoad<3, "vl4r", VRM4>;

-defm VL8R : VWholeLoad<7, "vl8r", VRM8>;

+// Indexed loads/stores: for each width n, define the unordered and ordered
+// load (VLUXEI/VLOXEI) and store (VSUXEI/VSOXEI), each paired with the
+// VLXSched/VSXSched class for that width and ordering ("U" or "O").
+foreach n = [8, 16, 32, 64] in {

+defvar w = !cast<RISCVWidth>("LSWidth" # n);

+def VLUXEI # n # _V :

+ VIndexedLoad<MOPLDIndexedUnord, w, "vluxei" # n # ".v">,

+ VLXSched<n, "U">;

+def VLOXEI # n # _V :

+ VIndexedLoad<MOPLDIndexedOrder, w, "vloxei" # n # ".v">,

+ VLXSched<n, "O">;

+def VSUXEI # n # _V :

+ VIndexedStore<MOPSTIndexedUnord, w, "vsuxei" # n # ".v">,

+ VSXSched<n, "U">;

+def VSOXEI # n # _V :

+ VIndexedStore<MOPSTIndexedOrder, w, "vsoxei" # n # ".v">,

+ VSXSched<n, "O">;

+}

+defm VL1R : VWholeLoad1<"vl1r", VR>;

+defm VL2R : VWholeLoad2<"vl2r", VRM2>;

+defm VL4R : VWholeLoad4<"vl4r", VRM4>;

+defm VL8R : VWholeLoad8<"vl8r", VRM8>;

def : InstAlias<"vl1r.v $vd, (${rs1})", (VL1RE8_V VR:$vd, GPR:$rs1)>;

def : InstAlias<"vl2r.v $vd, (${rs1})", (VL2RE8_V VRM2:$vd, GPR:$rs1)>;

def : InstAlias<"vl4r.v $vd, (${rs1})", (VL4RE8_V VRM4:$vd, GPR:$rs1)>;

def : InstAlias<"vl8r.v $vd, (${rs1})", (VL8RE8_V VRM8:$vd, GPR:$rs1)>;

-def VS1R_V : VWholeStore<0, "vs1r.v", VR>;

-def VS2R_V : VWholeStore<1, "vs2r.v", VRM2>;

-def VS4R_V : VWholeStore<3, "vs4r.v", VRM4>;

-def VS8R_V : VWholeStore<7, "vs8r.v", VRM8>;

+def VS1R_V : VWholeStore<0, "vs1r.v", VR>,

+ Sched<[WriteVST1R, ReadVST1R, ReadVSTX]>;

+def VS2R_V : VWholeStore<1, "vs2r.v", VRM2>,

+ Sched<[WriteVST2R, ReadVST2R, ReadVSTX]>;

+def VS4R_V : VWholeStore<3, "vs4r.v", VRM4>,

+ Sched<[WriteVST4R, ReadVST4R, ReadVSTX]>;

+def VS8R_V : VWholeStore<7, "vs8r.v", VRM8>,

+ Sched<[WriteVST8R, ReadVST8R, ReadVSTX]>;

// Vector Single-Width Integer Add and Subtract

defm VADD_V : VALU_IV_V_X_I<"vadd", 0b000000>;

@@ -588,9 +994,9 @@ def : InstAlias<"vnot.v $vd, $vs$vm",

(VXOR_VI VR:$vd, VR:$vs, -1, VMaskOp:$vm)>;

// Vector Single-Width Bit Shift Instructions

-defm VSLL_V : VALU_IV_V_X_I<"vsll", 0b100101, uimm5>;

-defm VSRL_V : VALU_IV_V_X_I<"vsrl", 0b101000, uimm5>;

-defm VSRA_V : VALU_IV_V_X_I<"vsra", 0b101001, uimm5>;

+defm VSLL_V : VSHT_IV_V_X_I<"vsll", 0b100101, uimm5>;

+defm VSRL_V : VSHT_IV_V_X_I<"vsrl", 0b101000, uimm5>;

+defm VSRA_V : VSHT_IV_V_X_I<"vsra", 0b101001, uimm5>;

// Vector Narrowing Integer Right Shift Instructions

// Refer to 11.3. Narrowing Vector Arithmetic Instructions

@@ -598,8 +1004,8 @@ defm VSRA_V : VALU_IV_V_X_I<"vsra", 0b101001, uimm5>;

// vector register group (specified by vs2). The destination vector register

// group cannot overlap the mask register if used, unless LMUL=1.

let Constraints = "@earlyclobber $vd" in {

-defm VNSRL_W : VALU_IV_V_X_I<"vnsrl", 0b101100, uimm5, "w">;

-defm VNSRA_W : VALU_IV_V_X_I<"vnsra", 0b101101, uimm5, "w">;

+defm VNSRL_W : VNSHT_IV_V_X_I<"vnsrl", 0b101100, uimm5, "w">;

+defm VNSRA_W : VNSHT_IV_V_X_I<"vnsra", 0b101101, uimm5, "w">;

} // Constraints = "@earlyclobber $vd"

def : InstAlias<"vncvt.x.x.w $vd, $vs$vm",

@@ -607,14 +1013,14 @@ def : InstAlias<"vncvt.x.x.w $vd, $vs$vm",

// Vector Integer Comparison Instructions

let RVVConstraint = NoConstraint in {

-defm VMSEQ_V : VALU_IV_V_X_I<"vmseq", 0b011000>;

-defm VMSNE_V : VALU_IV_V_X_I<"vmsne", 0b011001>;

-defm VMSLTU_V : VALU_IV_V_X<"vmsltu", 0b011010>;

-defm VMSLT_V : VALU_IV_V_X<"vmslt", 0b011011>;

-defm VMSLEU_V : VALU_IV_V_X_I<"vmsleu", 0b011100>;

-defm VMSLE_V : VALU_IV_V_X_I<"vmsle", 0b011101>;

-defm VMSGTU_V : VALU_IV_X_I<"vmsgtu", 0b011110>;

-defm VMSGT_V : VALU_IV_X_I<"vmsgt", 0b011111>;

+defm VMSEQ_V : VCMP_IV_V_X_I<"vmseq", 0b011000>;

+defm VMSNE_V : VCMP_IV_V_X_I<"vmsne", 0b011001>;

+defm VMSLTU_V : VCMP_IV_V_X<"vmsltu", 0b011010>;

+defm VMSLT_V : VCMP_IV_V_X<"vmslt", 0b011011>;

+defm VMSLEU_V : VCMP_IV_V_X_I<"vmsleu", 0b011100>;

+defm VMSLE_V : VCMP_IV_V_X_I<"vmsle", 0b011101>;

+defm VMSGTU_V : VCMP_IV_X_I<"vmsgtu", 0b011110>;

+defm VMSGT_V : VCMP_IV_X_I<"vmsgt", 0b011111>;

} // RVVConstraint = NoConstraint

def : InstAlias<"vmsgtu.vv $vd, $va, $vb$vm",

@@ -672,84 +1078,87 @@ def PseudoVMSGE_VX_M_T : Pseudo<(outs VR:$vd, VRNoV0:$scratch),

}

// Vector Integer Min/Max Instructions

-defm VMINU_V : VALU_IV_V_X<"vminu", 0b000100>;

-defm VMIN_V : VALU_IV_V_X<"vmin", 0b000101>;

-defm VMAXU_V : VALU_IV_V_X<"vmaxu", 0b000110>;

-defm VMAX_V : VALU_IV_V_X<"vmax", 0b000111>;

+defm VMINU_V : VCMP_IV_V_X<"vminu", 0b000100>;

+defm VMIN_V : VCMP_IV_V_X<"vmin", 0b000101>;

+defm VMAXU_V : VCMP_IV_V_X<"vmaxu", 0b000110>;

+defm VMAX_V : VCMP_IV_V_X<"vmax", 0b000111>;

// Vector Single-Width Integer Multiply Instructions

-defm VMUL_V : VALU_MV_V_X<"vmul", 0b100101>;

-defm VMULH_V : VALU_MV_V_X<"vmulh", 0b100111>;

-defm VMULHU_V : VALU_MV_V_X<"vmulhu", 0b100100>;

-defm VMULHSU_V : VALU_MV_V_X<"vmulhsu", 0b100110>;

+defm VMUL_V : VMUL_MV_V_X<"vmul", 0b100101>;

+defm VMULH_V : VMUL_MV_V_X<"vmulh", 0b100111>;

+defm VMULHU_V : VMUL_MV_V_X<"vmulhu", 0b100100>;

+defm VMULHSU_V : VMUL_MV_V_X<"vmulhsu", 0b100110>;

// Vector Integer Divide Instructions

-defm VDIVU_V : VALU_MV_V_X<"vdivu", 0b100000>;

-defm VDIV_V : VALU_MV_V_X<"vdiv", 0b100001>;

-defm VREMU_V : VALU_MV_V_X<"vremu", 0b100010>;

-defm VREM_V : VALU_MV_V_X<"vrem", 0b100011>;

+defm VDIVU_V : VDIV_MV_V_X<"vdivu", 0b100000>;

+defm VDIV_V : VDIV_MV_V_X<"vdiv", 0b100001>;

+defm VREMU_V : VDIV_MV_V_X<"vremu", 0b100010>;

+defm VREM_V : VDIV_MV_V_X<"vrem", 0b100011>;

// Vector Widening Integer Multiply Instructions

let Constraints = "@earlyclobber $vd", RVVConstraint = WidenV in {

-defm VWMUL_V : VALU_MV_V_X<"vwmul", 0b111011>;

-defm VWMULU_V : VALU_MV_V_X<"vwmulu", 0b111000>;

-defm VWMULSU_V : VALU_MV_V_X<"vwmulsu", 0b111010>;

+defm VWMUL_V : VWMUL_MV_V_X<"vwmul", 0b111011>;

+defm VWMULU_V : VWMUL_MV_V_X<"vwmulu", 0b111000>;

+defm VWMULSU_V : VWMUL_MV_V_X<"vwmulsu", 0b111010>;

} // Constraints = "@earlyclobber $vd", RVVConstraint = WidenV

// Vector Single-Width Integer Multiply-Add Instructions

-defm VMACC_V : VALUr_MV_V_X<"vmacc", 0b101101>;

-defm VNMSAC_V : VALUr_MV_V_X<"vnmsac", 0b101111>;

-defm VMADD_V : VALUr_MV_V_X<"vmadd", 0b101001>;

-defm VNMSUB_V : VALUr_MV_V_X<"vnmsub", 0b101011>;

+defm VMACC_V : VMAC_MV_V_X<"vmacc", 0b101101>;

+defm VNMSAC_V : VMAC_MV_V_X<"vnmsac", 0b101111>;

+defm VMADD_V : VMAC_MV_V_X<"vmadd", 0b101001>;

+defm VNMSUB_V : VMAC_MV_V_X<"vnmsub", 0b101011>;

// Vector Widening Integer Multiply-Add Instructions

let Constraints = "@earlyclobber $vd", RVVConstraint = WidenV in {

-defm VWMACCU_V : VALUr_MV_V_X<"vwmaccu", 0b111100>;

-defm VWMACC_V : VALUr_MV_V_X<"vwmacc", 0b111101>;

-defm VWMACCSU_V : VALUr_MV_V_X<"vwmaccsu", 0b111111>;

-defm VWMACCUS_V : VALUr_MV_X<"vwmaccus", 0b111110>;

+defm VWMACCU_V : VWMAC_MV_V_X<"vwmaccu", 0b111100>;

+defm VWMACC_V : VWMAC_MV_V_X<"vwmacc", 0b111101>;

+defm VWMACCSU_V : VWMAC_MV_V_X<"vwmaccsu", 0b111111>;

+defm VWMACCUS_V : VWMAC_MV_X<"vwmaccus", 0b111110>;

} // Constraints = "@earlyclobber $vd", RVVConstraint = WidenV

// Vector Integer Merge Instructions

-defm VMERGE_V : VALUm_IV_V_X_I<"vmerge", 0b010111>;

+defm VMERGE_V : VMRG_IV_V_X_I<"vmerge", 0b010111>;

// Vector Integer Move Instructions

let hasSideEffects = 0, mayLoad = 0, mayStore = 0, vs2 = 0, vm = 1,

RVVConstraint = NoConstraint in {

// op vd, vs1

def VMV_V_V : RVInstVV<0b010111, OPIVV, (outs VR:$vd),

- (ins VR:$vs1), "vmv.v.v", "$vd, $vs1">;

+ (ins VR:$vs1), "vmv.v.v", "$vd, $vs1">,

+ Sched<[WriteVIMovV, ReadVIMovV]>;

// op vd, rs1

def VMV_V_X : RVInstVX<0b010111, OPIVX, (outs VR:$vd),

- (ins GPR:$rs1), "vmv.v.x", "$vd, $rs1">;

+ (ins GPR:$rs1), "vmv.v.x", "$vd, $rs1">,

+ Sched<[WriteVIMovX, ReadVIMovX]>;

// op vd, imm

def VMV_V_I : RVInstIVI<0b010111, (outs VR:$vd),

- (ins simm5:$imm), "vmv.v.i", "$vd, $imm">;

+ (ins simm5:$imm), "vmv.v.i", "$vd, $imm">,

+ Sched<[WriteVIMovI]>;

} // hasSideEffects = 0, mayLoad = 0, mayStore = 0

// Vector Fixed-Point Arithmetic Instructions

-defm VSADDU_V : VALU_IV_V_X_I<"vsaddu", 0b100000>;

-defm VSADD_V : VALU_IV_V_X_I<"vsadd", 0b100001>;

-defm VSSUBU_V : VALU_IV_V_X<"vssubu", 0b100010>;

-defm VSSUB_V : VALU_IV_V_X<"vssub", 0b100011>;

+defm VSADDU_V : VSALU_IV_V_X_I<"vsaddu", 0b100000>;

+defm VSADD_V : VSALU_IV_V_X_I<"vsadd", 0b100001>;

+defm VSSUBU_V : VSALU_IV_V_X<"vssubu", 0b100010>;

+defm VSSUB_V : VSALU_IV_V_X<"vssub", 0b100011>;

// Vector Single-Width Averaging Add and Subtract

-defm VAADDU_V : VALU_MV_V_X<"vaaddu", 0b001000>;

-defm VAADD_V : VALU_MV_V_X<"vaadd", 0b001001>;

-defm VASUBU_V : VALU_MV_V_X<"vasubu", 0b001010>;

-defm VASUB_V : VALU_MV_V_X<"vasub", 0b001011>;

+defm VAADDU_V : VAALU_MV_V_X<"vaaddu", 0b001000>;

+defm VAADD_V : VAALU_MV_V_X<"vaadd", 0b001001>;

+defm VASUBU_V : VAALU_MV_V_X<"vasubu", 0b001010>;

+defm VASUB_V : VAALU_MV_V_X<"vasub", 0b001011>;

// Vector Single-Width Fractional Multiply with Rounding and Saturation

-defm VSMUL_V : VALU_IV_V_X<"vsmul", 0b100111>;

+defm VSMUL_V : VSMUL_IV_V_X<"vsmul", 0b100111>;

// Vector Single-Width Scaling Shift Instructions

-defm VSSRL_V : VALU_IV_V_X_I<"vssrl", 0b101010, uimm5>;

-defm VSSRA_V : VALU_IV_V_X_I<"vssra", 0b101011, uimm5>;

+defm VSSRL_V : VSSHF_IV_V_X_I<"vssrl", 0b101010, uimm5>;

+defm VSSRA_V : VSSHF_IV_V_X_I<"vssra", 0b101011, uimm5>;

// Vector Narrowing Fixed-Point Clip Instructions

let Constraints = "@earlyclobber $vd" in {

-defm VNCLIPU_W : VALU_IV_V_X_I<"vnclipu", 0b101110, uimm5, "w">;

-defm VNCLIP_W : VALU_IV_V_X_I<"vnclip", 0b101111, uimm5, "w">;

+defm VNCLIPU_W : VNCLP_IV_V_X_I<"vnclipu", 0b101110, uimm5, "w">;

+defm VNCLIP_W : VNCLP_IV_V_X_I<"vnclip", 0b101111, uimm5, "w">;

} // Constraints = "@earlyclobber $vd"

} // Predicates = [HasStdExtV]

@@ -762,60 +1171,60 @@ defm VFRSUB_V : VALU_FV_F<"vfrsub", 0b100111>;

// Vector Widening Floating-Point Add/Subtract Instructions

let Constraints = "@earlyclobber $vd" in {

let RVVConstraint = WidenV in {

-defm VFWADD_V : VALU_FV_V_F<"vfwadd", 0b110000>;

-defm VFWSUB_V : VALU_FV_V_F<"vfwsub", 0b110010>;

+defm VFWADD_V : VWALU_FV_V_F<"vfwadd", 0b110000>;

+defm VFWSUB_V : VWALU_FV_V_F<"vfwsub", 0b110010>;

} // RVVConstraint = WidenV

// Set earlyclobber for following instructions for second and mask operands.

// This has the downside that the earlyclobber constraint is too coarse and

// will impose unnecessary restrictions by not allowing the destination to

// overlap with the first (wide) operand.

let RVVConstraint = WidenW in {

-defm VFWADD_W : VALU_FV_V_F<"vfwadd", 0b110100, "w">;

-defm VFWSUB_W : VALU_FV_V_F<"vfwsub", 0b110110, "w">;

+defm VFWADD_W : VWALU_FV_V_F<"vfwadd", 0b110100, "w">;

+defm VFWSUB_W : VWALU_FV_V_F<"vfwsub", 0b110110, "w">;

} // RVVConstraint = WidenW

} // Constraints = "@earlyclobber $vd"

// Vector Single-Width Floating-Point Multiply/Divide Instructions

-defm VFMUL_V : VALU_FV_V_F<"vfmul", 0b100100>;

-defm VFDIV_V : VALU_FV_V_F<"vfdiv", 0b100000>;

-defm VFRDIV_V : VALU_FV_F<"vfrdiv", 0b100001>;

+defm VFMUL_V : VMUL_FV_V_F<"vfmul", 0b100100>;

+defm VFDIV_V : VDIV_FV_V_F<"vfdiv", 0b100000>;

+defm VFRDIV_V : VRDIV_FV_F<"vfrdiv", 0b100001>;

// Vector Widening Floating-Point Multiply

let Constraints = "@earlyclobber $vd", RVVConstraint = WidenV in {

-defm VFWMUL_V : VALU_FV_V_F<"vfwmul", 0b111000>;

+defm VFWMUL_V : VWMUL_FV_V_F<"vfwmul", 0b111000>;

} // Constraints = "@earlyclobber $vd", RVVConstraint = WidenV

// Vector Single-Width Floating-Point Fused Multiply-Add Instructions

-defm VFMACC_V : VALUr_FV_V_F<"vfmacc", 0b101100>;

-defm VFNMACC_V : VALUr_FV_V_F<"vfnmacc", 0b101101>;

-defm VFMSAC_V : VALUr_FV_V_F<"vfmsac", 0b101110>;

-defm VFNMSAC_V : VALUr_FV_V_F<"vfnmsac", 0b101111>;

-defm VFMADD_V : VALUr_FV_V_F<"vfmadd", 0b101000>;

-defm VFNMADD_V : VALUr_FV_V_F<"vfnmadd", 0b101001>;

-defm VFMSUB_V : VALUr_FV_V_F<"vfmsub", 0b101010>;

-defm VFNMSUB_V : VALUr_FV_V_F<"vfnmsub", 0b101011>;

+defm VFMACC_V : VMAC_FV_V_F<"vfmacc", 0b101100>;

+defm VFNMACC_V : VMAC_FV_V_F<"vfnmacc", 0b101101>;

+defm VFMSAC_V : VMAC_FV_V_F<"vfmsac", 0b101110>;

+defm VFNMSAC_V : VMAC_FV_V_F<"vfnmsac", 0b101111>;

+defm VFMADD_V : VMAC_FV_V_F<"vfmadd", 0b101000>;

+defm VFNMADD_V : VMAC_FV_V_F<"vfnmadd", 0b101001>;

+defm VFMSUB_V : VMAC_FV_V_F<"vfmsub", 0b101010>;

+defm VFNMSUB_V : VMAC_FV_V_F<"vfnmsub", 0b101011>;

// Vector Widening Floating-Point Fused Multiply-Add Instructions

let Constraints = "@earlyclobber $vd", RVVConstraint = WidenV in {

-defm VFWMACC_V : VALUr_FV_V_F<"vfwmacc", 0b111100>;

-defm VFWNMACC_V : VALUr_FV_V_F<"vfwnmacc", 0b111101>;

-defm VFWMSAC_V : VALUr_FV_V_F<"vfwmsac", 0b111110>;

-defm VFWNMSAC_V : VALUr_FV_V_F<"vfwnmsac", 0b111111>;

+defm VFWMACC_V : VWMAC_FV_V_F<"vfwmacc", 0b111100>;

+defm VFWNMACC_V : VWMAC_FV_V_F<"vfwnmacc", 0b111101>;

+defm VFWMSAC_V : VWMAC_FV_V_F<"vfwmsac", 0b111110>;

+defm VFWNMSAC_V : VWMAC_FV_V_F<"vfwnmsac", 0b111111>;

} // Constraints = "@earlyclobber $vd", RVVConstraint = WidenV

// Vector Floating-Point Square-Root Instruction

-defm VFSQRT_V : VALU_FV_VS2<"vfsqrt.v", 0b010011, 0b00000>;

-defm VFRSQRT7_V : VALU_FV_VS2<"vfrsqrt7.v", 0b010011, 0b00100>;

-defm VFREC7_V : VALU_FV_VS2<"vfrec7.v", 0b010011, 0b00101>;

+defm VFSQRT_V : VSQR_FV_VS2<"vfsqrt.v", 0b010011, 0b00000>;

+defm VFRSQRT7_V : VRCP_FV_VS2<"vfrsqrt7.v", 0b010011, 0b00100>;

+defm VFREC7_V : VRCP_FV_VS2<"vfrec7.v", 0b010011, 0b00101>;

// Vector Floating-Point MIN/MAX Instructions

-defm VFMIN_V : VALU_FV_V_F<"vfmin", 0b000100>;

-defm VFMAX_V : VALU_FV_V_F<"vfmax", 0b000110>;

+defm VFMIN_V : VCMP_FV_V_F<"vfmin", 0b000100>;

+defm VFMAX_V : VCMP_FV_V_F<"vfmax", 0b000110>;

// Vector Floating-Point Sign-Injection Instructions

-defm VFSGNJ_V : VALU_FV_V_F<"vfsgnj", 0b001000>;

-defm VFSGNJN_V : VALU_FV_V_F<"vfsgnjn", 0b001001>;

-defm VFSGNJX_V : VALU_FV_V_F<"vfsgnjx", 0b001010>;

+defm VFSGNJ_V : VSGNJ_FV_V_F<"vfsgnj", 0b001000>;

+defm VFSGNJN_V : VSGNJ_FV_V_F<"vfsgnjn", 0b001001>;

+defm VFSGNJX_V : VSGNJ_FV_V_F<"vfsgnjx", 0b001010>;

def : InstAlias<"vfneg.v $vd, $vs$vm",

(VFSGNJN_VV VR:$vd, VR:$vs, VR:$vs, VMaskOp:$vm)>;

@@ -824,12 +1233,12 @@ def : InstAlias<"vfabs.v $vd, $vs$vm",

// Vector Floating-Point Compare Instructions

let RVVConstraint = NoConstraint in {

-defm VMFEQ_V : VALU_FV_V_F<"vmfeq", 0b011000>;

-defm VMFNE_V : VALU_FV_V_F<"vmfne", 0b011100>;

-defm VMFLT_V : VALU_FV_V_F<"vmflt", 0b011011>;

-defm VMFLE_V : VALU_FV_V_F<"vmfle", 0b011001>;

-defm VMFGT_V : VALU_FV_F<"vmfgt", 0b011101>;

-defm VMFGE_V : VALU_FV_F<"vmfge", 0b011111>;

+defm VMFEQ_V : VCMP_FV_V_F<"vmfeq", 0b011000>;

+defm VMFNE_V : VCMP_FV_V_F<"vmfne", 0b011100>;

+defm VMFLT_V : VCMP_FV_V_F<"vmflt", 0b011011>;

+defm VMFLE_V : VCMP_FV_V_F<"vmfle", 0b011001>;

+defm VMFGT_V : VCMP_FV_F<"vmfgt", 0b011101>;

+defm VMFGE_V : VCMP_FV_F<"vmfge", 0b011111>;

} // RVVConstraint = NoConstraint

def : InstAlias<"vmfgt.vv $vd, $va, $vb$vm",

@@ -838,68 +1247,70 @@ def : InstAlias<"vmfge.vv $vd, $va, $vb$vm",

(VMFLE_VV VR:$vd, VR:$vb, VR:$va, VMaskOp:$vm), 0>;

// Vector Floating-Point Classify Instruction

-defm VFCLASS_V : VALU_FV_VS2<"vfclass.v", 0b010011, 0b10000>;

+defm VFCLASS_V : VCLS_FV_VS2<"vfclass.v", 0b010011, 0b10000>;

let hasSideEffects = 0, mayLoad = 0, mayStore = 0 in {

// Vector Floating-Point Merge Instruction

+let vm = 0 in

def VFMERGE_VFM : RVInstVX<0b010111, OPFVF, (outs VR:$vd),

(ins VR:$vs2, FPR32:$rs1, VMV0:$v0),

- "vfmerge.vfm", "$vd, $vs2, $rs1, v0"> {

- let vm = 0;

+ "vfmerge.vfm", "$vd, $vs2, $rs1, v0">,

+ Sched<[WriteVFMergeV, ReadVFMergeV, ReadVFMergeF, ReadVMask]>;

// Vector Floating-Point Move Instruction

let RVVConstraint = NoConstraint in

+let vm = 1, vs2 = 0 in

def VFMV_V_F : RVInstVX<0b010111, OPFVF, (outs VR:$vd),

- (ins FPR32:$rs1), "vfmv.v.f", "$vd, $rs1"> {

- let vs2 = 0;

- let vm = 1;

+ (ins FPR32:$rs1), "vfmv.v.f", "$vd, $rs1">,

+ Sched<[WriteVFMovV, ReadVFMovF]>;

} // hasSideEffects = 0, mayLoad = 0, mayStore = 0

// Single-Width Floating-Point/Integer Type-Convert Instructions

-defm VFCVT_XU_F_V : VALU_FV_VS2<"vfcvt.xu.f.v", 0b010010, 0b00000>;

-defm VFCVT_X_F_V : VALU_FV_VS2<"vfcvt.x.f.v", 0b010010, 0b00001>;

-defm VFCVT_RTZ_XU_F_V : VALU_FV_VS2<"vfcvt.rtz.xu.f.v", 0b010010, 0b00110>;

-defm VFCVT_RTZ_X_F_V : VALU_FV_VS2<"vfcvt.rtz.x.f.v", 0b010010, 0b00111>;

-defm VFCVT_F_XU_V : VALU_FV_VS2<"vfcvt.f.xu.v", 0b010010, 0b00010>;

-defm VFCVT_F_X_V : VALU_FV_VS2<"vfcvt.f.x.v", 0b010010, 0b00011>;

+defm VFCVT_XU_F_V : VCVTI_FV_VS2<"vfcvt.xu.f.v", 0b010010, 0b00000>;

+defm VFCVT_X_F_V : VCVTI_FV_VS2<"vfcvt.x.f.v", 0b010010, 0b00001>;

+defm VFCVT_RTZ_XU_F_V : VCVTI_FV_VS2<"vfcvt.rtz.xu.f.v", 0b010010, 0b00110>;

+defm VFCVT_RTZ_X_F_V : VCVTI_FV_VS2<"vfcvt.rtz.x.f.v", 0b010010, 0b00111>;

+defm VFCVT_F_XU_V : VCVTF_IV_VS2<"vfcvt.f.xu.v", 0b010010, 0b00010>;

+defm VFCVT_F_X_V : VCVTF_IV_VS2<"vfcvt.f.x.v", 0b010010, 0b00011>;

// Widening Floating-Point/Integer Type-Convert Instructions

let Constraints = "@earlyclobber $vd", RVVConstraint = WidenCvt in {

-defm VFWCVT_XU_F_V : VALU_FV_VS2<"vfwcvt.xu.f.v", 0b010010, 0b01000>;

-defm VFWCVT_X_F_V : VALU_FV_VS2<"vfwcvt.x.f.v", 0b010010, 0b01001>;

-defm VFWCVT_RTZ_XU_F_V : VALU_FV_VS2<"vfwcvt.rtz.xu.f.v", 0b010010, 0b01110>;

-defm VFWCVT_RTZ_X_F_V : VALU_FV_VS2<"vfwcvt.rtz.x.f.v", 0b010010, 0b01111>;

-defm VFWCVT_F_XU_V : VALU_FV_VS2<"vfwcvt.f.xu.v", 0b010010, 0b01010>;

-defm VFWCVT_F_X_V : VALU_FV_VS2<"vfwcvt.f.x.v", 0b010010, 0b01011>;

-defm VFWCVT_F_F_V : VALU_FV_VS2<"vfwcvt.f.f.v", 0b010010, 0b01100>;

+defm VFWCVT_XU_F_V : VWCVTI_FV_VS2<"vfwcvt.xu.f.v", 0b010010, 0b01000>;

+defm VFWCVT_X_F_V : VWCVTI_FV_VS2<"vfwcvt.x.f.v", 0b010010, 0b01001>;

+defm VFWCVT_RTZ_XU_F_V : VWCVTI_FV_VS2<"vfwcvt.rtz.xu.f.v", 0b010010, 0b01110>;

+defm VFWCVT_RTZ_X_F_V : VWCVTI_FV_VS2<"vfwcvt.rtz.x.f.v", 0b010010, 0b01111>;

+defm VFWCVT_F_XU_V : VWCVTF_IV_VS2<"vfwcvt.f.xu.v", 0b010010, 0b01010>;

+defm VFWCVT_F_X_V : VWCVTF_IV_VS2<"vfwcvt.f.x.v", 0b010010, 0b01011>;

+defm VFWCVT_F_F_V : VWCVTF_FV_VS2<"vfwcvt.f.f.v", 0b010010, 0b01100>;

} // Constraints = "@earlyclobber $vd", RVVConstraint = WidenCvt

// Narrowing Floating-Point/Integer Type-Convert Instructions

let Constraints = "@earlyclobber $vd" in {

-defm VFNCVT_XU_F_W : VALU_FV_VS2<"vfncvt.xu.f.w", 0b010010, 0b10000>;

-defm VFNCVT_X_F_W : VALU_FV_VS2<"vfncvt.x.f.w", 0b010010, 0b10001>;

-defm VFNCVT_RTZ_XU_F_W : VALU_FV_VS2<"vfncvt.rtz.xu.f.w", 0b010010, 0b10110>;

-defm VFNCVT_RTZ_X_F_W : VALU_FV_VS2<"vfncvt.rtz.x.f.w", 0b010010, 0b10111>;

-defm VFNCVT_F_XU_W : VALU_FV_VS2<"vfncvt.f.xu.w", 0b010010, 0b10010>;

-defm VFNCVT_F_X_W : VALU_FV_VS2<"vfncvt.f.x.w", 0b010010, 0b10011>;

-defm VFNCVT_F_F_W : VALU_FV_VS2<"vfncvt.f.f.w", 0b010010, 0b10100>;

-defm VFNCVT_ROD_F_F_W : VALU_FV_VS2<"vfncvt.rod.f.f.w", 0b010010, 0b10101>;

+defm VFNCVT_XU_F_W : VNCVTI_FV_VS2<"vfncvt.xu.f.w", 0b010010, 0b10000>;

+defm VFNCVT_X_F_W : VNCVTI_FV_VS2<"vfncvt.x.f.w", 0b010010, 0b10001>;

+defm VFNCVT_RTZ_XU_F_W : VNCVTI_FV_VS2<"vfncvt.rtz.xu.f.w", 0b010010, 0b10110>;

+defm VFNCVT_RTZ_X_F_W : VNCVTI_FV_VS2<"vfncvt.rtz.x.f.w", 0b010010, 0b10111>;

+defm VFNCVT_F_XU_W : VNCVTF_IV_VS2<"vfncvt.f.xu.w", 0b010010, 0b10010>;

+defm VFNCVT_F_X_W : VNCVTF_IV_VS2<"vfncvt.f.x.w", 0b010010, 0b10011>;

+defm VFNCVT_F_F_W : VNCVTF_FV_VS2<"vfncvt.f.f.w", 0b010010, 0b10100>;

+defm VFNCVT_ROD_F_F_W : VNCVTF_FV_VS2<"vfncvt.rod.f.f.w", 0b010010, 0b10101>;

} // Constraints = "@earlyclobber $vd"

} // Predicates = [HasStdExtV, HasStdExtF]

let Predicates = [HasStdExtV] in {

// Vector Single-Width Integer Reduction Instructions

let RVVConstraint = NoConstraint in {

-defm VREDSUM : VALU_MV_V<"vredsum", 0b000000>;

-defm VREDMAXU : VALU_MV_V<"vredmaxu", 0b000110>;

-defm VREDMAX : VALU_MV_V<"vredmax", 0b000111>;

-defm VREDMINU : VALU_MV_V<"vredminu", 0b000100>;

-defm VREDMIN : VALU_MV_V<"vredmin", 0b000101>;

-defm VREDAND : VALU_MV_V<"vredand", 0b000001>;

-defm VREDOR : VALU_MV_V<"vredor", 0b000010>;

-defm VREDXOR : VALU_MV_V<"vredxor", 0b000011>;

+defm VREDSUM : VRED_MV_V<"vredsum", 0b000000>;

+defm VREDMAXU : VRED_MV_V<"vredmaxu", 0b000110>;

+defm VREDMAX : VRED_MV_V<"vredmax", 0b000111>;

+defm VREDMINU : VRED_MV_V<"vredminu", 0b000100>;

+defm VREDMIN : VRED_MV_V<"vredmin", 0b000101>;

+defm VREDAND : VRED_MV_V<"vredand", 0b000001>;

+defm VREDOR : VRED_MV_V<"vredor", 0b000010>;

+defm VREDXOR : VRED_MV_V<"vredxor", 0b000011>;

} // RVVConstraint = NoConstraint

// Vector Widening Integer Reduction Instructions

@@ -908,18 +1319,19 @@ let Constraints = "@earlyclobber $vd", RVVConstraint = NoConstraint in {

// This has the downside that the earlyclobber constraint is too coarse and

// will impose unnecessary restrictions by not allowing the destination to

// overlap with the first (wide) operand.

-defm VWREDSUMU : VALU_IV_V<"vwredsumu", 0b110000>;

-defm VWREDSUM : VALU_IV_V<"vwredsum", 0b110001>;

+defm VWREDSUMU : VWRED_IV_V<"vwredsumu", 0b110000>;

+defm VWREDSUM : VWRED_IV_V<"vwredsum", 0b110001>;

} // Constraints = "@earlyclobber $vd", RVVConstraint = NoConstraint

} // Predicates = [HasStdExtV]

let Predicates = [HasStdExtV, HasStdExtF] in {

// Vector Single-Width Floating-Point Reduction Instructions

let RVVConstraint = NoConstraint in {

-defm VFREDOSUM : VALU_FV_V<"vfredosum", 0b000011>;

-defm VFREDSUM : VALU_FV_V<"vfredsum", 0b000001>;

-defm VFREDMAX : VALU_FV_V<"vfredmax", 0b000111>;

-defm VFREDMIN : VALU_FV_V<"vfredmin", 0b000101>;

+defm VFREDOSUM : VREDO_FV_V<"vfredosum", 0b000011>;

+defm VFREDSUM : VRED_FV_V<"vfredsum", 0b000001>;

+defm VFREDMAX : VRED_FV_V<"vfredmax", 0b000111>;

+defm VFREDMIN : VRED_FV_V<"vfredmin", 0b000101>;

} // RVVConstraint = NoConstraint

// Vector Widening Floating-Point Reduction Instructions

@@ -928,22 +1340,22 @@ let Constraints = "@earlyclobber $vd", RVVConstraint = NoConstraint in {

// This has the downside that the earlyclobber constraint is too coarse and

// will impose unnecessary restrictions by not allowing the destination to

// overlap with the first (wide) operand.

-defm VFWREDOSUM : VALU_FV_V<"vfwredosum", 0b110011>;

-defm VFWREDSUM : VALU_FV_V<"vfwredsum", 0b110001>;

+defm VFWREDOSUM : VWREDO_FV_V<"vfwredosum", 0b110011>;

+defm VFWREDSUM : VWRED_FV_V<"vfwredsum", 0b110001>;

} // Constraints = "@earlyclobber $vd", RVVConstraint = NoConstraint

} // Predicates = [HasStdExtV, HasStdExtF]

let Predicates = [HasStdExtV] in {

// Vector Mask-Register Logical Instructions

let RVVConstraint = NoConstraint in {

-defm VMAND_M : VALU_MV_Mask<"vmand", 0b011001, "m">;

-defm VMNAND_M : VALU_MV_Mask<"vmnand", 0b011101, "m">;

-defm VMANDNOT_M : VALU_MV_Mask<"vmandnot", 0b011000, "m">;

-defm VMXOR_M : VALU_MV_Mask<"vmxor", 0b011011, "m">;

-defm VMOR_M : VALU_MV_Mask<"vmor", 0b011010, "m">;

-defm VMNOR_M : VALU_MV_Mask<"vmnor", 0b011110, "m">;

-defm VMORNOT_M : VALU_MV_Mask<"vmornot", 0b011100, "m">;

-defm VMXNOR_M : VALU_MV_Mask<"vmxnor", 0b011111, "m">;

+defm VMAND_M : VMALU_MV_Mask<"vmand", 0b011001, "m">;

+defm VMNAND_M : VMALU_MV_Mask<"vmnand", 0b011101, "m">;

+defm VMANDNOT_M : VMALU_MV_Mask<"vmandnot", 0b011000, "m">;

+defm VMXOR_M : VMALU_MV_Mask<"vmxor", 0b011011, "m">;

+defm VMOR_M : VMALU_MV_Mask<"vmor", 0b011010, "m">;

+defm VMNOR_M : VMALU_MV_Mask<"vmnor", 0b011110, "m">;

+defm VMORNOT_M : VMALU_MV_Mask<"vmornot", 0b011100, "m">;

+defm VMXNOR_M : VMALU_MV_Mask<"vmxnor", 0b011111, "m">;

}

def : InstAlias<"vmmv.m $vd, $vs",

@@ -957,98 +1369,113 @@ def : InstAlias<"vmnot.m $vd, $vs",

let hasSideEffects = 0, mayLoad = 0, mayStore = 0,

RVVConstraint = NoConstraint in {

// Vector mask population count vpopc

def VPOPC_M : RVInstV<0b010000, 0b10000, OPMVV, (outs GPR:$vd),

- (ins VR:$vs2, VMaskOp:$vm),

- "vpopc.m", "$vd, $vs2$vm">;

+ (ins VR:$vs2, VMaskOp:$vm),

+ "vpopc.m", "$vd, $vs2$vm">,

+ Sched<[WriteVMPopV, ReadVMPopV, ReadVMask]>;

// vfirst find-first-set mask bit

def VFIRST_M : RVInstV<0b010000, 0b10001, OPMVV, (outs GPR:$vd),

- (ins VR:$vs2, VMaskOp:$vm),

- "vfirst.m", "$vd, $vs2$vm">;

+ (ins VR:$vs2, VMaskOp:$vm),

+ "vfirst.m", "$vd, $vs2$vm">,

+ Sched<[WriteVMFFSV, ReadVMFFSV, ReadVMask]>;

} // hasSideEffects = 0, mayLoad = 0, mayStore = 0

let Constraints = "@earlyclobber $vd", RVVConstraint = Iota in {

// vmsbf.m set-before-first mask bit

-defm VMSBF_M : VALU_MV_VS2<"vmsbf.m", 0b010100, 0b00001>;

+defm VMSBF_M : VMSFS_MV_V<"vmsbf.m", 0b010100, 0b00001>;

// vmsif.m set-including-first mask bit

-defm VMSIF_M : VALU_MV_VS2<"vmsif.m", 0b010100, 0b00011>;

+defm VMSIF_M : VMSFS_MV_V<"vmsif.m", 0b010100, 0b00011>;

// vmsof.m set-only-first mask bit

-defm VMSOF_M : VALU_MV_VS2<"vmsof.m", 0b010100, 0b00010>;

+defm VMSOF_M : VMSFS_MV_V<"vmsof.m", 0b010100, 0b00010>;

// Vector Iota Instruction

-defm VIOTA_M : VALU_MV_VS2<"viota.m", 0b010100, 0b10000>;

+defm VIOTA_M : VMIOT_MV_V<"viota.m", 0b010100, 0b10000>;

} // Constraints = "@earlyclobber $vd", RVVConstraint = Iota

// Vector Element Index Instruction

let hasSideEffects = 0, mayLoad = 0, mayStore = 0 in {

+let vs2 = 0 in

def VID_V : RVInstV<0b010100, 0b10001, OPMVV, (outs VR:$vd),

- (ins VMaskOp:$vm), "vid.v", "$vd$vm"> {

- let vs2 = 0;

+ (ins VMaskOp:$vm), "vid.v", "$vd$vm">,

+ Sched<[WriteVMIdxV, ReadVMask]>;

// Integer Scalar Move Instructions

let vm = 1, RVVConstraint = NoConstraint in {

def VMV_X_S : RVInstV<0b010000, 0b00000, OPMVV, (outs GPR:$vd),

- (ins VR:$vs2), "vmv.x.s", "$vd, $vs2">;

+ (ins VR:$vs2), "vmv.x.s", "$vd, $vs2">,

+ Sched<[WriteVIMovVX, ReadVIMovVX]>;

let Constraints = "$vd = $vd_wb" in

def VMV_S_X : RVInstV2<0b010000, 0b00000, OPMVX, (outs VR:$vd_wb),

- (ins VR:$vd, GPR:$rs1), "vmv.s.x", "$vd, $rs1">;

+ (ins VR:$vd, GPR:$rs1), "vmv.s.x", "$vd, $rs1">,

+ Sched<[WriteVIMovXV, ReadVIMovXV, ReadVIMovXX]>;

}

} // hasSideEffects = 0, mayLoad = 0, mayStore = 0

} // Predicates = [HasStdExtV]

let Predicates = [HasStdExtV, HasStdExtF] in {

let hasSideEffects = 0, mayLoad = 0, mayStore = 0, vm = 1,

RVVConstraint = NoConstraint in {

// Floating-Point Scalar Move Instructions

def VFMV_F_S : RVInstV<0b010000, 0b00000, OPFVV, (outs FPR32:$vd),

- (ins VR:$vs2), "vfmv.f.s", "$vd, $vs2">;

+ (ins VR:$vs2), "vfmv.f.s", "$vd, $vs2">,

+ Sched<[WriteVFMovVF, ReadVFMovVF]>;

let Constraints = "$vd = $vd_wb" in

def VFMV_S_F : RVInstV2<0b010000, 0b00000, OPFVF, (outs VR:$vd_wb),

- (ins VR:$vd, FPR32:$rs1), "vfmv.s.f", "$vd, $rs1">;

+ (ins VR:$vd, FPR32:$rs1), "vfmv.s.f", "$vd, $rs1">,

+ Sched<[WriteVFMovFV, ReadVFMovFV, ReadVFMovFX]>;

} // hasSideEffects = 0, mayLoad = 0, mayStore = 0, vm = 1

} // Predicates = [HasStdExtV, HasStdExtF]

let Predicates = [HasStdExtV] in {

// Vector Slide Instructions

let Constraints = "@earlyclobber $vd", RVVConstraint = SlideUp in {

-defm VSLIDEUP_V : VALU_IV_X_I<"vslideup", 0b001110, uimm5>;

-defm VSLIDE1UP_V : VALU_MV_X<"vslide1up", 0b001110>;

+defm VSLIDEUP_V : VSLD_IV_X_I<"vslideup", 0b001110, uimm5>;

+defm VSLIDE1UP_V : VSLD1_MV_X<"vslide1up", 0b001110>;

} // Constraints = "@earlyclobber $vd", RVVConstraint = SlideUp

-defm VSLIDEDOWN_V : VALU_IV_X_I<"vslidedown", 0b001111, uimm5>;

-defm VSLIDE1DOWN_V : VALU_MV_X<"vslide1down", 0b001111>;

+defm VSLIDEDOWN_V : VSLD_IV_X_I<"vslidedown", 0b001111, uimm5>;

+defm VSLIDE1DOWN_V : VSLD1_MV_X<"vslide1down", 0b001111>;

} // Predicates = [HasStdExtV]

let Predicates = [HasStdExtV, HasStdExtF] in {

let Constraints = "@earlyclobber $vd", RVVConstraint = SlideUp in {

-defm VFSLIDE1UP_V : VALU_FV_F<"vfslide1up", 0b001110>;

+defm VFSLIDE1UP_V : VSLD1_FV_F<"vfslide1up", 0b001110>;

} // Constraints = "@earlyclobber $vd", RVVConstraint = SlideUp

-defm VFSLIDE1DOWN_V : VALU_FV_F<"vfslide1down", 0b001111>;

+defm VFSLIDE1DOWN_V : VSLD1_FV_F<"vfslide1down", 0b001111>;

} // Predicates = [HasStdExtV, HasStdExtF]

let Predicates = [HasStdExtV] in {

// Vector Register Gather Instruction

let Constraints = "@earlyclobber $vd", RVVConstraint = Vrgather in {

-defm VRGATHER_V : VALU_IV_V_X_I<"vrgather", 0b001100, uimm5>;

-def VRGATHEREI16_VV : VALUVV<0b001110, OPIVV, "vrgatherei16.vv">;

+defm VRGATHER_V : VGTR_IV_V_X_I<"vrgather", 0b001100, uimm5>;

+def VRGATHEREI16_VV : VALUVV<0b001110, OPIVV, "vrgatherei16.vv">,

+ Sched<[WriteVGatherV, ReadVGatherV, ReadVGatherV]>;

} // Constraints = "@earlyclobber $vd", RVVConstraint = Vrgather

// Vector Compress Instruction

let Constraints = "@earlyclobber $vd", RVVConstraint = Vcompress in {

-defm VCOMPRESS_V : VALU_MV_Mask<"vcompress", 0b010111>;

+defm VCOMPRESS_V : VCPR_MV_Mask<"vcompress", 0b010111>;

} // Constraints = "@earlyclobber $vd", RVVConstraint = Vcompress

let hasSideEffects = 0, mayLoad = 0, mayStore = 0,

RVVConstraint = NoConstraint in {

-foreach nf = [1, 2, 4, 8] in {

- def VMV#nf#R_V : RVInstV<0b100111, !add(nf, -1), OPIVI, (outs VR:$vd),

- (ins VR:$vs2), "vmv" # nf # "r.v",

- "$vd, $vs2"> {

- let Uses = [];

- let vm = 1;

- }

+foreach n = [1, 2, 4, 8] in {

+ def VMV#n#R_V : RVInstV<0b100111, !add(n, -1), OPIVI, (outs VR:$vd),

+ (ins VR:$vs2), "vmv" # n # "r.v", "$vd, $vs2">,

+ VMVRSched<n> {

+ let Uses = [];

+ let vm = 1;

}

} // hasSideEffects = 0, mayLoad = 0, mayStore = 0

} // Predicates = [HasStdExtV]