blob: d4c36b99726caf4fab89f16bf8fc632ff7d07c1c [file] [log] [blame]
`include "rvv_define.svh"
//
// IF stage, RVS to Command Queue
//
typedef struct packed {
logic [`VTYPE_VILL-1:0] vill, // 0:not illegal, 1:illegal
logic [`VTYPE_VMA-1:0] vma, // 0:inactive element undisturbed, 1:inactive element agnostic
logic [`VTYPE_VTA-1:0] vta, // 0:tail undisturbed, 1:tail agnostic
logic [`VTYPE_VSEW-1:0] vsew, // support: 000:SEW8, 001:SEW16, 010:SEW32
logic [`VTYPE_VLMUL-1:0] vlmul // support: 110:LMUL1/4, 111:LMUL1/2, 000:LMUL1, 001:LMUL2, 010:LMUL4, 011:LMUL8
} VTYPE_t;
typedef struct packed {
logic [`VCSR_VXRM-1:0] vxrm,
logic [`VCSR_VXSAT-1:0] vxsat
} VCSR_t;
typedef struct packed {
logic [`VSTART_WIDTH-1:0] vstart,
logic [`VL_WIDTH-1:0] vl,
VTYPE_t vtype,
VCSR_t vcsr
} VECTOR_CSR_t;
typedef struct packed {
logic [`PC_WIDTH-1:0] insts_pc,
logic [`INST_WIDTH-1:0] insts,
VECTOR_CSR_t vector_csr,
logic [`XLEN-1:0] rs1_data
} INST_t;
//
// DE stage, Uops Queue to Dispatch unit
//
// It is used to distinguish which execute units that VVV/VVX/VX uop is dispatch to, based on inst_encoding[6:0]
typedef enum logic [2:0] {
ALU,
PMT,
RDT,
MUL,
MAC,
LSU
} EXE_UNIT_e;
// when EXE_UNIT_e is not LSU, it is used to distinguish arithmetic instructions, based on inst_encoding[14:12]
typedef enum logic [2:0] {
OPIVV, // vs2, vs1, vd.
OPFVV, // vs2, vs1, vd/rd. float, not support
OPMVV, // vs2, vs1, vd/rd.
OPIVI, // vs2, imm[4:0], vd.
OPIVX, // vs2, rs1, vd.
OPFVF, // vs2, rs1, vd. float, not support
OPMVX, // vs2, rs1, vd/rd.
OPCFG // vset* instructions
} EXE_FUNCT3_e;
// when EXE_UNIT_e is not LSU, it identifys what instruction, vadd or vmacc or ..? based on inst_encoding[31:26]
typedef enum logic [5:0] {
VADD = 6'b000_000,
VSUB = 6'b000_010,
VRSUB = 6'b000_011,
VMINU = 6'b000_100,
VMIN = 6'b000_101,
VMAXU = 6'b000_110,
VMAXU = 6'b000_111,
VAND = 6'b001_001,
VOR = 6'b001_010,
VXOR = 6'b001_011,
VRGATHER = 6'b001_100,
VSLIDEUP = 6'b001_110,
VRGATHEREI16 = 6'b001_110,
VSLIDEDOWN = 6'b001_111,
VADC = 6'b010_000,
VMADC = 6'b010_001,
VSBC = 6'b010_010,
VMSBC = 6'b010_011,
VMERGE_VMV = 6'b010_111, // it could be vmerge or vmv, based on vm field
VMSEQ = 6'b011_000,
VMSNE = 6'b011_001,
VMSLTU = 6'b011_010,
VMSLT = 6'b011_011,
VMSLEU = 6'b011_100,
VMSLE = 6'b011_101,
VMSGTU = 6'b011_110,
VMSGT = 6'b011_111,
VSADDU = 6'b100_000,
VSADD = 6'b100_001,
VSSUBU = 6'b100_010,
VSSUB = 6'b100_011,
VSLL = 6'b100_101,
VSMUL_VMVNRR = 6'b100_111, // it could be vsmul or vmv<nr>r, based on vm field
VSRL = 6'b101_000,
VSRA = 6'b101_001,
VSSRL = 6'b101_010,
VSSRA = 6'b101_011,
VNSRL = 6'b101_100,
VNSRA = 6'b101_101,
VNCLIPU = 6'b101_110,
VNCLIP = 6'b101_111,
VWREDSUMU = 6'b110_000,
VWREDSUM = 6'b110_001
} OPI_TYPE_e;
typedef enum logic [5:0] {
VREDSUM = 6'b000_000,
VREDAND = 6'b000_001,
VREDOR = 6'b000_010,
VREDXOR = 6'b000_011,
VREDMINU = 6'b000_100,
VREDMIN = 6'b000_101,
VREDMAXU = 6'b000_110,
VREDMAX = 6'b000_111,
VAADDU = 6'b001_000,
VAADD = 6'b001_001,
VASUBU = 6'b001_010,
VASUB = 6'b001_011,
VSLIDE1UP = 6'b001_110,
VSLIDE1DOWN = 6'b001_111,
VWXUNARY0 = 6'b010_000, // it could be vcpop.m, vfirst.m and vmv. They can be distinguished by vs1 field(inst_encoding[19:15]).
VXUNARY0 = 6'b010_010, // it could be vzext.vf2, vzext.vf4, vsext.vf2, vsext.vf4. They can be distinguished by vs1 field(inst_encoding[19:15]).
VMUNARY0 = 6'b010_100, // it could be vmsbf, vmsof, vmsif, viota, vid. They can be distinguished by vs1 field(inst_encoding[19:15]).
VCOMPRESS = 6'b010_111,
VMANDN = 6'b011_000,
VMAND = 6'b011_001,
VMOR = 6'b011_010,
VMXOR = 6'b011_011,
VMORN = 6'b011_100,
VMNAND = 6'b011_101,
VMNOR = 6'b011_110,
VMXNOR = 6'b011_111,
VDIVU = 6'b100_000,
VDIV = 6'b100_001,
VREMU = 6'b100_010,
VREM = 6'b100_011,
VMULHU = 6'b100_100,
VMUL = 6'b100_101,
VMULHSU = 6'b100_110,
VMULH = 6'b100_111,
VMADD = 6'b101_001,
VNMSUB = 6'b101_011,
VMACC = 6'b101_101,
VNMSAC = 6'b101_111,
VWADDU = 6'b110_000,
VWADD = 6'b110_001,
VWSUBU = 6'b110_010,
VWSUB = 6'b110_011,
VWADDU = 6'b110_100,
VWADD = 6'b110_101,
VWSUBU = 6'b110_110,
VWSUB = 6'b110_111,
VWMULU = 6'b111_000,
VWMULSU = 6'b111_010,
VWMUL = 6'b111_011,
VWMACCU = 6'b111_100,
VWMACC = 6'b111_101,
VWMACCUS = 6'b111_110,
VWMACCSU = 6'b111_111
} OPM_TYPE_e;
// when OPM_TYPE_e=vwxunary0, the uop could be vcpop.m, vfirst.m and vmv. They can be distinguished by vs1 field(inst_encoding[19:15]).
typedef enum logic [4:0] {
VMV_X_S = 5'b00000,
VCPOP = 5'b10000,
VFIRST = 5'b10001
} OPM_VWXUNARY0_e;
// when OPM_TYPE_e=vxunary0, the uop could be vzext.vf2, vzext.vf4, vsext.vf2, vsext.vf4. They can be distinguished by vs1 field(inst_encoding[19:15]).
typedef enum logic [4:0] {
VZEXT_VF4 = 5'b00100,
VSEXT_VF4 = 5'b00101,
VZEXT_VF2 = 5'b00110,
VSEXT_VF2 = 5'b00111
} OPM_VXUNARY0_e;
// when OPM_TYPE_e=vmxunary0, the uop could be vmsbf, vmsof, vmsif, viota, vid. They can be distinguished by vs1 field(inst_encoding[19:15]).
typedef enum logic [4:0] {
VMSBF = 5'b00001,
VMSOF = 5'b00010,
VMSIF = 5'b00011,
VIOTA = 5'b10000,
VID = 5'b10001
} OPM_VMXUNARY0_e;
// when EXE_UNIT_e is LSU, it identifys what LSU instruction, unit-stride load or indexed store or ..? based on inst_encoding[31:26]
typedef enum logic [1:0] {
US, // Unit-Stride
IU, // Indexed Unordered
CS, // Constant Stride
IO // Indexed Ordered
} LSU_MOP_e;
// It identifys what unit-stride instruction when LSU_MOP_e=US, based on inst_encoding[24:20]
typedef enum logic [1:0] {
US, // Unit-Stride load/store
WR, // Whole Register load/store
MK, // MasK load/store, EEW=8(inst_encoding[14:12]=3'b000)
FF // Faul-only-First load
} LSU_UMOP_e;
// It identifys what inst_encoding[11:7] is used for when LSU instruction, based on inst_encoding[5]
typedef enum logic [0] {
LOAD, // when load, inst_encoding[11:7] is seen as vs3
STORE // when load, inst_encoding[11:7] is seen as vd
} LSU_IS_STORE_e;
// combine those signals to LSU_TYPE
typedef struct packed {
logic rsv, // reserved
LSU_MOP_e lsu_mop,
LSU_UMOP_e lsu_umop,
LSU_IS_STORE_e lsu_is_store
} LSU_TYPE_t;
// function opcode
typedef union packed {
OPI_TYPE_e opi_funct,
OPM_TYPE_e opm_funct,
LSU_TYPE_t lsu_funct
} FUNCT6_u;
// vs1 field
typedef union packed {
OPM_VWXUNARY0_e vwxunary0_funct,
OPM_VXUNARY0_e vxunary0_funct,
OPM_VMXUNARY0_e vmxunary0_funct,
logic [`REGFILE_INDEX_WIDTH-1:0] vs1_index,
} VS1_u;
// uop classification used for dispatch rule
typedef enum logic [1:0] {
VVV, // this uop will use 2 read ports of VRF
VVX, // this uop will use 1 read ports of VRF
VX, // this uop will use 0 read ports of VRF
MACV // this uop will use 3 read ports of VRF
} UOP_CLASS_e;
// Effective Element Width
typedef enum logic [1:0] {
EEW1,
EEW8,
EEW16,
EEW32
} EEW_e;
// the uop struct stored in Uops Queue
typedef struct packed {
logic [`PC_WIDTH-1:0] uop_pc,
EXE_UNIT_e uop_exe_unit,
EXE_FUNCT3_e uop_funct3,
FUNCT6_u uop_funct6,
UOP_CLASS_e uop_class,
VECTOR_CSR_t vector_csr,
logic vm, // Original 32bit instruction encoding: insts[25]
logic [`REGFILE_INDEX_WIDTH-1:0] vd_index, // Original 32bit instruction encoding: insts[11:7].this index is also used as vs3 in some uops
EEW_e vd_eew,
logic vd_valid,
VS1_u vs1, // when vs1_valid=1, vs1 field is used as vs1_index to address VRF
EEW_e vs1_eew, // when vs1_valid=0, vs1 field is used to decode some OPMVV uops
logic vs1_valid,
logic [`REGFILE_INDEX_WIDTH-1:0] vs2_index, // Original 32bit instruction encoding: insts[24:20]
EEW_e vs2_eew,
logic vs2_valid,
logic [`REGFILE_INDEX_WIDTH-1:0] rd_index, // Original 32bit instruction encoding: insts[11:7].
logic rd_index_valid,
logic [`XLEN-1:0] rs1_data, // rs1_data could be from X[rs1] and imm(insts[19:15]). If it is imm, the 5-bit imm(insts[19:15]) will be sign-extend or zero-extend(shift instructions...) to XLEN-bit.
logic rs1_data_valid,
logic [`UOP_INDEX_WIDTH-1:0] uop_index, // used for calculate v0_start in DP stage
logic last_uop_valid // one instruction may be split to many uops, this signal is used to specify the last uop in those uops of one instruction.
} UOP_QUEUE_t;
//
// DP stage,
//
// specify whether the current byte belongs to 'prestart' or 'body-inactive' or 'body-active' or 'tail'
typedef enum logic [1:0] {
NOT_CHANGE, // the byte is not changed, which may belong to 'prestart' or superfluous element in widening/narrowing uop
BODY_INACTIVE, // body-inactive byte
BODY_ACTIVE, // body-active byte
TAIL // tail byte
} ELE_TYPE_e;
// the max number of byte in a vector register is VLENB
typedef ELE_TYPE_e [`VLENB-1:0] ELE_TYPE_t;
// ALU reservation station struct
typedef union packed {
logic [`VLEN-1:0] v0_data,
logic [`VLEN-1:0] vd_data
}VS3_u;
typedef struct packed {
logic [`ROB_DEPTH_WIDTH-1:0] rob_entry,
FUNCT6_u uop_funct6,
EXE_FUNCT3_e uop_funct3,
logic [`VSTART_WIDTH-1:0] vstart,
// vm field can be used to identify vmadc.v?m/vmadc.v? uop in the same uop_funct6(6'b010000).
// vm field can be used to identify vmsbc.v?m/vmsbc.v? uop in the same uop_funct6(6'b010011).
logic vm,
// rounding mode
logic [`VCSR_VXRM-1:0] vxrm,
// when the uop is vmadc.v?m/vmsbc.v?m, the uop will use v0_data as the third vector operand.
// when the uop is mask uop(vmandn,vmand,...), the uop will use vd_data as the third vector operand.
VS3_u vs3_data,
// when vs1_data_valid=0, vs1_data is used to decode some OPMVV uops
// when vs1_data_valid=1, vs1_data is valid as a vector operand
VS1_u vs1,
logic [`VLEN-1:0] vs1_data,
EEW_e vs1_eew,
logic vs1_data_valid,
ELE_TYPE_t vs1_type,
logic [`VLEN-1:0] vs2_data,
EEW_e vs2_eew,
logic vs2_data_valid,
ELE_TYPE_t vs2_type,
// rs1_data could be from X[rs1] and imm(insts[19:15]). If it is imm, the 5-bit imm(insts[19:15]) will be sign-extend to XLEN-bit.
logic [`XLEN-1:0] rs1_data,
logic rs1_data_valid
} ALU_RS_t;
// DIV reservation station struct
typedef struct packed {
logic [`ROB_DEPTH_WIDTH-1:0] rob_entry,
FUNCT6_u uop_funct6,
EXE_FUNCT3_e uop_funct3,
// when vs1_data_valid=1, vs1_data is valid as a vector operand
logic [`VLEN-1:0] vs1_data,
EEW_e vs1_eew,
logic vs1_data_valid,
ELE_TYPE_t vs1_type,
logic [`VLEN-1:0] vs2_data,
EEW_e vs2_eew,
logic vs2_data_valid,
ELE_TYPE_t vs2_type,
// rs1_data could be from X[rs1] and imm(insts[19:15]). If it is imm, the 5-bit imm(insts[19:15]) will be sign-extend to XLEN-bit.
logic [`XLEN-1:0] rs1_data,
logic rs1_data_valid
} DIV_RS_t;
// MUL and MAC reservation station struct
typedef struct packed {
logic [`ROB_DEPTH_WIDTH-1:0] rob_entry,
FUNCT6_u uop_funct6,
EXE_FUNCT3_e uop_funct3,
logic [`VCSR_VXRM-1:0] vxrm, // rounding mode
logic [`VLEN-1:0] vs1_data,
EEW_e vs1_eew,
logic vs1_data_valid,
ELE_TYPE_t vs1_type,
logic [`VLEN-1:0] vs2_data,
EEW_e vs2_eew,
logic vs2_data_valid,
ELE_TYPE_t vs2_type,
logic [`VLEN-1:0] vs3_data,
EEW_e vs3_eew,
logic vs3_data_valid,
ELE_TYPE_t vs3_type,
// rs1_data could be from X[rs1] and imm(insts[19:15]). If it is imm, the 5-bit imm(insts[19:15]) will be sign-extend to XLEN-bit.
logic [`XLEN-1:0] rs1_data,
logic rs1_data_valid
} MUL_RS_t;
// PMT and RDT reservation station struct
typedef struct packed {
logic [`ROB_DEPTH_WIDTH-1:0] rob_entry,
FUNCT6_u uop_funct6,
EXE_FUNCT3_e uop_funct3,
// Identify vmerge and vmv in the same uop_funct6(6'b010111).
logic vm,
// when vs1_data_valid=0, vs1 field is valid and used to decode some OPMVV uops
// when vs1_data_valid=1, vs1_data is valid as a vector operand
VS1_u vs1,
logic [`VLEN-1:0] vs1_data,
EEW_e vs1_eew,
logic vs1_data_valid,
ELE_TYPE_t vs1_type,
logic [`VLEN-1:0] vs2_data,
EEW_e vs2_eew,
logic vs2_data_valid,
ELE_TYPE_t vs2_type,
// rs1_data could be from X[rs1] and imm(insts[19:15]). If it is imm, the 5-bit imm(insts[19:15]) will be sign-extend to XLEN-bit.
logic [`XLEN-1:0] rs1_data,
logic rs1_data_valid,
logic last_uop_valid
} PMT_RDT_RS_t;
// LSU reservation station struct
typedef struct packed {
logic [`PC_WIDTH-1:0] uop_pc,
logic [`ROB_DEPTH_WIDTH-1:0] uop_id,
LSU_TYPE_t uop_funct6,
logic vidx_valid,
logic [`REGFILE_INDEX_WIDTH-1:0] vidx_addr,
logic [`VLEN-1:0] vidx_data, // vs2
ELE_TYPE_t vs2_type,
logic vregfile_read_valid,
logic [`REGFILE_INDEX_WIDTH-1:0] vregfile_read_addr,
logic [`VLEN-1:0] vregfile_read_data // vs3
ELE_TYPE_t vs3_type,
} LSU_RS_t;
//
// EX stage,
//
// send ALU's result to ROB
typedef struct packed {
logic [`ROB_DEPTH_WIDTH-1:0] rob_entry,
logic [`VLEN-1:0] w_data, // when w_type=XRF, w_data[`XLEN-1:0] will store the scalar result
W_DATA_TYPE_t w_type,
logic w_valid,
logic [`VCSR_VXSAT-1:0] vxsat,
logic ignore_vta_vma
} ALU2ROB_t;
// send uop to LSU
typedef struct packed {
// RVV send to uop_pc to help LSU match the vld/vst uop
logic [`PC_WIDTH-1:0] uop_pc,
// When LSU submit the result to RVV, LSU need to attend uop_id to help RVV retire the uop in ROB
logic [`ROB_DEPTH_WIDTH-1:0] uop_id,
// Vector regfile index interface for indexed vld/vst
logic vidx_valid,
logic [`REGFILE_INDEX_WIDTH-1:0] vidx_addr,
logic [`VLEN-1:0] vidx_data, // vs2
ELE_TYPE_t vs2_type, // mask for vs2
// Vector regfile read interface for vst
logic vregfile_read_valid,
logic [`REGFILE_INDEX_WIDTH-1:0] vregfile_read_addr,
logic [`VLEN-1:0] vregfile_read_data, // vs3
ELE_TYPE_t vs3_type // mask for vs3
} UOP_LSU_RVV2RVS_t;
// LSU feedback to RVV
typedef struct packed {
// When LSU submit the result to RVV, LSU need to attend uop_id to help RVV retire the uop in ROB
logic [`ROB_DEPTH_WIDTH-1:0] uop_id,
// LSU uop type
// When LSU complete the vstore uop, it need to tell RVV done signal and attend uop_id to help RVV retire the uops
// when load, it means the uop is vld. It enables vregfile_write_addr and vregfile_write_data, and submit the vector data to ROB
// when store, it means this store uop is done in LSU, ROB can retire this uop.
LSU_IS_STORE_e uop_type,
// Vector regfile write interface for vld
logic [`REGFILE_INDEX_WIDTH-1:0] vregfile_write_addr,
logic [`VLEN-1:0] vregfile_write_data, // vd
ELE_TYPE_t vs1_type // mask for vd
} UOP_LSU_RVS2RVV_t;
// ReOrder Buffer data struct
typedef enum logic [0] {
VRF,
XRF
} W_DATA_TYPE_t;
typedef struct packed {
logic valid, // Total valid
logic [`REGFILE_INDEX_WIDTH-1:0] w_index,
logic [`VLEN-1:0] w_data, // when w_type=XRF, w_data[`XLEN-1:0] will store the scalar result
W_DATA_TYPE_t w_type,
logic w_valid,
ELE_TYPE_t vd_type,
VECTOR_CSR_t vector_csr,
logic ignore_vta_vma
} ROB_t;
//
// WB stage, bypass and write back to VRF/XRF, trap handler
//
// write back to XRF
typedef struct packed {
logic [`REGFILE_INDEX_WIDTH-1:0] w_index,
logic [`XLEN-1:0] w_data
} WB_XRF_t;
// write back to VRF
typedef struct packed {
logic [`REGFILE_INDEX_WIDTH-1:0] w_index,
logic [`VLEN-1:0] w_data,
logic [`VLENB-1:0] w_strobe
} WB_VRF_t;
// trap handle
typedef enum logic [0] {
DECODE, // RVS find some illegal instructions when decoding,
// which means a trap occurs to the instruction that is NOT executing in RVV.
// So RVV will stop receiving new instructions from RVS, and complete all instructions in RVV.
LSU, // RVS find some illegal instructions when complete LSU transaction, like bus error,
// which means a trap occurs to the instruction that is executing in RVV.
// So RVV will top CQ to receive new instructions and flush Command Queue and Uops Queue,
// and complete the instructions in EX, ME and WB stage. And RVS need to send rob_entry of that exception instruction.
// After RVV retire all uops before that exception instruction, RVV response a ready signal for trap application.
LSU_FF // fault only first load, need to confirm whether has TLB or not.
} TRAP_INFO_e;
typedef struct packed {
logic trap_apply,
TRAP_INFO_e trap_info,
logic [`ROB_DEPTH_WIDTH-1:0] trap_uop_rob_entry
} TRAP_t;