Files
kernels/hw/rtl/VX_execute.v
2020-12-08 01:14:41 -05:00

233 lines
7.1 KiB
Verilog

`include "VX_define.vh"
module VX_execute #(
parameter CORE_ID = 0
) (
`SCOPE_IO_VX_execute
input wire clk,
input wire reset,
// CSR io interface
VX_csr_io_req_if csr_io_req_if,
VX_csr_io_rsp_if csr_io_rsp_if,
// Dcache interface
VX_cache_core_req_if dcache_req_if,
VX_cache_core_rsp_if dcache_rsp_if,
// perf
VX_cmt_to_csr_if cmt_to_csr_if,
// PERF: total reads
`ifdef PERF_ENABLE
VX_perf_cache_if perf_cache_if,
VX_perf_pipeline_stall_if perf_pipeline_stall_if,
`endif
// inputs
VX_alu_req_if alu_req_if,
VX_lsu_req_if lsu_req_if,
VX_csr_req_if csr_req_if,
VX_mul_req_if mul_req_if,
VX_fpu_req_if fpu_req_if,
VX_gpu_req_if gpu_req_if,
// outputs
VX_branch_ctl_if branch_ctl_if,
VX_warp_ctl_if warp_ctl_if,
VX_commit_if alu_commit_if,
VX_commit_if ld_commit_if,
VX_commit_if st_commit_if,
VX_commit_if csr_commit_if,
VX_commit_if mul_commit_if,
VX_commit_if fpu_commit_if,
VX_commit_if gpu_commit_if,
input wire busy,
output wire ebreak
);
VX_fpu_to_csr_if fpu_to_csr_if();
wire[`NUM_WARPS-1:0] csr_pending;
wire[`NUM_WARPS-1:0] fpu_pending;
VX_alu_unit #(
.CORE_ID(CORE_ID)
) alu_unit (
.clk (clk),
.reset (reset),
.alu_req_if (alu_req_if),
.branch_ctl_if (branch_ctl_if),
.alu_commit_if (alu_commit_if)
);
VX_lsu_unit #(
.CORE_ID(CORE_ID)
) lsu_unit (
`SCOPE_BIND_VX_execute_lsu_unit
.clk (clk),
.reset (reset),
.dcache_req_if (dcache_req_if),
.dcache_rsp_if (dcache_rsp_if),
.lsu_req_if (lsu_req_if),
.ld_commit_if (ld_commit_if),
.st_commit_if (st_commit_if)
);
VX_csr_unit #(
.CORE_ID(CORE_ID)
) csr_unit (
.clk (clk),
.reset (reset),
// PERF: total reads
`ifdef PERF_ENABLE
.perf_cache_if (perf_cache_if),
.perf_pipeline_stall_if (perf_pipeline_stall_if),
`endif
.cmt_to_csr_if (cmt_to_csr_if),
.fpu_to_csr_if (fpu_to_csr_if),
.csr_io_req_if (csr_io_req_if),
.csr_io_rsp_if (csr_io_rsp_if),
.csr_req_if (csr_req_if),
.csr_commit_if (csr_commit_if),
.fpu_pending (fpu_pending),
.pending (csr_pending),
.busy (busy)
);
`ifdef EXT_M_ENABLE
VX_mul_unit #(
.CORE_ID(CORE_ID)
) mul_unit (
.clk (clk),
.reset (reset),
.mul_req_if (mul_req_if),
.mul_commit_if (mul_commit_if)
);
`else
assign mul_req_if.ready = 0;
assign mul_commit_if.valid = 0;
assign mul_commit_if.wid = 0;
assign mul_commit_if.PC = 0;
assign mul_commit_if.tmask = 0;
assign mul_commit_if.wb = 0;
assign mul_commit_if.rd = 0;
assign mul_commit_if.data = 0;
`endif
`ifdef EXT_F_ENABLE
VX_fpu_unit #(
.CORE_ID(CORE_ID)
) fpu_unit (
.clk (clk),
.reset (reset),
.fpu_req_if (fpu_req_if),
.fpu_to_csr_if (fpu_to_csr_if),
.fpu_commit_if (fpu_commit_if),
.csr_pending (csr_pending),
.pending (fpu_pending)
);
`else
`UNUSED_VAR (csr_pending)
`UNUSED_VAR (fpu_to_csr_if.read_frm)
assign fpu_req_if.ready = 0;
assign fpu_commit_if.valid = 0;
assign fpu_commit_if.wid = 0;
assign fpu_commit_if.PC = 0;
assign fpu_commit_if.tmask = 0;
assign fpu_commit_if.wb = 0;
assign fpu_commit_if.rd = 0;
assign fpu_commit_if.data = 0;
assign fpu_to_csr_if.write_enable = 0;
assign fpu_to_csr_if.write_wid = 0;
assign fpu_to_csr_if.write_fflags = 0;
assign fpu_to_csr_if.read_wid = 0;
assign fpu_pending = 0;
`endif
VX_gpu_unit #(
.CORE_ID(CORE_ID)
) gpu_unit (
`SCOPE_BIND_VX_execute_gpu_unit
.clk (clk),
.reset (reset),
.gpu_req_if (gpu_req_if),
.warp_ctl_if (warp_ctl_if),
.gpu_commit_if (gpu_commit_if)
);
assign ebreak = alu_req_if.valid
&& alu_req_if.is_br_op
&& (`BR_OP(alu_req_if.op_type) == `BR_EBREAK
|| `BR_OP(alu_req_if.op_type) == `BR_ECALL);
`ifdef PERF_ENABLE
reg [63:0] perf_alu_stall;
reg [63:0] perf_lsu_stall;
reg [63:0] perf_csr_stall;
reg [63:0] perf_gpu_stall;
`ifdef EXT_M_ENABLE
reg [63:0] perf_mul_stall;
`endif
`ifdef EXT_F_ENABLE
reg [63:0] perf_fpu_stall;
`endif
always@(posedge clk) begin
if(reset) begin
perf_alu_stall <= 0;
perf_lsu_stall <= 0;
perf_csr_stall <= 0;
perf_gpu_stall <= 0;
`ifdef EXT_M_ENABLE
perf_mul_stall <= 0;
`endif
`ifdef EXT_F_ENABLE
perf_fpu_stall <= 0;
`endif
end else begin
// alu_stall
if (alu_req_if.valid & !alu_req_if.ready) begin
perf_alu_stall <= perf_alu_stall + 64'd1;
end
// lsu_stall
if (lsu_req_if.valid & !lsu_req_if.ready) begin
perf_lsu_stall <= perf_lsu_stall + 64'd1;
end
// csr_stall
if (csr_req_if.valid & !csr_req_if.ready) begin
perf_csr_stall <= perf_csr_stall + 64'd1;
end
// gpu_stall
if (gpu_req_if.valid & !gpu_req_if.ready) begin
perf_gpu_stall <= perf_gpu_stall + 64'd1;
end
// mul_stall
`ifdef EXT_M_ENABLE
if (mul_req_if.valid & !mul_req_if.ready) begin
perf_mul_stall <= perf_mul_stall + 64'd1;
end
`endif
// fpu_stall
`ifdef EXT_F_ENABLE
if (fpu_req_if.valid & !fpu_req_if.ready) begin
perf_fpu_stall <= perf_fpu_stall + 64'd1;
end
`endif
end
end
assign perf_pipeline_stall_if.alu_stall = perf_alu_stall;
assign perf_pipeline_stall_if.lsu_stall = perf_lsu_stall;
assign perf_pipeline_stall_if.csr_stall = perf_csr_stall;
assign perf_pipeline_stall_if.gpu_stall = perf_gpu_stall;
`ifdef EXT_M_ENABLE
assign perf_pipeline_stall_if.mul_stall = perf_mul_stall;
`endif
`ifdef EXT_F_ENABLE
assign perf_pipeline_stall_if.fpu_stall = perf_fpu_stall;
`endif
// gpr_stall, ibuffer_stall, scoreboard_stall, icache_stall come from other stages
`endif
endmodule