// Verilog source (listing metadata from the original page: 176 lines, 4.0 KiB)
`include "VX_define.v"
|
|
|
|
// VX_warp_scheduler
//
// Keeps per-warp state (active flag, stalled flag, thread mask, PC) and
// picks the warp to issue through a VX_priority_encoder.
//
// Inputs
//   clk                      : clock; all state is updated on the rising edge.
//   stall                    : forces thread_mask to 0 and blocks the PC /
//                              visibility update of the selected warp.
//   wspawn, wsapwn_pc        : activate the warp chosen among the inactive
//                              ones and load its PC with wsapwn_pc. (The port
//                              name spelling is kept for compatibility.)
//   ctm, ctm_mask,
//   ctm_warp_num             : overwrite the thread mask of ctm_warp_num.
//   whalt, whalt_warp_num    : deactivate whalt_warp_num.
//   wstall, wstall_warp_num  : mark wstall_warp_num as stalled and remove it
//                              from the visible set.
//   jal, jal_dest,
//   jal_warp_num             : load jal_dest into the PC of jal_warp_num and
//                              clear its stalled flag.
//   branch_valid, branch_dir,
//   branch_dest,
//   branch_warp_num          : clear the stalled flag of branch_warp_num; the
//                              PC is replaced by branch_dest only when
//                              branch_dir is set.
//
// Outputs
//   thread_mask : thread mask of the selected warp, or 0 while global_stall.
//   warp_num    : index of the selected warp.
//   warp_pc     : stored PC of the selected warp.
//   out_ebreak  : high when no warp is active.
module VX_warp_scheduler (
    input wire            clk,    // Clock
    input wire            stall,

    // Wspawn
    input wire            wspawn,
    input wire[31:0]      wsapwn_pc,

    // CTM
    input wire            ctm,
    input wire[`NT_M1:0]  ctm_mask,
    input wire[`NW_M1:0]  ctm_warp_num,

    // WHALT
    input wire            whalt,
    input wire[`NW_M1:0]  whalt_warp_num,

    // WSTALL
    input wire            wstall,
    input wire[`NW_M1:0]  wstall_warp_num,

    // JAL
    input wire            jal,
    input wire[31:0]      jal_dest,
    input wire[`NW_M1:0]  jal_warp_num,

    // Branch
    input wire            branch_valid,
    input wire            branch_dir,
    input wire[31:0]      branch_dest,
    input wire[`NW_M1:0]  branch_warp_num,

    output wire[`NT_M1:0] thread_mask,
    output wire[`NW_M1:0] warp_num,
    output wire[31:0]     warp_pc,
    output wire           out_ebreak
);

    // ------------------------------------------------------------------
    // State
    // ------------------------------------------------------------------
    reg[`NW-1:0]  warp_active;              // one bit per warp: warp is active
    reg[`NW-1:0]  warp_stalled;             // one bit per warp: waiting on jal/branch
    reg[`NW-1:0]  visible_active;           // warps still eligible in the current pass
    reg[`NT_M1:0] thread_masks[`NW-1:0];    // per-warp thread mask
    reg[31:0]     warp_pcs[`NW-1:0];        // per-warp PC
    reg[1:0]      start;

    // ------------------------------------------------------------------
    // Nets (declared ahead of their first use)
    // ------------------------------------------------------------------
    wire[`NW-1:0]  use_active;

    // Warp chosen for scheduling and whether any candidate exists.
    wire[`NW_M1:0] warp_to_schedule;
    wire           schedule;

    // Inactive warp chosen as the wspawn target and whether one exists.
    wire[`NW_M1:0] warp_to_wspawn;
    wire           found_wspawn;

    // Number of set bits in visible_active.
    /* verilator lint_off UNUSED */
    wire[`NW_M1:0] num_active;
    /* verilator lint_on UNUSED */

    // A jal / taken branch that targets the warp being scheduled this cycle.
    wire should_jal = (jal && (warp_to_schedule == jal_warp_num));
    // NOTE(review): not qualified by branch_valid; presumably branch_dir is
    // only high for a valid branch - confirm against the driver.
    wire should_bra = (branch_dir && (warp_to_schedule == branch_warp_num));

    wire hazard        = (should_jal || should_bra) && schedule;
    wire real_schedule = schedule && !warp_stalled[warp_to_schedule];
    wire global_stall  = (stall || wstall || hazard || !real_schedule);

    wire[31:0] new_pc = warp_pc + 4;

    // With at most one visible warp left, schedule from every active,
    // non-stalled warp instead of the visible set.
    assign use_active = (num_active <= 1) ? (warp_active & (~warp_stalled)) : visible_active;

    // ------------------------------------------------------------------
    // Outputs
    // ------------------------------------------------------------------
    assign warp_pc     = warp_pcs[warp_to_schedule];
    assign thread_mask = (global_stall) ? 0 : thread_masks[warp_to_schedule];
    assign warp_num    = warp_to_schedule;
    assign out_ebreak  = (warp_active == 0);

    // ------------------------------------------------------------------
    // Power-up state: only warp 0 / thread 0 is active.
    // The full vectors are cleared first so that no bit starts as X in a
    // 4-state simulator (warp_active & ~warp_stalled is evaluated on the
    // very first clock edge).
    // ------------------------------------------------------------------
    initial begin
        warp_pcs[0]        = (32'h80000000 - 4);
        start              = 0;
        warp_stalled       = 0;
        warp_active        = 0;
        warp_active[0]     = 1; // Activating first warp
        visible_active     = 0;
        visible_active[0]  = 1; // Activating first warp
        thread_masks[0]    = 0;
        thread_masks[0][0] = 1; // Activating first thread in first warp
    end

    // ------------------------------------------------------------------
    // State update.
    // Statement order matters: several branches assign the same bits of
    // visible_active / warp_pcs / warp_stalled with nonblocking
    // assignments, and the last one executed in a cycle wins.
    // ------------------------------------------------------------------
    always @(posedge clk) begin
        // Spawning warps
        if (wspawn && found_wspawn) begin
            warp_pcs[warp_to_wspawn]       <= wsapwn_pc;
            warp_active[warp_to_wspawn]    <= 1;
            visible_active[warp_to_wspawn] <= 1;
        end

        // Halting warps
        if (whalt) begin
            warp_active[whalt_warp_num]    <= 0;
            visible_active[whalt_warp_num] <= 0;
        end

        // Changing thread masks
        if (ctm) begin
            thread_masks[ctm_warp_num] <= ctm_mask;
        end

        // Stalling the scheduling of warps
        if (wstall) begin
            warp_stalled[wstall_warp_num]   <= 1;
            visible_active[wstall_warp_num] <= 0;
        end

        // Refilling active warps
        if ((visible_active == 0) && !(stall || wstall || hazard)) begin
            visible_active <= warp_active & (~warp_stalled);
        end

        // First cycle
        // NOTE(review): start is 2 bits wide, initialised to 0 and only ever
        // assigned 1, so `start <= 2` holds on every clock edge, not just
        // the first. This whole-vector refill therefore runs each cycle and
        // overrides the visible_active assignments made above. Behaviour is
        // left unchanged here - confirm the intent before tightening it.
        if (start <= 2) begin
            start          <= 1;
            visible_active <= warp_active & (~warp_stalled);
        end

        // Don't change state if stall
        if (!global_stall && real_schedule && (thread_mask != 0)) begin
            visible_active[warp_to_schedule] <= 0;
            warp_pcs[warp_to_schedule]       <= new_pc;
        end

        // Jal
        if (jal) begin
            warp_pcs[jal_warp_num]     <= jal_dest;
            warp_stalled[jal_warp_num] <= 0;
        end

        // Branch
        if (branch_valid) begin
            if (branch_dir) warp_pcs[branch_warp_num] <= branch_dest;
            warp_stalled[branch_warp_num] <= 0;
        end
    end

    // ------------------------------------------------------------------
    // Submodules
    // ------------------------------------------------------------------

    // Choosing a warp to schedule
    VX_priority_encoder choose_schedule(
        .valids(use_active),
        .index (warp_to_schedule),
        .found (schedule)
    );

    // Choosing a warp to wspawn (picked among the currently inactive warps)
    VX_priority_encoder choose_wsapwn(
        .valids(~warp_active),
        .index (warp_to_wspawn),
        .found (found_wspawn)
    );

    // Valid counter
    VX_one_counter valid_counter(
        .valids(visible_active),
        .ones_found(num_active)
    );

endmodule